diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.2868, "train/learning_rate": 1.1267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 134750, "_timestamp": 1648276094, "_step": 22314, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 7.0, 6.0, 24.0, 16.0, 17.0, 28.0, 27.0, 41.0, 41.0, 57.0, 59.0, 69.0, 82.0, 96.0, 86.0, 78.0, 58.0, 45.0, 38.0, 26.0, 29.0, 15.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-151.30198669433594, -147.59866333007812, -143.8953399658203, -140.1920166015625, -136.4886932373047, -132.78536987304688, -129.08204650878906, -125.37871551513672, -121.6753921508789, -117.9720687866211, -114.26874542236328, -110.56542205810547, -106.86209106445312, -103.15876770019531, -99.4554443359375, -95.75212097167969, -92.04879760742188, -88.34547424316406, -84.64215087890625, -80.93882751464844, -77.23550415039062, -73.53218078613281, -69.82884979248047, -66.12552642822266, -62.422203063964844, -58.71887969970703, -55.01555633544922, -51.31222915649414, -47.60890579223633, -43.905582427978516, -40.20225524902344, -36.498931884765625, -32.795616149902344, -29.09229278564453, -25.388967514038086, -21.68564224243164, -17.982318878173828, -14.278995513916016, -10.57567024230957, -6.872344970703125, -3.1690216064453125, 0.5343027114868164, 4.237627029418945, 7.940951347351074, 11.644275665283203, 15.347599029541016, 19.05092430114746, 22.754249572753906, 26.45757293701172, 30.16089630126953, 33.864219665527344, 37.56754684448242, 41.270870208740234, 44.97419357299805, 48.677520751953125, 52.38084411621094, 56.08416748046875, 59.78749084472656, 63.490814208984375, 67.19413757324219, 70.8974609375, 74.60078430175781, 78.30411529541016, 82.00743865966797, 85.71076202392578]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 9.0, 9.0, 17.0, 11.0, 20.0, 22.0, 17.0, 22.0, 27.0, 28.0, 41.0, 43.0, 41.0, 38.0, 29.0, 37.0, 41.0, 42.0, 39.0, 49.0, 32.0, 36.0, 39.0, 43.0, 36.0, 28.0, 21.0, 19.0, 23.0, 23.0, 17.0, 19.0, 14.0, 11.0, 9.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.2059097290039, -65.8742904663086, -63.54267501831055, -61.2110595703125, -58.87944030761719, -56.54782485961914, -54.216209411621094, -51.88459014892578, -49.552974700927734, -47.22135925292969, -44.889739990234375, -42.55812454223633, -40.22650909423828, -37.89488983154297, -35.56327438354492, -33.231658935546875, -30.900039672851562, -28.568422317504883, -26.236804962158203, -23.905189514160156, -21.573572158813477, -19.241954803466797, -16.91033935546875, -14.57872200012207, -12.24710464477539, -9.915487289428711, -7.583870887756348, -5.252254009246826, -2.9206371307373047, -0.589019775390625, 1.7425966262817383, 4.074213027954102, 6.4058380126953125, 8.737455368041992, 11.069071769714355, 13.400688171386719, 15.732305526733398, 18.063922882080078, 20.395538330078125, 22.727155685424805, 25.058773040771484, 27.390390396118164, 29.722007751464844, 32.05362319946289, 34.38523864746094, 36.71685791015625, 39.0484733581543, 41.380088806152344, 43.711708068847656, 46.0433235168457, 48.374942779541016, 50.70655822753906, 53.038177490234375, 55.36979293823242, 57.70140838623047, 60.03302764892578, 62.36464309692383, 64.69625854492188, 67.02787780761719, 69.3594970703125, 71.69110870361328, 74.0227279663086, 76.3543472290039, 78.68595886230469, 81.017578125]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 12.0, 18.0, 28.0, 29.0, 53.0, 108.0, 107.0, 163.0, 256.0, 330.0, 564.0, 776.0, 1236.0, 1872.0, 3065.0, 4669.0, 7626.0, 12886.0, 22633.0, 41141.0, 80592.0, 188661.0, 947081.0, 2287244.0, 348355.0, 115935.0, 55682.0, 29584.0, 16883.0, 9812.0, 5959.0, 3823.0, 2390.0, 1520.0, 1027.0, 673.0, 441.0, 317.0, 229.0, 154.0, 100.0, 75.0, 41.0, 39.0, 20.0, 21.0, 11.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-244.5, -236.67578125, -228.8515625, -221.02734375, -213.203125, -205.37890625, -197.5546875, -189.73046875, -181.90625, -174.08203125, -166.2578125, -158.43359375, -150.609375, -142.78515625, -134.9609375, -127.13671875, -119.3125, -111.48828125, -103.6640625, -95.83984375, -88.015625, -80.19140625, -72.3671875, -64.54296875, -56.71875, -48.89453125, -41.0703125, -33.24609375, -25.421875, -17.59765625, -9.7734375, -1.94921875, 5.875, 13.69921875, 21.5234375, 29.34765625, 37.171875, 44.99609375, 52.8203125, 60.64453125, 68.46875, 76.29296875, 84.1171875, 91.94140625, 99.765625, 107.58984375, 115.4140625, 123.23828125, 131.0625, 138.88671875, 146.7109375, 154.53515625, 162.359375, 170.18359375, 178.0078125, 185.83203125, 193.65625, 201.48046875, 209.3046875, 217.12890625, 224.953125, 232.77734375, 240.6015625, 248.42578125, 256.25]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 5.0, 15.0, 13.0, 16.0, 16.0, 22.0, 22.0, 35.0, 32.0, 24.0, 40.0, 39.0, 38.0, 48.0, 53.0, 53.0, 38.0, 57.0, 37.0, 41.0, 35.0, 37.0, 40.0, 33.0, 40.0, 27.0, 18.0, 25.0, 19.0, 18.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.5, -73.923828125, -71.34765625, -68.771484375, -66.1953125, -63.619140625, -61.04296875, -58.466796875, -55.890625, -53.314453125, -50.73828125, -48.162109375, -45.5859375, -43.009765625, -40.43359375, -37.857421875, -35.28125, -32.705078125, -30.12890625, -27.552734375, -24.9765625, -22.400390625, -19.82421875, -17.248046875, -14.671875, -12.095703125, -9.51953125, -6.943359375, -4.3671875, -1.791015625, 0.78515625, 3.361328125, 5.9375, 8.513671875, 11.08984375, 13.666015625, 16.2421875, 18.818359375, 21.39453125, 23.970703125, 26.546875, 29.123046875, 31.69921875, 34.275390625, 36.8515625, 39.427734375, 42.00390625, 44.580078125, 47.15625, 49.732421875, 52.30859375, 54.884765625, 57.4609375, 60.037109375, 62.61328125, 65.189453125, 67.765625, 70.341796875, 72.91796875, 75.494140625, 78.0703125, 80.646484375, 83.22265625, 85.798828125, 88.375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 20.0, 13.0, 26.0, 36.0, 60.0, 61.0, 107.0, 158.0, 234.0, 376.0, 559.0, 822.0, 1219.0, 1891.0, 2835.0, 4483.0, 6999.0, 11484.0, 18649.0, 30897.0, 51990.0, 92909.0, 172017.0, 372599.0, 1327744.0, 1326657.0, 371097.0, 172183.0, 92267.0, 52629.0, 30890.0, 18748.0, 11327.0, 7083.0, 4602.0, 2971.0, 1872.0, 1273.0, 849.0, 554.0, 355.0, 248.0, 153.0, 111.0, 74.0, 40.0, 28.0, 33.0, 17.0, 10.0, 14.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-139.5, -135.0, -130.5, -126.0, -121.5, -117.0, -112.5, -108.0, -103.5, -99.0, -94.5, -90.0, -85.5, -81.0, -76.5, -72.0, -67.5, -63.0, -58.5, -54.0, -49.5, -45.0, -40.5, -36.0, -31.5, -27.0, -22.5, -18.0, -13.5, -9.0, -4.5, 0.0, 4.5, 9.0, 13.5, 18.0, 22.5, 27.0, 31.5, 36.0, 40.5, 45.0, 49.5, 54.0, 58.5, 63.0, 67.5, 72.0, 76.5, 81.0, 85.5, 90.0, 94.5, 99.0, 103.5, 108.0, 112.5, 117.0, 121.5, 126.0, 130.5, 135.0, 139.5, 144.0, 148.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 10.0, 14.0, 13.0, 21.0, 25.0, 29.0, 37.0, 45.0, 39.0, 60.0, 77.0, 63.0, 91.0, 122.0, 121.0, 154.0, 196.0, 273.0, 395.0, 473.0, 384.0, 271.0, 196.0, 160.0, 122.0, 113.0, 95.0, 72.0, 69.0, 50.0, 55.0, 37.0, 27.0, 33.0, 22.0, 22.0, 19.0, 15.0, 6.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.5, -37.1904296875, -35.880859375, -34.5712890625, -33.26171875, -31.9521484375, -30.642578125, -29.3330078125, -28.0234375, -26.7138671875, -25.404296875, -24.0947265625, -22.78515625, -21.4755859375, -20.166015625, -18.8564453125, -17.546875, -16.2373046875, -14.927734375, -13.6181640625, -12.30859375, -10.9990234375, -9.689453125, -8.3798828125, -7.0703125, -5.7607421875, -4.451171875, -3.1416015625, -1.83203125, -0.5224609375, 0.787109375, 2.0966796875, 3.40625, 4.7158203125, 6.025390625, 7.3349609375, 8.64453125, 9.9541015625, 11.263671875, 12.5732421875, 13.8828125, 15.1923828125, 16.501953125, 17.8115234375, 19.12109375, 20.4306640625, 21.740234375, 23.0498046875, 24.359375, 25.6689453125, 26.978515625, 28.2880859375, 29.59765625, 30.9072265625, 32.216796875, 33.5263671875, 34.8359375, 36.1455078125, 37.455078125, 38.7646484375, 40.07421875, 41.3837890625, 42.693359375, 44.0029296875, 45.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 9.0, 10.0, 12.0, 17.0, 13.0, 20.0, 25.0, 30.0, 36.0, 38.0, 49.0, 56.0, 69.0, 71.0, 65.0, 79.0, 60.0, 48.0, 52.0, 39.0, 31.0, 24.0, 20.0, 18.0, 16.0, 11.0, 11.0, 12.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.65741729736328, -107.41815948486328, -104.17890930175781, -100.93965148925781, -97.70040130615234, -94.46114349365234, -91.22189331054688, -87.98263549804688, -84.7433853149414, -81.5041275024414, -78.26487731933594, -75.02561950683594, -71.78636932373047, -68.54711151123047, -65.307861328125, -62.068603515625, -58.829349517822266, -55.59009552001953, -52.3508415222168, -49.11158752441406, -45.87233352661133, -42.633079528808594, -39.393821716308594, -36.154571533203125, -32.915313720703125, -29.67605972290039, -26.436805725097656, -23.197551727294922, -19.958297729492188, -16.71904182434082, -13.479787826538086, -10.240533828735352, -7.00128173828125, -3.7620275020599365, -0.522773265838623, 2.7164812088012695, 5.955735206604004, 9.194990158081055, 12.434244155883789, 15.673498153686523, 18.912752151489258, 22.152006149291992, 25.391260147094727, 28.630516052246094, 31.869770050048828, 35.10902404785156, 38.3482780456543, 41.58753204345703, 44.826786041259766, 48.0660400390625, 51.305294036865234, 54.54454803466797, 57.7838020324707, 61.02305603027344, 64.26231384277344, 67.5015640258789, 70.7408218383789, 73.9800796508789, 77.21932983398438, 80.45858764648438, 83.69783782958984, 86.93709564208984, 90.17634582519531, 93.41560363769531, 96.65485382080078]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 6.0, 13.0, 15.0, 16.0, 26.0, 25.0, 34.0, 25.0, 30.0, 30.0, 37.0, 28.0, 49.0, 48.0, 43.0, 34.0, 41.0, 42.0, 50.0, 34.0, 32.0, 41.0, 42.0, 37.0, 29.0, 22.0, 22.0, 21.0, 22.0, 16.0, 17.0, 9.0, 16.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-101.45652770996094, -98.67851257324219, -95.9004898071289, -93.12247467041016, -90.34445190429688, -87.56643676757812, -84.78842163085938, -82.0103988647461, -79.23237609863281, -76.45436096191406, -73.67633819580078, -70.89832305908203, -68.12030029296875, -65.34228515625, -62.564266204833984, -59.78624725341797, -57.00823211669922, -54.2302131652832, -51.45219421386719, -48.67417907714844, -45.896156311035156, -43.118141174316406, -40.34012222290039, -37.562103271484375, -34.78408432006836, -32.006065368652344, -29.228046417236328, -26.450029373168945, -23.67201042175293, -20.893991470336914, -18.11597442626953, -15.337955474853516, -12.559944152832031, -9.781925201416016, -7.003907203674316, -4.225889205932617, -1.4478702545166016, 1.330148696899414, 4.108165740966797, 6.8861846923828125, 9.664203643798828, 12.442222595214844, 15.220240592956543, 17.998258590698242, 20.776277542114258, 23.554296493530273, 26.332313537597656, 29.110332489013672, 31.888351440429688, 34.6663703918457, 37.44438934326172, 40.22240447998047, 43.00042724609375, 45.7784423828125, 48.556461334228516, 51.33448028564453, 54.11249923706055, 56.89051818847656, 59.66853713989258, 62.446556091308594, 65.22457122802734, 68.00259399414062, 70.78060913085938, 73.55862426757812, 76.3366470336914]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 26.0, 24.0, 39.0, 48.0, 84.0, 112.0, 173.0, 247.0, 394.0, 600.0, 972.0, 1362.0, 2078.0, 3369.0, 5550.0, 9380.0, 15744.0, 27919.0, 51158.0, 97672.0, 192739.0, 285786.0, 164591.0, 83739.0, 44649.0, 24379.0, 13724.0, 8155.0, 5048.0, 3137.0, 2009.0, 1239.0, 806.0, 506.0, 340.0, 213.0, 175.0, 123.0, 72.0, 50.0, 37.0, 24.0, 14.0, 15.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.375, -132.1640625, -127.953125, -123.7421875, -119.53125, -115.3203125, -111.109375, -106.8984375, -102.6875, -98.4765625, -94.265625, -90.0546875, -85.84375, -81.6328125, -77.421875, -73.2109375, -69.0, -64.7890625, -60.578125, -56.3671875, -52.15625, -47.9453125, -43.734375, -39.5234375, -35.3125, -31.1015625, -26.890625, -22.6796875, -18.46875, -14.2578125, -10.046875, -5.8359375, -1.625, 2.5859375, 6.796875, 11.0078125, 15.21875, 19.4296875, 23.640625, 27.8515625, 32.0625, 36.2734375, 40.484375, 44.6953125, 48.90625, 53.1171875, 57.328125, 61.5390625, 65.75, 69.9609375, 74.171875, 78.3828125, 82.59375, 86.8046875, 91.015625, 95.2265625, 99.4375, 103.6484375, 107.859375, 112.0703125, 116.28125, 120.4921875, 124.703125, 128.9140625, 133.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 8.0, 8.0, 18.0, 17.0, 18.0, 25.0, 28.0, 28.0, 36.0, 27.0, 40.0, 37.0, 43.0, 51.0, 56.0, 49.0, 43.0, 38.0, 38.0, 37.0, 35.0, 36.0, 46.0, 27.0, 27.0, 29.0, 15.0, 22.0, 27.0, 11.0, 17.0, 9.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-101.3125, -98.515625, -95.71875, -92.921875, -90.125, -87.328125, -84.53125, -81.734375, -78.9375, -76.140625, -73.34375, -70.546875, -67.75, -64.953125, -62.15625, -59.359375, -56.5625, -53.765625, -50.96875, -48.171875, -45.375, -42.578125, -39.78125, -36.984375, -34.1875, -31.390625, -28.59375, -25.796875, -23.0, -20.203125, -17.40625, -14.609375, -11.8125, -9.015625, -6.21875, -3.421875, -0.625, 2.171875, 4.96875, 7.765625, 10.5625, 13.359375, 16.15625, 18.953125, 21.75, 24.546875, 27.34375, 30.140625, 32.9375, 35.734375, 38.53125, 41.328125, 44.125, 46.921875, 49.71875, 52.515625, 55.3125, 58.109375, 60.90625, 63.703125, 66.5, 69.296875, 72.09375, 74.890625, 77.6875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 7.0, 13.0, 19.0, 24.0, 34.0, 45.0, 66.0, 85.0, 112.0, 158.0, 243.0, 334.0, 523.0, 690.0, 988.0, 1460.0, 2228.0, 3397.0, 5229.0, 8498.0, 14213.0, 24711.0, 45831.0, 94309.0, 216723.0, 322761.0, 151198.0, 68890.0, 35120.0, 19395.0, 11253.0, 6939.0, 4341.0, 2797.0, 1896.0, 1244.0, 798.0, 608.0, 414.0, 270.0, 184.0, 124.0, 102.0, 74.0, 62.0, 41.0, 31.0, 19.0, 10.0, 9.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 4.0], "bins": [-166.0, -160.859375, -155.71875, -150.578125, -145.4375, -140.296875, -135.15625, -130.015625, -124.875, -119.734375, -114.59375, -109.453125, -104.3125, -99.171875, -94.03125, -88.890625, -83.75, -78.609375, -73.46875, -68.328125, -63.1875, -58.046875, -52.90625, -47.765625, -42.625, -37.484375, -32.34375, -27.203125, -22.0625, -16.921875, -11.78125, -6.640625, -1.5, 3.640625, 8.78125, 13.921875, 19.0625, 24.203125, 29.34375, 34.484375, 39.625, 44.765625, 49.90625, 55.046875, 60.1875, 65.328125, 70.46875, 75.609375, 80.75, 85.890625, 91.03125, 96.171875, 101.3125, 106.453125, 111.59375, 116.734375, 121.875, 127.015625, 132.15625, 137.296875, 142.4375, 147.578125, 152.71875, 157.859375, 163.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 10.0, 19.0, 18.0, 21.0, 16.0, 20.0, 21.0, 24.0, 28.0, 34.0, 32.0, 41.0, 50.0, 37.0, 50.0, 44.0, 42.0, 44.0, 38.0, 52.0, 42.0, 51.0, 31.0, 39.0, 32.0, 18.0, 23.0, 11.0, 24.0, 16.0, 6.0, 12.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.21875, -57.23388671875, -55.2490234375, -53.26416015625, -51.279296875, -49.29443359375, -47.3095703125, -45.32470703125, -43.33984375, -41.35498046875, -39.3701171875, -37.38525390625, -35.400390625, -33.41552734375, -31.4306640625, -29.44580078125, -27.4609375, -25.47607421875, -23.4912109375, -21.50634765625, -19.521484375, -17.53662109375, -15.5517578125, -13.56689453125, -11.58203125, -9.59716796875, -7.6123046875, -5.62744140625, -3.642578125, -1.65771484375, 0.3271484375, 2.31201171875, 4.296875, 6.28173828125, 8.2666015625, 10.25146484375, 12.236328125, 14.22119140625, 16.2060546875, 18.19091796875, 20.17578125, 22.16064453125, 24.1455078125, 26.13037109375, 28.115234375, 30.10009765625, 32.0849609375, 34.06982421875, 36.0546875, 38.03955078125, 40.0244140625, 42.00927734375, 43.994140625, 45.97900390625, 47.9638671875, 49.94873046875, 51.93359375, 53.91845703125, 55.9033203125, 57.88818359375, 59.873046875, 61.85791015625, 63.8427734375, 65.82763671875, 67.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 6.0, 16.0, 10.0, 16.0, 17.0, 25.0, 34.0, 50.0, 68.0, 106.0, 120.0, 207.0, 333.0, 490.0, 827.0, 1416.0, 2519.0, 5305.0, 14173.0, 68530.0, 698566.0, 211555.0, 27635.0, 8116.0, 3588.0, 1828.0, 1113.0, 652.0, 415.0, 286.0, 164.0, 112.0, 81.0, 50.0, 35.0, 36.0, 16.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-159.875, -155.13671875, -150.3984375, -145.66015625, -140.921875, -136.18359375, -131.4453125, -126.70703125, -121.96875, -117.23046875, -112.4921875, -107.75390625, -103.015625, -98.27734375, -93.5390625, -88.80078125, -84.0625, -79.32421875, -74.5859375, -69.84765625, -65.109375, -60.37109375, -55.6328125, -50.89453125, -46.15625, -41.41796875, -36.6796875, -31.94140625, -27.203125, -22.46484375, -17.7265625, -12.98828125, -8.25, -3.51171875, 1.2265625, 5.96484375, 10.703125, 15.44140625, 20.1796875, 24.91796875, 29.65625, 34.39453125, 39.1328125, 43.87109375, 48.609375, 53.34765625, 58.0859375, 62.82421875, 67.5625, 72.30078125, 77.0390625, 81.77734375, 86.515625, 91.25390625, 95.9921875, 100.73046875, 105.46875, 110.20703125, 114.9453125, 119.68359375, 124.421875, 129.16015625, 133.8984375, 138.63671875, 143.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 15.0, 17.0, 22.0, 48.0, 69.0, 143.0, 243.0, 187.0, 101.0, 54.0, 45.0, 15.0, 18.0, 6.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007694244384765625, -0.007286727428436279, -0.006879210472106934, -0.006471693515777588, -0.006064176559448242, -0.0056566596031188965, -0.005249142646789551, -0.004841625690460205, -0.004434108734130859, -0.004026591777801514, -0.003619074821472168, -0.0032115578651428223, -0.0028040409088134766, -0.002396523952484131, -0.001989006996154785, -0.0015814900398254395, -0.0011739730834960938, -0.000766456127166748, -0.00035893917083740234, 4.857778549194336e-05, 0.00045609474182128906, 0.0008636116981506348, 0.0012711286544799805, 0.0016786456108093262, 0.002086162567138672, 0.0024936795234680176, 0.0029011964797973633, 0.003308713436126709, 0.0037162303924560547, 0.0041237473487854, 0.004531264305114746, 0.004938781261444092, 0.0053462982177734375, 0.005753815174102783, 0.006161332130432129, 0.006568849086761475, 0.00697636604309082, 0.007383882999420166, 0.007791399955749512, 0.008198916912078857, 0.008606433868408203, 0.009013950824737549, 0.009421467781066895, 0.00982898473739624, 0.010236501693725586, 0.010644018650054932, 0.011051535606384277, 0.011459052562713623, 0.011866569519042969, 0.012274086475372314, 0.01268160343170166, 0.013089120388031006, 0.013496637344360352, 0.013904154300689697, 0.014311671257019043, 0.014719188213348389, 0.015126705169677734, 0.01553422212600708, 0.015941739082336426, 0.01634925603866577, 0.016756772994995117, 0.017164289951324463, 0.01757180690765381, 0.017979323863983154, 0.0183868408203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 10.0, 16.0, 20.0, 31.0, 37.0, 58.0, 74.0, 94.0, 134.0, 155.0, 234.0, 334.0, 498.0, 635.0, 947.0, 1422.0, 2075.0, 3224.0, 5257.0, 9635.0, 17862.0, 37229.0, 86105.0, 228337.0, 372032.0, 157571.0, 61598.0, 27801.0, 14210.0, 7636.0, 4549.0, 2787.0, 1787.0, 1180.0, 863.0, 599.0, 406.0, 295.0, 219.0, 142.0, 127.0, 84.0, 67.0, 48.0, 41.0, 31.0, 10.0, 13.0, 5.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-60.75, -58.8701171875, -56.990234375, -55.1103515625, -53.23046875, -51.3505859375, -49.470703125, -47.5908203125, -45.7109375, -43.8310546875, -41.951171875, -40.0712890625, -38.19140625, -36.3115234375, -34.431640625, -32.5517578125, -30.671875, -28.7919921875, -26.912109375, -25.0322265625, -23.15234375, -21.2724609375, -19.392578125, -17.5126953125, -15.6328125, -13.7529296875, -11.873046875, -9.9931640625, -8.11328125, -6.2333984375, -4.353515625, -2.4736328125, -0.59375, 1.2861328125, 3.166015625, 5.0458984375, 6.92578125, 8.8056640625, 10.685546875, 12.5654296875, 14.4453125, 16.3251953125, 18.205078125, 20.0849609375, 21.96484375, 23.8447265625, 25.724609375, 27.6044921875, 29.484375, 31.3642578125, 33.244140625, 35.1240234375, 37.00390625, 38.8837890625, 40.763671875, 42.6435546875, 44.5234375, 46.4033203125, 48.283203125, 50.1630859375, 52.04296875, 53.9228515625, 55.802734375, 57.6826171875, 59.5625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 13.0, 13.0, 15.0, 23.0, 27.0, 25.0, 44.0, 70.0, 45.0, 71.0, 79.0, 96.0, 93.0, 78.0, 59.0, 47.0, 30.0, 30.0, 28.0, 22.0, 17.0, 15.0, 9.0, 4.0, 12.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.265625, -19.658203125, -19.05078125, -18.443359375, -17.8359375, -17.228515625, -16.62109375, -16.013671875, -15.40625, -14.798828125, -14.19140625, -13.583984375, -12.9765625, -12.369140625, -11.76171875, -11.154296875, -10.546875, -9.939453125, -9.33203125, -8.724609375, -8.1171875, -7.509765625, -6.90234375, -6.294921875, -5.6875, -5.080078125, -4.47265625, -3.865234375, -3.2578125, -2.650390625, -2.04296875, -1.435546875, -0.828125, -0.220703125, 0.38671875, 0.994140625, 1.6015625, 2.208984375, 2.81640625, 3.423828125, 4.03125, 4.638671875, 5.24609375, 5.853515625, 6.4609375, 7.068359375, 7.67578125, 8.283203125, 8.890625, 9.498046875, 10.10546875, 10.712890625, 11.3203125, 11.927734375, 12.53515625, 13.142578125, 13.75, 14.357421875, 14.96484375, 15.572265625, 16.1796875, 16.787109375, 17.39453125, 18.001953125, 18.609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 4.0, 14.0, 8.0, 17.0, 24.0, 13.0, 27.0, 36.0, 35.0, 48.0, 62.0, 71.0, 63.0, 84.0, 88.0, 73.0, 60.0, 51.0, 34.0, 33.0, 36.0, 29.0, 16.0, 17.0, 13.0, 10.0, 8.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-125.12419128417969, -121.61530303955078, -118.10641479492188, -114.5975341796875, -111.0886459350586, -107.57975769042969, -104.07087707519531, -100.5619888305664, -97.0531005859375, -93.5442123413086, -90.03532409667969, -86.52644348144531, -83.0175552368164, -79.5086669921875, -75.99978637695312, -72.49089813232422, -68.98200988769531, -65.4731216430664, -61.964237213134766, -58.455352783203125, -54.94646453857422, -51.43757629394531, -47.92869186401367, -44.41980743408203, -40.910919189453125, -37.40203094482422, -33.89314651489258, -30.384260177612305, -26.87537384033203, -23.366487503051758, -19.857601165771484, -16.34871482849121, -12.839820861816406, -9.330934524536133, -5.822048187255859, -2.313161849975586, 1.1957244873046875, 4.704610824584961, 8.213497161865234, 11.722383499145508, 15.231269836425781, 18.740156173706055, 22.249042510986328, 25.7579288482666, 29.266815185546875, 32.77570343017578, 36.28458786010742, 39.79347229003906, 43.30236053466797, 46.811248779296875, 50.320133209228516, 53.829017639160156, 57.33790588378906, 60.84679412841797, 64.35568237304688, 67.86456298828125, 71.37345123291016, 74.88233947753906, 78.39122009277344, 81.90010833740234, 85.40899658203125, 88.91788482666016, 92.42677307128906, 95.93565368652344, 99.44454193115234]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 7.0, 8.0, 15.0, 12.0, 26.0, 22.0, 27.0, 34.0, 29.0, 34.0, 38.0, 34.0, 38.0, 43.0, 47.0, 46.0, 32.0, 33.0, 39.0, 44.0, 35.0, 42.0, 38.0, 38.0, 37.0, 26.0, 20.0, 15.0, 22.0, 19.0, 18.0, 9.0, 12.0, 18.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-89.54629516601562, -87.0429458618164, -84.53958892822266, -82.03623962402344, -79.53289031982422, -77.029541015625, -74.52618408203125, -72.02283477783203, -69.51948547363281, -67.0161361694336, -64.51277923583984, -62.009429931640625, -59.506080627441406, -57.00272750854492, -54.49937438964844, -51.99602508544922, -49.49266815185547, -46.989315032958984, -44.485965728759766, -41.98261260986328, -39.47926330566406, -36.97591018676758, -34.472557067871094, -31.969205856323242, -29.46585464477539, -26.96250343322754, -24.459152221679688, -21.955799102783203, -19.45244789123535, -16.9490966796875, -14.445744514465332, -11.942392349243164, -9.439041137695312, -6.935689449310303, -4.432337760925293, -1.9289860725402832, 0.5743656158447266, 3.077716827392578, 5.581068992614746, 8.084421157836914, 10.587772369384766, 13.091123580932617, 15.594475746154785, 18.097827911376953, 20.601179122924805, 23.104530334472656, 25.60788345336914, 28.111234664916992, 30.614585876464844, 33.11793899536133, 35.62128829956055, 38.12464141845703, 40.62799072265625, 43.131343841552734, 45.63469696044922, 48.13804626464844, 50.64139938354492, 53.144752502441406, 55.648101806640625, 58.15145492553711, 60.654808044433594, 63.15815734863281, 65.66150665283203, 68.16486358642578, 70.668212890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 32.0, 44.0, 69.0, 95.0, 152.0, 197.0, 315.0, 444.0, 679.0, 994.0, 1504.0, 2203.0, 3243.0, 5054.0, 7190.0, 10846.0, 16108.0, 24199.0, 36866.0, 57281.0, 89018.0, 142174.0, 203276.0, 159389.0, 100229.0, 64158.0, 41377.0, 27044.0, 17762.0, 11889.0, 8055.0, 5426.0, 3711.0, 2378.0, 1686.0, 1085.0, 757.0, 513.0, 335.0, 221.0, 146.0, 128.0, 64.0, 60.0, 34.0, 21.0, 26.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0], "bins": [-95.1875, -92.177734375, -89.16796875, -86.158203125, -83.1484375, -80.138671875, -77.12890625, -74.119140625, -71.109375, -68.099609375, -65.08984375, -62.080078125, -59.0703125, -56.060546875, -53.05078125, -50.041015625, -47.03125, -44.021484375, -41.01171875, -38.001953125, -34.9921875, -31.982421875, -28.97265625, -25.962890625, -22.953125, -19.943359375, -16.93359375, -13.923828125, -10.9140625, -7.904296875, -4.89453125, -1.884765625, 1.125, 4.134765625, 7.14453125, 10.154296875, 13.1640625, 16.173828125, 19.18359375, 22.193359375, 25.203125, 28.212890625, 31.22265625, 34.232421875, 37.2421875, 40.251953125, 43.26171875, 46.271484375, 49.28125, 52.291015625, 55.30078125, 58.310546875, 61.3203125, 64.330078125, 67.33984375, 70.349609375, 73.359375, 76.369140625, 79.37890625, 82.388671875, 85.3984375, 88.408203125, 91.41796875, 94.427734375, 97.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 8.0, 12.0, 16.0, 17.0, 24.0, 33.0, 33.0, 28.0, 34.0, 41.0, 28.0, 36.0, 43.0, 54.0, 49.0, 39.0, 39.0, 42.0, 43.0, 46.0, 37.0, 40.0, 35.0, 32.0, 34.0, 19.0, 18.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 11.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-93.0, -90.3916015625, -87.783203125, -85.1748046875, -82.56640625, -79.9580078125, -77.349609375, -74.7412109375, -72.1328125, -69.5244140625, -66.916015625, -64.3076171875, -61.69921875, -59.0908203125, -56.482421875, -53.8740234375, -51.265625, -48.6572265625, -46.048828125, -43.4404296875, -40.83203125, -38.2236328125, -35.615234375, -33.0068359375, -30.3984375, -27.7900390625, -25.181640625, -22.5732421875, -19.96484375, -17.3564453125, -14.748046875, -12.1396484375, -9.53125, -6.9228515625, -4.314453125, -1.7060546875, 0.90234375, 3.5107421875, 6.119140625, 8.7275390625, 11.3359375, 13.9443359375, 16.552734375, 19.1611328125, 21.76953125, 24.3779296875, 26.986328125, 29.5947265625, 32.203125, 34.8115234375, 37.419921875, 40.0283203125, 42.63671875, 45.2451171875, 47.853515625, 50.4619140625, 53.0703125, 55.6787109375, 58.287109375, 60.8955078125, 63.50390625, 66.1123046875, 68.720703125, 71.3291015625, 73.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 4.0, 5.0, 1.0, 6.0, 12.0, 16.0, 28.0, 31.0, 38.0, 58.0, 82.0, 120.0, 173.0, 260.0, 403.0, 604.0, 816.0, 1255.0, 1846.0, 2711.0, 4182.0, 6623.0, 10072.0, 15696.0, 24913.0, 39863.0, 63703.0, 104523.0, 167050.0, 211371.0, 147841.0, 90886.0, 56324.0, 34853.0, 22104.0, 14053.0, 8968.0, 5694.0, 3752.0, 2427.0, 1642.0, 1098.0, 739.0, 548.0, 323.0, 269.0, 186.0, 138.0, 73.0, 60.0, 35.0, 29.0, 18.0, 14.0, 10.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-129.375, -125.25, -121.125, -117.0, -112.875, -108.75, -104.625, -100.5, -96.375, -92.25, -88.125, -84.0, -79.875, -75.75, -71.625, -67.5, -63.375, -59.25, -55.125, -51.0, -46.875, -42.75, -38.625, -34.5, -30.375, -26.25, -22.125, -18.0, -13.875, -9.75, -5.625, -1.5, 2.625, 6.75, 10.875, 15.0, 19.125, 23.25, 27.375, 31.5, 35.625, 39.75, 43.875, 48.0, 52.125, 56.25, 60.375, 64.5, 68.625, 72.75, 76.875, 81.0, 85.125, 89.25, 93.375, 97.5, 101.625, 105.75, 109.875, 114.0, 118.125, 122.25, 126.375, 130.5, 134.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 12.0, 9.0, 13.0, 10.0, 11.0, 12.0, 21.0, 18.0, 27.0, 22.0, 30.0, 24.0, 21.0, 35.0, 31.0, 37.0, 57.0, 33.0, 42.0, 56.0, 51.0, 41.0, 28.0, 36.0, 38.0, 43.0, 30.0, 22.0, 34.0, 19.0, 22.0, 18.0, 17.0, 11.0, 13.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.099609375, -42.57421875, -41.048828125, -39.5234375, -37.998046875, -36.47265625, -34.947265625, -33.421875, -31.896484375, -30.37109375, -28.845703125, -27.3203125, -25.794921875, -24.26953125, -22.744140625, -21.21875, -19.693359375, -18.16796875, -16.642578125, -15.1171875, -13.591796875, -12.06640625, -10.541015625, -9.015625, -7.490234375, -5.96484375, -4.439453125, -2.9140625, -1.388671875, 0.13671875, 1.662109375, 3.1875, 4.712890625, 6.23828125, 7.763671875, 9.2890625, 10.814453125, 12.33984375, 13.865234375, 15.390625, 16.916015625, 18.44140625, 19.966796875, 21.4921875, 23.017578125, 24.54296875, 26.068359375, 27.59375, 29.119140625, 30.64453125, 32.169921875, 33.6953125, 35.220703125, 36.74609375, 38.271484375, 39.796875, 41.322265625, 42.84765625, 44.373046875, 45.8984375, 47.423828125, 48.94921875, 50.474609375, 52.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 21.0, 31.0, 36.0, 54.0, 85.0, 103.0, 169.0, 268.0, 396.0, 570.0, 924.0, 1300.0, 1935.0, 2953.0, 4609.0, 7268.0, 11211.0, 18543.0, 31490.0, 56343.0, 112241.0, 248774.0, 274061.0, 125109.0, 61803.0, 33886.0, 20235.0, 11931.0, 7785.0, 4947.0, 3153.0, 2072.0, 1416.0, 915.0, 616.0, 412.0, 300.0, 176.0, 144.0, 93.0, 62.0, 32.0, 26.0, 13.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-34.6875, -33.66943359375, -32.6513671875, -31.63330078125, -30.615234375, -29.59716796875, -28.5791015625, -27.56103515625, -26.54296875, -25.52490234375, -24.5068359375, -23.48876953125, -22.470703125, -21.45263671875, -20.4345703125, -19.41650390625, -18.3984375, -17.38037109375, -16.3623046875, -15.34423828125, -14.326171875, -13.30810546875, -12.2900390625, -11.27197265625, -10.25390625, -9.23583984375, -8.2177734375, -7.19970703125, -6.181640625, -5.16357421875, -4.1455078125, -3.12744140625, -2.109375, -1.09130859375, -0.0732421875, 0.94482421875, 1.962890625, 2.98095703125, 3.9990234375, 5.01708984375, 6.03515625, 7.05322265625, 8.0712890625, 9.08935546875, 10.107421875, 11.12548828125, 12.1435546875, 13.16162109375, 14.1796875, 15.19775390625, 16.2158203125, 17.23388671875, 18.251953125, 19.27001953125, 20.2880859375, 21.30615234375, 22.32421875, 23.34228515625, 24.3603515625, 25.37841796875, 26.396484375, 27.41455078125, 28.4326171875, 29.45068359375, 30.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 10.0, 9.0, 30.0, 32.0, 28.0, 68.0, 75.0, 114.0, 170.0, 127.0, 82.0, 69.0, 51.0, 36.0, 17.0, 17.0, 12.0, 4.0, 8.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00492095947265625, -0.0047539472579956055, -0.004586935043334961, -0.004419922828674316, -0.004252910614013672, -0.004085898399353027, -0.003918886184692383, -0.0037518739700317383, -0.0035848617553710938, -0.0034178495407104492, -0.0032508373260498047, -0.00308382511138916, -0.0029168128967285156, -0.002749800682067871, -0.0025827884674072266, -0.002415776252746582, -0.0022487640380859375, -0.002081751823425293, -0.0019147396087646484, -0.001747727394104004, -0.0015807151794433594, -0.0014137029647827148, -0.0012466907501220703, -0.0010796785354614258, -0.0009126663208007812, -0.0007456541061401367, -0.0005786418914794922, -0.00041162967681884766, -0.0002446174621582031, -7.76052474975586e-05, 8.940696716308594e-05, 0.00025641918182373047, 0.000423431396484375, 0.0005904436111450195, 0.0007574558258056641, 0.0009244680404663086, 0.0010914802551269531, 0.0012584924697875977, 0.0014255046844482422, 0.0015925168991088867, 0.0017595291137695312, 0.0019265413284301758, 0.0020935535430908203, 0.002260565757751465, 0.0024275779724121094, 0.002594590187072754, 0.0027616024017333984, 0.002928614616394043, 0.0030956268310546875, 0.003262639045715332, 0.0034296512603759766, 0.003596663475036621, 0.0037636756896972656, 0.00393068790435791, 0.004097700119018555, 0.004264712333679199, 0.004431724548339844, 0.004598736763000488, 0.004765748977661133, 0.004932761192321777, 0.005099773406982422, 0.005266785621643066, 0.005433797836303711, 0.0056008100509643555, 0.005767822265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 10.0, 13.0, 24.0, 26.0, 55.0, 53.0, 79.0, 145.0, 190.0, 284.0, 373.0, 503.0, 686.0, 1005.0, 1281.0, 1882.0, 2659.0, 3780.0, 5578.0, 8129.0, 12536.0, 19250.0, 30144.0, 50059.0, 89445.0, 168913.0, 255632.0, 168325.0, 89393.0, 49738.0, 30067.0, 19065.0, 12491.0, 8205.0, 5482.0, 3802.0, 2599.0, 1838.0, 1351.0, 896.0, 697.0, 541.0, 409.0, 285.0, 199.0, 134.0, 108.0, 58.0, 40.0, 39.0, 26.0, 11.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0], "bins": [-25.578125, -24.791015625, -24.00390625, -23.216796875, -22.4296875, -21.642578125, -20.85546875, -20.068359375, -19.28125, -18.494140625, -17.70703125, -16.919921875, -16.1328125, -15.345703125, -14.55859375, -13.771484375, -12.984375, -12.197265625, -11.41015625, -10.623046875, -9.8359375, -9.048828125, -8.26171875, -7.474609375, -6.6875, -5.900390625, -5.11328125, -4.326171875, -3.5390625, -2.751953125, -1.96484375, -1.177734375, -0.390625, 0.396484375, 1.18359375, 1.970703125, 2.7578125, 3.544921875, 4.33203125, 5.119140625, 5.90625, 6.693359375, 7.48046875, 8.267578125, 9.0546875, 9.841796875, 10.62890625, 11.416015625, 12.203125, 12.990234375, 13.77734375, 14.564453125, 15.3515625, 16.138671875, 16.92578125, 17.712890625, 18.5, 19.287109375, 20.07421875, 20.861328125, 21.6484375, 22.435546875, 23.22265625, 24.009765625, 24.796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 11.0, 5.0, 5.0, 14.0, 13.0, 15.0, 15.0, 28.0, 25.0, 36.0, 30.0, 41.0, 41.0, 49.0, 61.0, 74.0, 63.0, 67.0, 51.0, 67.0, 41.0, 30.0, 23.0, 30.0, 25.0, 25.0, 16.0, 16.0, 20.0, 5.0, 9.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.677490234375, -9.38623046875, -9.094970703125, -8.8037109375, -8.512451171875, -8.22119140625, -7.929931640625, -7.638671875, -7.347412109375, -7.05615234375, -6.764892578125, -6.4736328125, -6.182373046875, -5.89111328125, -5.599853515625, -5.30859375, -5.017333984375, -4.72607421875, -4.434814453125, -4.1435546875, -3.852294921875, -3.56103515625, -3.269775390625, -2.978515625, -2.687255859375, -2.39599609375, -2.104736328125, -1.8134765625, -1.522216796875, -1.23095703125, -0.939697265625, -0.6484375, -0.357177734375, -0.06591796875, 0.225341796875, 0.5166015625, 0.807861328125, 1.09912109375, 1.390380859375, 1.681640625, 1.972900390625, 2.26416015625, 2.555419921875, 2.8466796875, 3.137939453125, 3.42919921875, 3.720458984375, 4.01171875, 4.302978515625, 4.59423828125, 4.885498046875, 5.1767578125, 5.468017578125, 5.75927734375, 6.050537109375, 6.341796875, 6.633056640625, 6.92431640625, 7.215576171875, 7.5068359375, 7.798095703125, 8.08935546875, 8.380615234375, 8.671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 17.0, 14.0, 20.0, 25.0, 27.0, 37.0, 40.0, 40.0, 65.0, 77.0, 86.0, 73.0, 80.0, 78.0, 72.0, 46.0, 32.0, 43.0, 30.0, 16.0, 11.0, 12.0, 11.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-133.5307159423828, -129.7549285888672, -125.9791488647461, -122.20336151123047, -118.42757415771484, -114.65179443359375, -110.87600708007812, -107.1002197265625, -103.32443237304688, -99.54864501953125, -95.77286529541016, -91.99707794189453, -88.2212905883789, -84.44551086425781, -80.66972351074219, -76.89393615722656, -73.11815643310547, -69.34236907958984, -65.56658935546875, -61.790802001953125, -58.0150146484375, -54.23923110961914, -50.46344757080078, -46.687660217285156, -42.9118766784668, -39.13609313964844, -35.36030578613281, -31.584522247314453, -27.80873680114746, -24.03295135498047, -20.25716781616211, -16.481382369995117, -12.705589294433594, -8.929803848266602, -5.154019355773926, -1.37823486328125, 2.397550582885742, 6.173336029052734, 9.949119567871094, 13.724905014038086, 17.500690460205078, 21.27647590637207, 25.052261352539062, 28.828044891357422, 32.60382843017578, 36.379615783691406, 40.155399322509766, 43.931182861328125, 47.70697021484375, 51.48275375366211, 55.258541107177734, 59.034324645996094, 62.81011199951172, 66.58589172363281, 70.36167907714844, 74.13746643066406, 77.91325378417969, 81.68904113769531, 85.4648208618164, 89.24060821533203, 93.01639556884766, 96.79217529296875, 100.56796264648438, 104.34375, 108.1195297241211]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 8.0, 10.0, 11.0, 18.0, 24.0, 15.0, 20.0, 22.0, 27.0, 35.0, 36.0, 34.0, 40.0, 58.0, 35.0, 50.0, 37.0, 34.0, 32.0, 52.0, 38.0, 48.0, 31.0, 25.0, 35.0, 28.0, 32.0, 17.0, 17.0, 17.0, 14.0, 10.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-87.68623352050781, -85.16998291015625, -82.65373992919922, -80.13748931884766, -77.62124633789062, -75.10499572753906, -72.58875274658203, -70.07250213623047, -67.55625915527344, -65.04000854492188, -62.523765563964844, -60.00751876831055, -57.49127197265625, -54.97502136230469, -52.45877456665039, -49.942527770996094, -47.42627716064453, -44.910030364990234, -42.39378356933594, -39.87753677368164, -37.361289978027344, -34.84503936767578, -32.328792572021484, -29.812545776367188, -27.29629898071289, -24.780052185058594, -22.263805389404297, -19.747556686401367, -17.23130989074707, -14.715063095092773, -12.19881534576416, -9.682567596435547, -7.166313171386719, -4.650065898895264, -2.1338186264038086, 0.3824286460876465, 2.8986759185791016, 5.414922714233398, 7.931170463562012, 10.447418212890625, 12.963665008544922, 15.479911804199219, 17.996158599853516, 20.512407302856445, 23.028654098510742, 25.54490089416504, 28.06114959716797, 30.577396392822266, 33.09364318847656, 35.60988998413086, 38.126136779785156, 40.64238357543945, 43.15863037109375, 45.67488098144531, 48.19112777709961, 50.707374572753906, 53.2236213684082, 55.7398681640625, 58.2561149597168, 60.772361755371094, 63.288612365722656, 65.80485534667969, 68.32110595703125, 70.83735656738281, 73.35359954833984]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 19.0, 14.0, 29.0, 32.0, 55.0, 74.0, 103.0, 119.0, 210.0, 282.0, 412.0, 556.0, 895.0, 1187.0, 1883.0, 2776.0, 4309.0, 6704.0, 10315.0, 17003.0, 28306.0, 48684.0, 88053.0, 187379.0, 630551.0, 1835347.0, 857478.0, 225933.0, 101559.0, 55886.0, 32868.0, 19804.0, 12638.0, 8068.0, 5071.0, 3309.0, 2185.0, 1377.0, 940.0, 616.0, 411.0, 274.0, 193.0, 130.0, 78.0, 56.0, 38.0, 23.0, 8.0, 7.0, 13.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-133.75, -129.6484375, -125.546875, -121.4453125, -117.34375, -113.2421875, -109.140625, -105.0390625, -100.9375, -96.8359375, -92.734375, -88.6328125, -84.53125, -80.4296875, -76.328125, -72.2265625, -68.125, -64.0234375, -59.921875, -55.8203125, -51.71875, -47.6171875, -43.515625, -39.4140625, -35.3125, -31.2109375, -27.109375, -23.0078125, -18.90625, -14.8046875, -10.703125, -6.6015625, -2.5, 1.6015625, 5.703125, 9.8046875, 13.90625, 18.0078125, 22.109375, 26.2109375, 30.3125, 34.4140625, 38.515625, 42.6171875, 46.71875, 50.8203125, 54.921875, 59.0234375, 63.125, 67.2265625, 71.328125, 75.4296875, 79.53125, 83.6328125, 87.734375, 91.8359375, 95.9375, 100.0390625, 104.140625, 108.2421875, 112.34375, 116.4453125, 120.546875, 124.6484375, 128.75]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 14.0, 11.0, 11.0, 20.0, 20.0, 22.0, 17.0, 32.0, 26.0, 26.0, 38.0, 52.0, 47.0, 46.0, 47.0, 42.0, 46.0, 32.0, 48.0, 42.0, 36.0, 39.0, 33.0, 37.0, 30.0, 24.0, 31.0, 16.0, 16.0, 18.0, 15.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-72.25, -70.15234375, -68.0546875, -65.95703125, -63.859375, -61.76171875, -59.6640625, -57.56640625, -55.46875, -53.37109375, -51.2734375, -49.17578125, -47.078125, -44.98046875, -42.8828125, -40.78515625, -38.6875, -36.58984375, -34.4921875, -32.39453125, -30.296875, -28.19921875, -26.1015625, -24.00390625, -21.90625, -19.80859375, -17.7109375, -15.61328125, -13.515625, -11.41796875, -9.3203125, -7.22265625, -5.125, -3.02734375, -0.9296875, 1.16796875, 3.265625, 5.36328125, 7.4609375, 9.55859375, 11.65625, 13.75390625, 15.8515625, 17.94921875, 20.046875, 22.14453125, 24.2421875, 26.33984375, 28.4375, 30.53515625, 32.6328125, 34.73046875, 36.828125, 38.92578125, 41.0234375, 43.12109375, 45.21875, 47.31640625, 49.4140625, 51.51171875, 53.609375, 55.70703125, 57.8046875, 59.90234375, 62.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 19.0, 17.0, 40.0, 50.0, 89.0, 114.0, 193.0, 280.0, 424.0, 602.0, 905.0, 1415.0, 2100.0, 3419.0, 5309.0, 8701.0, 13909.0, 23288.0, 40078.0, 72269.0, 138113.0, 291672.0, 795463.0, 1711127.0, 583313.0, 235998.0, 115113.0, 61729.0, 34852.0, 20393.0, 12335.0, 7590.0, 4657.0, 3061.0, 1885.0, 1269.0, 812.0, 571.0, 349.0, 246.0, 159.0, 101.0, 82.0, 44.0, 29.0, 29.0, 19.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-115.5, -111.931640625, -108.36328125, -104.794921875, -101.2265625, -97.658203125, -94.08984375, -90.521484375, -86.953125, -83.384765625, -79.81640625, -76.248046875, -72.6796875, -69.111328125, -65.54296875, -61.974609375, -58.40625, -54.837890625, -51.26953125, -47.701171875, -44.1328125, -40.564453125, -36.99609375, -33.427734375, -29.859375, -26.291015625, -22.72265625, -19.154296875, -15.5859375, -12.017578125, -8.44921875, -4.880859375, -1.3125, 2.255859375, 5.82421875, 9.392578125, 12.9609375, 16.529296875, 20.09765625, 23.666015625, 27.234375, 30.802734375, 34.37109375, 37.939453125, 41.5078125, 45.076171875, 48.64453125, 52.212890625, 55.78125, 59.349609375, 62.91796875, 66.486328125, 70.0546875, 73.623046875, 77.19140625, 80.759765625, 84.328125, 87.896484375, 91.46484375, 95.033203125, 98.6015625, 102.169921875, 105.73828125, 109.306640625, 112.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 6.0, 10.0, 9.0, 14.0, 20.0, 19.0, 21.0, 30.0, 34.0, 35.0, 45.0, 62.0, 86.0, 87.0, 117.0, 158.0, 162.0, 239.0, 259.0, 396.0, 427.0, 376.0, 284.0, 231.0, 190.0, 127.0, 121.0, 113.0, 83.0, 68.0, 47.0, 36.0, 32.0, 23.0, 27.0, 12.0, 11.0, 9.0, 8.0, 16.0, 11.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4033203125, -33.275390625, -32.1474609375, -31.01953125, -29.8916015625, -28.763671875, -27.6357421875, -26.5078125, -25.3798828125, -24.251953125, -23.1240234375, -21.99609375, -20.8681640625, -19.740234375, -18.6123046875, -17.484375, -16.3564453125, -15.228515625, -14.1005859375, -12.97265625, -11.8447265625, -10.716796875, -9.5888671875, -8.4609375, -7.3330078125, -6.205078125, -5.0771484375, -3.94921875, -2.8212890625, -1.693359375, -0.5654296875, 0.5625, 1.6904296875, 2.818359375, 3.9462890625, 5.07421875, 6.2021484375, 7.330078125, 8.4580078125, 9.5859375, 10.7138671875, 11.841796875, 12.9697265625, 14.09765625, 15.2255859375, 16.353515625, 17.4814453125, 18.609375, 19.7373046875, 20.865234375, 21.9931640625, 23.12109375, 24.2490234375, 25.376953125, 26.5048828125, 27.6328125, 28.7607421875, 29.888671875, 31.0166015625, 32.14453125, 33.2724609375, 34.400390625, 35.5283203125, 36.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 5.0, 20.0, 24.0, 27.0, 39.0, 28.0, 41.0, 41.0, 66.0, 80.0, 75.0, 93.0, 101.0, 62.0, 61.0, 46.0, 34.0, 31.0, 28.0, 20.0, 13.0, 13.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-138.45950317382812, -134.84710693359375, -131.2346954345703, -127.6222915649414, -124.0098876953125, -120.3974838256836, -116.78507995605469, -113.17267608642578, -109.56027221679688, -105.94786834716797, -102.33546447753906, -98.72306060791016, -95.11065673828125, -91.49825286865234, -87.88584899902344, -84.27344512939453, -80.66104125976562, -77.04863739013672, -73.43623352050781, -69.8238296508789, -66.21142578125, -62.599021911621094, -58.98661804199219, -55.37421417236328, -51.761810302734375, -48.14940643310547, -44.53700256347656, -40.924598693847656, -37.31219482421875, -33.699790954589844, -30.087387084960938, -26.47498321533203, -22.862579345703125, -19.25017547607422, -15.637771606445312, -12.025367736816406, -8.4129638671875, -4.800559997558594, -1.1881561279296875, 2.4242477416992188, 6.036651611328125, 9.649055480957031, 13.261459350585938, 16.873863220214844, 20.48626708984375, 24.098670959472656, 27.711074829101562, 31.32347869873047, 34.935882568359375, 38.54828643798828, 42.16069030761719, 45.773094177246094, 49.385498046875, 52.997901916503906, 56.61030578613281, 60.22270965576172, 63.835113525390625, 67.44751739501953, 71.05992126464844, 74.67232513427734, 78.28472900390625, 81.89713287353516, 85.50953674316406, 89.12194061279297, 92.73434448242188]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 10.0, 8.0, 7.0, 14.0, 22.0, 21.0, 29.0, 28.0, 23.0, 28.0, 37.0, 30.0, 36.0, 54.0, 43.0, 43.0, 52.0, 48.0, 48.0, 43.0, 36.0, 32.0, 33.0, 30.0, 32.0, 32.0, 30.0, 15.0, 16.0, 16.0, 15.0, 13.0, 11.0, 10.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.64378356933594, -71.24819946289062, -68.85261535644531, -66.45703887939453, -64.06145477294922, -61.665870666503906, -59.270286560058594, -56.87470245361328, -54.479122161865234, -52.08353805541992, -49.687957763671875, -47.29237365722656, -44.89678955078125, -42.5012092590332, -40.10562515258789, -37.710044860839844, -35.31446075439453, -32.91887664794922, -30.523296356201172, -28.12771224975586, -25.73213005065918, -23.3365478515625, -20.940963745117188, -18.545381546020508, -16.149799346923828, -13.754217147827148, -11.358633995056152, -8.963050842285156, -6.567468643188477, -4.171886444091797, -1.7763032913208008, 0.6192798614501953, 3.0148544311523438, 5.410437107086182, 7.8060197830200195, 10.201602935791016, 12.597185134887695, 14.992767333984375, 17.388351440429688, 19.783933639526367, 22.179515838623047, 24.575098037719727, 26.970680236816406, 29.36626434326172, 31.7618465423584, 34.15742874145508, 36.55301284790039, 38.94859313964844, 41.34417724609375, 43.73976135253906, 46.13534164428711, 48.53092575073242, 50.92650604248047, 53.32209014892578, 55.717674255371094, 58.113258361816406, 60.50883865356445, 62.904422760009766, 65.30000305175781, 67.69558715820312, 70.09117126464844, 72.48675537109375, 74.88233184814453, 77.27791595458984, 79.67350006103516]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 14.0, 21.0, 33.0, 41.0, 58.0, 69.0, 122.0, 198.0, 276.0, 397.0, 624.0, 912.0, 1322.0, 1827.0, 2915.0, 4343.0, 6503.0, 9940.0, 15338.0, 23651.0, 36824.0, 58933.0, 93955.0, 150048.0, 202967.0, 160531.0, 101126.0, 62567.0, 39714.0, 25510.0, 16402.0, 10563.0, 6899.0, 4569.0, 3042.0, 2045.0, 1306.0, 932.0, 638.0, 464.0, 291.0, 180.0, 142.0, 113.0, 68.0, 33.0, 22.0, 22.0, 19.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-97.5625, -94.47265625, -91.3828125, -88.29296875, -85.203125, -82.11328125, -79.0234375, -75.93359375, -72.84375, -69.75390625, -66.6640625, -63.57421875, -60.484375, -57.39453125, -54.3046875, -51.21484375, -48.125, -45.03515625, -41.9453125, -38.85546875, -35.765625, -32.67578125, -29.5859375, -26.49609375, -23.40625, -20.31640625, -17.2265625, -14.13671875, -11.046875, -7.95703125, -4.8671875, -1.77734375, 1.3125, 4.40234375, 7.4921875, 10.58203125, 13.671875, 16.76171875, 19.8515625, 22.94140625, 26.03125, 29.12109375, 32.2109375, 35.30078125, 38.390625, 41.48046875, 44.5703125, 47.66015625, 50.75, 53.83984375, 56.9296875, 60.01953125, 63.109375, 66.19921875, 69.2890625, 72.37890625, 75.46875, 78.55859375, 81.6484375, 84.73828125, 87.828125, 90.91796875, 94.0078125, 97.09765625, 100.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 1.0, 6.0, 7.0, 8.0, 11.0, 15.0, 14.0, 19.0, 31.0, 25.0, 28.0, 35.0, 26.0, 36.0, 49.0, 52.0, 34.0, 49.0, 52.0, 57.0, 56.0, 36.0, 37.0, 28.0, 43.0, 32.0, 34.0, 33.0, 25.0, 17.0, 17.0, 13.0, 13.0, 11.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5625, -62.53515625, -60.5078125, -58.48046875, -56.453125, -54.42578125, -52.3984375, -50.37109375, -48.34375, -46.31640625, -44.2890625, -42.26171875, -40.234375, -38.20703125, -36.1796875, -34.15234375, -32.125, -30.09765625, -28.0703125, -26.04296875, -24.015625, -21.98828125, -19.9609375, -17.93359375, -15.90625, -13.87890625, -11.8515625, -9.82421875, -7.796875, -5.76953125, -3.7421875, -1.71484375, 0.3125, 2.33984375, 4.3671875, 6.39453125, 8.421875, 10.44921875, 12.4765625, 14.50390625, 16.53125, 18.55859375, 20.5859375, 22.61328125, 24.640625, 26.66796875, 28.6953125, 30.72265625, 32.75, 34.77734375, 36.8046875, 38.83203125, 40.859375, 42.88671875, 44.9140625, 46.94140625, 48.96875, 50.99609375, 53.0234375, 55.05078125, 57.078125, 59.10546875, 61.1328125, 63.16015625, 65.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 15.0, 14.0, 26.0, 29.0, 51.0, 71.0, 89.0, 134.0, 204.0, 268.0, 452.0, 605.0, 999.0, 1445.0, 2177.0, 3375.0, 5440.0, 8817.0, 14969.0, 26013.0, 47212.0, 91576.0, 193380.0, 301798.0, 167041.0, 80722.0, 42159.0, 23484.0, 13572.0, 8147.0, 4956.0, 3176.0, 2060.0, 1354.0, 881.0, 593.0, 375.0, 281.0, 208.0, 131.0, 84.0, 70.0, 40.0, 21.0, 16.0, 11.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-169.5, -164.26953125, -159.0390625, -153.80859375, -148.578125, -143.34765625, -138.1171875, -132.88671875, -127.65625, -122.42578125, -117.1953125, -111.96484375, -106.734375, -101.50390625, -96.2734375, -91.04296875, -85.8125, -80.58203125, -75.3515625, -70.12109375, -64.890625, -59.66015625, -54.4296875, -49.19921875, -43.96875, -38.73828125, -33.5078125, -28.27734375, -23.046875, -17.81640625, -12.5859375, -7.35546875, -2.125, 3.10546875, 8.3359375, 13.56640625, 18.796875, 24.02734375, 29.2578125, 34.48828125, 39.71875, 44.94921875, 50.1796875, 55.41015625, 60.640625, 65.87109375, 71.1015625, 76.33203125, 81.5625, 86.79296875, 92.0234375, 97.25390625, 102.484375, 107.71484375, 112.9453125, 118.17578125, 123.40625, 128.63671875, 133.8671875, 139.09765625, 144.328125, 149.55859375, 154.7890625, 160.01953125, 165.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 7.0, 8.0, 14.0, 14.0, 14.0, 25.0, 21.0, 16.0, 27.0, 38.0, 37.0, 28.0, 42.0, 46.0, 37.0, 41.0, 45.0, 43.0, 33.0, 51.0, 34.0, 37.0, 35.0, 34.0, 43.0, 24.0, 22.0, 25.0, 23.0, 13.0, 15.0, 16.0, 12.0, 9.0, 6.0, 8.0, 5.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-56.5625, -54.79833984375, -53.0341796875, -51.27001953125, -49.505859375, -47.74169921875, -45.9775390625, -44.21337890625, -42.44921875, -40.68505859375, -38.9208984375, -37.15673828125, -35.392578125, -33.62841796875, -31.8642578125, -30.10009765625, -28.3359375, -26.57177734375, -24.8076171875, -23.04345703125, -21.279296875, -19.51513671875, -17.7509765625, -15.98681640625, -14.22265625, -12.45849609375, -10.6943359375, -8.93017578125, -7.166015625, -5.40185546875, -3.6376953125, -1.87353515625, -0.109375, 1.65478515625, 3.4189453125, 5.18310546875, 6.947265625, 8.71142578125, 10.4755859375, 12.23974609375, 14.00390625, 15.76806640625, 17.5322265625, 19.29638671875, 21.060546875, 22.82470703125, 24.5888671875, 26.35302734375, 28.1171875, 29.88134765625, 31.6455078125, 33.40966796875, 35.173828125, 36.93798828125, 38.7021484375, 40.46630859375, 42.23046875, 43.99462890625, 45.7587890625, 47.52294921875, 49.287109375, 51.05126953125, 52.8154296875, 54.57958984375, 56.34375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 19.0, 22.0, 36.0, 50.0, 72.0, 108.0, 169.0, 198.0, 375.0, 600.0, 883.0, 1375.0, 2328.0, 3837.0, 6596.0, 12337.0, 26910.0, 79133.0, 524016.0, 285298.0, 57454.0, 21479.0, 10566.0, 5634.0, 3358.0, 2069.0, 1290.0, 849.0, 532.0, 327.0, 205.0, 138.0, 82.0, 72.0, 48.0, 25.0, 16.0, 7.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-88.6875, -86.0693359375, -83.451171875, -80.8330078125, -78.21484375, -75.5966796875, -72.978515625, -70.3603515625, -67.7421875, -65.1240234375, -62.505859375, -59.8876953125, -57.26953125, -54.6513671875, -52.033203125, -49.4150390625, -46.796875, -44.1787109375, -41.560546875, -38.9423828125, -36.32421875, -33.7060546875, -31.087890625, -28.4697265625, -25.8515625, -23.2333984375, -20.615234375, -17.9970703125, -15.37890625, -12.7607421875, -10.142578125, -7.5244140625, -4.90625, -2.2880859375, 0.330078125, 2.9482421875, 5.56640625, 8.1845703125, 10.802734375, 13.4208984375, 16.0390625, 18.6572265625, 21.275390625, 23.8935546875, 26.51171875, 29.1298828125, 31.748046875, 34.3662109375, 36.984375, 39.6025390625, 42.220703125, 44.8388671875, 47.45703125, 50.0751953125, 52.693359375, 55.3115234375, 57.9296875, 60.5478515625, 63.166015625, 65.7841796875, 68.40234375, 71.0205078125, 73.638671875, 76.2568359375, 78.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 19.0, 24.0, 52.0, 98.0, 225.0, 281.0, 89.0, 72.0, 40.0, 12.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012359619140625, -0.011920452117919922, -0.011481285095214844, -0.011042118072509766, -0.010602951049804688, -0.01016378402709961, -0.009724617004394531, -0.009285449981689453, -0.008846282958984375, -0.008407115936279297, -0.007967948913574219, -0.007528781890869141, -0.0070896148681640625, -0.006650447845458984, -0.006211280822753906, -0.005772113800048828, -0.00533294677734375, -0.004893779754638672, -0.004454612731933594, -0.004015445709228516, -0.0035762786865234375, -0.0031371116638183594, -0.0026979446411132812, -0.002258777618408203, -0.001819610595703125, -0.0013804435729980469, -0.0009412765502929688, -0.0005021095275878906, -6.29425048828125e-05, 0.0003762245178222656, 0.0008153915405273438, 0.0012545585632324219, 0.0016937255859375, 0.002132892608642578, 0.0025720596313476562, 0.0030112266540527344, 0.0034503936767578125, 0.0038895606994628906, 0.004328727722167969, 0.004767894744873047, 0.005207061767578125, 0.005646228790283203, 0.006085395812988281, 0.006524562835693359, 0.0069637298583984375, 0.007402896881103516, 0.007842063903808594, 0.008281230926513672, 0.00872039794921875, 0.009159564971923828, 0.009598731994628906, 0.010037899017333984, 0.010477066040039062, 0.01091623306274414, 0.011355400085449219, 0.011794567108154297, 0.012233734130859375, 0.012672901153564453, 0.013112068176269531, 0.01355123519897461, 0.013990402221679688, 0.014429569244384766, 0.014868736267089844, 0.015307903289794922, 0.0157470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 13.0, 11.0, 18.0, 18.0, 37.0, 50.0, 56.0, 118.0, 166.0, 231.0, 381.0, 534.0, 854.0, 1202.0, 1742.0, 2720.0, 4026.0, 5883.0, 9786.0, 17114.0, 32652.0, 81597.0, 320462.0, 393386.0, 92535.0, 35811.0, 17655.0, 10295.0, 6364.0, 4159.0, 2898.0, 1953.0, 1228.0, 845.0, 603.0, 377.0, 224.0, 169.0, 115.0, 84.0, 53.0, 33.0, 31.0, 19.0, 17.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-73.6875, -71.388671875, -69.08984375, -66.791015625, -64.4921875, -62.193359375, -59.89453125, -57.595703125, -55.296875, -52.998046875, -50.69921875, -48.400390625, -46.1015625, -43.802734375, -41.50390625, -39.205078125, -36.90625, -34.607421875, -32.30859375, -30.009765625, -27.7109375, -25.412109375, -23.11328125, -20.814453125, -18.515625, -16.216796875, -13.91796875, -11.619140625, -9.3203125, -7.021484375, -4.72265625, -2.423828125, -0.125, 2.173828125, 4.47265625, 6.771484375, 9.0703125, 11.369140625, 13.66796875, 15.966796875, 18.265625, 20.564453125, 22.86328125, 25.162109375, 27.4609375, 29.759765625, 32.05859375, 34.357421875, 36.65625, 38.955078125, 41.25390625, 43.552734375, 45.8515625, 48.150390625, 50.44921875, 52.748046875, 55.046875, 57.345703125, 59.64453125, 61.943359375, 64.2421875, 66.541015625, 68.83984375, 71.138671875, 73.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 8.0, 6.0, 5.0, 6.0, 13.0, 16.0, 24.0, 29.0, 28.0, 50.0, 63.0, 83.0, 123.0, 141.0, 78.0, 66.0, 46.0, 29.0, 34.0, 30.0, 21.0, 15.0, 8.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.52734375, -17.8203125, -17.11328125, -16.40625, -15.69921875, -14.9921875, -14.28515625, -13.578125, -12.87109375, -12.1640625, -11.45703125, -10.75, -10.04296875, -9.3359375, -8.62890625, -7.921875, -7.21484375, -6.5078125, -5.80078125, -5.09375, -4.38671875, -3.6796875, -2.97265625, -2.265625, -1.55859375, -0.8515625, -0.14453125, 0.5625, 1.26953125, 1.9765625, 2.68359375, 3.390625, 4.09765625, 4.8046875, 5.51171875, 6.21875, 6.92578125, 7.6328125, 8.33984375, 9.046875, 9.75390625, 10.4609375, 11.16796875, 11.875, 12.58203125, 13.2890625, 13.99609375, 14.703125, 15.41015625, 16.1171875, 16.82421875, 17.53125, 18.23828125, 18.9453125, 19.65234375, 20.359375, 21.06640625, 21.7734375, 22.48046875, 23.1875, 23.89453125, 24.6015625, 25.30859375, 26.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 10.0, 13.0, 22.0, 28.0, 41.0, 52.0, 77.0, 106.0, 129.0, 123.0, 121.0, 73.0, 54.0, 46.0, 29.0, 23.0, 19.0, 14.0, 8.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.34735107421875, -130.0435333251953, -125.73973083496094, -121.4359130859375, -117.1321029663086, -112.82829284667969, -108.52448272705078, -104.22067260742188, -99.91685485839844, -95.61304473876953, -91.30923461914062, -87.00541687011719, -82.70160675048828, -78.39779663085938, -74.09398651123047, -69.79017639160156, -65.48636627197266, -61.18255615234375, -56.87874221801758, -52.57493209838867, -48.2711181640625, -43.967308044433594, -39.66349792480469, -35.35968780517578, -31.05587387084961, -26.75206184387207, -22.44824981689453, -18.144439697265625, -13.840627670288086, -9.536815643310547, -5.233005523681641, -0.9291934967041016, 3.3746185302734375, 7.678430080413818, 11.9822416305542, 16.286052703857422, 20.58986473083496, 24.8936767578125, 29.197486877441406, 33.50129699707031, 37.805110931396484, 42.10892105102539, 46.41273498535156, 50.71654510498047, 55.020355224609375, 59.32416915893555, 63.62797927856445, 67.93179321289062, 72.23560333251953, 76.53941345214844, 80.84322357177734, 85.14703369140625, 89.45085144042969, 93.7546615600586, 98.0584716796875, 102.3622817993164, 106.66609191894531, 110.96990203857422, 115.27371215820312, 119.57752990722656, 123.88134002685547, 128.18515014648438, 132.48895263671875, 136.7927703857422, 141.09658813476562]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 11.0, 0.0, 2.0, 7.0, 7.0, 10.0, 7.0, 14.0, 14.0, 12.0, 23.0, 32.0, 28.0, 33.0, 34.0, 41.0, 29.0, 42.0, 36.0, 51.0, 47.0, 51.0, 44.0, 39.0, 40.0, 42.0, 30.0, 33.0, 29.0, 30.0, 27.0, 28.0, 22.0, 17.0, 12.0, 16.0, 7.0, 8.0, 14.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.6181526184082, -61.656272888183594, -59.694393157958984, -57.732513427734375, -55.770633697509766, -53.808753967285156, -51.84687423706055, -49.88499450683594, -47.92311477661133, -45.96123504638672, -43.99935531616211, -42.0374755859375, -40.07559585571289, -38.11371612548828, -36.15183639526367, -34.18995666503906, -32.22807693481445, -30.266197204589844, -28.304317474365234, -26.342437744140625, -24.380558013916016, -22.418678283691406, -20.456798553466797, -18.494918823242188, -16.533039093017578, -14.571159362792969, -12.60927963256836, -10.64739990234375, -8.68552017211914, -6.723640441894531, -4.761760711669922, -2.7998809814453125, -0.8380050659179688, 1.1238746643066406, 3.08575439453125, 5.047634124755859, 7.009513854980469, 8.971393585205078, 10.933273315429688, 12.895153045654297, 14.857032775878906, 16.818912506103516, 18.780792236328125, 20.742671966552734, 22.704551696777344, 24.666431427001953, 26.628311157226562, 28.590190887451172, 30.55207061767578, 32.51395034790039, 34.475830078125, 36.43770980834961, 38.39958953857422, 40.36146926879883, 42.32334899902344, 44.28522872924805, 46.247108459472656, 48.208988189697266, 50.170867919921875, 52.132747650146484, 54.094627380371094, 56.0565071105957, 58.01838684082031, 59.98026657104492, 61.94214630126953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 12.0, 16.0, 19.0, 34.0, 46.0, 61.0, 98.0, 141.0, 229.0, 331.0, 459.0, 718.0, 1187.0, 1768.0, 2722.0, 4268.0, 6802.0, 10662.0, 17295.0, 28020.0, 46306.0, 76621.0, 127731.0, 204091.0, 201055.0, 124722.0, 74656.0, 45253.0, 27464.0, 16742.0, 10535.0, 6455.0, 4175.0, 2676.0, 1787.0, 1200.0, 748.0, 482.0, 333.0, 203.0, 138.0, 109.0, 66.0, 41.0, 27.0, 19.0, 10.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-75.1875, -72.974609375, -70.76171875, -68.548828125, -66.3359375, -64.123046875, -61.91015625, -59.697265625, -57.484375, -55.271484375, -53.05859375, -50.845703125, -48.6328125, -46.419921875, -44.20703125, -41.994140625, -39.78125, -37.568359375, -35.35546875, -33.142578125, -30.9296875, -28.716796875, -26.50390625, -24.291015625, -22.078125, -19.865234375, -17.65234375, -15.439453125, -13.2265625, -11.013671875, -8.80078125, -6.587890625, -4.375, -2.162109375, 0.05078125, 2.263671875, 4.4765625, 6.689453125, 8.90234375, 11.115234375, 13.328125, 15.541015625, 17.75390625, 19.966796875, 22.1796875, 24.392578125, 26.60546875, 28.818359375, 31.03125, 33.244140625, 35.45703125, 37.669921875, 39.8828125, 42.095703125, 44.30859375, 46.521484375, 48.734375, 50.947265625, 53.16015625, 55.373046875, 57.5859375, 59.798828125, 62.01171875, 64.224609375, 66.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 10.0, 15.0, 12.0, 26.0, 22.0, 22.0, 30.0, 31.0, 39.0, 41.0, 33.0, 35.0, 47.0, 44.0, 54.0, 45.0, 36.0, 39.0, 48.0, 31.0, 45.0, 40.0, 28.0, 30.0, 23.0, 23.0, 17.0, 20.0, 16.0, 12.0, 9.0, 4.0, 3.0, 12.0, 9.0, 1.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0625, -52.27001953125, -50.4775390625, -48.68505859375, -46.892578125, -45.10009765625, -43.3076171875, -41.51513671875, -39.72265625, -37.93017578125, -36.1376953125, -34.34521484375, -32.552734375, -30.76025390625, -28.9677734375, -27.17529296875, -25.3828125, -23.59033203125, -21.7978515625, -20.00537109375, -18.212890625, -16.42041015625, -14.6279296875, -12.83544921875, -11.04296875, -9.25048828125, -7.4580078125, -5.66552734375, -3.873046875, -2.08056640625, -0.2880859375, 1.50439453125, 3.296875, 5.08935546875, 6.8818359375, 8.67431640625, 10.466796875, 12.25927734375, 14.0517578125, 15.84423828125, 17.63671875, 19.42919921875, 21.2216796875, 23.01416015625, 24.806640625, 26.59912109375, 28.3916015625, 30.18408203125, 31.9765625, 33.76904296875, 35.5615234375, 37.35400390625, 39.146484375, 40.93896484375, 42.7314453125, 44.52392578125, 46.31640625, 48.10888671875, 49.9013671875, 51.69384765625, 53.486328125, 55.27880859375, 57.0712890625, 58.86376953125, 60.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 10.0, 9.0, 21.0, 27.0, 31.0, 77.0, 86.0, 131.0, 172.0, 243.0, 413.0, 520.0, 748.0, 1167.0, 1663.0, 2524.0, 3729.0, 5382.0, 8103.0, 12290.0, 19038.0, 29361.0, 46655.0, 74970.0, 124149.0, 192016.0, 191574.0, 124685.0, 75751.0, 46728.0, 29480.0, 18988.0, 12366.0, 8323.0, 5386.0, 3740.0, 2551.0, 1738.0, 1135.0, 827.0, 543.0, 394.0, 262.0, 174.0, 109.0, 87.0, 67.0, 37.0, 33.0, 15.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-99.4375, -96.4248046875, -93.412109375, -90.3994140625, -87.38671875, -84.3740234375, -81.361328125, -78.3486328125, -75.3359375, -72.3232421875, -69.310546875, -66.2978515625, -63.28515625, -60.2724609375, -57.259765625, -54.2470703125, -51.234375, -48.2216796875, -45.208984375, -42.1962890625, -39.18359375, -36.1708984375, -33.158203125, -30.1455078125, -27.1328125, -24.1201171875, -21.107421875, -18.0947265625, -15.08203125, -12.0693359375, -9.056640625, -6.0439453125, -3.03125, -0.0185546875, 2.994140625, 6.0068359375, 9.01953125, 12.0322265625, 15.044921875, 18.0576171875, 21.0703125, 24.0830078125, 27.095703125, 30.1083984375, 33.12109375, 36.1337890625, 39.146484375, 42.1591796875, 45.171875, 48.1845703125, 51.197265625, 54.2099609375, 57.22265625, 60.2353515625, 63.248046875, 66.2607421875, 69.2734375, 72.2861328125, 75.298828125, 78.3115234375, 81.32421875, 84.3369140625, 87.349609375, 90.3623046875, 93.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 5.0, 5.0, 14.0, 16.0, 16.0, 10.0, 20.0, 25.0, 31.0, 25.0, 25.0, 27.0, 32.0, 32.0, 32.0, 38.0, 38.0, 36.0, 38.0, 37.0, 49.0, 36.0, 22.0, 34.0, 34.0, 35.0, 36.0, 31.0, 26.0, 27.0, 14.0, 18.0, 22.0, 13.0, 11.0, 13.0, 8.0, 9.0, 9.0, 5.0, 13.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-38.84375, -37.69384765625, -36.5439453125, -35.39404296875, -34.244140625, -33.09423828125, -31.9443359375, -30.79443359375, -29.64453125, -28.49462890625, -27.3447265625, -26.19482421875, -25.044921875, -23.89501953125, -22.7451171875, -21.59521484375, -20.4453125, -19.29541015625, -18.1455078125, -16.99560546875, -15.845703125, -14.69580078125, -13.5458984375, -12.39599609375, -11.24609375, -10.09619140625, -8.9462890625, -7.79638671875, -6.646484375, -5.49658203125, -4.3466796875, -3.19677734375, -2.046875, -0.89697265625, 0.2529296875, 1.40283203125, 2.552734375, 3.70263671875, 4.8525390625, 6.00244140625, 7.15234375, 8.30224609375, 9.4521484375, 10.60205078125, 11.751953125, 12.90185546875, 14.0517578125, 15.20166015625, 16.3515625, 17.50146484375, 18.6513671875, 19.80126953125, 20.951171875, 22.10107421875, 23.2509765625, 24.40087890625, 25.55078125, 26.70068359375, 27.8505859375, 29.00048828125, 30.150390625, 31.30029296875, 32.4501953125, 33.60009765625, 34.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 18.0, 9.0, 29.0, 40.0, 58.0, 83.0, 121.0, 165.0, 236.0, 385.0, 528.0, 743.0, 1138.0, 1768.0, 2636.0, 4227.0, 6845.0, 11684.0, 19872.0, 35091.0, 64425.0, 125521.0, 236923.0, 245870.0, 132498.0, 68463.0, 36765.0, 20720.0, 12067.0, 7096.0, 4336.0, 2723.0, 1754.0, 1168.0, 790.0, 518.0, 411.0, 244.0, 169.0, 143.0, 89.0, 61.0, 42.0, 29.0, 19.0, 11.0, 8.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.311279296875, -18.62255859375, -17.933837890625, -17.2451171875, -16.556396484375, -15.86767578125, -15.178955078125, -14.490234375, -13.801513671875, -13.11279296875, -12.424072265625, -11.7353515625, -11.046630859375, -10.35791015625, -9.669189453125, -8.98046875, -8.291748046875, -7.60302734375, -6.914306640625, -6.2255859375, -5.536865234375, -4.84814453125, -4.159423828125, -3.470703125, -2.781982421875, -2.09326171875, -1.404541015625, -0.7158203125, -0.027099609375, 0.66162109375, 1.350341796875, 2.0390625, 2.727783203125, 3.41650390625, 4.105224609375, 4.7939453125, 5.482666015625, 6.17138671875, 6.860107421875, 7.548828125, 8.237548828125, 8.92626953125, 9.614990234375, 10.3037109375, 10.992431640625, 11.68115234375, 12.369873046875, 13.05859375, 13.747314453125, 14.43603515625, 15.124755859375, 15.8134765625, 16.502197265625, 17.19091796875, 17.879638671875, 18.568359375, 19.257080078125, 19.94580078125, 20.634521484375, 21.3232421875, 22.011962890625, 22.70068359375, 23.389404296875, 24.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 10.0, 5.0, 18.0, 17.0, 24.0, 33.0, 38.0, 47.0, 46.0, 65.0, 83.0, 88.0, 95.0, 96.0, 81.0, 41.0, 39.0, 38.0, 21.0, 28.0, 10.0, 10.0, 11.0, 5.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.002114593982696533, -0.0020357370376586914, -0.0019568800926208496, -0.0018780231475830078, -0.001799166202545166, -0.0017203092575073242, -0.0016414523124694824, -0.0015625953674316406, -0.0014837384223937988, -0.001404881477355957, -0.0013260245323181152, -0.0012471675872802734, -0.0011683106422424316, -0.0010894536972045898, -0.001010596752166748, -0.0009317398071289062, -0.0008528828620910645, -0.0007740259170532227, -0.0006951689720153809, -0.0006163120269775391, -0.0005374550819396973, -0.00045859813690185547, -0.00037974119186401367, -0.0003008842468261719, -0.00022202730178833008, -0.00014317035675048828, -6.431341171264648e-05, 1.4543533325195312e-05, 9.340047836303711e-05, 0.0001722574234008789, 0.0002511143684387207, 0.0003299713134765625, 0.0004088282585144043, 0.0004876852035522461, 0.0005665421485900879, 0.0006453990936279297, 0.0007242560386657715, 0.0008031129837036133, 0.0008819699287414551, 0.0009608268737792969, 0.0010396838188171387, 0.0011185407638549805, 0.0011973977088928223, 0.001276254653930664, 0.0013551115989685059, 0.0014339685440063477, 0.0015128254890441895, 0.0015916824340820312, 0.001670539379119873, 0.0017493963241577148, 0.0018282532691955566, 0.0019071102142333984, 0.0019859671592712402, 0.002064824104309082, 0.002143681049346924, 0.0022225379943847656, 0.0023013949394226074, 0.0023802518844604492, 0.002459108829498291, 0.002537965774536133, 0.0026168227195739746, 0.0026956796646118164, 0.002774536609649658, 0.0028533935546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 7.0, 13.0, 19.0, 23.0, 45.0, 47.0, 95.0, 128.0, 153.0, 258.0, 345.0, 489.0, 748.0, 1074.0, 1608.0, 2326.0, 3561.0, 5740.0, 8773.0, 13919.0, 23266.0, 40024.0, 70654.0, 125302.0, 206549.0, 217522.0, 137177.0, 77002.0, 43610.0, 25560.0, 15348.0, 9558.0, 5995.0, 3784.0, 2524.0, 1702.0, 1060.0, 820.0, 524.0, 379.0, 263.0, 162.0, 133.0, 85.0, 68.0, 39.0, 19.0, 16.0, 14.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.34716796875, -17.7568359375, -17.16650390625, -16.576171875, -15.98583984375, -15.3955078125, -14.80517578125, -14.21484375, -13.62451171875, -13.0341796875, -12.44384765625, -11.853515625, -11.26318359375, -10.6728515625, -10.08251953125, -9.4921875, -8.90185546875, -8.3115234375, -7.72119140625, -7.130859375, -6.54052734375, -5.9501953125, -5.35986328125, -4.76953125, -4.17919921875, -3.5888671875, -2.99853515625, -2.408203125, -1.81787109375, -1.2275390625, -0.63720703125, -0.046875, 0.54345703125, 1.1337890625, 1.72412109375, 2.314453125, 2.90478515625, 3.4951171875, 4.08544921875, 4.67578125, 5.26611328125, 5.8564453125, 6.44677734375, 7.037109375, 7.62744140625, 8.2177734375, 8.80810546875, 9.3984375, 9.98876953125, 10.5791015625, 11.16943359375, 11.759765625, 12.35009765625, 12.9404296875, 13.53076171875, 14.12109375, 14.71142578125, 15.3017578125, 15.89208984375, 16.482421875, 17.07275390625, 17.6630859375, 18.25341796875, 18.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 9.0, 6.0, 9.0, 10.0, 12.0, 16.0, 24.0, 23.0, 33.0, 28.0, 42.0, 45.0, 56.0, 41.0, 50.0, 68.0, 63.0, 53.0, 54.0, 48.0, 35.0, 50.0, 33.0, 31.0, 17.0, 21.0, 20.0, 21.0, 15.0, 7.0, 14.0, 10.0, 3.0, 6.0, 1.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.57421875, -6.378173828125, -6.18212890625, -5.986083984375, -5.7900390625, -5.593994140625, -5.39794921875, -5.201904296875, -5.005859375, -4.809814453125, -4.61376953125, -4.417724609375, -4.2216796875, -4.025634765625, -3.82958984375, -3.633544921875, -3.4375, -3.241455078125, -3.04541015625, -2.849365234375, -2.6533203125, -2.457275390625, -2.26123046875, -2.065185546875, -1.869140625, -1.673095703125, -1.47705078125, -1.281005859375, -1.0849609375, -0.888916015625, -0.69287109375, -0.496826171875, -0.30078125, -0.104736328125, 0.09130859375, 0.287353515625, 0.4833984375, 0.679443359375, 0.87548828125, 1.071533203125, 1.267578125, 1.463623046875, 1.65966796875, 1.855712890625, 2.0517578125, 2.247802734375, 2.44384765625, 2.639892578125, 2.8359375, 3.031982421875, 3.22802734375, 3.424072265625, 3.6201171875, 3.816162109375, 4.01220703125, 4.208251953125, 4.404296875, 4.600341796875, 4.79638671875, 4.992431640625, 5.1884765625, 5.384521484375, 5.58056640625, 5.776611328125, 5.97265625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 13.0, 12.0, 22.0, 25.0, 37.0, 51.0, 60.0, 85.0, 99.0, 117.0, 96.0, 85.0, 69.0, 73.0, 42.0, 21.0, 25.0, 15.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.57764434814453, -114.96800994873047, -111.35836791992188, -107.74873352050781, -104.13909149169922, -100.52945709228516, -96.91981506347656, -93.3101806640625, -89.7005386352539, -86.09090423583984, -82.48126220703125, -78.87162780761719, -75.2619857788086, -71.65235137939453, -68.04270935058594, -64.43307495117188, -60.82343673706055, -57.21379852294922, -53.60416030883789, -49.99452209472656, -46.384883880615234, -42.775245666503906, -39.165611267089844, -35.55596923828125, -31.946332931518555, -28.336694717407227, -24.7270565032959, -21.117420196533203, -17.507781982421875, -13.898143768310547, -10.288505554199219, -6.678867340087891, -3.0692291259765625, 0.5404088497161865, 4.1500468254089355, 7.7596845626831055, 11.369322776794434, 14.978960037231445, 18.588598251342773, 22.1982364654541, 25.80787467956543, 29.417512893676758, 33.02714920043945, 36.63678741455078, 40.24642562866211, 43.85606384277344, 47.465702056884766, 51.075340270996094, 54.68497848510742, 58.29461669921875, 61.90425491333008, 65.5138931274414, 69.12352752685547, 72.73316955566406, 76.34280395507812, 79.95244598388672, 83.56208038330078, 87.17171478271484, 90.78135681152344, 94.3909912109375, 98.0006332397461, 101.61026763916016, 105.21990966796875, 108.82954406738281, 112.4391860961914]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 0.0, 6.0, 5.0, 3.0, 6.0, 3.0, 7.0, 13.0, 9.0, 16.0, 18.0, 24.0, 15.0, 33.0, 22.0, 26.0, 39.0, 35.0, 32.0, 40.0, 34.0, 34.0, 47.0, 38.0, 48.0, 40.0, 45.0, 41.0, 30.0, 30.0, 35.0, 30.0, 27.0, 19.0, 18.0, 18.0, 19.0, 10.0, 19.0, 10.0, 9.0, 14.0, 6.0, 3.0, 6.0, 1.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-57.111000061035156, -55.35655975341797, -53.60212326049805, -51.84768295288086, -50.09324645996094, -48.33880615234375, -46.58436584472656, -44.82992935180664, -43.07549285888672, -41.32105255126953, -39.56661605834961, -37.81217575073242, -36.0577392578125, -34.30329895019531, -32.548858642578125, -30.794422149658203, -29.039981842041016, -27.28554344177246, -25.531105041503906, -23.77666473388672, -22.022228240966797, -20.26778793334961, -18.513349533081055, -16.7589111328125, -15.004472732543945, -13.25003433227539, -11.495595932006836, -9.741156578063965, -7.98671817779541, -6.2322797775268555, -4.477840423583984, -2.7234020233154297, -0.9689598083496094, 0.7854788303375244, 2.539917469024658, 4.294356346130371, 6.048794746398926, 7.8032331466674805, 9.557672500610352, 11.312110900878906, 13.066549301147461, 14.820987701416016, 16.57542610168457, 18.329864501953125, 20.084304809570312, 21.838741302490234, 23.593181610107422, 25.347620010375977, 27.10205841064453, 28.856496810913086, 30.61093521118164, 32.36537551879883, 34.11981201171875, 35.87425231933594, 37.628692626953125, 39.38312911987305, 41.13756561279297, 42.892005920410156, 44.64644241333008, 46.400882720947266, 48.15531921386719, 49.909759521484375, 51.66419982910156, 53.418636322021484, 55.17307662963867]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 16.0, 32.0, 36.0, 49.0, 73.0, 97.0, 135.0, 211.0, 286.0, 393.0, 638.0, 900.0, 1351.0, 1990.0, 3004.0, 4795.0, 7559.0, 12518.0, 21141.0, 37572.0, 70918.0, 163143.0, 560551.0, 1619468.0, 1130163.0, 318665.0, 112459.0, 53638.0, 28960.0, 16505.0, 9773.0, 6069.0, 3795.0, 2525.0, 1560.0, 1126.0, 726.0, 471.0, 320.0, 225.0, 150.0, 92.0, 59.0, 36.0, 22.0, 14.0, 12.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-77.125, -74.6982421875, -72.271484375, -69.8447265625, -67.41796875, -64.9912109375, -62.564453125, -60.1376953125, -57.7109375, -55.2841796875, -52.857421875, -50.4306640625, -48.00390625, -45.5771484375, -43.150390625, -40.7236328125, -38.296875, -35.8701171875, -33.443359375, -31.0166015625, -28.58984375, -26.1630859375, -23.736328125, -21.3095703125, -18.8828125, -16.4560546875, -14.029296875, -11.6025390625, -9.17578125, -6.7490234375, -4.322265625, -1.8955078125, 0.53125, 2.9580078125, 5.384765625, 7.8115234375, 10.23828125, 12.6650390625, 15.091796875, 17.5185546875, 19.9453125, 22.3720703125, 24.798828125, 27.2255859375, 29.65234375, 32.0791015625, 34.505859375, 36.9326171875, 39.359375, 41.7861328125, 44.212890625, 46.6396484375, 49.06640625, 51.4931640625, 53.919921875, 56.3466796875, 58.7734375, 61.2001953125, 63.626953125, 66.0537109375, 68.48046875, 70.9072265625, 73.333984375, 75.7607421875, 78.1875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 3.0, 6.0, 5.0, 15.0, 11.0, 10.0, 13.0, 21.0, 23.0, 20.0, 39.0, 23.0, 24.0, 30.0, 47.0, 29.0, 39.0, 38.0, 51.0, 41.0, 47.0, 43.0, 32.0, 39.0, 51.0, 35.0, 32.0, 26.0, 22.0, 34.0, 19.0, 21.0, 13.0, 11.0, 14.0, 6.0, 14.0, 9.0, 8.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-41.5625, -40.2880859375, -39.013671875, -37.7392578125, -36.46484375, -35.1904296875, -33.916015625, -32.6416015625, -31.3671875, -30.0927734375, -28.818359375, -27.5439453125, -26.26953125, -24.9951171875, -23.720703125, -22.4462890625, -21.171875, -19.8974609375, -18.623046875, -17.3486328125, -16.07421875, -14.7998046875, -13.525390625, -12.2509765625, -10.9765625, -9.7021484375, -8.427734375, -7.1533203125, -5.87890625, -4.6044921875, -3.330078125, -2.0556640625, -0.78125, 0.4931640625, 1.767578125, 3.0419921875, 4.31640625, 5.5908203125, 6.865234375, 8.1396484375, 9.4140625, 10.6884765625, 11.962890625, 13.2373046875, 14.51171875, 15.7861328125, 17.060546875, 18.3349609375, 19.609375, 20.8837890625, 22.158203125, 23.4326171875, 24.70703125, 25.9814453125, 27.255859375, 28.5302734375, 29.8046875, 31.0791015625, 32.353515625, 33.6279296875, 34.90234375, 36.1767578125, 37.451171875, 38.7255859375, 40.0]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 22.0, 44.0, 50.0, 45.0, 112.0, 149.0, 241.0, 421.0, 634.0, 1011.0, 1682.0, 2706.0, 4563.0, 7833.0, 13554.0, 23477.0, 42373.0, 79959.0, 155866.0, 333833.0, 861504.0, 1540961.0, 601759.0, 252917.0, 122352.0, 64258.0, 35007.0, 19596.0, 11293.0, 6419.0, 3826.0, 2278.0, 1387.0, 856.0, 499.0, 306.0, 181.0, 110.0, 71.0, 35.0, 22.0, 16.0, 19.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.875, -61.6201171875, -59.365234375, -57.1103515625, -54.85546875, -52.6005859375, -50.345703125, -48.0908203125, -45.8359375, -43.5810546875, -41.326171875, -39.0712890625, -36.81640625, -34.5615234375, -32.306640625, -30.0517578125, -27.796875, -25.5419921875, -23.287109375, -21.0322265625, -18.77734375, -16.5224609375, -14.267578125, -12.0126953125, -9.7578125, -7.5029296875, -5.248046875, -2.9931640625, -0.73828125, 1.5166015625, 3.771484375, 6.0263671875, 8.28125, 10.5361328125, 12.791015625, 15.0458984375, 17.30078125, 19.5556640625, 21.810546875, 24.0654296875, 26.3203125, 28.5751953125, 30.830078125, 33.0849609375, 35.33984375, 37.5947265625, 39.849609375, 42.1044921875, 44.359375, 46.6142578125, 48.869140625, 51.1240234375, 53.37890625, 55.6337890625, 57.888671875, 60.1435546875, 62.3984375, 64.6533203125, 66.908203125, 69.1630859375, 71.41796875, 73.6728515625, 75.927734375, 78.1826171875, 80.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 13.0, 7.0, 11.0, 22.0, 16.0, 24.0, 36.0, 33.0, 50.0, 59.0, 72.0, 109.0, 104.0, 141.0, 163.0, 200.0, 235.0, 275.0, 336.0, 389.0, 278.0, 230.0, 202.0, 163.0, 149.0, 121.0, 89.0, 78.0, 78.0, 65.0, 55.0, 44.0, 27.0, 39.0, 35.0, 16.0, 17.0, 21.0, 10.0, 10.0, 10.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.4375, -18.8076171875, -18.177734375, -17.5478515625, -16.91796875, -16.2880859375, -15.658203125, -15.0283203125, -14.3984375, -13.7685546875, -13.138671875, -12.5087890625, -11.87890625, -11.2490234375, -10.619140625, -9.9892578125, -9.359375, -8.7294921875, -8.099609375, -7.4697265625, -6.83984375, -6.2099609375, -5.580078125, -4.9501953125, -4.3203125, -3.6904296875, -3.060546875, -2.4306640625, -1.80078125, -1.1708984375, -0.541015625, 0.0888671875, 0.71875, 1.3486328125, 1.978515625, 2.6083984375, 3.23828125, 3.8681640625, 4.498046875, 5.1279296875, 5.7578125, 6.3876953125, 7.017578125, 7.6474609375, 8.27734375, 8.9072265625, 9.537109375, 10.1669921875, 10.796875, 11.4267578125, 12.056640625, 12.6865234375, 13.31640625, 13.9462890625, 14.576171875, 15.2060546875, 15.8359375, 16.4658203125, 17.095703125, 17.7255859375, 18.35546875, 18.9853515625, 19.615234375, 20.2451171875, 20.875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 3.0, 12.0, 9.0, 16.0, 19.0, 30.0, 33.0, 38.0, 38.0, 43.0, 50.0, 67.0, 71.0, 62.0, 75.0, 63.0, 71.0, 43.0, 52.0, 33.0, 36.0, 15.0, 20.0, 20.0, 12.0, 7.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.30702209472656, -55.384098052978516, -53.46117401123047, -51.538246154785156, -49.61532211303711, -47.69239807128906, -45.769474029541016, -43.84654998779297, -41.92362594604492, -40.000701904296875, -38.07777786254883, -36.15485382080078, -34.23192596435547, -32.30900192260742, -30.386077880859375, -28.463153839111328, -26.54022789001465, -24.6173038482666, -22.694377899169922, -20.771453857421875, -18.848529815673828, -16.92560577392578, -15.002679824829102, -13.079755783081055, -11.156830787658691, -9.233905792236328, -7.310981750488281, -5.388056755065918, -3.465132236480713, -1.5422077178955078, 0.38071727752685547, 2.3036413192749023, 4.226566314697266, 6.149490833282471, 8.072415351867676, 9.995340347290039, 11.918264389038086, 13.84118938446045, 15.764114379882812, 17.68703842163086, 19.609962463378906, 21.532886505126953, 23.455812454223633, 25.37873649597168, 27.301660537719727, 29.224586486816406, 31.147510528564453, 33.0704345703125, 34.99336242675781, 36.91628646850586, 38.839210510253906, 40.76213836669922, 42.685062408447266, 44.60798645019531, 46.53091049194336, 48.453834533691406, 50.37675857543945, 52.2996826171875, 54.22260665893555, 56.145530700683594, 58.068458557128906, 59.99138259887695, 61.914306640625, 63.83723068237305, 65.7601547241211]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 11.0, 18.0, 18.0, 13.0, 24.0, 20.0, 24.0, 27.0, 38.0, 37.0, 36.0, 45.0, 51.0, 42.0, 38.0, 54.0, 40.0, 36.0, 42.0, 54.0, 31.0, 32.0, 38.0, 24.0, 21.0, 26.0, 25.0, 12.0, 19.0, 18.0, 10.0, 11.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.858299255371094, -49.344215393066406, -47.830135345458984, -46.3160514831543, -44.801971435546875, -43.28788757324219, -41.7738037109375, -40.25972366333008, -38.745643615722656, -37.23155975341797, -35.71747970581055, -34.20339584350586, -32.68931579589844, -31.17523193359375, -29.661149978637695, -28.14706802368164, -26.632984161376953, -25.1189022064209, -23.604820251464844, -22.090736389160156, -20.576656341552734, -19.062572479248047, -17.548490524291992, -16.034408569335938, -14.520326614379883, -13.006244659423828, -11.492162704467773, -9.978079795837402, -8.463997840881348, -6.949915885925293, -5.435832977294922, -3.921751022338867, -2.407672882080078, -0.8935906887054443, 0.6204915046691895, 2.1345739364624023, 3.648655891418457, 5.162737846374512, 6.676820755004883, 8.190902709960938, 9.704984664916992, 11.219066619873047, 12.733148574829102, 14.247231483459473, 15.761313438415527, 17.275394439697266, 18.789478302001953, 20.303560256958008, 21.817642211914062, 23.331724166870117, 24.845806121826172, 26.35988998413086, 27.87397003173828, 29.38805389404297, 30.902135848999023, 32.41621780395508, 33.9302978515625, 35.44438171386719, 36.95846176147461, 38.4725456237793, 39.98662567138672, 41.500709533691406, 43.014793395996094, 44.528873443603516, 46.0429573059082]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 8.0, 21.0, 21.0, 23.0, 48.0, 78.0, 113.0, 189.0, 224.0, 338.0, 519.0, 790.0, 1350.0, 1957.0, 3063.0, 4528.0, 7627.0, 12342.0, 20637.0, 35370.0, 61580.0, 108851.0, 192780.0, 241600.0, 150328.0, 84377.0, 48605.0, 28015.0, 16262.0, 9853.0, 6164.0, 3791.0, 2436.0, 1561.0, 1052.0, 683.0, 475.0, 337.0, 178.0, 116.0, 94.0, 63.0, 31.0, 25.0, 18.0, 14.0, 11.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-91.875, -89.1142578125, -86.353515625, -83.5927734375, -80.83203125, -78.0712890625, -75.310546875, -72.5498046875, -69.7890625, -67.0283203125, -64.267578125, -61.5068359375, -58.74609375, -55.9853515625, -53.224609375, -50.4638671875, -47.703125, -44.9423828125, -42.181640625, -39.4208984375, -36.66015625, -33.8994140625, -31.138671875, -28.3779296875, -25.6171875, -22.8564453125, -20.095703125, -17.3349609375, -14.57421875, -11.8134765625, -9.052734375, -6.2919921875, -3.53125, -0.7705078125, 1.990234375, 4.7509765625, 7.51171875, 10.2724609375, 13.033203125, 15.7939453125, 18.5546875, 21.3154296875, 24.076171875, 26.8369140625, 29.59765625, 32.3583984375, 35.119140625, 37.8798828125, 40.640625, 43.4013671875, 46.162109375, 48.9228515625, 51.68359375, 54.4443359375, 57.205078125, 59.9658203125, 62.7265625, 65.4873046875, 68.248046875, 71.0087890625, 73.76953125, 76.5302734375, 79.291015625, 82.0517578125, 84.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 8.0, 8.0, 13.0, 15.0, 20.0, 11.0, 27.0, 28.0, 26.0, 39.0, 38.0, 43.0, 43.0, 48.0, 42.0, 45.0, 40.0, 51.0, 42.0, 44.0, 52.0, 42.0, 25.0, 36.0, 37.0, 24.0, 17.0, 24.0, 16.0, 20.0, 20.0, 9.0, 4.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.40625, -46.970703125, -45.53515625, -44.099609375, -42.6640625, -41.228515625, -39.79296875, -38.357421875, -36.921875, -35.486328125, -34.05078125, -32.615234375, -31.1796875, -29.744140625, -28.30859375, -26.873046875, -25.4375, -24.001953125, -22.56640625, -21.130859375, -19.6953125, -18.259765625, -16.82421875, -15.388671875, -13.953125, -12.517578125, -11.08203125, -9.646484375, -8.2109375, -6.775390625, -5.33984375, -3.904296875, -2.46875, -1.033203125, 0.40234375, 1.837890625, 3.2734375, 4.708984375, 6.14453125, 7.580078125, 9.015625, 10.451171875, 11.88671875, 13.322265625, 14.7578125, 16.193359375, 17.62890625, 19.064453125, 20.5, 21.935546875, 23.37109375, 24.806640625, 26.2421875, 27.677734375, 29.11328125, 30.548828125, 31.984375, 33.419921875, 34.85546875, 36.291015625, 37.7265625, 39.162109375, 40.59765625, 42.033203125, 43.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 29.0, 25.0, 36.0, 47.0, 59.0, 82.0, 96.0, 149.0, 241.0, 370.0, 542.0, 787.0, 1130.0, 1924.0, 2850.0, 4670.0, 7648.0, 13094.0, 23282.0, 43363.0, 88525.0, 204858.0, 335954.0, 161347.0, 72189.0, 36215.0, 19474.0, 11242.0, 6723.0, 4017.0, 2615.0, 1654.0, 1033.0, 727.0, 489.0, 344.0, 239.0, 146.0, 111.0, 73.0, 46.0, 29.0, 23.0, 17.0, 11.0, 5.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.375, -108.7919921875, -105.208984375, -101.6259765625, -98.04296875, -94.4599609375, -90.876953125, -87.2939453125, -83.7109375, -80.1279296875, -76.544921875, -72.9619140625, -69.37890625, -65.7958984375, -62.212890625, -58.6298828125, -55.046875, -51.4638671875, -47.880859375, -44.2978515625, -40.71484375, -37.1318359375, -33.548828125, -29.9658203125, -26.3828125, -22.7998046875, -19.216796875, -15.6337890625, -12.05078125, -8.4677734375, -4.884765625, -1.3017578125, 2.28125, 5.8642578125, 9.447265625, 13.0302734375, 16.61328125, 20.1962890625, 23.779296875, 27.3623046875, 30.9453125, 34.5283203125, 38.111328125, 41.6943359375, 45.27734375, 48.8603515625, 52.443359375, 56.0263671875, 59.609375, 63.1923828125, 66.775390625, 70.3583984375, 73.94140625, 77.5244140625, 81.107421875, 84.6904296875, 88.2734375, 91.8564453125, 95.439453125, 99.0224609375, 102.60546875, 106.1884765625, 109.771484375, 113.3544921875, 116.9375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 9.0, 13.0, 8.0, 12.0, 19.0, 18.0, 16.0, 24.0, 32.0, 26.0, 31.0, 34.0, 32.0, 41.0, 43.0, 61.0, 38.0, 41.0, 47.0, 46.0, 37.0, 37.0, 47.0, 28.0, 28.0, 22.0, 34.0, 28.0, 18.0, 19.0, 23.0, 15.0, 9.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.186767578125, -29.13916015625, -28.091552734375, -27.0439453125, -25.996337890625, -24.94873046875, -23.901123046875, -22.853515625, -21.805908203125, -20.75830078125, -19.710693359375, -18.6630859375, -17.615478515625, -16.56787109375, -15.520263671875, -14.47265625, -13.425048828125, -12.37744140625, -11.329833984375, -10.2822265625, -9.234619140625, -8.18701171875, -7.139404296875, -6.091796875, -5.044189453125, -3.99658203125, -2.948974609375, -1.9013671875, -0.853759765625, 0.19384765625, 1.241455078125, 2.2890625, 3.336669921875, 4.38427734375, 5.431884765625, 6.4794921875, 7.527099609375, 8.57470703125, 9.622314453125, 10.669921875, 11.717529296875, 12.76513671875, 13.812744140625, 14.8603515625, 15.907958984375, 16.95556640625, 18.003173828125, 19.05078125, 20.098388671875, 21.14599609375, 22.193603515625, 23.2412109375, 24.288818359375, 25.33642578125, 26.384033203125, 27.431640625, 28.479248046875, 29.52685546875, 30.574462890625, 31.6220703125, 32.669677734375, 33.71728515625, 34.764892578125, 35.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 18.0, 14.0, 20.0, 24.0, 38.0, 41.0, 60.0, 62.0, 81.0, 118.0, 143.0, 222.0, 304.0, 477.0, 764.0, 1324.0, 2672.0, 6039.0, 16609.0, 79438.0, 717217.0, 179517.0, 26755.0, 8286.0, 3492.0, 1826.0, 1043.0, 587.0, 399.0, 267.0, 177.0, 140.0, 83.0, 75.0, 57.0, 34.0, 27.0, 21.0, 16.0, 13.0, 5.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.3125, -75.759765625, -73.20703125, -70.654296875, -68.1015625, -65.548828125, -62.99609375, -60.443359375, -57.890625, -55.337890625, -52.78515625, -50.232421875, -47.6796875, -45.126953125, -42.57421875, -40.021484375, -37.46875, -34.916015625, -32.36328125, -29.810546875, -27.2578125, -24.705078125, -22.15234375, -19.599609375, -17.046875, -14.494140625, -11.94140625, -9.388671875, -6.8359375, -4.283203125, -1.73046875, 0.822265625, 3.375, 5.927734375, 8.48046875, 11.033203125, 13.5859375, 16.138671875, 18.69140625, 21.244140625, 23.796875, 26.349609375, 28.90234375, 31.455078125, 34.0078125, 36.560546875, 39.11328125, 41.666015625, 44.21875, 46.771484375, 49.32421875, 51.876953125, 54.4296875, 56.982421875, 59.53515625, 62.087890625, 64.640625, 67.193359375, 69.74609375, 72.298828125, 74.8515625, 77.404296875, 79.95703125, 82.509765625, 85.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 8.0, 14.0, 20.0, 37.0, 92.0, 232.0, 316.0, 142.0, 63.0, 28.0, 9.0, 7.0, 10.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01021575927734375, -0.009941577911376953, -0.009667396545410156, -0.00939321517944336, -0.009119033813476562, -0.008844852447509766, -0.008570671081542969, -0.008296489715576172, -0.008022308349609375, -0.007748126983642578, -0.007473945617675781, -0.007199764251708984, -0.0069255828857421875, -0.006651401519775391, -0.006377220153808594, -0.006103038787841797, -0.005828857421875, -0.005554676055908203, -0.005280494689941406, -0.005006313323974609, -0.0047321319580078125, -0.004457950592041016, -0.004183769226074219, -0.003909587860107422, -0.003635406494140625, -0.003361225128173828, -0.0030870437622070312, -0.0028128623962402344, -0.0025386810302734375, -0.0022644996643066406, -0.0019903182983398438, -0.0017161369323730469, -0.00144195556640625, -0.0011677742004394531, -0.0008935928344726562, -0.0006194114685058594, -0.0003452301025390625, -7.104873657226562e-05, 0.00020313262939453125, 0.0004773139953613281, 0.000751495361328125, 0.0010256767272949219, 0.0012998580932617188, 0.0015740394592285156, 0.0018482208251953125, 0.0021224021911621094, 0.0023965835571289062, 0.002670764923095703, 0.0029449462890625, 0.003219127655029297, 0.0034933090209960938, 0.0037674903869628906, 0.0040416717529296875, 0.004315853118896484, 0.004590034484863281, 0.004864215850830078, 0.005138397216796875, 0.005412578582763672, 0.005686759948730469, 0.005960941314697266, 0.0062351226806640625, 0.006509304046630859, 0.006783485412597656, 0.007057666778564453, 0.00733184814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 7.0, 6.0, 8.0, 12.0, 17.0, 15.0, 23.0, 47.0, 50.0, 89.0, 107.0, 183.0, 270.0, 395.0, 632.0, 1040.0, 1712.0, 2920.0, 5096.0, 10367.0, 26470.0, 111332.0, 599301.0, 219077.0, 40359.0, 13771.0, 6276.0, 3486.0, 2012.0, 1241.0, 727.0, 454.0, 344.0, 253.0, 154.0, 102.0, 54.0, 47.0, 31.0, 21.0, 13.0, 15.0, 6.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-84.25, -81.95263671875, -79.6552734375, -77.35791015625, -75.060546875, -72.76318359375, -70.4658203125, -68.16845703125, -65.87109375, -63.57373046875, -61.2763671875, -58.97900390625, -56.681640625, -54.38427734375, -52.0869140625, -49.78955078125, -47.4921875, -45.19482421875, -42.8974609375, -40.60009765625, -38.302734375, -36.00537109375, -33.7080078125, -31.41064453125, -29.11328125, -26.81591796875, -24.5185546875, -22.22119140625, -19.923828125, -17.62646484375, -15.3291015625, -13.03173828125, -10.734375, -8.43701171875, -6.1396484375, -3.84228515625, -1.544921875, 0.75244140625, 3.0498046875, 5.34716796875, 7.64453125, 9.94189453125, 12.2392578125, 14.53662109375, 16.833984375, 19.13134765625, 21.4287109375, 23.72607421875, 26.0234375, 28.32080078125, 30.6181640625, 32.91552734375, 35.212890625, 37.51025390625, 39.8076171875, 42.10498046875, 44.40234375, 46.69970703125, 48.9970703125, 51.29443359375, 53.591796875, 55.88916015625, 58.1865234375, 60.48388671875, 62.78125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 10.0, 11.0, 18.0, 29.0, 48.0, 76.0, 131.0, 151.0, 144.0, 101.0, 90.0, 43.0, 31.0, 22.0, 13.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3778076171875, -12.794677734375, -12.2115478515625, -11.62841796875, -11.0452880859375, -10.462158203125, -9.8790283203125, -9.2958984375, -8.7127685546875, -8.129638671875, -7.5465087890625, -6.96337890625, -6.3802490234375, -5.797119140625, -5.2139892578125, -4.630859375, -4.0477294921875, -3.464599609375, -2.8814697265625, -2.29833984375, -1.7152099609375, -1.132080078125, -0.5489501953125, 0.0341796875, 0.6173095703125, 1.200439453125, 1.7835693359375, 2.36669921875, 2.9498291015625, 3.532958984375, 4.1160888671875, 4.69921875, 5.2823486328125, 5.865478515625, 6.4486083984375, 7.03173828125, 7.6148681640625, 8.197998046875, 8.7811279296875, 9.3642578125, 9.9473876953125, 10.530517578125, 11.1136474609375, 11.69677734375, 12.2799072265625, 12.863037109375, 13.4461669921875, 14.029296875, 14.6124267578125, 15.195556640625, 15.7786865234375, 16.36181640625, 16.9449462890625, 17.528076171875, 18.1112060546875, 18.6943359375, 19.2774658203125, 19.860595703125, 20.4437255859375, 21.02685546875, 21.6099853515625, 22.193115234375, 22.7762451171875, 23.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 8.0, 4.0, 8.0, 14.0, 15.0, 19.0, 33.0, 35.0, 46.0, 36.0, 48.0, 55.0, 61.0, 62.0, 59.0, 66.0, 53.0, 55.0, 45.0, 42.0, 28.0, 30.0, 32.0, 22.0, 21.0, 12.0, 16.0, 11.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.002079010009766, -41.50918960571289, -40.016300201416016, -38.523406982421875, -37.030517578125, -35.537628173828125, -34.04473876953125, -32.551849365234375, -31.058958053588867, -29.566068649291992, -28.073177337646484, -26.58028793334961, -25.087398529052734, -23.594507217407227, -22.10161781311035, -20.608726501464844, -19.11583709716797, -17.622947692871094, -16.130056381225586, -14.637166976928711, -13.14427661895752, -11.651386260986328, -10.158496856689453, -8.665606498718262, -7.17271614074707, -5.679825782775879, -4.186935901641846, -2.6940460205078125, -1.201155662536621, 0.2917346954345703, 1.7846240997314453, 3.2775144577026367, 4.770404815673828, 6.2632951736450195, 7.756185054779053, 9.249074935913086, 10.741965293884277, 12.234855651855469, 13.727745056152344, 15.220635414123535, 16.713525772094727, 18.2064151763916, 19.69930648803711, 21.192195892333984, 22.68508529663086, 24.177976608276367, 25.670866012573242, 27.16375732421875, 28.656646728515625, 30.1495361328125, 31.642427444458008, 33.13531494140625, 34.62820816040039, 36.121097564697266, 37.61398696899414, 39.106876373291016, 40.599769592285156, 42.09265899658203, 43.585548400878906, 45.07843780517578, 46.57133102416992, 48.0642204284668, 49.55710983276367, 51.04999923706055, 52.54288864135742]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 4.0, 7.0, 10.0, 13.0, 17.0, 15.0, 14.0, 13.0, 25.0, 22.0, 30.0, 25.0, 43.0, 47.0, 50.0, 32.0, 30.0, 40.0, 38.0, 48.0, 57.0, 38.0, 40.0, 36.0, 35.0, 26.0, 27.0, 26.0, 28.0, 21.0, 17.0, 18.0, 20.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-44.74073791503906, -43.462337493896484, -42.18394088745117, -40.905540466308594, -39.627140045166016, -38.34873962402344, -37.070343017578125, -35.79194259643555, -34.51354217529297, -33.23514175415039, -31.956743240356445, -30.6783447265625, -29.399944305419922, -28.121545791625977, -26.84314727783203, -25.564746856689453, -24.28635025024414, -23.007951736450195, -21.729551315307617, -20.451152801513672, -19.172752380371094, -17.89435386657715, -16.615955352783203, -15.337555885314941, -14.05915641784668, -12.780756950378418, -11.502357482910156, -10.223958969116211, -8.94555950164795, -7.6671600341796875, -6.388761043548584, -5.1103620529174805, -3.8319664001464844, -2.5535671710968018, -1.2751679420471191, 0.0032312870025634766, 1.281630516052246, 2.560029983520508, 3.8384289741516113, 5.116827964782715, 6.395227432250977, 7.673626899719238, 8.9520263671875, 10.230424880981445, 11.508824348449707, 12.787223815917969, 14.065622329711914, 15.344021797180176, 16.622421264648438, 17.900819778442383, 19.17922019958496, 20.457618713378906, 21.736019134521484, 23.01441764831543, 24.292816162109375, 25.571216583251953, 26.8496150970459, 28.128013610839844, 29.406414031982422, 30.684812545776367, 31.963211059570312, 33.24161148071289, 34.52001190185547, 35.79840850830078, 37.07680892944336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 10.0, 16.0, 28.0, 43.0, 48.0, 67.0, 146.0, 216.0, 326.0, 473.0, 708.0, 1058.0, 1579.0, 2557.0, 3953.0, 6163.0, 9856.0, 15872.0, 25872.0, 41218.0, 66957.0, 108330.0, 166545.0, 198222.0, 148217.0, 95088.0, 58839.0, 35885.0, 22316.0, 13767.0, 8713.0, 5455.0, 3497.0, 2256.0, 1481.0, 999.0, 567.0, 398.0, 277.0, 159.0, 125.0, 78.0, 51.0, 35.0, 26.0, 23.0, 10.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-50.6875, -49.16796875, -47.6484375, -46.12890625, -44.609375, -43.08984375, -41.5703125, -40.05078125, -38.53125, -37.01171875, -35.4921875, -33.97265625, -32.453125, -30.93359375, -29.4140625, -27.89453125, -26.375, -24.85546875, -23.3359375, -21.81640625, -20.296875, -18.77734375, -17.2578125, -15.73828125, -14.21875, -12.69921875, -11.1796875, -9.66015625, -8.140625, -6.62109375, -5.1015625, -3.58203125, -2.0625, -0.54296875, 0.9765625, 2.49609375, 4.015625, 5.53515625, 7.0546875, 8.57421875, 10.09375, 11.61328125, 13.1328125, 14.65234375, 16.171875, 17.69140625, 19.2109375, 20.73046875, 22.25, 23.76953125, 25.2890625, 26.80859375, 28.328125, 29.84765625, 31.3671875, 32.88671875, 34.40625, 35.92578125, 37.4453125, 38.96484375, 40.484375, 42.00390625, 43.5234375, 45.04296875, 46.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 2.0, 6.0, 3.0, 6.0, 3.0, 4.0, 8.0, 11.0, 15.0, 17.0, 14.0, 17.0, 22.0, 22.0, 29.0, 30.0, 44.0, 50.0, 45.0, 32.0, 47.0, 35.0, 45.0, 39.0, 48.0, 40.0, 46.0, 43.0, 36.0, 27.0, 32.0, 29.0, 23.0, 26.0, 17.0, 17.0, 16.0, 10.0, 11.0, 7.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-45.3125, -44.0087890625, -42.705078125, -41.4013671875, -40.09765625, -38.7939453125, -37.490234375, -36.1865234375, -34.8828125, -33.5791015625, -32.275390625, -30.9716796875, -29.66796875, -28.3642578125, -27.060546875, -25.7568359375, -24.453125, -23.1494140625, -21.845703125, -20.5419921875, -19.23828125, -17.9345703125, -16.630859375, -15.3271484375, -14.0234375, -12.7197265625, -11.416015625, -10.1123046875, -8.80859375, -7.5048828125, -6.201171875, -4.8974609375, -3.59375, -2.2900390625, -0.986328125, 0.3173828125, 1.62109375, 2.9248046875, 4.228515625, 5.5322265625, 6.8359375, 8.1396484375, 9.443359375, 10.7470703125, 12.05078125, 13.3544921875, 14.658203125, 15.9619140625, 17.265625, 18.5693359375, 19.873046875, 21.1767578125, 22.48046875, 23.7841796875, 25.087890625, 26.3916015625, 27.6953125, 28.9990234375, 30.302734375, 31.6064453125, 32.91015625, 34.2138671875, 35.517578125, 36.8212890625, 38.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 12.0, 15.0, 14.0, 19.0, 39.0, 52.0, 77.0, 128.0, 202.0, 278.0, 477.0, 827.0, 1381.0, 2356.0, 4108.0, 7529.0, 13944.0, 26707.0, 51895.0, 102817.0, 199559.0, 272697.0, 176477.0, 89715.0, 45059.0, 23886.0, 12478.0, 6841.0, 3775.0, 2056.0, 1217.0, 689.0, 421.0, 286.0, 170.0, 130.0, 66.0, 46.0, 35.0, 22.0, 17.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.3125, -68.8017578125, -66.291015625, -63.7802734375, -61.26953125, -58.7587890625, -56.248046875, -53.7373046875, -51.2265625, -48.7158203125, -46.205078125, -43.6943359375, -41.18359375, -38.6728515625, -36.162109375, -33.6513671875, -31.140625, -28.6298828125, -26.119140625, -23.6083984375, -21.09765625, -18.5869140625, -16.076171875, -13.5654296875, -11.0546875, -8.5439453125, -6.033203125, -3.5224609375, -1.01171875, 1.4990234375, 4.009765625, 6.5205078125, 9.03125, 11.5419921875, 14.052734375, 16.5634765625, 19.07421875, 21.5849609375, 24.095703125, 26.6064453125, 29.1171875, 31.6279296875, 34.138671875, 36.6494140625, 39.16015625, 41.6708984375, 44.181640625, 46.6923828125, 49.203125, 51.7138671875, 54.224609375, 56.7353515625, 59.24609375, 61.7568359375, 64.267578125, 66.7783203125, 69.2890625, 71.7998046875, 74.310546875, 76.8212890625, 79.33203125, 81.8427734375, 84.353515625, 86.8642578125, 89.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 14.0, 8.0, 13.0, 11.0, 20.0, 22.0, 32.0, 16.0, 32.0, 30.0, 29.0, 49.0, 37.0, 44.0, 28.0, 49.0, 34.0, 42.0, 49.0, 42.0, 45.0, 40.0, 30.0, 37.0, 29.0, 32.0, 28.0, 28.0, 17.0, 12.0, 17.0, 19.0, 9.0, 14.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -29.06884765625, -28.2001953125, -27.33154296875, -26.462890625, -25.59423828125, -24.7255859375, -23.85693359375, -22.98828125, -22.11962890625, -21.2509765625, -20.38232421875, -19.513671875, -18.64501953125, -17.7763671875, -16.90771484375, -16.0390625, -15.17041015625, -14.3017578125, -13.43310546875, -12.564453125, -11.69580078125, -10.8271484375, -9.95849609375, -9.08984375, -8.22119140625, -7.3525390625, -6.48388671875, -5.615234375, -4.74658203125, -3.8779296875, -3.00927734375, -2.140625, -1.27197265625, -0.4033203125, 0.46533203125, 1.333984375, 2.20263671875, 3.0712890625, 3.93994140625, 4.80859375, 5.67724609375, 6.5458984375, 7.41455078125, 8.283203125, 9.15185546875, 10.0205078125, 10.88916015625, 11.7578125, 12.62646484375, 13.4951171875, 14.36376953125, 15.232421875, 16.10107421875, 16.9697265625, 17.83837890625, 18.70703125, 19.57568359375, 20.4443359375, 21.31298828125, 22.181640625, 23.05029296875, 23.9189453125, 24.78759765625, 25.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 23.0, 32.0, 34.0, 54.0, 90.0, 100.0, 143.0, 216.0, 354.0, 463.0, 743.0, 1142.0, 1844.0, 3024.0, 5075.0, 9225.0, 17601.0, 36579.0, 88436.0, 249293.0, 373052.0, 149232.0, 56263.0, 25236.0, 12728.0, 6892.0, 4029.0, 2300.0, 1462.0, 915.0, 591.0, 428.0, 277.0, 178.0, 130.0, 96.0, 85.0, 45.0, 32.0, 24.0, 15.0, 20.0, 10.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.21875, -32.18896484375, -31.1591796875, -30.12939453125, -29.099609375, -28.06982421875, -27.0400390625, -26.01025390625, -24.98046875, -23.95068359375, -22.9208984375, -21.89111328125, -20.861328125, -19.83154296875, -18.8017578125, -17.77197265625, -16.7421875, -15.71240234375, -14.6826171875, -13.65283203125, -12.623046875, -11.59326171875, -10.5634765625, -9.53369140625, -8.50390625, -7.47412109375, -6.4443359375, -5.41455078125, -4.384765625, -3.35498046875, -2.3251953125, -1.29541015625, -0.265625, 0.76416015625, 1.7939453125, 2.82373046875, 3.853515625, 4.88330078125, 5.9130859375, 6.94287109375, 7.97265625, 9.00244140625, 10.0322265625, 11.06201171875, 12.091796875, 13.12158203125, 14.1513671875, 15.18115234375, 16.2109375, 17.24072265625, 18.2705078125, 19.30029296875, 20.330078125, 21.35986328125, 22.3896484375, 23.41943359375, 24.44921875, 25.47900390625, 26.5087890625, 27.53857421875, 28.568359375, 29.59814453125, 30.6279296875, 31.65771484375, 32.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 5.0, 11.0, 8.0, 19.0, 19.0, 32.0, 54.0, 90.0, 155.0, 188.0, 154.0, 84.0, 68.0, 45.0, 20.0, 15.0, 16.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004175961017608643, -0.00402987003326416, -0.0038837790489196777, -0.0037376880645751953, -0.003591597080230713, -0.0034455060958862305, -0.003299415111541748, -0.0031533241271972656, -0.003007233142852783, -0.0028611421585083008, -0.0027150511741638184, -0.002568960189819336, -0.0024228692054748535, -0.002276778221130371, -0.0021306872367858887, -0.0019845962524414062, -0.0018385052680969238, -0.0016924142837524414, -0.001546323299407959, -0.0014002323150634766, -0.0012541413307189941, -0.0011080503463745117, -0.0009619593620300293, -0.0008158683776855469, -0.0006697773933410645, -0.000523686408996582, -0.0003775954246520996, -0.0002315044403076172, -8.541345596313477e-05, 6.0677528381347656e-05, 0.00020676851272583008, 0.0003528594970703125, 0.0004989504814147949, 0.0006450414657592773, 0.0007911324501037598, 0.0009372234344482422, 0.0010833144187927246, 0.001229405403137207, 0.0013754963874816895, 0.0015215873718261719, 0.0016676783561706543, 0.0018137693405151367, 0.001959860324859619, 0.0021059513092041016, 0.002252042293548584, 0.0023981332778930664, 0.002544224262237549, 0.0026903152465820312, 0.0028364062309265137, 0.002982497215270996, 0.0031285881996154785, 0.003274679183959961, 0.0034207701683044434, 0.0035668611526489258, 0.003712952136993408, 0.0038590431213378906, 0.004005134105682373, 0.0041512250900268555, 0.004297316074371338, 0.00444340705871582, 0.004589498043060303, 0.004735589027404785, 0.004881680011749268, 0.00502777099609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 8.0, 14.0, 11.0, 13.0, 26.0, 30.0, 63.0, 63.0, 114.0, 164.0, 252.0, 389.0, 645.0, 1053.0, 1819.0, 3290.0, 6125.0, 12201.0, 26035.0, 63161.0, 177763.0, 408843.0, 213376.0, 74138.0, 29930.0, 13580.0, 6827.0, 3600.0, 1919.0, 1156.0, 680.0, 445.0, 282.0, 156.0, 117.0, 70.0, 58.0, 41.0, 31.0, 18.0, 12.0, 10.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-37.5, -36.38330078125, -35.2666015625, -34.14990234375, -33.033203125, -31.91650390625, -30.7998046875, -29.68310546875, -28.56640625, -27.44970703125, -26.3330078125, -25.21630859375, -24.099609375, -22.98291015625, -21.8662109375, -20.74951171875, -19.6328125, -18.51611328125, -17.3994140625, -16.28271484375, -15.166015625, -14.04931640625, -12.9326171875, -11.81591796875, -10.69921875, -9.58251953125, -8.4658203125, -7.34912109375, -6.232421875, -5.11572265625, -3.9990234375, -2.88232421875, -1.765625, -0.64892578125, 0.4677734375, 1.58447265625, 2.701171875, 3.81787109375, 4.9345703125, 6.05126953125, 7.16796875, 8.28466796875, 9.4013671875, 10.51806640625, 11.634765625, 12.75146484375, 13.8681640625, 14.98486328125, 16.1015625, 17.21826171875, 18.3349609375, 19.45166015625, 20.568359375, 21.68505859375, 22.8017578125, 23.91845703125, 25.03515625, 26.15185546875, 27.2685546875, 28.38525390625, 29.501953125, 30.61865234375, 31.7353515625, 32.85205078125, 33.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 12.0, 14.0, 24.0, 23.0, 26.0, 42.0, 29.0, 40.0, 65.0, 76.0, 63.0, 70.0, 70.0, 73.0, 68.0, 61.0, 41.0, 25.0, 33.0, 23.0, 18.0, 21.0, 11.0, 15.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.55615234375, -7.2998046875, -7.04345703125, -6.787109375, -6.53076171875, -6.2744140625, -6.01806640625, -5.76171875, -5.50537109375, -5.2490234375, -4.99267578125, -4.736328125, -4.47998046875, -4.2236328125, -3.96728515625, -3.7109375, -3.45458984375, -3.1982421875, -2.94189453125, -2.685546875, -2.42919921875, -2.1728515625, -1.91650390625, -1.66015625, -1.40380859375, -1.1474609375, -0.89111328125, -0.634765625, -0.37841796875, -0.1220703125, 0.13427734375, 0.390625, 0.64697265625, 0.9033203125, 1.15966796875, 1.416015625, 1.67236328125, 1.9287109375, 2.18505859375, 2.44140625, 2.69775390625, 2.9541015625, 3.21044921875, 3.466796875, 3.72314453125, 3.9794921875, 4.23583984375, 4.4921875, 4.74853515625, 5.0048828125, 5.26123046875, 5.517578125, 5.77392578125, 6.0302734375, 6.28662109375, 6.54296875, 6.79931640625, 7.0556640625, 7.31201171875, 7.568359375, 7.82470703125, 8.0810546875, 8.33740234375, 8.59375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 10.0, 11.0, 13.0, 20.0, 20.0, 19.0, 26.0, 37.0, 43.0, 48.0, 42.0, 68.0, 51.0, 49.0, 59.0, 66.0, 58.0, 52.0, 40.0, 38.0, 25.0, 32.0, 23.0, 18.0, 17.0, 18.0, 21.0, 9.0, 9.0, 6.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.66911697387695, -39.29092788696289, -37.912742614746094, -36.53455352783203, -35.15636444091797, -33.778175354003906, -32.399986267089844, -31.021800994873047, -29.643611907958984, -28.265422821044922, -26.887235641479492, -25.509048461914062, -24.130859375, -22.752670288085938, -21.374483108520508, -19.996295928955078, -18.618106842041016, -17.239917755126953, -15.861730575561523, -14.483542442321777, -13.105354309082031, -11.727166175842285, -10.348978042602539, -8.970789909362793, -7.592601776123047, -6.214413642883301, -4.836225509643555, -3.4580373764038086, -2.0798492431640625, -0.7016611099243164, 0.6765270233154297, 2.054715156555176, 3.4329071044921875, 4.811095237731934, 6.18928337097168, 7.567471504211426, 8.945659637451172, 10.323847770690918, 11.702035903930664, 13.08022403717041, 14.458412170410156, 15.836600303649902, 17.21478843688965, 18.592975616455078, 19.97116470336914, 21.349353790283203, 22.727540969848633, 24.105728149414062, 25.483917236328125, 26.862106323242188, 28.240293502807617, 29.618480682373047, 30.99666976928711, 32.37485885620117, 33.75304412841797, 35.13123321533203, 36.509422302246094, 37.887611389160156, 39.26580047607422, 40.643985748291016, 42.02217483520508, 43.40036392211914, 44.77854919433594, 46.15673828125, 47.53492736816406]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 10.0, 10.0, 8.0, 17.0, 16.0, 16.0, 29.0, 21.0, 24.0, 23.0, 35.0, 31.0, 40.0, 50.0, 51.0, 42.0, 45.0, 46.0, 54.0, 43.0, 46.0, 41.0, 34.0, 35.0, 40.0, 22.0, 25.0, 23.0, 18.0, 25.0, 16.0, 12.0, 10.0, 3.0, 11.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09554672241211, -40.7083854675293, -39.321224212646484, -37.934059143066406, -36.546897888183594, -35.15973663330078, -33.77257537841797, -32.385414123535156, -30.998252868652344, -29.61109161376953, -28.223928451538086, -26.836767196655273, -25.44960594177246, -24.062442779541016, -22.675281524658203, -21.28812026977539, -19.900957107543945, -18.513795852661133, -17.126632690429688, -15.739471435546875, -14.352310180664062, -12.965147972106934, -11.577985763549805, -10.190824508666992, -8.803662300109863, -7.416500568389893, -6.029338836669922, -4.642176628112793, -3.2550148963928223, -1.8678531646728516, -0.48069095611572266, 0.9064702987670898, 2.2936325073242188, 3.6807942390441895, 5.06795597076416, 6.455118179321289, 7.84227991104126, 9.22944164276123, 10.61660385131836, 12.003765106201172, 13.3909273147583, 14.77808952331543, 16.165250778198242, 17.552413940429688, 18.9395751953125, 20.326736450195312, 21.713897705078125, 23.101058959960938, 24.488222122192383, 25.875383377075195, 27.26254653930664, 28.649707794189453, 30.036869049072266, 31.424030303955078, 32.811195373535156, 34.19835662841797, 35.58551788330078, 36.972679138183594, 38.359840393066406, 39.74700164794922, 41.1341667175293, 42.52132797241211, 43.90848922729492, 45.295650482177734, 46.68281173706055]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 10.0, 13.0, 22.0, 23.0, 48.0, 59.0, 94.0, 135.0, 196.0, 314.0, 445.0, 676.0, 1100.0, 1742.0, 2935.0, 4821.0, 8480.0, 15336.0, 28358.0, 55106.0, 117470.0, 331195.0, 1103656.0, 1549676.0, 609556.0, 192868.0, 81404.0, 40173.0, 21282.0, 11449.0, 6509.0, 3605.0, 2121.0, 1273.0, 731.0, 509.0, 317.0, 216.0, 112.0, 90.0, 46.0, 44.0, 27.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.9375, -58.134765625, -56.33203125, -54.529296875, -52.7265625, -50.923828125, -49.12109375, -47.318359375, -45.515625, -43.712890625, -41.91015625, -40.107421875, -38.3046875, -36.501953125, -34.69921875, -32.896484375, -31.09375, -29.291015625, -27.48828125, -25.685546875, -23.8828125, -22.080078125, -20.27734375, -18.474609375, -16.671875, -14.869140625, -13.06640625, -11.263671875, -9.4609375, -7.658203125, -5.85546875, -4.052734375, -2.25, -0.447265625, 1.35546875, 3.158203125, 4.9609375, 6.763671875, 8.56640625, 10.369140625, 12.171875, 13.974609375, 15.77734375, 17.580078125, 19.3828125, 21.185546875, 22.98828125, 24.791015625, 26.59375, 28.396484375, 30.19921875, 32.001953125, 33.8046875, 35.607421875, 37.41015625, 39.212890625, 41.015625, 42.818359375, 44.62109375, 46.423828125, 48.2265625, 50.029296875, 51.83203125, 53.634765625, 55.4375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 12.0, 17.0, 15.0, 14.0, 26.0, 25.0, 25.0, 31.0, 29.0, 29.0, 39.0, 46.0, 41.0, 34.0, 35.0, 50.0, 27.0, 34.0, 39.0, 54.0, 43.0, 33.0, 31.0, 36.0, 24.0, 14.0, 28.0, 18.0, 11.0, 21.0, 12.0, 19.0, 6.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-34.53125, -33.583251953125, -32.63525390625, -31.687255859375, -30.7392578125, -29.791259765625, -28.84326171875, -27.895263671875, -26.947265625, -25.999267578125, -25.05126953125, -24.103271484375, -23.1552734375, -22.207275390625, -21.25927734375, -20.311279296875, -19.36328125, -18.415283203125, -17.46728515625, -16.519287109375, -15.5712890625, -14.623291015625, -13.67529296875, -12.727294921875, -11.779296875, -10.831298828125, -9.88330078125, -8.935302734375, -7.9873046875, -7.039306640625, -6.09130859375, -5.143310546875, -4.1953125, -3.247314453125, -2.29931640625, -1.351318359375, -0.4033203125, 0.544677734375, 1.49267578125, 2.440673828125, 3.388671875, 4.336669921875, 5.28466796875, 6.232666015625, 7.1806640625, 8.128662109375, 9.07666015625, 10.024658203125, 10.97265625, 11.920654296875, 12.86865234375, 13.816650390625, 14.7646484375, 15.712646484375, 16.66064453125, 17.608642578125, 18.556640625, 19.504638671875, 20.45263671875, 21.400634765625, 22.3486328125, 23.296630859375, 24.24462890625, 25.192626953125, 26.140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 16.0, 24.0, 39.0, 55.0, 68.0, 107.0, 175.0, 254.0, 410.0, 698.0, 1103.0, 1747.0, 2784.0, 4998.0, 8297.0, 15276.0, 28117.0, 53791.0, 110263.0, 241838.0, 597793.0, 1499201.0, 953570.0, 358724.0, 156486.0, 74229.0, 37562.0, 19931.0, 11108.0, 6221.0, 3613.0, 2092.0, 1350.0, 851.0, 535.0, 356.0, 184.0, 131.0, 82.0, 61.0, 47.0, 26.0, 22.0, 16.0, 5.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.90625, -49.13427734375, -47.3623046875, -45.59033203125, -43.818359375, -42.04638671875, -40.2744140625, -38.50244140625, -36.73046875, -34.95849609375, -33.1865234375, -31.41455078125, -29.642578125, -27.87060546875, -26.0986328125, -24.32666015625, -22.5546875, -20.78271484375, -19.0107421875, -17.23876953125, -15.466796875, -13.69482421875, -11.9228515625, -10.15087890625, -8.37890625, -6.60693359375, -4.8349609375, -3.06298828125, -1.291015625, 0.48095703125, 2.2529296875, 4.02490234375, 5.796875, 7.56884765625, 9.3408203125, 11.11279296875, 12.884765625, 14.65673828125, 16.4287109375, 18.20068359375, 19.97265625, 21.74462890625, 23.5166015625, 25.28857421875, 27.060546875, 28.83251953125, 30.6044921875, 32.37646484375, 34.1484375, 35.92041015625, 37.6923828125, 39.46435546875, 41.236328125, 43.00830078125, 44.7802734375, 46.55224609375, 48.32421875, 50.09619140625, 51.8681640625, 53.64013671875, 55.412109375, 57.18408203125, 58.9560546875, 60.72802734375, 62.5]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 18.0, 19.0, 23.0, 24.0, 36.0, 56.0, 59.0, 75.0, 78.0, 99.0, 121.0, 142.0, 207.0, 186.0, 251.0, 314.0, 347.0, 291.0, 305.0, 262.0, 210.0, 149.0, 143.0, 120.0, 89.0, 74.0, 60.0, 44.0, 42.0, 42.0, 25.0, 26.0, 28.0, 16.0, 12.0, 8.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.3671875, -13.8990478515625, -13.430908203125, -12.9627685546875, -12.49462890625, -12.0264892578125, -11.558349609375, -11.0902099609375, -10.6220703125, -10.1539306640625, -9.685791015625, -9.2176513671875, -8.74951171875, -8.2813720703125, -7.813232421875, -7.3450927734375, -6.876953125, -6.4088134765625, -5.940673828125, -5.4725341796875, -5.00439453125, -4.5362548828125, -4.068115234375, -3.5999755859375, -3.1318359375, -2.6636962890625, -2.195556640625, -1.7274169921875, -1.25927734375, -0.7911376953125, -0.322998046875, 0.1451416015625, 0.61328125, 1.0814208984375, 1.549560546875, 2.0177001953125, 2.48583984375, 2.9539794921875, 3.422119140625, 3.8902587890625, 4.3583984375, 4.8265380859375, 5.294677734375, 5.7628173828125, 6.23095703125, 6.6990966796875, 7.167236328125, 7.6353759765625, 8.103515625, 8.5716552734375, 9.039794921875, 9.5079345703125, 9.97607421875, 10.4442138671875, 10.912353515625, 11.3804931640625, 11.8486328125, 12.3167724609375, 12.784912109375, 13.2530517578125, 13.72119140625, 14.1893310546875, 14.657470703125, 15.1256103515625, 15.59375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 5.0, 5.0, 11.0, 17.0, 19.0, 24.0, 26.0, 37.0, 43.0, 56.0, 51.0, 63.0, 54.0, 63.0, 59.0, 68.0, 68.0, 52.0, 56.0, 38.0, 33.0, 25.0, 28.0, 24.0, 17.0, 14.0, 5.0, 3.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03245544433594, -38.56648254394531, -37.10050964355469, -35.63453674316406, -34.16856384277344, -32.70259094238281, -31.236618041992188, -29.770645141601562, -28.304672241210938, -26.838699340820312, -25.372726440429688, -23.906753540039062, -22.440780639648438, -20.974807739257812, -19.508834838867188, -18.042861938476562, -16.576889038085938, -15.110916137695312, -13.644943237304688, -12.178970336914062, -10.712997436523438, -9.247024536132812, -7.7810516357421875, -6.3150787353515625, -4.8491058349609375, -3.3831329345703125, -1.9171600341796875, -0.4511871337890625, 1.0147857666015625, 2.4807586669921875, 3.9467315673828125, 5.4127044677734375, 6.878681182861328, 8.344654083251953, 9.810626983642578, 11.276599884033203, 12.742572784423828, 14.208545684814453, 15.674518585205078, 17.140491485595703, 18.606464385986328, 20.072437286376953, 21.538410186767578, 23.004383087158203, 24.470355987548828, 25.936328887939453, 27.402301788330078, 28.868274688720703, 30.334247589111328, 31.800220489501953, 33.26619338989258, 34.7321662902832, 36.19813919067383, 37.66411209106445, 39.13008499145508, 40.5960578918457, 42.06203079223633, 43.52800369262695, 44.99397659301758, 46.4599494934082, 47.92592239379883, 49.39189529418945, 50.85786819458008, 52.3238410949707, 53.78981399536133]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 14.0, 5.0, 8.0, 12.0, 20.0, 23.0, 22.0, 26.0, 28.0, 21.0, 47.0, 28.0, 37.0, 42.0, 41.0, 40.0, 36.0, 40.0, 34.0, 50.0, 44.0, 35.0, 40.0, 37.0, 39.0, 32.0, 24.0, 23.0, 26.0, 20.0, 14.0, 16.0, 10.0, 15.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.90105438232422, -34.77497482299805, -33.64889907836914, -32.52281951904297, -31.396739959716797, -30.270662307739258, -29.14458465576172, -28.018505096435547, -26.892427444458008, -25.76634979248047, -24.640270233154297, -23.514192581176758, -22.38811492919922, -21.262035369873047, -20.135957717895508, -19.00988006591797, -17.883800506591797, -16.757722854614258, -15.631643295288086, -14.505565643310547, -13.379487037658691, -12.253408432006836, -11.127330780029297, -10.001252174377441, -8.875173568725586, -7.7490949630737305, -6.623016834259033, -5.496938705444336, -4.3708600997924805, -3.244781494140625, -2.1187033653259277, -0.9926252365112305, 0.13345718383789062, 1.259535551071167, 2.3856139183044434, 3.5116922855377197, 4.637770652770996, 5.763849258422852, 6.889927387237549, 8.016005516052246, 9.142084121704102, 10.268162727355957, 11.394241333007812, 12.520318984985352, 13.646397590637207, 14.772476196289062, 15.898553848266602, 17.02463150024414, 18.150711059570312, 19.27678871154785, 20.402868270874023, 21.528945922851562, 22.655025482177734, 23.781103134155273, 24.907180786132812, 26.033260345458984, 27.159337997436523, 28.285415649414062, 29.411495208740234, 30.537572860717773, 31.663650512695312, 32.789730072021484, 33.915809631347656, 35.04188537597656, 36.167964935302734]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 18.0, 20.0, 24.0, 41.0, 65.0, 76.0, 135.0, 206.0, 346.0, 556.0, 969.0, 1730.0, 3159.0, 5925.0, 11661.0, 23425.0, 51624.0, 123203.0, 305118.0, 301255.0, 120544.0, 50393.0, 23352.0, 11430.0, 5922.0, 3120.0, 1717.0, 936.0, 594.0, 345.0, 190.0, 140.0, 95.0, 55.0, 41.0, 29.0, 30.0, 20.0, 8.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-78.25, -75.55078125, -72.8515625, -70.15234375, -67.453125, -64.75390625, -62.0546875, -59.35546875, -56.65625, -53.95703125, -51.2578125, -48.55859375, -45.859375, -43.16015625, -40.4609375, -37.76171875, -35.0625, -32.36328125, -29.6640625, -26.96484375, -24.265625, -21.56640625, -18.8671875, -16.16796875, -13.46875, -10.76953125, -8.0703125, -5.37109375, -2.671875, 0.02734375, 2.7265625, 5.42578125, 8.125, 10.82421875, 13.5234375, 16.22265625, 18.921875, 21.62109375, 24.3203125, 27.01953125, 29.71875, 32.41796875, 35.1171875, 37.81640625, 40.515625, 43.21484375, 45.9140625, 48.61328125, 51.3125, 54.01171875, 56.7109375, 59.41015625, 62.109375, 64.80859375, 67.5078125, 70.20703125, 72.90625, 75.60546875, 78.3046875, 81.00390625, 83.703125, 86.40234375, 89.1015625, 91.80078125, 94.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 9.0, 9.0, 4.0, 14.0, 19.0, 18.0, 22.0, 35.0, 28.0, 30.0, 38.0, 36.0, 40.0, 39.0, 44.0, 48.0, 36.0, 42.0, 38.0, 37.0, 50.0, 31.0, 38.0, 49.0, 40.0, 26.0, 23.0, 25.0, 21.0, 19.0, 25.0, 13.0, 9.0, 10.0, 6.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.21875, -35.0673828125, -33.916015625, -32.7646484375, -31.61328125, -30.4619140625, -29.310546875, -28.1591796875, -27.0078125, -25.8564453125, -24.705078125, -23.5537109375, -22.40234375, -21.2509765625, -20.099609375, -18.9482421875, -17.796875, -16.6455078125, -15.494140625, -14.3427734375, -13.19140625, -12.0400390625, -10.888671875, -9.7373046875, -8.5859375, -7.4345703125, -6.283203125, -5.1318359375, -3.98046875, -2.8291015625, -1.677734375, -0.5263671875, 0.625, 1.7763671875, 2.927734375, 4.0791015625, 5.23046875, 6.3818359375, 7.533203125, 8.6845703125, 9.8359375, 10.9873046875, 12.138671875, 13.2900390625, 14.44140625, 15.5927734375, 16.744140625, 17.8955078125, 19.046875, 20.1982421875, 21.349609375, 22.5009765625, 23.65234375, 24.8037109375, 25.955078125, 27.1064453125, 28.2578125, 29.4091796875, 30.560546875, 31.7119140625, 32.86328125, 34.0146484375, 35.166015625, 36.3173828125, 37.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 6.0, 4.0, 10.0, 18.0, 34.0, 45.0, 73.0, 81.0, 133.0, 193.0, 301.0, 470.0, 672.0, 1053.0, 1615.0, 2682.0, 4449.0, 7539.0, 13317.0, 24864.0, 49374.0, 112462.0, 291515.0, 305570.0, 120250.0, 52469.0, 25785.0, 13612.0, 7847.0, 4465.0, 2741.0, 1678.0, 1092.0, 672.0, 489.0, 301.0, 217.0, 149.0, 90.0, 62.0, 42.0, 32.0, 24.0, 17.0, 14.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-77.0625, -74.5791015625, -72.095703125, -69.6123046875, -67.12890625, -64.6455078125, -62.162109375, -59.6787109375, -57.1953125, -54.7119140625, -52.228515625, -49.7451171875, -47.26171875, -44.7783203125, -42.294921875, -39.8115234375, -37.328125, -34.8447265625, -32.361328125, -29.8779296875, -27.39453125, -24.9111328125, -22.427734375, -19.9443359375, -17.4609375, -14.9775390625, -12.494140625, -10.0107421875, -7.52734375, -5.0439453125, -2.560546875, -0.0771484375, 2.40625, 4.8896484375, 7.373046875, 9.8564453125, 12.33984375, 14.8232421875, 17.306640625, 19.7900390625, 22.2734375, 24.7568359375, 27.240234375, 29.7236328125, 32.20703125, 34.6904296875, 37.173828125, 39.6572265625, 42.140625, 44.6240234375, 47.107421875, 49.5908203125, 52.07421875, 54.5576171875, 57.041015625, 59.5244140625, 62.0078125, 64.4912109375, 66.974609375, 69.4580078125, 71.94140625, 74.4248046875, 76.908203125, 79.3916015625, 81.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 6.0, 5.0, 9.0, 11.0, 15.0, 11.0, 11.0, 13.0, 24.0, 30.0, 20.0, 36.0, 28.0, 34.0, 36.0, 49.0, 43.0, 30.0, 33.0, 54.0, 39.0, 44.0, 42.0, 36.0, 37.0, 39.0, 33.0, 31.0, 25.0, 29.0, 21.0, 23.0, 21.0, 14.0, 12.0, 7.0, 5.0, 5.0, 8.0, 3.0, 7.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.376220703125, -21.64306640625, -20.909912109375, -20.1767578125, -19.443603515625, -18.71044921875, -17.977294921875, -17.244140625, -16.510986328125, -15.77783203125, -15.044677734375, -14.3115234375, -13.578369140625, -12.84521484375, -12.112060546875, -11.37890625, -10.645751953125, -9.91259765625, -9.179443359375, -8.4462890625, -7.713134765625, -6.97998046875, -6.246826171875, -5.513671875, -4.780517578125, -4.04736328125, -3.314208984375, -2.5810546875, -1.847900390625, -1.11474609375, -0.381591796875, 0.3515625, 1.084716796875, 1.81787109375, 2.551025390625, 3.2841796875, 4.017333984375, 4.75048828125, 5.483642578125, 6.216796875, 6.949951171875, 7.68310546875, 8.416259765625, 9.1494140625, 9.882568359375, 10.61572265625, 11.348876953125, 12.08203125, 12.815185546875, 13.54833984375, 14.281494140625, 15.0146484375, 15.747802734375, 16.48095703125, 17.214111328125, 17.947265625, 18.680419921875, 19.41357421875, 20.146728515625, 20.8798828125, 21.613037109375, 22.34619140625, 23.079345703125, 23.8125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 9.0, 14.0, 25.0, 33.0, 27.0, 76.0, 95.0, 135.0, 206.0, 300.0, 502.0, 885.0, 1489.0, 2845.0, 5399.0, 11367.0, 27477.0, 75206.0, 268835.0, 446563.0, 130843.0, 42612.0, 17100.0, 7639.0, 3816.0, 2067.0, 1094.0, 690.0, 412.0, 283.0, 163.0, 103.0, 72.0, 44.0, 40.0, 32.0, 14.0, 10.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-26.375, -25.530517578125, -24.68603515625, -23.841552734375, -22.9970703125, -22.152587890625, -21.30810546875, -20.463623046875, -19.619140625, -18.774658203125, -17.93017578125, -17.085693359375, -16.2412109375, -15.396728515625, -14.55224609375, -13.707763671875, -12.86328125, -12.018798828125, -11.17431640625, -10.329833984375, -9.4853515625, -8.640869140625, -7.79638671875, -6.951904296875, -6.107421875, -5.262939453125, -4.41845703125, -3.573974609375, -2.7294921875, -1.885009765625, -1.04052734375, -0.196044921875, 0.6484375, 1.492919921875, 2.33740234375, 3.181884765625, 4.0263671875, 4.870849609375, 5.71533203125, 6.559814453125, 7.404296875, 8.248779296875, 9.09326171875, 9.937744140625, 10.7822265625, 11.626708984375, 12.47119140625, 13.315673828125, 14.16015625, 15.004638671875, 15.84912109375, 16.693603515625, 17.5380859375, 18.382568359375, 19.22705078125, 20.071533203125, 20.916015625, 21.760498046875, 22.60498046875, 23.449462890625, 24.2939453125, 25.138427734375, 25.98291015625, 26.827392578125, 27.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 11.0, 15.0, 22.0, 15.0, 46.0, 46.0, 57.0, 74.0, 90.0, 106.0, 110.0, 78.0, 76.0, 56.0, 46.0, 32.0, 21.0, 18.0, 9.0, 9.0, 9.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002593994140625, -0.0025217533111572266, -0.002449512481689453, -0.0023772716522216797, -0.0023050308227539062, -0.002232789993286133, -0.0021605491638183594, -0.002088308334350586, -0.0020160675048828125, -0.001943826675415039, -0.0018715858459472656, -0.0017993450164794922, -0.0017271041870117188, -0.0016548633575439453, -0.0015826225280761719, -0.0015103816986083984, -0.001438140869140625, -0.0013659000396728516, -0.0012936592102050781, -0.0012214183807373047, -0.0011491775512695312, -0.0010769367218017578, -0.0010046958923339844, -0.0009324550628662109, -0.0008602142333984375, -0.0007879734039306641, -0.0007157325744628906, -0.0006434917449951172, -0.0005712509155273438, -0.0004990100860595703, -0.0004267692565917969, -0.00035452842712402344, -0.00028228759765625, -0.00021004676818847656, -0.00013780593872070312, -6.556510925292969e-05, 6.67572021484375e-06, 7.891654968261719e-05, 0.00015115737915039062, 0.00022339820861816406, 0.0002956390380859375, 0.00036787986755371094, 0.0004401206970214844, 0.0005123615264892578, 0.0005846023559570312, 0.0006568431854248047, 0.0007290840148925781, 0.0008013248443603516, 0.000873565673828125, 0.0009458065032958984, 0.0010180473327636719, 0.0010902881622314453, 0.0011625289916992188, 0.0012347698211669922, 0.0013070106506347656, 0.001379251480102539, 0.0014514923095703125, 0.001523733139038086, 0.0015959739685058594, 0.0016682147979736328, 0.0017404556274414062, 0.0018126964569091797, 0.0018849372863769531, 0.0019571781158447266, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 3.0, 10.0, 16.0, 15.0, 36.0, 44.0, 48.0, 94.0, 121.0, 209.0, 281.0, 469.0, 693.0, 1132.0, 1913.0, 3295.0, 6165.0, 12607.0, 26493.0, 62347.0, 157100.0, 336697.0, 254709.0, 103027.0, 42064.0, 18765.0, 8950.0, 4600.0, 2602.0, 1457.0, 867.0, 589.0, 334.0, 245.0, 189.0, 128.0, 65.0, 49.0, 35.0, 29.0, 15.0, 17.0, 12.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.15625, -25.358154296875, -24.56005859375, -23.761962890625, -22.9638671875, -22.165771484375, -21.36767578125, -20.569580078125, -19.771484375, -18.973388671875, -18.17529296875, -17.377197265625, -16.5791015625, -15.781005859375, -14.98291015625, -14.184814453125, -13.38671875, -12.588623046875, -11.79052734375, -10.992431640625, -10.1943359375, -9.396240234375, -8.59814453125, -7.800048828125, -7.001953125, -6.203857421875, -5.40576171875, -4.607666015625, -3.8095703125, -3.011474609375, -2.21337890625, -1.415283203125, -0.6171875, 0.180908203125, 0.97900390625, 1.777099609375, 2.5751953125, 3.373291015625, 4.17138671875, 4.969482421875, 5.767578125, 6.565673828125, 7.36376953125, 8.161865234375, 8.9599609375, 9.758056640625, 10.55615234375, 11.354248046875, 12.15234375, 12.950439453125, 13.74853515625, 14.546630859375, 15.3447265625, 16.142822265625, 16.94091796875, 17.739013671875, 18.537109375, 19.335205078125, 20.13330078125, 20.931396484375, 21.7294921875, 22.527587890625, 23.32568359375, 24.123779296875, 24.921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 13.0, 13.0, 18.0, 25.0, 25.0, 41.0, 46.0, 54.0, 80.0, 67.0, 74.0, 66.0, 85.0, 66.0, 58.0, 59.0, 46.0, 40.0, 26.0, 20.0, 16.0, 15.0, 11.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0093994140625, -7.745361328125, -7.4813232421875, -7.21728515625, -6.9532470703125, -6.689208984375, -6.4251708984375, -6.1611328125, -5.8970947265625, -5.633056640625, -5.3690185546875, -5.10498046875, -4.8409423828125, -4.576904296875, -4.3128662109375, -4.048828125, -3.7847900390625, -3.520751953125, -3.2567138671875, -2.99267578125, -2.7286376953125, -2.464599609375, -2.2005615234375, -1.9365234375, -1.6724853515625, -1.408447265625, -1.1444091796875, -0.88037109375, -0.6163330078125, -0.352294921875, -0.0882568359375, 0.17578125, 0.4398193359375, 0.703857421875, 0.9678955078125, 1.23193359375, 1.4959716796875, 1.760009765625, 2.0240478515625, 2.2880859375, 2.5521240234375, 2.816162109375, 3.0802001953125, 3.34423828125, 3.6082763671875, 3.872314453125, 4.1363525390625, 4.400390625, 4.6644287109375, 4.928466796875, 5.1925048828125, 5.45654296875, 5.7205810546875, 5.984619140625, 6.2486572265625, 6.5126953125, 6.7767333984375, 7.040771484375, 7.3048095703125, 7.56884765625, 7.8328857421875, 8.096923828125, 8.3609619140625, 8.625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 7.0, 9.0, 9.0, 14.0, 20.0, 10.0, 20.0, 30.0, 42.0, 38.0, 57.0, 48.0, 57.0, 51.0, 70.0, 56.0, 71.0, 58.0, 70.0, 41.0, 37.0, 40.0, 26.0, 27.0, 13.0, 19.0, 11.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.675437927246094, -33.38908386230469, -32.102725982666016, -30.816370010375977, -29.530014038085938, -28.2436580657959, -26.95730209350586, -25.67094612121582, -24.38459014892578, -23.098234176635742, -21.811878204345703, -20.525522232055664, -19.239166259765625, -17.952810287475586, -16.666454315185547, -15.380098342895508, -14.093742370605469, -12.80738639831543, -11.52103042602539, -10.234674453735352, -8.948318481445312, -7.661962509155273, -6.375606536865234, -5.089250564575195, -3.8028945922851562, -2.516538619995117, -1.2301826477050781, 0.05617332458496094, 1.342529296875, 2.628885269165039, 3.915241241455078, 5.201597213745117, 6.487953186035156, 7.774309158325195, 9.060665130615234, 10.347021102905273, 11.633377075195312, 12.919733047485352, 14.20608901977539, 15.49244499206543, 16.77880096435547, 18.065156936645508, 19.351512908935547, 20.637868881225586, 21.924224853515625, 23.210580825805664, 24.496936798095703, 25.783292770385742, 27.06964874267578, 28.35600471496582, 29.64236068725586, 30.9287166595459, 32.21507263183594, 33.501426696777344, 34.787784576416016, 36.07414245605469, 37.360496520996094, 38.6468505859375, 39.93320846557617, 41.219566345214844, 42.50592041015625, 43.792274475097656, 45.07863235473633, 46.364990234375, 47.651344299316406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 20.0, 26.0, 34.0, 41.0, 42.0, 26.0, 35.0, 51.0, 40.0, 32.0, 38.0, 43.0, 55.0, 35.0, 44.0, 44.0, 40.0, 28.0, 25.0, 20.0, 25.0, 28.0, 21.0, 19.0, 13.0, 15.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.04462432861328, -32.96225357055664, -31.8798828125, -30.797510147094727, -29.715139389038086, -28.632768630981445, -27.550395965576172, -26.46802520751953, -25.38565444946289, -24.30328369140625, -23.22091293334961, -22.138540267944336, -21.056169509887695, -19.973798751831055, -18.89142608642578, -17.80905532836914, -16.7266845703125, -15.64431381225586, -14.561942100524902, -13.479570388793945, -12.397199630737305, -11.314828872680664, -10.232457160949707, -9.15008544921875, -8.06771469116211, -6.9853434562683105, -5.902972221374512, -4.820600986480713, -3.738229751586914, -2.6558585166931152, -1.5734872817993164, -0.4911160469055176, 0.5912551879882812, 1.67362642288208, 2.755997657775879, 3.8383688926696777, 4.920740127563477, 6.003111362457275, 7.085482597351074, 8.167854309082031, 9.250225067138672, 10.332595825195312, 11.41496753692627, 12.497339248657227, 13.579710006713867, 14.662080764770508, 15.744452476501465, 16.826824188232422, 17.909194946289062, 18.991565704345703, 20.073936462402344, 21.156309127807617, 22.238679885864258, 23.3210506439209, 24.403423309326172, 25.485794067382812, 26.568164825439453, 27.650535583496094, 28.732906341552734, 29.815279006958008, 30.89764976501465, 31.98002052307129, 33.06239318847656, 34.1447639465332, 35.227134704589844]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 18.0, 16.0, 33.0, 47.0, 68.0, 103.0, 146.0, 218.0, 378.0, 606.0, 909.0, 1549.0, 2423.0, 4103.0, 6944.0, 12397.0, 21484.0, 37783.0, 67915.0, 119462.0, 188676.0, 213966.0, 155537.0, 92330.0, 52299.0, 29274.0, 16477.0, 9322.0, 5585.0, 3248.0, 1948.0, 1160.0, 741.0, 491.0, 323.0, 199.0, 119.0, 84.0, 54.0, 39.0, 18.0, 16.0, 17.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-53.96875, -52.4384765625, -50.908203125, -49.3779296875, -47.84765625, -46.3173828125, -44.787109375, -43.2568359375, -41.7265625, -40.1962890625, -38.666015625, -37.1357421875, -35.60546875, -34.0751953125, -32.544921875, -31.0146484375, -29.484375, -27.9541015625, -26.423828125, -24.8935546875, -23.36328125, -21.8330078125, -20.302734375, -18.7724609375, -17.2421875, -15.7119140625, -14.181640625, -12.6513671875, -11.12109375, -9.5908203125, -8.060546875, -6.5302734375, -5.0, -3.4697265625, -1.939453125, -0.4091796875, 1.12109375, 2.6513671875, 4.181640625, 5.7119140625, 7.2421875, 8.7724609375, 10.302734375, 11.8330078125, 13.36328125, 14.8935546875, 16.423828125, 17.9541015625, 19.484375, 21.0146484375, 22.544921875, 24.0751953125, 25.60546875, 27.1357421875, 28.666015625, 30.1962890625, 31.7265625, 33.2568359375, 34.787109375, 36.3173828125, 37.84765625, 39.3779296875, 40.908203125, 42.4384765625, 43.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 5.0, 10.0, 16.0, 19.0, 27.0, 28.0, 26.0, 26.0, 38.0, 47.0, 36.0, 43.0, 33.0, 41.0, 44.0, 33.0, 51.0, 51.0, 57.0, 40.0, 55.0, 43.0, 23.0, 27.0, 27.0, 22.0, 16.0, 24.0, 13.0, 12.0, 14.0, 6.0, 4.0, 4.0, 8.0, 1.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -34.04638671875, -32.9365234375, -31.82666015625, -30.716796875, -29.60693359375, -28.4970703125, -27.38720703125, -26.27734375, -25.16748046875, -24.0576171875, -22.94775390625, -21.837890625, -20.72802734375, -19.6181640625, -18.50830078125, -17.3984375, -16.28857421875, -15.1787109375, -14.06884765625, -12.958984375, -11.84912109375, -10.7392578125, -9.62939453125, -8.51953125, -7.40966796875, -6.2998046875, -5.18994140625, -4.080078125, -2.97021484375, -1.8603515625, -0.75048828125, 0.359375, 1.46923828125, 2.5791015625, 3.68896484375, 4.798828125, 5.90869140625, 7.0185546875, 8.12841796875, 9.23828125, 10.34814453125, 11.4580078125, 12.56787109375, 13.677734375, 14.78759765625, 15.8974609375, 17.00732421875, 18.1171875, 19.22705078125, 20.3369140625, 21.44677734375, 22.556640625, 23.66650390625, 24.7763671875, 25.88623046875, 26.99609375, 28.10595703125, 29.2158203125, 30.32568359375, 31.435546875, 32.54541015625, 33.6552734375, 34.76513671875, 35.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 17.0, 17.0, 41.0, 58.0, 76.0, 134.0, 211.0, 285.0, 484.0, 700.0, 1100.0, 1754.0, 2741.0, 4315.0, 6872.0, 10901.0, 17583.0, 28749.0, 47217.0, 78003.0, 124260.0, 179172.0, 187472.0, 135345.0, 85541.0, 52170.0, 31567.0, 19417.0, 11903.0, 7394.0, 4760.0, 2883.0, 1908.0, 1218.0, 766.0, 537.0, 323.0, 230.0, 138.0, 91.0, 72.0, 38.0, 34.0, 23.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.5, -48.00439453125, -46.5087890625, -45.01318359375, -43.517578125, -42.02197265625, -40.5263671875, -39.03076171875, -37.53515625, -36.03955078125, -34.5439453125, -33.04833984375, -31.552734375, -30.05712890625, -28.5615234375, -27.06591796875, -25.5703125, -24.07470703125, -22.5791015625, -21.08349609375, -19.587890625, -18.09228515625, -16.5966796875, -15.10107421875, -13.60546875, -12.10986328125, -10.6142578125, -9.11865234375, -7.623046875, -6.12744140625, -4.6318359375, -3.13623046875, -1.640625, -0.14501953125, 1.3505859375, 2.84619140625, 4.341796875, 5.83740234375, 7.3330078125, 8.82861328125, 10.32421875, 11.81982421875, 13.3154296875, 14.81103515625, 16.306640625, 17.80224609375, 19.2978515625, 20.79345703125, 22.2890625, 23.78466796875, 25.2802734375, 26.77587890625, 28.271484375, 29.76708984375, 31.2626953125, 32.75830078125, 34.25390625, 35.74951171875, 37.2451171875, 38.74072265625, 40.236328125, 41.73193359375, 43.2275390625, 44.72314453125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 4.0, 6.0, 14.0, 20.0, 14.0, 20.0, 16.0, 12.0, 17.0, 19.0, 27.0, 42.0, 39.0, 33.0, 45.0, 33.0, 39.0, 49.0, 49.0, 42.0, 40.0, 40.0, 31.0, 40.0, 34.0, 32.0, 34.0, 25.0, 28.0, 23.0, 22.0, 14.0, 13.0, 19.0, 10.0, 6.0, 5.0, 7.0, 4.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.671875, -19.99560546875, -19.3193359375, -18.64306640625, -17.966796875, -17.29052734375, -16.6142578125, -15.93798828125, -15.26171875, -14.58544921875, -13.9091796875, -13.23291015625, -12.556640625, -11.88037109375, -11.2041015625, -10.52783203125, -9.8515625, -9.17529296875, -8.4990234375, -7.82275390625, -7.146484375, -6.47021484375, -5.7939453125, -5.11767578125, -4.44140625, -3.76513671875, -3.0888671875, -2.41259765625, -1.736328125, -1.06005859375, -0.3837890625, 0.29248046875, 0.96875, 1.64501953125, 2.3212890625, 2.99755859375, 3.673828125, 4.35009765625, 5.0263671875, 5.70263671875, 6.37890625, 7.05517578125, 7.7314453125, 8.40771484375, 9.083984375, 9.76025390625, 10.4365234375, 11.11279296875, 11.7890625, 12.46533203125, 13.1416015625, 13.81787109375, 14.494140625, 15.17041015625, 15.8466796875, 16.52294921875, 17.19921875, 17.87548828125, 18.5517578125, 19.22802734375, 19.904296875, 20.58056640625, 21.2568359375, 21.93310546875, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 11.0, 16.0, 25.0, 46.0, 60.0, 79.0, 117.0, 177.0, 259.0, 384.0, 605.0, 897.0, 1549.0, 2340.0, 3885.0, 6554.0, 11388.0, 21592.0, 42626.0, 89888.0, 194805.0, 302208.0, 190256.0, 87595.0, 41638.0, 21436.0, 11470.0, 6386.0, 3869.0, 2300.0, 1395.0, 934.0, 590.0, 359.0, 262.0, 166.0, 108.0, 82.0, 48.0, 36.0, 21.0, 30.0, 12.0, 11.0, 3.0, 5.0, 5.0, 0.0, 4.0, 4.0, 0.0, 3.0], "bins": [-18.5, -17.947509765625, -17.39501953125, -16.842529296875, -16.2900390625, -15.737548828125, -15.18505859375, -14.632568359375, -14.080078125, -13.527587890625, -12.97509765625, -12.422607421875, -11.8701171875, -11.317626953125, -10.76513671875, -10.212646484375, -9.66015625, -9.107666015625, -8.55517578125, -8.002685546875, -7.4501953125, -6.897705078125, -6.34521484375, -5.792724609375, -5.240234375, -4.687744140625, -4.13525390625, -3.582763671875, -3.0302734375, -2.477783203125, -1.92529296875, -1.372802734375, -0.8203125, -0.267822265625, 0.28466796875, 0.837158203125, 1.3896484375, 1.942138671875, 2.49462890625, 3.047119140625, 3.599609375, 4.152099609375, 4.70458984375, 5.257080078125, 5.8095703125, 6.362060546875, 6.91455078125, 7.467041015625, 8.01953125, 8.572021484375, 9.12451171875, 9.677001953125, 10.2294921875, 10.781982421875, 11.33447265625, 11.886962890625, 12.439453125, 12.991943359375, 13.54443359375, 14.096923828125, 14.6494140625, 15.201904296875, 15.75439453125, 16.306884765625, 16.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 17.0, 23.0, 47.0, 56.0, 77.0, 99.0, 146.0, 132.0, 97.0, 68.0, 45.0, 29.0, 32.0, 25.0, 14.0, 12.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.00199282169342041, -0.0019161701202392578, -0.0018395185470581055, -0.0017628669738769531, -0.0016862154006958008, -0.0016095638275146484, -0.001532912254333496, -0.0014562606811523438, -0.0013796091079711914, -0.001302957534790039, -0.0012263059616088867, -0.0011496543884277344, -0.001073002815246582, -0.0009963512420654297, -0.0009196996688842773, -0.000843048095703125, -0.0007663965225219727, -0.0006897449493408203, -0.000613093376159668, -0.0005364418029785156, -0.0004597902297973633, -0.00038313865661621094, -0.0003064870834350586, -0.00022983551025390625, -0.0001531839370727539, -7.653236389160156e-05, 1.1920928955078125e-07, 7.677078247070312e-05, 0.00015342235565185547, 0.0002300739288330078, 0.00030672550201416016, 0.0003833770751953125, 0.00046002864837646484, 0.0005366802215576172, 0.0006133317947387695, 0.0006899833679199219, 0.0007666349411010742, 0.0008432865142822266, 0.0009199380874633789, 0.0009965896606445312, 0.0010732412338256836, 0.001149892807006836, 0.0012265443801879883, 0.0013031959533691406, 0.001379847526550293, 0.0014564990997314453, 0.0015331506729125977, 0.00160980224609375, 0.0016864538192749023, 0.0017631053924560547, 0.001839756965637207, 0.0019164085388183594, 0.0019930601119995117, 0.002069711685180664, 0.0021463632583618164, 0.0022230148315429688, 0.002299666404724121, 0.0023763179779052734, 0.0024529695510864258, 0.002529621124267578, 0.0026062726974487305, 0.002682924270629883, 0.002759575843811035, 0.0028362274169921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 7.0, 15.0, 23.0, 31.0, 42.0, 57.0, 88.0, 153.0, 199.0, 312.0, 559.0, 869.0, 1626.0, 2810.0, 5282.0, 9870.0, 20253.0, 43133.0, 96989.0, 217999.0, 318493.0, 179618.0, 79028.0, 35383.0, 16846.0, 8518.0, 4454.0, 2445.0, 1321.0, 796.0, 490.0, 283.0, 174.0, 119.0, 82.0, 51.0, 24.0, 29.0, 23.0, 14.0, 11.0, 12.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.834716796875, -17.24755859375, -16.660400390625, -16.0732421875, -15.486083984375, -14.89892578125, -14.311767578125, -13.724609375, -13.137451171875, -12.55029296875, -11.963134765625, -11.3759765625, -10.788818359375, -10.20166015625, -9.614501953125, -9.02734375, -8.440185546875, -7.85302734375, -7.265869140625, -6.6787109375, -6.091552734375, -5.50439453125, -4.917236328125, -4.330078125, -3.742919921875, -3.15576171875, -2.568603515625, -1.9814453125, -1.394287109375, -0.80712890625, -0.219970703125, 0.3671875, 0.954345703125, 1.54150390625, 2.128662109375, 2.7158203125, 3.302978515625, 3.89013671875, 4.477294921875, 5.064453125, 5.651611328125, 6.23876953125, 6.825927734375, 7.4130859375, 8.000244140625, 8.58740234375, 9.174560546875, 9.76171875, 10.348876953125, 10.93603515625, 11.523193359375, 12.1103515625, 12.697509765625, 13.28466796875, 13.871826171875, 14.458984375, 15.046142578125, 15.63330078125, 16.220458984375, 16.8076171875, 17.394775390625, 17.98193359375, 18.569091796875, 19.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 8.0, 10.0, 9.0, 21.0, 18.0, 27.0, 22.0, 48.0, 32.0, 36.0, 33.0, 43.0, 56.0, 66.0, 66.0, 76.0, 72.0, 43.0, 50.0, 35.0, 31.0, 29.0, 23.0, 23.0, 15.0, 17.0, 11.0, 16.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6851806640625, -4.550048828125, -4.4149169921875, -4.27978515625, -4.1446533203125, -4.009521484375, -3.8743896484375, -3.7392578125, -3.6041259765625, -3.468994140625, -3.3338623046875, -3.19873046875, -3.0635986328125, -2.928466796875, -2.7933349609375, -2.658203125, -2.5230712890625, -2.387939453125, -2.2528076171875, -2.11767578125, -1.9825439453125, -1.847412109375, -1.7122802734375, -1.5771484375, -1.4420166015625, -1.306884765625, -1.1717529296875, -1.03662109375, -0.9014892578125, -0.766357421875, -0.6312255859375, -0.49609375, -0.3609619140625, -0.225830078125, -0.0906982421875, 0.04443359375, 0.1795654296875, 0.314697265625, 0.4498291015625, 0.5849609375, 0.7200927734375, 0.855224609375, 0.9903564453125, 1.12548828125, 1.2606201171875, 1.395751953125, 1.5308837890625, 1.666015625, 1.8011474609375, 1.936279296875, 2.0714111328125, 2.20654296875, 2.3416748046875, 2.476806640625, 2.6119384765625, 2.7470703125, 2.8822021484375, 3.017333984375, 3.1524658203125, 3.28759765625, 3.4227294921875, 3.557861328125, 3.6929931640625, 3.828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 15.0, 17.0, 21.0, 18.0, 25.0, 22.0, 46.0, 51.0, 50.0, 70.0, 55.0, 73.0, 67.0, 78.0, 55.0, 55.0, 45.0, 41.0, 35.0, 27.0, 29.0, 24.0, 10.0, 16.0, 10.0, 7.0, 6.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.27734375, -35.90780258178711, -34.53826141357422, -33.16872024536133, -31.799179077148438, -30.429637908935547, -29.060096740722656, -27.690555572509766, -26.321014404296875, -24.951473236083984, -23.581932067871094, -22.212390899658203, -20.842849731445312, -19.473308563232422, -18.10376739501953, -16.73422622680664, -15.36468505859375, -13.99514389038086, -12.625602722167969, -11.256061553955078, -9.886520385742188, -8.516979217529297, -7.147438049316406, -5.777896881103516, -4.408355712890625, -3.0388145446777344, -1.6692733764648438, -0.2997322082519531, 1.0698089599609375, 2.439350128173828, 3.8088912963867188, 5.178432464599609, 6.547977447509766, 7.917518615722656, 9.287059783935547, 10.656600952148438, 12.026142120361328, 13.395683288574219, 14.76522445678711, 16.134765625, 17.50430679321289, 18.87384796142578, 20.243389129638672, 21.612930297851562, 22.982471466064453, 24.352012634277344, 25.721553802490234, 27.091094970703125, 28.460636138916016, 29.830177307128906, 31.199718475341797, 32.56925964355469, 33.93880081176758, 35.30834197998047, 36.67788314819336, 38.04742431640625, 39.41696548461914, 40.78650665283203, 42.15604782104492, 43.52558898925781, 44.8951301574707, 46.264671325683594, 47.634212493896484, 49.003753662109375, 50.373294830322266]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 2.0, 4.0, 6.0, 10.0, 12.0, 10.0, 9.0, 18.0, 19.0, 27.0, 33.0, 23.0, 26.0, 27.0, 34.0, 36.0, 32.0, 46.0, 47.0, 40.0, 29.0, 44.0, 40.0, 43.0, 45.0, 28.0, 32.0, 41.0, 38.0, 25.0, 27.0, 24.0, 13.0, 26.0, 18.0, 12.0, 9.0, 6.0, 7.0, 8.0, 5.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.34229278564453, -36.2725944519043, -35.20289611816406, -34.13319778442383, -33.063499450683594, -31.993799209594727, -30.924100875854492, -29.854402542114258, -28.78470230102539, -27.715003967285156, -26.645305633544922, -25.575607299804688, -24.50590705871582, -23.436208724975586, -22.36651039123535, -21.296812057495117, -20.227113723754883, -19.15741539001465, -18.087717056274414, -17.018016815185547, -15.948318481445312, -14.878620147705078, -13.808921813964844, -12.73922348022461, -11.669524192810059, -10.599825859069824, -9.530126571655273, -8.460428237915039, -7.3907294273376465, -6.321030616760254, -5.2513322830200195, -4.181633472442627, -3.1119327545166016, -2.042233943939209, -0.9725353717803955, 0.09716320037841797, 1.1668620109558105, 2.236560821533203, 3.3062591552734375, 4.37595796585083, 5.445656776428223, 6.515355587005615, 7.585054397583008, 8.654752731323242, 9.724451065063477, 10.794150352478027, 11.863848686218262, 12.933547973632812, 14.003246307373047, 15.072944641113281, 16.142642974853516, 17.21234130859375, 18.282041549682617, 19.35173988342285, 20.421438217163086, 21.49113655090332, 22.560836791992188, 23.630535125732422, 24.700233459472656, 25.76993179321289, 26.839632034301758, 27.909330368041992, 28.979028701782227, 30.04872703552246, 31.118425369262695]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 15.0, 25.0, 30.0, 40.0, 73.0, 131.0, 176.0, 270.0, 404.0, 613.0, 960.0, 1434.0, 2209.0, 3379.0, 5078.0, 7926.0, 12431.0, 20153.0, 33511.0, 59514.0, 119271.0, 311421.0, 838834.0, 1337144.0, 858503.0, 316341.0, 119757.0, 58782.0, 32842.0, 19275.0, 11914.0, 7573.0, 4867.0, 3185.0, 2064.0, 1387.0, 890.0, 565.0, 411.0, 273.0, 200.0, 143.0, 70.0, 57.0, 44.0, 20.0, 19.0, 10.0, 14.0, 11.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.8125, -36.57275390625, -35.3330078125, -34.09326171875, -32.853515625, -31.61376953125, -30.3740234375, -29.13427734375, -27.89453125, -26.65478515625, -25.4150390625, -24.17529296875, -22.935546875, -21.69580078125, -20.4560546875, -19.21630859375, -17.9765625, -16.73681640625, -15.4970703125, -14.25732421875, -13.017578125, -11.77783203125, -10.5380859375, -9.29833984375, -8.05859375, -6.81884765625, -5.5791015625, -4.33935546875, -3.099609375, -1.85986328125, -0.6201171875, 0.61962890625, 1.859375, 3.09912109375, 4.3388671875, 5.57861328125, 6.818359375, 8.05810546875, 9.2978515625, 10.53759765625, 11.77734375, 13.01708984375, 14.2568359375, 15.49658203125, 16.736328125, 17.97607421875, 19.2158203125, 20.45556640625, 21.6953125, 22.93505859375, 24.1748046875, 25.41455078125, 26.654296875, 27.89404296875, 29.1337890625, 30.37353515625, 31.61328125, 32.85302734375, 34.0927734375, 35.33251953125, 36.572265625, 37.81201171875, 39.0517578125, 40.29150390625, 41.53125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 18.0, 15.0, 18.0, 11.0, 24.0, 24.0, 27.0, 33.0, 31.0, 41.0, 33.0, 31.0, 51.0, 41.0, 39.0, 38.0, 40.0, 50.0, 37.0, 33.0, 30.0, 41.0, 31.0, 38.0, 30.0, 29.0, 18.0, 18.0, 17.0, 15.0, 14.0, 12.0, 10.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.47021484375, -26.5810546875, -25.69189453125, -24.802734375, -23.91357421875, -23.0244140625, -22.13525390625, -21.24609375, -20.35693359375, -19.4677734375, -18.57861328125, -17.689453125, -16.80029296875, -15.9111328125, -15.02197265625, -14.1328125, -13.24365234375, -12.3544921875, -11.46533203125, -10.576171875, -9.68701171875, -8.7978515625, -7.90869140625, -7.01953125, -6.13037109375, -5.2412109375, -4.35205078125, -3.462890625, -2.57373046875, -1.6845703125, -0.79541015625, 0.09375, 0.98291015625, 1.8720703125, 2.76123046875, 3.650390625, 4.53955078125, 5.4287109375, 6.31787109375, 7.20703125, 8.09619140625, 8.9853515625, 9.87451171875, 10.763671875, 11.65283203125, 12.5419921875, 13.43115234375, 14.3203125, 15.20947265625, 16.0986328125, 16.98779296875, 17.876953125, 18.76611328125, 19.6552734375, 20.54443359375, 21.43359375, 22.32275390625, 23.2119140625, 24.10107421875, 24.990234375, 25.87939453125, 26.7685546875, 27.65771484375, 28.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 30.0, 29.0, 43.0, 65.0, 84.0, 174.0, 242.0, 407.0, 668.0, 1123.0, 1861.0, 3152.0, 5618.0, 9926.0, 17822.0, 33271.0, 65933.0, 138641.0, 323027.0, 909416.0, 1632692.0, 601930.0, 232897.0, 104413.0, 50886.0, 26461.0, 14313.0, 7961.0, 4514.0, 2674.0, 1498.0, 940.0, 571.0, 333.0, 238.0, 142.0, 87.0, 55.0, 32.0, 24.0, 20.0, 8.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-53.8125, -52.197265625, -50.58203125, -48.966796875, -47.3515625, -45.736328125, -44.12109375, -42.505859375, -40.890625, -39.275390625, -37.66015625, -36.044921875, -34.4296875, -32.814453125, -31.19921875, -29.583984375, -27.96875, -26.353515625, -24.73828125, -23.123046875, -21.5078125, -19.892578125, -18.27734375, -16.662109375, -15.046875, -13.431640625, -11.81640625, -10.201171875, -8.5859375, -6.970703125, -5.35546875, -3.740234375, -2.125, -0.509765625, 1.10546875, 2.720703125, 4.3359375, 5.951171875, 7.56640625, 9.181640625, 10.796875, 12.412109375, 14.02734375, 15.642578125, 17.2578125, 18.873046875, 20.48828125, 22.103515625, 23.71875, 25.333984375, 26.94921875, 28.564453125, 30.1796875, 31.794921875, 33.41015625, 35.025390625, 36.640625, 38.255859375, 39.87109375, 41.486328125, 43.1015625, 44.716796875, 46.33203125, 47.947265625, 49.5625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 12.0, 20.0, 30.0, 26.0, 39.0, 52.0, 78.0, 87.0, 139.0, 186.0, 265.0, 282.0, 361.0, 485.0, 442.0, 386.0, 290.0, 208.0, 168.0, 105.0, 93.0, 82.0, 40.0, 36.0, 33.0, 34.0, 23.0, 17.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.171875, -19.59375, -19.015625, -18.4375, -17.859375, -17.28125, -16.703125, -16.125, -15.546875, -14.96875, -14.390625, -13.8125, -13.234375, -12.65625, -12.078125, -11.5, -10.921875, -10.34375, -9.765625, -9.1875, -8.609375, -8.03125, -7.453125, -6.875, -6.296875, -5.71875, -5.140625, -4.5625, -3.984375, -3.40625, -2.828125, -2.25, -1.671875, -1.09375, -0.515625, 0.0625, 0.640625, 1.21875, 1.796875, 2.375, 2.953125, 3.53125, 4.109375, 4.6875, 5.265625, 5.84375, 6.421875, 7.0, 7.578125, 8.15625, 8.734375, 9.3125, 9.890625, 10.46875, 11.046875, 11.625, 12.203125, 12.78125, 13.359375, 13.9375, 14.515625, 15.09375, 15.671875, 16.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 22.0, 13.0, 22.0, 19.0, 33.0, 44.0, 56.0, 49.0, 54.0, 68.0, 65.0, 66.0, 77.0, 54.0, 48.0, 45.0, 45.0, 32.0, 37.0, 19.0, 20.0, 13.0, 7.0, 14.0, 5.0, 8.0, 3.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.2828483581543, -34.0324592590332, -32.78207015991211, -31.53168296813965, -30.281293869018555, -29.03090476989746, -27.780517578125, -26.530128479003906, -25.279739379882812, -24.02935028076172, -22.778961181640625, -21.528573989868164, -20.27818489074707, -19.027795791625977, -17.777408599853516, -16.527019500732422, -15.276630401611328, -14.026241302490234, -12.775853157043457, -11.52546501159668, -10.275075912475586, -9.024686813354492, -7.774298667907715, -6.5239105224609375, -5.273521423339844, -4.023132801055908, -2.7727441787719727, -1.522355556488037, -0.27196693420410156, 0.978421688079834, 2.2288103103637695, 3.479198455810547, 4.729587554931641, 5.979976177215576, 7.230364799499512, 8.480752944946289, 9.731142044067383, 10.981531143188477, 12.231919288635254, 13.482307434082031, 14.732696533203125, 15.983085632324219, 17.233474731445312, 18.483861923217773, 19.734251022338867, 20.98464012145996, 22.235027313232422, 23.485416412353516, 24.73580551147461, 25.986194610595703, 27.236583709716797, 28.486970901489258, 29.73736000061035, 30.987749099731445, 32.238136291503906, 33.488525390625, 34.738914489746094, 35.98930358886719, 37.23969268798828, 38.490081787109375, 39.74047088623047, 40.9908561706543, 42.24124526977539, 43.491634368896484, 44.74202346801758]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 9.0, 11.0, 18.0, 15.0, 21.0, 21.0, 16.0, 26.0, 22.0, 25.0, 27.0, 29.0, 33.0, 32.0, 35.0, 37.0, 36.0, 43.0, 41.0, 42.0, 27.0, 32.0, 39.0, 48.0, 28.0, 24.0, 42.0, 31.0, 19.0, 17.0, 24.0, 19.0, 15.0, 19.0, 10.0, 10.0, 3.0, 9.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.321773529052734, -30.385770797729492, -29.44976806640625, -28.513765335083008, -27.577762603759766, -26.641759872436523, -25.70575714111328, -24.76975440979004, -23.833751678466797, -22.897748947143555, -21.961746215820312, -21.02574348449707, -20.089740753173828, -19.153738021850586, -18.217735290527344, -17.2817325592041, -16.34572982788086, -15.409727096557617, -14.473724365234375, -13.537721633911133, -12.60171890258789, -11.665716171264648, -10.729713439941406, -9.793710708618164, -8.857709884643555, -7.9217071533203125, -6.98570442199707, -6.049701690673828, -5.113698959350586, -4.177696704864502, -3.2416939735412598, -2.3056912422180176, -1.3696880340576172, -0.4336853623390198, 0.5023173093795776, 1.4383199214935303, 2.3743226528167725, 3.3103251457214355, 4.246327877044678, 5.18233060836792, 6.118333339691162, 7.054336071014404, 7.9903388023376465, 8.92634105682373, 9.862343788146973, 10.798346519470215, 11.734349250793457, 12.6703519821167, 13.606354713439941, 14.542357444763184, 15.478360176086426, 16.41436195373535, 17.350364685058594, 18.286367416381836, 19.222370147705078, 20.15837287902832, 21.094375610351562, 22.030378341674805, 22.966381072998047, 23.90238380432129, 24.83838653564453, 25.774389266967773, 26.710391998291016, 27.646394729614258, 28.5823974609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 10.0, 18.0, 18.0, 23.0, 59.0, 69.0, 131.0, 246.0, 431.0, 773.0, 1331.0, 2332.0, 4549.0, 8796.0, 18500.0, 43790.0, 125115.0, 399205.0, 291256.0, 88913.0, 33156.0, 14435.0, 7031.0, 3709.0, 2040.0, 1072.0, 673.0, 362.0, 191.0, 117.0, 63.0, 42.0, 28.0, 16.0, 13.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.625, -80.25390625, -77.8828125, -75.51171875, -73.140625, -70.76953125, -68.3984375, -66.02734375, -63.65625, -61.28515625, -58.9140625, -56.54296875, -54.171875, -51.80078125, -49.4296875, -47.05859375, -44.6875, -42.31640625, -39.9453125, -37.57421875, -35.203125, -32.83203125, -30.4609375, -28.08984375, -25.71875, -23.34765625, -20.9765625, -18.60546875, -16.234375, -13.86328125, -11.4921875, -9.12109375, -6.75, -4.37890625, -2.0078125, 0.36328125, 2.734375, 5.10546875, 7.4765625, 9.84765625, 12.21875, 14.58984375, 16.9609375, 19.33203125, 21.703125, 24.07421875, 26.4453125, 28.81640625, 31.1875, 33.55859375, 35.9296875, 38.30078125, 40.671875, 43.04296875, 45.4140625, 47.78515625, 50.15625, 52.52734375, 54.8984375, 57.26953125, 59.640625, 62.01171875, 64.3828125, 66.75390625, 69.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 21.0, 12.0, 17.0, 22.0, 14.0, 16.0, 20.0, 20.0, 28.0, 31.0, 39.0, 29.0, 43.0, 41.0, 41.0, 35.0, 37.0, 41.0, 49.0, 30.0, 25.0, 46.0, 36.0, 31.0, 39.0, 34.0, 23.0, 18.0, 12.0, 18.0, 25.0, 11.0, 13.0, 11.0, 11.0, 2.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-31.828125, -30.891845703125, -29.95556640625, -29.019287109375, -28.0830078125, -27.146728515625, -26.21044921875, -25.274169921875, -24.337890625, -23.401611328125, -22.46533203125, -21.529052734375, -20.5927734375, -19.656494140625, -18.72021484375, -17.783935546875, -16.84765625, -15.911376953125, -14.97509765625, -14.038818359375, -13.1025390625, -12.166259765625, -11.22998046875, -10.293701171875, -9.357421875, -8.421142578125, -7.48486328125, -6.548583984375, -5.6123046875, -4.676025390625, -3.73974609375, -2.803466796875, -1.8671875, -0.930908203125, 0.00537109375, 0.941650390625, 1.8779296875, 2.814208984375, 3.75048828125, 4.686767578125, 5.623046875, 6.559326171875, 7.49560546875, 8.431884765625, 9.3681640625, 10.304443359375, 11.24072265625, 12.177001953125, 13.11328125, 14.049560546875, 14.98583984375, 15.922119140625, 16.8583984375, 17.794677734375, 18.73095703125, 19.667236328125, 20.603515625, 21.539794921875, 22.47607421875, 23.412353515625, 24.3486328125, 25.284912109375, 26.22119140625, 27.157470703125, 28.09375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 7.0, 18.0, 25.0, 33.0, 66.0, 93.0, 105.0, 153.0, 232.0, 335.0, 444.0, 695.0, 963.0, 1489.0, 2329.0, 3883.0, 6533.0, 11740.0, 21125.0, 42824.0, 94243.0, 252209.0, 353056.0, 134892.0, 57377.0, 27909.0, 14417.0, 8135.0, 4753.0, 2976.0, 1858.0, 1141.0, 770.0, 495.0, 367.0, 271.0, 165.0, 107.0, 93.0, 51.0, 45.0, 28.0, 24.0, 25.0, 9.0, 9.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-57.90625, -56.0498046875, -54.193359375, -52.3369140625, -50.48046875, -48.6240234375, -46.767578125, -44.9111328125, -43.0546875, -41.1982421875, -39.341796875, -37.4853515625, -35.62890625, -33.7724609375, -31.916015625, -30.0595703125, -28.203125, -26.3466796875, -24.490234375, -22.6337890625, -20.77734375, -18.9208984375, -17.064453125, -15.2080078125, -13.3515625, -11.4951171875, -9.638671875, -7.7822265625, -5.92578125, -4.0693359375, -2.212890625, -0.3564453125, 1.5, 3.3564453125, 5.212890625, 7.0693359375, 8.92578125, 10.7822265625, 12.638671875, 14.4951171875, 16.3515625, 18.2080078125, 20.064453125, 21.9208984375, 23.77734375, 25.6337890625, 27.490234375, 29.3466796875, 31.203125, 33.0595703125, 34.916015625, 36.7724609375, 38.62890625, 40.4853515625, 42.341796875, 44.1982421875, 46.0546875, 47.9111328125, 49.767578125, 51.6240234375, 53.48046875, 55.3369140625, 57.193359375, 59.0498046875, 60.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 4.0, 12.0, 10.0, 12.0, 10.0, 14.0, 14.0, 27.0, 35.0, 27.0, 27.0, 25.0, 33.0, 34.0, 36.0, 35.0, 39.0, 45.0, 46.0, 43.0, 39.0, 39.0, 42.0, 38.0, 39.0, 35.0, 27.0, 29.0, 20.0, 36.0, 22.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.5, -19.8662109375, -19.232421875, -18.5986328125, -17.96484375, -17.3310546875, -16.697265625, -16.0634765625, -15.4296875, -14.7958984375, -14.162109375, -13.5283203125, -12.89453125, -12.2607421875, -11.626953125, -10.9931640625, -10.359375, -9.7255859375, -9.091796875, -8.4580078125, -7.82421875, -7.1904296875, -6.556640625, -5.9228515625, -5.2890625, -4.6552734375, -4.021484375, -3.3876953125, -2.75390625, -2.1201171875, -1.486328125, -0.8525390625, -0.21875, 0.4150390625, 1.048828125, 1.6826171875, 2.31640625, 2.9501953125, 3.583984375, 4.2177734375, 4.8515625, 5.4853515625, 6.119140625, 6.7529296875, 7.38671875, 8.0205078125, 8.654296875, 9.2880859375, 9.921875, 10.5556640625, 11.189453125, 11.8232421875, 12.45703125, 13.0908203125, 13.724609375, 14.3583984375, 14.9921875, 15.6259765625, 16.259765625, 16.8935546875, 17.52734375, 18.1611328125, 18.794921875, 19.4287109375, 20.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 11.0, 21.0, 16.0, 30.0, 40.0, 68.0, 56.0, 100.0, 138.0, 202.0, 278.0, 390.0, 620.0, 882.0, 1305.0, 2034.0, 3204.0, 5279.0, 9869.0, 21683.0, 67695.0, 369025.0, 437182.0, 78303.0, 24045.0, 10669.0, 5643.0, 3262.0, 2040.0, 1345.0, 913.0, 611.0, 424.0, 308.0, 233.0, 182.0, 131.0, 82.0, 74.0, 42.0, 27.0, 20.0, 13.0, 14.0, 12.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.8125, -25.948974609375, -25.08544921875, -24.221923828125, -23.3583984375, -22.494873046875, -21.63134765625, -20.767822265625, -19.904296875, -19.040771484375, -18.17724609375, -17.313720703125, -16.4501953125, -15.586669921875, -14.72314453125, -13.859619140625, -12.99609375, -12.132568359375, -11.26904296875, -10.405517578125, -9.5419921875, -8.678466796875, -7.81494140625, -6.951416015625, -6.087890625, -5.224365234375, -4.36083984375, -3.497314453125, -2.6337890625, -1.770263671875, -0.90673828125, -0.043212890625, 0.8203125, 1.683837890625, 2.54736328125, 3.410888671875, 4.2744140625, 5.137939453125, 6.00146484375, 6.864990234375, 7.728515625, 8.592041015625, 9.45556640625, 10.319091796875, 11.1826171875, 12.046142578125, 12.90966796875, 13.773193359375, 14.63671875, 15.500244140625, 16.36376953125, 17.227294921875, 18.0908203125, 18.954345703125, 19.81787109375, 20.681396484375, 21.544921875, 22.408447265625, 23.27197265625, 24.135498046875, 24.9990234375, 25.862548828125, 26.72607421875, 27.589599609375, 28.453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 4.0, 8.0, 9.0, 22.0, 45.0, 80.0, 138.0, 200.0, 193.0, 116.0, 68.0, 43.0, 28.0, 11.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003154754638671875, -0.0030614733695983887, -0.0029681921005249023, -0.002874910831451416, -0.0027816295623779297, -0.0026883482933044434, -0.002595067024230957, -0.0025017857551574707, -0.0024085044860839844, -0.002315223217010498, -0.0022219419479370117, -0.0021286606788635254, -0.002035379409790039, -0.0019420981407165527, -0.0018488168716430664, -0.00175553560256958, -0.0016622543334960938, -0.0015689730644226074, -0.001475691795349121, -0.0013824105262756348, -0.0012891292572021484, -0.0011958479881286621, -0.0011025667190551758, -0.0010092854499816895, -0.0009160041809082031, -0.0008227229118347168, -0.0007294416427612305, -0.0006361603736877441, -0.0005428791046142578, -0.0004495978355407715, -0.00035631656646728516, -0.00026303529739379883, -0.0001697540283203125, -7.647275924682617e-05, 1.6808509826660156e-05, 0.00011008977890014648, 0.0002033710479736328, 0.00029665231704711914, 0.00038993358612060547, 0.0004832148551940918, 0.0005764961242675781, 0.0006697773933410645, 0.0007630586624145508, 0.0008563399314880371, 0.0009496212005615234, 0.0010429024696350098, 0.001136183738708496, 0.0012294650077819824, 0.0013227462768554688, 0.001416027545928955, 0.0015093088150024414, 0.0016025900840759277, 0.001695871353149414, 0.0017891526222229004, 0.0018824338912963867, 0.001975715160369873, 0.0020689964294433594, 0.0021622776985168457, 0.002255558967590332, 0.0023488402366638184, 0.0024421215057373047, 0.002535402774810791, 0.0026286840438842773, 0.0027219653129577637, 0.00281524658203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 11.0, 25.0, 34.0, 37.0, 61.0, 115.0, 145.0, 222.0, 362.0, 554.0, 903.0, 1332.0, 2044.0, 3206.0, 5177.0, 8702.0, 17189.0, 41884.0, 147818.0, 495454.0, 219652.0, 56002.0, 21168.0, 10435.0, 5876.0, 3680.0, 2288.0, 1525.0, 924.0, 600.0, 401.0, 242.0, 191.0, 110.0, 49.0, 46.0, 25.0, 27.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.90625, -31.9560546875, -31.005859375, -30.0556640625, -29.10546875, -28.1552734375, -27.205078125, -26.2548828125, -25.3046875, -24.3544921875, -23.404296875, -22.4541015625, -21.50390625, -20.5537109375, -19.603515625, -18.6533203125, -17.703125, -16.7529296875, -15.802734375, -14.8525390625, -13.90234375, -12.9521484375, -12.001953125, -11.0517578125, -10.1015625, -9.1513671875, -8.201171875, -7.2509765625, -6.30078125, -5.3505859375, -4.400390625, -3.4501953125, -2.5, -1.5498046875, -0.599609375, 0.3505859375, 1.30078125, 2.2509765625, 3.201171875, 4.1513671875, 5.1015625, 6.0517578125, 7.001953125, 7.9521484375, 8.90234375, 9.8525390625, 10.802734375, 11.7529296875, 12.703125, 13.6533203125, 14.603515625, 15.5537109375, 16.50390625, 17.4541015625, 18.404296875, 19.3544921875, 20.3046875, 21.2548828125, 22.205078125, 23.1552734375, 24.10546875, 25.0556640625, 26.005859375, 26.9560546875, 27.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 10.0, 13.0, 23.0, 30.0, 41.0, 55.0, 89.0, 108.0, 109.0, 96.0, 91.0, 67.0, 57.0, 38.0, 26.0, 17.0, 17.0, 8.0, 11.0, 11.0, 3.0, 8.0, 3.0, 6.0, 4.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-8.8984375, -8.649658203125, -8.40087890625, -8.152099609375, -7.9033203125, -7.654541015625, -7.40576171875, -7.156982421875, -6.908203125, -6.659423828125, -6.41064453125, -6.161865234375, -5.9130859375, -5.664306640625, -5.41552734375, -5.166748046875, -4.91796875, -4.669189453125, -4.42041015625, -4.171630859375, -3.9228515625, -3.674072265625, -3.42529296875, -3.176513671875, -2.927734375, -2.678955078125, -2.43017578125, -2.181396484375, -1.9326171875, -1.683837890625, -1.43505859375, -1.186279296875, -0.9375, -0.688720703125, -0.43994140625, -0.191162109375, 0.0576171875, 0.306396484375, 0.55517578125, 0.803955078125, 1.052734375, 1.301513671875, 1.55029296875, 1.799072265625, 2.0478515625, 2.296630859375, 2.54541015625, 2.794189453125, 3.04296875, 3.291748046875, 3.54052734375, 3.789306640625, 4.0380859375, 4.286865234375, 4.53564453125, 4.784423828125, 5.033203125, 5.281982421875, 5.53076171875, 5.779541015625, 6.0283203125, 6.277099609375, 6.52587890625, 6.774658203125, 7.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 10.0, 15.0, 11.0, 10.0, 20.0, 19.0, 24.0, 34.0, 38.0, 44.0, 58.0, 62.0, 66.0, 58.0, 65.0, 64.0, 58.0, 57.0, 53.0, 39.0, 35.0, 26.0, 25.0, 17.0, 9.0, 14.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.382720947265625, -27.211339950561523, -26.03995704650879, -24.868576049804688, -23.697195053100586, -22.525814056396484, -21.35443115234375, -20.18305015563965, -19.011669158935547, -17.840288162231445, -16.66890525817871, -15.49752426147461, -14.326143264770508, -13.15476131439209, -11.983379364013672, -10.81199836730957, -9.640615463256836, -8.469233512878418, -7.297852516174316, -6.126470565795898, -4.955089092254639, -3.783707618713379, -2.612325668334961, -1.4409446716308594, -0.2695627212524414, 0.9018188714981079, 2.0732004642486572, 3.244582176208496, 4.415963649749756, 5.587345123291016, 6.758727073669434, 7.930108070373535, 9.101490020751953, 10.272871971130371, 11.444252967834473, 12.61563491821289, 13.787015914916992, 14.95839786529541, 16.129779815673828, 17.30116081237793, 18.47254180908203, 19.643922805786133, 20.815305709838867, 21.98668670654297, 23.15806770324707, 24.329448699951172, 25.500831604003906, 26.672212600708008, 27.843595504760742, 29.014976501464844, 30.186359405517578, 31.35774040222168, 32.52912139892578, 33.700504302978516, 34.87188720703125, 36.04326629638672, 37.21464920043945, 38.38603210449219, 39.557411193847656, 40.72879409790039, 41.900177001953125, 43.071556091308594, 44.24293899536133, 45.41432189941406, 46.58570098876953]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 3.0, 8.0, 8.0, 11.0, 12.0, 16.0, 17.0, 13.0, 21.0, 13.0, 31.0, 23.0, 34.0, 36.0, 17.0, 39.0, 30.0, 36.0, 36.0, 42.0, 35.0, 31.0, 45.0, 34.0, 25.0, 27.0, 37.0, 42.0, 33.0, 29.0, 22.0, 21.0, 22.0, 21.0, 22.0, 15.0, 14.0, 13.0, 11.0, 6.0, 12.0, 8.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-28.52808380126953, -27.666709899902344, -26.80533790588379, -25.9439640045166, -25.082592010498047, -24.22121810913086, -23.359844207763672, -22.498472213745117, -21.63709831237793, -20.775724411010742, -19.914352416992188, -19.052978515625, -18.191606521606445, -17.330232620239258, -16.468860626220703, -15.607486724853516, -14.746113777160645, -13.884740829467773, -13.023367881774902, -12.161994934082031, -11.300621032714844, -10.439248085021973, -9.577875137329102, -8.716501235961914, -7.855128765106201, -6.99375581741333, -6.132382392883301, -5.27100944519043, -4.409636497497559, -3.5482630729675293, -2.686890125274658, -1.825516700744629, -0.9641437530517578, -0.10277062654495239, 0.758602499961853, 1.6199755668640137, 2.481348752975464, 3.342721939086914, 4.204094886779785, 5.0654683113098145, 5.9268412590026855, 6.788214206695557, 7.649587631225586, 8.510960578918457, 9.372333526611328, 10.233707427978516, 11.09507942199707, 11.956453323364258, 12.817826271057129, 13.67919921875, 14.540572166442871, 15.401945114135742, 16.26331901550293, 17.124691009521484, 17.986064910888672, 18.84743881225586, 19.708810806274414, 20.5701847076416, 21.431556701660156, 22.292930603027344, 23.1543025970459, 24.015676498413086, 24.87704849243164, 25.738422393798828, 26.599796295166016]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 13.0, 35.0, 46.0, 55.0, 85.0, 152.0, 186.0, 289.0, 373.0, 546.0, 788.0, 1116.0, 1635.0, 2256.0, 3115.0, 4468.0, 6286.0, 9171.0, 13442.0, 19462.0, 28856.0, 43676.0, 64935.0, 98087.0, 139287.0, 164778.0, 141518.0, 99244.0, 66553.0, 44216.0, 29190.0, 19888.0, 13351.0, 9428.0, 6588.0, 4575.0, 3161.0, 2293.0, 1555.0, 1148.0, 852.0, 533.0, 388.0, 281.0, 191.0, 128.0, 103.0, 63.0, 45.0, 36.0, 17.0, 9.0, 14.0, 5.0, 3.0, 4.0, 4.0, 3.0], "bins": [-29.28125, -28.352294921875, -27.42333984375, -26.494384765625, -25.5654296875, -24.636474609375, -23.70751953125, -22.778564453125, -21.849609375, -20.920654296875, -19.99169921875, -19.062744140625, -18.1337890625, -17.204833984375, -16.27587890625, -15.346923828125, -14.41796875, -13.489013671875, -12.56005859375, -11.631103515625, -10.7021484375, -9.773193359375, -8.84423828125, -7.915283203125, -6.986328125, -6.057373046875, -5.12841796875, -4.199462890625, -3.2705078125, -2.341552734375, -1.41259765625, -0.483642578125, 0.4453125, 1.374267578125, 2.30322265625, 3.232177734375, 4.1611328125, 5.090087890625, 6.01904296875, 6.947998046875, 7.876953125, 8.805908203125, 9.73486328125, 10.663818359375, 11.5927734375, 12.521728515625, 13.45068359375, 14.379638671875, 15.30859375, 16.237548828125, 17.16650390625, 18.095458984375, 19.0244140625, 19.953369140625, 20.88232421875, 21.811279296875, 22.740234375, 23.669189453125, 24.59814453125, 25.527099609375, 26.4560546875, 27.385009765625, 28.31396484375, 29.242919921875, 30.171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 15.0, 12.0, 16.0, 17.0, 11.0, 13.0, 27.0, 19.0, 28.0, 34.0, 36.0, 27.0, 29.0, 43.0, 36.0, 34.0, 32.0, 39.0, 30.0, 44.0, 31.0, 33.0, 29.0, 32.0, 36.0, 39.0, 37.0, 25.0, 26.0, 19.0, 14.0, 21.0, 14.0, 17.0, 11.0, 11.0, 5.0, 9.0, 12.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-27.1875, -26.344970703125, -25.50244140625, -24.659912109375, -23.8173828125, -22.974853515625, -22.13232421875, -21.289794921875, -20.447265625, -19.604736328125, -18.76220703125, -17.919677734375, -17.0771484375, -16.234619140625, -15.39208984375, -14.549560546875, -13.70703125, -12.864501953125, -12.02197265625, -11.179443359375, -10.3369140625, -9.494384765625, -8.65185546875, -7.809326171875, -6.966796875, -6.124267578125, -5.28173828125, -4.439208984375, -3.5966796875, -2.754150390625, -1.91162109375, -1.069091796875, -0.2265625, 0.615966796875, 1.45849609375, 2.301025390625, 3.1435546875, 3.986083984375, 4.82861328125, 5.671142578125, 6.513671875, 7.356201171875, 8.19873046875, 9.041259765625, 9.8837890625, 10.726318359375, 11.56884765625, 12.411376953125, 13.25390625, 14.096435546875, 14.93896484375, 15.781494140625, 16.6240234375, 17.466552734375, 18.30908203125, 19.151611328125, 19.994140625, 20.836669921875, 21.67919921875, 22.521728515625, 23.3642578125, 24.206787109375, 25.04931640625, 25.891845703125, 26.734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 14.0, 10.0, 21.0, 26.0, 50.0, 72.0, 102.0, 174.0, 274.0, 400.0, 641.0, 995.0, 1611.0, 2712.0, 4543.0, 7240.0, 12187.0, 21308.0, 37633.0, 69287.0, 128201.0, 216967.0, 228647.0, 140303.0, 76502.0, 41357.0, 23334.0, 13451.0, 8081.0, 4698.0, 2903.0, 1823.0, 1102.0, 721.0, 402.0, 262.0, 171.0, 103.0, 73.0, 46.0, 35.0, 28.0, 18.0, 13.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.53125, -43.05078125, -41.5703125, -40.08984375, -38.609375, -37.12890625, -35.6484375, -34.16796875, -32.6875, -31.20703125, -29.7265625, -28.24609375, -26.765625, -25.28515625, -23.8046875, -22.32421875, -20.84375, -19.36328125, -17.8828125, -16.40234375, -14.921875, -13.44140625, -11.9609375, -10.48046875, -9.0, -7.51953125, -6.0390625, -4.55859375, -3.078125, -1.59765625, -0.1171875, 1.36328125, 2.84375, 4.32421875, 5.8046875, 7.28515625, 8.765625, 10.24609375, 11.7265625, 13.20703125, 14.6875, 16.16796875, 17.6484375, 19.12890625, 20.609375, 22.08984375, 23.5703125, 25.05078125, 26.53125, 28.01171875, 29.4921875, 30.97265625, 32.453125, 33.93359375, 35.4140625, 36.89453125, 38.375, 39.85546875, 41.3359375, 42.81640625, 44.296875, 45.77734375, 47.2578125, 48.73828125, 50.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 9.0, 12.0, 10.0, 17.0, 21.0, 19.0, 22.0, 27.0, 36.0, 26.0, 39.0, 48.0, 39.0, 51.0, 42.0, 45.0, 48.0, 36.0, 49.0, 40.0, 51.0, 33.0, 34.0, 38.0, 22.0, 29.0, 18.0, 21.0, 19.0, 14.0, 8.0, 10.0, 11.0, 5.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.3125, -18.662353515625, -18.01220703125, -17.362060546875, -16.7119140625, -16.061767578125, -15.41162109375, -14.761474609375, -14.111328125, -13.461181640625, -12.81103515625, -12.160888671875, -11.5107421875, -10.860595703125, -10.21044921875, -9.560302734375, -8.91015625, -8.260009765625, -7.60986328125, -6.959716796875, -6.3095703125, -5.659423828125, -5.00927734375, -4.359130859375, -3.708984375, -3.058837890625, -2.40869140625, -1.758544921875, -1.1083984375, -0.458251953125, 0.19189453125, 0.842041015625, 1.4921875, 2.142333984375, 2.79248046875, 3.442626953125, 4.0927734375, 4.742919921875, 5.39306640625, 6.043212890625, 6.693359375, 7.343505859375, 7.99365234375, 8.643798828125, 9.2939453125, 9.944091796875, 10.59423828125, 11.244384765625, 11.89453125, 12.544677734375, 13.19482421875, 13.844970703125, 14.4951171875, 15.145263671875, 15.79541015625, 16.445556640625, 17.095703125, 17.745849609375, 18.39599609375, 19.046142578125, 19.6962890625, 20.346435546875, 20.99658203125, 21.646728515625, 22.296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 8.0, 10.0, 27.0, 42.0, 48.0, 88.0, 115.0, 188.0, 281.0, 481.0, 731.0, 1090.0, 1844.0, 3102.0, 5097.0, 9015.0, 15700.0, 28433.0, 52139.0, 98316.0, 183573.0, 255465.0, 179427.0, 96880.0, 51284.0, 28008.0, 15482.0, 8730.0, 5097.0, 3049.0, 1794.0, 1062.0, 676.0, 412.0, 283.0, 192.0, 123.0, 79.0, 65.0, 37.0, 20.0, 18.0, 13.0, 11.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.4908447265625, -12.036376953125, -11.5819091796875, -11.12744140625, -10.6729736328125, -10.218505859375, -9.7640380859375, -9.3095703125, -8.8551025390625, -8.400634765625, -7.9461669921875, -7.49169921875, -7.0372314453125, -6.582763671875, -6.1282958984375, -5.673828125, -5.2193603515625, -4.764892578125, -4.3104248046875, -3.85595703125, -3.4014892578125, -2.947021484375, -2.4925537109375, -2.0380859375, -1.5836181640625, -1.129150390625, -0.6746826171875, -0.22021484375, 0.2342529296875, 0.688720703125, 1.1431884765625, 1.59765625, 2.0521240234375, 2.506591796875, 2.9610595703125, 3.41552734375, 3.8699951171875, 4.324462890625, 4.7789306640625, 5.2333984375, 5.6878662109375, 6.142333984375, 6.5968017578125, 7.05126953125, 7.5057373046875, 7.960205078125, 8.4146728515625, 8.869140625, 9.3236083984375, 9.778076171875, 10.2325439453125, 10.68701171875, 11.1414794921875, 11.595947265625, 12.0504150390625, 12.5048828125, 12.9593505859375, 13.413818359375, 13.8682861328125, 14.32275390625, 14.7772216796875, 15.231689453125, 15.6861572265625, 16.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 8.0, 16.0, 17.0, 15.0, 22.0, 33.0, 42.0, 37.0, 56.0, 52.0, 68.0, 75.0, 76.0, 75.0, 62.0, 61.0, 49.0, 41.0, 33.0, 31.0, 18.0, 16.0, 17.0, 13.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012683868408203125, -0.0012215673923492432, -0.0011747479438781738, -0.0011279284954071045, -0.0010811090469360352, -0.0010342895984649658, -0.0009874701499938965, -0.0009406507015228271, -0.0008938312530517578, -0.0008470118045806885, -0.0008001923561096191, -0.0007533729076385498, -0.0007065534591674805, -0.0006597340106964111, -0.0006129145622253418, -0.0005660951137542725, -0.0005192756652832031, -0.0004724562168121338, -0.00042563676834106445, -0.0003788173198699951, -0.0003319978713989258, -0.00028517842292785645, -0.0002383589744567871, -0.00019153952598571777, -0.00014472007751464844, -9.79006290435791e-05, -5.1081180572509766e-05, -4.26173210144043e-06, 4.2557716369628906e-05, 8.937716484069824e-05, 0.00013619661331176758, 0.00018301606178283691, 0.00022983551025390625, 0.0002766549587249756, 0.0003234744071960449, 0.00037029385566711426, 0.0004171133041381836, 0.00046393275260925293, 0.0005107522010803223, 0.0005575716495513916, 0.0006043910980224609, 0.0006512105464935303, 0.0006980299949645996, 0.0007448494434356689, 0.0007916688919067383, 0.0008384883403778076, 0.000885307788848877, 0.0009321272373199463, 0.0009789466857910156, 0.001025766134262085, 0.0010725855827331543, 0.0011194050312042236, 0.001166224479675293, 0.0012130439281463623, 0.0012598633766174316, 0.001306682825088501, 0.0013535022735595703, 0.0014003217220306396, 0.001447141170501709, 0.0014939606189727783, 0.0015407800674438477, 0.001587599515914917, 0.0016344189643859863, 0.0016812384128570557, 0.001728057861328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 27.0, 28.0, 44.0, 85.0, 130.0, 198.0, 274.0, 434.0, 679.0, 1068.0, 1721.0, 2733.0, 4437.0, 7395.0, 12285.0, 20579.0, 35165.0, 60715.0, 104789.0, 173913.0, 216022.0, 166123.0, 100225.0, 56791.0, 33186.0, 19402.0, 11586.0, 6958.0, 4321.0, 2586.0, 1671.0, 1064.0, 678.0, 425.0, 227.0, 193.0, 116.0, 66.0, 61.0, 46.0, 21.0, 11.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9736328125, -10.587890625, -10.2021484375, -9.81640625, -9.4306640625, -9.044921875, -8.6591796875, -8.2734375, -7.8876953125, -7.501953125, -7.1162109375, -6.73046875, -6.3447265625, -5.958984375, -5.5732421875, -5.1875, -4.8017578125, -4.416015625, -4.0302734375, -3.64453125, -3.2587890625, -2.873046875, -2.4873046875, -2.1015625, -1.7158203125, -1.330078125, -0.9443359375, -0.55859375, -0.1728515625, 0.212890625, 0.5986328125, 0.984375, 1.3701171875, 1.755859375, 2.1416015625, 2.52734375, 2.9130859375, 3.298828125, 3.6845703125, 4.0703125, 4.4560546875, 4.841796875, 5.2275390625, 5.61328125, 5.9990234375, 6.384765625, 6.7705078125, 7.15625, 7.5419921875, 7.927734375, 8.3134765625, 8.69921875, 9.0849609375, 9.470703125, 9.8564453125, 10.2421875, 10.6279296875, 11.013671875, 11.3994140625, 11.78515625, 12.1708984375, 12.556640625, 12.9423828125, 13.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 4.0, 4.0, 10.0, 6.0, 11.0, 12.0, 24.0, 22.0, 25.0, 17.0, 30.0, 35.0, 39.0, 31.0, 41.0, 45.0, 65.0, 54.0, 64.0, 62.0, 52.0, 45.0, 38.0, 41.0, 39.0, 21.0, 18.0, 23.0, 13.0, 15.0, 15.0, 9.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-3.482421875, -3.3782958984375, -3.274169921875, -3.1700439453125, -3.06591796875, -2.9617919921875, -2.857666015625, -2.7535400390625, -2.6494140625, -2.5452880859375, -2.441162109375, -2.3370361328125, -2.23291015625, -2.1287841796875, -2.024658203125, -1.9205322265625, -1.81640625, -1.7122802734375, -1.608154296875, -1.5040283203125, -1.39990234375, -1.2957763671875, -1.191650390625, -1.0875244140625, -0.9833984375, -0.8792724609375, -0.775146484375, -0.6710205078125, -0.56689453125, -0.4627685546875, -0.358642578125, -0.2545166015625, -0.150390625, -0.0462646484375, 0.057861328125, 0.1619873046875, 0.26611328125, 0.3702392578125, 0.474365234375, 0.5784912109375, 0.6826171875, 0.7867431640625, 0.890869140625, 0.9949951171875, 1.09912109375, 1.2032470703125, 1.307373046875, 1.4114990234375, 1.515625, 1.6197509765625, 1.723876953125, 1.8280029296875, 1.93212890625, 2.0362548828125, 2.140380859375, 2.2445068359375, 2.3486328125, 2.4527587890625, 2.556884765625, 2.6610107421875, 2.76513671875, 2.8692626953125, 2.973388671875, 3.0775146484375, 3.181640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 2.0, 7.0, 13.0, 11.0, 12.0, 13.0, 24.0, 17.0, 23.0, 29.0, 39.0, 40.0, 58.0, 55.0, 57.0, 61.0, 72.0, 48.0, 47.0, 65.0, 43.0, 50.0, 34.0, 28.0, 20.0, 19.0, 16.0, 18.0, 12.0, 9.0, 10.0, 8.0, 5.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.04131317138672, -32.99440383911133, -31.947498321533203, -30.900588989257812, -29.853681564331055, -28.806774139404297, -27.759864807128906, -26.71295738220215, -25.66604995727539, -24.619142532348633, -23.572235107421875, -22.525325775146484, -21.478418350219727, -20.43151092529297, -19.384601593017578, -18.33769416809082, -17.290786743164062, -16.243879318237305, -15.19697093963623, -14.150062561035156, -13.103155136108398, -12.05624771118164, -11.009339332580566, -9.962430953979492, -8.915523529052734, -7.868615627288818, -6.821707725524902, -5.774799823760986, -4.72789192199707, -3.6809840202331543, -2.6340761184692383, -1.5871682167053223, -0.5402565002441406, 0.5066514015197754, 1.5535593032836914, 2.6004672050476074, 3.6473751068115234, 4.6942830085754395, 5.7411909103393555, 6.7880988121032715, 7.8350067138671875, 8.881914138793945, 9.92882251739502, 10.975730895996094, 12.022638320922852, 13.06954574584961, 14.116454124450684, 15.163362503051758, 16.210269927978516, 17.257177352905273, 18.30408477783203, 19.350994110107422, 20.39790153503418, 21.444808959960938, 22.491718292236328, 23.538625717163086, 24.585533142089844, 25.6324405670166, 26.67934799194336, 27.72625732421875, 28.773164749145508, 29.820072174072266, 30.866981506347656, 31.913888931274414, 32.96079635620117]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 5.0, 5.0, 9.0, 9.0, 7.0, 19.0, 13.0, 18.0, 18.0, 15.0, 17.0, 29.0, 27.0, 29.0, 31.0, 20.0, 28.0, 32.0, 26.0, 42.0, 27.0, 17.0, 32.0, 49.0, 33.0, 37.0, 40.0, 23.0, 34.0, 25.0, 24.0, 25.0, 20.0, 30.0, 12.0, 22.0, 20.0, 26.0, 15.0, 15.0, 16.0, 8.0, 9.0, 12.0, 5.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0], "bins": [-28.643796920776367, -27.812063217163086, -26.980331420898438, -26.148597717285156, -25.316865921020508, -24.485132217407227, -23.653400421142578, -22.821666717529297, -21.989933013916016, -21.158199310302734, -20.326467514038086, -19.494733810424805, -18.663002014160156, -17.831268310546875, -16.999534606933594, -16.167802810668945, -15.336071014404297, -14.504338264465332, -13.672605514526367, -12.840871810913086, -12.009140014648438, -11.177406311035156, -10.345673561096191, -9.513940811157227, -8.682208061218262, -7.850475311279297, -7.018742561340332, -6.187009334564209, -5.355276584625244, -4.523543834686279, -3.6918106079101562, -2.8600778579711914, -2.0283432006835938, -1.1966103315353394, -0.36487746238708496, 0.466855525970459, 1.2985882759094238, 2.1303210258483887, 2.9620542526245117, 3.7937870025634766, 4.625519752502441, 5.457252502441406, 6.288985252380371, 7.120718479156494, 7.952451229095459, 8.784183502197266, 9.615917205810547, 10.447649955749512, 11.279382705688477, 12.111115455627441, 12.942848205566406, 13.774581909179688, 14.606313705444336, 15.438047409057617, 16.269779205322266, 17.101512908935547, 17.933246612548828, 18.76498031616211, 19.596712112426758, 20.42844581604004, 21.260177612304688, 22.09191131591797, 22.92364501953125, 23.7553768157959, 24.587108612060547]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 15.0, 18.0, 16.0, 32.0, 45.0, 67.0, 97.0, 144.0, 213.0, 315.0, 481.0, 736.0, 1097.0, 1604.0, 2505.0, 3557.0, 5300.0, 8082.0, 12363.0, 20033.0, 32894.0, 58627.0, 120909.0, 315600.0, 795236.0, 1258741.0, 883546.0, 370366.0, 141137.0, 64482.0, 36005.0, 21425.0, 13309.0, 8588.0, 5509.0, 3633.0, 2464.0, 1677.0, 1186.0, 796.0, 487.0, 340.0, 211.0, 141.0, 73.0, 64.0, 42.0, 30.0, 20.0, 11.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-33.6875, -32.62060546875, -31.5537109375, -30.48681640625, -29.419921875, -28.35302734375, -27.2861328125, -26.21923828125, -25.15234375, -24.08544921875, -23.0185546875, -21.95166015625, -20.884765625, -19.81787109375, -18.7509765625, -17.68408203125, -16.6171875, -15.55029296875, -14.4833984375, -13.41650390625, -12.349609375, -11.28271484375, -10.2158203125, -9.14892578125, -8.08203125, -7.01513671875, -5.9482421875, -4.88134765625, -3.814453125, -2.74755859375, -1.6806640625, -0.61376953125, 0.453125, 1.52001953125, 2.5869140625, 3.65380859375, 4.720703125, 5.78759765625, 6.8544921875, 7.92138671875, 8.98828125, 10.05517578125, 11.1220703125, 12.18896484375, 13.255859375, 14.32275390625, 15.3896484375, 16.45654296875, 17.5234375, 18.59033203125, 19.6572265625, 20.72412109375, 21.791015625, 22.85791015625, 23.9248046875, 24.99169921875, 26.05859375, 27.12548828125, 28.1923828125, 29.25927734375, 30.326171875, 31.39306640625, 32.4599609375, 33.52685546875, 34.59375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 15.0, 14.0, 17.0, 23.0, 16.0, 19.0, 25.0, 24.0, 21.0, 29.0, 35.0, 22.0, 38.0, 25.0, 48.0, 28.0, 32.0, 37.0, 38.0, 34.0, 38.0, 34.0, 40.0, 28.0, 23.0, 35.0, 23.0, 26.0, 22.0, 25.0, 21.0, 13.0, 23.0, 7.0, 16.0, 9.0, 10.0, 9.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-25.40625, -24.650146484375, -23.89404296875, -23.137939453125, -22.3818359375, -21.625732421875, -20.86962890625, -20.113525390625, -19.357421875, -18.601318359375, -17.84521484375, -17.089111328125, -16.3330078125, -15.576904296875, -14.82080078125, -14.064697265625, -13.30859375, -12.552490234375, -11.79638671875, -11.040283203125, -10.2841796875, -9.528076171875, -8.77197265625, -8.015869140625, -7.259765625, -6.503662109375, -5.74755859375, -4.991455078125, -4.2353515625, -3.479248046875, -2.72314453125, -1.967041015625, -1.2109375, -0.454833984375, 0.30126953125, 1.057373046875, 1.8134765625, 2.569580078125, 3.32568359375, 4.081787109375, 4.837890625, 5.593994140625, 6.35009765625, 7.106201171875, 7.8623046875, 8.618408203125, 9.37451171875, 10.130615234375, 10.88671875, 11.642822265625, 12.39892578125, 13.155029296875, 13.9111328125, 14.667236328125, 15.42333984375, 16.179443359375, 16.935546875, 17.691650390625, 18.44775390625, 19.203857421875, 19.9599609375, 20.716064453125, 21.47216796875, 22.228271484375, 22.984375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 11.0, 17.0, 27.0, 56.0, 66.0, 103.0, 173.0, 291.0, 470.0, 820.0, 1357.0, 2352.0, 4110.0, 7776.0, 14719.0, 29469.0, 61083.0, 137014.0, 346713.0, 1113030.0, 1634558.0, 497543.0, 184335.0, 80031.0, 37476.0, 18831.0, 9749.0, 5255.0, 2876.0, 1600.0, 905.0, 537.0, 319.0, 223.0, 137.0, 83.0, 57.0, 36.0, 19.0, 19.0, 8.0, 9.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.208984375, -49.51171875, -47.814453125, -46.1171875, -44.419921875, -42.72265625, -41.025390625, -39.328125, -37.630859375, -35.93359375, -34.236328125, -32.5390625, -30.841796875, -29.14453125, -27.447265625, -25.75, -24.052734375, -22.35546875, -20.658203125, -18.9609375, -17.263671875, -15.56640625, -13.869140625, -12.171875, -10.474609375, -8.77734375, -7.080078125, -5.3828125, -3.685546875, -1.98828125, -0.291015625, 1.40625, 3.103515625, 4.80078125, 6.498046875, 8.1953125, 9.892578125, 11.58984375, 13.287109375, 14.984375, 16.681640625, 18.37890625, 20.076171875, 21.7734375, 23.470703125, 25.16796875, 26.865234375, 28.5625, 30.259765625, 31.95703125, 33.654296875, 35.3515625, 37.048828125, 38.74609375, 40.443359375, 42.140625, 43.837890625, 45.53515625, 47.232421875, 48.9296875, 50.626953125, 52.32421875, 54.021484375, 55.71875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 4.0, 4.0, 7.0, 14.0, 23.0, 22.0, 25.0, 31.0, 51.0, 65.0, 91.0, 93.0, 105.0, 125.0, 155.0, 248.0, 289.0, 379.0, 457.0, 374.0, 302.0, 253.0, 200.0, 157.0, 115.0, 90.0, 74.0, 61.0, 61.0, 32.0, 33.0, 32.0, 26.0, 16.0, 10.0, 8.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8853759765625, -11.419189453125, -10.9530029296875, -10.48681640625, -10.0206298828125, -9.554443359375, -9.0882568359375, -8.6220703125, -8.1558837890625, -7.689697265625, -7.2235107421875, -6.75732421875, -6.2911376953125, -5.824951171875, -5.3587646484375, -4.892578125, -4.4263916015625, -3.960205078125, -3.4940185546875, -3.02783203125, -2.5616455078125, -2.095458984375, -1.6292724609375, -1.1630859375, -0.6968994140625, -0.230712890625, 0.2354736328125, 0.70166015625, 1.1678466796875, 1.634033203125, 2.1002197265625, 2.56640625, 3.0325927734375, 3.498779296875, 3.9649658203125, 4.43115234375, 4.8973388671875, 5.363525390625, 5.8297119140625, 6.2958984375, 6.7620849609375, 7.228271484375, 7.6944580078125, 8.16064453125, 8.6268310546875, 9.093017578125, 9.5592041015625, 10.025390625, 10.4915771484375, 10.957763671875, 11.4239501953125, 11.89013671875, 12.3563232421875, 12.822509765625, 13.2886962890625, 13.7548828125, 14.2210693359375, 14.687255859375, 15.1534423828125, 15.61962890625, 16.0858154296875, 16.552001953125, 17.0181884765625, 17.484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 3.0, 14.0, 6.0, 5.0, 14.0, 18.0, 16.0, 24.0, 21.0, 34.0, 31.0, 32.0, 50.0, 49.0, 52.0, 54.0, 72.0, 53.0, 65.0, 59.0, 61.0, 46.0, 42.0, 27.0, 24.0, 17.0, 19.0, 11.0, 12.0, 14.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.91046142578125, -29.837297439575195, -28.76413345336914, -27.690969467163086, -26.61780548095703, -25.54464340209961, -24.471479415893555, -23.3983154296875, -22.325151443481445, -21.25198745727539, -20.178823471069336, -19.10565948486328, -18.03249740600586, -16.959331512451172, -15.88616943359375, -14.813005447387695, -13.73984146118164, -12.666677474975586, -11.593513488769531, -10.520350456237793, -9.447186470031738, -8.374022483825684, -7.300858974456787, -6.227695465087891, -5.154531478881836, -4.081367492675781, -3.0082039833068848, -1.9350402355194092, -0.8618764877319336, 0.2112874984741211, 1.2844510078430176, 2.357614517211914, 3.4307823181152344, 4.503946304321289, 5.5771098136901855, 6.650273323059082, 7.723437309265137, 8.796601295471191, 9.86976432800293, 10.942928314208984, 12.016092300415039, 13.089256286621094, 14.162420272827148, 15.235583305358887, 16.308746337890625, 17.381912231445312, 18.455074310302734, 19.52823829650879, 20.601402282714844, 21.6745662689209, 22.747730255126953, 23.820894241333008, 24.894058227539062, 25.967220306396484, 27.04038429260254, 28.113548278808594, 29.18671226501465, 30.259876251220703, 31.333040237426758, 32.40620422363281, 33.479366302490234, 34.55253219604492, 35.625694274902344, 36.69886016845703, 37.77202224731445]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 8.0, 7.0, 16.0, 16.0, 18.0, 26.0, 20.0, 18.0, 32.0, 23.0, 33.0, 36.0, 31.0, 36.0, 40.0, 39.0, 37.0, 49.0, 37.0, 36.0, 31.0, 37.0, 36.0, 37.0, 31.0, 36.0, 34.0, 20.0, 30.0, 24.0, 19.0, 13.0, 16.0, 15.0, 13.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.769123077392578, -28.83692741394043, -27.90473175048828, -26.972537994384766, -26.040342330932617, -25.10814666748047, -24.17595100402832, -23.243755340576172, -22.311561584472656, -21.379365921020508, -20.44717025756836, -19.514976501464844, -18.582780838012695, -17.650585174560547, -16.7183895111084, -15.78619384765625, -14.853998184204102, -13.921802520751953, -12.989607810974121, -12.057412147521973, -11.12521743774414, -10.193021774291992, -9.260826110839844, -8.328630447387695, -7.396435737609863, -6.464240550994873, -5.532045364379883, -4.599849700927734, -3.667654514312744, -2.735459327697754, -1.8032636642456055, -0.8710684776306152, 0.06112480163574219, 0.993320107460022, 1.9255154132843018, 2.857710838317871, 3.7899060249328613, 4.722101211547852, 5.654296875, 6.58649206161499, 7.5186872482299805, 8.450882911682129, 9.383077621459961, 10.31527328491211, 11.247468948364258, 12.17966365814209, 13.111859321594238, 14.04405403137207, 14.976249694824219, 15.908445358276367, 16.840641021728516, 17.77283477783203, 18.70503044128418, 19.637226104736328, 20.569421768188477, 21.501617431640625, 22.43381118774414, 23.36600685119629, 24.298202514648438, 25.230396270751953, 26.1625919342041, 27.09478759765625, 28.0269832611084, 28.959178924560547, 29.891374588012695]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 13.0, 11.0, 22.0, 39.0, 44.0, 82.0, 108.0, 150.0, 212.0, 312.0, 466.0, 709.0, 1027.0, 1551.0, 2240.0, 3424.0, 5133.0, 7858.0, 12162.0, 19079.0, 29745.0, 48122.0, 78486.0, 127820.0, 192305.0, 189134.0, 123635.0, 75381.0, 46811.0, 29256.0, 18435.0, 11953.0, 7690.0, 5013.0, 3284.0, 2177.0, 1468.0, 995.0, 708.0, 464.0, 338.0, 227.0, 147.0, 89.0, 69.0, 51.0, 26.0, 21.0, 21.0, 9.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.219970703125, -21.50244140625, -20.784912109375, -20.0673828125, -19.349853515625, -18.63232421875, -17.914794921875, -17.197265625, -16.479736328125, -15.76220703125, -15.044677734375, -14.3271484375, -13.609619140625, -12.89208984375, -12.174560546875, -11.45703125, -10.739501953125, -10.02197265625, -9.304443359375, -8.5869140625, -7.869384765625, -7.15185546875, -6.434326171875, -5.716796875, -4.999267578125, -4.28173828125, -3.564208984375, -2.8466796875, -2.129150390625, -1.41162109375, -0.694091796875, 0.0234375, 0.740966796875, 1.45849609375, 2.176025390625, 2.8935546875, 3.611083984375, 4.32861328125, 5.046142578125, 5.763671875, 6.481201171875, 7.19873046875, 7.916259765625, 8.6337890625, 9.351318359375, 10.06884765625, 10.786376953125, 11.50390625, 12.221435546875, 12.93896484375, 13.656494140625, 14.3740234375, 15.091552734375, 15.80908203125, 16.526611328125, 17.244140625, 17.961669921875, 18.67919921875, 19.396728515625, 20.1142578125, 20.831787109375, 21.54931640625, 22.266845703125, 22.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 4.0, 3.0, 7.0, 16.0, 15.0, 16.0, 24.0, 16.0, 26.0, 34.0, 32.0, 24.0, 33.0, 28.0, 39.0, 42.0, 42.0, 40.0, 43.0, 53.0, 39.0, 32.0, 34.0, 33.0, 36.0, 44.0, 36.0, 33.0, 29.0, 26.0, 20.0, 21.0, 10.0, 14.0, 15.0, 10.0, 7.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.738037109375, -29.74169921875, -28.745361328125, -27.7490234375, -26.752685546875, -25.75634765625, -24.760009765625, -23.763671875, -22.767333984375, -21.77099609375, -20.774658203125, -19.7783203125, -18.781982421875, -17.78564453125, -16.789306640625, -15.79296875, -14.796630859375, -13.80029296875, -12.803955078125, -11.8076171875, -10.811279296875, -9.81494140625, -8.818603515625, -7.822265625, -6.825927734375, -5.82958984375, -4.833251953125, -3.8369140625, -2.840576171875, -1.84423828125, -0.847900390625, 0.1484375, 1.144775390625, 2.14111328125, 3.137451171875, 4.1337890625, 5.130126953125, 6.12646484375, 7.122802734375, 8.119140625, 9.115478515625, 10.11181640625, 11.108154296875, 12.1044921875, 13.100830078125, 14.09716796875, 15.093505859375, 16.08984375, 17.086181640625, 18.08251953125, 19.078857421875, 20.0751953125, 21.071533203125, 22.06787109375, 23.064208984375, 24.060546875, 25.056884765625, 26.05322265625, 27.049560546875, 28.0458984375, 29.042236328125, 30.03857421875, 31.034912109375, 32.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 17.0, 30.0, 29.0, 48.0, 66.0, 101.0, 153.0, 194.0, 287.0, 423.0, 645.0, 984.0, 1592.0, 2490.0, 3977.0, 6738.0, 11371.0, 20600.0, 38926.0, 80717.0, 185181.0, 327926.0, 191314.0, 83592.0, 40478.0, 20975.0, 11687.0, 6741.0, 3978.0, 2531.0, 1638.0, 1026.0, 648.0, 440.0, 292.0, 208.0, 146.0, 104.0, 71.0, 53.0, 28.0, 26.0, 21.0, 11.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.84814453125, -34.6337890625, -33.41943359375, -32.205078125, -30.99072265625, -29.7763671875, -28.56201171875, -27.34765625, -26.13330078125, -24.9189453125, -23.70458984375, -22.490234375, -21.27587890625, -20.0615234375, -18.84716796875, -17.6328125, -16.41845703125, -15.2041015625, -13.98974609375, -12.775390625, -11.56103515625, -10.3466796875, -9.13232421875, -7.91796875, -6.70361328125, -5.4892578125, -4.27490234375, -3.060546875, -1.84619140625, -0.6318359375, 0.58251953125, 1.796875, 3.01123046875, 4.2255859375, 5.43994140625, 6.654296875, 7.86865234375, 9.0830078125, 10.29736328125, 11.51171875, 12.72607421875, 13.9404296875, 15.15478515625, 16.369140625, 17.58349609375, 18.7978515625, 20.01220703125, 21.2265625, 22.44091796875, 23.6552734375, 24.86962890625, 26.083984375, 27.29833984375, 28.5126953125, 29.72705078125, 30.94140625, 32.15576171875, 33.3701171875, 34.58447265625, 35.798828125, 37.01318359375, 38.2275390625, 39.44189453125, 40.65625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 11.0, 15.0, 10.0, 13.0, 24.0, 25.0, 16.0, 27.0, 43.0, 25.0, 36.0, 32.0, 39.0, 39.0, 48.0, 24.0, 34.0, 43.0, 35.0, 39.0, 36.0, 37.0, 44.0, 40.0, 33.0, 32.0, 31.0, 29.0, 18.0, 12.0, 16.0, 11.0, 6.0, 15.0, 6.0, 5.0, 9.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.578125, -20.93798828125, -20.2978515625, -19.65771484375, -19.017578125, -18.37744140625, -17.7373046875, -17.09716796875, -16.45703125, -15.81689453125, -15.1767578125, -14.53662109375, -13.896484375, -13.25634765625, -12.6162109375, -11.97607421875, -11.3359375, -10.69580078125, -10.0556640625, -9.41552734375, -8.775390625, -8.13525390625, -7.4951171875, -6.85498046875, -6.21484375, -5.57470703125, -4.9345703125, -4.29443359375, -3.654296875, -3.01416015625, -2.3740234375, -1.73388671875, -1.09375, -0.45361328125, 0.1865234375, 0.82666015625, 1.466796875, 2.10693359375, 2.7470703125, 3.38720703125, 4.02734375, 4.66748046875, 5.3076171875, 5.94775390625, 6.587890625, 7.22802734375, 7.8681640625, 8.50830078125, 9.1484375, 9.78857421875, 10.4287109375, 11.06884765625, 11.708984375, 12.34912109375, 12.9892578125, 13.62939453125, 14.26953125, 14.90966796875, 15.5498046875, 16.18994140625, 16.830078125, 17.47021484375, 18.1103515625, 18.75048828125, 19.390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 11.0, 16.0, 30.0, 33.0, 46.0, 58.0, 102.0, 133.0, 184.0, 300.0, 436.0, 713.0, 1143.0, 1894.0, 3376.0, 6278.0, 12230.0, 27807.0, 77434.0, 286475.0, 435226.0, 120734.0, 39262.0, 16287.0, 7794.0, 4218.0, 2442.0, 1354.0, 849.0, 555.0, 361.0, 225.0, 165.0, 104.0, 58.0, 57.0, 33.0, 26.0, 18.0, 19.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.6484375, -15.1466064453125, -14.644775390625, -14.1429443359375, -13.64111328125, -13.1392822265625, -12.637451171875, -12.1356201171875, -11.6337890625, -11.1319580078125, -10.630126953125, -10.1282958984375, -9.62646484375, -9.1246337890625, -8.622802734375, -8.1209716796875, -7.619140625, -7.1173095703125, -6.615478515625, -6.1136474609375, -5.61181640625, -5.1099853515625, -4.608154296875, -4.1063232421875, -3.6044921875, -3.1026611328125, -2.600830078125, -2.0989990234375, -1.59716796875, -1.0953369140625, -0.593505859375, -0.0916748046875, 0.41015625, 0.9119873046875, 1.413818359375, 1.9156494140625, 2.41748046875, 2.9193115234375, 3.421142578125, 3.9229736328125, 4.4248046875, 4.9266357421875, 5.428466796875, 5.9302978515625, 6.43212890625, 6.9339599609375, 7.435791015625, 7.9376220703125, 8.439453125, 8.9412841796875, 9.443115234375, 9.9449462890625, 10.44677734375, 10.9486083984375, 11.450439453125, 11.9522705078125, 12.4541015625, 12.9559326171875, 13.457763671875, 13.9595947265625, 14.46142578125, 14.9632568359375, 15.465087890625, 15.9669189453125, 16.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 14.0, 18.0, 35.0, 41.0, 81.0, 87.0, 148.0, 159.0, 115.0, 96.0, 56.0, 37.0, 27.0, 19.0, 13.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018739700317382812, -0.0018118172883987427, -0.001749664545059204, -0.0016875118017196655, -0.001625359058380127, -0.0015632063150405884, -0.0015010535717010498, -0.0014389008283615112, -0.0013767480850219727, -0.001314595341682434, -0.0012524425983428955, -0.001190289855003357, -0.0011281371116638184, -0.0010659843683242798, -0.0010038316249847412, -0.0009416788816452026, -0.0008795261383056641, -0.0008173733949661255, -0.0007552206516265869, -0.0006930679082870483, -0.0006309151649475098, -0.0005687624216079712, -0.0005066096782684326, -0.00044445693492889404, -0.00038230419158935547, -0.0003201514482498169, -0.0002579987049102783, -0.00019584596157073975, -0.00013369321823120117, -7.15404748916626e-05, -9.387731552124023e-06, 5.276501178741455e-05, 0.00011491775512695312, 0.0001770704984664917, 0.00023922324180603027, 0.00030137598514556885, 0.0003635287284851074, 0.000425681471824646, 0.00048783421516418457, 0.0005499869585037231, 0.0006121397018432617, 0.0006742924451828003, 0.0007364451885223389, 0.0007985979318618774, 0.000860750675201416, 0.0009229034185409546, 0.0009850561618804932, 0.0010472089052200317, 0.0011093616485595703, 0.0011715143918991089, 0.0012336671352386475, 0.001295819878578186, 0.0013579726219177246, 0.0014201253652572632, 0.0014822781085968018, 0.0015444308519363403, 0.001606583595275879, 0.0016687363386154175, 0.001730889081954956, 0.0017930418252944946, 0.0018551945686340332, 0.0019173473119735718, 0.0019795000553131104, 0.002041652798652649, 0.0021038055419921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 21.0, 29.0, 45.0, 79.0, 119.0, 134.0, 208.0, 363.0, 427.0, 713.0, 1147.0, 1743.0, 2782.0, 4729.0, 7822.0, 14249.0, 27808.0, 60494.0, 153811.0, 334810.0, 250617.0, 98027.0, 41014.0, 20323.0, 10889.0, 6058.0, 3624.0, 2217.0, 1441.0, 892.0, 603.0, 412.0, 286.0, 174.0, 129.0, 86.0, 62.0, 41.0, 22.0, 25.0, 17.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.21875, -14.781005859375, -14.34326171875, -13.905517578125, -13.4677734375, -13.030029296875, -12.59228515625, -12.154541015625, -11.716796875, -11.279052734375, -10.84130859375, -10.403564453125, -9.9658203125, -9.528076171875, -9.09033203125, -8.652587890625, -8.21484375, -7.777099609375, -7.33935546875, -6.901611328125, -6.4638671875, -6.026123046875, -5.58837890625, -5.150634765625, -4.712890625, -4.275146484375, -3.83740234375, -3.399658203125, -2.9619140625, -2.524169921875, -2.08642578125, -1.648681640625, -1.2109375, -0.773193359375, -0.33544921875, 0.102294921875, 0.5400390625, 0.977783203125, 1.41552734375, 1.853271484375, 2.291015625, 2.728759765625, 3.16650390625, 3.604248046875, 4.0419921875, 4.479736328125, 4.91748046875, 5.355224609375, 5.79296875, 6.230712890625, 6.66845703125, 7.106201171875, 7.5439453125, 7.981689453125, 8.41943359375, 8.857177734375, 9.294921875, 9.732666015625, 10.17041015625, 10.608154296875, 11.0458984375, 11.483642578125, 11.92138671875, 12.359130859375, 12.796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 7.0, 5.0, 7.0, 7.0, 15.0, 16.0, 25.0, 24.0, 34.0, 52.0, 79.0, 63.0, 86.0, 71.0, 88.0, 82.0, 74.0, 61.0, 36.0, 21.0, 28.0, 24.0, 13.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.284912109375, -4.14013671875, -3.995361328125, -3.8505859375, -3.705810546875, -3.56103515625, -3.416259765625, -3.271484375, -3.126708984375, -2.98193359375, -2.837158203125, -2.6923828125, -2.547607421875, -2.40283203125, -2.258056640625, -2.11328125, -1.968505859375, -1.82373046875, -1.678955078125, -1.5341796875, -1.389404296875, -1.24462890625, -1.099853515625, -0.955078125, -0.810302734375, -0.66552734375, -0.520751953125, -0.3759765625, -0.231201171875, -0.08642578125, 0.058349609375, 0.203125, 0.347900390625, 0.49267578125, 0.637451171875, 0.7822265625, 0.927001953125, 1.07177734375, 1.216552734375, 1.361328125, 1.506103515625, 1.65087890625, 1.795654296875, 1.9404296875, 2.085205078125, 2.22998046875, 2.374755859375, 2.51953125, 2.664306640625, 2.80908203125, 2.953857421875, 3.0986328125, 3.243408203125, 3.38818359375, 3.532958984375, 3.677734375, 3.822509765625, 3.96728515625, 4.112060546875, 4.2568359375, 4.401611328125, 4.54638671875, 4.691162109375, 4.8359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 8.0, 10.0, 7.0, 9.0, 12.0, 15.0, 21.0, 16.0, 23.0, 32.0, 22.0, 34.0, 32.0, 47.0, 54.0, 65.0, 61.0, 70.0, 51.0, 64.0, 43.0, 49.0, 41.0, 37.0, 30.0, 22.0, 23.0, 16.0, 17.0, 9.0, 12.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.662500381469727, -27.651273727416992, -26.64004898071289, -25.628822326660156, -24.617595672607422, -23.606369018554688, -22.595144271850586, -21.58391761779785, -20.57269287109375, -19.561466217041016, -18.550241470336914, -17.53901481628418, -16.527788162231445, -15.516562461853027, -14.50533676147461, -13.494110107421875, -12.48288345336914, -11.471657752990723, -10.460431098937988, -9.44920539855957, -8.437978744506836, -7.426753044128418, -6.41552734375, -5.404301166534424, -4.393074989318848, -3.3818488121032715, -2.3706228733062744, -1.3593969345092773, -0.34817075729370117, 0.663055419921875, 1.674281120300293, 2.685507297515869, 3.696735382080078, 4.707961559295654, 5.7191877365112305, 6.730413436889648, 7.741639614105225, 8.7528657913208, 9.764091491699219, 10.775318145751953, 11.786543846130371, 12.797769546508789, 13.808996200561523, 14.820221900939941, 15.83144760131836, 16.842674255371094, 17.853900909423828, 18.86512565612793, 19.876352310180664, 20.8875789642334, 21.8988037109375, 22.910030364990234, 23.92125701904297, 24.932483673095703, 25.943708419799805, 26.95493507385254, 27.96615982055664, 28.977386474609375, 29.988611221313477, 30.99983787536621, 32.01106262207031, 33.02228927612305, 34.03351593017578, 35.044742584228516, 36.05596923828125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 4.0, 10.0, 8.0, 14.0, 20.0, 23.0, 23.0, 25.0, 23.0, 30.0, 26.0, 27.0, 35.0, 35.0, 43.0, 27.0, 47.0, 38.0, 40.0, 40.0, 30.0, 39.0, 34.0, 42.0, 32.0, 35.0, 36.0, 23.0, 25.0, 32.0, 25.0, 10.0, 16.0, 11.0, 16.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-29.438772201538086, -28.533864974975586, -27.628957748413086, -26.724050521850586, -25.819143295288086, -24.914236068725586, -24.009328842163086, -23.104421615600586, -22.199514389038086, -21.294607162475586, -20.389699935913086, -19.484792709350586, -18.579885482788086, -17.674978256225586, -16.770071029663086, -15.865163803100586, -14.96025562286377, -14.05534839630127, -13.15044116973877, -12.24553394317627, -11.34062671661377, -10.435718536376953, -9.530811309814453, -8.625904083251953, -7.720997333526611, -6.816090106964111, -5.911182880401611, -5.006275177001953, -4.101367950439453, -3.196460723876953, -2.291553497314453, -1.3866462707519531, -0.4817390441894531, 0.42316824197769165, 1.3280755281448364, 2.232982873916626, 3.137890100479126, 4.042797565460205, 4.947704792022705, 5.852612018585205, 6.757519245147705, 7.662426471710205, 8.567334175109863, 9.472241401672363, 10.377148628234863, 11.282055854797363, 12.186963081359863, 13.091870307922363, 13.996777534484863, 14.901684761047363, 15.806591987609863, 16.71150016784668, 17.61640739440918, 18.52131462097168, 19.42622184753418, 20.33112907409668, 21.23603630065918, 22.14094352722168, 23.04585075378418, 23.95075798034668, 24.85566520690918, 25.76057243347168, 26.66547966003418, 27.57038688659668, 28.47529411315918]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 18.0, 46.0, 56.0, 94.0, 118.0, 212.0, 264.0, 460.0, 700.0, 1208.0, 1735.0, 2766.0, 4426.0, 6932.0, 11013.0, 17526.0, 28044.0, 45617.0, 72881.0, 115724.0, 169015.0, 187846.0, 140297.0, 91082.0, 55964.0, 35287.0, 21762.0, 13875.0, 8596.0, 5464.0, 3345.0, 2179.0, 1433.0, 923.0, 568.0, 380.0, 215.0, 152.0, 99.0, 82.0, 50.0, 24.0, 17.0, 10.0, 9.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.71875, -33.6416015625, -32.564453125, -31.4873046875, -30.41015625, -29.3330078125, -28.255859375, -27.1787109375, -26.1015625, -25.0244140625, -23.947265625, -22.8701171875, -21.79296875, -20.7158203125, -19.638671875, -18.5615234375, -17.484375, -16.4072265625, -15.330078125, -14.2529296875, -13.17578125, -12.0986328125, -11.021484375, -9.9443359375, -8.8671875, -7.7900390625, -6.712890625, -5.6357421875, -4.55859375, -3.4814453125, -2.404296875, -1.3271484375, -0.25, 0.8271484375, 1.904296875, 2.9814453125, 4.05859375, 5.1357421875, 6.212890625, 7.2900390625, 8.3671875, 9.4443359375, 10.521484375, 11.5986328125, 12.67578125, 13.7529296875, 14.830078125, 15.9072265625, 16.984375, 18.0615234375, 19.138671875, 20.2158203125, 21.29296875, 22.3701171875, 23.447265625, 24.5244140625, 25.6015625, 26.6787109375, 27.755859375, 28.8330078125, 29.91015625, 30.9873046875, 32.064453125, 33.1416015625, 34.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 13.0, 6.0, 9.0, 5.0, 13.0, 15.0, 25.0, 26.0, 14.0, 24.0, 29.0, 25.0, 28.0, 36.0, 41.0, 41.0, 30.0, 31.0, 31.0, 45.0, 51.0, 40.0, 36.0, 31.0, 36.0, 36.0, 46.0, 30.0, 33.0, 22.0, 24.0, 26.0, 19.0, 13.0, 19.0, 16.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-31.234375, -30.31689453125, -29.3994140625, -28.48193359375, -27.564453125, -26.64697265625, -25.7294921875, -24.81201171875, -23.89453125, -22.97705078125, -22.0595703125, -21.14208984375, -20.224609375, -19.30712890625, -18.3896484375, -17.47216796875, -16.5546875, -15.63720703125, -14.7197265625, -13.80224609375, -12.884765625, -11.96728515625, -11.0498046875, -10.13232421875, -9.21484375, -8.29736328125, -7.3798828125, -6.46240234375, -5.544921875, -4.62744140625, -3.7099609375, -2.79248046875, -1.875, -0.95751953125, -0.0400390625, 0.87744140625, 1.794921875, 2.71240234375, 3.6298828125, 4.54736328125, 5.46484375, 6.38232421875, 7.2998046875, 8.21728515625, 9.134765625, 10.05224609375, 10.9697265625, 11.88720703125, 12.8046875, 13.72216796875, 14.6396484375, 15.55712890625, 16.474609375, 17.39208984375, 18.3095703125, 19.22705078125, 20.14453125, 21.06201171875, 21.9794921875, 22.89697265625, 23.814453125, 24.73193359375, 25.6494140625, 26.56689453125, 27.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 11.0, 22.0, 26.0, 34.0, 62.0, 101.0, 139.0, 271.0, 411.0, 708.0, 1132.0, 2097.0, 3602.0, 6459.0, 11792.0, 22277.0, 42685.0, 86421.0, 174303.0, 278965.0, 205499.0, 103223.0, 51100.0, 25981.0, 13821.0, 7483.0, 4117.0, 2372.0, 1388.0, 839.0, 453.0, 262.0, 189.0, 104.0, 80.0, 43.0, 28.0, 18.0, 18.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.853515625, -46.23828125, -44.623046875, -43.0078125, -41.392578125, -39.77734375, -38.162109375, -36.546875, -34.931640625, -33.31640625, -31.701171875, -30.0859375, -28.470703125, -26.85546875, -25.240234375, -23.625, -22.009765625, -20.39453125, -18.779296875, -17.1640625, -15.548828125, -13.93359375, -12.318359375, -10.703125, -9.087890625, -7.47265625, -5.857421875, -4.2421875, -2.626953125, -1.01171875, 0.603515625, 2.21875, 3.833984375, 5.44921875, 7.064453125, 8.6796875, 10.294921875, 11.91015625, 13.525390625, 15.140625, 16.755859375, 18.37109375, 19.986328125, 21.6015625, 23.216796875, 24.83203125, 26.447265625, 28.0625, 29.677734375, 31.29296875, 32.908203125, 34.5234375, 36.138671875, 37.75390625, 39.369140625, 40.984375, 42.599609375, 44.21484375, 45.830078125, 47.4453125, 49.060546875, 50.67578125, 52.291015625, 53.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 2.0, 2.0, 9.0, 7.0, 18.0, 13.0, 16.0, 11.0, 23.0, 25.0, 20.0, 31.0, 38.0, 32.0, 35.0, 37.0, 59.0, 52.0, 41.0, 40.0, 53.0, 38.0, 46.0, 49.0, 32.0, 34.0, 35.0, 36.0, 20.0, 16.0, 21.0, 23.0, 17.0, 12.0, 15.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.890625, -20.250732421875, -19.61083984375, -18.970947265625, -18.3310546875, -17.691162109375, -17.05126953125, -16.411376953125, -15.771484375, -15.131591796875, -14.49169921875, -13.851806640625, -13.2119140625, -12.572021484375, -11.93212890625, -11.292236328125, -10.65234375, -10.012451171875, -9.37255859375, -8.732666015625, -8.0927734375, -7.452880859375, -6.81298828125, -6.173095703125, -5.533203125, -4.893310546875, -4.25341796875, -3.613525390625, -2.9736328125, -2.333740234375, -1.69384765625, -1.053955078125, -0.4140625, 0.225830078125, 0.86572265625, 1.505615234375, 2.1455078125, 2.785400390625, 3.42529296875, 4.065185546875, 4.705078125, 5.344970703125, 5.98486328125, 6.624755859375, 7.2646484375, 7.904541015625, 8.54443359375, 9.184326171875, 9.82421875, 10.464111328125, 11.10400390625, 11.743896484375, 12.3837890625, 13.023681640625, 13.66357421875, 14.303466796875, 14.943359375, 15.583251953125, 16.22314453125, 16.863037109375, 17.5029296875, 18.142822265625, 18.78271484375, 19.422607421875, 20.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 11.0, 18.0, 26.0, 26.0, 33.0, 54.0, 78.0, 94.0, 117.0, 171.0, 260.0, 353.0, 507.0, 740.0, 1143.0, 1831.0, 3001.0, 5140.0, 9083.0, 18024.0, 37542.0, 85294.0, 206669.0, 336021.0, 190600.0, 78129.0, 34960.0, 16904.0, 8737.0, 4892.0, 2818.0, 1760.0, 1064.0, 706.0, 507.0, 355.0, 244.0, 174.0, 116.0, 105.0, 60.0, 45.0, 37.0, 36.0, 15.0, 11.0, 14.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.59375, -19.91748046875, -19.2412109375, -18.56494140625, -17.888671875, -17.21240234375, -16.5361328125, -15.85986328125, -15.18359375, -14.50732421875, -13.8310546875, -13.15478515625, -12.478515625, -11.80224609375, -11.1259765625, -10.44970703125, -9.7734375, -9.09716796875, -8.4208984375, -7.74462890625, -7.068359375, -6.39208984375, -5.7158203125, -5.03955078125, -4.36328125, -3.68701171875, -3.0107421875, -2.33447265625, -1.658203125, -0.98193359375, -0.3056640625, 0.37060546875, 1.046875, 1.72314453125, 2.3994140625, 3.07568359375, 3.751953125, 4.42822265625, 5.1044921875, 5.78076171875, 6.45703125, 7.13330078125, 7.8095703125, 8.48583984375, 9.162109375, 9.83837890625, 10.5146484375, 11.19091796875, 11.8671875, 12.54345703125, 13.2197265625, 13.89599609375, 14.572265625, 15.24853515625, 15.9248046875, 16.60107421875, 17.27734375, 17.95361328125, 18.6298828125, 19.30615234375, 19.982421875, 20.65869140625, 21.3349609375, 22.01123046875, 22.6875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 26.0, 33.0, 60.0, 78.0, 90.0, 137.0, 126.0, 108.0, 80.0, 66.0, 36.0, 38.0, 11.0, 19.0, 11.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0028972625732421875, -0.0028096139430999756, -0.0027219653129577637, -0.0026343166828155518, -0.00254666805267334, -0.002459019422531128, -0.002371370792388916, -0.002283722162246704, -0.002196073532104492, -0.0021084249019622803, -0.0020207762718200684, -0.0019331276416778564, -0.0018454790115356445, -0.0017578303813934326, -0.0016701817512512207, -0.0015825331211090088, -0.0014948844909667969, -0.001407235860824585, -0.001319587230682373, -0.0012319386005401611, -0.0011442899703979492, -0.0010566413402557373, -0.0009689927101135254, -0.0008813440799713135, -0.0007936954498291016, -0.0007060468196868896, -0.0006183981895446777, -0.0005307495594024658, -0.0004431009292602539, -0.000355452299118042, -0.0002678036689758301, -0.00018015503883361816, -9.250640869140625e-05, -4.857778549194336e-06, 8.279085159301758e-05, 0.0001704394817352295, 0.0002580881118774414, 0.0003457367420196533, 0.00043338537216186523, 0.0005210340023040771, 0.0006086826324462891, 0.000696331262588501, 0.0007839798927307129, 0.0008716285228729248, 0.0009592771530151367, 0.0010469257831573486, 0.0011345744132995605, 0.0012222230434417725, 0.0013098716735839844, 0.0013975203037261963, 0.0014851689338684082, 0.0015728175640106201, 0.001660466194152832, 0.001748114824295044, 0.0018357634544372559, 0.0019234120845794678, 0.0020110607147216797, 0.0020987093448638916, 0.0021863579750061035, 0.0022740066051483154, 0.0023616552352905273, 0.0024493038654327393, 0.002536952495574951, 0.002624601125717163, 0.002712249755859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 33.0, 28.0, 38.0, 52.0, 97.0, 146.0, 250.0, 419.0, 661.0, 1118.0, 1947.0, 3390.0, 6399.0, 12480.0, 26415.0, 58982.0, 137365.0, 289205.0, 276118.0, 127457.0, 55422.0, 24742.0, 11874.0, 6008.0, 3260.0, 1867.0, 1044.0, 612.0, 379.0, 219.0, 156.0, 100.0, 77.0, 43.0, 33.0, 17.0, 13.0, 12.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.828125, -19.166259765625, -18.50439453125, -17.842529296875, -17.1806640625, -16.518798828125, -15.85693359375, -15.195068359375, -14.533203125, -13.871337890625, -13.20947265625, -12.547607421875, -11.8857421875, -11.223876953125, -10.56201171875, -9.900146484375, -9.23828125, -8.576416015625, -7.91455078125, -7.252685546875, -6.5908203125, -5.928955078125, -5.26708984375, -4.605224609375, -3.943359375, -3.281494140625, -2.61962890625, -1.957763671875, -1.2958984375, -0.634033203125, 0.02783203125, 0.689697265625, 1.3515625, 2.013427734375, 2.67529296875, 3.337158203125, 3.9990234375, 4.660888671875, 5.32275390625, 5.984619140625, 6.646484375, 7.308349609375, 7.97021484375, 8.632080078125, 9.2939453125, 9.955810546875, 10.61767578125, 11.279541015625, 11.94140625, 12.603271484375, 13.26513671875, 13.927001953125, 14.5888671875, 15.250732421875, 15.91259765625, 16.574462890625, 17.236328125, 17.898193359375, 18.56005859375, 19.221923828125, 19.8837890625, 20.545654296875, 21.20751953125, 21.869384765625, 22.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 16.0, 16.0, 17.0, 32.0, 32.0, 35.0, 50.0, 50.0, 66.0, 56.0, 71.0, 79.0, 83.0, 84.0, 57.0, 46.0, 41.0, 32.0, 34.0, 17.0, 13.0, 12.0, 13.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.22869873046875, -4.0355224609375, -3.84234619140625, -3.649169921875, -3.45599365234375, -3.2628173828125, -3.06964111328125, -2.87646484375, -2.68328857421875, -2.4901123046875, -2.29693603515625, -2.103759765625, -1.91058349609375, -1.7174072265625, -1.52423095703125, -1.3310546875, -1.13787841796875, -0.9447021484375, -0.75152587890625, -0.558349609375, -0.36517333984375, -0.1719970703125, 0.02117919921875, 0.21435546875, 0.40753173828125, 0.6007080078125, 0.79388427734375, 0.987060546875, 1.18023681640625, 1.3734130859375, 1.56658935546875, 1.759765625, 1.95294189453125, 2.1461181640625, 2.33929443359375, 2.532470703125, 2.72564697265625, 2.9188232421875, 3.11199951171875, 3.30517578125, 3.49835205078125, 3.6915283203125, 3.88470458984375, 4.077880859375, 4.27105712890625, 4.4642333984375, 4.65740966796875, 4.8505859375, 5.04376220703125, 5.2369384765625, 5.43011474609375, 5.623291015625, 5.81646728515625, 6.0096435546875, 6.20281982421875, 6.39599609375, 6.58917236328125, 6.7823486328125, 6.97552490234375, 7.168701171875, 7.36187744140625, 7.5550537109375, 7.74822998046875, 7.94140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 5.0, 9.0, 15.0, 20.0, 16.0, 18.0, 30.0, 33.0, 28.0, 41.0, 35.0, 50.0, 45.0, 59.0, 47.0, 49.0, 53.0, 48.0, 64.0, 43.0, 38.0, 43.0, 27.0, 20.0, 19.0, 18.0, 16.0, 22.0, 16.0, 6.0, 5.0, 8.0, 7.0, 3.0, 2.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0], "bins": [-28.101316452026367, -27.175453186035156, -26.249591827392578, -25.323728561401367, -24.397865295410156, -23.472002029418945, -22.546138763427734, -21.620277404785156, -20.694414138793945, -19.768550872802734, -18.842689514160156, -17.916826248168945, -16.990962982177734, -16.065099716186523, -15.139237403869629, -14.213375091552734, -13.287511825561523, -12.361648559570312, -11.435786247253418, -10.509923934936523, -9.584060668945312, -8.658197402954102, -7.732335090637207, -6.806472301483154, -5.880609512329102, -4.954746723175049, -4.028883934020996, -3.1030211448669434, -2.1771583557128906, -1.251295566558838, -0.32543277740478516, 0.6004300117492676, 1.5262908935546875, 2.4521536827087402, 3.378016471862793, 4.303879261016846, 5.229742050170898, 6.155604839324951, 7.081467628479004, 8.007329940795898, 8.93319320678711, 9.85905647277832, 10.784918785095215, 11.71078109741211, 12.63664436340332, 13.562507629394531, 14.488369941711426, 15.41423225402832, 16.34009552001953, 17.265958786010742, 18.191822052001953, 19.11768341064453, 20.043546676635742, 20.969409942626953, 21.89527130126953, 22.821134567260742, 23.746997833251953, 24.672861099243164, 25.598724365234375, 26.524585723876953, 27.450448989868164, 28.376312255859375, 29.302173614501953, 30.228036880493164, 31.153900146484375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 5.0, 11.0, 10.0, 7.0, 19.0, 15.0, 22.0, 17.0, 20.0, 21.0, 26.0, 27.0, 33.0, 35.0, 38.0, 34.0, 30.0, 39.0, 40.0, 28.0, 30.0, 30.0, 36.0, 25.0, 31.0, 40.0, 29.0, 28.0, 35.0, 30.0, 29.0, 27.0, 17.0, 17.0, 17.0, 16.0, 12.0, 6.0, 7.0, 12.0, 5.0, 9.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0], "bins": [-28.420991897583008, -27.608470916748047, -26.795949935913086, -25.983428955078125, -25.170909881591797, -24.358386993408203, -23.545867919921875, -22.733346939086914, -21.920825958251953, -21.108304977416992, -20.29578399658203, -19.48326301574707, -18.67074203491211, -17.85822296142578, -17.04570198059082, -16.23318099975586, -15.420660018920898, -14.608139038085938, -13.795618057250977, -12.983098030090332, -12.170577049255371, -11.35805606842041, -10.545536041259766, -9.733015060424805, -8.920494079589844, -8.107973098754883, -7.29545259475708, -6.482932090759277, -5.670411109924316, -4.8578901290893555, -4.045369625091553, -3.23284912109375, -2.4203262329101562, -1.6078054904937744, -0.7952847480773926, 0.017235994338989258, 0.8297567367553711, 1.642277717590332, 2.4547982215881348, 3.2673187255859375, 4.079839706420898, 4.892360687255859, 5.704881191253662, 6.517401695251465, 7.329922676086426, 8.142443656921387, 8.954963684082031, 9.767484664916992, 10.580005645751953, 11.392526626586914, 12.205047607421875, 13.01756763458252, 13.83008861541748, 14.642609596252441, 15.455129623413086, 16.267650604248047, 17.080171585083008, 17.89269256591797, 18.70521354675293, 19.51773452758789, 20.33025360107422, 21.142776489257812, 21.95529556274414, 22.7678165435791, 23.580337524414062]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 9.0, 7.0, 9.0, 10.0, 14.0, 24.0, 38.0, 45.0, 51.0, 89.0, 155.0, 182.0, 314.0, 412.0, 578.0, 899.0, 1249.0, 1954.0, 2973.0, 4645.0, 6920.0, 10970.0, 17514.0, 29326.0, 52229.0, 108345.0, 295432.0, 852505.0, 1386435.0, 847479.0, 320843.0, 119100.0, 56137.0, 30531.0, 17605.0, 10655.0, 6609.0, 4254.0, 2650.0, 1786.0, 1109.0, 750.0, 483.0, 328.0, 230.0, 147.0, 100.0, 42.0, 44.0, 28.0, 20.0, 13.0, 12.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-38.5625, -37.4453125, -36.328125, -35.2109375, -34.09375, -32.9765625, -31.859375, -30.7421875, -29.625, -28.5078125, -27.390625, -26.2734375, -25.15625, -24.0390625, -22.921875, -21.8046875, -20.6875, -19.5703125, -18.453125, -17.3359375, -16.21875, -15.1015625, -13.984375, -12.8671875, -11.75, -10.6328125, -9.515625, -8.3984375, -7.28125, -6.1640625, -5.046875, -3.9296875, -2.8125, -1.6953125, -0.578125, 0.5390625, 1.65625, 2.7734375, 3.890625, 5.0078125, 6.125, 7.2421875, 8.359375, 9.4765625, 10.59375, 11.7109375, 12.828125, 13.9453125, 15.0625, 16.1796875, 17.296875, 18.4140625, 19.53125, 20.6484375, 21.765625, 22.8828125, 24.0, 25.1171875, 26.234375, 27.3515625, 28.46875, 29.5859375, 30.703125, 31.8203125, 32.9375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 12.0, 18.0, 12.0, 13.0, 12.0, 21.0, 24.0, 30.0, 15.0, 27.0, 29.0, 39.0, 29.0, 37.0, 30.0, 38.0, 39.0, 40.0, 25.0, 40.0, 32.0, 42.0, 45.0, 39.0, 24.0, 30.0, 33.0, 28.0, 29.0, 14.0, 17.0, 12.0, 11.0, 18.0, 18.0, 7.0, 5.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.671875, -24.945556640625, -24.21923828125, -23.492919921875, -22.7666015625, -22.040283203125, -21.31396484375, -20.587646484375, -19.861328125, -19.135009765625, -18.40869140625, -17.682373046875, -16.9560546875, -16.229736328125, -15.50341796875, -14.777099609375, -14.05078125, -13.324462890625, -12.59814453125, -11.871826171875, -11.1455078125, -10.419189453125, -9.69287109375, -8.966552734375, -8.240234375, -7.513916015625, -6.78759765625, -6.061279296875, -5.3349609375, -4.608642578125, -3.88232421875, -3.156005859375, -2.4296875, -1.703369140625, -0.97705078125, -0.250732421875, 0.4755859375, 1.201904296875, 1.92822265625, 2.654541015625, 3.380859375, 4.107177734375, 4.83349609375, 5.559814453125, 6.2861328125, 7.012451171875, 7.73876953125, 8.465087890625, 9.19140625, 9.917724609375, 10.64404296875, 11.370361328125, 12.0966796875, 12.822998046875, 13.54931640625, 14.275634765625, 15.001953125, 15.728271484375, 16.45458984375, 17.180908203125, 17.9072265625, 18.633544921875, 19.35986328125, 20.086181640625, 20.8125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 1.0, 21.0, 33.0, 35.0, 38.0, 64.0, 98.0, 159.0, 226.0, 372.0, 508.0, 879.0, 1303.0, 2175.0, 3481.0, 5669.0, 10039.0, 17643.0, 32848.0, 62899.0, 128569.0, 293018.0, 771625.0, 1628720.0, 708548.0, 271835.0, 121760.0, 59737.0, 30933.0, 16951.0, 9594.0, 5520.0, 3315.0, 2060.0, 1298.0, 781.0, 509.0, 322.0, 235.0, 159.0, 101.0, 77.0, 44.0, 22.0, 22.0, 12.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.09375, -39.74462890625, -38.3955078125, -37.04638671875, -35.697265625, -34.34814453125, -32.9990234375, -31.64990234375, -30.30078125, -28.95166015625, -27.6025390625, -26.25341796875, -24.904296875, -23.55517578125, -22.2060546875, -20.85693359375, -19.5078125, -18.15869140625, -16.8095703125, -15.46044921875, -14.111328125, -12.76220703125, -11.4130859375, -10.06396484375, -8.71484375, -7.36572265625, -6.0166015625, -4.66748046875, -3.318359375, -1.96923828125, -0.6201171875, 0.72900390625, 2.078125, 3.42724609375, 4.7763671875, 6.12548828125, 7.474609375, 8.82373046875, 10.1728515625, 11.52197265625, 12.87109375, 14.22021484375, 15.5693359375, 16.91845703125, 18.267578125, 19.61669921875, 20.9658203125, 22.31494140625, 23.6640625, 25.01318359375, 26.3623046875, 27.71142578125, 29.060546875, 30.40966796875, 31.7587890625, 33.10791015625, 34.45703125, 35.80615234375, 37.1552734375, 38.50439453125, 39.853515625, 41.20263671875, 42.5517578125, 43.90087890625, 45.25]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 9.0, 12.0, 23.0, 30.0, 29.0, 46.0, 41.0, 48.0, 83.0, 96.0, 139.0, 183.0, 247.0, 341.0, 416.0, 466.0, 431.0, 334.0, 267.0, 181.0, 169.0, 107.0, 92.0, 63.0, 56.0, 39.0, 32.0, 24.0, 16.0, 11.0, 16.0, 3.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.466552734375, -11.97998046875, -11.493408203125, -11.0068359375, -10.520263671875, -10.03369140625, -9.547119140625, -9.060546875, -8.573974609375, -8.08740234375, -7.600830078125, -7.1142578125, -6.627685546875, -6.14111328125, -5.654541015625, -5.16796875, -4.681396484375, -4.19482421875, -3.708251953125, -3.2216796875, -2.735107421875, -2.24853515625, -1.761962890625, -1.275390625, -0.788818359375, -0.30224609375, 0.184326171875, 0.6708984375, 1.157470703125, 1.64404296875, 2.130615234375, 2.6171875, 3.103759765625, 3.59033203125, 4.076904296875, 4.5634765625, 5.050048828125, 5.53662109375, 6.023193359375, 6.509765625, 6.996337890625, 7.48291015625, 7.969482421875, 8.4560546875, 8.942626953125, 9.42919921875, 9.915771484375, 10.40234375, 10.888916015625, 11.37548828125, 11.862060546875, 12.3486328125, 12.835205078125, 13.32177734375, 13.808349609375, 14.294921875, 14.781494140625, 15.26806640625, 15.754638671875, 16.2412109375, 16.727783203125, 17.21435546875, 17.700927734375, 18.1875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 8.0, 19.0, 24.0, 26.0, 35.0, 39.0, 45.0, 54.0, 76.0, 62.0, 67.0, 82.0, 69.0, 73.0, 60.0, 43.0, 32.0, 29.0, 31.0, 15.0, 17.0, 16.0, 7.0, 12.0, 5.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-43.4337272644043, -42.22896194458008, -41.024200439453125, -39.819435119628906, -38.61466979980469, -37.40990447998047, -36.20513916015625, -35.0003776550293, -33.79561233520508, -32.59084701538086, -31.386083602905273, -30.181320190429688, -28.97655487060547, -27.77178955078125, -26.567026138305664, -25.362262725830078, -24.15749740600586, -22.95273208618164, -21.747968673706055, -20.54320526123047, -19.33843994140625, -18.13367462158203, -16.928911209106445, -15.724146842956543, -14.51938247680664, -13.314618110656738, -12.109853744506836, -10.905089378356934, -9.700325012207031, -8.495560646057129, -7.290796279907227, -6.086031913757324, -4.8812713623046875, -3.676506996154785, -2.471742630004883, -1.2669782638549805, -0.062213897705078125, 1.1425504684448242, 2.3473148345947266, 3.552079200744629, 4.756843566894531, 5.961607933044434, 7.166372299194336, 8.371136665344238, 9.57590103149414, 10.780665397644043, 11.985429763793945, 13.190194129943848, 14.39495849609375, 15.599722862243652, 16.804487228393555, 18.00925064086914, 19.21401596069336, 20.418781280517578, 21.623544692993164, 22.82830810546875, 24.03307342529297, 25.237838745117188, 26.442602157592773, 27.64736557006836, 28.852130889892578, 30.056896209716797, 31.261659622192383, 32.46642303466797, 33.67118835449219]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 15.0, 9.0, 8.0, 10.0, 17.0, 18.0, 16.0, 14.0, 23.0, 23.0, 23.0, 26.0, 34.0, 30.0, 37.0, 37.0, 44.0, 41.0, 41.0, 33.0, 51.0, 34.0, 37.0, 36.0, 35.0, 35.0, 25.0, 35.0, 29.0, 19.0, 15.0, 21.0, 22.0, 22.0, 12.0, 16.0, 8.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.403141021728516, -27.558950424194336, -26.714757919311523, -25.870567321777344, -25.026376724243164, -24.182186126708984, -23.337993621826172, -22.493803024291992, -21.649612426757812, -20.805421829223633, -19.96122932434082, -19.11703872680664, -18.27284812927246, -17.42865753173828, -16.58446502685547, -15.740274429321289, -14.896081924438477, -14.05189037322998, -13.2076997756958, -12.363508224487305, -11.519317626953125, -10.675126075744629, -9.830934524536133, -8.986743927001953, -8.142552375793457, -7.298361301422119, -6.454170227050781, -5.609978675842285, -4.765787601470947, -3.9215965270996094, -3.0774049758911133, -2.2332139015197754, -1.3890228271484375, -0.5448316335678101, 0.2993595600128174, 1.1435508728027344, 1.9877419471740723, 2.83193302154541, 3.6761245727539062, 4.520315647125244, 5.364506721496582, 6.20869779586792, 7.052888870239258, 7.897080421447754, 8.74127197265625, 9.58546257019043, 10.429654121398926, 11.273845672607422, 12.118036270141602, 12.962227821350098, 13.806418418884277, 14.650609970092773, 15.494800567626953, 16.338993072509766, 17.183183670043945, 18.027374267578125, 18.871566772460938, 19.715757369995117, 20.55994987487793, 21.40414047241211, 22.24833106994629, 23.09252166748047, 23.93671417236328, 24.78090476989746, 25.62509536743164]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 9.0, 11.0, 27.0, 30.0, 45.0, 62.0, 93.0, 143.0, 210.0, 359.0, 516.0, 911.0, 1582.0, 2843.0, 4881.0, 8905.0, 16162.0, 30746.0, 59894.0, 127007.0, 271466.0, 268490.0, 127189.0, 59912.0, 30562.0, 16110.0, 8726.0, 4836.0, 2793.0, 1533.0, 949.0, 558.0, 335.0, 216.0, 134.0, 102.0, 70.0, 37.0, 23.0, 22.0, 16.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -27.927490234375, -26.96435546875, -26.001220703125, -25.0380859375, -24.074951171875, -23.11181640625, -22.148681640625, -21.185546875, -20.222412109375, -19.25927734375, -18.296142578125, -17.3330078125, -16.369873046875, -15.40673828125, -14.443603515625, -13.48046875, -12.517333984375, -11.55419921875, -10.591064453125, -9.6279296875, -8.664794921875, -7.70166015625, -6.738525390625, -5.775390625, -4.812255859375, -3.84912109375, -2.885986328125, -1.9228515625, -0.959716796875, 0.00341796875, 0.966552734375, 1.9296875, 2.892822265625, 3.85595703125, 4.819091796875, 5.7822265625, 6.745361328125, 7.70849609375, 8.671630859375, 9.634765625, 10.597900390625, 11.56103515625, 12.524169921875, 13.4873046875, 14.450439453125, 15.41357421875, 16.376708984375, 17.33984375, 18.302978515625, 19.26611328125, 20.229248046875, 21.1923828125, 22.155517578125, 23.11865234375, 24.081787109375, 25.044921875, 26.008056640625, 26.97119140625, 27.934326171875, 28.8974609375, 29.860595703125, 30.82373046875, 31.786865234375, 32.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 7.0, 6.0, 13.0, 17.0, 14.0, 20.0, 7.0, 16.0, 19.0, 26.0, 26.0, 25.0, 34.0, 35.0, 43.0, 31.0, 33.0, 44.0, 46.0, 34.0, 43.0, 41.0, 30.0, 40.0, 35.0, 24.0, 34.0, 29.0, 30.0, 28.0, 16.0, 16.0, 19.0, 15.0, 15.0, 13.0, 19.0, 12.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.25, -27.404052734375, -26.55810546875, -25.712158203125, -24.8662109375, -24.020263671875, -23.17431640625, -22.328369140625, -21.482421875, -20.636474609375, -19.79052734375, -18.944580078125, -18.0986328125, -17.252685546875, -16.40673828125, -15.560791015625, -14.71484375, -13.868896484375, -13.02294921875, -12.177001953125, -11.3310546875, -10.485107421875, -9.63916015625, -8.793212890625, -7.947265625, -7.101318359375, -6.25537109375, -5.409423828125, -4.5634765625, -3.717529296875, -2.87158203125, -2.025634765625, -1.1796875, -0.333740234375, 0.51220703125, 1.358154296875, 2.2041015625, 3.050048828125, 3.89599609375, 4.741943359375, 5.587890625, 6.433837890625, 7.27978515625, 8.125732421875, 8.9716796875, 9.817626953125, 10.66357421875, 11.509521484375, 12.35546875, 13.201416015625, 14.04736328125, 14.893310546875, 15.7392578125, 16.585205078125, 17.43115234375, 18.277099609375, 19.123046875, 19.968994140625, 20.81494140625, 21.660888671875, 22.5068359375, 23.352783203125, 24.19873046875, 25.044677734375, 25.890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 9.0, 18.0, 35.0, 58.0, 62.0, 100.0, 155.0, 197.0, 352.0, 550.0, 901.0, 1409.0, 2295.0, 3898.0, 6346.0, 11108.0, 20127.0, 39549.0, 87323.0, 226993.0, 363424.0, 152195.0, 63045.0, 30192.0, 15956.0, 8876.0, 5144.0, 3067.0, 1914.0, 1175.0, 754.0, 426.0, 313.0, 199.0, 117.0, 82.0, 55.0, 44.0, 32.0, 20.0, 8.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40625, -37.21728515625, -36.0283203125, -34.83935546875, -33.650390625, -32.46142578125, -31.2724609375, -30.08349609375, -28.89453125, -27.70556640625, -26.5166015625, -25.32763671875, -24.138671875, -22.94970703125, -21.7607421875, -20.57177734375, -19.3828125, -18.19384765625, -17.0048828125, -15.81591796875, -14.626953125, -13.43798828125, -12.2490234375, -11.06005859375, -9.87109375, -8.68212890625, -7.4931640625, -6.30419921875, -5.115234375, -3.92626953125, -2.7373046875, -1.54833984375, -0.359375, 0.82958984375, 2.0185546875, 3.20751953125, 4.396484375, 5.58544921875, 6.7744140625, 7.96337890625, 9.15234375, 10.34130859375, 11.5302734375, 12.71923828125, 13.908203125, 15.09716796875, 16.2861328125, 17.47509765625, 18.6640625, 19.85302734375, 21.0419921875, 22.23095703125, 23.419921875, 24.60888671875, 25.7978515625, 26.98681640625, 28.17578125, 29.36474609375, 30.5537109375, 31.74267578125, 32.931640625, 34.12060546875, 35.3095703125, 36.49853515625, 37.6875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 3.0, 8.0, 9.0, 13.0, 19.0, 14.0, 18.0, 21.0, 20.0, 26.0, 33.0, 28.0, 39.0, 38.0, 43.0, 51.0, 46.0, 49.0, 41.0, 44.0, 37.0, 46.0, 35.0, 43.0, 43.0, 32.0, 25.0, 18.0, 29.0, 21.0, 24.0, 15.0, 7.0, 10.0, 9.0, 5.0, 9.0, 4.0, 1.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.0712890625, -19.439453125, -18.8076171875, -18.17578125, -17.5439453125, -16.912109375, -16.2802734375, -15.6484375, -15.0166015625, -14.384765625, -13.7529296875, -13.12109375, -12.4892578125, -11.857421875, -11.2255859375, -10.59375, -9.9619140625, -9.330078125, -8.6982421875, -8.06640625, -7.4345703125, -6.802734375, -6.1708984375, -5.5390625, -4.9072265625, -4.275390625, -3.6435546875, -3.01171875, -2.3798828125, -1.748046875, -1.1162109375, -0.484375, 0.1474609375, 0.779296875, 1.4111328125, 2.04296875, 2.6748046875, 3.306640625, 3.9384765625, 4.5703125, 5.2021484375, 5.833984375, 6.4658203125, 7.09765625, 7.7294921875, 8.361328125, 8.9931640625, 9.625, 10.2568359375, 10.888671875, 11.5205078125, 12.15234375, 12.7841796875, 13.416015625, 14.0478515625, 14.6796875, 15.3115234375, 15.943359375, 16.5751953125, 17.20703125, 17.8388671875, 18.470703125, 19.1025390625, 19.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 12.0, 9.0, 15.0, 27.0, 36.0, 43.0, 51.0, 87.0, 104.0, 173.0, 254.0, 364.0, 545.0, 845.0, 1400.0, 2192.0, 3773.0, 6596.0, 12241.0, 25278.0, 56288.0, 133764.0, 308554.0, 279554.0, 117789.0, 49360.0, 22486.0, 11294.0, 6004.0, 3468.0, 2095.0, 1365.0, 819.0, 564.0, 373.0, 219.0, 148.0, 104.0, 65.0, 58.0, 33.0, 27.0, 18.0, 13.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0], "bins": [-10.2734375, -9.96142578125, -9.6494140625, -9.33740234375, -9.025390625, -8.71337890625, -8.4013671875, -8.08935546875, -7.77734375, -7.46533203125, -7.1533203125, -6.84130859375, -6.529296875, -6.21728515625, -5.9052734375, -5.59326171875, -5.28125, -4.96923828125, -4.6572265625, -4.34521484375, -4.033203125, -3.72119140625, -3.4091796875, -3.09716796875, -2.78515625, -2.47314453125, -2.1611328125, -1.84912109375, -1.537109375, -1.22509765625, -0.9130859375, -0.60107421875, -0.2890625, 0.02294921875, 0.3349609375, 0.64697265625, 0.958984375, 1.27099609375, 1.5830078125, 1.89501953125, 2.20703125, 2.51904296875, 2.8310546875, 3.14306640625, 3.455078125, 3.76708984375, 4.0791015625, 4.39111328125, 4.703125, 5.01513671875, 5.3271484375, 5.63916015625, 5.951171875, 6.26318359375, 6.5751953125, 6.88720703125, 7.19921875, 7.51123046875, 7.8232421875, 8.13525390625, 8.447265625, 8.75927734375, 9.0712890625, 9.38330078125, 9.6953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 9.0, 11.0, 22.0, 32.0, 29.0, 30.0, 39.0, 51.0, 67.0, 59.0, 75.0, 67.0, 64.0, 58.0, 63.0, 58.0, 43.0, 34.0, 29.0, 26.0, 25.0, 19.0, 18.0, 7.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006732940673828125, -0.0006482452154159546, -0.0006231963634490967, -0.0005981475114822388, -0.0005730986595153809, -0.000548049807548523, -0.000523000955581665, -0.0004979521036148071, -0.0004729032516479492, -0.0004478543996810913, -0.0004228055477142334, -0.0003977566957473755, -0.0003727078437805176, -0.00034765899181365967, -0.00032261013984680176, -0.00029756128787994385, -0.00027251243591308594, -0.00024746358394622803, -0.00022241473197937012, -0.0001973658800125122, -0.0001723170280456543, -0.0001472681760787964, -0.00012221932411193848, -9.717047214508057e-05, -7.212162017822266e-05, -4.7072768211364746e-05, -2.2023916244506836e-05, 3.0249357223510742e-06, 2.8073787689208984e-05, 5.3122639656066895e-05, 7.81714916229248e-05, 0.00010322034358978271, 0.00012826919555664062, 0.00015331804752349854, 0.00017836689949035645, 0.00020341575145721436, 0.00022846460342407227, 0.0002535134553909302, 0.0002785623073577881, 0.000303611159324646, 0.0003286600112915039, 0.0003537088632583618, 0.0003787577152252197, 0.00040380656719207764, 0.00042885541915893555, 0.00045390427112579346, 0.00047895312309265137, 0.0005040019750595093, 0.0005290508270263672, 0.0005540996789932251, 0.000579148530960083, 0.0006041973829269409, 0.0006292462348937988, 0.0006542950868606567, 0.0006793439388275146, 0.0007043927907943726, 0.0007294416427612305, 0.0007544904947280884, 0.0007795393466949463, 0.0008045881986618042, 0.0008296370506286621, 0.00085468590259552, 0.0008797347545623779, 0.0009047836065292358, 0.0009298324584960938]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 26.0, 24.0, 36.0, 49.0, 60.0, 103.0, 155.0, 228.0, 315.0, 487.0, 802.0, 1391.0, 2262.0, 4103.0, 7155.0, 13721.0, 27192.0, 56831.0, 132686.0, 284589.0, 277865.0, 127116.0, 55081.0, 26162.0, 13188.0, 7107.0, 3941.0, 2298.0, 1318.0, 761.0, 459.0, 310.0, 231.0, 143.0, 97.0, 71.0, 37.0, 42.0, 25.0, 19.0, 8.0, 14.0, 11.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.1314697265625, -10.747314453125, -10.3631591796875, -9.97900390625, -9.5948486328125, -9.210693359375, -8.8265380859375, -8.4423828125, -8.0582275390625, -7.674072265625, -7.2899169921875, -6.90576171875, -6.5216064453125, -6.137451171875, -5.7532958984375, -5.369140625, -4.9849853515625, -4.600830078125, -4.2166748046875, -3.83251953125, -3.4483642578125, -3.064208984375, -2.6800537109375, -2.2958984375, -1.9117431640625, -1.527587890625, -1.1434326171875, -0.75927734375, -0.3751220703125, 0.009033203125, 0.3931884765625, 0.77734375, 1.1614990234375, 1.545654296875, 1.9298095703125, 2.31396484375, 2.6981201171875, 3.082275390625, 3.4664306640625, 3.8505859375, 4.2347412109375, 4.618896484375, 5.0030517578125, 5.38720703125, 5.7713623046875, 6.155517578125, 6.5396728515625, 6.923828125, 7.3079833984375, 7.692138671875, 8.0762939453125, 8.46044921875, 8.8446044921875, 9.228759765625, 9.6129150390625, 9.9970703125, 10.3812255859375, 10.765380859375, 11.1495361328125, 11.53369140625, 11.9178466796875, 12.302001953125, 12.6861572265625, 13.0703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 10.0, 7.0, 8.0, 12.0, 7.0, 16.0, 26.0, 23.0, 18.0, 25.0, 44.0, 59.0, 48.0, 67.0, 85.0, 61.0, 74.0, 84.0, 52.0, 43.0, 30.0, 41.0, 33.0, 17.0, 23.0, 12.0, 16.0, 11.0, 8.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7421875, -3.6197509765625, -3.497314453125, -3.3748779296875, -3.25244140625, -3.1300048828125, -3.007568359375, -2.8851318359375, -2.7626953125, -2.6402587890625, -2.517822265625, -2.3953857421875, -2.27294921875, -2.1505126953125, -2.028076171875, -1.9056396484375, -1.783203125, -1.6607666015625, -1.538330078125, -1.4158935546875, -1.29345703125, -1.1710205078125, -1.048583984375, -0.9261474609375, -0.8037109375, -0.6812744140625, -0.558837890625, -0.4364013671875, -0.31396484375, -0.1915283203125, -0.069091796875, 0.0533447265625, 0.17578125, 0.2982177734375, 0.420654296875, 0.5430908203125, 0.66552734375, 0.7879638671875, 0.910400390625, 1.0328369140625, 1.1552734375, 1.2777099609375, 1.400146484375, 1.5225830078125, 1.64501953125, 1.7674560546875, 1.889892578125, 2.0123291015625, 2.134765625, 2.2572021484375, 2.379638671875, 2.5020751953125, 2.62451171875, 2.7469482421875, 2.869384765625, 2.9918212890625, 3.1142578125, 3.2366943359375, 3.359130859375, 3.4815673828125, 3.60400390625, 3.7264404296875, 3.848876953125, 3.9713134765625, 4.09375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 12.0, 16.0, 13.0, 20.0, 24.0, 33.0, 39.0, 33.0, 57.0, 62.0, 73.0, 64.0, 79.0, 70.0, 71.0, 76.0, 45.0, 31.0, 39.0, 22.0, 17.0, 16.0, 20.0, 12.0, 9.0, 7.0, 6.0, 1.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.1654167175293, -42.00754928588867, -40.84968185424805, -39.69181442260742, -38.53395080566406, -37.37608337402344, -36.21821594238281, -35.06034851074219, -33.90248107910156, -32.74461364746094, -31.586746215820312, -30.42888069152832, -29.271013259887695, -28.11314582824707, -26.955280303955078, -25.797412872314453, -24.639545440673828, -23.481678009033203, -22.323810577392578, -21.165945053100586, -20.00807762145996, -18.850210189819336, -17.692344665527344, -16.53447723388672, -15.376609802246094, -14.218742370605469, -13.06087589263916, -11.903009414672852, -10.745141983032227, -9.587274551391602, -8.429408073425293, -7.271541595458984, -6.113676071166992, -4.955809116363525, -3.7979421615600586, -2.640075206756592, -1.482208251953125, -0.3243412971496582, 0.8335256576538086, 1.9913921356201172, 3.149259567260742, 4.307126522064209, 5.464993476867676, 6.622860431671143, 7.780727386474609, 8.938594818115234, 10.096461296081543, 11.254327774047852, 12.412195205688477, 13.570062637329102, 14.72792911529541, 15.885795593261719, 17.043663024902344, 18.20153045654297, 19.359397888183594, 20.517263412475586, 21.67513084411621, 22.832998275756836, 23.990863800048828, 25.148731231689453, 26.306598663330078, 27.464466094970703, 28.622333526611328, 29.78019905090332, 30.938066482543945]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 7.0, 7.0, 17.0, 12.0, 17.0, 20.0, 21.0, 17.0, 22.0, 17.0, 26.0, 32.0, 35.0, 35.0, 40.0, 31.0, 44.0, 47.0, 29.0, 42.0, 45.0, 39.0, 44.0, 37.0, 33.0, 22.0, 29.0, 28.0, 18.0, 21.0, 20.0, 20.0, 24.0, 13.0, 14.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.629261016845703, -25.817188262939453, -25.005117416381836, -24.193044662475586, -23.380971908569336, -22.56890106201172, -21.75682830810547, -20.94475555419922, -20.13268280029297, -19.32061004638672, -18.5085391998291, -17.69646644592285, -16.8843936920166, -16.072322845458984, -15.260250091552734, -14.448177337646484, -13.636106491088867, -12.824034690856934, -12.011961936950684, -11.19989013671875, -10.3878173828125, -9.575745582580566, -8.763673782348633, -7.951601505279541, -7.139529228210449, -6.327456951141357, -5.515384674072266, -4.703312873840332, -3.8912405967712402, -3.0791683197021484, -2.267096519470215, -1.455024242401123, -0.6429519653320312, 0.169120192527771, 0.9811923503875732, 1.793264389038086, 2.6053366661071777, 3.4174089431762695, 4.229480743408203, 5.041553020477295, 5.853625297546387, 6.6656975746154785, 7.47776985168457, 8.289841651916504, 9.101913452148438, 9.913986206054688, 10.726058006286621, 11.538129806518555, 12.350202560424805, 13.162274360656738, 13.974347114562988, 14.786418914794922, 15.598491668701172, 16.410564422607422, 17.22263526916504, 18.03470802307129, 18.846778869628906, 19.658851623535156, 20.470922470092773, 21.282995223999023, 22.095067977905273, 22.90713882446289, 23.71921157836914, 24.53128433227539, 25.34335708618164]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 7.0, 26.0, 29.0, 46.0, 66.0, 94.0, 103.0, 193.0, 275.0, 418.0, 595.0, 867.0, 1227.0, 1786.0, 2693.0, 3842.0, 5901.0, 8841.0, 13363.0, 20522.0, 31955.0, 49995.0, 79080.0, 121049.0, 167738.0, 172279.0, 128502.0, 84280.0, 53910.0, 34106.0, 21931.0, 14165.0, 9448.0, 6216.0, 4192.0, 2840.0, 1916.0, 1252.0, 872.0, 614.0, 428.0, 273.0, 184.0, 155.0, 73.0, 70.0, 44.0, 27.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-28.625, -27.703857421875, -26.78271484375, -25.861572265625, -24.9404296875, -24.019287109375, -23.09814453125, -22.177001953125, -21.255859375, -20.334716796875, -19.41357421875, -18.492431640625, -17.5712890625, -16.650146484375, -15.72900390625, -14.807861328125, -13.88671875, -12.965576171875, -12.04443359375, -11.123291015625, -10.2021484375, -9.281005859375, -8.35986328125, -7.438720703125, -6.517578125, -5.596435546875, -4.67529296875, -3.754150390625, -2.8330078125, -1.911865234375, -0.99072265625, -0.069580078125, 0.8515625, 1.772705078125, 2.69384765625, 3.614990234375, 4.5361328125, 5.457275390625, 6.37841796875, 7.299560546875, 8.220703125, 9.141845703125, 10.06298828125, 10.984130859375, 11.9052734375, 12.826416015625, 13.74755859375, 14.668701171875, 15.58984375, 16.510986328125, 17.43212890625, 18.353271484375, 19.2744140625, 20.195556640625, 21.11669921875, 22.037841796875, 22.958984375, 23.880126953125, 24.80126953125, 25.722412109375, 26.6435546875, 27.564697265625, 28.48583984375, 29.406982421875, 30.328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 9.0, 8.0, 13.0, 14.0, 18.0, 14.0, 14.0, 16.0, 30.0, 21.0, 28.0, 31.0, 41.0, 35.0, 34.0, 27.0, 43.0, 41.0, 46.0, 30.0, 51.0, 48.0, 32.0, 36.0, 37.0, 29.0, 28.0, 21.0, 24.0, 19.0, 21.0, 23.0, 16.0, 20.0, 13.0, 12.0, 12.0, 11.0, 3.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.84326171875, -25.0146484375, -24.18603515625, -23.357421875, -22.52880859375, -21.7001953125, -20.87158203125, -20.04296875, -19.21435546875, -18.3857421875, -17.55712890625, -16.728515625, -15.89990234375, -15.0712890625, -14.24267578125, -13.4140625, -12.58544921875, -11.7568359375, -10.92822265625, -10.099609375, -9.27099609375, -8.4423828125, -7.61376953125, -6.78515625, -5.95654296875, -5.1279296875, -4.29931640625, -3.470703125, -2.64208984375, -1.8134765625, -0.98486328125, -0.15625, 0.67236328125, 1.5009765625, 2.32958984375, 3.158203125, 3.98681640625, 4.8154296875, 5.64404296875, 6.47265625, 7.30126953125, 8.1298828125, 8.95849609375, 9.787109375, 10.61572265625, 11.4443359375, 12.27294921875, 13.1015625, 13.93017578125, 14.7587890625, 15.58740234375, 16.416015625, 17.24462890625, 18.0732421875, 18.90185546875, 19.73046875, 20.55908203125, 21.3876953125, 22.21630859375, 23.044921875, 23.87353515625, 24.7021484375, 25.53076171875, 26.359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 10.0, 8.0, 18.0, 15.0, 38.0, 42.0, 73.0, 131.0, 223.0, 293.0, 510.0, 806.0, 1214.0, 1953.0, 2997.0, 4762.0, 7716.0, 12501.0, 20206.0, 33788.0, 58153.0, 101080.0, 168514.0, 218334.0, 168854.0, 101090.0, 57975.0, 33532.0, 20255.0, 12409.0, 7718.0, 4829.0, 3123.0, 2021.0, 1237.0, 783.0, 449.0, 351.0, 193.0, 156.0, 73.0, 48.0, 33.0, 20.0, 10.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.53125, -36.37646484375, -35.2216796875, -34.06689453125, -32.912109375, -31.75732421875, -30.6025390625, -29.44775390625, -28.29296875, -27.13818359375, -25.9833984375, -24.82861328125, -23.673828125, -22.51904296875, -21.3642578125, -20.20947265625, -19.0546875, -17.89990234375, -16.7451171875, -15.59033203125, -14.435546875, -13.28076171875, -12.1259765625, -10.97119140625, -9.81640625, -8.66162109375, -7.5068359375, -6.35205078125, -5.197265625, -4.04248046875, -2.8876953125, -1.73291015625, -0.578125, 0.57666015625, 1.7314453125, 2.88623046875, 4.041015625, 5.19580078125, 6.3505859375, 7.50537109375, 8.66015625, 9.81494140625, 10.9697265625, 12.12451171875, 13.279296875, 14.43408203125, 15.5888671875, 16.74365234375, 17.8984375, 19.05322265625, 20.2080078125, 21.36279296875, 22.517578125, 23.67236328125, 24.8271484375, 25.98193359375, 27.13671875, 28.29150390625, 29.4462890625, 30.60107421875, 31.755859375, 32.91064453125, 34.0654296875, 35.22021484375, 36.375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 7.0, 16.0, 21.0, 19.0, 11.0, 18.0, 18.0, 26.0, 23.0, 25.0, 25.0, 42.0, 26.0, 41.0, 39.0, 35.0, 47.0, 36.0, 38.0, 46.0, 43.0, 28.0, 37.0, 35.0, 39.0, 29.0, 32.0, 29.0, 12.0, 16.0, 20.0, 20.0, 14.0, 9.0, 15.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.75, -17.2158203125, -16.681640625, -16.1474609375, -15.61328125, -15.0791015625, -14.544921875, -14.0107421875, -13.4765625, -12.9423828125, -12.408203125, -11.8740234375, -11.33984375, -10.8056640625, -10.271484375, -9.7373046875, -9.203125, -8.6689453125, -8.134765625, -7.6005859375, -7.06640625, -6.5322265625, -5.998046875, -5.4638671875, -4.9296875, -4.3955078125, -3.861328125, -3.3271484375, -2.79296875, -2.2587890625, -1.724609375, -1.1904296875, -0.65625, -0.1220703125, 0.412109375, 0.9462890625, 1.48046875, 2.0146484375, 2.548828125, 3.0830078125, 3.6171875, 4.1513671875, 4.685546875, 5.2197265625, 5.75390625, 6.2880859375, 6.822265625, 7.3564453125, 7.890625, 8.4248046875, 8.958984375, 9.4931640625, 10.02734375, 10.5615234375, 11.095703125, 11.6298828125, 12.1640625, 12.6982421875, 13.232421875, 13.7666015625, 14.30078125, 14.8349609375, 15.369140625, 15.9033203125, 16.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 15.0, 15.0, 29.0, 30.0, 48.0, 65.0, 105.0, 156.0, 208.0, 327.0, 494.0, 727.0, 1156.0, 1781.0, 2919.0, 4789.0, 7852.0, 13825.0, 25051.0, 46071.0, 89734.0, 172152.0, 259253.0, 196347.0, 103955.0, 53728.0, 28562.0, 15783.0, 9036.0, 5321.0, 3257.0, 2043.0, 1243.0, 818.0, 540.0, 357.0, 228.0, 157.0, 107.0, 78.0, 46.0, 42.0, 29.0, 19.0, 16.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-13.296875, -12.88916015625, -12.4814453125, -12.07373046875, -11.666015625, -11.25830078125, -10.8505859375, -10.44287109375, -10.03515625, -9.62744140625, -9.2197265625, -8.81201171875, -8.404296875, -7.99658203125, -7.5888671875, -7.18115234375, -6.7734375, -6.36572265625, -5.9580078125, -5.55029296875, -5.142578125, -4.73486328125, -4.3271484375, -3.91943359375, -3.51171875, -3.10400390625, -2.6962890625, -2.28857421875, -1.880859375, -1.47314453125, -1.0654296875, -0.65771484375, -0.25, 0.15771484375, 0.5654296875, 0.97314453125, 1.380859375, 1.78857421875, 2.1962890625, 2.60400390625, 3.01171875, 3.41943359375, 3.8271484375, 4.23486328125, 4.642578125, 5.05029296875, 5.4580078125, 5.86572265625, 6.2734375, 6.68115234375, 7.0888671875, 7.49658203125, 7.904296875, 8.31201171875, 8.7197265625, 9.12744140625, 9.53515625, 9.94287109375, 10.3505859375, 10.75830078125, 11.166015625, 11.57373046875, 11.9814453125, 12.38916015625, 12.796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 9.0, 10.0, 12.0, 12.0, 15.0, 25.0, 37.0, 52.0, 88.0, 96.0, 128.0, 113.0, 112.0, 87.0, 59.0, 45.0, 27.0, 18.0, 18.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017309188842773438, -0.0016647130250930786, -0.0015985071659088135, -0.0015323013067245483, -0.0014660954475402832, -0.001399889588356018, -0.001333683729171753, -0.0012674778699874878, -0.0012012720108032227, -0.0011350661516189575, -0.0010688602924346924, -0.0010026544332504272, -0.0009364485740661621, -0.000870242714881897, -0.0008040368556976318, -0.0007378309965133667, -0.0006716251373291016, -0.0006054192781448364, -0.0005392134189605713, -0.00047300755977630615, -0.000406801700592041, -0.0003405958414077759, -0.00027438998222351074, -0.0002081841230392456, -0.00014197826385498047, -7.577240467071533e-05, -9.566545486450195e-06, 5.663931369781494e-05, 0.00012284517288208008, 0.00018905103206634521, 0.00025525689125061035, 0.0003214627504348755, 0.0003876686096191406, 0.00045387446880340576, 0.0005200803279876709, 0.000586286187171936, 0.0006524920463562012, 0.0007186979055404663, 0.0007849037647247314, 0.0008511096239089966, 0.0009173154830932617, 0.0009835213422775269, 0.001049727201461792, 0.0011159330606460571, 0.0011821389198303223, 0.0012483447790145874, 0.0013145506381988525, 0.0013807564973831177, 0.0014469623565673828, 0.001513168215751648, 0.001579374074935913, 0.0016455799341201782, 0.0017117857933044434, 0.0017779916524887085, 0.0018441975116729736, 0.0019104033708572388, 0.001976609230041504, 0.002042815089225769, 0.002109020948410034, 0.0021752268075942993, 0.0022414326667785645, 0.0023076385259628296, 0.0023738443851470947, 0.00244005024433136, 0.002506256103515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 16.0, 20.0, 32.0, 45.0, 55.0, 71.0, 96.0, 143.0, 188.0, 267.0, 403.0, 527.0, 760.0, 1043.0, 1682.0, 2420.0, 3479.0, 5413.0, 8295.0, 13206.0, 21171.0, 35188.0, 58665.0, 99786.0, 165383.0, 215301.0, 163863.0, 99056.0, 58414.0, 34835.0, 21127.0, 13155.0, 8088.0, 5241.0, 3455.0, 2332.0, 1590.0, 1065.0, 795.0, 548.0, 359.0, 269.0, 198.0, 138.0, 106.0, 75.0, 62.0, 33.0, 28.0, 23.0, 13.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-10.8515625, -10.5069580078125, -10.162353515625, -9.8177490234375, -9.47314453125, -9.1285400390625, -8.783935546875, -8.4393310546875, -8.0947265625, -7.7501220703125, -7.405517578125, -7.0609130859375, -6.71630859375, -6.3717041015625, -6.027099609375, -5.6824951171875, -5.337890625, -4.9932861328125, -4.648681640625, -4.3040771484375, -3.95947265625, -3.6148681640625, -3.270263671875, -2.9256591796875, -2.5810546875, -2.2364501953125, -1.891845703125, -1.5472412109375, -1.20263671875, -0.8580322265625, -0.513427734375, -0.1688232421875, 0.17578125, 0.5203857421875, 0.864990234375, 1.2095947265625, 1.55419921875, 1.8988037109375, 2.243408203125, 2.5880126953125, 2.9326171875, 3.2772216796875, 3.621826171875, 3.9664306640625, 4.31103515625, 4.6556396484375, 5.000244140625, 5.3448486328125, 5.689453125, 6.0340576171875, 6.378662109375, 6.7232666015625, 7.06787109375, 7.4124755859375, 7.757080078125, 8.1016845703125, 8.4462890625, 8.7908935546875, 9.135498046875, 9.4801025390625, 9.82470703125, 10.1693115234375, 10.513916015625, 10.8585205078125, 11.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 13.0, 14.0, 14.0, 22.0, 25.0, 36.0, 31.0, 25.0, 44.0, 44.0, 45.0, 71.0, 72.0, 70.0, 54.0, 50.0, 56.0, 48.0, 29.0, 35.0, 39.0, 23.0, 26.0, 18.0, 12.0, 12.0, 6.0, 2.0, 5.0, 4.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.0289306640625, -3.885986328125, -3.7430419921875, -3.60009765625, -3.4571533203125, -3.314208984375, -3.1712646484375, -3.0283203125, -2.8853759765625, -2.742431640625, -2.5994873046875, -2.45654296875, -2.3135986328125, -2.170654296875, -2.0277099609375, -1.884765625, -1.7418212890625, -1.598876953125, -1.4559326171875, -1.31298828125, -1.1700439453125, -1.027099609375, -0.8841552734375, -0.7412109375, -0.5982666015625, -0.455322265625, -0.3123779296875, -0.16943359375, -0.0264892578125, 0.116455078125, 0.2593994140625, 0.40234375, 0.5452880859375, 0.688232421875, 0.8311767578125, 0.97412109375, 1.1170654296875, 1.260009765625, 1.4029541015625, 1.5458984375, 1.6888427734375, 1.831787109375, 1.9747314453125, 2.11767578125, 2.2606201171875, 2.403564453125, 2.5465087890625, 2.689453125, 2.8323974609375, 2.975341796875, 3.1182861328125, 3.26123046875, 3.4041748046875, 3.547119140625, 3.6900634765625, 3.8330078125, 3.9759521484375, 4.118896484375, 4.2618408203125, 4.40478515625, 4.5477294921875, 4.690673828125, 4.8336181640625, 4.9765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 9.0, 10.0, 12.0, 23.0, 14.0, 33.0, 25.0, 34.0, 52.0, 52.0, 51.0, 69.0, 80.0, 69.0, 71.0, 63.0, 56.0, 50.0, 37.0, 38.0, 32.0, 24.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.26683807373047, -42.10720443725586, -40.947574615478516, -39.787940979003906, -38.62831115722656, -37.46867752075195, -36.30904769897461, -35.1494140625, -33.989784240722656, -32.83015060424805, -31.670520782470703, -30.510889053344727, -29.35125732421875, -28.19162368774414, -27.031991958618164, -25.872360229492188, -24.712726593017578, -23.5530948638916, -22.393463134765625, -21.23383140563965, -20.074199676513672, -18.914566040039062, -17.754934310913086, -16.59530258178711, -15.435670852661133, -14.276039123535156, -13.11640739440918, -11.956774711608887, -10.79714298248291, -9.637511253356934, -8.47787857055664, -7.318246841430664, -6.158613204956055, -4.998981475830078, -3.8393492698669434, -2.6797173023223877, -1.520085334777832, -0.36045360565185547, 0.7991786003112793, 1.958810806274414, 3.1184425354003906, 4.278074264526367, 5.437706470489502, 6.597338676452637, 7.756970405578613, 8.91660213470459, 10.076234817504883, 11.23586654663086, 12.395498275756836, 13.555130004882812, 14.714761734008789, 15.874394416809082, 17.034027099609375, 18.19365692138672, 19.353290557861328, 20.512922286987305, 21.67255401611328, 22.832185745239258, 23.991817474365234, 25.15144920349121, 26.311080932617188, 27.470714569091797, 28.630346298217773, 29.78997802734375, 30.949609756469727]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 7.0, 15.0, 15.0, 12.0, 13.0, 27.0, 22.0, 25.0, 26.0, 19.0, 32.0, 35.0, 33.0, 39.0, 49.0, 41.0, 45.0, 39.0, 50.0, 49.0, 36.0, 39.0, 28.0, 31.0, 32.0, 22.0, 32.0, 21.0, 23.0, 24.0, 15.0, 21.0, 14.0, 10.0, 5.0, 10.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-29.358545303344727, -28.471513748168945, -27.584484100341797, -26.697452545166016, -25.810420989990234, -24.923389434814453, -24.036357879638672, -23.149328231811523, -22.262296676635742, -21.37526512145996, -20.488235473632812, -19.60120391845703, -18.71417236328125, -17.82714080810547, -16.940109252929688, -16.05307960510254, -15.166048049926758, -14.279016494750977, -13.391985893249512, -12.504955291748047, -11.617923736572266, -10.730892181396484, -9.84386157989502, -8.956830978393555, -8.069799423217773, -7.18276834487915, -6.295737266540527, -5.408706188201904, -4.521675109863281, -3.634644031524658, -2.747612953186035, -1.860581874847412, -0.9735527038574219, -0.08652162551879883, 0.8005094528198242, 1.6875405311584473, 2.5745716094970703, 3.4616026878356934, 4.348633766174316, 5.2356648445129395, 6.1226959228515625, 7.0097270011901855, 7.896758079528809, 8.783788681030273, 9.670820236206055, 10.557851791381836, 11.4448823928833, 12.331912994384766, 13.218944549560547, 14.105976104736328, 14.993006706237793, 15.880037307739258, 16.76706886291504, 17.65410041809082, 18.54113006591797, 19.42816162109375, 20.31519317626953, 21.202224731445312, 22.089256286621094, 22.976285934448242, 23.863317489624023, 24.750349044799805, 25.637378692626953, 26.524410247802734, 27.411441802978516]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 17.0, 27.0, 44.0, 49.0, 80.0, 122.0, 136.0, 221.0, 345.0, 466.0, 804.0, 1178.0, 1860.0, 3111.0, 5185.0, 8839.0, 15820.0, 30271.0, 62163.0, 154929.0, 539737.0, 1535579.0, 1229159.0, 379015.0, 117786.0, 50151.0, 24996.0, 13398.0, 7456.0, 4337.0, 2628.0, 1590.0, 986.0, 628.0, 387.0, 255.0, 175.0, 120.0, 64.0, 57.0, 34.0, 26.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-49.65625, -48.30908203125, -46.9619140625, -45.61474609375, -44.267578125, -42.92041015625, -41.5732421875, -40.22607421875, -38.87890625, -37.53173828125, -36.1845703125, -34.83740234375, -33.490234375, -32.14306640625, -30.7958984375, -29.44873046875, -28.1015625, -26.75439453125, -25.4072265625, -24.06005859375, -22.712890625, -21.36572265625, -20.0185546875, -18.67138671875, -17.32421875, -15.97705078125, -14.6298828125, -13.28271484375, -11.935546875, -10.58837890625, -9.2412109375, -7.89404296875, -6.546875, -5.19970703125, -3.8525390625, -2.50537109375, -1.158203125, 0.18896484375, 1.5361328125, 2.88330078125, 4.23046875, 5.57763671875, 6.9248046875, 8.27197265625, 9.619140625, 10.96630859375, 12.3134765625, 13.66064453125, 15.0078125, 16.35498046875, 17.7021484375, 19.04931640625, 20.396484375, 21.74365234375, 23.0908203125, 24.43798828125, 25.78515625, 27.13232421875, 28.4794921875, 29.82666015625, 31.173828125, 32.52099609375, 33.8681640625, 35.21533203125, 36.5625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 6.0, 13.0, 15.0, 14.0, 13.0, 19.0, 21.0, 27.0, 29.0, 18.0, 29.0, 36.0, 40.0, 38.0, 37.0, 35.0, 49.0, 48.0, 49.0, 52.0, 43.0, 48.0, 36.0, 28.0, 31.0, 23.0, 21.0, 26.0, 26.0, 16.0, 17.0, 20.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.84375, -25.05224609375, -24.2607421875, -23.46923828125, -22.677734375, -21.88623046875, -21.0947265625, -20.30322265625, -19.51171875, -18.72021484375, -17.9287109375, -17.13720703125, -16.345703125, -15.55419921875, -14.7626953125, -13.97119140625, -13.1796875, -12.38818359375, -11.5966796875, -10.80517578125, -10.013671875, -9.22216796875, -8.4306640625, -7.63916015625, -6.84765625, -6.05615234375, -5.2646484375, -4.47314453125, -3.681640625, -2.89013671875, -2.0986328125, -1.30712890625, -0.515625, 0.27587890625, 1.0673828125, 1.85888671875, 2.650390625, 3.44189453125, 4.2333984375, 5.02490234375, 5.81640625, 6.60791015625, 7.3994140625, 8.19091796875, 8.982421875, 9.77392578125, 10.5654296875, 11.35693359375, 12.1484375, 12.93994140625, 13.7314453125, 14.52294921875, 15.314453125, 16.10595703125, 16.8974609375, 17.68896484375, 18.48046875, 19.27197265625, 20.0634765625, 20.85498046875, 21.646484375, 22.43798828125, 23.2294921875, 24.02099609375, 24.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 9.0, 10.0, 12.0, 14.0, 21.0, 38.0, 55.0, 68.0, 102.0, 154.0, 227.0, 343.0, 557.0, 834.0, 1308.0, 1975.0, 3129.0, 5135.0, 8686.0, 14954.0, 26342.0, 49705.0, 98836.0, 216866.0, 547488.0, 1462841.0, 1051277.0, 377911.0, 159083.0, 75207.0, 38878.0, 21143.0, 12090.0, 7223.0, 4312.0, 2631.0, 1649.0, 1104.0, 711.0, 437.0, 352.0, 192.0, 128.0, 98.0, 43.0, 42.0, 21.0, 24.0, 10.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.46875, -39.1552734375, -37.841796875, -36.5283203125, -35.21484375, -33.9013671875, -32.587890625, -31.2744140625, -29.9609375, -28.6474609375, -27.333984375, -26.0205078125, -24.70703125, -23.3935546875, -22.080078125, -20.7666015625, -19.453125, -18.1396484375, -16.826171875, -15.5126953125, -14.19921875, -12.8857421875, -11.572265625, -10.2587890625, -8.9453125, -7.6318359375, -6.318359375, -5.0048828125, -3.69140625, -2.3779296875, -1.064453125, 0.2490234375, 1.5625, 2.8759765625, 4.189453125, 5.5029296875, 6.81640625, 8.1298828125, 9.443359375, 10.7568359375, 12.0703125, 13.3837890625, 14.697265625, 16.0107421875, 17.32421875, 18.6376953125, 19.951171875, 21.2646484375, 22.578125, 23.8916015625, 25.205078125, 26.5185546875, 27.83203125, 29.1455078125, 30.458984375, 31.7724609375, 33.0859375, 34.3994140625, 35.712890625, 37.0263671875, 38.33984375, 39.6533203125, 40.966796875, 42.2802734375, 43.59375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 14.0, 11.0, 17.0, 17.0, 23.0, 43.0, 51.0, 58.0, 56.0, 94.0, 112.0, 165.0, 217.0, 251.0, 324.0, 411.0, 439.0, 369.0, 310.0, 258.0, 183.0, 139.0, 119.0, 91.0, 60.0, 56.0, 41.0, 26.0, 26.0, 12.0, 18.0, 4.0, 9.0, 6.0, 9.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.2232666015625, -12.774658203125, -12.3260498046875, -11.87744140625, -11.4288330078125, -10.980224609375, -10.5316162109375, -10.0830078125, -9.6343994140625, -9.185791015625, -8.7371826171875, -8.28857421875, -7.8399658203125, -7.391357421875, -6.9427490234375, -6.494140625, -6.0455322265625, -5.596923828125, -5.1483154296875, -4.69970703125, -4.2510986328125, -3.802490234375, -3.3538818359375, -2.9052734375, -2.4566650390625, -2.008056640625, -1.5594482421875, -1.11083984375, -0.6622314453125, -0.213623046875, 0.2349853515625, 0.68359375, 1.1322021484375, 1.580810546875, 2.0294189453125, 2.47802734375, 2.9266357421875, 3.375244140625, 3.8238525390625, 4.2724609375, 4.7210693359375, 5.169677734375, 5.6182861328125, 6.06689453125, 6.5155029296875, 6.964111328125, 7.4127197265625, 7.861328125, 8.3099365234375, 8.758544921875, 9.2071533203125, 9.65576171875, 10.1043701171875, 10.552978515625, 11.0015869140625, 11.4501953125, 11.8988037109375, 12.347412109375, 12.7960205078125, 13.24462890625, 13.6932373046875, 14.141845703125, 14.5904541015625, 15.0390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 10.0, 20.0, 22.0, 15.0, 34.0, 47.0, 37.0, 35.0, 70.0, 61.0, 78.0, 71.0, 83.0, 68.0, 68.0, 56.0, 43.0, 35.0, 27.0, 20.0, 18.0, 17.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.255611419677734, -37.085819244384766, -35.91602325439453, -34.74623107910156, -33.57643508911133, -32.40664291381836, -31.236846923828125, -30.067054748535156, -28.897258758544922, -27.72746467590332, -26.55767059326172, -25.387876510620117, -24.218082427978516, -23.048288345336914, -21.878494262695312, -20.708702087402344, -19.538908004760742, -18.36911392211914, -17.19931983947754, -16.029525756835938, -14.859731674194336, -13.689937591552734, -12.52014446258545, -11.350350379943848, -10.180556297302246, -9.010762214660645, -7.840968132019043, -6.6711745262146, -5.501380443572998, -4.3315863609313965, -3.161792755126953, -1.9919986724853516, -0.82220458984375, 0.347589373588562, 1.517383337020874, 2.6871771812438965, 3.856971263885498, 5.0267653465271, 6.196558952331543, 7.3663530349731445, 8.536147117614746, 9.705941200256348, 10.87573528289795, 12.045528411865234, 13.215322494506836, 14.385116577148438, 15.554910659790039, 16.72470474243164, 17.894498825073242, 19.064292907714844, 20.234086990356445, 21.403881072998047, 22.57367515563965, 23.74346923828125, 24.91326141357422, 26.083057403564453, 27.252849578857422, 28.422643661499023, 29.592437744140625, 30.762231826782227, 31.932025909423828, 33.1018180847168, 34.27161407470703, 35.44140625, 36.611202239990234]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 9.0, 18.0, 14.0, 13.0, 23.0, 15.0, 18.0, 28.0, 28.0, 33.0, 25.0, 24.0, 40.0, 31.0, 42.0, 36.0, 35.0, 44.0, 39.0, 44.0, 35.0, 45.0, 43.0, 43.0, 40.0, 27.0, 15.0, 20.0, 36.0, 21.0, 13.0, 14.0, 11.0, 13.0, 11.0, 9.0, 4.0, 4.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.972131729125977, -27.14262580871582, -26.31311798095703, -25.483612060546875, -24.65410614013672, -23.82459831237793, -22.995092391967773, -22.165584564208984, -21.336078643798828, -20.506572723388672, -19.677064895629883, -18.847558975219727, -18.018051147460938, -17.18854522705078, -16.359039306640625, -15.529532432556152, -14.70002555847168, -13.870518684387207, -13.041011810302734, -12.211505889892578, -11.381999015808105, -10.552492141723633, -9.722986221313477, -8.893479347229004, -8.063972473144531, -7.234465599060059, -6.404959201812744, -5.57545280456543, -4.745945930480957, -3.9164390563964844, -3.08693265914917, -2.2574262619018555, -1.4279193878173828, -0.5984127521514893, 0.2310938835144043, 1.0606005191802979, 1.8901071548461914, 2.719614028930664, 3.5491204261779785, 4.378626823425293, 5.208133697509766, 6.037640571594238, 6.867146968841553, 7.696653366088867, 8.52616024017334, 9.355667114257812, 10.185173034667969, 11.014679908752441, 11.844186782836914, 12.673693656921387, 13.50320053100586, 14.332706451416016, 15.162213325500488, 15.991720199584961, 16.821226119995117, 17.650733947753906, 18.480239868164062, 19.30974578857422, 20.139253616333008, 20.968759536743164, 21.798267364501953, 22.62777328491211, 23.457279205322266, 24.286785125732422, 25.11629295349121]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 13.0, 11.0, 40.0, 57.0, 71.0, 112.0, 148.0, 282.0, 403.0, 660.0, 978.0, 1592.0, 2518.0, 3827.0, 6479.0, 10157.0, 17138.0, 29844.0, 54302.0, 104605.0, 210993.0, 273010.0, 154197.0, 76789.0, 41323.0, 23243.0, 13595.0, 8291.0, 5007.0, 3311.0, 2010.0, 1297.0, 789.0, 504.0, 323.0, 213.0, 137.0, 87.0, 62.0, 42.0, 24.0, 23.0, 15.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.4443359375, -22.669921875, -21.8955078125, -21.12109375, -20.3466796875, -19.572265625, -18.7978515625, -18.0234375, -17.2490234375, -16.474609375, -15.7001953125, -14.92578125, -14.1513671875, -13.376953125, -12.6025390625, -11.828125, -11.0537109375, -10.279296875, -9.5048828125, -8.73046875, -7.9560546875, -7.181640625, -6.4072265625, -5.6328125, -4.8583984375, -4.083984375, -3.3095703125, -2.53515625, -1.7607421875, -0.986328125, -0.2119140625, 0.5625, 1.3369140625, 2.111328125, 2.8857421875, 3.66015625, 4.4345703125, 5.208984375, 5.9833984375, 6.7578125, 7.5322265625, 8.306640625, 9.0810546875, 9.85546875, 10.6298828125, 11.404296875, 12.1787109375, 12.953125, 13.7275390625, 14.501953125, 15.2763671875, 16.05078125, 16.8251953125, 17.599609375, 18.3740234375, 19.1484375, 19.9228515625, 20.697265625, 21.4716796875, 22.24609375, 23.0205078125, 23.794921875, 24.5693359375, 25.34375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 11.0, 22.0, 20.0, 16.0, 22.0, 26.0, 21.0, 24.0, 30.0, 41.0, 30.0, 35.0, 51.0, 36.0, 54.0, 46.0, 52.0, 42.0, 34.0, 55.0, 45.0, 33.0, 33.0, 19.0, 19.0, 29.0, 26.0, 17.0, 16.0, 9.0, 10.0, 12.0, 6.0, 2.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.03125, -29.1220703125, -28.212890625, -27.3037109375, -26.39453125, -25.4853515625, -24.576171875, -23.6669921875, -22.7578125, -21.8486328125, -20.939453125, -20.0302734375, -19.12109375, -18.2119140625, -17.302734375, -16.3935546875, -15.484375, -14.5751953125, -13.666015625, -12.7568359375, -11.84765625, -10.9384765625, -10.029296875, -9.1201171875, -8.2109375, -7.3017578125, -6.392578125, -5.4833984375, -4.57421875, -3.6650390625, -2.755859375, -1.8466796875, -0.9375, -0.0283203125, 0.880859375, 1.7900390625, 2.69921875, 3.6083984375, 4.517578125, 5.4267578125, 6.3359375, 7.2451171875, 8.154296875, 9.0634765625, 9.97265625, 10.8818359375, 11.791015625, 12.7001953125, 13.609375, 14.5185546875, 15.427734375, 16.3369140625, 17.24609375, 18.1552734375, 19.064453125, 19.9736328125, 20.8828125, 21.7919921875, 22.701171875, 23.6103515625, 24.51953125, 25.4287109375, 26.337890625, 27.2470703125, 28.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 13.0, 8.0, 13.0, 20.0, 31.0, 28.0, 53.0, 81.0, 90.0, 152.0, 198.0, 325.0, 455.0, 632.0, 959.0, 1420.0, 2204.0, 3270.0, 5262.0, 8152.0, 13313.0, 22071.0, 39399.0, 74392.0, 155012.0, 302880.0, 205408.0, 94305.0, 48727.0, 26908.0, 15764.0, 9438.0, 5960.0, 3918.0, 2451.0, 1656.0, 1114.0, 810.0, 521.0, 376.0, 211.0, 150.0, 135.0, 88.0, 62.0, 34.0, 24.0, 24.0, 9.0, 10.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-28.65625, -27.75146484375, -26.8466796875, -25.94189453125, -25.037109375, -24.13232421875, -23.2275390625, -22.32275390625, -21.41796875, -20.51318359375, -19.6083984375, -18.70361328125, -17.798828125, -16.89404296875, -15.9892578125, -15.08447265625, -14.1796875, -13.27490234375, -12.3701171875, -11.46533203125, -10.560546875, -9.65576171875, -8.7509765625, -7.84619140625, -6.94140625, -6.03662109375, -5.1318359375, -4.22705078125, -3.322265625, -2.41748046875, -1.5126953125, -0.60791015625, 0.296875, 1.20166015625, 2.1064453125, 3.01123046875, 3.916015625, 4.82080078125, 5.7255859375, 6.63037109375, 7.53515625, 8.43994140625, 9.3447265625, 10.24951171875, 11.154296875, 12.05908203125, 12.9638671875, 13.86865234375, 14.7734375, 15.67822265625, 16.5830078125, 17.48779296875, 18.392578125, 19.29736328125, 20.2021484375, 21.10693359375, 22.01171875, 22.91650390625, 23.8212890625, 24.72607421875, 25.630859375, 26.53564453125, 27.4404296875, 28.34521484375, 29.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 10.0, 4.0, 12.0, 9.0, 16.0, 18.0, 15.0, 13.0, 23.0, 25.0, 19.0, 26.0, 33.0, 28.0, 26.0, 38.0, 31.0, 30.0, 41.0, 34.0, 44.0, 41.0, 42.0, 39.0, 34.0, 31.0, 35.0, 32.0, 33.0, 34.0, 24.0, 27.0, 19.0, 19.0, 19.0, 10.0, 11.0, 5.0, 14.0, 6.0, 3.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.65625, -14.1484375, -13.640625, -13.1328125, -12.625, -12.1171875, -11.609375, -11.1015625, -10.59375, -10.0859375, -9.578125, -9.0703125, -8.5625, -8.0546875, -7.546875, -7.0390625, -6.53125, -6.0234375, -5.515625, -5.0078125, -4.5, -3.9921875, -3.484375, -2.9765625, -2.46875, -1.9609375, -1.453125, -0.9453125, -0.4375, 0.0703125, 0.578125, 1.0859375, 1.59375, 2.1015625, 2.609375, 3.1171875, 3.625, 4.1328125, 4.640625, 5.1484375, 5.65625, 6.1640625, 6.671875, 7.1796875, 7.6875, 8.1953125, 8.703125, 9.2109375, 9.71875, 10.2265625, 10.734375, 11.2421875, 11.75, 12.2578125, 12.765625, 13.2734375, 13.78125, 14.2890625, 14.796875, 15.3046875, 15.8125, 16.3203125, 16.828125, 17.3359375, 17.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 8.0, 11.0, 24.0, 20.0, 41.0, 68.0, 82.0, 117.0, 197.0, 335.0, 528.0, 909.0, 1559.0, 3005.0, 5702.0, 11659.0, 25370.0, 62858.0, 182163.0, 431196.0, 201097.0, 68036.0, 27710.0, 12551.0, 5988.0, 3102.0, 1697.0, 1001.0, 534.0, 340.0, 224.0, 138.0, 76.0, 56.0, 42.0, 27.0, 33.0, 15.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.70703125, -11.296875, -10.88671875, -10.4765625, -10.06640625, -9.65625, -9.24609375, -8.8359375, -8.42578125, -8.015625, -7.60546875, -7.1953125, -6.78515625, -6.375, -5.96484375, -5.5546875, -5.14453125, -4.734375, -4.32421875, -3.9140625, -3.50390625, -3.09375, -2.68359375, -2.2734375, -1.86328125, -1.453125, -1.04296875, -0.6328125, -0.22265625, 0.1875, 0.59765625, 1.0078125, 1.41796875, 1.828125, 2.23828125, 2.6484375, 3.05859375, 3.46875, 3.87890625, 4.2890625, 4.69921875, 5.109375, 5.51953125, 5.9296875, 6.33984375, 6.75, 7.16015625, 7.5703125, 7.98046875, 8.390625, 8.80078125, 9.2109375, 9.62109375, 10.03125, 10.44140625, 10.8515625, 11.26171875, 11.671875, 12.08203125, 12.4921875, 12.90234375, 13.3125, 13.72265625, 14.1328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 23.0, 41.0, 36.0, 37.0, 66.0, 86.0, 108.0, 89.0, 115.0, 93.0, 50.0, 50.0, 44.0, 35.0, 18.0, 14.0, 20.0, 8.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013818740844726562, -0.0013416856527328491, -0.001301497220993042, -0.0012613087892532349, -0.0012211203575134277, -0.0011809319257736206, -0.0011407434940338135, -0.0011005550622940063, -0.0010603666305541992, -0.001020178198814392, -0.000979989767074585, -0.0009398013353347778, -0.0008996129035949707, -0.0008594244718551636, -0.0008192360401153564, -0.0007790476083755493, -0.0007388591766357422, -0.0006986707448959351, -0.0006584823131561279, -0.0006182938814163208, -0.0005781054496765137, -0.0005379170179367065, -0.0004977285861968994, -0.0004575401544570923, -0.00041735172271728516, -0.00037716329097747803, -0.0003369748592376709, -0.00029678642749786377, -0.00025659799575805664, -0.0002164095640182495, -0.00017622113227844238, -0.00013603270053863525, -9.584426879882812e-05, -5.5655837059020996e-05, -1.5467405319213867e-05, 2.4721026420593262e-05, 6.490945816040039e-05, 0.00010509788990020752, 0.00014528632164001465, 0.00018547475337982178, 0.0002256631851196289, 0.00026585161685943604, 0.00030604004859924316, 0.0003462284803390503, 0.0003864169120788574, 0.00042660534381866455, 0.0004667937755584717, 0.0005069822072982788, 0.0005471706390380859, 0.0005873590707778931, 0.0006275475025177002, 0.0006677359342575073, 0.0007079243659973145, 0.0007481127977371216, 0.0007883012294769287, 0.0008284896612167358, 0.000868678092956543, 0.0009088665246963501, 0.0009490549564361572, 0.0009892433881759644, 0.0010294318199157715, 0.0010696202516555786, 0.0011098086833953857, 0.0011499971151351929, 0.001190185546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 16.0, 26.0, 37.0, 40.0, 74.0, 90.0, 161.0, 207.0, 311.0, 472.0, 739.0, 1183.0, 1844.0, 3029.0, 5032.0, 8606.0, 14913.0, 26812.0, 50837.0, 101220.0, 211750.0, 290174.0, 161745.0, 77637.0, 39747.0, 21536.0, 12099.0, 7020.0, 4257.0, 2455.0, 1576.0, 969.0, 662.0, 412.0, 260.0, 186.0, 110.0, 80.0, 62.0, 40.0, 25.0, 17.0, 15.0, 12.0, 9.0, 5.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5703125, -10.209716796875, -9.84912109375, -9.488525390625, -9.1279296875, -8.767333984375, -8.40673828125, -8.046142578125, -7.685546875, -7.324951171875, -6.96435546875, -6.603759765625, -6.2431640625, -5.882568359375, -5.52197265625, -5.161376953125, -4.80078125, -4.440185546875, -4.07958984375, -3.718994140625, -3.3583984375, -2.997802734375, -2.63720703125, -2.276611328125, -1.916015625, -1.555419921875, -1.19482421875, -0.834228515625, -0.4736328125, -0.113037109375, 0.24755859375, 0.608154296875, 0.96875, 1.329345703125, 1.68994140625, 2.050537109375, 2.4111328125, 2.771728515625, 3.13232421875, 3.492919921875, 3.853515625, 4.214111328125, 4.57470703125, 4.935302734375, 5.2958984375, 5.656494140625, 6.01708984375, 6.377685546875, 6.73828125, 7.098876953125, 7.45947265625, 7.820068359375, 8.1806640625, 8.541259765625, 8.90185546875, 9.262451171875, 9.623046875, 9.983642578125, 10.34423828125, 10.704833984375, 11.0654296875, 11.426025390625, 11.78662109375, 12.147216796875, 12.5078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 8.0, 1.0, 7.0, 7.0, 9.0, 10.0, 15.0, 21.0, 29.0, 29.0, 27.0, 38.0, 46.0, 50.0, 67.0, 61.0, 79.0, 60.0, 64.0, 55.0, 61.0, 52.0, 44.0, 37.0, 27.0, 16.0, 17.0, 21.0, 12.0, 10.0, 7.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.131256103515625, -3.01446533203125, -2.897674560546875, -2.7808837890625, -2.664093017578125, -2.54730224609375, -2.430511474609375, -2.313720703125, -2.196929931640625, -2.08013916015625, -1.963348388671875, -1.8465576171875, -1.729766845703125, -1.61297607421875, -1.496185302734375, -1.37939453125, -1.262603759765625, -1.14581298828125, -1.029022216796875, -0.9122314453125, -0.795440673828125, -0.67864990234375, -0.561859130859375, -0.445068359375, -0.328277587890625, -0.21148681640625, -0.094696044921875, 0.0220947265625, 0.138885498046875, 0.25567626953125, 0.372467041015625, 0.4892578125, 0.606048583984375, 0.72283935546875, 0.839630126953125, 0.9564208984375, 1.073211669921875, 1.19000244140625, 1.306793212890625, 1.423583984375, 1.540374755859375, 1.65716552734375, 1.773956298828125, 1.8907470703125, 2.007537841796875, 2.12432861328125, 2.241119384765625, 2.35791015625, 2.474700927734375, 2.59149169921875, 2.708282470703125, 2.8250732421875, 2.941864013671875, 3.05865478515625, 3.175445556640625, 3.292236328125, 3.409027099609375, 3.52581787109375, 3.642608642578125, 3.7593994140625, 3.876190185546875, 3.99298095703125, 4.109771728515625, 4.2265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 12.0, 13.0, 14.0, 19.0, 22.0, 24.0, 32.0, 39.0, 55.0, 54.0, 59.0, 75.0, 83.0, 86.0, 63.0, 61.0, 52.0, 43.0, 40.0, 30.0, 22.0, 19.0, 14.0, 24.0, 16.0, 10.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.25048828125, -36.11517333984375, -34.9798583984375, -33.84454345703125, -32.709228515625, -31.573911666870117, -30.438594818115234, -29.303279876708984, -28.167964935302734, -27.032649993896484, -25.897335052490234, -24.76201820373535, -23.6267032623291, -22.49138832092285, -21.35607147216797, -20.22075653076172, -19.08544158935547, -17.95012664794922, -16.81481170654297, -15.679494857788086, -14.544179916381836, -13.408864974975586, -12.27354907989502, -11.138233184814453, -10.002918243408203, -8.867603302001953, -7.732287406921387, -6.5969719886779785, -5.46165657043457, -4.326341152191162, -3.191025733947754, -2.0557103157043457, -0.9203987121582031, 0.21491670608520508, 1.3502321243286133, 2.4855475425720215, 3.6208629608154297, 4.756178379058838, 5.891493797302246, 7.026809215545654, 8.162124633789062, 9.297439575195312, 10.432755470275879, 11.568071365356445, 12.703386306762695, 13.838701248168945, 14.974017143249512, 16.109333038330078, 17.244647979736328, 18.379962921142578, 19.515277862548828, 20.65059471130371, 21.78590965270996, 22.92122459411621, 24.056541442871094, 25.191856384277344, 26.327171325683594, 27.462486267089844, 28.597801208496094, 29.733118057250977, 30.868432998657227, 32.00374984741211, 33.13906478881836, 34.27437973022461, 35.40969467163086]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 11.0, 11.0, 14.0, 10.0, 14.0, 22.0, 15.0, 15.0, 30.0, 25.0, 21.0, 26.0, 29.0, 34.0, 31.0, 41.0, 42.0, 31.0, 40.0, 43.0, 39.0, 35.0, 40.0, 36.0, 46.0, 45.0, 32.0, 25.0, 19.0, 26.0, 30.0, 17.0, 11.0, 13.0, 15.0, 14.0, 8.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.385093688964844, -25.59136962890625, -24.79764747619629, -24.003923416137695, -23.210201263427734, -22.41647720336914, -21.622753143310547, -20.829030990600586, -20.035308837890625, -19.24158477783203, -18.44786262512207, -17.654138565063477, -16.860416412353516, -16.066692352294922, -15.272969245910645, -14.479246139526367, -13.685522079467773, -12.891798973083496, -12.098075866699219, -11.304351806640625, -10.510629653930664, -9.71690559387207, -8.923182487487793, -8.129459381103516, -7.335736274719238, -6.542013168334961, -5.748290061950684, -4.954566478729248, -4.160843372344971, -3.3671202659606934, -2.573396682739258, -1.7796735763549805, -0.9859504699707031, -0.19222724437713623, 0.6014959812164307, 1.395219326019287, 2.1889424324035645, 2.982665538787842, 3.7763891220092773, 4.570112228393555, 5.363835334777832, 6.157558441162109, 6.951281547546387, 7.745005130767822, 8.538728713989258, 9.332450866699219, 10.126174926757812, 10.91989803314209, 11.713621139526367, 12.507344245910645, 13.301067352294922, 14.094791412353516, 14.888513565063477, 15.68223762512207, 16.47595977783203, 17.269683837890625, 18.06340789794922, 18.857131958007812, 19.650854110717773, 20.444578170776367, 21.238300323486328, 22.032024383544922, 22.825748443603516, 23.619470596313477, 24.413192749023438]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 11.0, 21.0, 15.0, 18.0, 36.0, 66.0, 80.0, 108.0, 156.0, 196.0, 297.0, 463.0, 707.0, 973.0, 1564.0, 2392.0, 3562.0, 5637.0, 9027.0, 14300.0, 23560.0, 39083.0, 66204.0, 111337.0, 173931.0, 204217.0, 153534.0, 94311.0, 55750.0, 32982.0, 19821.0, 12400.0, 7579.0, 4932.0, 3126.0, 2074.0, 1324.0, 880.0, 572.0, 383.0, 306.0, 185.0, 138.0, 83.0, 72.0, 47.0, 29.0, 23.0, 17.0, 17.0, 3.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0], "bins": [-34.59375, -33.52392578125, -32.4541015625, -31.38427734375, -30.314453125, -29.24462890625, -28.1748046875, -27.10498046875, -26.03515625, -24.96533203125, -23.8955078125, -22.82568359375, -21.755859375, -20.68603515625, -19.6162109375, -18.54638671875, -17.4765625, -16.40673828125, -15.3369140625, -14.26708984375, -13.197265625, -12.12744140625, -11.0576171875, -9.98779296875, -8.91796875, -7.84814453125, -6.7783203125, -5.70849609375, -4.638671875, -3.56884765625, -2.4990234375, -1.42919921875, -0.359375, 0.71044921875, 1.7802734375, 2.85009765625, 3.919921875, 4.98974609375, 6.0595703125, 7.12939453125, 8.19921875, 9.26904296875, 10.3388671875, 11.40869140625, 12.478515625, 13.54833984375, 14.6181640625, 15.68798828125, 16.7578125, 17.82763671875, 18.8974609375, 19.96728515625, 21.037109375, 22.10693359375, 23.1767578125, 24.24658203125, 25.31640625, 26.38623046875, 27.4560546875, 28.52587890625, 29.595703125, 30.66552734375, 31.7353515625, 32.80517578125, 33.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 9.0, 7.0, 15.0, 12.0, 10.0, 21.0, 14.0, 18.0, 24.0, 22.0, 26.0, 24.0, 30.0, 30.0, 42.0, 47.0, 35.0, 43.0, 31.0, 38.0, 38.0, 51.0, 41.0, 46.0, 32.0, 44.0, 32.0, 20.0, 25.0, 19.0, 26.0, 29.0, 19.0, 11.0, 13.0, 10.0, 10.0, 4.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.046875, -26.2158203125, -25.384765625, -24.5537109375, -23.72265625, -22.8916015625, -22.060546875, -21.2294921875, -20.3984375, -19.5673828125, -18.736328125, -17.9052734375, -17.07421875, -16.2431640625, -15.412109375, -14.5810546875, -13.75, -12.9189453125, -12.087890625, -11.2568359375, -10.42578125, -9.5947265625, -8.763671875, -7.9326171875, -7.1015625, -6.2705078125, -5.439453125, -4.6083984375, -3.77734375, -2.9462890625, -2.115234375, -1.2841796875, -0.453125, 0.3779296875, 1.208984375, 2.0400390625, 2.87109375, 3.7021484375, 4.533203125, 5.3642578125, 6.1953125, 7.0263671875, 7.857421875, 8.6884765625, 9.51953125, 10.3505859375, 11.181640625, 12.0126953125, 12.84375, 13.6748046875, 14.505859375, 15.3369140625, 16.16796875, 16.9990234375, 17.830078125, 18.6611328125, 19.4921875, 20.3232421875, 21.154296875, 21.9853515625, 22.81640625, 23.6474609375, 24.478515625, 25.3095703125, 26.140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 10.0, 15.0, 21.0, 42.0, 58.0, 81.0, 104.0, 160.0, 235.0, 336.0, 545.0, 717.0, 1109.0, 1699.0, 2526.0, 3658.0, 5751.0, 8589.0, 13531.0, 21243.0, 33847.0, 54834.0, 89713.0, 140775.0, 185413.0, 171065.0, 117404.0, 72494.0, 44769.0, 27648.0, 17343.0, 11180.0, 7223.0, 4815.0, 3152.0, 2132.0, 1366.0, 905.0, 618.0, 479.0, 311.0, 213.0, 121.0, 90.0, 57.0, 45.0, 34.0, 27.0, 15.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-32.59375, -31.568359375, -30.54296875, -29.517578125, -28.4921875, -27.466796875, -26.44140625, -25.416015625, -24.390625, -23.365234375, -22.33984375, -21.314453125, -20.2890625, -19.263671875, -18.23828125, -17.212890625, -16.1875, -15.162109375, -14.13671875, -13.111328125, -12.0859375, -11.060546875, -10.03515625, -9.009765625, -7.984375, -6.958984375, -5.93359375, -4.908203125, -3.8828125, -2.857421875, -1.83203125, -0.806640625, 0.21875, 1.244140625, 2.26953125, 3.294921875, 4.3203125, 5.345703125, 6.37109375, 7.396484375, 8.421875, 9.447265625, 10.47265625, 11.498046875, 12.5234375, 13.548828125, 14.57421875, 15.599609375, 16.625, 17.650390625, 18.67578125, 19.701171875, 20.7265625, 21.751953125, 22.77734375, 23.802734375, 24.828125, 25.853515625, 26.87890625, 27.904296875, 28.9296875, 29.955078125, 30.98046875, 32.005859375, 33.03125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 6.0, 21.0, 14.0, 23.0, 25.0, 25.0, 30.0, 30.0, 25.0, 31.0, 39.0, 36.0, 35.0, 36.0, 42.0, 44.0, 39.0, 43.0, 38.0, 34.0, 35.0, 37.0, 32.0, 26.0, 28.0, 27.0, 24.0, 13.0, 14.0, 12.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 12.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.515625, -16.00146484375, -15.4873046875, -14.97314453125, -14.458984375, -13.94482421875, -13.4306640625, -12.91650390625, -12.40234375, -11.88818359375, -11.3740234375, -10.85986328125, -10.345703125, -9.83154296875, -9.3173828125, -8.80322265625, -8.2890625, -7.77490234375, -7.2607421875, -6.74658203125, -6.232421875, -5.71826171875, -5.2041015625, -4.68994140625, -4.17578125, -3.66162109375, -3.1474609375, -2.63330078125, -2.119140625, -1.60498046875, -1.0908203125, -0.57666015625, -0.0625, 0.45166015625, 0.9658203125, 1.47998046875, 1.994140625, 2.50830078125, 3.0224609375, 3.53662109375, 4.05078125, 4.56494140625, 5.0791015625, 5.59326171875, 6.107421875, 6.62158203125, 7.1357421875, 7.64990234375, 8.1640625, 8.67822265625, 9.1923828125, 9.70654296875, 10.220703125, 10.73486328125, 11.2490234375, 11.76318359375, 12.27734375, 12.79150390625, 13.3056640625, 13.81982421875, 14.333984375, 14.84814453125, 15.3623046875, 15.87646484375, 16.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 17.0, 26.0, 33.0, 65.0, 92.0, 140.0, 216.0, 314.0, 512.0, 898.0, 1341.0, 2109.0, 3410.0, 5805.0, 10145.0, 18105.0, 34563.0, 71358.0, 154123.0, 275540.0, 236089.0, 117056.0, 54267.0, 27059.0, 14440.0, 8170.0, 4831.0, 2901.0, 1765.0, 1139.0, 721.0, 462.0, 280.0, 197.0, 113.0, 78.0, 50.0, 43.0, 22.0, 7.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.5535888671875, -12.146240234375, -11.7388916015625, -11.33154296875, -10.9241943359375, -10.516845703125, -10.1094970703125, -9.7021484375, -9.2947998046875, -8.887451171875, -8.4801025390625, -8.07275390625, -7.6654052734375, -7.258056640625, -6.8507080078125, -6.443359375, -6.0360107421875, -5.628662109375, -5.2213134765625, -4.81396484375, -4.4066162109375, -3.999267578125, -3.5919189453125, -3.1845703125, -2.7772216796875, -2.369873046875, -1.9625244140625, -1.55517578125, -1.1478271484375, -0.740478515625, -0.3331298828125, 0.07421875, 0.4815673828125, 0.888916015625, 1.2962646484375, 1.70361328125, 2.1109619140625, 2.518310546875, 2.9256591796875, 3.3330078125, 3.7403564453125, 4.147705078125, 4.5550537109375, 4.96240234375, 5.3697509765625, 5.777099609375, 6.1844482421875, 6.591796875, 6.9991455078125, 7.406494140625, 7.8138427734375, 8.22119140625, 8.6285400390625, 9.035888671875, 9.4432373046875, 9.8505859375, 10.2579345703125, 10.665283203125, 11.0726318359375, 11.47998046875, 11.8873291015625, 12.294677734375, 12.7020263671875, 13.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 8.0, 17.0, 13.0, 18.0, 43.0, 42.0, 65.0, 90.0, 112.0, 137.0, 124.0, 96.0, 63.0, 49.0, 33.0, 21.0, 15.0, 15.0, 8.0, 8.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00164794921875, -0.0015880763530731201, -0.0015282034873962402, -0.0014683306217193604, -0.0014084577560424805, -0.0013485848903656006, -0.0012887120246887207, -0.0012288391590118408, -0.001168966293334961, -0.001109093427658081, -0.0010492205619812012, -0.0009893476963043213, -0.0009294748306274414, -0.0008696019649505615, -0.0008097290992736816, -0.0007498562335968018, -0.0006899833679199219, -0.000630110502243042, -0.0005702376365661621, -0.0005103647708892822, -0.00045049190521240234, -0.00039061903953552246, -0.0003307461738586426, -0.0002708733081817627, -0.0002110004425048828, -0.00015112757682800293, -9.125471115112305e-05, -3.1381845474243164e-05, 2.849102020263672e-05, 8.83638858795166e-05, 0.00014823675155639648, 0.00020810961723327637, 0.00026798248291015625, 0.00032785534858703613, 0.000387728214263916, 0.0004476010799407959, 0.0005074739456176758, 0.0005673468112945557, 0.0006272196769714355, 0.0006870925426483154, 0.0007469654083251953, 0.0008068382740020752, 0.0008667111396789551, 0.000926584005355835, 0.0009864568710327148, 0.0010463297367095947, 0.0011062026023864746, 0.0011660754680633545, 0.0012259483337402344, 0.0012858211994171143, 0.0013456940650939941, 0.001405566930770874, 0.001465439796447754, 0.0015253126621246338, 0.0015851855278015137, 0.0016450583934783936, 0.0017049312591552734, 0.0017648041248321533, 0.0018246769905090332, 0.001884549856185913, 0.001944422721862793, 0.002004295587539673, 0.0020641684532165527, 0.0021240413188934326, 0.0021839141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 5.0, 5.0, 16.0, 26.0, 45.0, 70.0, 112.0, 150.0, 263.0, 365.0, 639.0, 870.0, 1484.0, 2409.0, 3989.0, 6755.0, 12309.0, 23693.0, 48522.0, 105058.0, 219719.0, 289671.0, 172236.0, 79897.0, 37345.0, 18603.0, 10065.0, 5497.0, 3287.0, 2049.0, 1265.0, 732.0, 536.0, 290.0, 204.0, 126.0, 89.0, 61.0, 41.0, 18.0, 15.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6737060546875, -11.230224609375, -10.7867431640625, -10.34326171875, -9.8997802734375, -9.456298828125, -9.0128173828125, -8.5693359375, -8.1258544921875, -7.682373046875, -7.2388916015625, -6.79541015625, -6.3519287109375, -5.908447265625, -5.4649658203125, -5.021484375, -4.5780029296875, -4.134521484375, -3.6910400390625, -3.24755859375, -2.8040771484375, -2.360595703125, -1.9171142578125, -1.4736328125, -1.0301513671875, -0.586669921875, -0.1431884765625, 0.30029296875, 0.7437744140625, 1.187255859375, 1.6307373046875, 2.07421875, 2.5177001953125, 2.961181640625, 3.4046630859375, 3.84814453125, 4.2916259765625, 4.735107421875, 5.1785888671875, 5.6220703125, 6.0655517578125, 6.509033203125, 6.9525146484375, 7.39599609375, 7.8394775390625, 8.282958984375, 8.7264404296875, 9.169921875, 9.6134033203125, 10.056884765625, 10.5003662109375, 10.94384765625, 11.3873291015625, 11.830810546875, 12.2742919921875, 12.7177734375, 13.1612548828125, 13.604736328125, 14.0482177734375, 14.49169921875, 14.9351806640625, 15.378662109375, 15.8221435546875, 16.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 4.0, 11.0, 6.0, 7.0, 6.0, 13.0, 20.0, 16.0, 20.0, 35.0, 27.0, 32.0, 42.0, 37.0, 59.0, 73.0, 57.0, 61.0, 70.0, 66.0, 55.0, 54.0, 42.0, 30.0, 27.0, 25.0, 17.0, 23.0, 14.0, 9.0, 9.0, 8.0, 4.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.93927001953125, -2.8277587890625, -2.71624755859375, -2.604736328125, -2.49322509765625, -2.3817138671875, -2.27020263671875, -2.15869140625, -2.04718017578125, -1.9356689453125, -1.82415771484375, -1.712646484375, -1.60113525390625, -1.4896240234375, -1.37811279296875, -1.2666015625, -1.15509033203125, -1.0435791015625, -0.93206787109375, -0.820556640625, -0.70904541015625, -0.5975341796875, -0.48602294921875, -0.37451171875, -0.26300048828125, -0.1514892578125, -0.03997802734375, 0.071533203125, 0.18304443359375, 0.2945556640625, 0.40606689453125, 0.517578125, 0.62908935546875, 0.7406005859375, 0.85211181640625, 0.963623046875, 1.07513427734375, 1.1866455078125, 1.29815673828125, 1.40966796875, 1.52117919921875, 1.6326904296875, 1.74420166015625, 1.855712890625, 1.96722412109375, 2.0787353515625, 2.19024658203125, 2.3017578125, 2.41326904296875, 2.5247802734375, 2.63629150390625, 2.747802734375, 2.85931396484375, 2.9708251953125, 3.08233642578125, 3.19384765625, 3.30535888671875, 3.4168701171875, 3.52838134765625, 3.639892578125, 3.75140380859375, 3.8629150390625, 3.97442626953125, 4.0859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 16.0, 24.0, 30.0, 36.0, 39.0, 61.0, 60.0, 75.0, 59.0, 88.0, 73.0, 60.0, 71.0, 49.0, 38.0, 42.0, 28.0, 23.0, 26.0, 17.0, 12.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.118370056152344, -42.949161529541016, -41.77995300292969, -40.610748291015625, -39.4415397644043, -38.27233123779297, -37.10312271118164, -35.93391418457031, -34.76470947265625, -33.59550094604492, -32.426292419433594, -31.2570858001709, -30.087879180908203, -28.918670654296875, -27.749462127685547, -26.58025550842285, -25.411046981811523, -24.241838455200195, -23.0726318359375, -21.903423309326172, -20.734216690063477, -19.56500816345215, -18.395801544189453, -17.226593017578125, -16.057384490966797, -14.888176918029785, -13.718969345092773, -12.549760818481445, -11.38055419921875, -10.211345672607422, -9.04213809967041, -7.872930526733398, -6.70372200012207, -5.534514427185059, -4.365306854248047, -3.196098804473877, -2.0268912315368652, -0.8576836585998535, 0.3115243911743164, 1.4807319641113281, 2.64993953704834, 3.8191471099853516, 4.988354682922363, 6.157562732696533, 7.326770305633545, 8.495977401733398, 9.665185928344727, 10.834393501281738, 12.00360107421875, 13.172808647155762, 14.342016220092773, 15.511224746704102, 16.680431365966797, 17.849639892578125, 19.018848419189453, 20.18805503845215, 21.357261657714844, 22.526470184326172, 23.695676803588867, 24.864885330200195, 26.03409194946289, 27.20330047607422, 28.372509002685547, 29.541715621948242, 30.71092414855957]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 10.0, 4.0, 12.0, 15.0, 15.0, 15.0, 15.0, 10.0, 23.0, 24.0, 27.0, 32.0, 32.0, 37.0, 28.0, 38.0, 38.0, 30.0, 21.0, 38.0, 37.0, 43.0, 40.0, 39.0, 41.0, 29.0, 29.0, 31.0, 29.0, 29.0, 24.0, 19.0, 21.0, 12.0, 15.0, 9.0, 10.0, 18.0, 4.0, 5.0, 3.0, 11.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.878774642944336, -24.09693145751953, -23.315088272094727, -22.533245086669922, -21.751399993896484, -20.96955680847168, -20.187713623046875, -19.40587043762207, -18.624027252197266, -17.84218406677246, -17.060340881347656, -16.27849578857422, -15.496652603149414, -14.71480941772461, -13.932966232299805, -13.151123046875, -12.369277954101562, -11.587434768676758, -10.805590629577637, -10.023747444152832, -9.241903305053711, -8.460060119628906, -7.678216934204102, -6.896373271942139, -6.114529609680176, -5.332685947418213, -4.55084228515625, -3.7689990997314453, -2.9871554374694824, -2.2053117752075195, -1.4234685897827148, -0.641624927520752, 0.14022064208984375, 0.9220641851425171, 1.7039077281951904, 2.485751152038574, 3.267594814300537, 4.0494384765625, 4.831281661987305, 5.613125324249268, 6.3949689865112305, 7.176812648773193, 7.958656311035156, 8.740499496459961, 9.522342681884766, 10.304186820983887, 11.086030006408691, 11.867874145507812, 12.649717330932617, 13.431560516357422, 14.213404655456543, 14.995247840881348, 15.777091979980469, 16.558935165405273, 17.340778350830078, 18.122621536254883, 18.904464721679688, 19.686307907104492, 20.468151092529297, 21.249996185302734, 22.03183937072754, 22.813682556152344, 23.59552574157715, 24.377368927001953, 25.15921401977539]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 15.0, 18.0, 23.0, 35.0, 39.0, 69.0, 101.0, 116.0, 158.0, 247.0, 353.0, 500.0, 694.0, 1040.0, 1593.0, 2468.0, 3790.0, 6468.0, 10965.0, 19271.0, 35639.0, 71373.0, 166347.0, 493834.0, 1277056.0, 1271683.0, 500511.0, 175041.0, 73067.0, 35833.0, 18963.0, 10621.0, 6055.0, 3705.0, 2222.0, 1443.0, 931.0, 637.0, 435.0, 261.0, 183.0, 141.0, 104.0, 77.0, 46.0, 27.0, 28.0, 20.0, 7.0, 12.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.53125, -37.36376953125, -36.1962890625, -35.02880859375, -33.861328125, -32.69384765625, -31.5263671875, -30.35888671875, -29.19140625, -28.02392578125, -26.8564453125, -25.68896484375, -24.521484375, -23.35400390625, -22.1865234375, -21.01904296875, -19.8515625, -18.68408203125, -17.5166015625, -16.34912109375, -15.181640625, -14.01416015625, -12.8466796875, -11.67919921875, -10.51171875, -9.34423828125, -8.1767578125, -7.00927734375, -5.841796875, -4.67431640625, -3.5068359375, -2.33935546875, -1.171875, -0.00439453125, 1.1630859375, 2.33056640625, 3.498046875, 4.66552734375, 5.8330078125, 7.00048828125, 8.16796875, 9.33544921875, 10.5029296875, 11.67041015625, 12.837890625, 14.00537109375, 15.1728515625, 16.34033203125, 17.5078125, 18.67529296875, 19.8427734375, 21.01025390625, 22.177734375, 23.34521484375, 24.5126953125, 25.68017578125, 26.84765625, 28.01513671875, 29.1826171875, 30.35009765625, 31.517578125, 32.68505859375, 33.8525390625, 35.02001953125, 36.1875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 6.0, 7.0, 7.0, 4.0, 12.0, 7.0, 19.0, 11.0, 14.0, 17.0, 22.0, 24.0, 23.0, 38.0, 38.0, 30.0, 44.0, 39.0, 30.0, 36.0, 35.0, 34.0, 41.0, 36.0, 48.0, 43.0, 37.0, 43.0, 32.0, 21.0, 22.0, 26.0, 22.0, 21.0, 12.0, 16.0, 14.0, 15.0, 5.0, 16.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.140625, -22.42431640625, -21.7080078125, -20.99169921875, -20.275390625, -19.55908203125, -18.8427734375, -18.12646484375, -17.41015625, -16.69384765625, -15.9775390625, -15.26123046875, -14.544921875, -13.82861328125, -13.1123046875, -12.39599609375, -11.6796875, -10.96337890625, -10.2470703125, -9.53076171875, -8.814453125, -8.09814453125, -7.3818359375, -6.66552734375, -5.94921875, -5.23291015625, -4.5166015625, -3.80029296875, -3.083984375, -2.36767578125, -1.6513671875, -0.93505859375, -0.21875, 0.49755859375, 1.2138671875, 1.93017578125, 2.646484375, 3.36279296875, 4.0791015625, 4.79541015625, 5.51171875, 6.22802734375, 6.9443359375, 7.66064453125, 8.376953125, 9.09326171875, 9.8095703125, 10.52587890625, 11.2421875, 11.95849609375, 12.6748046875, 13.39111328125, 14.107421875, 14.82373046875, 15.5400390625, 16.25634765625, 16.97265625, 17.68896484375, 18.4052734375, 19.12158203125, 19.837890625, 20.55419921875, 21.2705078125, 21.98681640625, 22.703125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 15.0, 14.0, 26.0, 41.0, 67.0, 101.0, 135.0, 247.0, 344.0, 513.0, 820.0, 1189.0, 1870.0, 3061.0, 5018.0, 8260.0, 13816.0, 24881.0, 47202.0, 97556.0, 223215.0, 576722.0, 1513856.0, 1012689.0, 363797.0, 148805.0, 68519.0, 34579.0, 18873.0, 10733.0, 6376.0, 3941.0, 2571.0, 1553.0, 1001.0, 631.0, 426.0, 250.0, 189.0, 136.0, 73.0, 44.0, 33.0, 31.0, 22.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-47.34375, -45.98193359375, -44.6201171875, -43.25830078125, -41.896484375, -40.53466796875, -39.1728515625, -37.81103515625, -36.44921875, -35.08740234375, -33.7255859375, -32.36376953125, -31.001953125, -29.64013671875, -28.2783203125, -26.91650390625, -25.5546875, -24.19287109375, -22.8310546875, -21.46923828125, -20.107421875, -18.74560546875, -17.3837890625, -16.02197265625, -14.66015625, -13.29833984375, -11.9365234375, -10.57470703125, -9.212890625, -7.85107421875, -6.4892578125, -5.12744140625, -3.765625, -2.40380859375, -1.0419921875, 0.31982421875, 1.681640625, 3.04345703125, 4.4052734375, 5.76708984375, 7.12890625, 8.49072265625, 9.8525390625, 11.21435546875, 12.576171875, 13.93798828125, 15.2998046875, 16.66162109375, 18.0234375, 19.38525390625, 20.7470703125, 22.10888671875, 23.470703125, 24.83251953125, 26.1943359375, 27.55615234375, 28.91796875, 30.27978515625, 31.6416015625, 33.00341796875, 34.365234375, 35.72705078125, 37.0888671875, 38.45068359375, 39.8125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 9.0, 21.0, 17.0, 39.0, 46.0, 68.0, 68.0, 84.0, 106.0, 128.0, 204.0, 233.0, 318.0, 367.0, 429.0, 401.0, 344.0, 259.0, 199.0, 167.0, 110.0, 89.0, 63.0, 49.0, 51.0, 29.0, 23.0, 21.0, 23.0, 18.0, 9.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.663818359375, -13.21826171875, -12.772705078125, -12.3271484375, -11.881591796875, -11.43603515625, -10.990478515625, -10.544921875, -10.099365234375, -9.65380859375, -9.208251953125, -8.7626953125, -8.317138671875, -7.87158203125, -7.426025390625, -6.98046875, -6.534912109375, -6.08935546875, -5.643798828125, -5.1982421875, -4.752685546875, -4.30712890625, -3.861572265625, -3.416015625, -2.970458984375, -2.52490234375, -2.079345703125, -1.6337890625, -1.188232421875, -0.74267578125, -0.297119140625, 0.1484375, 0.593994140625, 1.03955078125, 1.485107421875, 1.9306640625, 2.376220703125, 2.82177734375, 3.267333984375, 3.712890625, 4.158447265625, 4.60400390625, 5.049560546875, 5.4951171875, 5.940673828125, 6.38623046875, 6.831787109375, 7.27734375, 7.722900390625, 8.16845703125, 8.614013671875, 9.0595703125, 9.505126953125, 9.95068359375, 10.396240234375, 10.841796875, 11.287353515625, 11.73291015625, 12.178466796875, 12.6240234375, 13.069580078125, 13.51513671875, 13.960693359375, 14.40625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 12.0, 10.0, 24.0, 16.0, 26.0, 29.0, 38.0, 39.0, 40.0, 65.0, 70.0, 90.0, 81.0, 68.0, 73.0, 56.0, 43.0, 44.0, 36.0, 29.0, 27.0, 14.0, 11.0, 6.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.50014877319336, -39.3203010559082, -38.14045715332031, -36.960609436035156, -35.78076171875, -34.600914001464844, -33.42106628417969, -32.2412223815918, -31.06137466430664, -29.881526947021484, -28.70168113708496, -27.521835327148438, -26.34198760986328, -25.162139892578125, -23.9822940826416, -22.802448272705078, -21.622600555419922, -20.442752838134766, -19.262907028198242, -18.08306121826172, -16.903213500976562, -15.723366737365723, -14.543519973754883, -13.363673210144043, -12.183826446533203, -11.003979682922363, -9.824132919311523, -8.644286155700684, -7.464439392089844, -6.284592628479004, -5.104745864868164, -3.924899101257324, -2.7450523376464844, -1.5652055740356445, -0.3853588104248047, 0.7944879531860352, 1.974334716796875, 3.154181480407715, 4.334028244018555, 5.5138750076293945, 6.693721771240234, 7.873568534851074, 9.053415298461914, 10.233262062072754, 11.413108825683594, 12.592955589294434, 13.772802352905273, 14.952649116516113, 16.132495880126953, 17.31234359741211, 18.492189407348633, 19.672035217285156, 20.851882934570312, 22.03173065185547, 23.211576461791992, 24.391422271728516, 25.571269989013672, 26.751117706298828, 27.93096351623535, 29.110809326171875, 30.29065704345703, 31.470504760742188, 32.650352478027344, 33.830196380615234, 35.01004409790039]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 9.0, 5.0, 9.0, 9.0, 7.0, 14.0, 13.0, 19.0, 15.0, 20.0, 22.0, 19.0, 30.0, 39.0, 36.0, 27.0, 26.0, 47.0, 39.0, 43.0, 47.0, 39.0, 28.0, 38.0, 44.0, 42.0, 38.0, 20.0, 32.0, 28.0, 20.0, 29.0, 19.0, 18.0, 16.0, 19.0, 12.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 0.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.00770378112793, -26.189672470092773, -25.37164306640625, -24.553611755371094, -23.735580444335938, -22.917551040649414, -22.099519729614258, -21.281490325927734, -20.463459014892578, -19.645427703857422, -18.8273983001709, -18.009366989135742, -17.19133758544922, -16.373306274414062, -15.555274963378906, -14.737244606018066, -13.919214248657227, -13.101183891296387, -12.283153533935547, -11.46512222290039, -10.64709186553955, -9.829061508178711, -9.011030197143555, -8.192999839782715, -7.374969482421875, -6.556939125061035, -5.738908290863037, -4.920877456665039, -4.102847099304199, -3.2848167419433594, -2.4667859077453613, -1.6487550735473633, -0.8307228088378906, -0.01269221305847168, 0.8053383827209473, 1.6233689785003662, 2.441399574279785, 3.259429931640625, 4.077460765838623, 4.895491600036621, 5.713521957397461, 6.531552314758301, 7.349583148956299, 8.167613983154297, 8.985644340515137, 9.803674697875977, 10.621706008911133, 11.439736366271973, 12.257766723632812, 13.075797080993652, 13.893827438354492, 14.711858749389648, 15.529889106750488, 16.347919464111328, 17.165950775146484, 17.98398208618164, 18.802011489868164, 19.62004280090332, 20.438072204589844, 21.256103515625, 22.074134826660156, 22.89216423034668, 23.710195541381836, 24.52822494506836, 25.346256256103516]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 14.0, 13.0, 21.0, 31.0, 47.0, 50.0, 94.0, 140.0, 221.0, 352.0, 499.0, 779.0, 1235.0, 1989.0, 3218.0, 5306.0, 9033.0, 15735.0, 28390.0, 54843.0, 112559.0, 234187.0, 281370.0, 146667.0, 69528.0, 35559.0, 19205.0, 10934.0, 6299.0, 3764.0, 2385.0, 1457.0, 897.0, 579.0, 408.0, 259.0, 157.0, 115.0, 76.0, 44.0, 33.0, 28.0, 7.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.282958984375, -22.45654296875, -21.630126953125, -20.8037109375, -19.977294921875, -19.15087890625, -18.324462890625, -17.498046875, -16.671630859375, -15.84521484375, -15.018798828125, -14.1923828125, -13.365966796875, -12.53955078125, -11.713134765625, -10.88671875, -10.060302734375, -9.23388671875, -8.407470703125, -7.5810546875, -6.754638671875, -5.92822265625, -5.101806640625, -4.275390625, -3.448974609375, -2.62255859375, -1.796142578125, -0.9697265625, -0.143310546875, 0.68310546875, 1.509521484375, 2.3359375, 3.162353515625, 3.98876953125, 4.815185546875, 5.6416015625, 6.468017578125, 7.29443359375, 8.120849609375, 8.947265625, 9.773681640625, 10.60009765625, 11.426513671875, 12.2529296875, 13.079345703125, 13.90576171875, 14.732177734375, 15.55859375, 16.385009765625, 17.21142578125, 18.037841796875, 18.8642578125, 19.690673828125, 20.51708984375, 21.343505859375, 22.169921875, 22.996337890625, 23.82275390625, 24.649169921875, 25.4755859375, 26.302001953125, 27.12841796875, 27.954833984375, 28.78125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 11.0, 13.0, 13.0, 24.0, 17.0, 18.0, 26.0, 31.0, 30.0, 38.0, 40.0, 51.0, 38.0, 36.0, 47.0, 36.0, 23.0, 50.0, 40.0, 44.0, 35.0, 39.0, 29.0, 37.0, 24.0, 27.0, 22.0, 20.0, 10.0, 18.0, 12.0, 6.0, 4.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.75, -26.885498046875, -26.02099609375, -25.156494140625, -24.2919921875, -23.427490234375, -22.56298828125, -21.698486328125, -20.833984375, -19.969482421875, -19.10498046875, -18.240478515625, -17.3759765625, -16.511474609375, -15.64697265625, -14.782470703125, -13.91796875, -13.053466796875, -12.18896484375, -11.324462890625, -10.4599609375, -9.595458984375, -8.73095703125, -7.866455078125, -7.001953125, -6.137451171875, -5.27294921875, -4.408447265625, -3.5439453125, -2.679443359375, -1.81494140625, -0.950439453125, -0.0859375, 0.778564453125, 1.64306640625, 2.507568359375, 3.3720703125, 4.236572265625, 5.10107421875, 5.965576171875, 6.830078125, 7.694580078125, 8.55908203125, 9.423583984375, 10.2880859375, 11.152587890625, 12.01708984375, 12.881591796875, 13.74609375, 14.610595703125, 15.47509765625, 16.339599609375, 17.2041015625, 18.068603515625, 18.93310546875, 19.797607421875, 20.662109375, 21.526611328125, 22.39111328125, 23.255615234375, 24.1201171875, 24.984619140625, 25.84912109375, 26.713623046875, 27.578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 7.0, 13.0, 15.0, 28.0, 39.0, 53.0, 73.0, 124.0, 139.0, 184.0, 307.0, 413.0, 557.0, 887.0, 1253.0, 1956.0, 3020.0, 4691.0, 7591.0, 12507.0, 21374.0, 38597.0, 73828.0, 161121.0, 316051.0, 203853.0, 90588.0, 45469.0, 25069.0, 14428.0, 8731.0, 5290.0, 3469.0, 2154.0, 1461.0, 974.0, 680.0, 490.0, 294.0, 214.0, 149.0, 113.0, 81.0, 60.0, 42.0, 28.0, 23.0, 11.0, 9.0, 12.0, 11.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-30.71875, -29.747802734375, -28.77685546875, -27.805908203125, -26.8349609375, -25.864013671875, -24.89306640625, -23.922119140625, -22.951171875, -21.980224609375, -21.00927734375, -20.038330078125, -19.0673828125, -18.096435546875, -17.12548828125, -16.154541015625, -15.18359375, -14.212646484375, -13.24169921875, -12.270751953125, -11.2998046875, -10.328857421875, -9.35791015625, -8.386962890625, -7.416015625, -6.445068359375, -5.47412109375, -4.503173828125, -3.5322265625, -2.561279296875, -1.59033203125, -0.619384765625, 0.3515625, 1.322509765625, 2.29345703125, 3.264404296875, 4.2353515625, 5.206298828125, 6.17724609375, 7.148193359375, 8.119140625, 9.090087890625, 10.06103515625, 11.031982421875, 12.0029296875, 12.973876953125, 13.94482421875, 14.915771484375, 15.88671875, 16.857666015625, 17.82861328125, 18.799560546875, 19.7705078125, 20.741455078125, 21.71240234375, 22.683349609375, 23.654296875, 24.625244140625, 25.59619140625, 26.567138671875, 27.5380859375, 28.509033203125, 29.47998046875, 30.450927734375, 31.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 7.0, 7.0, 12.0, 4.0, 21.0, 11.0, 18.0, 15.0, 18.0, 21.0, 23.0, 26.0, 32.0, 28.0, 29.0, 27.0, 41.0, 43.0, 38.0, 36.0, 36.0, 29.0, 37.0, 38.0, 35.0, 39.0, 44.0, 34.0, 29.0, 23.0, 31.0, 20.0, 16.0, 20.0, 20.0, 18.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.03125, -16.510498046875, -15.98974609375, -15.468994140625, -14.9482421875, -14.427490234375, -13.90673828125, -13.385986328125, -12.865234375, -12.344482421875, -11.82373046875, -11.302978515625, -10.7822265625, -10.261474609375, -9.74072265625, -9.219970703125, -8.69921875, -8.178466796875, -7.65771484375, -7.136962890625, -6.6162109375, -6.095458984375, -5.57470703125, -5.053955078125, -4.533203125, -4.012451171875, -3.49169921875, -2.970947265625, -2.4501953125, -1.929443359375, -1.40869140625, -0.887939453125, -0.3671875, 0.153564453125, 0.67431640625, 1.195068359375, 1.7158203125, 2.236572265625, 2.75732421875, 3.278076171875, 3.798828125, 4.319580078125, 4.84033203125, 5.361083984375, 5.8818359375, 6.402587890625, 6.92333984375, 7.444091796875, 7.96484375, 8.485595703125, 9.00634765625, 9.527099609375, 10.0478515625, 10.568603515625, 11.08935546875, 11.610107421875, 12.130859375, 12.651611328125, 13.17236328125, 13.693115234375, 14.2138671875, 14.734619140625, 15.25537109375, 15.776123046875, 16.296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 7.0, 8.0, 8.0, 13.0, 17.0, 16.0, 28.0, 35.0, 69.0, 73.0, 104.0, 153.0, 226.0, 293.0, 494.0, 674.0, 1014.0, 1632.0, 2551.0, 4373.0, 8143.0, 16482.0, 38717.0, 108711.0, 345287.0, 338790.0, 106200.0, 38250.0, 16362.0, 8053.0, 4461.0, 2539.0, 1591.0, 983.0, 680.0, 417.0, 301.0, 231.0, 155.0, 125.0, 86.0, 50.0, 39.0, 29.0, 24.0, 21.0, 11.0, 7.0, 6.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.3828125, -11.9957275390625, -11.608642578125, -11.2215576171875, -10.83447265625, -10.4473876953125, -10.060302734375, -9.6732177734375, -9.2861328125, -8.8990478515625, -8.511962890625, -8.1248779296875, -7.73779296875, -7.3507080078125, -6.963623046875, -6.5765380859375, -6.189453125, -5.8023681640625, -5.415283203125, -5.0281982421875, -4.64111328125, -4.2540283203125, -3.866943359375, -3.4798583984375, -3.0927734375, -2.7056884765625, -2.318603515625, -1.9315185546875, -1.54443359375, -1.1573486328125, -0.770263671875, -0.3831787109375, 0.00390625, 0.3909912109375, 0.778076171875, 1.1651611328125, 1.55224609375, 1.9393310546875, 2.326416015625, 2.7135009765625, 3.1005859375, 3.4876708984375, 3.874755859375, 4.2618408203125, 4.64892578125, 5.0360107421875, 5.423095703125, 5.8101806640625, 6.197265625, 6.5843505859375, 6.971435546875, 7.3585205078125, 7.74560546875, 8.1326904296875, 8.519775390625, 8.9068603515625, 9.2939453125, 9.6810302734375, 10.068115234375, 10.4552001953125, 10.84228515625, 11.2293701171875, 11.616455078125, 12.0035400390625, 12.390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 6.0, 6.0, 21.0, 15.0, 22.0, 40.0, 58.0, 85.0, 90.0, 123.0, 131.0, 109.0, 78.0, 62.0, 28.0, 31.0, 16.0, 18.0, 8.0, 17.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001354217529296875, -0.0013121068477630615, -0.001269996166229248, -0.0012278854846954346, -0.001185774803161621, -0.0011436641216278076, -0.0011015534400939941, -0.0010594427585601807, -0.0010173320770263672, -0.0009752213954925537, -0.0009331107139587402, -0.0008910000324249268, -0.0008488893508911133, -0.0008067786693572998, -0.0007646679878234863, -0.0007225573062896729, -0.0006804466247558594, -0.0006383359432220459, -0.0005962252616882324, -0.0005541145801544189, -0.0005120038986206055, -0.000469893217086792, -0.0004277825355529785, -0.00038567185401916504, -0.00034356117248535156, -0.0003014504909515381, -0.0002593398094177246, -0.00021722912788391113, -0.00017511844635009766, -0.00013300776481628418, -9.08970832824707e-05, -4.8786401748657227e-05, -6.67572021484375e-06, 3.5434961318969727e-05, 7.75456428527832e-05, 0.00011965632438659668, 0.00016176700592041016, 0.00020387768745422363, 0.0002459883689880371, 0.0002880990505218506, 0.00033020973205566406, 0.00037232041358947754, 0.000414431095123291, 0.0004565417766571045, 0.000498652458190918, 0.0005407631397247314, 0.0005828738212585449, 0.0006249845027923584, 0.0006670951843261719, 0.0007092058658599854, 0.0007513165473937988, 0.0007934272289276123, 0.0008355379104614258, 0.0008776485919952393, 0.0009197592735290527, 0.0009618699550628662, 0.0010039806365966797, 0.0010460913181304932, 0.0010882019996643066, 0.0011303126811981201, 0.0011724233627319336, 0.001214534044265747, 0.0012566447257995605, 0.001298755407333374, 0.0013408660888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 20.0, 27.0, 35.0, 44.0, 89.0, 104.0, 142.0, 266.0, 381.0, 558.0, 931.0, 1436.0, 2421.0, 4361.0, 8479.0, 18028.0, 42162.0, 110200.0, 302873.0, 337153.0, 129158.0, 47914.0, 20440.0, 9449.0, 4912.0, 2693.0, 1532.0, 945.0, 604.0, 407.0, 256.0, 172.0, 109.0, 79.0, 56.0, 36.0, 31.0, 14.0, 14.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1484375, -14.6904296875, -14.232421875, -13.7744140625, -13.31640625, -12.8583984375, -12.400390625, -11.9423828125, -11.484375, -11.0263671875, -10.568359375, -10.1103515625, -9.65234375, -9.1943359375, -8.736328125, -8.2783203125, -7.8203125, -7.3623046875, -6.904296875, -6.4462890625, -5.98828125, -5.5302734375, -5.072265625, -4.6142578125, -4.15625, -3.6982421875, -3.240234375, -2.7822265625, -2.32421875, -1.8662109375, -1.408203125, -0.9501953125, -0.4921875, -0.0341796875, 0.423828125, 0.8818359375, 1.33984375, 1.7978515625, 2.255859375, 2.7138671875, 3.171875, 3.6298828125, 4.087890625, 4.5458984375, 5.00390625, 5.4619140625, 5.919921875, 6.3779296875, 6.8359375, 7.2939453125, 7.751953125, 8.2099609375, 8.66796875, 9.1259765625, 9.583984375, 10.0419921875, 10.5, 10.9580078125, 11.416015625, 11.8740234375, 12.33203125, 12.7900390625, 13.248046875, 13.7060546875, 14.1640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 13.0, 13.0, 13.0, 20.0, 21.0, 24.0, 36.0, 44.0, 34.0, 69.0, 51.0, 71.0, 79.0, 68.0, 94.0, 59.0, 45.0, 34.0, 38.0, 35.0, 18.0, 27.0, 17.0, 13.0, 10.0, 7.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.673370361328125, -3.55377197265625, -3.434173583984375, -3.3145751953125, -3.194976806640625, -3.07537841796875, -2.955780029296875, -2.836181640625, -2.716583251953125, -2.59698486328125, -2.477386474609375, -2.3577880859375, -2.238189697265625, -2.11859130859375, -1.998992919921875, -1.87939453125, -1.759796142578125, -1.64019775390625, -1.520599365234375, -1.4010009765625, -1.281402587890625, -1.16180419921875, -1.042205810546875, -0.922607421875, -0.803009033203125, -0.68341064453125, -0.563812255859375, -0.4442138671875, -0.324615478515625, -0.20501708984375, -0.085418701171875, 0.0341796875, 0.153778076171875, 0.27337646484375, 0.392974853515625, 0.5125732421875, 0.632171630859375, 0.75177001953125, 0.871368408203125, 0.990966796875, 1.110565185546875, 1.23016357421875, 1.349761962890625, 1.4693603515625, 1.588958740234375, 1.70855712890625, 1.828155517578125, 1.94775390625, 2.067352294921875, 2.18695068359375, 2.306549072265625, 2.4261474609375, 2.545745849609375, 2.66534423828125, 2.784942626953125, 2.904541015625, 3.024139404296875, 3.14373779296875, 3.263336181640625, 3.3829345703125, 3.502532958984375, 3.62213134765625, 3.741729736328125, 3.861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 0.0, 4.0, 4.0, 6.0, 12.0, 13.0, 13.0, 18.0, 18.0, 22.0, 25.0, 37.0, 31.0, 47.0, 37.0, 78.0, 67.0, 81.0, 60.0, 73.0, 62.0, 51.0, 45.0, 44.0, 37.0, 21.0, 19.0, 20.0, 13.0, 4.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.11933517456055, -35.052528381347656, -33.98572540283203, -32.91891860961914, -31.85211181640625, -30.78530502319336, -29.7185001373291, -28.651695251464844, -27.584888458251953, -26.518081665039062, -25.451276779174805, -24.384471893310547, -23.317665100097656, -22.250858306884766, -21.184053421020508, -20.11724853515625, -19.05044174194336, -17.98363494873047, -16.91683006286621, -15.850024223327637, -14.783218383789062, -13.716412544250488, -12.649606704711914, -11.58280086517334, -10.515995025634766, -9.449189186096191, -8.382383346557617, -7.315577507019043, -6.248771667480469, -5.1819658279418945, -4.11515998840332, -3.048354148864746, -1.9815483093261719, -0.9147424697875977, 0.15206336975097656, 1.2188692092895508, 2.285675048828125, 3.352480888366699, 4.419286727905273, 5.486092567443848, 6.552898406982422, 7.619704246520996, 8.68651008605957, 9.753315925598145, 10.820121765136719, 11.886927604675293, 12.953733444213867, 14.020539283752441, 15.087345123291016, 16.154151916503906, 17.220956802368164, 18.287761688232422, 19.354568481445312, 20.421375274658203, 21.48818016052246, 22.55498504638672, 23.62179183959961, 24.6885986328125, 25.755403518676758, 26.822208404541016, 27.889015197753906, 28.955821990966797, 30.022626876831055, 31.089431762695312, 32.1562385559082]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 10.0, 10.0, 20.0, 11.0, 15.0, 17.0, 20.0, 28.0, 34.0, 29.0, 29.0, 37.0, 34.0, 42.0, 40.0, 40.0, 43.0, 55.0, 36.0, 35.0, 39.0, 38.0, 44.0, 20.0, 33.0, 28.0, 22.0, 24.0, 20.0, 16.0, 17.0, 17.0, 14.0, 11.0, 6.0, 12.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.12033462524414, -26.297992706298828, -25.47565269470215, -24.65331268310547, -23.830970764160156, -23.008628845214844, -22.186288833618164, -21.363948822021484, -20.541606903076172, -19.71926498413086, -18.89692497253418, -18.0745849609375, -17.252243041992188, -16.429901123046875, -15.607561111450195, -14.7852201461792, -13.962879180908203, -13.140538215637207, -12.318197250366211, -11.495856285095215, -10.673515319824219, -9.851174354553223, -9.028833389282227, -8.20649242401123, -7.384151458740234, -6.561810493469238, -5.739469528198242, -4.917128562927246, -4.09478759765625, -3.272446632385254, -2.450105667114258, -1.6277647018432617, -0.8054256439208984, 0.016915321350097656, 0.8392562866210938, 1.6615972518920898, 2.483938217163086, 3.306279182434082, 4.128620147705078, 4.950961112976074, 5.77330207824707, 6.595643043518066, 7.4179840087890625, 8.240324974060059, 9.062665939331055, 9.88500690460205, 10.707347869873047, 11.529688835144043, 12.352029800415039, 13.174370765686035, 13.996711730957031, 14.819052696228027, 15.641393661499023, 16.463733673095703, 17.286075592041016, 18.108417510986328, 18.930757522583008, 19.753097534179688, 20.575439453125, 21.397781372070312, 22.220121383666992, 23.042461395263672, 23.864803314208984, 24.687145233154297, 25.509485244750977]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 11.0, 23.0, 26.0, 50.0, 61.0, 86.0, 136.0, 185.0, 267.0, 462.0, 668.0, 1018.0, 1528.0, 2482.0, 4022.0, 6486.0, 10565.0, 17866.0, 30177.0, 51644.0, 90415.0, 155859.0, 223901.0, 185500.0, 110358.0, 62959.0, 36558.0, 21603.0, 12812.0, 7783.0, 4844.0, 2892.0, 1879.0, 1202.0, 747.0, 493.0, 330.0, 186.0, 145.0, 105.0, 83.0, 40.0, 25.0, 24.0, 19.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.5, -33.4443359375, -32.388671875, -31.3330078125, -30.27734375, -29.2216796875, -28.166015625, -27.1103515625, -26.0546875, -24.9990234375, -23.943359375, -22.8876953125, -21.83203125, -20.7763671875, -19.720703125, -18.6650390625, -17.609375, -16.5537109375, -15.498046875, -14.4423828125, -13.38671875, -12.3310546875, -11.275390625, -10.2197265625, -9.1640625, -8.1083984375, -7.052734375, -5.9970703125, -4.94140625, -3.8857421875, -2.830078125, -1.7744140625, -0.71875, 0.3369140625, 1.392578125, 2.4482421875, 3.50390625, 4.5595703125, 5.615234375, 6.6708984375, 7.7265625, 8.7822265625, 9.837890625, 10.8935546875, 11.94921875, 13.0048828125, 14.060546875, 15.1162109375, 16.171875, 17.2275390625, 18.283203125, 19.3388671875, 20.39453125, 21.4501953125, 22.505859375, 23.5615234375, 24.6171875, 25.6728515625, 26.728515625, 27.7841796875, 28.83984375, 29.8955078125, 30.951171875, 32.0068359375, 33.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 7.0, 14.0, 8.0, 7.0, 21.0, 16.0, 21.0, 25.0, 17.0, 31.0, 32.0, 31.0, 32.0, 34.0, 51.0, 50.0, 49.0, 44.0, 49.0, 51.0, 42.0, 39.0, 37.0, 36.0, 30.0, 23.0, 29.0, 21.0, 29.0, 17.0, 16.0, 19.0, 13.0, 10.0, 9.0, 4.0, 9.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.353759765625, -27.45751953125, -26.561279296875, -25.6650390625, -24.768798828125, -23.87255859375, -22.976318359375, -22.080078125, -21.183837890625, -20.28759765625, -19.391357421875, -18.4951171875, -17.598876953125, -16.70263671875, -15.806396484375, -14.91015625, -14.013916015625, -13.11767578125, -12.221435546875, -11.3251953125, -10.428955078125, -9.53271484375, -8.636474609375, -7.740234375, -6.843994140625, -5.94775390625, -5.051513671875, -4.1552734375, -3.259033203125, -2.36279296875, -1.466552734375, -0.5703125, 0.325927734375, 1.22216796875, 2.118408203125, 3.0146484375, 3.910888671875, 4.80712890625, 5.703369140625, 6.599609375, 7.495849609375, 8.39208984375, 9.288330078125, 10.1845703125, 11.080810546875, 11.97705078125, 12.873291015625, 13.76953125, 14.665771484375, 15.56201171875, 16.458251953125, 17.3544921875, 18.250732421875, 19.14697265625, 20.043212890625, 20.939453125, 21.835693359375, 22.73193359375, 23.628173828125, 24.5244140625, 25.420654296875, 26.31689453125, 27.213134765625, 28.109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 16.0, 33.0, 45.0, 72.0, 94.0, 156.0, 214.0, 336.0, 521.0, 774.0, 1145.0, 1670.0, 2568.0, 4167.0, 6660.0, 10820.0, 17870.0, 30627.0, 53721.0, 91574.0, 150177.0, 205882.0, 181913.0, 117987.0, 69567.0, 39868.0, 22959.0, 13917.0, 8489.0, 5319.0, 3217.0, 2074.0, 1349.0, 924.0, 613.0, 412.0, 249.0, 190.0, 109.0, 75.0, 53.0, 45.0, 28.0, 15.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.28955078125, -34.1416015625, -32.99365234375, -31.845703125, -30.69775390625, -29.5498046875, -28.40185546875, -27.25390625, -26.10595703125, -24.9580078125, -23.81005859375, -22.662109375, -21.51416015625, -20.3662109375, -19.21826171875, -18.0703125, -16.92236328125, -15.7744140625, -14.62646484375, -13.478515625, -12.33056640625, -11.1826171875, -10.03466796875, -8.88671875, -7.73876953125, -6.5908203125, -5.44287109375, -4.294921875, -3.14697265625, -1.9990234375, -0.85107421875, 0.296875, 1.44482421875, 2.5927734375, 3.74072265625, 4.888671875, 6.03662109375, 7.1845703125, 8.33251953125, 9.48046875, 10.62841796875, 11.7763671875, 12.92431640625, 14.072265625, 15.22021484375, 16.3681640625, 17.51611328125, 18.6640625, 19.81201171875, 20.9599609375, 22.10791015625, 23.255859375, 24.40380859375, 25.5517578125, 26.69970703125, 27.84765625, 28.99560546875, 30.1435546875, 31.29150390625, 32.439453125, 33.58740234375, 34.7353515625, 35.88330078125, 37.03125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 12.0, 20.0, 26.0, 31.0, 39.0, 29.0, 29.0, 35.0, 44.0, 35.0, 46.0, 32.0, 36.0, 27.0, 40.0, 42.0, 48.0, 37.0, 36.0, 27.0, 30.0, 43.0, 39.0, 27.0, 24.0, 16.0, 15.0, 11.0, 10.0, 5.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.34375, -15.7919921875, -15.240234375, -14.6884765625, -14.13671875, -13.5849609375, -13.033203125, -12.4814453125, -11.9296875, -11.3779296875, -10.826171875, -10.2744140625, -9.72265625, -9.1708984375, -8.619140625, -8.0673828125, -7.515625, -6.9638671875, -6.412109375, -5.8603515625, -5.30859375, -4.7568359375, -4.205078125, -3.6533203125, -3.1015625, -2.5498046875, -1.998046875, -1.4462890625, -0.89453125, -0.3427734375, 0.208984375, 0.7607421875, 1.3125, 1.8642578125, 2.416015625, 2.9677734375, 3.51953125, 4.0712890625, 4.623046875, 5.1748046875, 5.7265625, 6.2783203125, 6.830078125, 7.3818359375, 7.93359375, 8.4853515625, 9.037109375, 9.5888671875, 10.140625, 10.6923828125, 11.244140625, 11.7958984375, 12.34765625, 12.8994140625, 13.451171875, 14.0029296875, 14.5546875, 15.1064453125, 15.658203125, 16.2099609375, 16.76171875, 17.3134765625, 17.865234375, 18.4169921875, 18.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 8.0, 14.0, 23.0, 21.0, 44.0, 66.0, 68.0, 122.0, 185.0, 291.0, 395.0, 608.0, 1017.0, 1666.0, 3040.0, 5700.0, 11886.0, 27226.0, 70105.0, 209928.0, 423218.0, 183367.0, 62248.0, 24285.0, 10688.0, 5259.0, 2680.0, 1602.0, 951.0, 580.0, 409.0, 269.0, 171.0, 125.0, 92.0, 60.0, 41.0, 33.0, 20.0, 10.0, 12.0, 6.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.109375, -20.392333984375, -19.67529296875, -18.958251953125, -18.2412109375, -17.524169921875, -16.80712890625, -16.090087890625, -15.373046875, -14.656005859375, -13.93896484375, -13.221923828125, -12.5048828125, -11.787841796875, -11.07080078125, -10.353759765625, -9.63671875, -8.919677734375, -8.20263671875, -7.485595703125, -6.7685546875, -6.051513671875, -5.33447265625, -4.617431640625, -3.900390625, -3.183349609375, -2.46630859375, -1.749267578125, -1.0322265625, -0.315185546875, 0.40185546875, 1.118896484375, 1.8359375, 2.552978515625, 3.27001953125, 3.987060546875, 4.7041015625, 5.421142578125, 6.13818359375, 6.855224609375, 7.572265625, 8.289306640625, 9.00634765625, 9.723388671875, 10.4404296875, 11.157470703125, 11.87451171875, 12.591552734375, 13.30859375, 14.025634765625, 14.74267578125, 15.459716796875, 16.1767578125, 16.893798828125, 17.61083984375, 18.327880859375, 19.044921875, 19.761962890625, 20.47900390625, 21.196044921875, 21.9130859375, 22.630126953125, 23.34716796875, 24.064208984375, 24.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 5.0, 13.0, 10.0, 27.0, 39.0, 54.0, 81.0, 125.0, 201.0, 166.0, 106.0, 57.0, 35.0, 20.0, 16.0, 11.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.002658754587173462, -0.0025690197944641113, -0.0024792850017547607, -0.00238955020904541, -0.0022998154163360596, -0.002210080623626709, -0.0021203458309173584, -0.002030611038208008, -0.0019408762454986572, -0.0018511414527893066, -0.001761406660079956, -0.0016716718673706055, -0.0015819370746612549, -0.0014922022819519043, -0.0014024674892425537, -0.0013127326965332031, -0.0012229979038238525, -0.001133263111114502, -0.0010435283184051514, -0.0009537935256958008, -0.0008640587329864502, -0.0007743239402770996, -0.000684589147567749, -0.0005948543548583984, -0.0005051195621490479, -0.00041538476943969727, -0.0003256499767303467, -0.0002359151840209961, -0.0001461803913116455, -5.644559860229492e-05, 3.3289194107055664e-05, 0.00012302398681640625, 0.00021275877952575684, 0.0003024935722351074, 0.000392228364944458, 0.0004819631576538086, 0.0005716979503631592, 0.0006614327430725098, 0.0007511675357818604, 0.0008409023284912109, 0.0009306371212005615, 0.0010203719139099121, 0.0011101067066192627, 0.0011998414993286133, 0.0012895762920379639, 0.0013793110847473145, 0.001469045877456665, 0.0015587806701660156, 0.0016485154628753662, 0.0017382502555847168, 0.0018279850482940674, 0.001917719841003418, 0.0020074546337127686, 0.002097189426422119, 0.0021869242191314697, 0.0022766590118408203, 0.002366393804550171, 0.0024561285972595215, 0.002545863389968872, 0.0026355981826782227, 0.0027253329753875732, 0.002815067768096924, 0.0029048025608062744, 0.002994537353515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 15.0, 23.0, 38.0, 37.0, 56.0, 79.0, 109.0, 137.0, 188.0, 315.0, 418.0, 631.0, 993.0, 1495.0, 2242.0, 3685.0, 6216.0, 10991.0, 19692.0, 37247.0, 74553.0, 156111.0, 280633.0, 225012.0, 109639.0, 53671.0, 27452.0, 15172.0, 8334.0, 4905.0, 2913.0, 1824.0, 1176.0, 790.0, 548.0, 364.0, 222.0, 167.0, 117.0, 81.0, 62.0, 48.0, 23.0, 33.0, 18.0, 18.0, 9.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0], "bins": [-14.78125, -14.28466796875, -13.7880859375, -13.29150390625, -12.794921875, -12.29833984375, -11.8017578125, -11.30517578125, -10.80859375, -10.31201171875, -9.8154296875, -9.31884765625, -8.822265625, -8.32568359375, -7.8291015625, -7.33251953125, -6.8359375, -6.33935546875, -5.8427734375, -5.34619140625, -4.849609375, -4.35302734375, -3.8564453125, -3.35986328125, -2.86328125, -2.36669921875, -1.8701171875, -1.37353515625, -0.876953125, -0.38037109375, 0.1162109375, 0.61279296875, 1.109375, 1.60595703125, 2.1025390625, 2.59912109375, 3.095703125, 3.59228515625, 4.0888671875, 4.58544921875, 5.08203125, 5.57861328125, 6.0751953125, 6.57177734375, 7.068359375, 7.56494140625, 8.0615234375, 8.55810546875, 9.0546875, 9.55126953125, 10.0478515625, 10.54443359375, 11.041015625, 11.53759765625, 12.0341796875, 12.53076171875, 13.02734375, 13.52392578125, 14.0205078125, 14.51708984375, 15.013671875, 15.51025390625, 16.0068359375, 16.50341796875, 17.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 3.0, 4.0, 12.0, 13.0, 10.0, 13.0, 13.0, 23.0, 15.0, 41.0, 32.0, 44.0, 60.0, 53.0, 82.0, 87.0, 80.0, 68.0, 53.0, 40.0, 34.0, 37.0, 26.0, 30.0, 21.0, 21.0, 12.0, 23.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.97265625, -4.8109130859375, -4.649169921875, -4.4874267578125, -4.32568359375, -4.1639404296875, -4.002197265625, -3.8404541015625, -3.6787109375, -3.5169677734375, -3.355224609375, -3.1934814453125, -3.03173828125, -2.8699951171875, -2.708251953125, -2.5465087890625, -2.384765625, -2.2230224609375, -2.061279296875, -1.8995361328125, -1.73779296875, -1.5760498046875, -1.414306640625, -1.2525634765625, -1.0908203125, -0.9290771484375, -0.767333984375, -0.6055908203125, -0.44384765625, -0.2821044921875, -0.120361328125, 0.0413818359375, 0.203125, 0.3648681640625, 0.526611328125, 0.6883544921875, 0.85009765625, 1.0118408203125, 1.173583984375, 1.3353271484375, 1.4970703125, 1.6588134765625, 1.820556640625, 1.9822998046875, 2.14404296875, 2.3057861328125, 2.467529296875, 2.6292724609375, 2.791015625, 2.9527587890625, 3.114501953125, 3.2762451171875, 3.43798828125, 3.5997314453125, 3.761474609375, 3.9232177734375, 4.0849609375, 4.2467041015625, 4.408447265625, 4.5701904296875, 4.73193359375, 4.8936767578125, 5.055419921875, 5.2171630859375, 5.37890625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 12.0, 14.0, 17.0, 24.0, 30.0, 35.0, 55.0, 40.0, 56.0, 76.0, 90.0, 67.0, 73.0, 64.0, 54.0, 52.0, 43.0, 39.0, 26.0, 20.0, 12.0, 14.0, 10.0, 7.0, 10.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.735443115234375, -35.59249496459961, -34.44954299926758, -33.30659484863281, -32.16364288330078, -31.020694732666016, -29.877744674682617, -28.73479461669922, -27.59184455871582, -26.448894500732422, -25.305944442749023, -24.162994384765625, -23.02004623413086, -21.877094268798828, -20.734146118164062, -19.591196060180664, -18.448246002197266, -17.305295944213867, -16.16234588623047, -15.019396781921387, -13.876446723937988, -12.73349666595459, -11.590547561645508, -10.44759750366211, -9.304647445678711, -8.161697387695312, -7.018747806549072, -5.875798225402832, -4.732848167419434, -3.589898109436035, -2.446948528289795, -1.3039989471435547, -0.16104507446289062, 0.9819047451019287, 2.124854564666748, 3.2678043842315674, 4.410754203796387, 5.553704261779785, 6.696653842926025, 7.839603424072266, 8.982553482055664, 10.125503540039062, 11.268453598022461, 12.411402702331543, 13.554352760314941, 14.69730281829834, 15.840251922607422, 16.98320198059082, 18.12615203857422, 19.269102096557617, 20.412052154541016, 21.555002212524414, 22.697952270507812, 23.840900421142578, 24.983850479125977, 26.126800537109375, 27.269750595092773, 28.412700653076172, 29.55565071105957, 30.69860076904297, 31.841548919677734, 32.984500885009766, 34.12744903564453, 35.27040100097656, 36.41334915161133]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 10.0, 10.0, 7.0, 10.0, 13.0, 13.0, 21.0, 23.0, 26.0, 29.0, 45.0, 35.0, 38.0, 33.0, 31.0, 45.0, 50.0, 40.0, 47.0, 37.0, 37.0, 39.0, 43.0, 43.0, 44.0, 25.0, 32.0, 26.0, 21.0, 29.0, 17.0, 17.0, 14.0, 7.0, 14.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.86671257019043, -25.917133331298828, -24.967554092407227, -24.017974853515625, -23.068397521972656, -22.118816375732422, -21.169239044189453, -20.21965980529785, -19.27008056640625, -18.32050132751465, -17.370922088623047, -16.421342849731445, -15.47176456451416, -14.522185325622559, -13.572607040405273, -12.623027801513672, -11.67344856262207, -10.723869323730469, -9.774290084838867, -8.824711799621582, -7.8751325607299805, -6.925553321838379, -5.9759745597839355, -5.026395797729492, -4.076816558837891, -3.127237558364868, -2.1776585578918457, -1.2280795574188232, -0.2785005569458008, 0.6710786819458008, 1.6206574440002441, 2.5702362060546875, 3.5198135375976562, 4.469392776489258, 5.418971538543701, 6.3685503005981445, 7.318129539489746, 8.267708778381348, 9.217287063598633, 10.166866302490234, 11.116445541381836, 12.066024780273438, 13.015604019165039, 13.965182304382324, 14.914761543273926, 15.864340782165527, 16.813919067382812, 17.763498306274414, 18.713077545166016, 19.662656784057617, 20.61223602294922, 21.56181526184082, 22.511394500732422, 23.46097183227539, 24.410551071166992, 25.360130310058594, 26.309709548950195, 27.259288787841797, 28.2088680267334, 29.158447265625, 30.10802459716797, 31.057605743408203, 32.00718307495117, 32.956764221191406, 33.906341552734375]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 12.0, 18.0, 19.0, 25.0, 44.0, 71.0, 76.0, 118.0, 197.0, 265.0, 390.0, 572.0, 816.0, 1203.0, 1902.0, 2836.0, 4372.0, 7179.0, 11711.0, 20385.0, 37611.0, 77496.0, 183391.0, 533117.0, 1277159.0, 1214469.0, 480743.0, 175517.0, 74058.0, 37242.0, 20494.0, 11794.0, 6987.0, 4307.0, 2668.0, 1668.0, 1178.0, 735.0, 471.0, 308.0, 209.0, 151.0, 91.0, 61.0, 47.0, 39.0, 18.0, 12.0, 8.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.5625, -31.39794921875, -30.2333984375, -29.06884765625, -27.904296875, -26.73974609375, -25.5751953125, -24.41064453125, -23.24609375, -22.08154296875, -20.9169921875, -19.75244140625, -18.587890625, -17.42333984375, -16.2587890625, -15.09423828125, -13.9296875, -12.76513671875, -11.6005859375, -10.43603515625, -9.271484375, -8.10693359375, -6.9423828125, -5.77783203125, -4.61328125, -3.44873046875, -2.2841796875, -1.11962890625, 0.044921875, 1.20947265625, 2.3740234375, 3.53857421875, 4.703125, 5.86767578125, 7.0322265625, 8.19677734375, 9.361328125, 10.52587890625, 11.6904296875, 12.85498046875, 14.01953125, 15.18408203125, 16.3486328125, 17.51318359375, 18.677734375, 19.84228515625, 21.0068359375, 22.17138671875, 23.3359375, 24.50048828125, 25.6650390625, 26.82958984375, 27.994140625, 29.15869140625, 30.3232421875, 31.48779296875, 32.65234375, 33.81689453125, 34.9814453125, 36.14599609375, 37.310546875, 38.47509765625, 39.6396484375, 40.80419921875, 41.96875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 9.0, 10.0, 18.0, 22.0, 25.0, 26.0, 28.0, 43.0, 47.0, 27.0, 52.0, 35.0, 49.0, 44.0, 51.0, 51.0, 38.0, 32.0, 52.0, 40.0, 39.0, 38.0, 32.0, 19.0, 23.0, 20.0, 34.0, 12.0, 14.0, 14.0, 5.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.49072265625, -22.6064453125, -21.72216796875, -20.837890625, -19.95361328125, -19.0693359375, -18.18505859375, -17.30078125, -16.41650390625, -15.5322265625, -14.64794921875, -13.763671875, -12.87939453125, -11.9951171875, -11.11083984375, -10.2265625, -9.34228515625, -8.4580078125, -7.57373046875, -6.689453125, -5.80517578125, -4.9208984375, -4.03662109375, -3.15234375, -2.26806640625, -1.3837890625, -0.49951171875, 0.384765625, 1.26904296875, 2.1533203125, 3.03759765625, 3.921875, 4.80615234375, 5.6904296875, 6.57470703125, 7.458984375, 8.34326171875, 9.2275390625, 10.11181640625, 10.99609375, 11.88037109375, 12.7646484375, 13.64892578125, 14.533203125, 15.41748046875, 16.3017578125, 17.18603515625, 18.0703125, 18.95458984375, 19.8388671875, 20.72314453125, 21.607421875, 22.49169921875, 23.3759765625, 24.26025390625, 25.14453125, 26.02880859375, 26.9130859375, 27.79736328125, 28.681640625, 29.56591796875, 30.4501953125, 31.33447265625, 32.21875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 15.0, 18.0, 12.0, 25.0, 39.0, 65.0, 84.0, 125.0, 159.0, 239.0, 366.0, 577.0, 779.0, 1158.0, 1687.0, 2609.0, 3975.0, 6297.0, 10359.0, 16809.0, 28425.0, 50058.0, 93015.0, 182286.0, 385855.0, 886596.0, 1299613.0, 630591.0, 282965.0, 137642.0, 72103.0, 39403.0, 22726.0, 13624.0, 8399.0, 5280.0, 3483.0, 2263.0, 1458.0, 1006.0, 652.0, 471.0, 317.0, 197.0, 162.0, 101.0, 62.0, 44.0, 27.0, 19.0, 19.0, 14.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.25, -36.0966796875, -34.943359375, -33.7900390625, -32.63671875, -31.4833984375, -30.330078125, -29.1767578125, -28.0234375, -26.8701171875, -25.716796875, -24.5634765625, -23.41015625, -22.2568359375, -21.103515625, -19.9501953125, -18.796875, -17.6435546875, -16.490234375, -15.3369140625, -14.18359375, -13.0302734375, -11.876953125, -10.7236328125, -9.5703125, -8.4169921875, -7.263671875, -6.1103515625, -4.95703125, -3.8037109375, -2.650390625, -1.4970703125, -0.34375, 0.8095703125, 1.962890625, 3.1162109375, 4.26953125, 5.4228515625, 6.576171875, 7.7294921875, 8.8828125, 10.0361328125, 11.189453125, 12.3427734375, 13.49609375, 14.6494140625, 15.802734375, 16.9560546875, 18.109375, 19.2626953125, 20.416015625, 21.5693359375, 22.72265625, 23.8759765625, 25.029296875, 26.1826171875, 27.3359375, 28.4892578125, 29.642578125, 30.7958984375, 31.94921875, 33.1025390625, 34.255859375, 35.4091796875, 36.5625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 12.0, 12.0, 14.0, 20.0, 18.0, 26.0, 34.0, 30.0, 38.0, 61.0, 82.0, 105.0, 119.0, 140.0, 189.0, 234.0, 268.0, 330.0, 370.0, 346.0, 281.0, 256.0, 191.0, 164.0, 134.0, 129.0, 88.0, 84.0, 52.0, 44.0, 39.0, 34.0, 28.0, 28.0, 15.0, 13.0, 6.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.78125, -12.3785400390625, -11.975830078125, -11.5731201171875, -11.17041015625, -10.7677001953125, -10.364990234375, -9.9622802734375, -9.5595703125, -9.1568603515625, -8.754150390625, -8.3514404296875, -7.94873046875, -7.5460205078125, -7.143310546875, -6.7406005859375, -6.337890625, -5.9351806640625, -5.532470703125, -5.1297607421875, -4.72705078125, -4.3243408203125, -3.921630859375, -3.5189208984375, -3.1162109375, -2.7135009765625, -2.310791015625, -1.9080810546875, -1.50537109375, -1.1026611328125, -0.699951171875, -0.2972412109375, 0.10546875, 0.5081787109375, 0.910888671875, 1.3135986328125, 1.71630859375, 2.1190185546875, 2.521728515625, 2.9244384765625, 3.3271484375, 3.7298583984375, 4.132568359375, 4.5352783203125, 4.93798828125, 5.3406982421875, 5.743408203125, 6.1461181640625, 6.548828125, 6.9515380859375, 7.354248046875, 7.7569580078125, 8.15966796875, 8.5623779296875, 8.965087890625, 9.3677978515625, 9.7705078125, 10.1732177734375, 10.575927734375, 10.9786376953125, 11.38134765625, 11.7840576171875, 12.186767578125, 12.5894775390625, 12.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 12.0, 17.0, 15.0, 19.0, 28.0, 37.0, 43.0, 58.0, 71.0, 67.0, 68.0, 61.0, 60.0, 71.0, 71.0, 52.0, 51.0, 33.0, 29.0, 24.0, 21.0, 14.0, 7.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9119758605957, -35.81083679199219, -34.709693908691406, -33.60855484008789, -32.507415771484375, -31.406272888183594, -30.305133819580078, -29.20399284362793, -28.10285186767578, -27.001710891723633, -25.900569915771484, -24.79943084716797, -23.69828987121582, -22.597148895263672, -21.496009826660156, -20.394868850708008, -19.29372787475586, -18.19258689880371, -17.091445922851562, -15.990306854248047, -14.889165878295898, -13.78802490234375, -12.686884880065918, -11.585744857788086, -10.484603881835938, -9.383462905883789, -8.282322883605957, -7.181182384490967, -6.080041885375977, -4.978901386260986, -3.877760887145996, -2.776620388031006, -1.6754798889160156, -0.5743393898010254, 0.5268011093139648, 1.627941608428955, 2.7290821075439453, 3.8302226066589355, 4.931363105773926, 6.032503604888916, 7.133644104003906, 8.234785079956055, 9.335925102233887, 10.437065124511719, 11.538206100463867, 12.639347076416016, 13.740487098693848, 14.84162712097168, 15.942768096923828, 17.043909072875977, 18.145050048828125, 19.24618911743164, 20.34733009338379, 21.448471069335938, 22.549610137939453, 23.6507511138916, 24.75189208984375, 25.8530330657959, 26.954174041748047, 28.055313110351562, 29.15645408630371, 30.25759506225586, 31.358734130859375, 32.459877014160156, 33.56101608276367]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 12.0, 9.0, 10.0, 8.0, 18.0, 15.0, 28.0, 21.0, 23.0, 31.0, 32.0, 37.0, 24.0, 32.0, 31.0, 36.0, 45.0, 53.0, 38.0, 37.0, 34.0, 60.0, 27.0, 35.0, 24.0, 29.0, 34.0, 30.0, 20.0, 30.0, 17.0, 25.0, 15.0, 11.0, 10.0, 8.0, 10.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.57047462463379, -25.722055435180664, -24.87363624572754, -24.025217056274414, -23.17679786682129, -22.328378677368164, -21.47995948791504, -20.631540298461914, -19.78312110900879, -18.934701919555664, -18.08628273010254, -17.237863540649414, -16.38944435119629, -15.541025161743164, -14.692605972290039, -13.844186782836914, -12.995767593383789, -12.147348403930664, -11.298929214477539, -10.450510025024414, -9.602090835571289, -8.753671646118164, -7.905252456665039, -7.056833267211914, -6.208414077758789, -5.359994888305664, -4.511575698852539, -3.663156509399414, -2.814737319946289, -1.966318130493164, -1.117898941040039, -0.26947975158691406, 0.5789413452148438, 1.4273605346679688, 2.2757797241210938, 3.1241989135742188, 3.9726181030273438, 4.821037292480469, 5.669456481933594, 6.517875671386719, 7.366294860839844, 8.214714050292969, 9.063133239746094, 9.911552429199219, 10.759971618652344, 11.608390808105469, 12.456809997558594, 13.305229187011719, 14.153648376464844, 15.002067565917969, 15.850486755371094, 16.69890594482422, 17.547325134277344, 18.39574432373047, 19.244163513183594, 20.09258270263672, 20.941001892089844, 21.78942108154297, 22.637840270996094, 23.48625946044922, 24.334678649902344, 25.18309783935547, 26.031517028808594, 26.87993621826172, 27.728355407714844]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 15.0, 16.0, 27.0, 44.0, 45.0, 70.0, 96.0, 143.0, 184.0, 309.0, 418.0, 566.0, 819.0, 1226.0, 1890.0, 2784.0, 4068.0, 6376.0, 9887.0, 15692.0, 24234.0, 39118.0, 65207.0, 112547.0, 192558.0, 222163.0, 138914.0, 79704.0, 47739.0, 29465.0, 18334.0, 11453.0, 7454.0, 4921.0, 3231.0, 2199.0, 1477.0, 956.0, 679.0, 451.0, 321.0, 238.0, 153.0, 100.0, 88.0, 51.0, 31.0, 23.0, 26.0, 16.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0], "bins": [-18.453125, -17.8798828125, -17.306640625, -16.7333984375, -16.16015625, -15.5869140625, -15.013671875, -14.4404296875, -13.8671875, -13.2939453125, -12.720703125, -12.1474609375, -11.57421875, -11.0009765625, -10.427734375, -9.8544921875, -9.28125, -8.7080078125, -8.134765625, -7.5615234375, -6.98828125, -6.4150390625, -5.841796875, -5.2685546875, -4.6953125, -4.1220703125, -3.548828125, -2.9755859375, -2.40234375, -1.8291015625, -1.255859375, -0.6826171875, -0.109375, 0.4638671875, 1.037109375, 1.6103515625, 2.18359375, 2.7568359375, 3.330078125, 3.9033203125, 4.4765625, 5.0498046875, 5.623046875, 6.1962890625, 6.76953125, 7.3427734375, 7.916015625, 8.4892578125, 9.0625, 9.6357421875, 10.208984375, 10.7822265625, 11.35546875, 11.9287109375, 12.501953125, 13.0751953125, 13.6484375, 14.2216796875, 14.794921875, 15.3681640625, 15.94140625, 16.5146484375, 17.087890625, 17.6611328125, 18.234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 7.0, 13.0, 6.0, 13.0, 21.0, 26.0, 31.0, 33.0, 31.0, 35.0, 31.0, 31.0, 26.0, 30.0, 36.0, 51.0, 46.0, 38.0, 51.0, 42.0, 50.0, 33.0, 33.0, 27.0, 32.0, 22.0, 29.0, 22.0, 19.0, 15.0, 18.0, 15.0, 11.0, 9.0, 5.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.8125, -26.935546875, -26.05859375, -25.181640625, -24.3046875, -23.427734375, -22.55078125, -21.673828125, -20.796875, -19.919921875, -19.04296875, -18.166015625, -17.2890625, -16.412109375, -15.53515625, -14.658203125, -13.78125, -12.904296875, -12.02734375, -11.150390625, -10.2734375, -9.396484375, -8.51953125, -7.642578125, -6.765625, -5.888671875, -5.01171875, -4.134765625, -3.2578125, -2.380859375, -1.50390625, -0.626953125, 0.25, 1.126953125, 2.00390625, 2.880859375, 3.7578125, 4.634765625, 5.51171875, 6.388671875, 7.265625, 8.142578125, 9.01953125, 9.896484375, 10.7734375, 11.650390625, 12.52734375, 13.404296875, 14.28125, 15.158203125, 16.03515625, 16.912109375, 17.7890625, 18.666015625, 19.54296875, 20.419921875, 21.296875, 22.173828125, 23.05078125, 23.927734375, 24.8046875, 25.681640625, 26.55859375, 27.435546875, 28.3125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 15.0, 22.0, 24.0, 53.0, 60.0, 118.0, 158.0, 220.0, 375.0, 620.0, 899.0, 1390.0, 2304.0, 3907.0, 6554.0, 11660.0, 21292.0, 41404.0, 89085.0, 231667.0, 359984.0, 146292.0, 61939.0, 30226.0, 16078.0, 8808.0, 5171.0, 3117.0, 1833.0, 1200.0, 704.0, 448.0, 321.0, 201.0, 122.0, 77.0, 51.0, 40.0, 27.0, 19.0, 20.0, 14.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0], "bins": [-38.0, -36.952392578125, -35.90478515625, -34.857177734375, -33.8095703125, -32.761962890625, -31.71435546875, -30.666748046875, -29.619140625, -28.571533203125, -27.52392578125, -26.476318359375, -25.4287109375, -24.381103515625, -23.33349609375, -22.285888671875, -21.23828125, -20.190673828125, -19.14306640625, -18.095458984375, -17.0478515625, -16.000244140625, -14.95263671875, -13.905029296875, -12.857421875, -11.809814453125, -10.76220703125, -9.714599609375, -8.6669921875, -7.619384765625, -6.57177734375, -5.524169921875, -4.4765625, -3.428955078125, -2.38134765625, -1.333740234375, -0.2861328125, 0.761474609375, 1.80908203125, 2.856689453125, 3.904296875, 4.951904296875, 5.99951171875, 7.047119140625, 8.0947265625, 9.142333984375, 10.18994140625, 11.237548828125, 12.28515625, 13.332763671875, 14.38037109375, 15.427978515625, 16.4755859375, 17.523193359375, 18.57080078125, 19.618408203125, 20.666015625, 21.713623046875, 22.76123046875, 23.808837890625, 24.8564453125, 25.904052734375, 26.95166015625, 27.999267578125, 29.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 18.0, 11.0, 19.0, 14.0, 19.0, 26.0, 29.0, 15.0, 30.0, 30.0, 40.0, 41.0, 40.0, 42.0, 38.0, 45.0, 44.0, 35.0, 44.0, 34.0, 30.0, 35.0, 31.0, 33.0, 30.0, 27.0, 26.0, 24.0, 19.0, 13.0, 26.0, 13.0, 9.0, 7.0, 7.0, 7.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.28125, -17.7333984375, -17.185546875, -16.6376953125, -16.08984375, -15.5419921875, -14.994140625, -14.4462890625, -13.8984375, -13.3505859375, -12.802734375, -12.2548828125, -11.70703125, -11.1591796875, -10.611328125, -10.0634765625, -9.515625, -8.9677734375, -8.419921875, -7.8720703125, -7.32421875, -6.7763671875, -6.228515625, -5.6806640625, -5.1328125, -4.5849609375, -4.037109375, -3.4892578125, -2.94140625, -2.3935546875, -1.845703125, -1.2978515625, -0.75, -0.2021484375, 0.345703125, 0.8935546875, 1.44140625, 1.9892578125, 2.537109375, 3.0849609375, 3.6328125, 4.1806640625, 4.728515625, 5.2763671875, 5.82421875, 6.3720703125, 6.919921875, 7.4677734375, 8.015625, 8.5634765625, 9.111328125, 9.6591796875, 10.20703125, 10.7548828125, 11.302734375, 11.8505859375, 12.3984375, 12.9462890625, 13.494140625, 14.0419921875, 14.58984375, 15.1376953125, 15.685546875, 16.2333984375, 16.78125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 14.0, 34.0, 29.0, 69.0, 94.0, 169.0, 303.0, 586.0, 1068.0, 2033.0, 4140.0, 9580.0, 24473.0, 73042.0, 253905.0, 444599.0, 156431.0, 47178.0, 17187.0, 6979.0, 3239.0, 1493.0, 796.0, 451.0, 240.0, 124.0, 88.0, 48.0, 33.0, 32.0, 17.0, 9.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.421875, -10.126708984375, -9.83154296875, -9.536376953125, -9.2412109375, -8.946044921875, -8.65087890625, -8.355712890625, -8.060546875, -7.765380859375, -7.47021484375, -7.175048828125, -6.8798828125, -6.584716796875, -6.28955078125, -5.994384765625, -5.69921875, -5.404052734375, -5.10888671875, -4.813720703125, -4.5185546875, -4.223388671875, -3.92822265625, -3.633056640625, -3.337890625, -3.042724609375, -2.74755859375, -2.452392578125, -2.1572265625, -1.862060546875, -1.56689453125, -1.271728515625, -0.9765625, -0.681396484375, -0.38623046875, -0.091064453125, 0.2041015625, 0.499267578125, 0.79443359375, 1.089599609375, 1.384765625, 1.679931640625, 1.97509765625, 2.270263671875, 2.5654296875, 2.860595703125, 3.15576171875, 3.450927734375, 3.74609375, 4.041259765625, 4.33642578125, 4.631591796875, 4.9267578125, 5.221923828125, 5.51708984375, 5.812255859375, 6.107421875, 6.402587890625, 6.69775390625, 6.992919921875, 7.2880859375, 7.583251953125, 7.87841796875, 8.173583984375, 8.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 17.0, 20.0, 32.0, 43.0, 53.0, 82.0, 77.0, 106.0, 96.0, 87.0, 97.0, 87.0, 42.0, 29.0, 25.0, 19.0, 15.0, 15.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005488395690917969, -0.0005241706967353821, -0.0004995018243789673, -0.0004748329520225525, -0.0004501640796661377, -0.0004254952073097229, -0.0004008263349533081, -0.0003761574625968933, -0.0003514885902404785, -0.0003268197178840637, -0.0003021508455276489, -0.00027748197317123413, -0.00025281310081481934, -0.00022814422845840454, -0.00020347535610198975, -0.00017880648374557495, -0.00015413761138916016, -0.00012946873903274536, -0.00010479986667633057, -8.013099431991577e-05, -5.5462121963500977e-05, -3.079324960708618e-05, -6.124377250671387e-06, 1.8544495105743408e-05, 4.32133674621582e-05, 6.7882239818573e-05, 9.255111217498779e-05, 0.00011721998453140259, 0.00014188885688781738, 0.00016655772924423218, 0.00019122660160064697, 0.00021589547395706177, 0.00024056434631347656, 0.00026523321866989136, 0.00028990209102630615, 0.00031457096338272095, 0.00033923983573913574, 0.00036390870809555054, 0.00038857758045196533, 0.0004132464528083801, 0.0004379153251647949, 0.0004625841975212097, 0.0004872530698776245, 0.0005119219422340393, 0.0005365908145904541, 0.0005612596869468689, 0.0005859285593032837, 0.0006105974316596985, 0.0006352663040161133, 0.0006599351763725281, 0.0006846040487289429, 0.0007092729210853577, 0.0007339417934417725, 0.0007586106657981873, 0.000783279538154602, 0.0008079484105110168, 0.0008326172828674316, 0.0008572861552238464, 0.0008819550275802612, 0.000906623899936676, 0.0009312927722930908, 0.0009559616446495056, 0.0009806305170059204, 0.0010052993893623352, 0.00102996826171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 17.0, 17.0, 42.0, 32.0, 50.0, 46.0, 96.0, 141.0, 219.0, 256.0, 487.0, 758.0, 1385.0, 2547.0, 5326.0, 11856.0, 28825.0, 76813.0, 216077.0, 383154.0, 199802.0, 71561.0, 26952.0, 11196.0, 5057.0, 2501.0, 1269.0, 695.0, 453.0, 247.0, 173.0, 141.0, 102.0, 57.0, 41.0, 41.0, 19.0, 22.0, 14.0, 5.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-11.6484375, -11.3104248046875, -10.972412109375, -10.6343994140625, -10.29638671875, -9.9583740234375, -9.620361328125, -9.2823486328125, -8.9443359375, -8.6063232421875, -8.268310546875, -7.9302978515625, -7.59228515625, -7.2542724609375, -6.916259765625, -6.5782470703125, -6.240234375, -5.9022216796875, -5.564208984375, -5.2261962890625, -4.88818359375, -4.5501708984375, -4.212158203125, -3.8741455078125, -3.5361328125, -3.1981201171875, -2.860107421875, -2.5220947265625, -2.18408203125, -1.8460693359375, -1.508056640625, -1.1700439453125, -0.83203125, -0.4940185546875, -0.156005859375, 0.1820068359375, 0.52001953125, 0.8580322265625, 1.196044921875, 1.5340576171875, 1.8720703125, 2.2100830078125, 2.548095703125, 2.8861083984375, 3.22412109375, 3.5621337890625, 3.900146484375, 4.2381591796875, 4.576171875, 4.9141845703125, 5.252197265625, 5.5902099609375, 5.92822265625, 6.2662353515625, 6.604248046875, 6.9422607421875, 7.2802734375, 7.6182861328125, 7.956298828125, 8.2943115234375, 8.63232421875, 8.9703369140625, 9.308349609375, 9.6463623046875, 9.984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 0.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 15.0, 29.0, 23.0, 45.0, 44.0, 60.0, 77.0, 71.0, 92.0, 101.0, 71.0, 67.0, 53.0, 36.0, 32.0, 29.0, 21.0, 19.0, 16.0, 11.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.2362060546875, -2.156005859375, -2.0758056640625, -1.99560546875, -1.9154052734375, -1.835205078125, -1.7550048828125, -1.6748046875, -1.5946044921875, -1.514404296875, -1.4342041015625, -1.35400390625, -1.2738037109375, -1.193603515625, -1.1134033203125, -1.033203125, -0.9530029296875, -0.872802734375, -0.7926025390625, -0.71240234375, -0.6322021484375, -0.552001953125, -0.4718017578125, -0.3916015625, -0.3114013671875, -0.231201171875, -0.1510009765625, -0.07080078125, 0.0093994140625, 0.089599609375, 0.1697998046875, 0.25, 0.3302001953125, 0.410400390625, 0.4906005859375, 0.57080078125, 0.6510009765625, 0.731201171875, 0.8114013671875, 0.8916015625, 0.9718017578125, 1.052001953125, 1.1322021484375, 1.21240234375, 1.2926025390625, 1.372802734375, 1.4530029296875, 1.533203125, 1.6134033203125, 1.693603515625, 1.7738037109375, 1.85400390625, 1.9342041015625, 2.014404296875, 2.0946044921875, 2.1748046875, 2.2550048828125, 2.335205078125, 2.4154052734375, 2.49560546875, 2.5758056640625, 2.656005859375, 2.7362060546875, 2.81640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 14.0, 13.0, 25.0, 32.0, 44.0, 44.0, 53.0, 69.0, 70.0, 64.0, 66.0, 56.0, 57.0, 79.0, 63.0, 35.0, 37.0, 31.0, 20.0, 20.0, 15.0, 9.0, 8.0, 10.0, 4.0, 1.0, 7.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.088653564453125, -34.002357482910156, -32.91605758666992, -31.829761505126953, -30.74346351623535, -29.65716552734375, -28.57086944580078, -27.48457145690918, -26.398273468017578, -25.311975479125977, -24.225677490234375, -23.139381408691406, -22.053083419799805, -20.966785430908203, -19.880489349365234, -18.794191360473633, -17.70789337158203, -16.62159538269043, -15.535298347473145, -14.44900131225586, -13.362703323364258, -12.276405334472656, -11.190108299255371, -10.103811264038086, -9.017513275146484, -7.931215763092041, -6.844918251037598, -5.758620738983154, -4.672323226928711, -3.5860257148742676, -2.499728202819824, -1.4134306907653809, -0.3271331787109375, 0.7591643333435059, 1.8454618453979492, 2.9317593574523926, 4.018056869506836, 5.104354381561279, 6.190651893615723, 7.276949405670166, 8.36324691772461, 9.449544906616211, 10.535841941833496, 11.622138977050781, 12.708436965942383, 13.794734954833984, 14.88103199005127, 15.967329025268555, 17.053627014160156, 18.139925003051758, 19.22622299194336, 20.312519073486328, 21.39881706237793, 22.48511505126953, 23.5714111328125, 24.6577091217041, 25.744007110595703, 26.830305099487305, 27.916603088378906, 29.002899169921875, 30.089197158813477, 31.175495147705078, 32.26179122924805, 33.34809112548828, 34.43438720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 10.0, 10.0, 10.0, 16.0, 16.0, 25.0, 18.0, 33.0, 36.0, 31.0, 28.0, 28.0, 29.0, 35.0, 38.0, 41.0, 47.0, 41.0, 38.0, 39.0, 47.0, 40.0, 30.0, 29.0, 24.0, 35.0, 27.0, 25.0, 22.0, 27.0, 17.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.153217315673828, -25.315322875976562, -24.477428436279297, -23.639535903930664, -22.8016414642334, -21.963747024536133, -21.1258544921875, -20.287960052490234, -19.45006561279297, -18.612171173095703, -17.774276733398438, -16.936384201049805, -16.09848976135254, -15.260595321655273, -14.422701835632324, -13.584808349609375, -12.74691390991211, -11.909019470214844, -11.071125984191895, -10.233232498168945, -9.39533805847168, -8.557443618774414, -7.719550132751465, -6.881656169891357, -6.04376220703125, -5.205868244171143, -4.367974281311035, -3.5300803184509277, -2.6921863555908203, -1.854292392730713, -1.0163984298706055, -0.17850446701049805, 0.6593914031982422, 1.4972853660583496, 2.335179328918457, 3.1730732917785645, 4.010967254638672, 4.848861217498779, 5.686755180358887, 6.524649143218994, 7.362543106079102, 8.200437545776367, 9.038331031799316, 9.876224517822266, 10.714118957519531, 11.552013397216797, 12.389906883239746, 13.227800369262695, 14.065694808959961, 14.903589248657227, 15.741482734680176, 16.579376220703125, 17.41727066040039, 18.255165100097656, 19.093059539794922, 19.930952072143555, 20.76884651184082, 21.606740951538086, 22.44463348388672, 23.282527923583984, 24.12042236328125, 24.958316802978516, 25.79621124267578, 26.634103775024414, 27.47199821472168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 6.0, 11.0, 10.0, 30.0, 42.0, 66.0, 77.0, 115.0, 167.0, 243.0, 438.0, 580.0, 929.0, 1464.0, 2248.0, 3696.0, 5803.0, 9707.0, 16143.0, 28077.0, 49471.0, 89902.0, 163310.0, 240956.0, 189486.0, 106744.0, 58149.0, 32629.0, 18789.0, 10990.0, 6740.0, 4184.0, 2607.0, 1676.0, 1039.0, 693.0, 430.0, 300.0, 199.0, 150.0, 75.0, 62.0, 36.0, 20.0, 19.0, 12.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9375, -35.73193359375, -34.5263671875, -33.32080078125, -32.115234375, -30.90966796875, -29.7041015625, -28.49853515625, -27.29296875, -26.08740234375, -24.8818359375, -23.67626953125, -22.470703125, -21.26513671875, -20.0595703125, -18.85400390625, -17.6484375, -16.44287109375, -15.2373046875, -14.03173828125, -12.826171875, -11.62060546875, -10.4150390625, -9.20947265625, -8.00390625, -6.79833984375, -5.5927734375, -4.38720703125, -3.181640625, -1.97607421875, -0.7705078125, 0.43505859375, 1.640625, 2.84619140625, 4.0517578125, 5.25732421875, 6.462890625, 7.66845703125, 8.8740234375, 10.07958984375, 11.28515625, 12.49072265625, 13.6962890625, 14.90185546875, 16.107421875, 17.31298828125, 18.5185546875, 19.72412109375, 20.9296875, 22.13525390625, 23.3408203125, 24.54638671875, 25.751953125, 26.95751953125, 28.1630859375, 29.36865234375, 30.57421875, 31.77978515625, 32.9853515625, 34.19091796875, 35.396484375, 36.60205078125, 37.8076171875, 39.01318359375, 40.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 14.0, 12.0, 9.0, 10.0, 13.0, 12.0, 19.0, 20.0, 35.0, 35.0, 36.0, 35.0, 29.0, 33.0, 26.0, 41.0, 51.0, 44.0, 48.0, 48.0, 43.0, 30.0, 52.0, 38.0, 24.0, 32.0, 26.0, 27.0, 22.0, 19.0, 27.0, 16.0, 19.0, 14.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.515625, -26.6328125, -25.75, -24.8671875, -23.984375, -23.1015625, -22.21875, -21.3359375, -20.453125, -19.5703125, -18.6875, -17.8046875, -16.921875, -16.0390625, -15.15625, -14.2734375, -13.390625, -12.5078125, -11.625, -10.7421875, -9.859375, -8.9765625, -8.09375, -7.2109375, -6.328125, -5.4453125, -4.5625, -3.6796875, -2.796875, -1.9140625, -1.03125, -0.1484375, 0.734375, 1.6171875, 2.5, 3.3828125, 4.265625, 5.1484375, 6.03125, 6.9140625, 7.796875, 8.6796875, 9.5625, 10.4453125, 11.328125, 12.2109375, 13.09375, 13.9765625, 14.859375, 15.7421875, 16.625, 17.5078125, 18.390625, 19.2734375, 20.15625, 21.0390625, 21.921875, 22.8046875, 23.6875, 24.5703125, 25.453125, 26.3359375, 27.21875, 28.1015625, 28.984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 9.0, 19.0, 30.0, 45.0, 50.0, 80.0, 100.0, 136.0, 198.0, 285.0, 390.0, 628.0, 905.0, 1238.0, 1957.0, 2678.0, 3993.0, 5928.0, 9163.0, 14176.0, 22019.0, 33987.0, 54456.0, 86907.0, 132918.0, 177215.0, 168148.0, 119601.0, 76215.0, 48193.0, 30421.0, 19134.0, 12442.0, 8096.0, 5322.0, 3658.0, 2421.0, 1627.0, 1078.0, 852.0, 543.0, 395.0, 272.0, 189.0, 125.0, 85.0, 65.0, 52.0, 26.0, 31.0, 11.0, 14.0, 8.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-32.53125, -31.51025390625, -30.4892578125, -29.46826171875, -28.447265625, -27.42626953125, -26.4052734375, -25.38427734375, -24.36328125, -23.34228515625, -22.3212890625, -21.30029296875, -20.279296875, -19.25830078125, -18.2373046875, -17.21630859375, -16.1953125, -15.17431640625, -14.1533203125, -13.13232421875, -12.111328125, -11.09033203125, -10.0693359375, -9.04833984375, -8.02734375, -7.00634765625, -5.9853515625, -4.96435546875, -3.943359375, -2.92236328125, -1.9013671875, -0.88037109375, 0.140625, 1.16162109375, 2.1826171875, 3.20361328125, 4.224609375, 5.24560546875, 6.2666015625, 7.28759765625, 8.30859375, 9.32958984375, 10.3505859375, 11.37158203125, 12.392578125, 13.41357421875, 14.4345703125, 15.45556640625, 16.4765625, 17.49755859375, 18.5185546875, 19.53955078125, 20.560546875, 21.58154296875, 22.6025390625, 23.62353515625, 24.64453125, 25.66552734375, 26.6865234375, 27.70751953125, 28.728515625, 29.74951171875, 30.7705078125, 31.79150390625, 32.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 8.0, 10.0, 19.0, 15.0, 16.0, 22.0, 23.0, 29.0, 35.0, 41.0, 42.0, 44.0, 29.0, 40.0, 57.0, 49.0, 35.0, 46.0, 50.0, 51.0, 44.0, 34.0, 32.0, 36.0, 29.0, 28.0, 18.0, 20.0, 13.0, 10.0, 11.0, 12.0, 8.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.2021484375, -20.560546875, -19.9189453125, -19.27734375, -18.6357421875, -17.994140625, -17.3525390625, -16.7109375, -16.0693359375, -15.427734375, -14.7861328125, -14.14453125, -13.5029296875, -12.861328125, -12.2197265625, -11.578125, -10.9365234375, -10.294921875, -9.6533203125, -9.01171875, -8.3701171875, -7.728515625, -7.0869140625, -6.4453125, -5.8037109375, -5.162109375, -4.5205078125, -3.87890625, -3.2373046875, -2.595703125, -1.9541015625, -1.3125, -0.6708984375, -0.029296875, 0.6123046875, 1.25390625, 1.8955078125, 2.537109375, 3.1787109375, 3.8203125, 4.4619140625, 5.103515625, 5.7451171875, 6.38671875, 7.0283203125, 7.669921875, 8.3115234375, 8.953125, 9.5947265625, 10.236328125, 10.8779296875, 11.51953125, 12.1611328125, 12.802734375, 13.4443359375, 14.0859375, 14.7275390625, 15.369140625, 16.0107421875, 16.65234375, 17.2939453125, 17.935546875, 18.5771484375, 19.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 18.0, 23.0, 57.0, 68.0, 127.0, 163.0, 285.0, 440.0, 856.0, 1379.0, 2435.0, 4581.0, 9096.0, 18975.0, 42703.0, 102665.0, 258287.0, 340391.0, 151950.0, 61396.0, 26562.0, 12362.0, 6187.0, 3248.0, 1709.0, 991.0, 584.0, 350.0, 206.0, 124.0, 95.0, 68.0, 50.0, 23.0, 18.0, 13.0, 14.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.21875, -17.61572265625, -17.0126953125, -16.40966796875, -15.806640625, -15.20361328125, -14.6005859375, -13.99755859375, -13.39453125, -12.79150390625, -12.1884765625, -11.58544921875, -10.982421875, -10.37939453125, -9.7763671875, -9.17333984375, -8.5703125, -7.96728515625, -7.3642578125, -6.76123046875, -6.158203125, -5.55517578125, -4.9521484375, -4.34912109375, -3.74609375, -3.14306640625, -2.5400390625, -1.93701171875, -1.333984375, -0.73095703125, -0.1279296875, 0.47509765625, 1.078125, 1.68115234375, 2.2841796875, 2.88720703125, 3.490234375, 4.09326171875, 4.6962890625, 5.29931640625, 5.90234375, 6.50537109375, 7.1083984375, 7.71142578125, 8.314453125, 8.91748046875, 9.5205078125, 10.12353515625, 10.7265625, 11.32958984375, 11.9326171875, 12.53564453125, 13.138671875, 13.74169921875, 14.3447265625, 14.94775390625, 15.55078125, 16.15380859375, 16.7568359375, 17.35986328125, 17.962890625, 18.56591796875, 19.1689453125, 19.77197265625, 20.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 5.0, 16.0, 25.0, 60.0, 74.0, 114.0, 131.0, 164.0, 143.0, 92.0, 66.0, 41.0, 16.0, 19.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036602020263671875, -0.0035697519779205322, -0.003479301929473877, -0.0033888518810272217, -0.0032984018325805664, -0.003207951784133911, -0.003117501735687256, -0.0030270516872406006, -0.0029366016387939453, -0.00284615159034729, -0.0027557015419006348, -0.0026652514934539795, -0.0025748014450073242, -0.002484351396560669, -0.0023939013481140137, -0.0023034512996673584, -0.002213001251220703, -0.002122551202774048, -0.0020321011543273926, -0.0019416511058807373, -0.001851201057434082, -0.0017607510089874268, -0.0016703009605407715, -0.0015798509120941162, -0.001489400863647461, -0.0013989508152008057, -0.0013085007667541504, -0.0012180507183074951, -0.0011276006698608398, -0.0010371506214141846, -0.0009467005729675293, -0.000856250524520874, -0.0007658004760742188, -0.0006753504276275635, -0.0005849003791809082, -0.0004944503307342529, -0.00040400028228759766, -0.0003135502338409424, -0.0002231001853942871, -0.00013265013694763184, -4.220008850097656e-05, 4.824995994567871e-05, 0.00013870000839233398, 0.00022915005683898926, 0.00031960010528564453, 0.0004100501537322998, 0.0005005002021789551, 0.0005909502506256104, 0.0006814002990722656, 0.0007718503475189209, 0.0008623003959655762, 0.0009527504444122314, 0.0010432004928588867, 0.001133650541305542, 0.0012241005897521973, 0.0013145506381988525, 0.0014050006866455078, 0.001495450735092163, 0.0015859007835388184, 0.0016763508319854736, 0.001766800880432129, 0.0018572509288787842, 0.0019477009773254395, 0.0020381510257720947, 0.00212860107421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 8.0, 3.0, 6.0, 9.0, 14.0, 13.0, 32.0, 28.0, 41.0, 50.0, 66.0, 105.0, 143.0, 221.0, 266.0, 409.0, 664.0, 898.0, 1542.0, 2628.0, 4467.0, 7893.0, 14613.0, 29231.0, 61383.0, 134249.0, 265373.0, 264964.0, 134512.0, 61556.0, 28974.0, 14741.0, 7833.0, 4357.0, 2545.0, 1601.0, 1011.0, 685.0, 415.0, 292.0, 205.0, 140.0, 94.0, 72.0, 53.0, 43.0, 33.0, 24.0, 7.0, 13.0, 12.0, 10.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.484375, -16.93798828125, -16.3916015625, -15.84521484375, -15.298828125, -14.75244140625, -14.2060546875, -13.65966796875, -13.11328125, -12.56689453125, -12.0205078125, -11.47412109375, -10.927734375, -10.38134765625, -9.8349609375, -9.28857421875, -8.7421875, -8.19580078125, -7.6494140625, -7.10302734375, -6.556640625, -6.01025390625, -5.4638671875, -4.91748046875, -4.37109375, -3.82470703125, -3.2783203125, -2.73193359375, -2.185546875, -1.63916015625, -1.0927734375, -0.54638671875, 0.0, 0.54638671875, 1.0927734375, 1.63916015625, 2.185546875, 2.73193359375, 3.2783203125, 3.82470703125, 4.37109375, 4.91748046875, 5.4638671875, 6.01025390625, 6.556640625, 7.10302734375, 7.6494140625, 8.19580078125, 8.7421875, 9.28857421875, 9.8349609375, 10.38134765625, 10.927734375, 11.47412109375, 12.0205078125, 12.56689453125, 13.11328125, 13.65966796875, 14.2060546875, 14.75244140625, 15.298828125, 15.84521484375, 16.3916015625, 16.93798828125, 17.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 8.0, 9.0, 9.0, 17.0, 23.0, 28.0, 40.0, 55.0, 64.0, 68.0, 92.0, 85.0, 91.0, 100.0, 67.0, 47.0, 46.0, 34.0, 16.0, 20.0, 12.0, 20.0, 10.0, 7.0, 8.0, 2.0, 9.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.54296875, -6.33160400390625, -6.1202392578125, -5.90887451171875, -5.697509765625, -5.48614501953125, -5.2747802734375, -5.06341552734375, -4.85205078125, -4.64068603515625, -4.4293212890625, -4.21795654296875, -4.006591796875, -3.79522705078125, -3.5838623046875, -3.37249755859375, -3.1611328125, -2.94976806640625, -2.7384033203125, -2.52703857421875, -2.315673828125, -2.10430908203125, -1.8929443359375, -1.68157958984375, -1.47021484375, -1.25885009765625, -1.0474853515625, -0.83612060546875, -0.624755859375, -0.41339111328125, -0.2020263671875, 0.00933837890625, 0.220703125, 0.43206787109375, 0.6434326171875, 0.85479736328125, 1.066162109375, 1.27752685546875, 1.4888916015625, 1.70025634765625, 1.91162109375, 2.12298583984375, 2.3343505859375, 2.54571533203125, 2.757080078125, 2.96844482421875, 3.1798095703125, 3.39117431640625, 3.6025390625, 3.81390380859375, 4.0252685546875, 4.23663330078125, 4.447998046875, 4.65936279296875, 4.8707275390625, 5.08209228515625, 5.29345703125, 5.50482177734375, 5.7161865234375, 5.92755126953125, 6.138916015625, 6.35028076171875, 6.5616455078125, 6.77301025390625, 6.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 2.0, 13.0, 9.0, 14.0, 18.0, 29.0, 26.0, 28.0, 38.0, 41.0, 55.0, 38.0, 60.0, 51.0, 69.0, 65.0, 53.0, 62.0, 50.0, 46.0, 40.0, 31.0, 29.0, 24.0, 17.0, 12.0, 17.0, 8.0, 11.0, 3.0, 3.0, 9.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.605167388916016, -27.641395568847656, -26.67762565612793, -25.71385383605957, -24.75008201599121, -23.786312103271484, -22.822540283203125, -21.858768463134766, -20.894996643066406, -19.931224822998047, -18.96745491027832, -18.00368309020996, -17.0399112701416, -16.076141357421875, -15.112369537353516, -14.148597717285156, -13.18482780456543, -12.221056938171387, -11.257285118103027, -10.293514251708984, -9.329742431640625, -8.365971565246582, -7.402200698852539, -6.438429355621338, -5.474658012390137, -4.5108866691589355, -3.5471155643463135, -2.5833444595336914, -1.6195731163024902, -0.6558017730712891, 0.3079690933227539, 1.271740436553955, 2.2355117797851562, 3.1992831230163574, 4.163054466247559, 5.126825332641602, 6.090596675872803, 7.054368019104004, 8.018138885498047, 8.981910705566406, 9.94568157196045, 10.909452438354492, 11.873224258422852, 12.836995124816895, 13.800765991210938, 14.764537811279297, 15.72830867767334, 16.692079544067383, 17.655851364135742, 18.6196231842041, 19.583393096923828, 20.547164916992188, 21.510936737060547, 22.474708557128906, 23.438478469848633, 24.402250289916992, 25.36602020263672, 26.329792022705078, 27.293561935424805, 28.257333755493164, 29.221105575561523, 30.18487548828125, 31.14864730834961, 32.11241912841797, 33.07619094848633]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 22.0, 35.0, 29.0, 38.0, 34.0, 41.0, 47.0, 31.0, 46.0, 34.0, 47.0, 44.0, 38.0, 49.0, 43.0, 36.0, 33.0, 35.0, 36.0, 37.0, 16.0, 28.0, 20.0, 21.0, 16.0, 8.0, 5.0, 7.0, 2.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.032825469970703, -26.050125122070312, -25.06742286682129, -24.0847225189209, -23.102020263671875, -22.119319915771484, -21.136619567871094, -20.15391731262207, -19.17121696472168, -18.18851661682129, -17.205814361572266, -16.223114013671875, -15.240412712097168, -14.257711410522461, -13.275010108947754, -12.292308807373047, -11.30960750579834, -10.326906204223633, -9.344204902648926, -8.361503601074219, -7.378803253173828, -6.396101951599121, -5.413400650024414, -4.430699825286865, -3.447998523712158, -2.4652974605560303, -1.4825962781906128, -0.4998950958251953, 0.4828059673309326, 1.4655070304870605, 2.4482083320617676, 3.4309091567993164, 4.413610458374023, 5.3963117599487305, 6.379012584686279, 7.361713886260986, 8.344414710998535, 9.327116012573242, 10.30981731414795, 11.292518615722656, 12.275218963623047, 13.257920265197754, 14.240621566772461, 15.223321914672852, 16.206024169921875, 17.188724517822266, 18.171424865722656, 19.15412712097168, 20.136829376220703, 21.119529724121094, 22.102231979370117, 23.084932327270508, 24.06763458251953, 25.050334930419922, 26.033035278320312, 27.015737533569336, 27.998437881469727, 28.981138229370117, 29.96384048461914, 30.94654083251953, 31.929243087768555, 32.91194152832031, 33.89464569091797, 34.87734603881836, 35.86004638671875]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 3.0, 14.0, 20.0, 24.0, 55.0, 79.0, 131.0, 167.0, 234.0, 297.0, 439.0, 567.0, 876.0, 1287.0, 1775.0, 2838.0, 4263.0, 6501.0, 10682.0, 17277.0, 29531.0, 53876.0, 107253.0, 249101.0, 647771.0, 1288494.0, 1009853.0, 419475.0, 167094.0, 75940.0, 39902.0, 22446.0, 13199.0, 8167.0, 4925.0, 3263.0, 2065.0, 1430.0, 923.0, 641.0, 424.0, 297.0, 176.0, 131.0, 111.0, 76.0, 45.0, 48.0, 36.0, 23.0, 11.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.6875, -31.58935546875, -30.4912109375, -29.39306640625, -28.294921875, -27.19677734375, -26.0986328125, -25.00048828125, -23.90234375, -22.80419921875, -21.7060546875, -20.60791015625, -19.509765625, -18.41162109375, -17.3134765625, -16.21533203125, -15.1171875, -14.01904296875, -12.9208984375, -11.82275390625, -10.724609375, -9.62646484375, -8.5283203125, -7.43017578125, -6.33203125, -5.23388671875, -4.1357421875, -3.03759765625, -1.939453125, -0.84130859375, 0.2568359375, 1.35498046875, 2.453125, 3.55126953125, 4.6494140625, 5.74755859375, 6.845703125, 7.94384765625, 9.0419921875, 10.14013671875, 11.23828125, 12.33642578125, 13.4345703125, 14.53271484375, 15.630859375, 16.72900390625, 17.8271484375, 18.92529296875, 20.0234375, 21.12158203125, 22.2197265625, 23.31787109375, 24.416015625, 25.51416015625, 26.6123046875, 27.71044921875, 28.80859375, 29.90673828125, 31.0048828125, 32.10302734375, 33.201171875, 34.29931640625, 35.3974609375, 36.49560546875, 37.59375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 10.0, 21.0, 21.0, 22.0, 27.0, 31.0, 28.0, 36.0, 29.0, 31.0, 31.0, 45.0, 42.0, 37.0, 49.0, 53.0, 44.0, 45.0, 38.0, 36.0, 40.0, 27.0, 27.0, 38.0, 24.0, 20.0, 20.0, 18.0, 15.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.140625, -22.302490234375, -21.46435546875, -20.626220703125, -19.7880859375, -18.949951171875, -18.11181640625, -17.273681640625, -16.435546875, -15.597412109375, -14.75927734375, -13.921142578125, -13.0830078125, -12.244873046875, -11.40673828125, -10.568603515625, -9.73046875, -8.892333984375, -8.05419921875, -7.216064453125, -6.3779296875, -5.539794921875, -4.70166015625, -3.863525390625, -3.025390625, -2.187255859375, -1.34912109375, -0.510986328125, 0.3271484375, 1.165283203125, 2.00341796875, 2.841552734375, 3.6796875, 4.517822265625, 5.35595703125, 6.194091796875, 7.0322265625, 7.870361328125, 8.70849609375, 9.546630859375, 10.384765625, 11.222900390625, 12.06103515625, 12.899169921875, 13.7373046875, 14.575439453125, 15.41357421875, 16.251708984375, 17.08984375, 17.927978515625, 18.76611328125, 19.604248046875, 20.4423828125, 21.280517578125, 22.11865234375, 22.956787109375, 23.794921875, 24.633056640625, 25.47119140625, 26.309326171875, 27.1474609375, 27.985595703125, 28.82373046875, 29.661865234375, 30.5]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 19.0, 24.0, 42.0, 40.0, 76.0, 111.0, 176.0, 274.0, 433.0, 708.0, 1240.0, 2214.0, 4057.0, 7333.0, 14404.0, 28458.0, 60369.0, 136011.0, 341527.0, 971845.0, 1569859.0, 634232.0, 233085.0, 97480.0, 44507.0, 21347.0, 11012.0, 5792.0, 3156.0, 1812.0, 1018.0, 575.0, 366.0, 210.0, 152.0, 85.0, 70.0, 49.0, 28.0, 17.0, 17.0, 12.0, 8.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-50.40625, -48.845703125, -47.28515625, -45.724609375, -44.1640625, -42.603515625, -41.04296875, -39.482421875, -37.921875, -36.361328125, -34.80078125, -33.240234375, -31.6796875, -30.119140625, -28.55859375, -26.998046875, -25.4375, -23.876953125, -22.31640625, -20.755859375, -19.1953125, -17.634765625, -16.07421875, -14.513671875, -12.953125, -11.392578125, -9.83203125, -8.271484375, -6.7109375, -5.150390625, -3.58984375, -2.029296875, -0.46875, 1.091796875, 2.65234375, 4.212890625, 5.7734375, 7.333984375, 8.89453125, 10.455078125, 12.015625, 13.576171875, 15.13671875, 16.697265625, 18.2578125, 19.818359375, 21.37890625, 22.939453125, 24.5, 26.060546875, 27.62109375, 29.181640625, 30.7421875, 32.302734375, 33.86328125, 35.423828125, 36.984375, 38.544921875, 40.10546875, 41.666015625, 43.2265625, 44.787109375, 46.34765625, 47.908203125, 49.46875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 1.0, 2.0, 4.0, 8.0, 8.0, 16.0, 16.0, 16.0, 34.0, 39.0, 48.0, 68.0, 98.0, 106.0, 149.0, 178.0, 220.0, 296.0, 353.0, 381.0, 383.0, 309.0, 315.0, 240.0, 172.0, 138.0, 104.0, 97.0, 58.0, 57.0, 39.0, 27.0, 22.0, 22.0, 15.0, 16.0, 4.0, 12.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.066650390625, -12.58642578125, -12.106201171875, -11.6259765625, -11.145751953125, -10.66552734375, -10.185302734375, -9.705078125, -9.224853515625, -8.74462890625, -8.264404296875, -7.7841796875, -7.303955078125, -6.82373046875, -6.343505859375, -5.86328125, -5.383056640625, -4.90283203125, -4.422607421875, -3.9423828125, -3.462158203125, -2.98193359375, -2.501708984375, -2.021484375, -1.541259765625, -1.06103515625, -0.580810546875, -0.1005859375, 0.379638671875, 0.85986328125, 1.340087890625, 1.8203125, 2.300537109375, 2.78076171875, 3.260986328125, 3.7412109375, 4.221435546875, 4.70166015625, 5.181884765625, 5.662109375, 6.142333984375, 6.62255859375, 7.102783203125, 7.5830078125, 8.063232421875, 8.54345703125, 9.023681640625, 9.50390625, 9.984130859375, 10.46435546875, 10.944580078125, 11.4248046875, 11.905029296875, 12.38525390625, 12.865478515625, 13.345703125, 13.825927734375, 14.30615234375, 14.786376953125, 15.2666015625, 15.746826171875, 16.22705078125, 16.707275390625, 17.1875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 8.0, 15.0, 16.0, 19.0, 18.0, 25.0, 45.0, 37.0, 47.0, 47.0, 55.0, 66.0, 66.0, 72.0, 74.0, 57.0, 52.0, 55.0, 34.0, 33.0, 31.0, 19.0, 13.0, 14.0, 14.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.146879196166992, -28.024721145629883, -26.902563095092773, -25.78040313720703, -24.658245086669922, -23.536087036132812, -22.413928985595703, -21.291770935058594, -20.169612884521484, -19.047454833984375, -17.925296783447266, -16.803138732910156, -15.680978775024414, -14.558820724487305, -13.436662673950195, -12.314504623413086, -11.192344665527344, -10.070186614990234, -8.948027610778809, -7.825869560241699, -6.703711032867432, -5.581552505493164, -4.459394454956055, -3.337235927581787, -2.2150774002075195, -1.0929189920425415, 0.029239416122436523, 1.151397705078125, 2.2735562324523926, 3.39571475982666, 4.5178728103637695, 5.640031337738037, 6.762187957763672, 7.8843464851379395, 9.006505012512207, 10.128663063049316, 11.250822067260742, 12.372980117797852, 13.495138168334961, 14.61729621887207, 15.739455223083496, 16.861614227294922, 17.98377227783203, 19.10593032836914, 20.22808837890625, 21.35024642944336, 22.47240447998047, 23.59456443786621, 24.71672248840332, 25.83888053894043, 26.96103858947754, 28.08319854736328, 29.20535659790039, 30.3275146484375, 31.44967269897461, 32.57183074951172, 33.69398880004883, 34.81614685058594, 35.93830490112305, 37.060462951660156, 38.182621002197266, 39.304779052734375, 40.42694091796875, 41.54909896850586, 42.67125701904297]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 10.0, 11.0, 8.0, 23.0, 25.0, 18.0, 34.0, 33.0, 18.0, 30.0, 41.0, 42.0, 46.0, 40.0, 26.0, 41.0, 38.0, 40.0, 44.0, 40.0, 47.0, 50.0, 28.0, 35.0, 39.0, 23.0, 16.0, 16.0, 26.0, 18.0, 18.0, 6.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.92987823486328, -26.966094970703125, -26.00231170654297, -25.03852653503418, -24.074743270874023, -23.110960006713867, -22.14717674255371, -21.183391571044922, -20.219608306884766, -19.25582504272461, -18.292041778564453, -17.328256607055664, -16.364473342895508, -15.400690078735352, -14.436906814575195, -13.473122596740723, -12.509339332580566, -11.54555606842041, -10.581771850585938, -9.617988586425781, -8.654204368591309, -7.690421104431152, -6.726637363433838, -5.762853622436523, -4.799069881439209, -3.8352861404418945, -2.87150239944458, -1.9077188968658447, -0.9439351558685303, 0.019848346710205078, 0.9836320877075195, 1.947415828704834, 2.9111995697021484, 3.874983310699463, 4.838767051696777, 5.802550315856934, 6.766334533691406, 7.7301177978515625, 8.693901062011719, 9.657685279846191, 10.621469497680664, 11.58525276184082, 12.549036979675293, 13.51282024383545, 14.476604461669922, 15.440387725830078, 16.404170989990234, 17.36795425415039, 18.331737518310547, 19.295520782470703, 20.25930404663086, 21.22308921813965, 22.186872482299805, 23.15065574645996, 24.114439010620117, 25.078224182128906, 26.042007446289062, 27.00579071044922, 27.969573974609375, 28.933359146118164, 29.89714241027832, 30.860925674438477, 31.824708938598633, 32.78849411010742, 33.75227737426758]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 11.0, 20.0, 33.0, 37.0, 48.0, 70.0, 133.0, 171.0, 260.0, 360.0, 653.0, 899.0, 1351.0, 2044.0, 3177.0, 5166.0, 8392.0, 13912.0, 23654.0, 43074.0, 80186.0, 161704.0, 274271.0, 202797.0, 101878.0, 52046.0, 28734.0, 16783.0, 9815.0, 6058.0, 3768.0, 2376.0, 1610.0, 1025.0, 642.0, 473.0, 293.0, 188.0, 129.0, 79.0, 69.0, 48.0, 33.0, 23.0, 16.0, 12.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0], "bins": [-23.453125, -22.776611328125, -22.10009765625, -21.423583984375, -20.7470703125, -20.070556640625, -19.39404296875, -18.717529296875, -18.041015625, -17.364501953125, -16.68798828125, -16.011474609375, -15.3349609375, -14.658447265625, -13.98193359375, -13.305419921875, -12.62890625, -11.952392578125, -11.27587890625, -10.599365234375, -9.9228515625, -9.246337890625, -8.56982421875, -7.893310546875, -7.216796875, -6.540283203125, -5.86376953125, -5.187255859375, -4.5107421875, -3.834228515625, -3.15771484375, -2.481201171875, -1.8046875, -1.128173828125, -0.45166015625, 0.224853515625, 0.9013671875, 1.577880859375, 2.25439453125, 2.930908203125, 3.607421875, 4.283935546875, 4.96044921875, 5.636962890625, 6.3134765625, 6.989990234375, 7.66650390625, 8.343017578125, 9.01953125, 9.696044921875, 10.37255859375, 11.049072265625, 11.7255859375, 12.402099609375, 13.07861328125, 13.755126953125, 14.431640625, 15.108154296875, 15.78466796875, 16.461181640625, 17.1376953125, 17.814208984375, 18.49072265625, 19.167236328125, 19.84375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 6.0, 10.0, 7.0, 3.0, 16.0, 17.0, 17.0, 27.0, 25.0, 29.0, 34.0, 22.0, 41.0, 55.0, 43.0, 48.0, 40.0, 42.0, 46.0, 35.0, 48.0, 43.0, 43.0, 36.0, 37.0, 34.0, 33.0, 21.0, 21.0, 17.0, 27.0, 12.0, 9.0, 6.0, 7.0, 3.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.40625, -27.38427734375, -26.3623046875, -25.34033203125, -24.318359375, -23.29638671875, -22.2744140625, -21.25244140625, -20.23046875, -19.20849609375, -18.1865234375, -17.16455078125, -16.142578125, -15.12060546875, -14.0986328125, -13.07666015625, -12.0546875, -11.03271484375, -10.0107421875, -8.98876953125, -7.966796875, -6.94482421875, -5.9228515625, -4.90087890625, -3.87890625, -2.85693359375, -1.8349609375, -0.81298828125, 0.208984375, 1.23095703125, 2.2529296875, 3.27490234375, 4.296875, 5.31884765625, 6.3408203125, 7.36279296875, 8.384765625, 9.40673828125, 10.4287109375, 11.45068359375, 12.47265625, 13.49462890625, 14.5166015625, 15.53857421875, 16.560546875, 17.58251953125, 18.6044921875, 19.62646484375, 20.6484375, 21.67041015625, 22.6923828125, 23.71435546875, 24.736328125, 25.75830078125, 26.7802734375, 27.80224609375, 28.82421875, 29.84619140625, 30.8681640625, 31.89013671875, 32.912109375, 33.93408203125, 34.9560546875, 35.97802734375, 37.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 18.0, 20.0, 41.0, 40.0, 68.0, 107.0, 152.0, 255.0, 356.0, 562.0, 782.0, 1285.0, 2028.0, 3064.0, 4784.0, 7908.0, 12806.0, 22322.0, 40218.0, 80458.0, 185266.0, 331329.0, 179958.0, 79122.0, 40135.0, 21787.0, 12796.0, 7599.0, 4759.0, 2952.0, 1882.0, 1245.0, 840.0, 552.0, 364.0, 231.0, 168.0, 88.0, 52.0, 46.0, 27.0, 23.0, 13.0, 14.0, 11.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.26025390625, -27.3017578125, -26.34326171875, -25.384765625, -24.42626953125, -23.4677734375, -22.50927734375, -21.55078125, -20.59228515625, -19.6337890625, -18.67529296875, -17.716796875, -16.75830078125, -15.7998046875, -14.84130859375, -13.8828125, -12.92431640625, -11.9658203125, -11.00732421875, -10.048828125, -9.09033203125, -8.1318359375, -7.17333984375, -6.21484375, -5.25634765625, -4.2978515625, -3.33935546875, -2.380859375, -1.42236328125, -0.4638671875, 0.49462890625, 1.453125, 2.41162109375, 3.3701171875, 4.32861328125, 5.287109375, 6.24560546875, 7.2041015625, 8.16259765625, 9.12109375, 10.07958984375, 11.0380859375, 11.99658203125, 12.955078125, 13.91357421875, 14.8720703125, 15.83056640625, 16.7890625, 17.74755859375, 18.7060546875, 19.66455078125, 20.623046875, 21.58154296875, 22.5400390625, 23.49853515625, 24.45703125, 25.41552734375, 26.3740234375, 27.33251953125, 28.291015625, 29.24951171875, 30.2080078125, 31.16650390625, 32.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 13.0, 10.0, 17.0, 15.0, 16.0, 22.0, 31.0, 22.0, 27.0, 23.0, 38.0, 29.0, 29.0, 50.0, 34.0, 36.0, 44.0, 38.0, 36.0, 38.0, 40.0, 41.0, 38.0, 34.0, 34.0, 29.0, 33.0, 21.0, 17.0, 22.0, 19.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.34375, -18.75244140625, -18.1611328125, -17.56982421875, -16.978515625, -16.38720703125, -15.7958984375, -15.20458984375, -14.61328125, -14.02197265625, -13.4306640625, -12.83935546875, -12.248046875, -11.65673828125, -11.0654296875, -10.47412109375, -9.8828125, -9.29150390625, -8.7001953125, -8.10888671875, -7.517578125, -6.92626953125, -6.3349609375, -5.74365234375, -5.15234375, -4.56103515625, -3.9697265625, -3.37841796875, -2.787109375, -2.19580078125, -1.6044921875, -1.01318359375, -0.421875, 0.16943359375, 0.7607421875, 1.35205078125, 1.943359375, 2.53466796875, 3.1259765625, 3.71728515625, 4.30859375, 4.89990234375, 5.4912109375, 6.08251953125, 6.673828125, 7.26513671875, 7.8564453125, 8.44775390625, 9.0390625, 9.63037109375, 10.2216796875, 10.81298828125, 11.404296875, 11.99560546875, 12.5869140625, 13.17822265625, 13.76953125, 14.36083984375, 14.9521484375, 15.54345703125, 16.134765625, 16.72607421875, 17.3173828125, 17.90869140625, 18.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 19.0, 28.0, 31.0, 48.0, 83.0, 94.0, 187.0, 297.0, 445.0, 845.0, 1506.0, 2967.0, 5936.0, 13104.0, 30892.0, 81385.0, 233454.0, 394767.0, 175024.0, 62221.0, 24110.0, 10579.0, 4885.0, 2500.0, 1262.0, 744.0, 410.0, 256.0, 147.0, 96.0, 56.0, 44.0, 32.0, 17.0, 16.0, 3.0, 4.0, 7.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.078125, -9.7667236328125, -9.455322265625, -9.1439208984375, -8.83251953125, -8.5211181640625, -8.209716796875, -7.8983154296875, -7.5869140625, -7.2755126953125, -6.964111328125, -6.6527099609375, -6.34130859375, -6.0299072265625, -5.718505859375, -5.4071044921875, -5.095703125, -4.7843017578125, -4.472900390625, -4.1614990234375, -3.85009765625, -3.5386962890625, -3.227294921875, -2.9158935546875, -2.6044921875, -2.2930908203125, -1.981689453125, -1.6702880859375, -1.35888671875, -1.0474853515625, -0.736083984375, -0.4246826171875, -0.11328125, 0.1981201171875, 0.509521484375, 0.8209228515625, 1.13232421875, 1.4437255859375, 1.755126953125, 2.0665283203125, 2.3779296875, 2.6893310546875, 3.000732421875, 3.3121337890625, 3.62353515625, 3.9349365234375, 4.246337890625, 4.5577392578125, 4.869140625, 5.1805419921875, 5.491943359375, 5.8033447265625, 6.11474609375, 6.4261474609375, 6.737548828125, 7.0489501953125, 7.3603515625, 7.6717529296875, 7.983154296875, 8.2945556640625, 8.60595703125, 8.9173583984375, 9.228759765625, 9.5401611328125, 9.8515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 15.0, 17.0, 26.0, 37.0, 47.0, 54.0, 75.0, 50.0, 81.0, 69.0, 90.0, 75.0, 62.0, 55.0, 50.0, 40.0, 28.0, 25.0, 19.0, 14.0, 12.0, 7.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0009746551513671875, -0.0009489357471466064, -0.0009232163429260254, -0.0008974969387054443, -0.0008717775344848633, -0.0008460581302642822, -0.0008203387260437012, -0.0007946193218231201, -0.0007688999176025391, -0.000743180513381958, -0.000717461109161377, -0.0006917417049407959, -0.0006660223007202148, -0.0006403028964996338, -0.0006145834922790527, -0.0005888640880584717, -0.0005631446838378906, -0.0005374252796173096, -0.0005117058753967285, -0.00048598647117614746, -0.0004602670669555664, -0.00043454766273498535, -0.0004088282585144043, -0.00038310885429382324, -0.0003573894500732422, -0.00033167004585266113, -0.0003059506416320801, -0.000280231237411499, -0.00025451183319091797, -0.00022879242897033691, -0.00020307302474975586, -0.0001773536205291748, -0.00015163421630859375, -0.0001259148120880127, -0.00010019540786743164, -7.447600364685059e-05, -4.875659942626953e-05, -2.3037195205688477e-05, 2.682209014892578e-06, 2.8401613235473633e-05, 5.412101745605469e-05, 7.984042167663574e-05, 0.0001055598258972168, 0.00013127923011779785, 0.0001569986343383789, 0.00018271803855895996, 0.00020843744277954102, 0.00023415684700012207, 0.0002598762512207031, 0.0002855956554412842, 0.00031131505966186523, 0.0003370344638824463, 0.00036275386810302734, 0.0003884732723236084, 0.00041419267654418945, 0.0004399120807647705, 0.00046563148498535156, 0.0004913508892059326, 0.0005170702934265137, 0.0005427896976470947, 0.0005685091018676758, 0.0005942285060882568, 0.0006199479103088379, 0.0006456673145294189, 0.00067138671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 6.0, 9.0, 12.0, 23.0, 20.0, 27.0, 35.0, 61.0, 86.0, 112.0, 179.0, 244.0, 317.0, 441.0, 635.0, 887.0, 1268.0, 2043.0, 3154.0, 4952.0, 7859.0, 13185.0, 22901.0, 40634.0, 74186.0, 135201.0, 213936.0, 214713.0, 135990.0, 75239.0, 41260.0, 23166.0, 13337.0, 8001.0, 4844.0, 3214.0, 2028.0, 1304.0, 920.0, 640.0, 439.0, 301.0, 198.0, 155.0, 110.0, 73.0, 51.0, 53.0, 33.0, 23.0, 23.0, 9.0, 12.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.51171875, -7.26947021484375, -7.0272216796875, -6.78497314453125, -6.542724609375, -6.30047607421875, -6.0582275390625, -5.81597900390625, -5.57373046875, -5.33148193359375, -5.0892333984375, -4.84698486328125, -4.604736328125, -4.36248779296875, -4.1202392578125, -3.87799072265625, -3.6357421875, -3.39349365234375, -3.1512451171875, -2.90899658203125, -2.666748046875, -2.42449951171875, -2.1822509765625, -1.94000244140625, -1.69775390625, -1.45550537109375, -1.2132568359375, -0.97100830078125, -0.728759765625, -0.48651123046875, -0.2442626953125, -0.00201416015625, 0.240234375, 0.48248291015625, 0.7247314453125, 0.96697998046875, 1.209228515625, 1.45147705078125, 1.6937255859375, 1.93597412109375, 2.17822265625, 2.42047119140625, 2.6627197265625, 2.90496826171875, 3.147216796875, 3.38946533203125, 3.6317138671875, 3.87396240234375, 4.1162109375, 4.35845947265625, 4.6007080078125, 4.84295654296875, 5.085205078125, 5.32745361328125, 5.5697021484375, 5.81195068359375, 6.05419921875, 6.29644775390625, 6.5386962890625, 6.78094482421875, 7.023193359375, 7.26544189453125, 7.5076904296875, 7.74993896484375, 7.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 13.0, 9.0, 14.0, 25.0, 29.0, 32.0, 40.0, 29.0, 25.0, 37.0, 56.0, 51.0, 55.0, 61.0, 56.0, 54.0, 59.0, 57.0, 36.0, 38.0, 32.0, 32.0, 13.0, 29.0, 14.0, 12.0, 14.0, 14.0, 13.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.466522216796875, -2.38812255859375, -2.309722900390625, -2.2313232421875, -2.152923583984375, -2.07452392578125, -1.996124267578125, -1.917724609375, -1.839324951171875, -1.76092529296875, -1.682525634765625, -1.6041259765625, -1.525726318359375, -1.44732666015625, -1.368927001953125, -1.29052734375, -1.212127685546875, -1.13372802734375, -1.055328369140625, -0.9769287109375, -0.898529052734375, -0.82012939453125, -0.741729736328125, -0.663330078125, -0.584930419921875, -0.50653076171875, -0.428131103515625, -0.3497314453125, -0.271331787109375, -0.19293212890625, -0.114532470703125, -0.0361328125, 0.042266845703125, 0.12066650390625, 0.199066162109375, 0.2774658203125, 0.355865478515625, 0.43426513671875, 0.512664794921875, 0.591064453125, 0.669464111328125, 0.74786376953125, 0.826263427734375, 0.9046630859375, 0.983062744140625, 1.06146240234375, 1.139862060546875, 1.21826171875, 1.296661376953125, 1.37506103515625, 1.453460693359375, 1.5318603515625, 1.610260009765625, 1.68865966796875, 1.767059326171875, 1.845458984375, 1.923858642578125, 2.00225830078125, 2.080657958984375, 2.1590576171875, 2.237457275390625, 2.31585693359375, 2.394256591796875, 2.47265625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 13.0, 11.0, 11.0, 14.0, 20.0, 20.0, 22.0, 33.0, 39.0, 43.0, 52.0, 62.0, 60.0, 71.0, 74.0, 71.0, 62.0, 46.0, 56.0, 39.0, 40.0, 30.0, 20.0, 19.0, 14.0, 16.0, 9.0, 6.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.11594581604004, -28.96799659729004, -27.820049285888672, -26.672100067138672, -25.524152755737305, -24.376203536987305, -23.228256225585938, -22.080307006835938, -20.932357788085938, -19.784408569335938, -18.63646125793457, -17.48851203918457, -16.340564727783203, -15.192615509033203, -14.04466724395752, -12.896718978881836, -11.748771667480469, -10.600823402404785, -9.452875137329102, -8.304925918579102, -7.156978130340576, -6.009029865264893, -4.861081123352051, -3.713132858276367, -2.5651845932006836, -1.4172362089157104, -0.2692878246307373, 0.8786606788635254, 2.026608943939209, 3.1745572090148926, 4.322505950927734, 5.470454216003418, 6.618400573730469, 7.766348838806152, 8.914297103881836, 10.062246322631836, 11.210193634033203, 12.358142852783203, 13.506091117858887, 14.65403938293457, 15.801987648010254, 16.949935913085938, 18.097885131835938, 19.245832443237305, 20.393781661987305, 21.541728973388672, 22.689678192138672, 23.837627410888672, 24.98557472229004, 26.13352394104004, 27.281471252441406, 28.429420471191406, 29.577367782592773, 30.725317001342773, 31.87326431274414, 33.02121353149414, 34.16916275024414, 35.31711196899414, 36.46506118774414, 37.613006591796875, 38.760955810546875, 39.908905029296875, 41.056854248046875, 42.204803466796875, 43.35274887084961]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 5.0, 3.0, 8.0, 9.0, 16.0, 4.0, 14.0, 17.0, 23.0, 20.0, 27.0, 34.0, 28.0, 32.0, 43.0, 36.0, 48.0, 34.0, 33.0, 40.0, 36.0, 41.0, 46.0, 36.0, 46.0, 45.0, 39.0, 38.0, 33.0, 21.0, 16.0, 19.0, 22.0, 22.0, 15.0, 7.0, 8.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.48418617248535, -26.535245895385742, -25.586307525634766, -24.637367248535156, -23.688426971435547, -22.739486694335938, -21.79054832458496, -20.84160804748535, -19.892669677734375, -18.943729400634766, -17.99479103088379, -17.04585075378418, -16.09691047668457, -15.147971153259277, -14.199031829833984, -13.250091552734375, -12.301151275634766, -11.352211952209473, -10.403271675109863, -9.45433235168457, -8.505392074584961, -7.556452751159668, -6.607513427734375, -5.658573627471924, -4.709633827209473, -3.7606940269470215, -2.8117544651031494, -1.8628149032592773, -0.9138751029968262, 0.035064697265625, 0.984004020690918, 1.9329438209533691, 2.8818817138671875, 3.8308215141296387, 4.77976131439209, 5.728700637817383, 6.677640438079834, 7.626580238342285, 8.575519561767578, 9.524459838867188, 10.47339916229248, 11.422338485717773, 12.371278762817383, 13.320218086242676, 14.269157409667969, 15.218097686767578, 16.167037963867188, 17.115976333618164, 18.064916610717773, 19.013856887817383, 19.96279525756836, 20.91173553466797, 21.860675811767578, 22.809616088867188, 23.758554458618164, 24.707494735717773, 25.65643310546875, 26.60537338256836, 27.554311752319336, 28.503252029418945, 29.452192306518555, 30.40113067626953, 31.35007095336914, 32.29901123046875, 33.24795150756836]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 22.0, 43.0, 37.0, 48.0, 69.0, 118.0, 143.0, 234.0, 252.0, 473.0, 643.0, 999.0, 1507.0, 2341.0, 3582.0, 5815.0, 9469.0, 15864.0, 26251.0, 44416.0, 75638.0, 127650.0, 190309.0, 199100.0, 138370.0, 82855.0, 48474.0, 28547.0, 17055.0, 10408.0, 6307.0, 3933.0, 2609.0, 1576.0, 1102.0, 702.0, 487.0, 316.0, 227.0, 181.0, 121.0, 71.0, 48.0, 49.0, 26.0, 14.0, 11.0, 15.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.09375, -34.9326171875, -33.771484375, -32.6103515625, -31.44921875, -30.2880859375, -29.126953125, -27.9658203125, -26.8046875, -25.6435546875, -24.482421875, -23.3212890625, -22.16015625, -20.9990234375, -19.837890625, -18.6767578125, -17.515625, -16.3544921875, -15.193359375, -14.0322265625, -12.87109375, -11.7099609375, -10.548828125, -9.3876953125, -8.2265625, -7.0654296875, -5.904296875, -4.7431640625, -3.58203125, -2.4208984375, -1.259765625, -0.0986328125, 1.0625, 2.2236328125, 3.384765625, 4.5458984375, 5.70703125, 6.8681640625, 8.029296875, 9.1904296875, 10.3515625, 11.5126953125, 12.673828125, 13.8349609375, 14.99609375, 16.1572265625, 17.318359375, 18.4794921875, 19.640625, 20.8017578125, 21.962890625, 23.1240234375, 24.28515625, 25.4462890625, 26.607421875, 27.7685546875, 28.9296875, 30.0908203125, 31.251953125, 32.4130859375, 33.57421875, 34.7353515625, 35.896484375, 37.0576171875, 38.21875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 2.0, 3.0, 8.0, 14.0, 9.0, 13.0, 18.0, 19.0, 14.0, 25.0, 36.0, 36.0, 29.0, 33.0, 47.0, 51.0, 36.0, 38.0, 39.0, 42.0, 50.0, 48.0, 39.0, 58.0, 34.0, 33.0, 36.0, 27.0, 25.0, 24.0, 24.0, 11.0, 20.0, 15.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.561279296875, -26.57568359375, -25.590087890625, -24.6044921875, -23.618896484375, -22.63330078125, -21.647705078125, -20.662109375, -19.676513671875, -18.69091796875, -17.705322265625, -16.7197265625, -15.734130859375, -14.74853515625, -13.762939453125, -12.77734375, -11.791748046875, -10.80615234375, -9.820556640625, -8.8349609375, -7.849365234375, -6.86376953125, -5.878173828125, -4.892578125, -3.906982421875, -2.92138671875, -1.935791015625, -0.9501953125, 0.035400390625, 1.02099609375, 2.006591796875, 2.9921875, 3.977783203125, 4.96337890625, 5.948974609375, 6.9345703125, 7.920166015625, 8.90576171875, 9.891357421875, 10.876953125, 11.862548828125, 12.84814453125, 13.833740234375, 14.8193359375, 15.804931640625, 16.79052734375, 17.776123046875, 18.76171875, 19.747314453125, 20.73291015625, 21.718505859375, 22.7041015625, 23.689697265625, 24.67529296875, 25.660888671875, 26.646484375, 27.632080078125, 28.61767578125, 29.603271484375, 30.5888671875, 31.574462890625, 32.56005859375, 33.545654296875, 34.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 17.0, 13.0, 38.0, 46.0, 60.0, 82.0, 133.0, 180.0, 300.0, 419.0, 588.0, 921.0, 1311.0, 1973.0, 2965.0, 4521.0, 6793.0, 10234.0, 15872.0, 24676.0, 39124.0, 61328.0, 96746.0, 146143.0, 183297.0, 156526.0, 105962.0, 67385.0, 43086.0, 27016.0, 17334.0, 11242.0, 7440.0, 4860.0, 3257.0, 2127.0, 1471.0, 946.0, 658.0, 472.0, 287.0, 235.0, 138.0, 107.0, 68.0, 53.0, 32.0, 25.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.65625, -32.59130859375, -31.5263671875, -30.46142578125, -29.396484375, -28.33154296875, -27.2666015625, -26.20166015625, -25.13671875, -24.07177734375, -23.0068359375, -21.94189453125, -20.876953125, -19.81201171875, -18.7470703125, -17.68212890625, -16.6171875, -15.55224609375, -14.4873046875, -13.42236328125, -12.357421875, -11.29248046875, -10.2275390625, -9.16259765625, -8.09765625, -7.03271484375, -5.9677734375, -4.90283203125, -3.837890625, -2.77294921875, -1.7080078125, -0.64306640625, 0.421875, 1.48681640625, 2.5517578125, 3.61669921875, 4.681640625, 5.74658203125, 6.8115234375, 7.87646484375, 8.94140625, 10.00634765625, 11.0712890625, 12.13623046875, 13.201171875, 14.26611328125, 15.3310546875, 16.39599609375, 17.4609375, 18.52587890625, 19.5908203125, 20.65576171875, 21.720703125, 22.78564453125, 23.8505859375, 24.91552734375, 25.98046875, 27.04541015625, 28.1103515625, 29.17529296875, 30.240234375, 31.30517578125, 32.3701171875, 33.43505859375, 34.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 13.0, 9.0, 11.0, 13.0, 16.0, 23.0, 17.0, 26.0, 24.0, 33.0, 41.0, 31.0, 24.0, 42.0, 44.0, 46.0, 40.0, 46.0, 39.0, 40.0, 32.0, 33.0, 30.0, 34.0, 38.0, 35.0, 27.0, 19.0, 27.0, 19.0, 26.0, 7.0, 16.0, 15.0, 9.0, 6.0, 14.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-20.03125, -19.42626953125, -18.8212890625, -18.21630859375, -17.611328125, -17.00634765625, -16.4013671875, -15.79638671875, -15.19140625, -14.58642578125, -13.9814453125, -13.37646484375, -12.771484375, -12.16650390625, -11.5615234375, -10.95654296875, -10.3515625, -9.74658203125, -9.1416015625, -8.53662109375, -7.931640625, -7.32666015625, -6.7216796875, -6.11669921875, -5.51171875, -4.90673828125, -4.3017578125, -3.69677734375, -3.091796875, -2.48681640625, -1.8818359375, -1.27685546875, -0.671875, -0.06689453125, 0.5380859375, 1.14306640625, 1.748046875, 2.35302734375, 2.9580078125, 3.56298828125, 4.16796875, 4.77294921875, 5.3779296875, 5.98291015625, 6.587890625, 7.19287109375, 7.7978515625, 8.40283203125, 9.0078125, 9.61279296875, 10.2177734375, 10.82275390625, 11.427734375, 12.03271484375, 12.6376953125, 13.24267578125, 13.84765625, 14.45263671875, 15.0576171875, 15.66259765625, 16.267578125, 16.87255859375, 17.4775390625, 18.08251953125, 18.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 14.0, 15.0, 18.0, 31.0, 59.0, 75.0, 85.0, 129.0, 196.0, 296.0, 445.0, 623.0, 910.0, 1276.0, 1935.0, 2861.0, 4666.0, 7178.0, 12050.0, 20247.0, 36016.0, 65074.0, 115439.0, 194141.0, 226680.0, 153817.0, 87139.0, 48445.0, 26973.0, 15623.0, 9274.0, 5688.0, 3673.0, 2359.0, 1588.0, 1090.0, 736.0, 517.0, 373.0, 230.0, 171.0, 118.0, 75.0, 61.0, 38.0, 30.0, 28.0, 20.0, 12.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.9140625, -13.482666015625, -13.05126953125, -12.619873046875, -12.1884765625, -11.757080078125, -11.32568359375, -10.894287109375, -10.462890625, -10.031494140625, -9.60009765625, -9.168701171875, -8.7373046875, -8.305908203125, -7.87451171875, -7.443115234375, -7.01171875, -6.580322265625, -6.14892578125, -5.717529296875, -5.2861328125, -4.854736328125, -4.42333984375, -3.991943359375, -3.560546875, -3.129150390625, -2.69775390625, -2.266357421875, -1.8349609375, -1.403564453125, -0.97216796875, -0.540771484375, -0.109375, 0.322021484375, 0.75341796875, 1.184814453125, 1.6162109375, 2.047607421875, 2.47900390625, 2.910400390625, 3.341796875, 3.773193359375, 4.20458984375, 4.635986328125, 5.0673828125, 5.498779296875, 5.93017578125, 6.361572265625, 6.79296875, 7.224365234375, 7.65576171875, 8.087158203125, 8.5185546875, 8.949951171875, 9.38134765625, 9.812744140625, 10.244140625, 10.675537109375, 11.10693359375, 11.538330078125, 11.9697265625, 12.401123046875, 12.83251953125, 13.263916015625, 13.6953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 6.0, 13.0, 18.0, 27.0, 27.0, 43.0, 61.0, 55.0, 78.0, 103.0, 104.0, 93.0, 91.0, 56.0, 52.0, 37.0, 31.0, 24.0, 20.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019588470458984375, -0.0019006580114364624, -0.0018424689769744873, -0.0017842799425125122, -0.0017260909080505371, -0.001667901873588562, -0.001609712839126587, -0.0015515238046646118, -0.0014933347702026367, -0.0014351457357406616, -0.0013769567012786865, -0.0013187676668167114, -0.0012605786323547363, -0.0012023895978927612, -0.0011442005634307861, -0.001086011528968811, -0.001027822494506836, -0.0009696334600448608, -0.0009114444255828857, -0.0008532553911209106, -0.0007950663566589355, -0.0007368773221969604, -0.0006786882877349854, -0.0006204992532730103, -0.0005623102188110352, -0.0005041211843490601, -0.00044593214988708496, -0.00038774311542510986, -0.00032955408096313477, -0.00027136504650115967, -0.00021317601203918457, -0.00015498697757720947, -9.679794311523438e-05, -3.860890865325928e-05, 1.958012580871582e-05, 7.776916027069092e-05, 0.00013595819473266602, 0.0001941472291946411, 0.0002523362636566162, 0.0003105252981185913, 0.0003687143325805664, 0.0004269033670425415, 0.0004850924015045166, 0.0005432814359664917, 0.0006014704704284668, 0.0006596595048904419, 0.000717848539352417, 0.0007760375738143921, 0.0008342266082763672, 0.0008924156427383423, 0.0009506046772003174, 0.0010087937116622925, 0.0010669827461242676, 0.0011251717805862427, 0.0011833608150482178, 0.0012415498495101929, 0.001299738883972168, 0.001357927918434143, 0.0014161169528961182, 0.0014743059873580933, 0.0015324950218200684, 0.0015906840562820435, 0.0016488730907440186, 0.0017070621252059937, 0.0017652511596679688]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 14.0, 9.0, 18.0, 21.0, 36.0, 50.0, 71.0, 74.0, 140.0, 181.0, 255.0, 381.0, 614.0, 916.0, 1443.0, 2330.0, 3794.0, 6541.0, 11643.0, 21174.0, 40724.0, 79475.0, 155702.0, 260167.0, 218421.0, 116056.0, 59127.0, 30324.0, 16422.0, 8824.0, 5213.0, 3032.0, 1810.0, 1263.0, 717.0, 491.0, 378.0, 223.0, 145.0, 103.0, 76.0, 57.0, 27.0, 31.0, 10.0, 7.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.492919921875, -14.95458984375, -14.416259765625, -13.8779296875, -13.339599609375, -12.80126953125, -12.262939453125, -11.724609375, -11.186279296875, -10.64794921875, -10.109619140625, -9.5712890625, -9.032958984375, -8.49462890625, -7.956298828125, -7.41796875, -6.879638671875, -6.34130859375, -5.802978515625, -5.2646484375, -4.726318359375, -4.18798828125, -3.649658203125, -3.111328125, -2.572998046875, -2.03466796875, -1.496337890625, -0.9580078125, -0.419677734375, 0.11865234375, 0.656982421875, 1.1953125, 1.733642578125, 2.27197265625, 2.810302734375, 3.3486328125, 3.886962890625, 4.42529296875, 4.963623046875, 5.501953125, 6.040283203125, 6.57861328125, 7.116943359375, 7.6552734375, 8.193603515625, 8.73193359375, 9.270263671875, 9.80859375, 10.346923828125, 10.88525390625, 11.423583984375, 11.9619140625, 12.500244140625, 13.03857421875, 13.576904296875, 14.115234375, 14.653564453125, 15.19189453125, 15.730224609375, 16.2685546875, 16.806884765625, 17.34521484375, 17.883544921875, 18.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 8.0, 4.0, 12.0, 20.0, 16.0, 28.0, 32.0, 32.0, 36.0, 48.0, 51.0, 45.0, 54.0, 64.0, 60.0, 53.0, 51.0, 69.0, 48.0, 32.0, 44.0, 35.0, 27.0, 16.0, 15.0, 17.0, 11.0, 9.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.71875, -4.55792236328125, -4.3970947265625, -4.23626708984375, -4.075439453125, -3.91461181640625, -3.7537841796875, -3.59295654296875, -3.43212890625, -3.27130126953125, -3.1104736328125, -2.94964599609375, -2.788818359375, -2.62799072265625, -2.4671630859375, -2.30633544921875, -2.1455078125, -1.98468017578125, -1.8238525390625, -1.66302490234375, -1.502197265625, -1.34136962890625, -1.1805419921875, -1.01971435546875, -0.85888671875, -0.69805908203125, -0.5372314453125, -0.37640380859375, -0.215576171875, -0.05474853515625, 0.1060791015625, 0.26690673828125, 0.427734375, 0.58856201171875, 0.7493896484375, 0.91021728515625, 1.071044921875, 1.23187255859375, 1.3927001953125, 1.55352783203125, 1.71435546875, 1.87518310546875, 2.0360107421875, 2.19683837890625, 2.357666015625, 2.51849365234375, 2.6793212890625, 2.84014892578125, 3.0009765625, 3.16180419921875, 3.3226318359375, 3.48345947265625, 3.644287109375, 3.80511474609375, 3.9659423828125, 4.12677001953125, 4.28759765625, 4.44842529296875, 4.6092529296875, 4.77008056640625, 4.930908203125, 5.09173583984375, 5.2525634765625, 5.41339111328125, 5.57421875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 13.0, 12.0, 8.0, 15.0, 16.0, 20.0, 13.0, 17.0, 29.0, 38.0, 38.0, 47.0, 52.0, 56.0, 54.0, 70.0, 67.0, 62.0, 47.0, 52.0, 43.0, 34.0, 27.0, 35.0, 24.0, 13.0, 11.0, 19.0, 9.0, 10.0, 10.0, 6.0, 9.0, 4.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.63134765625, -29.641857147216797, -28.652366638183594, -27.66287612915039, -26.673383712768555, -25.68389320373535, -24.69440269470215, -23.704912185668945, -22.715421676635742, -21.72593116760254, -20.736440658569336, -19.7469482421875, -18.757457733154297, -17.767967224121094, -16.77847671508789, -15.788986206054688, -14.799494743347168, -13.810004234313965, -12.820512771606445, -11.831022262573242, -10.841531753540039, -9.852041244506836, -8.862549781799316, -7.873059272766113, -6.883568286895752, -5.894077301025391, -4.9045867919921875, -3.915095806121826, -2.925605058670044, -1.9361143112182617, -0.9466233253479004, 0.042867183685302734, 1.032358169555664, 2.0218489170074463, 3.0113396644592285, 4.00083065032959, 4.990321159362793, 5.979812145233154, 6.969303131103516, 7.958793640136719, 8.948284149169922, 9.937774658203125, 10.927266120910645, 11.916756629943848, 12.90624713897705, 13.89573860168457, 14.885229110717773, 15.874719619750977, 16.864212036132812, 17.853702545166016, 18.84319305419922, 19.832683563232422, 20.822175979614258, 21.81166648864746, 22.801156997680664, 23.790647506713867, 24.78013801574707, 25.769628524780273, 26.759119033813477, 27.748611450195312, 28.738101959228516, 29.72759246826172, 30.717082977294922, 31.706573486328125, 32.69606399536133]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 8.0, 10.0, 12.0, 8.0, 13.0, 13.0, 10.0, 22.0, 28.0, 22.0, 32.0, 31.0, 48.0, 33.0, 35.0, 34.0, 40.0, 39.0, 40.0, 33.0, 55.0, 57.0, 46.0, 39.0, 33.0, 36.0, 38.0, 36.0, 31.0, 18.0, 18.0, 14.0, 10.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.73298263549805, -31.6606388092041, -30.588294982910156, -29.51595115661621, -28.443607330322266, -27.371261596679688, -26.298917770385742, -25.226573944091797, -24.15423011779785, -23.081886291503906, -22.00954246520996, -20.937198638916016, -19.864852905273438, -18.792510986328125, -17.720165252685547, -16.6478214263916, -15.575477600097656, -14.503133773803711, -13.430789947509766, -12.358445167541504, -11.286101341247559, -10.213757514953613, -9.141412734985352, -8.069068908691406, -6.996725082397461, -5.924381256103516, -4.852036952972412, -3.7796928882598877, -2.7073488235473633, -1.635004997253418, -0.5626606941223145, 0.5096836090087891, 1.5820236206054688, 2.654367685317993, 3.7267117500305176, 4.799056053161621, 5.871399879455566, 6.943743705749512, 8.016088485717773, 9.088432312011719, 10.160776138305664, 11.23311996459961, 12.305463790893555, 13.377808570861816, 14.450152397155762, 15.522496223449707, 16.59484100341797, 17.667184829711914, 18.73952865600586, 19.811872482299805, 20.88421630859375, 21.956560134887695, 23.02890396118164, 24.10124969482422, 25.173593521118164, 26.24593734741211, 27.318281173706055, 28.390625, 29.462968826293945, 30.53531265258789, 31.60765838623047, 32.68000030517578, 33.75234603881836, 34.82469177246094, 35.89703369140625]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 15.0, 24.0, 33.0, 46.0, 60.0, 101.0, 154.0, 212.0, 353.0, 590.0, 992.0, 1719.0, 3071.0, 5870.0, 11618.0, 24885.0, 58800.0, 166852.0, 589452.0, 1646101.0, 1161127.0, 337742.0, 104979.0, 41353.0, 18563.0, 8848.0, 4577.0, 2613.0, 1398.0, 823.0, 472.0, 294.0, 195.0, 99.0, 84.0, 56.0, 29.0, 26.0, 13.0, 16.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.40625, -55.70703125, -54.0078125, -52.30859375, -50.609375, -48.91015625, -47.2109375, -45.51171875, -43.8125, -42.11328125, -40.4140625, -38.71484375, -37.015625, -35.31640625, -33.6171875, -31.91796875, -30.21875, -28.51953125, -26.8203125, -25.12109375, -23.421875, -21.72265625, -20.0234375, -18.32421875, -16.625, -14.92578125, -13.2265625, -11.52734375, -9.828125, -8.12890625, -6.4296875, -4.73046875, -3.03125, -1.33203125, 0.3671875, 2.06640625, 3.765625, 5.46484375, 7.1640625, 8.86328125, 10.5625, 12.26171875, 13.9609375, 15.66015625, 17.359375, 19.05859375, 20.7578125, 22.45703125, 24.15625, 25.85546875, 27.5546875, 29.25390625, 30.953125, 32.65234375, 34.3515625, 36.05078125, 37.75, 39.44921875, 41.1484375, 42.84765625, 44.546875, 46.24609375, 47.9453125, 49.64453125, 51.34375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 0.0, 11.0, 8.0, 7.0, 8.0, 19.0, 10.0, 9.0, 12.0, 18.0, 27.0, 23.0, 40.0, 27.0, 42.0, 39.0, 31.0, 27.0, 40.0, 37.0, 41.0, 51.0, 46.0, 45.0, 50.0, 46.0, 43.0, 30.0, 38.0, 28.0, 27.0, 19.0, 21.0, 10.0, 9.0, 13.0, 13.0, 7.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.125, -32.139404296875, -31.15380859375, -30.168212890625, -29.1826171875, -28.197021484375, -27.21142578125, -26.225830078125, -25.240234375, -24.254638671875, -23.26904296875, -22.283447265625, -21.2978515625, -20.312255859375, -19.32666015625, -18.341064453125, -17.35546875, -16.369873046875, -15.38427734375, -14.398681640625, -13.4130859375, -12.427490234375, -11.44189453125, -10.456298828125, -9.470703125, -8.485107421875, -7.49951171875, -6.513916015625, -5.5283203125, -4.542724609375, -3.55712890625, -2.571533203125, -1.5859375, -0.600341796875, 0.38525390625, 1.370849609375, 2.3564453125, 3.342041015625, 4.32763671875, 5.313232421875, 6.298828125, 7.284423828125, 8.27001953125, 9.255615234375, 10.2412109375, 11.226806640625, 12.21240234375, 13.197998046875, 14.18359375, 15.169189453125, 16.15478515625, 17.140380859375, 18.1259765625, 19.111572265625, 20.09716796875, 21.082763671875, 22.068359375, 23.053955078125, 24.03955078125, 25.025146484375, 26.0107421875, 26.996337890625, 27.98193359375, 28.967529296875, 29.953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [8.0, 1.0, 7.0, 7.0, 9.0, 15.0, 17.0, 31.0, 34.0, 43.0, 67.0, 105.0, 134.0, 203.0, 271.0, 402.0, 590.0, 872.0, 1246.0, 1838.0, 2822.0, 4430.0, 6847.0, 10856.0, 18845.0, 32495.0, 59437.0, 113174.0, 227545.0, 495106.0, 1081006.0, 1118286.0, 516599.0, 237300.0, 117548.0, 61606.0, 33627.0, 19206.0, 11211.0, 7161.0, 4420.0, 2855.0, 1839.0, 1217.0, 931.0, 597.0, 426.0, 274.0, 226.0, 159.0, 103.0, 61.0, 52.0, 50.0, 24.0, 20.0, 10.0, 10.0, 10.0, 8.0, 3.0, 1.0, 0.0, 1.0], "bins": [-41.375, -40.04150390625, -38.7080078125, -37.37451171875, -36.041015625, -34.70751953125, -33.3740234375, -32.04052734375, -30.70703125, -29.37353515625, -28.0400390625, -26.70654296875, -25.373046875, -24.03955078125, -22.7060546875, -21.37255859375, -20.0390625, -18.70556640625, -17.3720703125, -16.03857421875, -14.705078125, -13.37158203125, -12.0380859375, -10.70458984375, -9.37109375, -8.03759765625, -6.7041015625, -5.37060546875, -4.037109375, -2.70361328125, -1.3701171875, -0.03662109375, 1.296875, 2.63037109375, 3.9638671875, 5.29736328125, 6.630859375, 7.96435546875, 9.2978515625, 10.63134765625, 11.96484375, 13.29833984375, 14.6318359375, 15.96533203125, 17.298828125, 18.63232421875, 19.9658203125, 21.29931640625, 22.6328125, 23.96630859375, 25.2998046875, 26.63330078125, 27.966796875, 29.30029296875, 30.6337890625, 31.96728515625, 33.30078125, 34.63427734375, 35.9677734375, 37.30126953125, 38.634765625, 39.96826171875, 41.3017578125, 42.63525390625, 43.96875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 6.0, 12.0, 9.0, 23.0, 18.0, 19.0, 35.0, 29.0, 54.0, 50.0, 78.0, 91.0, 90.0, 146.0, 166.0, 201.0, 275.0, 306.0, 310.0, 315.0, 304.0, 281.0, 245.0, 202.0, 162.0, 123.0, 109.0, 85.0, 72.0, 63.0, 39.0, 36.0, 16.0, 20.0, 13.0, 13.0, 6.0, 11.0, 8.0, 2.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.203125, -13.72119140625, -13.2392578125, -12.75732421875, -12.275390625, -11.79345703125, -11.3115234375, -10.82958984375, -10.34765625, -9.86572265625, -9.3837890625, -8.90185546875, -8.419921875, -7.93798828125, -7.4560546875, -6.97412109375, -6.4921875, -6.01025390625, -5.5283203125, -5.04638671875, -4.564453125, -4.08251953125, -3.6005859375, -3.11865234375, -2.63671875, -2.15478515625, -1.6728515625, -1.19091796875, -0.708984375, -0.22705078125, 0.2548828125, 0.73681640625, 1.21875, 1.70068359375, 2.1826171875, 2.66455078125, 3.146484375, 3.62841796875, 4.1103515625, 4.59228515625, 5.07421875, 5.55615234375, 6.0380859375, 6.52001953125, 7.001953125, 7.48388671875, 7.9658203125, 8.44775390625, 8.9296875, 9.41162109375, 9.8935546875, 10.37548828125, 10.857421875, 11.33935546875, 11.8212890625, 12.30322265625, 12.78515625, 13.26708984375, 13.7490234375, 14.23095703125, 14.712890625, 15.19482421875, 15.6767578125, 16.15869140625, 16.640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 12.0, 22.0, 26.0, 36.0, 45.0, 52.0, 57.0, 63.0, 70.0, 78.0, 78.0, 79.0, 59.0, 56.0, 54.0, 44.0, 27.0, 18.0, 21.0, 22.0, 16.0, 5.0, 12.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.362735748291016, -45.93781280517578, -44.51289367675781, -43.08797073364258, -41.663047790527344, -40.23812484741211, -38.81320571899414, -37.388282775878906, -35.96335983276367, -34.53843688964844, -33.11351776123047, -31.688594818115234, -30.263671875, -28.8387508392334, -27.413829803466797, -25.988906860351562, -24.56398582458496, -23.13906478881836, -21.714141845703125, -20.289220809936523, -18.86429786682129, -17.439376831054688, -16.014453887939453, -14.589532852172852, -13.164610862731934, -11.739688873291016, -10.314766883850098, -8.88984489440918, -7.46492338180542, -6.040001392364502, -4.615079879760742, -3.190157890319824, -1.7652359008789062, -0.34031403064727783, 1.0846078395843506, 2.5095295906066895, 3.9344515800476074, 5.359373569488525, 6.784295082092285, 8.209217071533203, 9.634139060974121, 11.059061050415039, 12.483983039855957, 13.908905029296875, 15.333826065063477, 16.75874900817871, 18.183670043945312, 19.608592987060547, 21.03351402282715, 22.45843505859375, 23.883358001708984, 25.308279037475586, 26.73320198059082, 28.158123016357422, 29.583045959472656, 31.007966995239258, 32.43288803100586, 33.857810974121094, 35.28273010253906, 36.7076530456543, 38.13257598876953, 39.557498931884766, 40.982418060302734, 42.40734100341797, 43.8322639465332]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 1.0, 3.0, 7.0, 15.0, 6.0, 10.0, 17.0, 14.0, 19.0, 25.0, 19.0, 32.0, 26.0, 16.0, 37.0, 33.0, 41.0, 47.0, 44.0, 51.0, 52.0, 38.0, 51.0, 43.0, 48.0, 51.0, 37.0, 35.0, 40.0, 24.0, 19.0, 25.0, 13.0, 9.0, 9.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.490203857421875, -41.285099029541016, -40.079994201660156, -38.8748893737793, -37.66978454589844, -36.46467971801758, -35.25957489013672, -34.05447006225586, -32.849365234375, -31.64426040649414, -30.43915557861328, -29.234050750732422, -28.028945922851562, -26.823841094970703, -25.618736267089844, -24.413631439208984, -23.208526611328125, -22.003421783447266, -20.798316955566406, -19.593212127685547, -18.388107299804688, -17.183002471923828, -15.977897644042969, -14.77279281616211, -13.56768798828125, -12.36258316040039, -11.157478332519531, -9.952373504638672, -8.747268676757812, -7.542163848876953, -6.337059020996094, -5.131954193115234, -3.9268455505371094, -2.72174072265625, -1.5166358947753906, -0.31153106689453125, 0.8935737609863281, 2.0986785888671875, 3.303783416748047, 4.508888244628906, 5.713993072509766, 6.919097900390625, 8.124202728271484, 9.329307556152344, 10.534412384033203, 11.739517211914062, 12.944622039794922, 14.149726867675781, 15.35483169555664, 16.5599365234375, 17.76504135131836, 18.97014617919922, 20.175251007080078, 21.380355834960938, 22.585460662841797, 23.790565490722656, 24.995670318603516, 26.200775146484375, 27.405879974365234, 28.610984802246094, 29.816089630126953, 31.021194458007812, 32.22629928588867, 33.43140411376953, 34.63650894165039]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 20.0, 28.0, 42.0, 58.0, 74.0, 116.0, 193.0, 265.0, 448.0, 632.0, 1047.0, 1566.0, 2565.0, 4295.0, 7225.0, 12532.0, 22700.0, 42685.0, 86629.0, 182185.0, 297433.0, 193571.0, 91024.0, 44556.0, 23743.0, 13207.0, 7759.0, 4530.0, 2745.0, 1704.0, 1027.0, 675.0, 426.0, 298.0, 180.0, 125.0, 78.0, 38.0, 29.0, 34.0, 21.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-28.375, -27.553466796875, -26.73193359375, -25.910400390625, -25.0888671875, -24.267333984375, -23.44580078125, -22.624267578125, -21.802734375, -20.981201171875, -20.15966796875, -19.338134765625, -18.5166015625, -17.695068359375, -16.87353515625, -16.052001953125, -15.23046875, -14.408935546875, -13.58740234375, -12.765869140625, -11.9443359375, -11.122802734375, -10.30126953125, -9.479736328125, -8.658203125, -7.836669921875, -7.01513671875, -6.193603515625, -5.3720703125, -4.550537109375, -3.72900390625, -2.907470703125, -2.0859375, -1.264404296875, -0.44287109375, 0.378662109375, 1.2001953125, 2.021728515625, 2.84326171875, 3.664794921875, 4.486328125, 5.307861328125, 6.12939453125, 6.950927734375, 7.7724609375, 8.593994140625, 9.41552734375, 10.237060546875, 11.05859375, 11.880126953125, 12.70166015625, 13.523193359375, 14.3447265625, 15.166259765625, 15.98779296875, 16.809326171875, 17.630859375, 18.452392578125, 19.27392578125, 20.095458984375, 20.9169921875, 21.738525390625, 22.56005859375, 23.381591796875, 24.203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 11.0, 20.0, 12.0, 20.0, 15.0, 29.0, 21.0, 23.0, 28.0, 35.0, 44.0, 41.0, 49.0, 54.0, 51.0, 57.0, 50.0, 51.0, 49.0, 43.0, 42.0, 40.0, 40.0, 40.0, 21.0, 14.0, 17.0, 10.0, 13.0, 6.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.9375, -45.6298828125, -44.322265625, -43.0146484375, -41.70703125, -40.3994140625, -39.091796875, -37.7841796875, -36.4765625, -35.1689453125, -33.861328125, -32.5537109375, -31.24609375, -29.9384765625, -28.630859375, -27.3232421875, -26.015625, -24.7080078125, -23.400390625, -22.0927734375, -20.78515625, -19.4775390625, -18.169921875, -16.8623046875, -15.5546875, -14.2470703125, -12.939453125, -11.6318359375, -10.32421875, -9.0166015625, -7.708984375, -6.4013671875, -5.09375, -3.7861328125, -2.478515625, -1.1708984375, 0.13671875, 1.4443359375, 2.751953125, 4.0595703125, 5.3671875, 6.6748046875, 7.982421875, 9.2900390625, 10.59765625, 11.9052734375, 13.212890625, 14.5205078125, 15.828125, 17.1357421875, 18.443359375, 19.7509765625, 21.05859375, 22.3662109375, 23.673828125, 24.9814453125, 26.2890625, 27.5966796875, 28.904296875, 30.2119140625, 31.51953125, 32.8271484375, 34.134765625, 35.4423828125, 36.75]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 14.0, 15.0, 15.0, 24.0, 35.0, 47.0, 73.0, 117.0, 178.0, 289.0, 462.0, 669.0, 1086.0, 1746.0, 2724.0, 4756.0, 7998.0, 13618.0, 24344.0, 46730.0, 99934.0, 259997.0, 330142.0, 127810.0, 56989.0, 29092.0, 15981.0, 9347.0, 5484.0, 3316.0, 1995.0, 1311.0, 771.0, 468.0, 341.0, 235.0, 111.0, 100.0, 64.0, 41.0, 22.0, 19.0, 14.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.6875, -32.56982421875, -31.4521484375, -30.33447265625, -29.216796875, -28.09912109375, -26.9814453125, -25.86376953125, -24.74609375, -23.62841796875, -22.5107421875, -21.39306640625, -20.275390625, -19.15771484375, -18.0400390625, -16.92236328125, -15.8046875, -14.68701171875, -13.5693359375, -12.45166015625, -11.333984375, -10.21630859375, -9.0986328125, -7.98095703125, -6.86328125, -5.74560546875, -4.6279296875, -3.51025390625, -2.392578125, -1.27490234375, -0.1572265625, 0.96044921875, 2.078125, 3.19580078125, 4.3134765625, 5.43115234375, 6.548828125, 7.66650390625, 8.7841796875, 9.90185546875, 11.01953125, 12.13720703125, 13.2548828125, 14.37255859375, 15.490234375, 16.60791015625, 17.7255859375, 18.84326171875, 19.9609375, 21.07861328125, 22.1962890625, 23.31396484375, 24.431640625, 25.54931640625, 26.6669921875, 27.78466796875, 28.90234375, 30.02001953125, 31.1376953125, 32.25537109375, 33.373046875, 34.49072265625, 35.6083984375, 36.72607421875, 37.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 16.0, 23.0, 20.0, 34.0, 28.0, 32.0, 36.0, 32.0, 39.0, 48.0, 41.0, 48.0, 51.0, 42.0, 58.0, 46.0, 35.0, 38.0, 33.0, 31.0, 22.0, 30.0, 26.0, 28.0, 18.0, 16.0, 16.0, 12.0, 16.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.171875, -19.4619140625, -18.751953125, -18.0419921875, -17.33203125, -16.6220703125, -15.912109375, -15.2021484375, -14.4921875, -13.7822265625, -13.072265625, -12.3623046875, -11.65234375, -10.9423828125, -10.232421875, -9.5224609375, -8.8125, -8.1025390625, -7.392578125, -6.6826171875, -5.97265625, -5.2626953125, -4.552734375, -3.8427734375, -3.1328125, -2.4228515625, -1.712890625, -1.0029296875, -0.29296875, 0.4169921875, 1.126953125, 1.8369140625, 2.546875, 3.2568359375, 3.966796875, 4.6767578125, 5.38671875, 6.0966796875, 6.806640625, 7.5166015625, 8.2265625, 8.9365234375, 9.646484375, 10.3564453125, 11.06640625, 11.7763671875, 12.486328125, 13.1962890625, 13.90625, 14.6162109375, 15.326171875, 16.0361328125, 16.74609375, 17.4560546875, 18.166015625, 18.8759765625, 19.5859375, 20.2958984375, 21.005859375, 21.7158203125, 22.42578125, 23.1357421875, 23.845703125, 24.5556640625, 25.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 12.0, 10.0, 16.0, 23.0, 40.0, 40.0, 76.0, 92.0, 131.0, 201.0, 278.0, 458.0, 586.0, 916.0, 1476.0, 2307.0, 3702.0, 6330.0, 11234.0, 20532.0, 40198.0, 82439.0, 173009.0, 296167.0, 206428.0, 98484.0, 47249.0, 24197.0, 13043.0, 7292.0, 4264.0, 2601.0, 1625.0, 1061.0, 642.0, 420.0, 303.0, 213.0, 136.0, 109.0, 50.0, 55.0, 31.0, 24.0, 13.0, 13.0, 9.0, 3.0, 2.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.5389404296875, -7.300537109375, -7.0621337890625, -6.82373046875, -6.5853271484375, -6.346923828125, -6.1085205078125, -5.8701171875, -5.6317138671875, -5.393310546875, -5.1549072265625, -4.91650390625, -4.6781005859375, -4.439697265625, -4.2012939453125, -3.962890625, -3.7244873046875, -3.486083984375, -3.2476806640625, -3.00927734375, -2.7708740234375, -2.532470703125, -2.2940673828125, -2.0556640625, -1.8172607421875, -1.578857421875, -1.3404541015625, -1.10205078125, -0.8636474609375, -0.625244140625, -0.3868408203125, -0.1484375, 0.0899658203125, 0.328369140625, 0.5667724609375, 0.80517578125, 1.0435791015625, 1.281982421875, 1.5203857421875, 1.7587890625, 1.9971923828125, 2.235595703125, 2.4739990234375, 2.71240234375, 2.9508056640625, 3.189208984375, 3.4276123046875, 3.666015625, 3.9044189453125, 4.142822265625, 4.3812255859375, 4.61962890625, 4.8580322265625, 5.096435546875, 5.3348388671875, 5.5732421875, 5.8116455078125, 6.050048828125, 6.2884521484375, 6.52685546875, 6.7652587890625, 7.003662109375, 7.2420654296875, 7.48046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 19.0, 28.0, 30.0, 42.0, 41.0, 73.0, 73.0, 82.0, 90.0, 82.0, 61.0, 57.0, 46.0, 46.0, 41.0, 32.0, 29.0, 21.0, 20.0, 14.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010938644409179688, -0.001065678894519806, -0.001037493348121643, -0.0010093078017234802, -0.0009811222553253174, -0.0009529367089271545, -0.0009247511625289917, -0.0008965656161308289, -0.000868380069732666, -0.0008401945233345032, -0.0008120089769363403, -0.0007838234305381775, -0.0007556378841400146, -0.0007274523377418518, -0.000699266791343689, -0.0006710812449455261, -0.0006428956985473633, -0.0006147101521492004, -0.0005865246057510376, -0.0005583390593528748, -0.0005301535129547119, -0.0005019679665565491, -0.00047378242015838623, -0.0004455968737602234, -0.00041741132736206055, -0.0003892257809638977, -0.00036104023456573486, -0.000332854688167572, -0.0003046691417694092, -0.00027648359537124634, -0.0002482980489730835, -0.00022011250257492065, -0.0001919269561767578, -0.00016374140977859497, -0.00013555586338043213, -0.00010737031698226929, -7.918477058410645e-05, -5.0999224185943604e-05, -2.2813677787780762e-05, 5.37186861038208e-06, 3.355741500854492e-05, 6.174296140670776e-05, 8.99285078048706e-05, 0.00011811405420303345, 0.0001462996006011963, 0.00017448514699935913, 0.00020267069339752197, 0.00023085623979568481, 0.00025904178619384766, 0.0002872273325920105, 0.00031541287899017334, 0.0003435984253883362, 0.000371783971786499, 0.00039996951818466187, 0.0004281550645828247, 0.00045634061098098755, 0.0004845261573791504, 0.0005127117037773132, 0.0005408972501754761, 0.0005690827965736389, 0.0005972683429718018, 0.0006254538893699646, 0.0006536394357681274, 0.0006818249821662903, 0.0007100105285644531]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 14.0, 14.0, 23.0, 19.0, 45.0, 72.0, 89.0, 134.0, 161.0, 257.0, 382.0, 655.0, 1031.0, 1725.0, 2881.0, 5142.0, 9570.0, 18481.0, 37291.0, 78460.0, 166162.0, 288396.0, 223825.0, 108538.0, 51595.0, 24784.0, 12699.0, 6661.0, 3698.0, 2171.0, 1291.0, 786.0, 525.0, 333.0, 206.0, 136.0, 96.0, 52.0, 34.0, 38.0, 19.0, 18.0, 6.0, 15.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-10.203125, -9.9005126953125, -9.597900390625, -9.2952880859375, -8.99267578125, -8.6900634765625, -8.387451171875, -8.0848388671875, -7.7822265625, -7.4796142578125, -7.177001953125, -6.8743896484375, -6.57177734375, -6.2691650390625, -5.966552734375, -5.6639404296875, -5.361328125, -5.0587158203125, -4.756103515625, -4.4534912109375, -4.15087890625, -3.8482666015625, -3.545654296875, -3.2430419921875, -2.9404296875, -2.6378173828125, -2.335205078125, -2.0325927734375, -1.72998046875, -1.4273681640625, -1.124755859375, -0.8221435546875, -0.51953125, -0.2169189453125, 0.085693359375, 0.3883056640625, 0.69091796875, 0.9935302734375, 1.296142578125, 1.5987548828125, 1.9013671875, 2.2039794921875, 2.506591796875, 2.8092041015625, 3.11181640625, 3.4144287109375, 3.717041015625, 4.0196533203125, 4.322265625, 4.6248779296875, 4.927490234375, 5.2301025390625, 5.53271484375, 5.8353271484375, 6.137939453125, 6.4405517578125, 6.7431640625, 7.0457763671875, 7.348388671875, 7.6510009765625, 7.95361328125, 8.2562255859375, 8.558837890625, 8.8614501953125, 9.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 16.0, 14.0, 27.0, 26.0, 31.0, 42.0, 58.0, 62.0, 80.0, 61.0, 76.0, 76.0, 66.0, 69.0, 48.0, 35.0, 37.0, 21.0, 18.0, 18.0, 15.0, 10.0, 7.0, 5.0, 12.0, 4.0, 5.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.859100341796875, -2.77288818359375, -2.686676025390625, -2.6004638671875, -2.514251708984375, -2.42803955078125, -2.341827392578125, -2.255615234375, -2.169403076171875, -2.08319091796875, -1.996978759765625, -1.9107666015625, -1.824554443359375, -1.73834228515625, -1.652130126953125, -1.56591796875, -1.479705810546875, -1.39349365234375, -1.307281494140625, -1.2210693359375, -1.134857177734375, -1.04864501953125, -0.962432861328125, -0.876220703125, -0.790008544921875, -0.70379638671875, -0.617584228515625, -0.5313720703125, -0.445159912109375, -0.35894775390625, -0.272735595703125, -0.1865234375, -0.100311279296875, -0.01409912109375, 0.072113037109375, 0.1583251953125, 0.244537353515625, 0.33074951171875, 0.416961669921875, 0.503173828125, 0.589385986328125, 0.67559814453125, 0.761810302734375, 0.8480224609375, 0.934234619140625, 1.02044677734375, 1.106658935546875, 1.19287109375, 1.279083251953125, 1.36529541015625, 1.451507568359375, 1.5377197265625, 1.623931884765625, 1.71014404296875, 1.796356201171875, 1.882568359375, 1.968780517578125, 2.05499267578125, 2.141204833984375, 2.2274169921875, 2.313629150390625, 2.39984130859375, 2.486053466796875, 2.572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 17.0, 14.0, 25.0, 30.0, 45.0, 44.0, 64.0, 61.0, 60.0, 75.0, 83.0, 80.0, 67.0, 57.0, 61.0, 44.0, 27.0, 28.0, 20.0, 16.0, 16.0, 12.0, 6.0, 8.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.283668518066406, -45.869693756103516, -44.455718994140625, -43.04174041748047, -41.62776565551758, -40.21379089355469, -38.79981231689453, -37.38583755493164, -35.97186279296875, -34.55788803100586, -33.14391326904297, -31.729934692382812, -30.315959930419922, -28.90198516845703, -27.488008499145508, -26.074031829833984, -24.660057067871094, -23.246082305908203, -21.83210563659668, -20.418128967285156, -19.004154205322266, -17.590179443359375, -16.17620277404785, -14.762227058410645, -13.348251342773438, -11.93427562713623, -10.520299911499023, -9.106324195861816, -7.692348480224609, -6.278372764587402, -4.864397048950195, -3.4504213333129883, -2.0364456176757812, -0.6224699020385742, 0.7915058135986328, 2.20548152923584, 3.619457244873047, 5.033432960510254, 6.447408676147461, 7.861384391784668, 9.275360107421875, 10.689335823059082, 12.103311538696289, 13.517287254333496, 14.931262969970703, 16.345237731933594, 17.759214401245117, 19.17319107055664, 20.58716583251953, 22.001140594482422, 23.415117263793945, 24.82909393310547, 26.24306869506836, 27.65704345703125, 29.071020126342773, 30.484996795654297, 31.898971557617188, 33.31294631958008, 34.72692108154297, 36.140899658203125, 37.554874420166016, 38.968849182128906, 40.38282775878906, 41.79680252075195, 43.210777282714844]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 14.0, 8.0, 12.0, 13.0, 14.0, 14.0, 26.0, 19.0, 28.0, 31.0, 20.0, 28.0, 31.0, 43.0, 47.0, 42.0, 49.0, 50.0, 43.0, 48.0, 43.0, 48.0, 52.0, 34.0, 41.0, 42.0, 28.0, 23.0, 22.0, 16.0, 10.0, 10.0, 8.0, 14.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.58190155029297, -41.38736343383789, -40.19282531738281, -38.998291015625, -37.80375289916992, -36.609214782714844, -35.41468048095703, -34.22014236450195, -33.025604248046875, -31.831066131591797, -30.63652992248535, -29.441993713378906, -28.247455596923828, -27.05291748046875, -25.858381271362305, -24.66384506225586, -23.46930694580078, -22.274768829345703, -21.080232620239258, -19.885696411132812, -18.691158294677734, -17.496620178222656, -16.30208396911621, -15.10754680633545, -13.913009643554688, -12.718472480773926, -11.523935317993164, -10.329398155212402, -9.13486099243164, -7.940323829650879, -6.745786666870117, -5.5512495040893555, -4.356708526611328, -3.1621713638305664, -1.9676342010498047, -0.773097038269043, 0.42144012451171875, 1.6159772872924805, 2.810514450073242, 4.005051612854004, 5.199588775634766, 6.394125938415527, 7.588663101196289, 8.78320026397705, 9.977737426757812, 11.172274589538574, 12.366811752319336, 13.561348915100098, 14.75588607788086, 15.950423240661621, 17.144960403442383, 18.339496612548828, 19.534034729003906, 20.728572845458984, 21.92310905456543, 23.117645263671875, 24.312183380126953, 25.50672149658203, 26.701257705688477, 27.895793914794922, 29.09033203125, 30.284870147705078, 31.479406356811523, 32.67394256591797, 33.86848068237305]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 7.0, 23.0, 37.0, 34.0, 59.0, 95.0, 154.0, 230.0, 341.0, 556.0, 829.0, 1411.0, 2186.0, 3465.0, 5566.0, 8891.0, 14905.0, 23717.0, 38754.0, 63073.0, 101748.0, 157298.0, 198170.0, 158873.0, 102970.0, 63138.0, 38982.0, 24053.0, 14761.0, 8999.0, 5566.0, 3528.0, 2278.0, 1406.0, 875.0, 580.0, 340.0, 237.0, 157.0, 80.0, 54.0, 48.0, 17.0, 22.0, 13.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-38.96875, -37.73193359375, -36.4951171875, -35.25830078125, -34.021484375, -32.78466796875, -31.5478515625, -30.31103515625, -29.07421875, -27.83740234375, -26.6005859375, -25.36376953125, -24.126953125, -22.89013671875, -21.6533203125, -20.41650390625, -19.1796875, -17.94287109375, -16.7060546875, -15.46923828125, -14.232421875, -12.99560546875, -11.7587890625, -10.52197265625, -9.28515625, -8.04833984375, -6.8115234375, -5.57470703125, -4.337890625, -3.10107421875, -1.8642578125, -0.62744140625, 0.609375, 1.84619140625, 3.0830078125, 4.31982421875, 5.556640625, 6.79345703125, 8.0302734375, 9.26708984375, 10.50390625, 11.74072265625, 12.9775390625, 14.21435546875, 15.451171875, 16.68798828125, 17.9248046875, 19.16162109375, 20.3984375, 21.63525390625, 22.8720703125, 24.10888671875, 25.345703125, 26.58251953125, 27.8193359375, 29.05615234375, 30.29296875, 31.52978515625, 32.7666015625, 34.00341796875, 35.240234375, 36.47705078125, 37.7138671875, 38.95068359375, 40.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 7.0, 6.0, 9.0, 13.0, 14.0, 8.0, 15.0, 19.0, 26.0, 19.0, 25.0, 20.0, 32.0, 37.0, 30.0, 49.0, 55.0, 49.0, 52.0, 49.0, 49.0, 50.0, 60.0, 47.0, 34.0, 45.0, 39.0, 31.0, 27.0, 13.0, 13.0, 11.0, 11.0, 10.0, 7.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.21875, -42.01171875, -40.8046875, -39.59765625, -38.390625, -37.18359375, -35.9765625, -34.76953125, -33.5625, -32.35546875, -31.1484375, -29.94140625, -28.734375, -27.52734375, -26.3203125, -25.11328125, -23.90625, -22.69921875, -21.4921875, -20.28515625, -19.078125, -17.87109375, -16.6640625, -15.45703125, -14.25, -13.04296875, -11.8359375, -10.62890625, -9.421875, -8.21484375, -7.0078125, -5.80078125, -4.59375, -3.38671875, -2.1796875, -0.97265625, 0.234375, 1.44140625, 2.6484375, 3.85546875, 5.0625, 6.26953125, 7.4765625, 8.68359375, 9.890625, 11.09765625, 12.3046875, 13.51171875, 14.71875, 15.92578125, 17.1328125, 18.33984375, 19.546875, 20.75390625, 21.9609375, 23.16796875, 24.375, 25.58203125, 26.7890625, 27.99609375, 29.203125, 30.41015625, 31.6171875, 32.82421875, 34.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 10.0, 13.0, 25.0, 22.0, 31.0, 44.0, 88.0, 124.0, 192.0, 256.0, 409.0, 633.0, 920.0, 1411.0, 2037.0, 3102.0, 4774.0, 7116.0, 10917.0, 16508.0, 25070.0, 38595.0, 58686.0, 88533.0, 129064.0, 166779.0, 155948.0, 114212.0, 76289.0, 50302.0, 33135.0, 21554.0, 14195.0, 9385.0, 6187.0, 4055.0, 2674.0, 1727.0, 1195.0, 780.0, 499.0, 343.0, 237.0, 144.0, 111.0, 79.0, 48.0, 36.0, 25.0, 11.0, 11.0, 11.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.25, -34.02685546875, -32.8037109375, -31.58056640625, -30.357421875, -29.13427734375, -27.9111328125, -26.68798828125, -25.46484375, -24.24169921875, -23.0185546875, -21.79541015625, -20.572265625, -19.34912109375, -18.1259765625, -16.90283203125, -15.6796875, -14.45654296875, -13.2333984375, -12.01025390625, -10.787109375, -9.56396484375, -8.3408203125, -7.11767578125, -5.89453125, -4.67138671875, -3.4482421875, -2.22509765625, -1.001953125, 0.22119140625, 1.4443359375, 2.66748046875, 3.890625, 5.11376953125, 6.3369140625, 7.56005859375, 8.783203125, 10.00634765625, 11.2294921875, 12.45263671875, 13.67578125, 14.89892578125, 16.1220703125, 17.34521484375, 18.568359375, 19.79150390625, 21.0146484375, 22.23779296875, 23.4609375, 24.68408203125, 25.9072265625, 27.13037109375, 28.353515625, 29.57666015625, 30.7998046875, 32.02294921875, 33.24609375, 34.46923828125, 35.6923828125, 36.91552734375, 38.138671875, 39.36181640625, 40.5849609375, 41.80810546875, 43.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 14.0, 10.0, 8.0, 11.0, 8.0, 15.0, 22.0, 19.0, 11.0, 27.0, 24.0, 23.0, 29.0, 39.0, 31.0, 37.0, 24.0, 37.0, 26.0, 43.0, 42.0, 38.0, 32.0, 36.0, 34.0, 47.0, 30.0, 26.0, 37.0, 22.0, 28.0, 20.0, 20.0, 18.0, 23.0, 14.0, 16.0, 7.0, 12.0, 8.0, 9.0, 2.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.709228515625, -18.05908203125, -17.408935546875, -16.7587890625, -16.108642578125, -15.45849609375, -14.808349609375, -14.158203125, -13.508056640625, -12.85791015625, -12.207763671875, -11.5576171875, -10.907470703125, -10.25732421875, -9.607177734375, -8.95703125, -8.306884765625, -7.65673828125, -7.006591796875, -6.3564453125, -5.706298828125, -5.05615234375, -4.406005859375, -3.755859375, -3.105712890625, -2.45556640625, -1.805419921875, -1.1552734375, -0.505126953125, 0.14501953125, 0.795166015625, 1.4453125, 2.095458984375, 2.74560546875, 3.395751953125, 4.0458984375, 4.696044921875, 5.34619140625, 5.996337890625, 6.646484375, 7.296630859375, 7.94677734375, 8.596923828125, 9.2470703125, 9.897216796875, 10.54736328125, 11.197509765625, 11.84765625, 12.497802734375, 13.14794921875, 13.798095703125, 14.4482421875, 15.098388671875, 15.74853515625, 16.398681640625, 17.048828125, 17.698974609375, 18.34912109375, 18.999267578125, 19.6494140625, 20.299560546875, 20.94970703125, 21.599853515625, 22.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 14.0, 34.0, 35.0, 64.0, 65.0, 83.0, 159.0, 243.0, 344.0, 506.0, 822.0, 1317.0, 2163.0, 3585.0, 6398.0, 11480.0, 21717.0, 42286.0, 87756.0, 184611.0, 287426.0, 200708.0, 97234.0, 46716.0, 23570.0, 12483.0, 6785.0, 3790.0, 2283.0, 1388.0, 841.0, 535.0, 342.0, 255.0, 173.0, 99.0, 69.0, 52.0, 43.0, 21.0, 8.0, 9.0, 15.0, 4.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -24.020263671875, -23.25927734375, -22.498291015625, -21.7373046875, -20.976318359375, -20.21533203125, -19.454345703125, -18.693359375, -17.932373046875, -17.17138671875, -16.410400390625, -15.6494140625, -14.888427734375, -14.12744140625, -13.366455078125, -12.60546875, -11.844482421875, -11.08349609375, -10.322509765625, -9.5615234375, -8.800537109375, -8.03955078125, -7.278564453125, -6.517578125, -5.756591796875, -4.99560546875, -4.234619140625, -3.4736328125, -2.712646484375, -1.95166015625, -1.190673828125, -0.4296875, 0.331298828125, 1.09228515625, 1.853271484375, 2.6142578125, 3.375244140625, 4.13623046875, 4.897216796875, 5.658203125, 6.419189453125, 7.18017578125, 7.941162109375, 8.7021484375, 9.463134765625, 10.22412109375, 10.985107421875, 11.74609375, 12.507080078125, 13.26806640625, 14.029052734375, 14.7900390625, 15.551025390625, 16.31201171875, 17.072998046875, 17.833984375, 18.594970703125, 19.35595703125, 20.116943359375, 20.8779296875, 21.638916015625, 22.39990234375, 23.160888671875, 23.921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 8.0, 18.0, 23.0, 34.0, 33.0, 45.0, 54.0, 72.0, 81.0, 94.0, 117.0, 83.0, 72.0, 59.0, 52.0, 34.0, 22.0, 15.0, 16.0, 6.0, 10.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.0027250945568084717, -0.0026425719261169434, -0.002560049295425415, -0.0024775266647338867, -0.0023950040340423584, -0.00231248140335083, -0.0022299587726593018, -0.0021474361419677734, -0.002064913511276245, -0.001982390880584717, -0.0018998682498931885, -0.0018173456192016602, -0.0017348229885101318, -0.0016523003578186035, -0.0015697777271270752, -0.0014872550964355469, -0.0014047324657440186, -0.0013222098350524902, -0.001239687204360962, -0.0011571645736694336, -0.0010746419429779053, -0.000992119312286377, -0.0009095966815948486, -0.0008270740509033203, -0.000744551420211792, -0.0006620287895202637, -0.0005795061588287354, -0.000496983528137207, -0.0004144608974456787, -0.0003319382667541504, -0.00024941563606262207, -0.00016689300537109375, -8.437037467956543e-05, -1.8477439880371094e-06, 8.067488670349121e-05, 0.00016319751739501953, 0.00024572014808654785, 0.00032824277877807617, 0.0004107654094696045, 0.0004932880401611328, 0.0005758106708526611, 0.0006583333015441895, 0.0007408559322357178, 0.0008233785629272461, 0.0009059011936187744, 0.0009884238243103027, 0.001070946455001831, 0.0011534690856933594, 0.0012359917163848877, 0.001318514347076416, 0.0014010369777679443, 0.0014835596084594727, 0.001566082239151001, 0.0016486048698425293, 0.0017311275005340576, 0.001813650131225586, 0.0018961727619171143, 0.0019786953926086426, 0.002061218023300171, 0.0021437406539916992, 0.0022262632846832275, 0.002308785915374756, 0.002391308546066284, 0.0024738311767578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 18.0, 26.0, 31.0, 41.0, 79.0, 73.0, 150.0, 200.0, 346.0, 512.0, 855.0, 1462.0, 2249.0, 3954.0, 6690.0, 11593.0, 21262.0, 39563.0, 74866.0, 141246.0, 237694.0, 224822.0, 130174.0, 68629.0, 36377.0, 19419.0, 10850.0, 6092.0, 3548.0, 2132.0, 1308.0, 795.0, 520.0, 339.0, 195.0, 137.0, 86.0, 56.0, 53.0, 28.0, 17.0, 17.0, 7.0, 8.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.25, -20.56298828125, -19.8759765625, -19.18896484375, -18.501953125, -17.81494140625, -17.1279296875, -16.44091796875, -15.75390625, -15.06689453125, -14.3798828125, -13.69287109375, -13.005859375, -12.31884765625, -11.6318359375, -10.94482421875, -10.2578125, -9.57080078125, -8.8837890625, -8.19677734375, -7.509765625, -6.82275390625, -6.1357421875, -5.44873046875, -4.76171875, -4.07470703125, -3.3876953125, -2.70068359375, -2.013671875, -1.32666015625, -0.6396484375, 0.04736328125, 0.734375, 1.42138671875, 2.1083984375, 2.79541015625, 3.482421875, 4.16943359375, 4.8564453125, 5.54345703125, 6.23046875, 6.91748046875, 7.6044921875, 8.29150390625, 8.978515625, 9.66552734375, 10.3525390625, 11.03955078125, 11.7265625, 12.41357421875, 13.1005859375, 13.78759765625, 14.474609375, 15.16162109375, 15.8486328125, 16.53564453125, 17.22265625, 17.90966796875, 18.5966796875, 19.28369140625, 19.970703125, 20.65771484375, 21.3447265625, 22.03173828125, 22.71875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 4.0, 4.0, 8.0, 13.0, 14.0, 17.0, 17.0, 33.0, 34.0, 33.0, 40.0, 39.0, 48.0, 47.0, 50.0, 66.0, 52.0, 68.0, 64.0, 52.0, 47.0, 37.0, 32.0, 25.0, 31.0, 31.0, 11.0, 21.0, 12.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.46728515625, -7.2509765625, -7.03466796875, -6.818359375, -6.60205078125, -6.3857421875, -6.16943359375, -5.953125, -5.73681640625, -5.5205078125, -5.30419921875, -5.087890625, -4.87158203125, -4.6552734375, -4.43896484375, -4.22265625, -4.00634765625, -3.7900390625, -3.57373046875, -3.357421875, -3.14111328125, -2.9248046875, -2.70849609375, -2.4921875, -2.27587890625, -2.0595703125, -1.84326171875, -1.626953125, -1.41064453125, -1.1943359375, -0.97802734375, -0.76171875, -0.54541015625, -0.3291015625, -0.11279296875, 0.103515625, 0.31982421875, 0.5361328125, 0.75244140625, 0.96875, 1.18505859375, 1.4013671875, 1.61767578125, 1.833984375, 2.05029296875, 2.2666015625, 2.48291015625, 2.69921875, 2.91552734375, 3.1318359375, 3.34814453125, 3.564453125, 3.78076171875, 3.9970703125, 4.21337890625, 4.4296875, 4.64599609375, 4.8623046875, 5.07861328125, 5.294921875, 5.51123046875, 5.7275390625, 5.94384765625, 6.16015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 9.0, 15.0, 19.0, 15.0, 22.0, 25.0, 32.0, 50.0, 40.0, 56.0, 58.0, 68.0, 58.0, 57.0, 62.0, 64.0, 59.0, 37.0, 40.0, 47.0, 17.0, 21.0, 22.0, 20.0, 15.0, 12.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.43230438232422, -41.18538284301758, -39.93846130371094, -38.6915397644043, -37.444618225097656, -36.197696685791016, -34.950775146484375, -33.703853607177734, -32.456932067871094, -31.210010528564453, -29.963088989257812, -28.716167449951172, -27.46924591064453, -26.22232437133789, -24.97540283203125, -23.72848129272461, -22.481557846069336, -21.234636306762695, -19.987714767456055, -18.740793228149414, -17.493871688842773, -16.246950149536133, -15.000027656555176, -13.753106117248535, -12.506184577941895, -11.259263038635254, -10.012341499328613, -8.765419006347656, -7.518497943878174, -6.271576404571533, -5.024654388427734, -3.7777328491210938, -2.530811309814453, -1.283889651298523, -0.03696799278259277, 1.209953784942627, 2.4568753242492676, 3.703796863555908, 4.950718879699707, 6.197640419006348, 7.444561958312988, 8.691483497619629, 9.93840503692627, 11.185327529907227, 12.432249069213867, 13.679170608520508, 14.926092147827148, 16.17301368713379, 17.41993522644043, 18.66685676574707, 19.91377830505371, 21.16069984436035, 22.407621383666992, 23.654542922973633, 24.901466369628906, 26.148387908935547, 27.395309448242188, 28.642230987548828, 29.88915252685547, 31.13607406616211, 32.38299560546875, 33.62991714477539, 34.87683868408203, 36.12376022338867, 37.37068176269531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 6.0, 10.0, 9.0, 13.0, 9.0, 13.0, 19.0, 25.0, 22.0, 30.0, 34.0, 34.0, 31.0, 47.0, 32.0, 52.0, 43.0, 44.0, 44.0, 39.0, 52.0, 42.0, 42.0, 47.0, 44.0, 38.0, 28.0, 26.0, 19.0, 23.0, 16.0, 14.0, 12.0, 14.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.439571380615234, -45.023658752441406, -43.607749938964844, -42.191837310791016, -40.77592468261719, -39.360015869140625, -37.9441032409668, -36.52819061279297, -35.112281799316406, -33.69636917114258, -32.280460357666016, -30.864547729492188, -29.448637008666992, -28.032726287841797, -26.61681365966797, -25.200902938842773, -23.784992218017578, -22.369081497192383, -20.953170776367188, -19.53725814819336, -18.121347427368164, -16.70543670654297, -15.289525032043457, -13.873613357543945, -12.45770263671875, -11.041791915893555, -9.625880241394043, -8.209968566894531, -6.794057846069336, -5.378146648406982, -3.962235450744629, -2.546323776245117, -1.1304092407226562, 0.28550195693969727, 1.7014131546020508, 3.1173243522644043, 4.533235549926758, 5.949146747589111, 7.365057945251465, 8.780969619750977, 10.196880340576172, 11.612791061401367, 13.028702735900879, 14.44461441040039, 15.860525131225586, 17.27643585205078, 18.69234848022461, 20.108259201049805, 21.524169921875, 22.940080642700195, 24.35599136352539, 25.77190399169922, 27.187814712524414, 28.60372543334961, 30.019638061523438, 31.435548782348633, 32.85145950317383, 34.267372131347656, 35.68328094482422, 37.09919357299805, 38.515106201171875, 39.93101501464844, 41.346927642822266, 42.762840270996094, 44.178749084472656]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 8.0, 14.0, 17.0, 17.0, 21.0, 32.0, 45.0, 56.0, 64.0, 85.0, 127.0, 163.0, 233.0, 304.0, 419.0, 671.0, 874.0, 1043125.0, 1167.0, 856.0, 648.0, 462.0, 319.0, 198.0, 166.0, 129.0, 78.0, 62.0, 51.0, 48.0, 27.0, 26.0, 20.0, 8.0, 11.0, 11.0, 7.0, 7.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-885.319091796875, -860.0007934570312, -834.6824951171875, -809.3641967773438, -784.0458984375, -758.7276000976562, -733.4093017578125, -708.0910034179688, -682.772705078125, -657.4544067382812, -632.1361083984375, -606.8178100585938, -581.49951171875, -556.1812133789062, -530.8629150390625, -505.54461669921875, -480.2263488769531, -454.9080505371094, -429.5897521972656, -404.2714538574219, -378.9531555175781, -353.6348571777344, -328.31658935546875, -302.998291015625, -277.67999267578125, -252.3616943359375, -227.04339599609375, -201.72509765625, -176.40679931640625, -151.0885009765625, -125.77021789550781, -100.45191955566406, -75.13360595703125, -49.8153076171875, -24.497013092041016, 0.8212814331054688, 26.13957977294922, 51.45787811279297, 76.77616882324219, 102.09446716308594, 127.41276550292969, 152.73106384277344, 178.0493621826172, 203.36764526367188, 228.68594360351562, 254.00424194335938, 279.3225402832031, 304.6408386230469, 329.9591369628906, 355.2774353027344, 380.5957336425781, 405.9140319824219, 431.2323303222656, 456.5506286621094, 481.868896484375, 507.18719482421875, 532.5054931640625, 557.8237915039062, 583.14208984375, 608.4603881835938, 633.7786865234375, 659.0969848632812, 684.415283203125, 709.7335815429688, 735.0518798828125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 10.0, 9.0, 14.0, 18.0, 23.0, 26.0, 23.0, 23.0, 39.0, 52.0, 62.0, 81.0, 110.0, 130.0, 168.0, 238.0, 413.0, 1584.0, 51458464.0, 7699.0, 902.0, 325.0, 202.0, 149.0, 115.0, 95.0, 74.0, 60.0, 47.0, 29.0, 26.0, 22.0, 22.0, 14.0, 16.0, 12.0, 14.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3355.04296875, -3238.647705078125, -3122.25244140625, -3005.857177734375, -2889.4619140625, -2773.066650390625, -2656.67138671875, -2540.276123046875, -2423.880859375, -2307.485595703125, -2191.09033203125, -2074.695068359375, -1958.2998046875, -1841.904541015625, -1725.50927734375, -1609.114013671875, -1492.71875, -1376.323486328125, -1259.92822265625, -1143.532958984375, -1027.1376953125, -910.742431640625, -794.34716796875, -677.951904296875, -561.556640625, -445.161376953125, -328.76611328125, -212.370849609375, -95.9755859375, 20.419677734375, 136.81494140625, 253.210205078125, 369.605712890625, 486.0009765625, 602.396240234375, 718.79150390625, 835.186767578125, 951.58203125, 1067.977294921875, 1184.37255859375, 1300.767822265625, 1417.1630859375, 1533.558349609375, 1649.95361328125, 1766.348876953125, 1882.744140625, 1999.139404296875, 2115.53466796875, 2231.929931640625, 2348.3251953125, 2464.720458984375, 2581.11572265625, 2697.510986328125, 2813.90625, 2930.301513671875, 3046.69677734375, 3163.092041015625, 3279.4873046875, 3395.882568359375, 3512.27783203125, 3628.673095703125, 3745.068359375, 3861.463623046875, 3977.85888671875, 4094.254150390625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 13.0, 13.0, 21.0, 54.0, 67.0, 111.0, 205.0, 375.0, 647.0, 1167.0, 2128.0, 3966.0, 8101.0, 16808.0, 35378.0, 79686.0, 192082.0, 522875.0, 1990817.0, 2437926.0, 612143.0, 218663.0, 90331.0, 40360.0, 18642.0, 9076.0, 4563.0, 2370.0, 1208.0, 698.0, 373.0, 208.0, 122.0, 84.0, 54.0, 36.0, 18.0, 21.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-162.375, -157.8740234375, -153.373046875, -148.8720703125, -144.37109375, -139.8701171875, -135.369140625, -130.8681640625, -126.3671875, -121.8662109375, -117.365234375, -112.8642578125, -108.36328125, -103.8623046875, -99.361328125, -94.8603515625, -90.359375, -85.8583984375, -81.357421875, -76.8564453125, -72.35546875, -67.8544921875, -63.353515625, -58.8525390625, -54.3515625, -49.8505859375, -45.349609375, -40.8486328125, -36.34765625, -31.8466796875, -27.345703125, -22.8447265625, -18.34375, -13.8427734375, -9.341796875, -4.8408203125, -0.33984375, 4.1611328125, 8.662109375, 13.1630859375, 17.6640625, 22.1650390625, 26.666015625, 31.1669921875, 35.66796875, 40.1689453125, 44.669921875, 49.1708984375, 53.671875, 58.1728515625, 62.673828125, 67.1748046875, 71.67578125, 76.1767578125, 80.677734375, 85.1787109375, 89.6796875, 94.1806640625, 98.681640625, 103.1826171875, 107.68359375, 112.1845703125, 116.685546875, 121.1865234375, 125.6875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 2.0, 6.0, 9.0, 15.0, 13.0, 13.0, 15.0, 18.0, 18.0, 18.0, 34.0, 40.0, 39.0, 50.0, 72.0, 97.0, 120.0, 162.0, 181.0, 212.0, 161.0, 155.0, 112.0, 93.0, 60.0, 43.0, 45.0, 33.0, 30.0, 31.0, 21.0, 14.0, 8.0, 14.0, 13.0, 8.0, 6.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.3486328125, -59.259765625, -57.1708984375, -55.08203125, -52.9931640625, -50.904296875, -48.8154296875, -46.7265625, -44.6376953125, -42.548828125, -40.4599609375, -38.37109375, -36.2822265625, -34.193359375, -32.1044921875, -30.015625, -27.9267578125, -25.837890625, -23.7490234375, -21.66015625, -19.5712890625, -17.482421875, -15.3935546875, -13.3046875, -11.2158203125, -9.126953125, -7.0380859375, -4.94921875, -2.8603515625, -0.771484375, 1.3173828125, 3.40625, 5.4951171875, 7.583984375, 9.6728515625, 11.76171875, 13.8505859375, 15.939453125, 18.0283203125, 20.1171875, 22.2060546875, 24.294921875, 26.3837890625, 28.47265625, 30.5615234375, 32.650390625, 34.7392578125, 36.828125, 38.9169921875, 41.005859375, 43.0947265625, 45.18359375, 47.2724609375, 49.361328125, 51.4501953125, 53.5390625, 55.6279296875, 57.716796875, 59.8056640625, 61.89453125, 63.9833984375, 66.072265625, 68.1611328125, 70.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 18.0, 27.0, 35.0, 36.0, 74.0, 110.0, 157.0, 238.0, 369.0, 557.0, 898.0, 1498.0, 2437.0, 3794.0, 6321.0, 10177.0, 16228.0, 26613.0, 43788.0, 72166.0, 120200.0, 200852.0, 347439.0, 711819.0, 2035070.0, 1444843.0, 536120.0, 285309.0, 168284.0, 100737.0, 60792.0, 36631.0, 22215.0, 13433.0, 8353.0, 4993.0, 3238.0, 2070.0, 1222.0, 783.0, 517.0, 321.0, 214.0, 144.0, 96.0, 43.0, 35.0, 40.0, 21.0, 25.0, 8.0, 13.0, 7.0, 0.0, 1.0, 2.0, 3.0], "bins": [-54.03125, -52.33349609375, -50.6357421875, -48.93798828125, -47.240234375, -45.54248046875, -43.8447265625, -42.14697265625, -40.44921875, -38.75146484375, -37.0537109375, -35.35595703125, -33.658203125, -31.96044921875, -30.2626953125, -28.56494140625, -26.8671875, -25.16943359375, -23.4716796875, -21.77392578125, -20.076171875, -18.37841796875, -16.6806640625, -14.98291015625, -13.28515625, -11.58740234375, -9.8896484375, -8.19189453125, -6.494140625, -4.79638671875, -3.0986328125, -1.40087890625, 0.296875, 1.99462890625, 3.6923828125, 5.39013671875, 7.087890625, 8.78564453125, 10.4833984375, 12.18115234375, 13.87890625, 15.57666015625, 17.2744140625, 18.97216796875, 20.669921875, 22.36767578125, 24.0654296875, 25.76318359375, 27.4609375, 29.15869140625, 30.8564453125, 32.55419921875, 34.251953125, 35.94970703125, 37.6474609375, 39.34521484375, 41.04296875, 42.74072265625, 44.4384765625, 46.13623046875, 47.833984375, 49.53173828125, 51.2294921875, 52.92724609375, 54.625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 6.0, 9.0, 11.0, 9.0, 15.0, 17.0, 35.0, 21.0, 32.0, 39.0, 41.0, 42.0, 55.0, 82.0, 120.0, 191.0, 265.0, 291.0, 219.0, 110.0, 75.0, 52.0, 55.0, 38.0, 29.0, 26.0, 23.0, 21.0, 17.0, 8.0, 8.0, 16.0, 6.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.375, -77.4052734375, -74.435546875, -71.4658203125, -68.49609375, -65.5263671875, -62.556640625, -59.5869140625, -56.6171875, -53.6474609375, -50.677734375, -47.7080078125, -44.73828125, -41.7685546875, -38.798828125, -35.8291015625, -32.859375, -29.8896484375, -26.919921875, -23.9501953125, -20.98046875, -18.0107421875, -15.041015625, -12.0712890625, -9.1015625, -6.1318359375, -3.162109375, -0.1923828125, 2.77734375, 5.7470703125, 8.716796875, 11.6865234375, 14.65625, 17.6259765625, 20.595703125, 23.5654296875, 26.53515625, 29.5048828125, 32.474609375, 35.4443359375, 38.4140625, 41.3837890625, 44.353515625, 47.3232421875, 50.29296875, 53.2626953125, 56.232421875, 59.2021484375, 62.171875, 65.1416015625, 68.111328125, 71.0810546875, 74.05078125, 77.0205078125, 79.990234375, 82.9599609375, 85.9296875, 88.8994140625, 91.869140625, 94.8388671875, 97.80859375, 100.7783203125, 103.748046875, 106.7177734375, 109.6875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 25.0, 43.0, 56.0, 93.0, 102.0, 135.0, 228.0, 310.0, 446.0, 625.0, 887.0, 1264.0, 1819.0, 2545.0, 3713.0, 5343.0, 7789.0, 11437.0, 17611.0, 27081.0, 43863.0, 75192.0, 176320.0, 5419130.0, 271450.0, 85783.0, 48318.0, 29903.0, 19478.0, 12715.0, 8397.0, 5788.0, 4074.0, 2810.0, 1894.0, 1403.0, 997.0, 707.0, 525.0, 335.0, 256.0, 175.0, 111.0, 85.0, 61.0, 44.0, 17.0, 16.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.1669921875, -93.771484375, -90.3759765625, -86.98046875, -83.5849609375, -80.189453125, -76.7939453125, -73.3984375, -70.0029296875, -66.607421875, -63.2119140625, -59.81640625, -56.4208984375, -53.025390625, -49.6298828125, -46.234375, -42.8388671875, -39.443359375, -36.0478515625, -32.65234375, -29.2568359375, -25.861328125, -22.4658203125, -19.0703125, -15.6748046875, -12.279296875, -8.8837890625, -5.48828125, -2.0927734375, 1.302734375, 4.6982421875, 8.09375, 11.4892578125, 14.884765625, 18.2802734375, 21.67578125, 25.0712890625, 28.466796875, 31.8623046875, 35.2578125, 38.6533203125, 42.048828125, 45.4443359375, 48.83984375, 52.2353515625, 55.630859375, 59.0263671875, 62.421875, 65.8173828125, 69.212890625, 72.6083984375, 76.00390625, 79.3994140625, 82.794921875, 86.1904296875, 89.5859375, 92.9814453125, 96.376953125, 99.7724609375, 103.16796875, 106.5634765625, 109.958984375, 113.3544921875, 116.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 13.0, 12.0, 12.0, 10.0, 18.0, 15.0, 19.0, 25.0, 29.0, 19.0, 40.0, 29.0, 33.0, 43.0, 52.0, 77.0, 152.0, 281.0, 404.0, 205.0, 97.0, 71.0, 36.0, 40.0, 36.0, 23.0, 31.0, 33.0, 20.0, 21.0, 14.0, 15.0, 12.0, 11.0, 14.0, 13.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.685546875, -137.99609375, -133.306640625, -128.6171875, -123.927734375, -119.23828125, -114.548828125, -109.859375, -105.169921875, -100.48046875, -95.791015625, -91.1015625, -86.412109375, -81.72265625, -77.033203125, -72.34375, -67.654296875, -62.96484375, -58.275390625, -53.5859375, -48.896484375, -44.20703125, -39.517578125, -34.828125, -30.138671875, -25.44921875, -20.759765625, -16.0703125, -11.380859375, -6.69140625, -2.001953125, 2.6875, 7.376953125, 12.06640625, 16.755859375, 21.4453125, 26.134765625, 30.82421875, 35.513671875, 40.203125, 44.892578125, 49.58203125, 54.271484375, 58.9609375, 63.650390625, 68.33984375, 73.029296875, 77.71875, 82.408203125, 87.09765625, 91.787109375, 96.4765625, 101.166015625, 105.85546875, 110.544921875, 115.234375, 119.923828125, 124.61328125, 129.302734375, 133.9921875, 138.681640625, 143.37109375, 148.060546875, 152.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 7.0, 8.0, 14.0, 18.0, 23.0, 35.0, 48.0, 50.0, 63.0, 87.0, 159.0, 121.0, 61.0, 61.0, 47.0, 34.0, 30.0, 16.0, 17.0, 19.0, 14.0, 7.0, 10.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2396.674072265625, -2304.192626953125, -2211.711181640625, -2119.229736328125, -2026.748291015625, -1934.266845703125, -1841.7852783203125, -1749.3038330078125, -1656.8223876953125, -1564.3409423828125, -1471.8594970703125, -1379.3779296875, -1286.896484375, -1194.4150390625, -1101.93359375, -1009.4521484375, -916.970703125, -824.4892578125, -732.0078125, -639.5263061523438, -547.0448608398438, -454.56341552734375, -362.0819091796875, -269.6004638671875, -177.1190185546875, -84.63755798339844, 7.843902587890625, 100.32537841796875, 192.80682373046875, 285.28826904296875, 377.769775390625, 470.251220703125, 562.732666015625, 655.214111328125, 747.695556640625, 840.1770629882812, 932.6585083007812, 1025.139892578125, 1117.6214599609375, 1210.1029052734375, 1302.5843505859375, 1395.0657958984375, 1487.5472412109375, 1580.02880859375, 1672.51025390625, 1764.99169921875, 1857.47314453125, 1949.95458984375, 2042.43603515625, 2134.91748046875, 2227.39892578125, 2319.88037109375, 2412.36181640625, 2504.84326171875, 2597.32470703125, 2689.80615234375, 2782.28759765625, 2874.76904296875, 2967.25048828125, 3059.73193359375, 3152.21337890625, 3244.69482421875, 3337.17626953125, 3429.65771484375, 3522.139404296875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 10.0, 14.0, 19.0, 19.0, 17.0, 22.0, 18.0, 28.0, 23.0, 32.0, 47.0, 49.0, 81.0, 105.0, 76.0, 74.0, 44.0, 25.0, 27.0, 27.0, 23.0, 21.0, 25.0, 21.0, 16.0, 16.0, 16.0, 8.0, 9.0, 10.0, 11.0, 1.0, 2.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3043.0244140625, -2941.0390625, -2839.053955078125, -2737.068603515625, -2635.08349609375, -2533.09814453125, -2431.11279296875, -2329.127685546875, -2227.142333984375, -2125.156982421875, -2023.171875, -1921.1865234375, -1819.2012939453125, -1717.216064453125, -1615.2308349609375, -1513.24560546875, -1411.2603759765625, -1309.275146484375, -1207.2899169921875, -1105.3046875, -1003.3193359375, -901.3341064453125, -799.348876953125, -697.3635864257812, -595.3783569335938, -493.3930969238281, -391.4078369140625, -289.422607421875, -187.43734741210938, -85.45208740234375, 16.53314208984375, 118.5184326171875, 220.503662109375, 322.4889221191406, 424.47418212890625, 526.4594116210938, 628.4447021484375, 730.429931640625, 832.4151611328125, 934.4004516601562, 1036.3857421875, 1138.3709716796875, 1240.356201171875, 1342.341552734375, 1444.3267822265625, 1546.31201171875, 1648.2972412109375, 1750.282470703125, 1852.2677001953125, 1954.2529296875, 2056.23828125, 2158.223388671875, 2260.208740234375, 2362.19384765625, 2464.17919921875, 2566.16455078125, 2668.149658203125, 2770.135009765625, 2872.1201171875, 2974.10546875, 3076.090576171875, 3178.075927734375, 3280.06103515625, 3382.04638671875, 3484.03173828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 27.0, 43.0, 83.0, 126.0, 208.0, 381.0, 660.0, 1029.0, 1616.0, 2868.0, 5176.0, 10051.0, 23423.0, 75797.0, 653358.0, 3228009.0, 139557.0, 32000.0, 10747.0, 4408.0, 2112.0, 1106.0, 588.0, 339.0, 187.0, 106.0, 75.0, 52.0, 36.0, 24.0, 17.0, 16.0, 3.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.328125, -28.416259765625, -27.50439453125, -26.592529296875, -25.6806640625, -24.768798828125, -23.85693359375, -22.945068359375, -22.033203125, -21.121337890625, -20.20947265625, -19.297607421875, -18.3857421875, -17.473876953125, -16.56201171875, -15.650146484375, -14.73828125, -13.826416015625, -12.91455078125, -12.002685546875, -11.0908203125, -10.178955078125, -9.26708984375, -8.355224609375, -7.443359375, -6.531494140625, -5.61962890625, -4.707763671875, -3.7958984375, -2.884033203125, -1.97216796875, -1.060302734375, -0.1484375, 0.763427734375, 1.67529296875, 2.587158203125, 3.4990234375, 4.410888671875, 5.32275390625, 6.234619140625, 7.146484375, 8.058349609375, 8.97021484375, 9.882080078125, 10.7939453125, 11.705810546875, 12.61767578125, 13.529541015625, 14.44140625, 15.353271484375, 16.26513671875, 17.177001953125, 18.0888671875, 19.000732421875, 19.91259765625, 20.824462890625, 21.736328125, 22.648193359375, 23.56005859375, 24.471923828125, 25.3837890625, 26.295654296875, 27.20751953125, 28.119384765625, 29.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 8.0, 4.0, 17.0, 26.0, 38.0, 54.0, 87.0, 96.0, 165.0, 142.0, 89.0, 83.0, 53.0, 33.0, 33.0, 16.0, 8.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.65155029296875, -3.5101318359375, -3.36871337890625, -3.227294921875, -3.08587646484375, -2.9444580078125, -2.80303955078125, -2.66162109375, -2.52020263671875, -2.3787841796875, -2.23736572265625, -2.095947265625, -1.95452880859375, -1.8131103515625, -1.67169189453125, -1.5302734375, -1.38885498046875, -1.2474365234375, -1.10601806640625, -0.964599609375, -0.82318115234375, -0.6817626953125, -0.54034423828125, -0.39892578125, -0.25750732421875, -0.1160888671875, 0.02532958984375, 0.166748046875, 0.30816650390625, 0.4495849609375, 0.59100341796875, 0.732421875, 0.87384033203125, 1.0152587890625, 1.15667724609375, 1.298095703125, 1.43951416015625, 1.5809326171875, 1.72235107421875, 1.86376953125, 2.00518798828125, 2.1466064453125, 2.28802490234375, 2.429443359375, 2.57086181640625, 2.7122802734375, 2.85369873046875, 2.9951171875, 3.13653564453125, 3.2779541015625, 3.41937255859375, 3.560791015625, 3.70220947265625, 3.8436279296875, 3.98504638671875, 4.12646484375, 4.26788330078125, 4.4093017578125, 4.55072021484375, 4.692138671875, 4.83355712890625, 4.9749755859375, 5.11639404296875, 5.2578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 5.0, 14.0, 12.0, 24.0, 21.0, 28.0, 51.0, 77.0, 90.0, 163.0, 209.0, 353.0, 582.0, 911.0, 1568.0, 2694.0, 4944.0, 9157.0, 17976.0, 38070.0, 86314.0, 228095.0, 856772.0, 2265271.0, 432912.0, 139687.0, 56128.0, 25477.0, 12288.0, 6340.0, 3415.0, 1812.0, 1095.0, 646.0, 373.0, 263.0, 153.0, 92.0, 65.0, 46.0, 30.0, 17.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.0269775390625, -14.530517578125, -14.0340576171875, -13.53759765625, -13.0411376953125, -12.544677734375, -12.0482177734375, -11.5517578125, -11.0552978515625, -10.558837890625, -10.0623779296875, -9.56591796875, -9.0694580078125, -8.572998046875, -8.0765380859375, -7.580078125, -7.0836181640625, -6.587158203125, -6.0906982421875, -5.59423828125, -5.0977783203125, -4.601318359375, -4.1048583984375, -3.6083984375, -3.1119384765625, -2.615478515625, -2.1190185546875, -1.62255859375, -1.1260986328125, -0.629638671875, -0.1331787109375, 0.36328125, 0.8597412109375, 1.356201171875, 1.8526611328125, 2.34912109375, 2.8455810546875, 3.342041015625, 3.8385009765625, 4.3349609375, 4.8314208984375, 5.327880859375, 5.8243408203125, 6.32080078125, 6.8172607421875, 7.313720703125, 7.8101806640625, 8.306640625, 8.8031005859375, 9.299560546875, 9.7960205078125, 10.29248046875, 10.7889404296875, 11.285400390625, 11.7818603515625, 12.2783203125, 12.7747802734375, 13.271240234375, 13.7677001953125, 14.26416015625, 14.7606201171875, 15.257080078125, 15.7535400390625, 16.25]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 6.0, 12.0, 16.0, 18.0, 25.0, 32.0, 42.0, 45.0, 62.0, 81.0, 99.0, 127.0, 152.0, 219.0, 298.0, 518.0, 844.0, 430.0, 254.0, 199.0, 141.0, 105.0, 70.0, 58.0, 51.0, 44.0, 26.0, 19.0, 13.0, 18.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.5306396484375, -7.322998046875, -7.1153564453125, -6.90771484375, -6.7000732421875, -6.492431640625, -6.2847900390625, -6.0771484375, -5.8695068359375, -5.661865234375, -5.4542236328125, -5.24658203125, -5.0389404296875, -4.831298828125, -4.6236572265625, -4.416015625, -4.2083740234375, -4.000732421875, -3.7930908203125, -3.58544921875, -3.3778076171875, -3.170166015625, -2.9625244140625, -2.7548828125, -2.5472412109375, -2.339599609375, -2.1319580078125, -1.92431640625, -1.7166748046875, -1.509033203125, -1.3013916015625, -1.09375, -0.8861083984375, -0.678466796875, -0.4708251953125, -0.26318359375, -0.0555419921875, 0.152099609375, 0.3597412109375, 0.5673828125, 0.7750244140625, 0.982666015625, 1.1903076171875, 1.39794921875, 1.6055908203125, 1.813232421875, 2.0208740234375, 2.228515625, 2.4361572265625, 2.643798828125, 2.8514404296875, 3.05908203125, 3.2667236328125, 3.474365234375, 3.6820068359375, 3.8896484375, 4.0972900390625, 4.304931640625, 4.5125732421875, 4.72021484375, 4.9278564453125, 5.135498046875, 5.3431396484375, 5.55078125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 13.0, 24.0, 28.0, 50.0, 67.0, 61.0, 93.0, 92.0, 99.0, 111.0, 81.0, 66.0, 45.0, 50.0, 22.0, 15.0, 10.0, 13.0, 4.0, 4.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.39988708496094, -46.92252731323242, -45.445167541503906, -43.96780776977539, -42.490447998046875, -41.01308822631836, -39.535728454589844, -38.05836868286133, -36.58100891113281, -35.1036491394043, -33.62628936767578, -32.148929595947266, -30.67156982421875, -29.194210052490234, -27.71685028076172, -26.239490509033203, -24.762128829956055, -23.28476905822754, -21.807409286499023, -20.330049514770508, -18.852689743041992, -17.375329971313477, -15.897969245910645, -14.420609474182129, -12.943249702453613, -11.465889930725098, -9.988530158996582, -8.51116943359375, -7.033810138702393, -5.556450366973877, -4.079090118408203, -2.6017303466796875, -1.1243705749511719, 0.3529893159866333, 1.8303492069244385, 3.307709217071533, 4.785068988800049, 6.2624287605285645, 7.739789009094238, 9.217148780822754, 10.69450855255127, 12.171868324279785, 13.6492280960083, 15.126588821411133, 16.60394859313965, 18.081308364868164, 19.55866813659668, 21.036027908325195, 22.51338768005371, 23.990747451782227, 25.468107223510742, 26.945466995239258, 28.422826766967773, 29.90018653869629, 31.377548217773438, 32.85490798950195, 34.33226776123047, 35.809627532958984, 37.2869873046875, 38.764347076416016, 40.24170684814453, 41.71906661987305, 43.19642639160156, 44.67378616333008, 46.151145935058594]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 10.0, 15.0, 13.0, 18.0, 18.0, 15.0, 22.0, 23.0, 23.0, 34.0, 31.0, 37.0, 31.0, 39.0, 45.0, 41.0, 33.0, 45.0, 35.0, 38.0, 39.0, 43.0, 42.0, 35.0, 27.0, 32.0, 26.0, 22.0, 23.0, 15.0, 16.0, 16.0, 15.0, 15.0, 10.0, 9.0, 2.0, 4.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.855472564697266, -27.86359405517578, -26.871715545654297, -25.879837036132812, -24.887958526611328, -23.896080017089844, -22.90420150756836, -21.912322998046875, -20.92044448852539, -19.928565979003906, -18.936687469482422, -17.944808959960938, -16.952930450439453, -15.961051940917969, -14.969173431396484, -13.977294921875, -12.985416412353516, -11.993537902832031, -11.001659393310547, -10.009780883789062, -9.017902374267578, -8.026023864746094, -7.034145355224609, -6.042266845703125, -5.050388336181641, -4.058509826660156, -3.066631317138672, -2.0747528076171875, -1.0828742980957031, -0.09099578857421875, 0.9008827209472656, 1.89276123046875, 2.8846397399902344, 3.8765182495117188, 4.868396759033203, 5.8602752685546875, 6.852153778076172, 7.844032287597656, 8.83591079711914, 9.827789306640625, 10.81966781616211, 11.811546325683594, 12.803424835205078, 13.795303344726562, 14.787181854248047, 15.779060363769531, 16.770938873291016, 17.7628173828125, 18.754695892333984, 19.74657440185547, 20.738452911376953, 21.730331420898438, 22.722209930419922, 23.714088439941406, 24.70596694946289, 25.697845458984375, 26.68972396850586, 27.681602478027344, 28.673480987548828, 29.665359497070312, 30.657238006591797, 31.64911651611328, 32.640995025634766, 33.63287353515625, 34.624752044677734]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 23.0, 26.0, 38.0, 72.0, 70.0, 120.0, 164.0, 244.0, 365.0, 534.0, 786.0, 1239.0, 2012.0, 3753.0, 7744.0, 19971.0, 69384.0, 464456.0, 380759.0, 61780.0, 18404.0, 7274.0, 3768.0, 2028.0, 1201.0, 794.0, 520.0, 308.0, 228.0, 141.0, 95.0, 72.0, 36.0, 23.0, 26.0, 7.0, 8.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.6171875, -14.1124267578125, -13.607666015625, -13.1029052734375, -12.59814453125, -12.0933837890625, -11.588623046875, -11.0838623046875, -10.5791015625, -10.0743408203125, -9.569580078125, -9.0648193359375, -8.56005859375, -8.0552978515625, -7.550537109375, -7.0457763671875, -6.541015625, -6.0362548828125, -5.531494140625, -5.0267333984375, -4.52197265625, -4.0172119140625, -3.512451171875, -3.0076904296875, -2.5029296875, -1.9981689453125, -1.493408203125, -0.9886474609375, -0.48388671875, 0.0208740234375, 0.525634765625, 1.0303955078125, 1.53515625, 2.0399169921875, 2.544677734375, 3.0494384765625, 3.55419921875, 4.0589599609375, 4.563720703125, 5.0684814453125, 5.5732421875, 6.0780029296875, 6.582763671875, 7.0875244140625, 7.59228515625, 8.0970458984375, 8.601806640625, 9.1065673828125, 9.611328125, 10.1160888671875, 10.620849609375, 11.1256103515625, 11.63037109375, 12.1351318359375, 12.639892578125, 13.1446533203125, 13.6494140625, 14.1541748046875, 14.658935546875, 15.1636962890625, 15.66845703125, 16.1732177734375, 16.677978515625, 17.1827392578125, 17.6875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 12.0, 23.0, 43.0, 72.0, 93.0, 117.0, 128.0, 131.0, 124.0, 66.0, 55.0, 37.0, 27.0, 17.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.073486328125, -3.90869140625, -3.743896484375, -3.5791015625, -3.414306640625, -3.24951171875, -3.084716796875, -2.919921875, -2.755126953125, -2.59033203125, -2.425537109375, -2.2607421875, -2.095947265625, -1.93115234375, -1.766357421875, -1.6015625, -1.436767578125, -1.27197265625, -1.107177734375, -0.9423828125, -0.777587890625, -0.61279296875, -0.447998046875, -0.283203125, -0.118408203125, 0.04638671875, 0.211181640625, 0.3759765625, 0.540771484375, 0.70556640625, 0.870361328125, 1.03515625, 1.199951171875, 1.36474609375, 1.529541015625, 1.6943359375, 1.859130859375, 2.02392578125, 2.188720703125, 2.353515625, 2.518310546875, 2.68310546875, 2.847900390625, 3.0126953125, 3.177490234375, 3.34228515625, 3.507080078125, 3.671875, 3.836669921875, 4.00146484375, 4.166259765625, 4.3310546875, 4.495849609375, 4.66064453125, 4.825439453125, 4.990234375, 5.155029296875, 5.31982421875, 5.484619140625, 5.6494140625, 5.814208984375, 5.97900390625, 6.143798828125, 6.30859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 6.0, 7.0, 8.0, 24.0, 38.0, 69.0, 73.0, 131.0, 176.0, 299.0, 517.0, 799.0, 1344.0, 2374.0, 4005.0, 6966.0, 13019.0, 25641.0, 54330.0, 136180.0, 445886.0, 210882.0, 74490.0, 33743.0, 16673.0, 8854.0, 4968.0, 2784.0, 1644.0, 968.0, 606.0, 372.0, 225.0, 146.0, 98.0, 62.0, 47.0, 24.0, 21.0, 11.0, 8.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7884521484375, -12.397216796875, -12.0059814453125, -11.61474609375, -11.2235107421875, -10.832275390625, -10.4410400390625, -10.0498046875, -9.6585693359375, -9.267333984375, -8.8760986328125, -8.48486328125, -8.0936279296875, -7.702392578125, -7.3111572265625, -6.919921875, -6.5286865234375, -6.137451171875, -5.7462158203125, -5.35498046875, -4.9637451171875, -4.572509765625, -4.1812744140625, -3.7900390625, -3.3988037109375, -3.007568359375, -2.6163330078125, -2.22509765625, -1.8338623046875, -1.442626953125, -1.0513916015625, -0.66015625, -0.2689208984375, 0.122314453125, 0.5135498046875, 0.90478515625, 1.2960205078125, 1.687255859375, 2.0784912109375, 2.4697265625, 2.8609619140625, 3.252197265625, 3.6434326171875, 4.03466796875, 4.4259033203125, 4.817138671875, 5.2083740234375, 5.599609375, 5.9908447265625, 6.382080078125, 6.7733154296875, 7.16455078125, 7.5557861328125, 7.947021484375, 8.3382568359375, 8.7294921875, 9.1207275390625, 9.511962890625, 9.9031982421875, 10.29443359375, 10.6856689453125, 11.076904296875, 11.4681396484375, 11.859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 8.0, 13.0, 12.0, 15.0, 14.0, 16.0, 19.0, 24.0, 19.0, 27.0, 32.0, 26.0, 46.0, 27.0, 44.0, 32.0, 42.0, 40.0, 46.0, 42.0, 48.0, 39.0, 34.0, 36.0, 36.0, 34.0, 41.0, 36.0, 20.0, 25.0, 17.0, 14.0, 13.0, 4.0, 10.0, 11.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3984375, -12.9661865234375, -12.533935546875, -12.1016845703125, -11.66943359375, -11.2371826171875, -10.804931640625, -10.3726806640625, -9.9404296875, -9.5081787109375, -9.075927734375, -8.6436767578125, -8.21142578125, -7.7791748046875, -7.346923828125, -6.9146728515625, -6.482421875, -6.0501708984375, -5.617919921875, -5.1856689453125, -4.75341796875, -4.3211669921875, -3.888916015625, -3.4566650390625, -3.0244140625, -2.5921630859375, -2.159912109375, -1.7276611328125, -1.29541015625, -0.8631591796875, -0.430908203125, 0.0013427734375, 0.43359375, 0.8658447265625, 1.298095703125, 1.7303466796875, 2.16259765625, 2.5948486328125, 3.027099609375, 3.4593505859375, 3.8916015625, 4.3238525390625, 4.756103515625, 5.1883544921875, 5.62060546875, 6.0528564453125, 6.485107421875, 6.9173583984375, 7.349609375, 7.7818603515625, 8.214111328125, 8.6463623046875, 9.07861328125, 9.5108642578125, 9.943115234375, 10.3753662109375, 10.8076171875, 11.2398681640625, 11.672119140625, 12.1043701171875, 12.53662109375, 12.9688720703125, 13.401123046875, 13.8333740234375, 14.265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 6.0, 18.0, 12.0, 14.0, 34.0, 35.0, 49.0, 81.0, 98.0, 166.0, 302.0, 476.0, 910.0, 1868.0, 4352.0, 10999.0, 34189.0, 160408.0, 599087.0, 177771.0, 37176.0, 11586.0, 4599.0, 1991.0, 975.0, 516.0, 277.0, 182.0, 97.0, 49.0, 54.0, 27.0, 33.0, 20.0, 15.0, 19.0, 10.0, 10.0, 3.0, 6.0, 1.0, 3.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-11.28125, -10.9344482421875, -10.587646484375, -10.2408447265625, -9.89404296875, -9.5472412109375, -9.200439453125, -8.8536376953125, -8.5068359375, -8.1600341796875, -7.813232421875, -7.4664306640625, -7.11962890625, -6.7728271484375, -6.426025390625, -6.0792236328125, -5.732421875, -5.3856201171875, -5.038818359375, -4.6920166015625, -4.34521484375, -3.9984130859375, -3.651611328125, -3.3048095703125, -2.9580078125, -2.6112060546875, -2.264404296875, -1.9176025390625, -1.57080078125, -1.2239990234375, -0.877197265625, -0.5303955078125, -0.18359375, 0.1632080078125, 0.510009765625, 0.8568115234375, 1.20361328125, 1.5504150390625, 1.897216796875, 2.2440185546875, 2.5908203125, 2.9376220703125, 3.284423828125, 3.6312255859375, 3.97802734375, 4.3248291015625, 4.671630859375, 5.0184326171875, 5.365234375, 5.7120361328125, 6.058837890625, 6.4056396484375, 6.75244140625, 7.0992431640625, 7.446044921875, 7.7928466796875, 8.1396484375, 8.4864501953125, 8.833251953125, 9.1800537109375, 9.52685546875, 9.8736572265625, 10.220458984375, 10.5672607421875, 10.9140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 14.0, 25.0, 34.0, 37.0, 60.0, 102.0, 92.0, 95.0, 84.0, 81.0, 81.0, 58.0, 51.0, 25.0, 25.0, 14.0, 13.0, 14.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007904917001724243, -0.0007598698139190674, -0.0007292479276657104, -0.0006986260414123535, -0.0006680041551589966, -0.0006373822689056396, -0.0006067603826522827, -0.0005761384963989258, -0.0005455166101455688, -0.0005148947238922119, -0.000484272837638855, -0.00045365095138549805, -0.0004230290651321411, -0.0003924071788787842, -0.00036178529262542725, -0.0003311634063720703, -0.0003005415201187134, -0.00026991963386535645, -0.0002392977476119995, -0.00020867586135864258, -0.00017805397510528564, -0.0001474320888519287, -0.00011681020259857178, -8.618831634521484e-05, -5.556643009185791e-05, -2.4944543838500977e-05, 5.677342414855957e-06, 3.629922866821289e-05, 6.692111492156982e-05, 9.754300117492676e-05, 0.0001281648874282837, 0.00015878677368164062, 0.00018940865993499756, 0.0002200305461883545, 0.0002506524324417114, 0.00028127431869506836, 0.0003118962049484253, 0.0003425180912017822, 0.00037313997745513916, 0.0004037618637084961, 0.00043438374996185303, 0.00046500563621520996, 0.0004956275224685669, 0.0005262494087219238, 0.0005568712949752808, 0.0005874931812286377, 0.0006181150674819946, 0.0006487369537353516, 0.0006793588399887085, 0.0007099807262420654, 0.0007406026124954224, 0.0007712244987487793, 0.0008018463850021362, 0.0008324682712554932, 0.0008630901575088501, 0.000893712043762207, 0.000924333930015564, 0.0009549558162689209, 0.0009855777025222778, 0.0010161995887756348, 0.0010468214750289917, 0.0010774433612823486, 0.0011080652475357056, 0.0011386871337890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 5.0, 9.0, 12.0, 29.0, 40.0, 52.0, 83.0, 114.0, 207.0, 317.0, 475.0, 715.0, 1187.0, 2171.0, 4111.0, 8467.0, 18944.0, 47906.0, 145887.0, 435294.0, 253623.0, 76643.0, 27942.0, 11700.0, 5567.0, 2862.0, 1634.0, 940.0, 548.0, 372.0, 223.0, 128.0, 92.0, 80.0, 48.0, 44.0, 28.0, 9.0, 13.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7713623046875, -6.527099609375, -6.2828369140625, -6.03857421875, -5.7943115234375, -5.550048828125, -5.3057861328125, -5.0615234375, -4.8172607421875, -4.572998046875, -4.3287353515625, -4.08447265625, -3.8402099609375, -3.595947265625, -3.3516845703125, -3.107421875, -2.8631591796875, -2.618896484375, -2.3746337890625, -2.13037109375, -1.8861083984375, -1.641845703125, -1.3975830078125, -1.1533203125, -0.9090576171875, -0.664794921875, -0.4205322265625, -0.17626953125, 0.0679931640625, 0.312255859375, 0.5565185546875, 0.80078125, 1.0450439453125, 1.289306640625, 1.5335693359375, 1.77783203125, 2.0220947265625, 2.266357421875, 2.5106201171875, 2.7548828125, 2.9991455078125, 3.243408203125, 3.4876708984375, 3.73193359375, 3.9761962890625, 4.220458984375, 4.4647216796875, 4.708984375, 4.9532470703125, 5.197509765625, 5.4417724609375, 5.68603515625, 5.9302978515625, 6.174560546875, 6.4188232421875, 6.6630859375, 6.9073486328125, 7.151611328125, 7.3958740234375, 7.64013671875, 7.8843994140625, 8.128662109375, 8.3729248046875, 8.6171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 13.0, 12.0, 23.0, 15.0, 21.0, 28.0, 30.0, 38.0, 47.0, 45.0, 51.0, 54.0, 62.0, 66.0, 72.0, 59.0, 69.0, 39.0, 49.0, 33.0, 30.0, 21.0, 20.0, 14.0, 14.0, 15.0, 8.0, 8.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.43865966796875, -5.2640380859375, -5.08941650390625, -4.914794921875, -4.74017333984375, -4.5655517578125, -4.39093017578125, -4.21630859375, -4.04168701171875, -3.8670654296875, -3.69244384765625, -3.517822265625, -3.34320068359375, -3.1685791015625, -2.99395751953125, -2.8193359375, -2.64471435546875, -2.4700927734375, -2.29547119140625, -2.120849609375, -1.94622802734375, -1.7716064453125, -1.59698486328125, -1.42236328125, -1.24774169921875, -1.0731201171875, -0.89849853515625, -0.723876953125, -0.54925537109375, -0.3746337890625, -0.20001220703125, -0.025390625, 0.14923095703125, 0.3238525390625, 0.49847412109375, 0.673095703125, 0.84771728515625, 1.0223388671875, 1.19696044921875, 1.37158203125, 1.54620361328125, 1.7208251953125, 1.89544677734375, 2.070068359375, 2.24468994140625, 2.4193115234375, 2.59393310546875, 2.7685546875, 2.94317626953125, 3.1177978515625, 3.29241943359375, 3.467041015625, 3.64166259765625, 3.8162841796875, 3.99090576171875, 4.16552734375, 4.34014892578125, 4.5147705078125, 4.68939208984375, 4.864013671875, 5.03863525390625, 5.2132568359375, 5.38787841796875, 5.5625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 14.0, 33.0, 45.0, 99.0, 250.0, 296.0, 111.0, 68.0, 34.0, 16.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2933654785156, -251.33868408203125, -244.3839874267578, -237.42930603027344, -230.47462463378906, -223.51992797851562, -216.56524658203125, -209.61056518554688, -202.6558837890625, -195.70120239257812, -188.7465057373047, -181.7918243408203, -174.83714294433594, -167.8824462890625, -160.92776489257812, -153.97308349609375, -147.0183868408203, -140.06370544433594, -133.1090087890625, -126.15432739257812, -119.19964599609375, -112.24495697021484, -105.29026794433594, -98.33558654785156, -91.38089752197266, -84.42620849609375, -77.47152709960938, -70.51683807373047, -63.56215286254883, -56.60746765136719, -49.65277862548828, -42.69809341430664, -35.743408203125, -28.78872299194336, -21.834035873413086, -14.879348754882812, -7.924663543701172, -0.9699783325195312, 5.984710693359375, 12.939395904541016, 19.894081115722656, 26.848766326904297, 33.80345153808594, 40.758140563964844, 47.712825775146484, 54.667510986328125, 61.62220001220703, 68.57688903808594, 75.53157043457031, 82.48625946044922, 89.4409408569336, 96.3956298828125, 103.35031127929688, 110.30500030517578, 117.25968933105469, 124.21437072753906, 131.1690673828125, 138.12374877929688, 145.0784454345703, 152.0331268310547, 158.98780822753906, 165.9425048828125, 172.89718627929688, 179.85186767578125, 186.80654907226562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 11.0, 13.0, 7.0, 16.0, 23.0, 47.0, 88.0, 141.0, 179.0, 149.0, 118.0, 74.0, 36.0, 26.0, 12.0, 10.0, 7.0, 7.0, 1.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-230.62716674804688, -221.70372009277344, -212.78025817871094, -203.8568115234375, -194.933349609375, -186.00990295410156, -177.08645629882812, -168.16299438476562, -159.2395477294922, -150.31610107421875, -141.39263916015625, -132.4691925048828, -123.54573822021484, -114.62228393554688, -105.69883728027344, -96.77538299560547, -87.8519287109375, -78.92847442626953, -70.00502014160156, -61.081573486328125, -52.158119201660156, -43.23466491699219, -34.311214447021484, -25.38776397705078, -16.464309692382812, -7.540857315063477, 1.3825950622558594, 10.306047439575195, 19.22949981689453, 28.1529541015625, 37.0764045715332, 45.999855041503906, 54.92333984375, 63.84679412841797, 72.77024841308594, 81.69369506835938, 90.61714935302734, 99.54060363769531, 108.46405029296875, 117.38750457763672, 126.31095886230469, 135.23440551757812, 144.15786743164062, 153.08131408691406, 162.0047607421875, 170.92822265625, 179.85166931152344, 188.77511596679688, 197.69857788085938, 206.6220245361328, 215.5454864501953, 224.46893310546875, 233.39239501953125, 242.3158416748047, 251.23928833007812, 260.1627502441406, 269.086181640625, 278.0096435546875, 286.9330749511719, 295.8565368652344, 304.7799987792969, 313.70343017578125, 322.62689208984375, 331.55035400390625, 340.47381591796875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 6.0, 11.0, 18.0, 19.0, 49.0, 86.0, 174.0, 322.0, 701.0, 1379.0, 3540.0, 10439.0, 52685.0, 3781214.0, 307449.0, 26344.0, 6054.0, 2035.0, 799.0, 420.0, 209.0, 135.0, 68.0, 39.0, 26.0, 17.0, 9.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -62.140625, -59.90625, -57.671875, -55.4375, -53.203125, -50.96875, -48.734375, -46.5, -44.265625, -42.03125, -39.796875, -37.5625, -35.328125, -33.09375, -30.859375, -28.625, -26.390625, -24.15625, -21.921875, -19.6875, -17.453125, -15.21875, -12.984375, -10.75, -8.515625, -6.28125, -4.046875, -1.8125, 0.421875, 2.65625, 4.890625, 7.125, 9.359375, 11.59375, 13.828125, 16.0625, 18.296875, 20.53125, 22.765625, 25.0, 27.234375, 29.46875, 31.703125, 33.9375, 36.171875, 38.40625, 40.640625, 42.875, 45.109375, 47.34375, 49.578125, 51.8125, 54.046875, 56.28125, 58.515625, 60.75, 62.984375, 65.21875, 67.453125, 69.6875, 71.921875, 74.15625, 76.390625, 78.625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 12.0, 9.0, 7.0, 11.0, 17.0, 26.0, 37.0, 59.0, 65.0, 87.0, 94.0, 105.0, 120.0, 85.0, 66.0, 44.0, 44.0, 29.0, 20.0, 21.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0390625, -2.90386962890625, -2.7686767578125, -2.63348388671875, -2.498291015625, -2.36309814453125, -2.2279052734375, -2.09271240234375, -1.95751953125, -1.82232666015625, -1.6871337890625, -1.55194091796875, -1.416748046875, -1.28155517578125, -1.1463623046875, -1.01116943359375, -0.8759765625, -0.74078369140625, -0.6055908203125, -0.47039794921875, -0.335205078125, -0.20001220703125, -0.0648193359375, 0.07037353515625, 0.20556640625, 0.34075927734375, 0.4759521484375, 0.61114501953125, 0.746337890625, 0.88153076171875, 1.0167236328125, 1.15191650390625, 1.287109375, 1.42230224609375, 1.5574951171875, 1.69268798828125, 1.827880859375, 1.96307373046875, 2.0982666015625, 2.23345947265625, 2.36865234375, 2.50384521484375, 2.6390380859375, 2.77423095703125, 2.909423828125, 3.04461669921875, 3.1798095703125, 3.31500244140625, 3.4501953125, 3.58538818359375, 3.7205810546875, 3.85577392578125, 3.990966796875, 4.12615966796875, 4.2613525390625, 4.39654541015625, 4.53173828125, 4.66693115234375, 4.8021240234375, 4.93731689453125, 5.072509765625, 5.20770263671875, 5.3428955078125, 5.47808837890625, 5.61328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 16.0, 16.0, 25.0, 32.0, 50.0, 71.0, 93.0, 154.0, 246.0, 367.0, 639.0, 1029.0, 1862.0, 3334.0, 6262.0, 12954.0, 29057.0, 78145.0, 317399.0, 3295717.0, 315678.0, 76740.0, 28324.0, 12508.0, 6061.0, 3207.0, 1726.0, 942.0, 548.0, 376.0, 220.0, 134.0, 93.0, 80.0, 52.0, 33.0, 25.0, 18.0, 9.0, 11.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.0625, -31.075927734375, -30.08935546875, -29.102783203125, -28.1162109375, -27.129638671875, -26.14306640625, -25.156494140625, -24.169921875, -23.183349609375, -22.19677734375, -21.210205078125, -20.2236328125, -19.237060546875, -18.25048828125, -17.263916015625, -16.27734375, -15.290771484375, -14.30419921875, -13.317626953125, -12.3310546875, -11.344482421875, -10.35791015625, -9.371337890625, -8.384765625, -7.398193359375, -6.41162109375, -5.425048828125, -4.4384765625, -3.451904296875, -2.46533203125, -1.478759765625, -0.4921875, 0.494384765625, 1.48095703125, 2.467529296875, 3.4541015625, 4.440673828125, 5.42724609375, 6.413818359375, 7.400390625, 8.386962890625, 9.37353515625, 10.360107421875, 11.3466796875, 12.333251953125, 13.31982421875, 14.306396484375, 15.29296875, 16.279541015625, 17.26611328125, 18.252685546875, 19.2392578125, 20.225830078125, 21.21240234375, 22.198974609375, 23.185546875, 24.172119140625, 25.15869140625, 26.145263671875, 27.1318359375, 28.118408203125, 29.10498046875, 30.091552734375, 31.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 5.0, 12.0, 16.0, 9.0, 18.0, 20.0, 23.0, 34.0, 50.0, 55.0, 83.0, 147.0, 254.0, 460.0, 2035.0, 326.0, 162.0, 101.0, 59.0, 65.0, 42.0, 18.0, 19.0, 9.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.78717041015625, -4.5977783203125, -4.40838623046875, -4.218994140625, -4.02960205078125, -3.8402099609375, -3.65081787109375, -3.46142578125, -3.27203369140625, -3.0826416015625, -2.89324951171875, -2.703857421875, -2.51446533203125, -2.3250732421875, -2.13568115234375, -1.9462890625, -1.75689697265625, -1.5675048828125, -1.37811279296875, -1.188720703125, -0.99932861328125, -0.8099365234375, -0.62054443359375, -0.43115234375, -0.24176025390625, -0.0523681640625, 0.13702392578125, 0.326416015625, 0.51580810546875, 0.7052001953125, 0.89459228515625, 1.083984375, 1.27337646484375, 1.4627685546875, 1.65216064453125, 1.841552734375, 2.03094482421875, 2.2203369140625, 2.40972900390625, 2.59912109375, 2.78851318359375, 2.9779052734375, 3.16729736328125, 3.356689453125, 3.54608154296875, 3.7354736328125, 3.92486572265625, 4.1142578125, 4.30364990234375, 4.4930419921875, 4.68243408203125, 4.871826171875, 5.06121826171875, 5.2506103515625, 5.44000244140625, 5.62939453125, 5.81878662109375, 6.0081787109375, 6.19757080078125, 6.386962890625, 6.57635498046875, 6.7657470703125, 6.95513916015625, 7.14453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 11.0, 3.0, 8.0, 17.0, 10.0, 28.0, 63.0, 63.0, 130.0, 172.0, 161.0, 134.0, 64.0, 64.0, 25.0, 17.0, 11.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.96562194824219, -61.54591751098633, -60.1262092590332, -58.706504821777344, -57.28679656982422, -55.86709213256836, -54.4473876953125, -53.027679443359375, -51.607975006103516, -50.188270568847656, -48.76856231689453, -47.34885787963867, -45.92915344238281, -44.50944519042969, -43.08974075317383, -41.67003631591797, -40.250328063964844, -38.830623626708984, -37.41091537475586, -35.9912109375, -34.571502685546875, -33.151798248291016, -31.732093811035156, -30.312387466430664, -28.892681121826172, -27.47297477722168, -26.053268432617188, -24.633563995361328, -23.213857650756836, -21.794151306152344, -20.374446868896484, -18.954740524291992, -17.5350341796875, -16.115327835083008, -14.695622444152832, -13.275917053222656, -11.856210708618164, -10.436504364013672, -9.016798973083496, -7.59709358215332, -6.177387237548828, -4.757681369781494, -3.33797550201416, -1.9182696342468262, -0.4985637664794922, 0.9211421012878418, 2.340847969055176, 3.7605533599853516, 5.180259704589844, 6.599965572357178, 8.019671440124512, 9.439376831054688, 10.85908317565918, 12.278789520263672, 13.698494911193848, 15.118200302124023, 16.537906646728516, 17.957612991333008, 19.3773193359375, 20.79702377319336, 22.21673011779785, 23.636436462402344, 25.056140899658203, 26.475847244262695, 27.895553588867188]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 8.0, 15.0, 14.0, 20.0, 25.0, 31.0, 37.0, 42.0, 57.0, 51.0, 57.0, 70.0, 60.0, 55.0, 63.0, 52.0, 40.0, 61.0, 44.0, 40.0, 34.0, 16.0, 19.0, 14.0, 10.0, 14.0, 6.0, 3.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37102699279785, -28.486143112182617, -27.601259231567383, -26.71637535095215, -25.83148956298828, -24.946605682373047, -24.061721801757812, -23.176837921142578, -22.291954040527344, -21.40707015991211, -20.522186279296875, -19.63730239868164, -18.752418518066406, -17.867534637451172, -16.982648849487305, -16.09776496887207, -15.212881088256836, -14.327997207641602, -13.443113327026367, -12.558228492736816, -11.673344612121582, -10.788460731506348, -9.903575897216797, -9.018692016601562, -8.133808135986328, -7.248924255371094, -6.364039897918701, -5.479155540466309, -4.594271659851074, -3.70938777923584, -2.8245034217834473, -1.9396190643310547, -1.0547332763671875, -0.16984915733337402, 0.7150349617004395, 1.599919080734253, 2.4848031997680664, 3.369687080383301, 4.254571437835693, 5.139455795288086, 6.02433967590332, 6.909223556518555, 7.794107913970947, 8.67899227142334, 9.563876152038574, 10.448760032653809, 11.33364486694336, 12.218528747558594, 13.103412628173828, 13.988296508789062, 14.873180389404297, 15.758065223693848, 16.642948150634766, 17.52783203125, 18.412717819213867, 19.2976016998291, 20.182485580444336, 21.06736946105957, 21.952253341674805, 22.83713722229004, 23.722023010253906, 24.60690689086914, 25.491790771484375, 26.37667465209961, 27.261558532714844]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 6.0, 15.0, 31.0, 25.0, 60.0, 85.0, 136.0, 261.0, 494.0, 1091.0, 2517.0, 5991.0, 19358.0, 84212.0, 499382.0, 350720.0, 60493.0, 14823.0, 4825.0, 2057.0, 887.0, 463.0, 229.0, 113.0, 82.0, 56.0, 35.0, 30.0, 27.0, 10.0, 9.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.8232421875, -41.521484375, -40.2197265625, -38.91796875, -37.6162109375, -36.314453125, -35.0126953125, -33.7109375, -32.4091796875, -31.107421875, -29.8056640625, -28.50390625, -27.2021484375, -25.900390625, -24.5986328125, -23.296875, -21.9951171875, -20.693359375, -19.3916015625, -18.08984375, -16.7880859375, -15.486328125, -14.1845703125, -12.8828125, -11.5810546875, -10.279296875, -8.9775390625, -7.67578125, -6.3740234375, -5.072265625, -3.7705078125, -2.46875, -1.1669921875, 0.134765625, 1.4365234375, 2.73828125, 4.0400390625, 5.341796875, 6.6435546875, 7.9453125, 9.2470703125, 10.548828125, 11.8505859375, 13.15234375, 14.4541015625, 15.755859375, 17.0576171875, 18.359375, 19.6611328125, 20.962890625, 22.2646484375, 23.56640625, 24.8681640625, 26.169921875, 27.4716796875, 28.7734375, 30.0751953125, 31.376953125, 32.6787109375, 33.98046875, 35.2822265625, 36.583984375, 37.8857421875, 39.1875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 1.0, 2.0, 4.0, 10.0, 11.0, 19.0, 36.0, 45.0, 59.0, 79.0, 79.0, 75.0, 106.0, 102.0, 94.0, 61.0, 62.0, 51.0, 44.0, 10.0, 19.0, 7.0, 8.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.13232421875, -2.9873046875, -2.84228515625, -2.697265625, -2.55224609375, -2.4072265625, -2.26220703125, -2.1171875, -1.97216796875, -1.8271484375, -1.68212890625, -1.537109375, -1.39208984375, -1.2470703125, -1.10205078125, -0.95703125, -0.81201171875, -0.6669921875, -0.52197265625, -0.376953125, -0.23193359375, -0.0869140625, 0.05810546875, 0.203125, 0.34814453125, 0.4931640625, 0.63818359375, 0.783203125, 0.92822265625, 1.0732421875, 1.21826171875, 1.36328125, 1.50830078125, 1.6533203125, 1.79833984375, 1.943359375, 2.08837890625, 2.2333984375, 2.37841796875, 2.5234375, 2.66845703125, 2.8134765625, 2.95849609375, 3.103515625, 3.24853515625, 3.3935546875, 3.53857421875, 3.68359375, 3.82861328125, 3.9736328125, 4.11865234375, 4.263671875, 4.40869140625, 4.5537109375, 4.69873046875, 4.84375, 4.98876953125, 5.1337890625, 5.27880859375, 5.423828125, 5.56884765625, 5.7138671875, 5.85888671875, 6.00390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 32.0, 34.0, 53.0, 79.0, 131.0, 216.0, 355.0, 672.0, 1226.0, 2699.0, 6851.0, 18988.0, 68136.0, 329450.0, 475961.0, 101930.0, 26267.0, 8582.0, 3413.0, 1533.0, 735.0, 437.0, 244.0, 158.0, 108.0, 54.0, 56.0, 32.0, 29.0, 14.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.783935546875, -21.97412109375, -21.164306640625, -20.3544921875, -19.544677734375, -18.73486328125, -17.925048828125, -17.115234375, -16.305419921875, -15.49560546875, -14.685791015625, -13.8759765625, -13.066162109375, -12.25634765625, -11.446533203125, -10.63671875, -9.826904296875, -9.01708984375, -8.207275390625, -7.3974609375, -6.587646484375, -5.77783203125, -4.968017578125, -4.158203125, -3.348388671875, -2.53857421875, -1.728759765625, -0.9189453125, -0.109130859375, 0.70068359375, 1.510498046875, 2.3203125, 3.130126953125, 3.93994140625, 4.749755859375, 5.5595703125, 6.369384765625, 7.17919921875, 7.989013671875, 8.798828125, 9.608642578125, 10.41845703125, 11.228271484375, 12.0380859375, 12.847900390625, 13.65771484375, 14.467529296875, 15.27734375, 16.087158203125, 16.89697265625, 17.706787109375, 18.5166015625, 19.326416015625, 20.13623046875, 20.946044921875, 21.755859375, 22.565673828125, 23.37548828125, 24.185302734375, 24.9951171875, 25.804931640625, 26.61474609375, 27.424560546875, 28.234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 9.0, 6.0, 17.0, 29.0, 21.0, 27.0, 40.0, 43.0, 55.0, 58.0, 50.0, 72.0, 68.0, 54.0, 56.0, 59.0, 55.0, 48.0, 45.0, 40.0, 30.0, 27.0, 17.0, 14.0, 8.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.3927001953125, -13.910400390625, -13.4281005859375, -12.94580078125, -12.4635009765625, -11.981201171875, -11.4989013671875, -11.0166015625, -10.5343017578125, -10.052001953125, -9.5697021484375, -9.08740234375, -8.6051025390625, -8.122802734375, -7.6405029296875, -7.158203125, -6.6759033203125, -6.193603515625, -5.7113037109375, -5.22900390625, -4.7467041015625, -4.264404296875, -3.7821044921875, -3.2998046875, -2.8175048828125, -2.335205078125, -1.8529052734375, -1.37060546875, -0.8883056640625, -0.406005859375, 0.0762939453125, 0.55859375, 1.0408935546875, 1.523193359375, 2.0054931640625, 2.48779296875, 2.9700927734375, 3.452392578125, 3.9346923828125, 4.4169921875, 4.8992919921875, 5.381591796875, 5.8638916015625, 6.34619140625, 6.8284912109375, 7.310791015625, 7.7930908203125, 8.275390625, 8.7576904296875, 9.239990234375, 9.7222900390625, 10.20458984375, 10.6868896484375, 11.169189453125, 11.6514892578125, 12.1337890625, 12.6160888671875, 13.098388671875, 13.5806884765625, 14.06298828125, 14.5452880859375, 15.027587890625, 15.5098876953125, 15.9921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 7.0, 6.0, 9.0, 14.0, 14.0, 16.0, 42.0, 60.0, 57.0, 106.0, 148.0, 228.0, 374.0, 628.0, 1068.0, 1938.0, 3723.0, 7858.0, 17829.0, 48304.0, 165256.0, 477794.0, 221199.0, 61177.0, 21799.0, 9187.0, 4436.0, 2205.0, 1213.0, 678.0, 364.0, 276.0, 183.0, 100.0, 68.0, 41.0, 45.0, 26.0, 17.0, 17.0, 12.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0], "bins": [-27.078125, -26.317626953125, -25.55712890625, -24.796630859375, -24.0361328125, -23.275634765625, -22.51513671875, -21.754638671875, -20.994140625, -20.233642578125, -19.47314453125, -18.712646484375, -17.9521484375, -17.191650390625, -16.43115234375, -15.670654296875, -14.91015625, -14.149658203125, -13.38916015625, -12.628662109375, -11.8681640625, -11.107666015625, -10.34716796875, -9.586669921875, -8.826171875, -8.065673828125, -7.30517578125, -6.544677734375, -5.7841796875, -5.023681640625, -4.26318359375, -3.502685546875, -2.7421875, -1.981689453125, -1.22119140625, -0.460693359375, 0.2998046875, 1.060302734375, 1.82080078125, 2.581298828125, 3.341796875, 4.102294921875, 4.86279296875, 5.623291015625, 6.3837890625, 7.144287109375, 7.90478515625, 8.665283203125, 9.42578125, 10.186279296875, 10.94677734375, 11.707275390625, 12.4677734375, 13.228271484375, 13.98876953125, 14.749267578125, 15.509765625, 16.270263671875, 17.03076171875, 17.791259765625, 18.5517578125, 19.312255859375, 20.07275390625, 20.833251953125, 21.59375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 11.0, 10.0, 16.0, 31.0, 36.0, 62.0, 99.0, 157.0, 171.0, 125.0, 87.0, 64.0, 52.0, 23.0, 12.0, 13.0, 9.0, 1.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003108978271484375, -0.0030025839805603027, -0.0028961896896362305, -0.002789795398712158, -0.002683401107788086, -0.0025770068168640137, -0.0024706125259399414, -0.002364218235015869, -0.002257823944091797, -0.0021514296531677246, -0.0020450353622436523, -0.00193864107131958, -0.0018322467803955078, -0.0017258524894714355, -0.0016194581985473633, -0.001513063907623291, -0.0014066696166992188, -0.0013002753257751465, -0.0011938810348510742, -0.001087486743927002, -0.0009810924530029297, -0.0008746981620788574, -0.0007683038711547852, -0.0006619095802307129, -0.0005555152893066406, -0.00044912099838256836, -0.0003427267074584961, -0.00023633241653442383, -0.00012993812561035156, -2.3543834686279297e-05, 8.285045623779297e-05, 0.00018924474716186523, 0.0002956390380859375, 0.00040203332901000977, 0.000508427619934082, 0.0006148219108581543, 0.0007212162017822266, 0.0008276104927062988, 0.0009340047836303711, 0.0010403990745544434, 0.0011467933654785156, 0.0012531876564025879, 0.0013595819473266602, 0.0014659762382507324, 0.0015723705291748047, 0.001678764820098877, 0.0017851591110229492, 0.0018915534019470215, 0.0019979476928710938, 0.002104341983795166, 0.0022107362747192383, 0.0023171305656433105, 0.002423524856567383, 0.002529919147491455, 0.0026363134384155273, 0.0027427077293395996, 0.002849102020263672, 0.002955496311187744, 0.0030618906021118164, 0.0031682848930358887, 0.003274679183959961, 0.003381073474884033, 0.0034874677658081055, 0.0035938620567321777, 0.00370025634765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 8.0, 18.0, 6.0, 23.0, 23.0, 45.0, 77.0, 101.0, 157.0, 259.0, 393.0, 697.0, 1210.0, 2430.0, 4856.0, 11128.0, 29000.0, 96094.0, 403275.0, 365593.0, 86136.0, 26745.0, 10379.0, 4664.0, 2282.0, 1201.0, 671.0, 406.0, 225.0, 138.0, 92.0, 67.0, 47.0, 27.0, 20.0, 15.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -23.28955078125, -22.4853515625, -21.68115234375, -20.876953125, -20.07275390625, -19.2685546875, -18.46435546875, -17.66015625, -16.85595703125, -16.0517578125, -15.24755859375, -14.443359375, -13.63916015625, -12.8349609375, -12.03076171875, -11.2265625, -10.42236328125, -9.6181640625, -8.81396484375, -8.009765625, -7.20556640625, -6.4013671875, -5.59716796875, -4.79296875, -3.98876953125, -3.1845703125, -2.38037109375, -1.576171875, -0.77197265625, 0.0322265625, 0.83642578125, 1.640625, 2.44482421875, 3.2490234375, 4.05322265625, 4.857421875, 5.66162109375, 6.4658203125, 7.27001953125, 8.07421875, 8.87841796875, 9.6826171875, 10.48681640625, 11.291015625, 12.09521484375, 12.8994140625, 13.70361328125, 14.5078125, 15.31201171875, 16.1162109375, 16.92041015625, 17.724609375, 18.52880859375, 19.3330078125, 20.13720703125, 20.94140625, 21.74560546875, 22.5498046875, 23.35400390625, 24.158203125, 24.96240234375, 25.7666015625, 26.57080078125, 27.375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 11.0, 19.0, 20.0, 25.0, 25.0, 29.0, 38.0, 46.0, 57.0, 53.0, 66.0, 79.0, 69.0, 72.0, 53.0, 53.0, 43.0, 40.0, 33.0, 34.0, 16.0, 13.0, 14.0, 7.0, 12.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9234619140625, -10.518798828125, -10.1141357421875, -9.70947265625, -9.3048095703125, -8.900146484375, -8.4954833984375, -8.0908203125, -7.6861572265625, -7.281494140625, -6.8768310546875, -6.47216796875, -6.0675048828125, -5.662841796875, -5.2581787109375, -4.853515625, -4.4488525390625, -4.044189453125, -3.6395263671875, -3.23486328125, -2.8302001953125, -2.425537109375, -2.0208740234375, -1.6162109375, -1.2115478515625, -0.806884765625, -0.4022216796875, 0.00244140625, 0.4071044921875, 0.811767578125, 1.2164306640625, 1.62109375, 2.0257568359375, 2.430419921875, 2.8350830078125, 3.23974609375, 3.6444091796875, 4.049072265625, 4.4537353515625, 4.8583984375, 5.2630615234375, 5.667724609375, 6.0723876953125, 6.47705078125, 6.8817138671875, 7.286376953125, 7.6910400390625, 8.095703125, 8.5003662109375, 8.905029296875, 9.3096923828125, 9.71435546875, 10.1190185546875, 10.523681640625, 10.9283447265625, 11.3330078125, 11.7376708984375, 12.142333984375, 12.5469970703125, 12.95166015625, 13.3563232421875, 13.760986328125, 14.1656494140625, 14.5703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 35.0, 145.0, 359.0, 307.0, 78.0, 30.0, 24.0, 9.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.84410095214844, -149.30491638183594, -137.7657470703125, -126.2265625, -114.6873779296875, -103.148193359375, -91.60901641845703, -80.06983947753906, -68.53065490722656, -56.99147415161133, -45.452293395996094, -33.91311264038086, -22.373931884765625, -10.83475112915039, 0.7044296264648438, 12.243606567382812, 23.782791137695312, 35.32197189331055, 46.86115264892578, 58.400333404541016, 69.93951416015625, 81.47869873046875, 93.01787567138672, 104.55705261230469, 116.09623718261719, 127.63542175292969, 139.17459106445312, 150.71377563476562, 162.25296020507812, 173.79214477539062, 185.33132934570312, 196.87049865722656, 208.40966796875, 219.9488525390625, 231.488037109375, 243.02720642089844, 254.56639099121094, 266.1055603027344, 277.6447448730469, 289.1839294433594, 300.7231140136719, 312.2622985839844, 323.8014831542969, 335.3406677246094, 346.87982177734375, 358.41900634765625, 369.95819091796875, 381.49737548828125, 393.03656005859375, 404.57574462890625, 416.11492919921875, 427.65411376953125, 439.19329833984375, 450.7324523925781, 462.2716369628906, 473.8108215332031, 485.3500061035156, 496.8891906738281, 508.4283752441406, 519.967529296875, 531.5067138671875, 543.0458984375, 554.5850830078125, 566.124267578125, 577.6634521484375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 11.0, 16.0, 15.0, 25.0, 23.0, 29.0, 36.0, 33.0, 47.0, 64.0, 65.0, 67.0, 50.0, 58.0, 70.0, 60.0, 57.0, 56.0, 39.0, 34.0, 31.0, 14.0, 10.0, 12.0, 10.0, 7.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.30193328857422, -82.23118591308594, -79.16043853759766, -76.08969116210938, -73.01893615722656, -69.94818878173828, -66.87744140625, -63.80669403076172, -60.73594284057617, -57.66519546508789, -54.594444274902344, -51.52369689941406, -48.45294952392578, -45.382198333740234, -42.31145095825195, -39.240699768066406, -36.169952392578125, -33.099205017089844, -30.028453826904297, -26.957706451416016, -23.8869571685791, -20.816207885742188, -17.745460510253906, -14.674711227416992, -11.603961944580078, -8.533212661743164, -5.462464332580566, -2.3917160034179688, 0.6790332794189453, 3.7497825622558594, 6.820529937744141, 9.891279220581055, 12.962020874023438, 16.03277015686035, 19.103519439697266, 22.174266815185547, 25.24501609802246, 28.315765380859375, 31.386512756347656, 34.45726013183594, 37.528011322021484, 40.598758697509766, 43.66950988769531, 46.740257263183594, 49.811004638671875, 52.88175582885742, 55.9525032043457, 59.02325439453125, 62.09400177001953, 65.16474914550781, 68.2354965209961, 71.30624389648438, 74.37699890136719, 77.44774627685547, 80.51849365234375, 83.58924102783203, 86.65998840332031, 89.7307357788086, 92.80148315429688, 95.87223815917969, 98.94298553466797, 102.01373291015625, 105.08448028564453, 108.15522766113281, 111.22598266601562]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 0.0, 2.0, 6.0, 4.0, 19.0, 19.0, 23.0, 40.0, 64.0, 102.0, 142.0, 240.0, 429.0, 738.0, 1305.0, 2672.0, 6185.0, 15721.0, 51130.0, 270382.0, 3471573.0, 290656.0, 54248.0, 16697.0, 6283.0, 2704.0, 1230.0, 617.0, 404.0, 228.0, 136.0, 84.0, 56.0, 38.0, 39.0, 16.0, 17.0, 6.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-67.875, -66.01611328125, -64.1572265625, -62.29833984375, -60.439453125, -58.58056640625, -56.7216796875, -54.86279296875, -53.00390625, -51.14501953125, -49.2861328125, -47.42724609375, -45.568359375, -43.70947265625, -41.8505859375, -39.99169921875, -38.1328125, -36.27392578125, -34.4150390625, -32.55615234375, -30.697265625, -28.83837890625, -26.9794921875, -25.12060546875, -23.26171875, -21.40283203125, -19.5439453125, -17.68505859375, -15.826171875, -13.96728515625, -12.1083984375, -10.24951171875, -8.390625, -6.53173828125, -4.6728515625, -2.81396484375, -0.955078125, 0.90380859375, 2.7626953125, 4.62158203125, 6.48046875, 8.33935546875, 10.1982421875, 12.05712890625, 13.916015625, 15.77490234375, 17.6337890625, 19.49267578125, 21.3515625, 23.21044921875, 25.0693359375, 26.92822265625, 28.787109375, 30.64599609375, 32.5048828125, 34.36376953125, 36.22265625, 38.08154296875, 39.9404296875, 41.79931640625, 43.658203125, 45.51708984375, 47.3759765625, 49.23486328125, 51.09375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 7.0, 13.0, 12.0, 25.0, 29.0, 40.0, 46.0, 56.0, 56.0, 80.0, 85.0, 91.0, 89.0, 78.0, 57.0, 49.0, 36.0, 42.0, 30.0, 24.0, 13.0, 6.0, 9.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.97515869140625, -2.8526611328125, -2.73016357421875, -2.607666015625, -2.48516845703125, -2.3626708984375, -2.24017333984375, -2.11767578125, -1.99517822265625, -1.8726806640625, -1.75018310546875, -1.627685546875, -1.50518798828125, -1.3826904296875, -1.26019287109375, -1.1376953125, -1.01519775390625, -0.8927001953125, -0.77020263671875, -0.647705078125, -0.52520751953125, -0.4027099609375, -0.28021240234375, -0.15771484375, -0.03521728515625, 0.0872802734375, 0.20977783203125, 0.332275390625, 0.45477294921875, 0.5772705078125, 0.69976806640625, 0.822265625, 0.94476318359375, 1.0672607421875, 1.18975830078125, 1.312255859375, 1.43475341796875, 1.5572509765625, 1.67974853515625, 1.80224609375, 1.92474365234375, 2.0472412109375, 2.16973876953125, 2.292236328125, 2.41473388671875, 2.5372314453125, 2.65972900390625, 2.7822265625, 2.90472412109375, 3.0272216796875, 3.14971923828125, 3.272216796875, 3.39471435546875, 3.5172119140625, 3.63970947265625, 3.76220703125, 3.88470458984375, 4.0072021484375, 4.12969970703125, 4.252197265625, 4.37469482421875, 4.4971923828125, 4.61968994140625, 4.7421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 7.0, 15.0, 12.0, 25.0, 26.0, 43.0, 56.0, 85.0, 163.0, 265.0, 570.0, 1373.0, 3953.0, 14455.0, 82214.0, 1189914.0, 2766463.0, 109169.0, 17875.0, 4634.0, 1573.0, 612.0, 281.0, 153.0, 100.0, 56.0, 39.0, 28.0, 32.0, 16.0, 9.0, 9.0, 4.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.7470703125, -64.369140625, -61.9912109375, -59.61328125, -57.2353515625, -54.857421875, -52.4794921875, -50.1015625, -47.7236328125, -45.345703125, -42.9677734375, -40.58984375, -38.2119140625, -35.833984375, -33.4560546875, -31.078125, -28.7001953125, -26.322265625, -23.9443359375, -21.56640625, -19.1884765625, -16.810546875, -14.4326171875, -12.0546875, -9.6767578125, -7.298828125, -4.9208984375, -2.54296875, -0.1650390625, 2.212890625, 4.5908203125, 6.96875, 9.3466796875, 11.724609375, 14.1025390625, 16.48046875, 18.8583984375, 21.236328125, 23.6142578125, 25.9921875, 28.3701171875, 30.748046875, 33.1259765625, 35.50390625, 37.8818359375, 40.259765625, 42.6376953125, 45.015625, 47.3935546875, 49.771484375, 52.1494140625, 54.52734375, 56.9052734375, 59.283203125, 61.6611328125, 64.0390625, 66.4169921875, 68.794921875, 71.1728515625, 73.55078125, 75.9287109375, 78.306640625, 80.6845703125, 83.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 18.0, 13.0, 19.0, 18.0, 47.0, 51.0, 70.0, 88.0, 118.0, 173.0, 227.0, 354.0, 1095.0, 620.0, 298.0, 228.0, 168.0, 121.0, 72.0, 73.0, 39.0, 30.0, 17.0, 26.0, 13.0, 14.0, 8.0, 6.0, 7.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6561279296875, -6.433349609375, -6.2105712890625, -5.98779296875, -5.7650146484375, -5.542236328125, -5.3194580078125, -5.0966796875, -4.8739013671875, -4.651123046875, -4.4283447265625, -4.20556640625, -3.9827880859375, -3.760009765625, -3.5372314453125, -3.314453125, -3.0916748046875, -2.868896484375, -2.6461181640625, -2.42333984375, -2.2005615234375, -1.977783203125, -1.7550048828125, -1.5322265625, -1.3094482421875, -1.086669921875, -0.8638916015625, -0.64111328125, -0.4183349609375, -0.195556640625, 0.0272216796875, 0.25, 0.4727783203125, 0.695556640625, 0.9183349609375, 1.14111328125, 1.3638916015625, 1.586669921875, 1.8094482421875, 2.0322265625, 2.2550048828125, 2.477783203125, 2.7005615234375, 2.92333984375, 3.1461181640625, 3.368896484375, 3.5916748046875, 3.814453125, 4.0372314453125, 4.260009765625, 4.4827880859375, 4.70556640625, 4.9283447265625, 5.151123046875, 5.3739013671875, 5.5966796875, 5.8194580078125, 6.042236328125, 6.2650146484375, 6.48779296875, 6.7105712890625, 6.933349609375, 7.1561279296875, 7.37890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 10.0, 57.0, 165.0, 435.0, 245.0, 59.0, 26.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.42633056640625, -113.62159729003906, -107.8168716430664, -102.01214599609375, -96.20741271972656, -90.40267944335938, -84.59795379638672, -78.79322814941406, -72.98849487304688, -67.18376159667969, -61.37903594970703, -55.57430648803711, -49.76957702636719, -43.964847564697266, -38.160118103027344, -32.35538864135742, -26.5506591796875, -20.745929718017578, -14.941200256347656, -9.136470794677734, -3.3317413330078125, 2.4729881286621094, 8.277717590332031, 14.082447052001953, 19.887176513671875, 25.691905975341797, 31.49663543701172, 37.30136489868164, 43.10609436035156, 48.910823822021484, 54.715553283691406, 60.52028274536133, 66.32501220703125, 72.12974548339844, 77.9344711303711, 83.73919677734375, 89.54393005371094, 95.34866333007812, 101.15338897705078, 106.95811462402344, 112.76284790039062, 118.56758117675781, 124.37230682373047, 130.17703247070312, 135.9817657470703, 141.7864990234375, 147.59121704101562, 153.3959503173828, 159.20068359375, 165.0054168701172, 170.81015014648438, 176.6148681640625, 182.4196014404297, 188.22433471679688, 194.029052734375, 199.8337860107422, 205.63851928710938, 211.44325256347656, 217.24798583984375, 223.05270385742188, 228.85743713378906, 234.66217041015625, 240.46688842773438, 246.27162170410156, 252.07635498046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 10.0, 8.0, 14.0, 20.0, 20.0, 30.0, 17.0, 32.0, 34.0, 30.0, 48.0, 32.0, 40.0, 39.0, 41.0, 44.0, 46.0, 46.0, 57.0, 38.0, 37.0, 44.0, 27.0, 29.0, 21.0, 25.0, 20.0, 26.0, 16.0, 12.0, 11.0, 11.0, 6.0, 8.0, 7.0, 7.0, 3.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.201194763183594, -28.271142959594727, -27.341093063354492, -26.411041259765625, -25.48099136352539, -24.550939559936523, -23.620887756347656, -22.690837860107422, -21.760786056518555, -20.830734252929688, -19.900684356689453, -18.970632553100586, -18.04058265686035, -17.110530853271484, -16.18048095703125, -15.250429153442383, -14.320378303527832, -13.390327453613281, -12.46027660369873, -11.53022575378418, -10.600173950195312, -9.670123100280762, -8.740072250366211, -7.810020923614502, -6.879970073699951, -5.9499192237854, -5.019867897033691, -4.089817047119141, -3.1597659587860107, -2.229714870452881, -1.29966402053833, -0.3696126937866211, 0.5604381561279297, 1.4904892444610596, 2.4205403327941895, 3.3505911827087402, 4.280642509460449, 5.210693359375, 6.140744209289551, 7.07079553604126, 8.000846862792969, 8.93089771270752, 9.86094856262207, 10.791000366210938, 11.721051216125488, 12.651102066040039, 13.58115291595459, 14.51120376586914, 15.441254615783691, 16.371305465698242, 17.30135726928711, 18.231407165527344, 19.16145896911621, 20.091510772705078, 21.021560668945312, 21.95161247253418, 22.881662368774414, 23.81171417236328, 24.741764068603516, 25.671815872192383, 26.601865768432617, 27.531917572021484, 28.46196746826172, 29.392019271850586, 30.322071075439453]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 8.0, 7.0, 20.0, 26.0, 38.0, 45.0, 65.0, 66.0, 145.0, 177.0, 287.0, 426.0, 751.0, 1288.0, 2498.0, 5222.0, 11632.0, 29347.0, 78833.0, 214369.0, 380425.0, 200658.0, 73100.0, 27686.0, 10978.0, 4843.0, 2388.0, 1248.0, 673.0, 399.0, 288.0, 189.0, 113.0, 94.0, 68.0, 47.0, 33.0, 24.0, 16.0, 17.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.3125, -32.345947265625, -31.37939453125, -30.412841796875, -29.4462890625, -28.479736328125, -27.51318359375, -26.546630859375, -25.580078125, -24.613525390625, -23.64697265625, -22.680419921875, -21.7138671875, -20.747314453125, -19.78076171875, -18.814208984375, -17.84765625, -16.881103515625, -15.91455078125, -14.947998046875, -13.9814453125, -13.014892578125, -12.04833984375, -11.081787109375, -10.115234375, -9.148681640625, -8.18212890625, -7.215576171875, -6.2490234375, -5.282470703125, -4.31591796875, -3.349365234375, -2.3828125, -1.416259765625, -0.44970703125, 0.516845703125, 1.4833984375, 2.449951171875, 3.41650390625, 4.383056640625, 5.349609375, 6.316162109375, 7.28271484375, 8.249267578125, 9.2158203125, 10.182373046875, 11.14892578125, 12.115478515625, 13.08203125, 14.048583984375, 15.01513671875, 15.981689453125, 16.9482421875, 17.914794921875, 18.88134765625, 19.847900390625, 20.814453125, 21.781005859375, 22.74755859375, 23.714111328125, 24.6806640625, 25.647216796875, 26.61376953125, 27.580322265625, 28.546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 9.0, 16.0, 24.0, 28.0, 42.0, 47.0, 68.0, 69.0, 89.0, 85.0, 84.0, 76.0, 76.0, 62.0, 56.0, 33.0, 30.0, 27.0, 21.0, 13.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.0909423828125, -2.963134765625, -2.8353271484375, -2.70751953125, -2.5797119140625, -2.451904296875, -2.3240966796875, -2.1962890625, -2.0684814453125, -1.940673828125, -1.8128662109375, -1.68505859375, -1.5572509765625, -1.429443359375, -1.3016357421875, -1.173828125, -1.0460205078125, -0.918212890625, -0.7904052734375, -0.66259765625, -0.5347900390625, -0.406982421875, -0.2791748046875, -0.1513671875, -0.0235595703125, 0.104248046875, 0.2320556640625, 0.35986328125, 0.4876708984375, 0.615478515625, 0.7432861328125, 0.87109375, 0.9989013671875, 1.126708984375, 1.2545166015625, 1.38232421875, 1.5101318359375, 1.637939453125, 1.7657470703125, 1.8935546875, 2.0213623046875, 2.149169921875, 2.2769775390625, 2.40478515625, 2.5325927734375, 2.660400390625, 2.7882080078125, 2.916015625, 3.0438232421875, 3.171630859375, 3.2994384765625, 3.42724609375, 3.5550537109375, 3.682861328125, 3.8106689453125, 3.9384765625, 4.0662841796875, 4.194091796875, 4.3218994140625, 4.44970703125, 4.5775146484375, 4.705322265625, 4.8331298828125, 4.9609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 9.0, 12.0, 14.0, 13.0, 26.0, 27.0, 43.0, 49.0, 83.0, 110.0, 168.0, 337.0, 539.0, 1127.0, 2530.0, 6620.0, 20189.0, 69282.0, 261674.0, 460632.0, 160004.0, 43250.0, 13289.0, 4673.0, 1840.0, 813.0, 456.0, 251.0, 126.0, 115.0, 68.0, 48.0, 34.0, 33.0, 17.0, 15.0, 5.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.71875, -36.474609375, -35.23046875, -33.986328125, -32.7421875, -31.498046875, -30.25390625, -29.009765625, -27.765625, -26.521484375, -25.27734375, -24.033203125, -22.7890625, -21.544921875, -20.30078125, -19.056640625, -17.8125, -16.568359375, -15.32421875, -14.080078125, -12.8359375, -11.591796875, -10.34765625, -9.103515625, -7.859375, -6.615234375, -5.37109375, -4.126953125, -2.8828125, -1.638671875, -0.39453125, 0.849609375, 2.09375, 3.337890625, 4.58203125, 5.826171875, 7.0703125, 8.314453125, 9.55859375, 10.802734375, 12.046875, 13.291015625, 14.53515625, 15.779296875, 17.0234375, 18.267578125, 19.51171875, 20.755859375, 22.0, 23.244140625, 24.48828125, 25.732421875, 26.9765625, 28.220703125, 29.46484375, 30.708984375, 31.953125, 33.197265625, 34.44140625, 35.685546875, 36.9296875, 38.173828125, 39.41796875, 40.662109375, 41.90625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 2.0, 7.0, 14.0, 13.0, 19.0, 16.0, 23.0, 29.0, 31.0, 33.0, 35.0, 45.0, 43.0, 62.0, 46.0, 54.0, 54.0, 51.0, 47.0, 58.0, 44.0, 33.0, 29.0, 33.0, 29.0, 26.0, 28.0, 16.0, 16.0, 10.0, 15.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.212158203125, -15.64306640625, -15.073974609375, -14.5048828125, -13.935791015625, -13.36669921875, -12.797607421875, -12.228515625, -11.659423828125, -11.09033203125, -10.521240234375, -9.9521484375, -9.383056640625, -8.81396484375, -8.244873046875, -7.67578125, -7.106689453125, -6.53759765625, -5.968505859375, -5.3994140625, -4.830322265625, -4.26123046875, -3.692138671875, -3.123046875, -2.553955078125, -1.98486328125, -1.415771484375, -0.8466796875, -0.277587890625, 0.29150390625, 0.860595703125, 1.4296875, 1.998779296875, 2.56787109375, 3.136962890625, 3.7060546875, 4.275146484375, 4.84423828125, 5.413330078125, 5.982421875, 6.551513671875, 7.12060546875, 7.689697265625, 8.2587890625, 8.827880859375, 9.39697265625, 9.966064453125, 10.53515625, 11.104248046875, 11.67333984375, 12.242431640625, 12.8115234375, 13.380615234375, 13.94970703125, 14.518798828125, 15.087890625, 15.656982421875, 16.22607421875, 16.795166015625, 17.3642578125, 17.933349609375, 18.50244140625, 19.071533203125, 19.640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 22.0, 32.0, 43.0, 55.0, 107.0, 160.0, 317.0, 571.0, 1063.0, 2157.0, 4607.0, 10536.0, 27540.0, 83744.0, 298168.0, 417497.0, 134721.0, 40548.0, 14606.0, 6097.0, 2784.0, 1325.0, 712.0, 411.0, 220.0, 157.0, 102.0, 56.0, 37.0, 25.0, 23.0, 21.0, 17.0, 4.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-22.984375, -22.270263671875, -21.55615234375, -20.842041015625, -20.1279296875, -19.413818359375, -18.69970703125, -17.985595703125, -17.271484375, -16.557373046875, -15.84326171875, -15.129150390625, -14.4150390625, -13.700927734375, -12.98681640625, -12.272705078125, -11.55859375, -10.844482421875, -10.13037109375, -9.416259765625, -8.7021484375, -7.988037109375, -7.27392578125, -6.559814453125, -5.845703125, -5.131591796875, -4.41748046875, -3.703369140625, -2.9892578125, -2.275146484375, -1.56103515625, -0.846923828125, -0.1328125, 0.581298828125, 1.29541015625, 2.009521484375, 2.7236328125, 3.437744140625, 4.15185546875, 4.865966796875, 5.580078125, 6.294189453125, 7.00830078125, 7.722412109375, 8.4365234375, 9.150634765625, 9.86474609375, 10.578857421875, 11.29296875, 12.007080078125, 12.72119140625, 13.435302734375, 14.1494140625, 14.863525390625, 15.57763671875, 16.291748046875, 17.005859375, 17.719970703125, 18.43408203125, 19.148193359375, 19.8623046875, 20.576416015625, 21.29052734375, 22.004638671875, 22.71875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 11.0, 12.0, 12.0, 20.0, 37.0, 50.0, 56.0, 65.0, 103.0, 94.0, 122.0, 84.0, 84.0, 69.0, 33.0, 32.0, 36.0, 19.0, 13.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.0040991902351379395, -0.003971695899963379, -0.0038442015647888184, -0.003716707229614258, -0.0035892128944396973, -0.0034617185592651367, -0.003334224224090576, -0.0032067298889160156, -0.003079235553741455, -0.0029517412185668945, -0.002824246883392334, -0.0026967525482177734, -0.002569258213043213, -0.0024417638778686523, -0.002314269542694092, -0.0021867752075195312, -0.0020592808723449707, -0.0019317865371704102, -0.0018042922019958496, -0.001676797866821289, -0.0015493035316467285, -0.001421809196472168, -0.0012943148612976074, -0.0011668205261230469, -0.0010393261909484863, -0.0009118318557739258, -0.0007843375205993652, -0.0006568431854248047, -0.0005293488502502441, -0.0004018545150756836, -0.00027436017990112305, -0.0001468658447265625, -1.9371509552001953e-05, 0.0001081228256225586, 0.00023561716079711914, 0.0003631114959716797, 0.0004906058311462402, 0.0006181001663208008, 0.0007455945014953613, 0.0008730888366699219, 0.0010005831718444824, 0.001128077507019043, 0.0012555718421936035, 0.001383066177368164, 0.0015105605125427246, 0.0016380548477172852, 0.0017655491828918457, 0.0018930435180664062, 0.002020537853240967, 0.0021480321884155273, 0.002275526523590088, 0.0024030208587646484, 0.002530515193939209, 0.0026580095291137695, 0.00278550386428833, 0.0029129981994628906, 0.003040492534637451, 0.0031679868698120117, 0.0032954812049865723, 0.003422975540161133, 0.0035504698753356934, 0.003677964210510254, 0.0038054585456848145, 0.003932952880859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 14.0, 23.0, 41.0, 71.0, 115.0, 233.0, 484.0, 973.0, 2617.0, 8691.0, 39710.0, 344976.0, 570037.0, 62339.0, 12252.0, 3512.0, 1293.0, 539.0, 253.0, 117.0, 92.0, 46.0, 31.0, 16.0, 17.0, 11.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-51.96875, -50.56884765625, -49.1689453125, -47.76904296875, -46.369140625, -44.96923828125, -43.5693359375, -42.16943359375, -40.76953125, -39.36962890625, -37.9697265625, -36.56982421875, -35.169921875, -33.77001953125, -32.3701171875, -30.97021484375, -29.5703125, -28.17041015625, -26.7705078125, -25.37060546875, -23.970703125, -22.57080078125, -21.1708984375, -19.77099609375, -18.37109375, -16.97119140625, -15.5712890625, -14.17138671875, -12.771484375, -11.37158203125, -9.9716796875, -8.57177734375, -7.171875, -5.77197265625, -4.3720703125, -2.97216796875, -1.572265625, -0.17236328125, 1.2275390625, 2.62744140625, 4.02734375, 5.42724609375, 6.8271484375, 8.22705078125, 9.626953125, 11.02685546875, 12.4267578125, 13.82666015625, 15.2265625, 16.62646484375, 18.0263671875, 19.42626953125, 20.826171875, 22.22607421875, 23.6259765625, 25.02587890625, 26.42578125, 27.82568359375, 29.2255859375, 30.62548828125, 32.025390625, 33.42529296875, 34.8251953125, 36.22509765625, 37.625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 9.0, 13.0, 20.0, 16.0, 25.0, 51.0, 49.0, 73.0, 88.0, 118.0, 107.0, 103.0, 82.0, 63.0, 37.0, 26.0, 19.0, 21.0, 17.0, 9.0, 7.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.96875, -19.4305419921875, -18.892333984375, -18.3541259765625, -17.81591796875, -17.2777099609375, -16.739501953125, -16.2012939453125, -15.6630859375, -15.1248779296875, -14.586669921875, -14.0484619140625, -13.51025390625, -12.9720458984375, -12.433837890625, -11.8956298828125, -11.357421875, -10.8192138671875, -10.281005859375, -9.7427978515625, -9.20458984375, -8.6663818359375, -8.128173828125, -7.5899658203125, -7.0517578125, -6.5135498046875, -5.975341796875, -5.4371337890625, -4.89892578125, -4.3607177734375, -3.822509765625, -3.2843017578125, -2.74609375, -2.2078857421875, -1.669677734375, -1.1314697265625, -0.59326171875, -0.0550537109375, 0.483154296875, 1.0213623046875, 1.5595703125, 2.0977783203125, 2.635986328125, 3.1741943359375, 3.71240234375, 4.2506103515625, 4.788818359375, 5.3270263671875, 5.865234375, 6.4034423828125, 6.941650390625, 7.4798583984375, 8.01806640625, 8.5562744140625, 9.094482421875, 9.6326904296875, 10.1708984375, 10.7091064453125, 11.247314453125, 11.7855224609375, 12.32373046875, 12.8619384765625, 13.400146484375, 13.9383544921875, 14.4765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 12.0, 26.0, 62.0, 104.0, 183.0, 223.0, 169.0, 110.0, 54.0, 18.0, 12.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.73016357421875, -367.71539306640625, -356.70062255859375, -345.6858215332031, -334.6710510253906, -323.6562805175781, -312.6414794921875, -301.626708984375, -290.6119384765625, -279.59716796875, -268.5823974609375, -257.5675964355469, -246.55282592773438, -235.53805541992188, -224.5232696533203, -213.50848388671875, -202.49371337890625, -191.47894287109375, -180.4641571044922, -169.44937133789062, -158.43460083007812, -147.41983032226562, -136.40504455566406, -125.39026641845703, -114.37548828125, -103.36071014404297, -92.34593200683594, -81.3311538696289, -70.31637573242188, -59.301597595214844, -48.28681945800781, -37.27204132080078, -26.257232666015625, -15.242454528808594, -4.2276763916015625, 6.787101745605469, 17.8018798828125, 28.81665802001953, 39.83143615722656, 50.846214294433594, 61.860992431640625, 72.87577056884766, 83.89054870605469, 94.90532684326172, 105.92010498046875, 116.93488311767578, 127.94966125488281, 138.96444702148438, 149.97921752929688, 160.99398803710938, 172.00877380371094, 183.0235595703125, 194.038330078125, 205.0531005859375, 216.06788635253906, 227.08267211914062, 238.09744262695312, 249.11221313476562, 260.12701416015625, 271.14178466796875, 282.15655517578125, 293.17132568359375, 304.18609619140625, 315.2008972167969, 326.2156677246094]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 11.0, 12.0, 18.0, 19.0, 25.0, 18.0, 15.0, 31.0, 28.0, 49.0, 49.0, 43.0, 56.0, 26.0, 47.0, 54.0, 41.0, 50.0, 34.0, 45.0, 39.0, 38.0, 43.0, 29.0, 22.0, 26.0, 20.0, 11.0, 16.0, 10.0, 9.0, 8.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-133.895263671875, -130.08030700683594, -126.2653579711914, -122.45040130615234, -118.63545227050781, -114.82049560546875, -111.00553894042969, -107.19058990478516, -103.37564086914062, -99.56068420410156, -95.74573516845703, -91.93077850341797, -88.11582946777344, -84.30087280273438, -80.48591613769531, -76.67096710205078, -72.85601043701172, -69.04105377197266, -65.22610473632812, -61.41114807128906, -57.59619903564453, -53.78124237060547, -49.96628952026367, -46.151336669921875, -42.33638381958008, -38.52143096923828, -34.706478118896484, -30.891523361206055, -27.076570510864258, -23.26161766052246, -19.44666290283203, -15.631710052490234, -11.816764831542969, -8.001811981201172, -4.186858177185059, -0.3719043731689453, 3.4430484771728516, 7.258001327514648, 11.072956085205078, 14.887908935546875, 18.702861785888672, 22.51781463623047, 26.332767486572266, 30.147722244262695, 33.962677001953125, 37.777626037597656, 41.59258270263672, 45.407535552978516, 49.22248840332031, 53.03744125366211, 56.852394104003906, 60.66735076904297, 64.4822998046875, 68.29725646972656, 72.11221313476562, 75.92716217041016, 79.74211120605469, 83.55706787109375, 87.37201690673828, 91.18697357177734, 95.00192260742188, 98.81687927246094, 102.6318359375, 106.44678497314453, 110.2617416381836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 9.0, 15.0, 21.0, 20.0, 30.0, 46.0, 62.0, 78.0, 121.0, 172.0, 243.0, 390.0, 638.0, 1051.0, 1938.0, 3712.0, 8289.0, 21419.0, 68032.0, 337218.0, 3383230.0, 270800.0, 61660.0, 20071.0, 7884.0, 3433.0, 1649.0, 860.0, 440.0, 272.0, 165.0, 99.0, 60.0, 35.0, 36.0, 22.0, 22.0, 17.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.375, -53.71923828125, -52.0634765625, -50.40771484375, -48.751953125, -47.09619140625, -45.4404296875, -43.78466796875, -42.12890625, -40.47314453125, -38.8173828125, -37.16162109375, -35.505859375, -33.85009765625, -32.1943359375, -30.53857421875, -28.8828125, -27.22705078125, -25.5712890625, -23.91552734375, -22.259765625, -20.60400390625, -18.9482421875, -17.29248046875, -15.63671875, -13.98095703125, -12.3251953125, -10.66943359375, -9.013671875, -7.35791015625, -5.7021484375, -4.04638671875, -2.390625, -0.73486328125, 0.9208984375, 2.57666015625, 4.232421875, 5.88818359375, 7.5439453125, 9.19970703125, 10.85546875, 12.51123046875, 14.1669921875, 15.82275390625, 17.478515625, 19.13427734375, 20.7900390625, 22.44580078125, 24.1015625, 25.75732421875, 27.4130859375, 29.06884765625, 30.724609375, 32.38037109375, 34.0361328125, 35.69189453125, 37.34765625, 39.00341796875, 40.6591796875, 42.31494140625, 43.970703125, 45.62646484375, 47.2822265625, 48.93798828125, 50.59375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 16.0, 19.0, 27.0, 36.0, 43.0, 46.0, 60.0, 69.0, 78.0, 63.0, 73.0, 69.0, 77.0, 60.0, 42.0, 45.0, 32.0, 29.0, 29.0, 12.0, 16.0, 9.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.77362060546875, -3.6292724609375, -3.48492431640625, -3.340576171875, -3.19622802734375, -3.0518798828125, -2.90753173828125, -2.76318359375, -2.61883544921875, -2.4744873046875, -2.33013916015625, -2.185791015625, -2.04144287109375, -1.8970947265625, -1.75274658203125, -1.6083984375, -1.46405029296875, -1.3197021484375, -1.17535400390625, -1.031005859375, -0.88665771484375, -0.7423095703125, -0.59796142578125, -0.45361328125, -0.30926513671875, -0.1649169921875, -0.02056884765625, 0.123779296875, 0.26812744140625, 0.4124755859375, 0.55682373046875, 0.701171875, 0.84552001953125, 0.9898681640625, 1.13421630859375, 1.278564453125, 1.42291259765625, 1.5672607421875, 1.71160888671875, 1.85595703125, 2.00030517578125, 2.1446533203125, 2.28900146484375, 2.433349609375, 2.57769775390625, 2.7220458984375, 2.86639404296875, 3.0107421875, 3.15509033203125, 3.2994384765625, 3.44378662109375, 3.588134765625, 3.73248291015625, 3.8768310546875, 4.02117919921875, 4.16552734375, 4.30987548828125, 4.4542236328125, 4.59857177734375, 4.742919921875, 4.88726806640625, 5.0316162109375, 5.17596435546875, 5.3203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 20.0, 15.0, 22.0, 53.0, 69.0, 130.0, 194.0, 337.0, 571.0, 1116.0, 2436.0, 5544.0, 14333.0, 43011.0, 168149.0, 2431916.0, 1315696.0, 148499.0, 39227.0, 13306.0, 5190.0, 2216.0, 1005.0, 516.0, 289.0, 153.0, 97.0, 40.0, 37.0, 21.0, 21.0, 14.0, 11.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.759765625, -45.98828125, -44.216796875, -42.4453125, -40.673828125, -38.90234375, -37.130859375, -35.359375, -33.587890625, -31.81640625, -30.044921875, -28.2734375, -26.501953125, -24.73046875, -22.958984375, -21.1875, -19.416015625, -17.64453125, -15.873046875, -14.1015625, -12.330078125, -10.55859375, -8.787109375, -7.015625, -5.244140625, -3.47265625, -1.701171875, 0.0703125, 1.841796875, 3.61328125, 5.384765625, 7.15625, 8.927734375, 10.69921875, 12.470703125, 14.2421875, 16.013671875, 17.78515625, 19.556640625, 21.328125, 23.099609375, 24.87109375, 26.642578125, 28.4140625, 30.185546875, 31.95703125, 33.728515625, 35.5, 37.271484375, 39.04296875, 40.814453125, 42.5859375, 44.357421875, 46.12890625, 47.900390625, 49.671875, 51.443359375, 53.21484375, 54.986328125, 56.7578125, 58.529296875, 60.30078125, 62.072265625, 63.84375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 17.0, 10.0, 23.0, 25.0, 39.0, 49.0, 53.0, 70.0, 133.0, 151.0, 267.0, 463.0, 1434.0, 448.0, 259.0, 169.0, 110.0, 80.0, 60.0, 44.0, 37.0, 28.0, 20.0, 14.0, 13.0, 16.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.75, -12.40087890625, -12.0517578125, -11.70263671875, -11.353515625, -11.00439453125, -10.6552734375, -10.30615234375, -9.95703125, -9.60791015625, -9.2587890625, -8.90966796875, -8.560546875, -8.21142578125, -7.8623046875, -7.51318359375, -7.1640625, -6.81494140625, -6.4658203125, -6.11669921875, -5.767578125, -5.41845703125, -5.0693359375, -4.72021484375, -4.37109375, -4.02197265625, -3.6728515625, -3.32373046875, -2.974609375, -2.62548828125, -2.2763671875, -1.92724609375, -1.578125, -1.22900390625, -0.8798828125, -0.53076171875, -0.181640625, 0.16748046875, 0.5166015625, 0.86572265625, 1.21484375, 1.56396484375, 1.9130859375, 2.26220703125, 2.611328125, 2.96044921875, 3.3095703125, 3.65869140625, 4.0078125, 4.35693359375, 4.7060546875, 5.05517578125, 5.404296875, 5.75341796875, 6.1025390625, 6.45166015625, 6.80078125, 7.14990234375, 7.4990234375, 7.84814453125, 8.197265625, 8.54638671875, 8.8955078125, 9.24462890625, 9.59375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 23.0, 30.0, 46.0, 50.0, 69.0, 87.0, 106.0, 101.0, 90.0, 82.0, 63.0, 45.0, 35.0, 32.0, 20.0, 16.0, 12.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-57.18735885620117, -55.36600112915039, -53.54464340209961, -51.72328186035156, -49.90192413330078, -48.08056640625, -46.25920867919922, -44.43785095214844, -42.61648941040039, -40.79513168334961, -38.97377395629883, -37.15241241455078, -35.3310546875, -33.50969696044922, -31.688339233398438, -29.866979598999023, -28.045621871948242, -26.22426414489746, -24.402904510498047, -22.581546783447266, -20.76018714904785, -18.93882942199707, -17.117469787597656, -15.296112060546875, -13.474753379821777, -11.65339469909668, -9.832036018371582, -8.010677337646484, -6.189319133758545, -4.3679609298706055, -2.546602249145508, -0.7252435684204102, 1.0961151123046875, 2.917473793029785, 4.738832473754883, 6.560190677642822, 8.381549835205078, 10.20290756225586, 12.024266242980957, 13.845624923706055, 15.666983604431152, 17.48834228515625, 19.30970001220703, 21.131059646606445, 22.952417373657227, 24.77377700805664, 26.595134735107422, 28.416492462158203, 30.237852096557617, 32.05921173095703, 33.88056945800781, 35.701927185058594, 37.523284912109375, 39.344642639160156, 41.1660041809082, 42.987361907958984, 44.808719635009766, 46.63007736206055, 48.45143508911133, 50.272796630859375, 52.094154357910156, 53.91551208496094, 55.73686981201172, 57.5582275390625, 59.37958908081055]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 9.0, 8.0, 18.0, 11.0, 18.0, 25.0, 23.0, 31.0, 26.0, 30.0, 42.0, 32.0, 31.0, 50.0, 49.0, 42.0, 41.0, 57.0, 41.0, 50.0, 33.0, 38.0, 31.0, 29.0, 27.0, 29.0, 26.0, 26.0, 19.0, 16.0, 7.0, 12.0, 9.0, 6.0, 7.0, 11.0, 1.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.58074951171875, -42.231414794921875, -40.882076263427734, -39.53274154663086, -38.183406829833984, -36.83407211303711, -35.48473358154297, -34.135398864746094, -32.78606414794922, -31.43672752380371, -30.087392807006836, -28.738056182861328, -27.388721466064453, -26.039384841918945, -24.690048217773438, -23.340713500976562, -21.991376876831055, -20.642040252685547, -19.292705535888672, -17.943368911743164, -16.59403419494629, -15.244697570800781, -13.89536190032959, -12.546026229858398, -11.196690559387207, -9.847354888916016, -8.498019218444824, -7.148683071136475, -5.799347400665283, -4.450011730194092, -3.100675582885742, -1.7513399124145508, -0.4020042419433594, 0.9473315477371216, 2.2966673374176025, 3.646003246307373, 4.9953389167785645, 6.344674587249756, 7.6940107345581055, 9.043346405029297, 10.392682075500488, 11.74201774597168, 13.091353416442871, 14.440689086914062, 15.79002571105957, 17.139360427856445, 18.488697052001953, 19.838031768798828, 21.187368392944336, 22.536705017089844, 23.88603973388672, 25.235376358032227, 26.5847110748291, 27.93404769897461, 29.283382415771484, 30.632719039916992, 31.9820556640625, 33.331390380859375, 34.680728912353516, 36.03006362915039, 37.379398345947266, 38.72873306274414, 40.07807159423828, 41.427406311035156, 42.77674102783203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 7.0, 6.0, 8.0, 16.0, 18.0, 30.0, 41.0, 74.0, 77.0, 112.0, 186.0, 244.0, 361.0, 526.0, 871.0, 1405.0, 2308.0, 4192.0, 7831.0, 15966.0, 33910.0, 74963.0, 165963.0, 303664.0, 232084.0, 108473.0, 48541.0, 22378.0, 10713.0, 5633.0, 3095.0, 1709.0, 1052.0, 688.0, 434.0, 306.0, 206.0, 147.0, 91.0, 67.0, 48.0, 30.0, 17.0, 20.0, 10.0, 8.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-25.3125, -24.48876953125, -23.6650390625, -22.84130859375, -22.017578125, -21.19384765625, -20.3701171875, -19.54638671875, -18.72265625, -17.89892578125, -17.0751953125, -16.25146484375, -15.427734375, -14.60400390625, -13.7802734375, -12.95654296875, -12.1328125, -11.30908203125, -10.4853515625, -9.66162109375, -8.837890625, -8.01416015625, -7.1904296875, -6.36669921875, -5.54296875, -4.71923828125, -3.8955078125, -3.07177734375, -2.248046875, -1.42431640625, -0.6005859375, 0.22314453125, 1.046875, 1.87060546875, 2.6943359375, 3.51806640625, 4.341796875, 5.16552734375, 5.9892578125, 6.81298828125, 7.63671875, 8.46044921875, 9.2841796875, 10.10791015625, 10.931640625, 11.75537109375, 12.5791015625, 13.40283203125, 14.2265625, 15.05029296875, 15.8740234375, 16.69775390625, 17.521484375, 18.34521484375, 19.1689453125, 19.99267578125, 20.81640625, 21.64013671875, 22.4638671875, 23.28759765625, 24.111328125, 24.93505859375, 25.7587890625, 26.58251953125, 27.40625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 11.0, 15.0, 19.0, 24.0, 29.0, 34.0, 45.0, 55.0, 48.0, 56.0, 69.0, 69.0, 53.0, 64.0, 59.0, 56.0, 51.0, 43.0, 37.0, 41.0, 25.0, 18.0, 6.0, 13.0, 6.0, 10.0, 4.0, 6.0, 1.0, 8.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.009521484375, -3.86669921875, -3.723876953125, -3.5810546875, -3.438232421875, -3.29541015625, -3.152587890625, -3.009765625, -2.866943359375, -2.72412109375, -2.581298828125, -2.4384765625, -2.295654296875, -2.15283203125, -2.010009765625, -1.8671875, -1.724365234375, -1.58154296875, -1.438720703125, -1.2958984375, -1.153076171875, -1.01025390625, -0.867431640625, -0.724609375, -0.581787109375, -0.43896484375, -0.296142578125, -0.1533203125, -0.010498046875, 0.13232421875, 0.275146484375, 0.41796875, 0.560791015625, 0.70361328125, 0.846435546875, 0.9892578125, 1.132080078125, 1.27490234375, 1.417724609375, 1.560546875, 1.703369140625, 1.84619140625, 1.989013671875, 2.1318359375, 2.274658203125, 2.41748046875, 2.560302734375, 2.703125, 2.845947265625, 2.98876953125, 3.131591796875, 3.2744140625, 3.417236328125, 3.56005859375, 3.702880859375, 3.845703125, 3.988525390625, 4.13134765625, 4.274169921875, 4.4169921875, 4.559814453125, 4.70263671875, 4.845458984375, 4.98828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 16.0, 24.0, 34.0, 50.0, 79.0, 107.0, 187.0, 325.0, 650.0, 1482.0, 3650.0, 10869.0, 38739.0, 164795.0, 548171.0, 210809.0, 48292.0, 12950.0, 4138.0, 1643.0, 704.0, 325.0, 193.0, 95.0, 66.0, 46.0, 37.0, 19.0, 14.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.8330078125, -45.134765625, -43.4365234375, -41.73828125, -40.0400390625, -38.341796875, -36.6435546875, -34.9453125, -33.2470703125, -31.548828125, -29.8505859375, -28.15234375, -26.4541015625, -24.755859375, -23.0576171875, -21.359375, -19.6611328125, -17.962890625, -16.2646484375, -14.56640625, -12.8681640625, -11.169921875, -9.4716796875, -7.7734375, -6.0751953125, -4.376953125, -2.6787109375, -0.98046875, 0.7177734375, 2.416015625, 4.1142578125, 5.8125, 7.5107421875, 9.208984375, 10.9072265625, 12.60546875, 14.3037109375, 16.001953125, 17.7001953125, 19.3984375, 21.0966796875, 22.794921875, 24.4931640625, 26.19140625, 27.8896484375, 29.587890625, 31.2861328125, 32.984375, 34.6826171875, 36.380859375, 38.0791015625, 39.77734375, 41.4755859375, 43.173828125, 44.8720703125, 46.5703125, 48.2685546875, 49.966796875, 51.6650390625, 53.36328125, 55.0615234375, 56.759765625, 58.4580078125, 60.15625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 11.0, 12.0, 5.0, 9.0, 13.0, 17.0, 22.0, 30.0, 35.0, 29.0, 32.0, 51.0, 50.0, 51.0, 44.0, 52.0, 52.0, 57.0, 37.0, 44.0, 37.0, 52.0, 39.0, 40.0, 33.0, 28.0, 25.0, 22.0, 15.0, 12.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.413330078125, -22.59228515625, -21.771240234375, -20.9501953125, -20.129150390625, -19.30810546875, -18.487060546875, -17.666015625, -16.844970703125, -16.02392578125, -15.202880859375, -14.3818359375, -13.560791015625, -12.73974609375, -11.918701171875, -11.09765625, -10.276611328125, -9.45556640625, -8.634521484375, -7.8134765625, -6.992431640625, -6.17138671875, -5.350341796875, -4.529296875, -3.708251953125, -2.88720703125, -2.066162109375, -1.2451171875, -0.424072265625, 0.39697265625, 1.218017578125, 2.0390625, 2.860107421875, 3.68115234375, 4.502197265625, 5.3232421875, 6.144287109375, 6.96533203125, 7.786376953125, 8.607421875, 9.428466796875, 10.24951171875, 11.070556640625, 11.8916015625, 12.712646484375, 13.53369140625, 14.354736328125, 15.17578125, 15.996826171875, 16.81787109375, 17.638916015625, 18.4599609375, 19.281005859375, 20.10205078125, 20.923095703125, 21.744140625, 22.565185546875, 23.38623046875, 24.207275390625, 25.0283203125, 25.849365234375, 26.67041015625, 27.491455078125, 28.3125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 1.0, 9.0, 8.0, 8.0, 20.0, 21.0, 30.0, 32.0, 70.0, 98.0, 139.0, 191.0, 375.0, 643.0, 1124.0, 2156.0, 4285.0, 9301.0, 21238.0, 54844.0, 153291.0, 385568.0, 262777.0, 91129.0, 34354.0, 13880.0, 6261.0, 3007.0, 1503.0, 876.0, 496.0, 277.0, 189.0, 123.0, 74.0, 42.0, 35.0, 27.0, 13.0, 15.0, 4.0, 11.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.63037109375, -16.9951171875, -16.35986328125, -15.724609375, -15.08935546875, -14.4541015625, -13.81884765625, -13.18359375, -12.54833984375, -11.9130859375, -11.27783203125, -10.642578125, -10.00732421875, -9.3720703125, -8.73681640625, -8.1015625, -7.46630859375, -6.8310546875, -6.19580078125, -5.560546875, -4.92529296875, -4.2900390625, -3.65478515625, -3.01953125, -2.38427734375, -1.7490234375, -1.11376953125, -0.478515625, 0.15673828125, 0.7919921875, 1.42724609375, 2.0625, 2.69775390625, 3.3330078125, 3.96826171875, 4.603515625, 5.23876953125, 5.8740234375, 6.50927734375, 7.14453125, 7.77978515625, 8.4150390625, 9.05029296875, 9.685546875, 10.32080078125, 10.9560546875, 11.59130859375, 12.2265625, 12.86181640625, 13.4970703125, 14.13232421875, 14.767578125, 15.40283203125, 16.0380859375, 16.67333984375, 17.30859375, 17.94384765625, 18.5791015625, 19.21435546875, 19.849609375, 20.48486328125, 21.1201171875, 21.75537109375, 22.390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 13.0, 12.0, 17.0, 20.0, 37.0, 54.0, 63.0, 94.0, 155.0, 144.0, 124.0, 77.0, 54.0, 43.0, 29.0, 15.0, 8.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004970550537109375, -0.004788458347320557, -0.004606366157531738, -0.00442427396774292, -0.0042421817779541016, -0.004060089588165283, -0.003877997398376465, -0.0036959052085876465, -0.003513813018798828, -0.0033317208290100098, -0.0031496286392211914, -0.002967536449432373, -0.0027854442596435547, -0.0026033520698547363, -0.002421259880065918, -0.0022391676902770996, -0.0020570755004882812, -0.0018749833106994629, -0.0016928911209106445, -0.0015107989311218262, -0.0013287067413330078, -0.0011466145515441895, -0.0009645223617553711, -0.0007824301719665527, -0.0006003379821777344, -0.000418245792388916, -0.00023615360260009766, -5.40614128112793e-05, 0.00012803077697753906, 0.0003101229667663574, 0.0004922151565551758, 0.0006743073463439941, 0.0008563995361328125, 0.0010384917259216309, 0.0012205839157104492, 0.0014026761054992676, 0.001584768295288086, 0.0017668604850769043, 0.0019489526748657227, 0.002131044864654541, 0.0023131370544433594, 0.0024952292442321777, 0.002677321434020996, 0.0028594136238098145, 0.003041505813598633, 0.003223598003387451, 0.0034056901931762695, 0.003587782382965088, 0.0037698745727539062, 0.003951966762542725, 0.004134058952331543, 0.004316151142120361, 0.00449824333190918, 0.004680335521697998, 0.004862427711486816, 0.005044519901275635, 0.005226612091064453, 0.0054087042808532715, 0.00559079647064209, 0.005772888660430908, 0.0059549808502197266, 0.006137073040008545, 0.006319165229797363, 0.006501257419586182, 0.006683349609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 12.0, 19.0, 20.0, 40.0, 63.0, 109.0, 212.0, 430.0, 937.0, 2331.0, 7297.0, 28229.0, 161314.0, 673197.0, 138323.0, 25301.0, 6720.0, 2243.0, 872.0, 387.0, 193.0, 100.0, 76.0, 44.0, 23.0, 12.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.96875, -35.57177734375, -34.1748046875, -32.77783203125, -31.380859375, -29.98388671875, -28.5869140625, -27.18994140625, -25.79296875, -24.39599609375, -22.9990234375, -21.60205078125, -20.205078125, -18.80810546875, -17.4111328125, -16.01416015625, -14.6171875, -13.22021484375, -11.8232421875, -10.42626953125, -9.029296875, -7.63232421875, -6.2353515625, -4.83837890625, -3.44140625, -2.04443359375, -0.6474609375, 0.74951171875, 2.146484375, 3.54345703125, 4.9404296875, 6.33740234375, 7.734375, 9.13134765625, 10.5283203125, 11.92529296875, 13.322265625, 14.71923828125, 16.1162109375, 17.51318359375, 18.91015625, 20.30712890625, 21.7041015625, 23.10107421875, 24.498046875, 25.89501953125, 27.2919921875, 28.68896484375, 30.0859375, 31.48291015625, 32.8798828125, 34.27685546875, 35.673828125, 37.07080078125, 38.4677734375, 39.86474609375, 41.26171875, 42.65869140625, 44.0556640625, 45.45263671875, 46.849609375, 48.24658203125, 49.6435546875, 51.04052734375, 52.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 3.0, 9.0, 9.0, 7.0, 8.0, 11.0, 12.0, 22.0, 18.0, 28.0, 31.0, 34.0, 42.0, 50.0, 65.0, 62.0, 79.0, 81.0, 64.0, 75.0, 51.0, 43.0, 35.0, 30.0, 23.0, 10.0, 12.0, 14.0, 11.0, 10.0, 11.0, 11.0, 6.0, 9.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.3878173828125, -13.892822265625, -13.3978271484375, -12.90283203125, -12.4078369140625, -11.912841796875, -11.4178466796875, -10.9228515625, -10.4278564453125, -9.932861328125, -9.4378662109375, -8.94287109375, -8.4478759765625, -7.952880859375, -7.4578857421875, -6.962890625, -6.4678955078125, -5.972900390625, -5.4779052734375, -4.98291015625, -4.4879150390625, -3.992919921875, -3.4979248046875, -3.0029296875, -2.5079345703125, -2.012939453125, -1.5179443359375, -1.02294921875, -0.5279541015625, -0.032958984375, 0.4620361328125, 0.95703125, 1.4520263671875, 1.947021484375, 2.4420166015625, 2.93701171875, 3.4320068359375, 3.927001953125, 4.4219970703125, 4.9169921875, 5.4119873046875, 5.906982421875, 6.4019775390625, 6.89697265625, 7.3919677734375, 7.886962890625, 8.3819580078125, 8.876953125, 9.3719482421875, 9.866943359375, 10.3619384765625, 10.85693359375, 11.3519287109375, 11.846923828125, 12.3419189453125, 12.8369140625, 13.3319091796875, 13.826904296875, 14.3218994140625, 14.81689453125, 15.3118896484375, 15.806884765625, 16.3018798828125, 16.796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 12.0, 18.0, 18.0, 51.0, 68.0, 146.0, 157.0, 182.0, 125.0, 76.0, 62.0, 30.0, 22.0, 8.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.466064453125, -239.61849975585938, -228.77093505859375, -217.92335510253906, -207.07579040527344, -196.2282257080078, -185.38064575195312, -174.5330810546875, -163.68551635742188, -152.83795166015625, -141.99038696289062, -131.14280700683594, -120.29524230957031, -109.44767761230469, -98.60010528564453, -87.75253295898438, -76.90496826171875, -66.05740356445312, -55.20983123779297, -44.36226272583008, -33.51469421386719, -22.667125701904297, -11.819557189941406, -0.97198486328125, 9.875579833984375, 20.723148345947266, 31.570716857910156, 42.41828536987305, 53.26585388183594, 64.11341857910156, 74.96099090576172, 85.80856323242188, 96.65609741210938, 107.503662109375, 118.35123443603516, 129.1988067626953, 140.04637145996094, 150.89393615722656, 161.74151611328125, 172.58908081054688, 183.4366455078125, 194.28421020507812, 205.13177490234375, 215.97935485839844, 226.82691955566406, 237.6744842529297, 248.52206420898438, 259.36962890625, 270.2171936035156, 281.06475830078125, 291.9123229980469, 302.7598876953125, 313.60748291015625, 324.4550476074219, 335.3026123046875, 346.1501770019531, 356.99774169921875, 367.8453063964844, 378.69287109375, 389.5404357910156, 400.38800048828125, 411.235595703125, 422.0831604003906, 432.93072509765625, 443.7782897949219]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 10.0, 16.0, 16.0, 9.0, 24.0, 27.0, 29.0, 27.0, 30.0, 30.0, 33.0, 39.0, 35.0, 30.0, 42.0, 54.0, 33.0, 47.0, 40.0, 50.0, 46.0, 28.0, 26.0, 36.0, 34.0, 33.0, 27.0, 14.0, 16.0, 15.0, 10.0, 15.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-160.94764709472656, -155.8898468017578, -150.83206176757812, -145.77426147460938, -140.7164764404297, -135.65867614746094, -130.60089111328125, -125.5430908203125, -120.48529815673828, -115.42750549316406, -110.36971282958984, -105.31192016601562, -100.25411987304688, -95.19633483886719, -90.13853454589844, -85.08074188232422, -80.02294921875, -74.96515655517578, -69.90736389160156, -64.84957122802734, -59.79177474975586, -54.73398208618164, -49.676185607910156, -44.61839294433594, -39.56060028076172, -34.5028076171875, -29.44501304626465, -24.387218475341797, -19.329425811767578, -14.27163314819336, -9.213838577270508, -4.156044006347656, 0.9017486572265625, 5.959542274475098, 11.017335891723633, 16.075130462646484, 21.132923126220703, 26.190715789794922, 31.248510360717773, 36.306304931640625, 41.364097595214844, 46.42189025878906, 51.47968292236328, 56.537479400634766, 61.595272064208984, 66.65306091308594, 71.71086120605469, 76.7686538696289, 81.82644653320312, 86.88423919677734, 91.94203186035156, 96.99982452392578, 102.0576171875, 107.11541748046875, 112.17321014404297, 117.23100280761719, 122.2887954711914, 127.34658813476562, 132.40438842773438, 137.46217346191406, 142.5199737548828, 147.5777587890625, 152.63555908203125, 157.693359375, 162.7511444091797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 7.0, 17.0, 26.0, 36.0, 34.0, 77.0, 112.0, 160.0, 244.0, 407.0, 715.0, 1535.0, 3271.0, 7469.0, 19346.0, 61789.0, 353539.0, 3523583.0, 158653.0, 38272.0, 13807.0, 5669.0, 2631.0, 1298.0, 710.0, 356.0, 201.0, 109.0, 55.0, 54.0, 27.0, 16.0, 8.0, 9.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.6875, -63.0419921875, -61.396484375, -59.7509765625, -58.10546875, -56.4599609375, -54.814453125, -53.1689453125, -51.5234375, -49.8779296875, -48.232421875, -46.5869140625, -44.94140625, -43.2958984375, -41.650390625, -40.0048828125, -38.359375, -36.7138671875, -35.068359375, -33.4228515625, -31.77734375, -30.1318359375, -28.486328125, -26.8408203125, -25.1953125, -23.5498046875, -21.904296875, -20.2587890625, -18.61328125, -16.9677734375, -15.322265625, -13.6767578125, -12.03125, -10.3857421875, -8.740234375, -7.0947265625, -5.44921875, -3.8037109375, -2.158203125, -0.5126953125, 1.1328125, 2.7783203125, 4.423828125, 6.0693359375, 7.71484375, 9.3603515625, 11.005859375, 12.6513671875, 14.296875, 15.9423828125, 17.587890625, 19.2333984375, 20.87890625, 22.5244140625, 24.169921875, 25.8154296875, 27.4609375, 29.1064453125, 30.751953125, 32.3974609375, 34.04296875, 35.6884765625, 37.333984375, 38.9794921875, 40.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 16.0, 14.0, 21.0, 22.0, 32.0, 36.0, 39.0, 53.0, 46.0, 64.0, 54.0, 72.0, 61.0, 64.0, 60.0, 51.0, 43.0, 41.0, 41.0, 33.0, 26.0, 12.0, 25.0, 13.0, 11.0, 12.0, 3.0, 5.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.9432373046875, -5.765380859375, -5.5875244140625, -5.40966796875, -5.2318115234375, -5.053955078125, -4.8760986328125, -4.6982421875, -4.5203857421875, -4.342529296875, -4.1646728515625, -3.98681640625, -3.8089599609375, -3.631103515625, -3.4532470703125, -3.275390625, -3.0975341796875, -2.919677734375, -2.7418212890625, -2.56396484375, -2.3861083984375, -2.208251953125, -2.0303955078125, -1.8525390625, -1.6746826171875, -1.496826171875, -1.3189697265625, -1.14111328125, -0.9632568359375, -0.785400390625, -0.6075439453125, -0.4296875, -0.2518310546875, -0.073974609375, 0.1038818359375, 0.28173828125, 0.4595947265625, 0.637451171875, 0.8153076171875, 0.9931640625, 1.1710205078125, 1.348876953125, 1.5267333984375, 1.70458984375, 1.8824462890625, 2.060302734375, 2.2381591796875, 2.416015625, 2.5938720703125, 2.771728515625, 2.9495849609375, 3.12744140625, 3.3052978515625, 3.483154296875, 3.6610107421875, 3.8388671875, 4.0167236328125, 4.194580078125, 4.3724365234375, 4.55029296875, 4.7281494140625, 4.906005859375, 5.0838623046875, 5.26171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 13.0, 19.0, 33.0, 34.0, 57.0, 110.0, 158.0, 275.0, 473.0, 825.0, 1521.0, 2989.0, 6576.0, 16666.0, 52132.0, 256378.0, 3425931.0, 337176.0, 60423.0, 18441.0, 7202.0, 3157.0, 1575.0, 826.0, 487.0, 274.0, 183.0, 115.0, 84.0, 50.0, 31.0, 24.0, 14.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.59375, -61.8056640625, -60.017578125, -58.2294921875, -56.44140625, -54.6533203125, -52.865234375, -51.0771484375, -49.2890625, -47.5009765625, -45.712890625, -43.9248046875, -42.13671875, -40.3486328125, -38.560546875, -36.7724609375, -34.984375, -33.1962890625, -31.408203125, -29.6201171875, -27.83203125, -26.0439453125, -24.255859375, -22.4677734375, -20.6796875, -18.8916015625, -17.103515625, -15.3154296875, -13.52734375, -11.7392578125, -9.951171875, -8.1630859375, -6.375, -4.5869140625, -2.798828125, -1.0107421875, 0.77734375, 2.5654296875, 4.353515625, 6.1416015625, 7.9296875, 9.7177734375, 11.505859375, 13.2939453125, 15.08203125, 16.8701171875, 18.658203125, 20.4462890625, 22.234375, 24.0224609375, 25.810546875, 27.5986328125, 29.38671875, 31.1748046875, 32.962890625, 34.7509765625, 36.5390625, 38.3271484375, 40.115234375, 41.9033203125, 43.69140625, 45.4794921875, 47.267578125, 49.0556640625, 50.84375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 4.0, 18.0, 13.0, 19.0, 35.0, 36.0, 62.0, 65.0, 96.0, 156.0, 262.0, 537.0, 1779.0, 363.0, 180.0, 128.0, 64.0, 59.0, 40.0, 33.0, 29.0, 17.0, 14.0, 8.0, 2.0, 6.0, 3.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8203125, -12.4102783203125, -12.000244140625, -11.5902099609375, -11.18017578125, -10.7701416015625, -10.360107421875, -9.9500732421875, -9.5400390625, -9.1300048828125, -8.719970703125, -8.3099365234375, -7.89990234375, -7.4898681640625, -7.079833984375, -6.6697998046875, -6.259765625, -5.8497314453125, -5.439697265625, -5.0296630859375, -4.61962890625, -4.2095947265625, -3.799560546875, -3.3895263671875, -2.9794921875, -2.5694580078125, -2.159423828125, -1.7493896484375, -1.33935546875, -0.9293212890625, -0.519287109375, -0.1092529296875, 0.30078125, 0.7108154296875, 1.120849609375, 1.5308837890625, 1.94091796875, 2.3509521484375, 2.760986328125, 3.1710205078125, 3.5810546875, 3.9910888671875, 4.401123046875, 4.8111572265625, 5.22119140625, 5.6312255859375, 6.041259765625, 6.4512939453125, 6.861328125, 7.2713623046875, 7.681396484375, 8.0914306640625, 8.50146484375, 8.9114990234375, 9.321533203125, 9.7315673828125, 10.1416015625, 10.5516357421875, 10.961669921875, 11.3717041015625, 11.78173828125, 12.1917724609375, 12.601806640625, 13.0118408203125, 13.421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 18.0, 17.0, 22.0, 41.0, 62.0, 74.0, 156.0, 152.0, 127.0, 106.0, 78.0, 56.0, 29.0, 18.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.20330047607422, -78.2730712890625, -75.34284973144531, -72.41262817382812, -69.4823989868164, -66.55216979980469, -63.6219482421875, -60.69172286987305, -57.761497497558594, -54.83127212524414, -51.90104675292969, -48.970821380615234, -46.04059600830078, -43.11037063598633, -40.180145263671875, -37.24991989135742, -34.31969451904297, -31.389469146728516, -28.459243774414062, -25.52901840209961, -22.598793029785156, -19.668567657470703, -16.73834228515625, -13.808116912841797, -10.877891540527344, -7.947666168212891, -5.0174407958984375, -2.0872154235839844, 0.8430099487304688, 3.773235321044922, 6.703460693359375, 9.633686065673828, 12.563919067382812, 15.494144439697266, 18.42436981201172, 21.354595184326172, 24.284820556640625, 27.215045928955078, 30.14527130126953, 33.075496673583984, 36.00572204589844, 38.93594741821289, 41.866172790527344, 44.7963981628418, 47.72662353515625, 50.6568489074707, 53.587074279785156, 56.51729965209961, 59.44752502441406, 62.377750396728516, 65.30797576904297, 68.23820495605469, 71.16842651367188, 74.09864807128906, 77.02887725830078, 79.9591064453125, 82.88932800292969, 85.81954956054688, 88.7497787475586, 91.68000793457031, 94.6102294921875, 97.54045104980469, 100.4706802368164, 103.40090942382812, 106.33113098144531]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 13.0, 8.0, 25.0, 24.0, 15.0, 36.0, 29.0, 40.0, 36.0, 46.0, 40.0, 39.0, 61.0, 41.0, 52.0, 44.0, 43.0, 38.0, 28.0, 41.0, 36.0, 35.0, 32.0, 29.0, 27.0, 17.0, 16.0, 13.0, 11.0, 7.0, 6.0, 12.0, 6.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.28271484375, -46.7509880065918, -45.21925735473633, -43.687530517578125, -42.15580368041992, -40.62407684326172, -39.09234619140625, -37.56061935424805, -36.028892517089844, -34.49716567993164, -32.96543502807617, -31.43370819091797, -29.901981353759766, -28.37025260925293, -26.838523864746094, -25.30679702758789, -23.775066375732422, -22.243337631225586, -20.711610794067383, -19.179882049560547, -17.648155212402344, -16.116426467895508, -14.584697723388672, -13.052969932556152, -11.521242141723633, -9.989514350891113, -8.457786560058594, -6.926057815551758, -5.394330024719238, -3.8626022338867188, -2.330873489379883, -0.7991456985473633, 0.7325820922851562, 2.264310121536255, 3.7960381507873535, 5.327766418457031, 6.859494209289551, 8.39122200012207, 9.922950744628906, 11.454678535461426, 12.986406326293945, 14.518134117126465, 16.049861907958984, 17.58159065246582, 19.113319396972656, 20.64504623413086, 22.176774978637695, 23.70850372314453, 25.240230560302734, 26.77195930480957, 28.303686141967773, 29.83541488647461, 31.367141723632812, 32.89887237548828, 34.430599212646484, 35.96232604980469, 37.494056701660156, 39.02578353881836, 40.55751419067383, 42.08924102783203, 43.620967864990234, 45.15269470214844, 46.684425354003906, 48.21615219116211, 49.74787902832031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 11.0, 18.0, 14.0, 31.0, 26.0, 68.0, 72.0, 131.0, 186.0, 287.0, 396.0, 638.0, 1040.0, 1880.0, 3269.0, 5772.0, 11059.0, 22474.0, 46201.0, 98852.0, 211631.0, 311793.0, 173689.0, 81114.0, 38038.0, 18613.0, 9357.0, 4999.0, 2746.0, 1683.0, 955.0, 573.0, 302.0, 220.0, 123.0, 111.0, 62.0, 38.0, 17.0, 18.0, 10.0, 8.0, 8.0, 5.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-25.921875, -25.14501953125, -24.3681640625, -23.59130859375, -22.814453125, -22.03759765625, -21.2607421875, -20.48388671875, -19.70703125, -18.93017578125, -18.1533203125, -17.37646484375, -16.599609375, -15.82275390625, -15.0458984375, -14.26904296875, -13.4921875, -12.71533203125, -11.9384765625, -11.16162109375, -10.384765625, -9.60791015625, -8.8310546875, -8.05419921875, -7.27734375, -6.50048828125, -5.7236328125, -4.94677734375, -4.169921875, -3.39306640625, -2.6162109375, -1.83935546875, -1.0625, -0.28564453125, 0.4912109375, 1.26806640625, 2.044921875, 2.82177734375, 3.5986328125, 4.37548828125, 5.15234375, 5.92919921875, 6.7060546875, 7.48291015625, 8.259765625, 9.03662109375, 9.8134765625, 10.59033203125, 11.3671875, 12.14404296875, 12.9208984375, 13.69775390625, 14.474609375, 15.25146484375, 16.0283203125, 16.80517578125, 17.58203125, 18.35888671875, 19.1357421875, 19.91259765625, 20.689453125, 21.46630859375, 22.2431640625, 23.02001953125, 23.796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 12.0, 18.0, 30.0, 25.0, 29.0, 26.0, 43.0, 43.0, 45.0, 62.0, 67.0, 60.0, 65.0, 55.0, 42.0, 53.0, 48.0, 50.0, 46.0, 25.0, 29.0, 22.0, 18.0, 15.0, 10.0, 5.0, 5.0, 13.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.56817626953125, -5.3863525390625, -5.20452880859375, -5.022705078125, -4.84088134765625, -4.6590576171875, -4.47723388671875, -4.29541015625, -4.11358642578125, -3.9317626953125, -3.74993896484375, -3.568115234375, -3.38629150390625, -3.2044677734375, -3.02264404296875, -2.8408203125, -2.65899658203125, -2.4771728515625, -2.29534912109375, -2.113525390625, -1.93170166015625, -1.7498779296875, -1.56805419921875, -1.38623046875, -1.20440673828125, -1.0225830078125, -0.84075927734375, -0.658935546875, -0.47711181640625, -0.2952880859375, -0.11346435546875, 0.068359375, 0.25018310546875, 0.4320068359375, 0.61383056640625, 0.795654296875, 0.97747802734375, 1.1593017578125, 1.34112548828125, 1.52294921875, 1.70477294921875, 1.8865966796875, 2.06842041015625, 2.250244140625, 2.43206787109375, 2.6138916015625, 2.79571533203125, 2.9775390625, 3.15936279296875, 3.3411865234375, 3.52301025390625, 3.704833984375, 3.88665771484375, 4.0684814453125, 4.25030517578125, 4.43212890625, 4.61395263671875, 4.7957763671875, 4.97760009765625, 5.159423828125, 5.34124755859375, 5.5230712890625, 5.70489501953125, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 21.0, 20.0, 23.0, 34.0, 66.0, 116.0, 159.0, 280.0, 468.0, 914.0, 1515.0, 3059.0, 6371.0, 14825.0, 36784.0, 104342.0, 317935.0, 365965.0, 121827.0, 42519.0, 16689.0, 7309.0, 3364.0, 1673.0, 872.0, 524.0, 312.0, 176.0, 128.0, 92.0, 47.0, 31.0, 23.0, 15.0, 13.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.6875, -37.614990234375, -36.54248046875, -35.469970703125, -34.3974609375, -33.324951171875, -32.25244140625, -31.179931640625, -30.107421875, -29.034912109375, -27.96240234375, -26.889892578125, -25.8173828125, -24.744873046875, -23.67236328125, -22.599853515625, -21.52734375, -20.454833984375, -19.38232421875, -18.309814453125, -17.2373046875, -16.164794921875, -15.09228515625, -14.019775390625, -12.947265625, -11.874755859375, -10.80224609375, -9.729736328125, -8.6572265625, -7.584716796875, -6.51220703125, -5.439697265625, -4.3671875, -3.294677734375, -2.22216796875, -1.149658203125, -0.0771484375, 0.995361328125, 2.06787109375, 3.140380859375, 4.212890625, 5.285400390625, 6.35791015625, 7.430419921875, 8.5029296875, 9.575439453125, 10.64794921875, 11.720458984375, 12.79296875, 13.865478515625, 14.93798828125, 16.010498046875, 17.0830078125, 18.155517578125, 19.22802734375, 20.300537109375, 21.373046875, 22.445556640625, 23.51806640625, 24.590576171875, 25.6630859375, 26.735595703125, 27.80810546875, 28.880615234375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 2.0, 3.0, 16.0, 23.0, 21.0, 21.0, 31.0, 42.0, 45.0, 38.0, 65.0, 54.0, 65.0, 57.0, 40.0, 54.0, 51.0, 49.0, 52.0, 40.0, 26.0, 33.0, 22.0, 24.0, 18.0, 13.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.21875, -32.24267578125, -31.2666015625, -30.29052734375, -29.314453125, -28.33837890625, -27.3623046875, -26.38623046875, -25.41015625, -24.43408203125, -23.4580078125, -22.48193359375, -21.505859375, -20.52978515625, -19.5537109375, -18.57763671875, -17.6015625, -16.62548828125, -15.6494140625, -14.67333984375, -13.697265625, -12.72119140625, -11.7451171875, -10.76904296875, -9.79296875, -8.81689453125, -7.8408203125, -6.86474609375, -5.888671875, -4.91259765625, -3.9365234375, -2.96044921875, -1.984375, -1.00830078125, -0.0322265625, 0.94384765625, 1.919921875, 2.89599609375, 3.8720703125, 4.84814453125, 5.82421875, 6.80029296875, 7.7763671875, 8.75244140625, 9.728515625, 10.70458984375, 11.6806640625, 12.65673828125, 13.6328125, 14.60888671875, 15.5849609375, 16.56103515625, 17.537109375, 18.51318359375, 19.4892578125, 20.46533203125, 21.44140625, 22.41748046875, 23.3935546875, 24.36962890625, 25.345703125, 26.32177734375, 27.2978515625, 28.27392578125, 29.25]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 16.0, 13.0, 13.0, 22.0, 28.0, 46.0, 59.0, 90.0, 138.0, 198.0, 250.0, 486.0, 873.0, 1454.0, 2792.0, 5890.0, 14037.0, 39795.0, 139089.0, 444961.0, 282633.0, 74082.0, 23604.0, 9098.0, 4021.0, 2019.0, 1082.0, 623.0, 349.0, 230.0, 158.0, 98.0, 96.0, 55.0, 43.0, 32.0, 21.0, 18.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-16.828125, -16.314453125, -15.80078125, -15.287109375, -14.7734375, -14.259765625, -13.74609375, -13.232421875, -12.71875, -12.205078125, -11.69140625, -11.177734375, -10.6640625, -10.150390625, -9.63671875, -9.123046875, -8.609375, -8.095703125, -7.58203125, -7.068359375, -6.5546875, -6.041015625, -5.52734375, -5.013671875, -4.5, -3.986328125, -3.47265625, -2.958984375, -2.4453125, -1.931640625, -1.41796875, -0.904296875, -0.390625, 0.123046875, 0.63671875, 1.150390625, 1.6640625, 2.177734375, 2.69140625, 3.205078125, 3.71875, 4.232421875, 4.74609375, 5.259765625, 5.7734375, 6.287109375, 6.80078125, 7.314453125, 7.828125, 8.341796875, 8.85546875, 9.369140625, 9.8828125, 10.396484375, 10.91015625, 11.423828125, 11.9375, 12.451171875, 12.96484375, 13.478515625, 13.9921875, 14.505859375, 15.01953125, 15.533203125, 16.046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 0.0, 5.0, 6.0, 7.0, 7.0, 6.0, 19.0, 13.0, 21.0, 33.0, 39.0, 67.0, 111.0, 111.0, 125.0, 104.0, 98.0, 66.0, 42.0, 34.0, 20.0, 18.0, 10.0, 9.0, 6.0, 4.0, 1.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030345916748046875, -0.002905339002609253, -0.0027760863304138184, -0.002646833658218384, -0.0025175809860229492, -0.0023883283138275146, -0.00225907564163208, -0.0021298229694366455, -0.002000570297241211, -0.0018713176250457764, -0.0017420649528503418, -0.0016128122806549072, -0.0014835596084594727, -0.001354306936264038, -0.0012250542640686035, -0.001095801591873169, -0.0009665489196777344, -0.0008372962474822998, -0.0007080435752868652, -0.0005787909030914307, -0.0004495382308959961, -0.0003202855587005615, -0.00019103288650512695, -6.178021430969238e-05, 6.747245788574219e-05, 0.00019672513008117676, 0.00032597780227661133, 0.0004552304744720459, 0.0005844831466674805, 0.000713735818862915, 0.0008429884910583496, 0.0009722411632537842, 0.0011014938354492188, 0.0012307465076446533, 0.0013599991798400879, 0.0014892518520355225, 0.001618504524230957, 0.0017477571964263916, 0.0018770098686218262, 0.0020062625408172607, 0.0021355152130126953, 0.00226476788520813, 0.0023940205574035645, 0.002523273229598999, 0.0026525259017944336, 0.002781778573989868, 0.0029110312461853027, 0.0030402839183807373, 0.003169536590576172, 0.0032987892627716064, 0.003428041934967041, 0.0035572946071624756, 0.00368654727935791, 0.0038157999515533447, 0.003945052623748779, 0.004074305295944214, 0.0042035579681396484, 0.004332810640335083, 0.004462063312530518, 0.004591315984725952, 0.004720568656921387, 0.004849821329116821, 0.004979074001312256, 0.00510832667350769, 0.005237579345703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 15.0, 18.0, 32.0, 29.0, 41.0, 63.0, 97.0, 148.0, 219.0, 304.0, 566.0, 895.0, 1642.0, 3455.0, 8130.0, 24018.0, 96368.0, 453432.0, 353777.0, 72707.0, 19234.0, 6634.0, 2914.0, 1514.0, 822.0, 513.0, 280.0, 212.0, 115.0, 94.0, 62.0, 56.0, 39.0, 15.0, 12.0, 10.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.24951171875, -16.6083984375, -15.96728515625, -15.326171875, -14.68505859375, -14.0439453125, -13.40283203125, -12.76171875, -12.12060546875, -11.4794921875, -10.83837890625, -10.197265625, -9.55615234375, -8.9150390625, -8.27392578125, -7.6328125, -6.99169921875, -6.3505859375, -5.70947265625, -5.068359375, -4.42724609375, -3.7861328125, -3.14501953125, -2.50390625, -1.86279296875, -1.2216796875, -0.58056640625, 0.060546875, 0.70166015625, 1.3427734375, 1.98388671875, 2.625, 3.26611328125, 3.9072265625, 4.54833984375, 5.189453125, 5.83056640625, 6.4716796875, 7.11279296875, 7.75390625, 8.39501953125, 9.0361328125, 9.67724609375, 10.318359375, 10.95947265625, 11.6005859375, 12.24169921875, 12.8828125, 13.52392578125, 14.1650390625, 14.80615234375, 15.447265625, 16.08837890625, 16.7294921875, 17.37060546875, 18.01171875, 18.65283203125, 19.2939453125, 19.93505859375, 20.576171875, 21.21728515625, 21.8583984375, 22.49951171875, 23.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 4.0, 15.0, 29.0, 36.0, 42.0, 63.0, 101.0, 119.0, 128.0, 113.0, 107.0, 85.0, 45.0, 29.0, 21.0, 17.0, 13.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.90087890625, -15.2548828125, -14.60888671875, -13.962890625, -13.31689453125, -12.6708984375, -12.02490234375, -11.37890625, -10.73291015625, -10.0869140625, -9.44091796875, -8.794921875, -8.14892578125, -7.5029296875, -6.85693359375, -6.2109375, -5.56494140625, -4.9189453125, -4.27294921875, -3.626953125, -2.98095703125, -2.3349609375, -1.68896484375, -1.04296875, -0.39697265625, 0.2490234375, 0.89501953125, 1.541015625, 2.18701171875, 2.8330078125, 3.47900390625, 4.125, 4.77099609375, 5.4169921875, 6.06298828125, 6.708984375, 7.35498046875, 8.0009765625, 8.64697265625, 9.29296875, 9.93896484375, 10.5849609375, 11.23095703125, 11.876953125, 12.52294921875, 13.1689453125, 13.81494140625, 14.4609375, 15.10693359375, 15.7529296875, 16.39892578125, 17.044921875, 17.69091796875, 18.3369140625, 18.98291015625, 19.62890625, 20.27490234375, 20.9208984375, 21.56689453125, 22.212890625, 22.85888671875, 23.5048828125, 24.15087890625, 24.796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 26.0, 49.0, 125.0, 311.0, 293.0, 134.0, 40.0, 21.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.3655700683594, -411.714111328125, -391.0626220703125, -370.4111328125, -349.7596740722656, -329.10821533203125, -308.45672607421875, -287.80523681640625, -267.1537780761719, -246.50230407714844, -225.850830078125, -205.19935607910156, -184.54788208007812, -163.8964080810547, -143.24493408203125, -122.59346008300781, -101.94198608398438, -81.29051208496094, -60.6390380859375, -39.98756408691406, -19.336090087890625, 1.3153839111328125, 21.96685791015625, 42.61833190917969, 63.269805908203125, 83.92127990722656, 104.57275390625, 125.22422790527344, 145.87570190429688, 166.5271759033203, 187.17864990234375, 207.8301239013672, 228.4815673828125, 249.13304138183594, 269.7845153808594, 290.43597412109375, 311.08746337890625, 331.73895263671875, 352.3904113769531, 373.0418701171875, 393.693359375, 414.3448486328125, 434.9963073730469, 455.64776611328125, 476.29925537109375, 496.95074462890625, 517.6021728515625, 538.253662109375, 558.9051513671875, 579.556640625, 600.2081298828125, 620.8595581054688, 641.5110473632812, 662.1625366210938, 682.81396484375, 703.4654541015625, 724.116943359375, 744.7684326171875, 765.419921875, 786.0713500976562, 806.7228393554688, 827.3743286132812, 848.0257568359375, 868.67724609375, 889.3287353515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 1.0, 7.0, 14.0, 8.0, 10.0, 18.0, 22.0, 38.0, 44.0, 43.0, 45.0, 51.0, 58.0, 72.0, 66.0, 69.0, 49.0, 64.0, 40.0, 54.0, 36.0, 40.0, 33.0, 18.0, 25.0, 19.0, 16.0, 12.0, 9.0, 4.0, 11.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.98704528808594, -127.05823516845703, -120.12942504882812, -113.20062255859375, -106.27181243896484, -99.34300231933594, -92.41419982910156, -85.48538970947266, -78.55657958984375, -71.62776947021484, -64.69895935058594, -57.77015686035156, -50.841346740722656, -43.91253662109375, -36.98373031616211, -30.05492401123047, -23.126113891601562, -16.19730567932129, -9.268497467041016, -2.339689254760742, 4.589118957519531, 11.517929077148438, 18.446735382080078, 25.37554168701172, 32.304351806640625, 39.23316192626953, 46.16196823120117, 53.09077453613281, 60.01958465576172, 66.94839477539062, 73.877197265625, 80.8060073852539, 87.73483276367188, 94.66364288330078, 101.59245300292969, 108.52125549316406, 115.45006561279297, 122.37887573242188, 129.30767822265625, 136.23648071289062, 143.16529846191406, 150.09410095214844, 157.02291870117188, 163.95172119140625, 170.88052368164062, 177.80934143066406, 184.73814392089844, 191.66696166992188, 198.59576416015625, 205.52456665039062, 212.45338439941406, 219.38218688964844, 226.31100463867188, 233.23980712890625, 240.16860961914062, 247.097412109375, 254.02622985839844, 260.9550476074219, 267.88385009765625, 274.8126525878906, 281.741455078125, 288.6702880859375, 295.5990905761719, 302.52789306640625, 309.4566955566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 13.0, 9.0, 8.0, 16.0, 30.0, 56.0, 39.0, 48.0, 99.0, 153.0, 229.0, 360.0, 586.0, 962.0, 1797.0, 3294.0, 6100.0, 12796.0, 29957.0, 94175.0, 2820837.0, 1077015.0, 89594.0, 29348.0, 12570.0, 6040.0, 3262.0, 1889.0, 1058.0, 637.0, 420.0, 289.0, 168.0, 128.0, 90.0, 56.0, 44.0, 24.0, 20.0, 18.0, 13.0, 7.0, 4.0, 9.0, 2.0, 4.0], "bins": [-46.53125, -45.337646484375, -44.14404296875, -42.950439453125, -41.7568359375, -40.563232421875, -39.36962890625, -38.176025390625, -36.982421875, -35.788818359375, -34.59521484375, -33.401611328125, -32.2080078125, -31.014404296875, -29.82080078125, -28.627197265625, -27.43359375, -26.239990234375, -25.04638671875, -23.852783203125, -22.6591796875, -21.465576171875, -20.27197265625, -19.078369140625, -17.884765625, -16.691162109375, -15.49755859375, -14.303955078125, -13.1103515625, -11.916748046875, -10.72314453125, -9.529541015625, -8.3359375, -7.142333984375, -5.94873046875, -4.755126953125, -3.5615234375, -2.367919921875, -1.17431640625, 0.019287109375, 1.212890625, 2.406494140625, 3.60009765625, 4.793701171875, 5.9873046875, 7.180908203125, 8.37451171875, 9.568115234375, 10.76171875, 11.955322265625, 13.14892578125, 14.342529296875, 15.5361328125, 16.729736328125, 17.92333984375, 19.116943359375, 20.310546875, 21.504150390625, 22.69775390625, 23.891357421875, 25.0849609375, 26.278564453125, 27.47216796875, 28.665771484375, 29.859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 11.0, 25.0, 28.0, 30.0, 54.0, 46.0, 61.0, 62.0, 82.0, 82.0, 86.0, 69.0, 63.0, 65.0, 50.0, 50.0, 33.0, 25.0, 19.0, 11.0, 7.0, 10.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.678955078125, -6.41259765625, -6.146240234375, -5.8798828125, -5.613525390625, -5.34716796875, -5.080810546875, -4.814453125, -4.548095703125, -4.28173828125, -4.015380859375, -3.7490234375, -3.482666015625, -3.21630859375, -2.949951171875, -2.68359375, -2.417236328125, -2.15087890625, -1.884521484375, -1.6181640625, -1.351806640625, -1.08544921875, -0.819091796875, -0.552734375, -0.286376953125, -0.02001953125, 0.246337890625, 0.5126953125, 0.779052734375, 1.04541015625, 1.311767578125, 1.578125, 1.844482421875, 2.11083984375, 2.377197265625, 2.6435546875, 2.909912109375, 3.17626953125, 3.442626953125, 3.708984375, 3.975341796875, 4.24169921875, 4.508056640625, 4.7744140625, 5.040771484375, 5.30712890625, 5.573486328125, 5.83984375, 6.106201171875, 6.37255859375, 6.638916015625, 6.9052734375, 7.171630859375, 7.43798828125, 7.704345703125, 7.970703125, 8.237060546875, 8.50341796875, 8.769775390625, 9.0361328125, 9.302490234375, 9.56884765625, 9.835205078125, 10.1015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 12.0, 13.0, 7.0, 15.0, 36.0, 46.0, 60.0, 102.0, 142.0, 217.0, 386.0, 625.0, 1217.0, 2132.0, 4372.0, 9660.0, 22993.0, 67920.0, 319793.0, 3439845.0, 233334.0, 55379.0, 19674.0, 8271.0, 3716.0, 1841.0, 1009.0, 509.0, 306.0, 202.0, 141.0, 90.0, 55.0, 47.0, 34.0, 25.0, 19.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.96875, -45.52001953125, -44.0712890625, -42.62255859375, -41.173828125, -39.72509765625, -38.2763671875, -36.82763671875, -35.37890625, -33.93017578125, -32.4814453125, -31.03271484375, -29.583984375, -28.13525390625, -26.6865234375, -25.23779296875, -23.7890625, -22.34033203125, -20.8916015625, -19.44287109375, -17.994140625, -16.54541015625, -15.0966796875, -13.64794921875, -12.19921875, -10.75048828125, -9.3017578125, -7.85302734375, -6.404296875, -4.95556640625, -3.5068359375, -2.05810546875, -0.609375, 0.83935546875, 2.2880859375, 3.73681640625, 5.185546875, 6.63427734375, 8.0830078125, 9.53173828125, 10.98046875, 12.42919921875, 13.8779296875, 15.32666015625, 16.775390625, 18.22412109375, 19.6728515625, 21.12158203125, 22.5703125, 24.01904296875, 25.4677734375, 26.91650390625, 28.365234375, 29.81396484375, 31.2626953125, 32.71142578125, 34.16015625, 35.60888671875, 37.0576171875, 38.50634765625, 39.955078125, 41.40380859375, 42.8525390625, 44.30126953125, 45.75]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 4.0, 3.0, 5.0, 10.0, 12.0, 13.0, 16.0, 21.0, 33.0, 49.0, 76.0, 98.0, 168.0, 343.0, 2202.0, 470.0, 194.0, 106.0, 71.0, 54.0, 35.0, 23.0, 20.0, 12.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4375, -14.94921875, -14.4609375, -13.97265625, -13.484375, -12.99609375, -12.5078125, -12.01953125, -11.53125, -11.04296875, -10.5546875, -10.06640625, -9.578125, -9.08984375, -8.6015625, -8.11328125, -7.625, -7.13671875, -6.6484375, -6.16015625, -5.671875, -5.18359375, -4.6953125, -4.20703125, -3.71875, -3.23046875, -2.7421875, -2.25390625, -1.765625, -1.27734375, -0.7890625, -0.30078125, 0.1875, 0.67578125, 1.1640625, 1.65234375, 2.140625, 2.62890625, 3.1171875, 3.60546875, 4.09375, 4.58203125, 5.0703125, 5.55859375, 6.046875, 6.53515625, 7.0234375, 7.51171875, 8.0, 8.48828125, 8.9765625, 9.46484375, 9.953125, 10.44140625, 10.9296875, 11.41796875, 11.90625, 12.39453125, 12.8828125, 13.37109375, 13.859375, 14.34765625, 14.8359375, 15.32421875, 15.8125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 17.0, 29.0, 52.0, 83.0, 105.0, 144.0, 154.0, 140.0, 94.0, 69.0, 45.0, 10.0, 20.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-96.26805114746094, -93.10364532470703, -89.9392318725586, -86.77482604980469, -83.61042022705078, -80.44601440429688, -77.28160095214844, -74.11719512939453, -70.95278930664062, -67.78838348388672, -64.62397003173828, -61.459564208984375, -58.29515838623047, -55.1307487487793, -51.966339111328125, -48.80193328857422, -45.63751983642578, -42.47311019897461, -39.3087043762207, -36.14429473876953, -32.979888916015625, -29.815479278564453, -26.65106964111328, -23.486661911010742, -20.322254180908203, -17.157846450805664, -13.993437767028809, -10.829029083251953, -7.664621353149414, -4.500213623046875, -1.3358039855957031, 1.828603744506836, 4.993019104003906, 8.157426834106445, 11.3218355178833, 14.486244201660156, 17.650651931762695, 20.815059661865234, 23.979469299316406, 27.143877029418945, 30.308284759521484, 33.472694396972656, 36.63710021972656, 39.801509857177734, 42.965919494628906, 46.13032531738281, 49.294734954833984, 52.459144592285156, 55.62355041503906, 58.787960052490234, 61.95236587524414, 65.11677551269531, 68.28118133544922, 71.44558715820312, 74.61000061035156, 77.77440643310547, 80.93881225585938, 84.10321807861328, 87.26763153076172, 90.43203735351562, 93.59644317626953, 96.76084899902344, 99.92526245117188, 103.08966827392578, 106.25408172607422]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 10.0, 6.0, 16.0, 10.0, 15.0, 19.0, 12.0, 28.0, 37.0, 30.0, 33.0, 44.0, 44.0, 52.0, 57.0, 63.0, 50.0, 65.0, 58.0, 43.0, 51.0, 50.0, 44.0, 32.0, 24.0, 35.0, 13.0, 20.0, 17.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.17987060546875, -60.27134704589844, -58.36282730102539, -56.45430374145508, -54.545780181884766, -52.63726043701172, -50.728736877441406, -48.820213317871094, -46.91168975830078, -45.00316619873047, -43.09464645385742, -41.18612289428711, -39.2775993347168, -37.36907958984375, -35.46055603027344, -33.552032470703125, -31.643512725830078, -29.7349910736084, -27.826467514038086, -25.917945861816406, -24.009422302246094, -22.100900650024414, -20.192378997802734, -18.283855438232422, -16.375333786010742, -14.466811180114746, -12.55828857421875, -10.64976692199707, -8.741244316101074, -6.832721710205078, -4.924200057983398, -3.0156774520874023, -1.1071548461914062, 0.8013675212860107, 2.7098898887634277, 4.618412017822266, 6.526934623718262, 8.435457229614258, 10.343978881835938, 12.252501487731934, 14.16102409362793, 16.06954574584961, 17.978069305419922, 19.8865909576416, 21.79511260986328, 23.703636169433594, 25.612157821655273, 27.520679473876953, 29.429203033447266, 31.337724685668945, 33.246246337890625, 35.15476989746094, 37.06329345703125, 38.97181701660156, 40.88033676147461, 42.78886032104492, 44.69738006591797, 46.60590362548828, 48.51442337036133, 50.42294692993164, 52.33147048950195, 54.239990234375, 56.14851379394531, 58.057037353515625, 59.96556091308594]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 24.0, 34.0, 35.0, 56.0, 86.0, 119.0, 207.0, 282.0, 462.0, 762.0, 1261.0, 2208.0, 3913.0, 7131.0, 13323.0, 26350.0, 54431.0, 113010.0, 240900.0, 295633.0, 147638.0, 69736.0, 33691.0, 16960.0, 8930.0, 4622.0, 2736.0, 1549.0, 922.0, 510.0, 365.0, 202.0, 165.0, 97.0, 51.0, 40.0, 34.0, 16.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.265625, -23.433837890625, -22.60205078125, -21.770263671875, -20.9384765625, -20.106689453125, -19.27490234375, -18.443115234375, -17.611328125, -16.779541015625, -15.94775390625, -15.115966796875, -14.2841796875, -13.452392578125, -12.62060546875, -11.788818359375, -10.95703125, -10.125244140625, -9.29345703125, -8.461669921875, -7.6298828125, -6.798095703125, -5.96630859375, -5.134521484375, -4.302734375, -3.470947265625, -2.63916015625, -1.807373046875, -0.9755859375, -0.143798828125, 0.68798828125, 1.519775390625, 2.3515625, 3.183349609375, 4.01513671875, 4.846923828125, 5.6787109375, 6.510498046875, 7.34228515625, 8.174072265625, 9.005859375, 9.837646484375, 10.66943359375, 11.501220703125, 12.3330078125, 13.164794921875, 13.99658203125, 14.828369140625, 15.66015625, 16.491943359375, 17.32373046875, 18.155517578125, 18.9873046875, 19.819091796875, 20.65087890625, 21.482666015625, 22.314453125, 23.146240234375, 23.97802734375, 24.809814453125, 25.6416015625, 26.473388671875, 27.30517578125, 28.136962890625, 28.96875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 8.0, 6.0, 17.0, 18.0, 16.0, 22.0, 35.0, 36.0, 34.0, 33.0, 42.0, 43.0, 52.0, 51.0, 46.0, 52.0, 50.0, 47.0, 51.0, 52.0, 45.0, 39.0, 34.0, 28.0, 29.0, 18.0, 19.0, 16.0, 9.0, 9.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.48828125, -6.29949951171875, -6.1107177734375, -5.92193603515625, -5.733154296875, -5.54437255859375, -5.3555908203125, -5.16680908203125, -4.97802734375, -4.78924560546875, -4.6004638671875, -4.41168212890625, -4.222900390625, -4.03411865234375, -3.8453369140625, -3.65655517578125, -3.4677734375, -3.27899169921875, -3.0902099609375, -2.90142822265625, -2.712646484375, -2.52386474609375, -2.3350830078125, -2.14630126953125, -1.95751953125, -1.76873779296875, -1.5799560546875, -1.39117431640625, -1.202392578125, -1.01361083984375, -0.8248291015625, -0.63604736328125, -0.447265625, -0.25848388671875, -0.0697021484375, 0.11907958984375, 0.307861328125, 0.49664306640625, 0.6854248046875, 0.87420654296875, 1.06298828125, 1.25177001953125, 1.4405517578125, 1.62933349609375, 1.818115234375, 2.00689697265625, 2.1956787109375, 2.38446044921875, 2.5732421875, 2.76202392578125, 2.9508056640625, 3.13958740234375, 3.328369140625, 3.51715087890625, 3.7059326171875, 3.89471435546875, 4.08349609375, 4.27227783203125, 4.4610595703125, 4.64984130859375, 4.838623046875, 5.02740478515625, 5.2161865234375, 5.40496826171875, 5.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 7.0, 12.0, 25.0, 18.0, 42.0, 53.0, 80.0, 99.0, 151.0, 278.0, 413.0, 659.0, 1155.0, 2141.0, 4237.0, 9061.0, 21225.0, 52775.0, 148034.0, 384038.0, 266972.0, 93917.0, 34946.0, 14701.0, 6347.0, 3151.0, 1620.0, 910.0, 524.0, 325.0, 219.0, 126.0, 92.0, 64.0, 49.0, 18.0, 22.0, 17.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.09375, -30.145263671875, -29.19677734375, -28.248291015625, -27.2998046875, -26.351318359375, -25.40283203125, -24.454345703125, -23.505859375, -22.557373046875, -21.60888671875, -20.660400390625, -19.7119140625, -18.763427734375, -17.81494140625, -16.866455078125, -15.91796875, -14.969482421875, -14.02099609375, -13.072509765625, -12.1240234375, -11.175537109375, -10.22705078125, -9.278564453125, -8.330078125, -7.381591796875, -6.43310546875, -5.484619140625, -4.5361328125, -3.587646484375, -2.63916015625, -1.690673828125, -0.7421875, 0.206298828125, 1.15478515625, 2.103271484375, 3.0517578125, 4.000244140625, 4.94873046875, 5.897216796875, 6.845703125, 7.794189453125, 8.74267578125, 9.691162109375, 10.6396484375, 11.588134765625, 12.53662109375, 13.485107421875, 14.43359375, 15.382080078125, 16.33056640625, 17.279052734375, 18.2275390625, 19.176025390625, 20.12451171875, 21.072998046875, 22.021484375, 22.969970703125, 23.91845703125, 24.866943359375, 25.8154296875, 26.763916015625, 27.71240234375, 28.660888671875, 29.609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 3.0, 11.0, 10.0, 16.0, 8.0, 17.0, 31.0, 24.0, 25.0, 29.0, 26.0, 48.0, 38.0, 56.0, 51.0, 65.0, 49.0, 47.0, 64.0, 65.0, 38.0, 47.0, 36.0, 41.0, 33.0, 21.0, 23.0, 24.0, 20.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.386474609375, -31.39794921875, -30.409423828125, -29.4208984375, -28.432373046875, -27.44384765625, -26.455322265625, -25.466796875, -24.478271484375, -23.48974609375, -22.501220703125, -21.5126953125, -20.524169921875, -19.53564453125, -18.547119140625, -17.55859375, -16.570068359375, -15.58154296875, -14.593017578125, -13.6044921875, -12.615966796875, -11.62744140625, -10.638916015625, -9.650390625, -8.661865234375, -7.67333984375, -6.684814453125, -5.6962890625, -4.707763671875, -3.71923828125, -2.730712890625, -1.7421875, -0.753662109375, 0.23486328125, 1.223388671875, 2.2119140625, 3.200439453125, 4.18896484375, 5.177490234375, 6.166015625, 7.154541015625, 8.14306640625, 9.131591796875, 10.1201171875, 11.108642578125, 12.09716796875, 13.085693359375, 14.07421875, 15.062744140625, 16.05126953125, 17.039794921875, 18.0283203125, 19.016845703125, 20.00537109375, 20.993896484375, 21.982421875, 22.970947265625, 23.95947265625, 24.947998046875, 25.9365234375, 26.925048828125, 27.91357421875, 28.902099609375, 29.890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 26.0, 34.0, 52.0, 69.0, 104.0, 187.0, 354.0, 490.0, 888.0, 1655.0, 3198.0, 7489.0, 22159.0, 116825.0, 647692.0, 198656.0, 30890.0, 9331.0, 4007.0, 1897.0, 1025.0, 564.0, 336.0, 221.0, 136.0, 85.0, 55.0, 36.0, 22.0, 18.0, 8.0, 9.0, 8.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.203125, -26.39404296875, -25.5849609375, -24.77587890625, -23.966796875, -23.15771484375, -22.3486328125, -21.53955078125, -20.73046875, -19.92138671875, -19.1123046875, -18.30322265625, -17.494140625, -16.68505859375, -15.8759765625, -15.06689453125, -14.2578125, -13.44873046875, -12.6396484375, -11.83056640625, -11.021484375, -10.21240234375, -9.4033203125, -8.59423828125, -7.78515625, -6.97607421875, -6.1669921875, -5.35791015625, -4.548828125, -3.73974609375, -2.9306640625, -2.12158203125, -1.3125, -0.50341796875, 0.3056640625, 1.11474609375, 1.923828125, 2.73291015625, 3.5419921875, 4.35107421875, 5.16015625, 5.96923828125, 6.7783203125, 7.58740234375, 8.396484375, 9.20556640625, 10.0146484375, 10.82373046875, 11.6328125, 12.44189453125, 13.2509765625, 14.06005859375, 14.869140625, 15.67822265625, 16.4873046875, 17.29638671875, 18.10546875, 18.91455078125, 19.7236328125, 20.53271484375, 21.341796875, 22.15087890625, 22.9599609375, 23.76904296875, 24.578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 39.0, 60.0, 140.0, 235.0, 204.0, 90.0, 61.0, 40.0, 18.0, 7.0, 12.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007381439208984375, -0.00712507963180542, -0.006868720054626465, -0.00661236047744751, -0.006356000900268555, -0.0060996413230896, -0.0058432817459106445, -0.0055869221687316895, -0.005330562591552734, -0.005074203014373779, -0.004817843437194824, -0.004561483860015869, -0.004305124282836914, -0.004048764705657959, -0.003792405128479004, -0.003536045551300049, -0.0032796859741210938, -0.0030233263969421387, -0.0027669668197631836, -0.0025106072425842285, -0.0022542476654052734, -0.0019978880882263184, -0.0017415285110473633, -0.0014851689338684082, -0.0012288093566894531, -0.000972449779510498, -0.000716090202331543, -0.0004597306251525879, -0.0002033710479736328, 5.2988529205322266e-05, 0.00030934810638427734, 0.0005657076835632324, 0.0008220672607421875, 0.0010784268379211426, 0.0013347864151000977, 0.0015911459922790527, 0.0018475055694580078, 0.002103865146636963, 0.002360224723815918, 0.002616584300994873, 0.002872943878173828, 0.003129303455352783, 0.0033856630325317383, 0.0036420226097106934, 0.0038983821868896484, 0.0041547417640686035, 0.004411101341247559, 0.004667460918426514, 0.004923820495605469, 0.005180180072784424, 0.005436539649963379, 0.005692899227142334, 0.005949258804321289, 0.006205618381500244, 0.006461977958679199, 0.006718337535858154, 0.006974697113037109, 0.0072310566902160645, 0.0074874162673950195, 0.007743775844573975, 0.00800013542175293, 0.008256494998931885, 0.00851285457611084, 0.008769214153289795, 0.00902557373046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 11.0, 11.0, 16.0, 24.0, 23.0, 42.0, 68.0, 105.0, 154.0, 208.0, 345.0, 525.0, 919.0, 1603.0, 3137.0, 6666.0, 17359.0, 74089.0, 564272.0, 312702.0, 43067.0, 12141.0, 5102.0, 2544.0, 1271.0, 805.0, 445.0, 286.0, 193.0, 127.0, 91.0, 50.0, 44.0, 34.0, 17.0, 15.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.228759765625, -24.41064453125, -23.592529296875, -22.7744140625, -21.956298828125, -21.13818359375, -20.320068359375, -19.501953125, -18.683837890625, -17.86572265625, -17.047607421875, -16.2294921875, -15.411376953125, -14.59326171875, -13.775146484375, -12.95703125, -12.138916015625, -11.32080078125, -10.502685546875, -9.6845703125, -8.866455078125, -8.04833984375, -7.230224609375, -6.412109375, -5.593994140625, -4.77587890625, -3.957763671875, -3.1396484375, -2.321533203125, -1.50341796875, -0.685302734375, 0.1328125, 0.950927734375, 1.76904296875, 2.587158203125, 3.4052734375, 4.223388671875, 5.04150390625, 5.859619140625, 6.677734375, 7.495849609375, 8.31396484375, 9.132080078125, 9.9501953125, 10.768310546875, 11.58642578125, 12.404541015625, 13.22265625, 14.040771484375, 14.85888671875, 15.677001953125, 16.4951171875, 17.313232421875, 18.13134765625, 18.949462890625, 19.767578125, 20.585693359375, 21.40380859375, 22.221923828125, 23.0400390625, 23.858154296875, 24.67626953125, 25.494384765625, 26.3125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 6.0, 17.0, 11.0, 39.0, 60.0, 60.0, 100.0, 131.0, 147.0, 126.0, 99.0, 53.0, 50.0, 23.0, 19.0, 10.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.96875, -24.279296875, -23.58984375, -22.900390625, -22.2109375, -21.521484375, -20.83203125, -20.142578125, -19.453125, -18.763671875, -18.07421875, -17.384765625, -16.6953125, -16.005859375, -15.31640625, -14.626953125, -13.9375, -13.248046875, -12.55859375, -11.869140625, -11.1796875, -10.490234375, -9.80078125, -9.111328125, -8.421875, -7.732421875, -7.04296875, -6.353515625, -5.6640625, -4.974609375, -4.28515625, -3.595703125, -2.90625, -2.216796875, -1.52734375, -0.837890625, -0.1484375, 0.541015625, 1.23046875, 1.919921875, 2.609375, 3.298828125, 3.98828125, 4.677734375, 5.3671875, 6.056640625, 6.74609375, 7.435546875, 8.125, 8.814453125, 9.50390625, 10.193359375, 10.8828125, 11.572265625, 12.26171875, 12.951171875, 13.640625, 14.330078125, 15.01953125, 15.708984375, 16.3984375, 17.087890625, 17.77734375, 18.466796875, 19.15625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 15.0, 24.0, 86.0, 172.0, 295.0, 228.0, 110.0, 35.0, 22.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-733.7855224609375, -717.6943969726562, -701.603271484375, -685.5120849609375, -669.4209594726562, -653.329833984375, -637.2387084960938, -621.1475830078125, -605.056396484375, -588.9652709960938, -572.8741455078125, -556.782958984375, -540.6918334960938, -524.6007080078125, -508.50958251953125, -492.4184265136719, -476.3273010253906, -460.2361755371094, -444.14501953125, -428.05389404296875, -411.9627380371094, -395.8716125488281, -379.78045654296875, -363.6893310546875, -347.59820556640625, -331.507080078125, -315.4159240722656, -299.3247985839844, -283.233642578125, -267.14251708984375, -251.05137634277344, -234.96023559570312, -218.86907958984375, -202.77793884277344, -186.68679809570312, -170.59567260742188, -154.5045166015625, -138.41339111328125, -122.32225036621094, -106.23110961914062, -90.13996887207031, -74.048828125, -57.95769119262695, -41.866554260253906, -25.775413513183594, -9.684272766113281, 6.4068603515625, 22.498001098632812, 38.589141845703125, 54.68028259277344, 70.77142333984375, 86.86255645751953, 102.95369720458984, 119.04483795166016, 135.13597106933594, 151.22711181640625, 167.31825256347656, 183.40939331054688, 199.5005340576172, 215.5916748046875, 231.68280029296875, 247.77395629882812, 263.8650817871094, 279.95623779296875, 296.04736328125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 5.0, 16.0, 8.0, 18.0, 20.0, 28.0, 28.0, 19.0, 22.0, 29.0, 40.0, 46.0, 41.0, 43.0, 44.0, 34.0, 34.0, 37.0, 42.0, 45.0, 49.0, 35.0, 33.0, 27.0, 26.0, 30.0, 20.0, 24.0, 21.0, 15.0, 8.0, 15.0, 15.0, 11.0, 14.0, 7.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.99783325195312, -132.920654296875, -128.84347534179688, -124.76631164550781, -120.68913269042969, -116.61195373535156, -112.53478240966797, -108.45761108398438, -104.38043212890625, -100.30325317382812, -96.22608184814453, -92.14891052246094, -88.07173156738281, -83.99455261230469, -79.9173812866211, -75.8402099609375, -71.76303100585938, -67.68585205078125, -63.608680725097656, -59.5315055847168, -55.45433044433594, -51.37715530395508, -47.29998016357422, -43.22280502319336, -39.1456298828125, -35.06845474243164, -30.99127960205078, -26.914104461669922, -22.836929321289062, -18.759754180908203, -14.682579040527344, -10.605403900146484, -6.528221130371094, -2.4510459899902344, 1.626129150390625, 5.703304290771484, 9.780479431152344, 13.857654571533203, 17.934829711914062, 22.012004852294922, 26.08917999267578, 30.16635513305664, 34.2435302734375, 38.32070541381836, 42.39788055419922, 46.47505569458008, 50.55223083496094, 54.6294059753418, 58.706581115722656, 62.783756256103516, 66.86093139648438, 70.9381103515625, 75.0152816772461, 79.09245300292969, 83.16963195800781, 87.24681091308594, 91.32398223876953, 95.40115356445312, 99.47833251953125, 103.55551147460938, 107.63268280029297, 111.70985412597656, 115.78703308105469, 119.86421203613281, 123.9413833618164]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 20.0, 33.0, 45.0, 53.0, 82.0, 211.0, 344.0, 609.0, 1177.0, 2760.0, 6638.0, 17387.0, 55073.0, 287098.0, 3556693.0, 197355.0, 44065.0, 14474.0, 5596.0, 2320.0, 1056.0, 513.0, 282.0, 149.0, 85.0, 40.0, 20.0, 24.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.53125, -52.01953125, -50.5078125, -48.99609375, -47.484375, -45.97265625, -44.4609375, -42.94921875, -41.4375, -39.92578125, -38.4140625, -36.90234375, -35.390625, -33.87890625, -32.3671875, -30.85546875, -29.34375, -27.83203125, -26.3203125, -24.80859375, -23.296875, -21.78515625, -20.2734375, -18.76171875, -17.25, -15.73828125, -14.2265625, -12.71484375, -11.203125, -9.69140625, -8.1796875, -6.66796875, -5.15625, -3.64453125, -2.1328125, -0.62109375, 0.890625, 2.40234375, 3.9140625, 5.42578125, 6.9375, 8.44921875, 9.9609375, 11.47265625, 12.984375, 14.49609375, 16.0078125, 17.51953125, 19.03125, 20.54296875, 22.0546875, 23.56640625, 25.078125, 26.58984375, 28.1015625, 29.61328125, 31.125, 32.63671875, 34.1484375, 35.66015625, 37.171875, 38.68359375, 40.1953125, 41.70703125, 43.21875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 9.0, 16.0, 17.0, 21.0, 25.0, 37.0, 34.0, 32.0, 53.0, 53.0, 51.0, 51.0, 70.0, 58.0, 57.0, 56.0, 55.0, 51.0, 45.0, 33.0, 36.0, 29.0, 15.0, 17.0, 13.0, 14.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.45703125, -7.24420166015625, -7.0313720703125, -6.81854248046875, -6.605712890625, -6.39288330078125, -6.1800537109375, -5.96722412109375, -5.75439453125, -5.54156494140625, -5.3287353515625, -5.11590576171875, -4.903076171875, -4.69024658203125, -4.4774169921875, -4.26458740234375, -4.0517578125, -3.83892822265625, -3.6260986328125, -3.41326904296875, -3.200439453125, -2.98760986328125, -2.7747802734375, -2.56195068359375, -2.34912109375, -2.13629150390625, -1.9234619140625, -1.71063232421875, -1.497802734375, -1.28497314453125, -1.0721435546875, -0.85931396484375, -0.646484375, -0.43365478515625, -0.2208251953125, -0.00799560546875, 0.204833984375, 0.41766357421875, 0.6304931640625, 0.84332275390625, 1.05615234375, 1.26898193359375, 1.4818115234375, 1.69464111328125, 1.907470703125, 2.12030029296875, 2.3331298828125, 2.54595947265625, 2.7587890625, 2.97161865234375, 3.1844482421875, 3.39727783203125, 3.610107421875, 3.82293701171875, 4.0357666015625, 4.24859619140625, 4.46142578125, 4.67425537109375, 4.8870849609375, 5.09991455078125, 5.312744140625, 5.52557373046875, 5.7384033203125, 5.95123291015625, 6.1640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 4.0, 7.0, 10.0, 8.0, 28.0, 26.0, 56.0, 49.0, 101.0, 112.0, 169.0, 259.0, 426.0, 649.0, 1035.0, 1796.0, 3025.0, 5376.0, 10109.0, 20782.0, 47356.0, 128416.0, 526775.0, 2957008.0, 322767.0, 93674.0, 36664.0, 17035.0, 8596.0, 4657.0, 2700.0, 1647.0, 969.0, 640.0, 400.0, 311.0, 181.0, 124.0, 100.0, 66.0, 46.0, 39.0, 18.0, 20.0, 11.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-29.46875, -28.529052734375, -27.58935546875, -26.649658203125, -25.7099609375, -24.770263671875, -23.83056640625, -22.890869140625, -21.951171875, -21.011474609375, -20.07177734375, -19.132080078125, -18.1923828125, -17.252685546875, -16.31298828125, -15.373291015625, -14.43359375, -13.493896484375, -12.55419921875, -11.614501953125, -10.6748046875, -9.735107421875, -8.79541015625, -7.855712890625, -6.916015625, -5.976318359375, -5.03662109375, -4.096923828125, -3.1572265625, -2.217529296875, -1.27783203125, -0.338134765625, 0.6015625, 1.541259765625, 2.48095703125, 3.420654296875, 4.3603515625, 5.300048828125, 6.23974609375, 7.179443359375, 8.119140625, 9.058837890625, 9.99853515625, 10.938232421875, 11.8779296875, 12.817626953125, 13.75732421875, 14.697021484375, 15.63671875, 16.576416015625, 17.51611328125, 18.455810546875, 19.3955078125, 20.335205078125, 21.27490234375, 22.214599609375, 23.154296875, 24.093994140625, 25.03369140625, 25.973388671875, 26.9130859375, 27.852783203125, 28.79248046875, 29.732177734375, 30.671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 9.0, 21.0, 16.0, 19.0, 49.0, 47.0, 90.0, 86.0, 135.0, 200.0, 313.0, 1102.0, 999.0, 312.0, 178.0, 130.0, 77.0, 58.0, 32.0, 30.0, 31.0, 19.0, 15.0, 15.0, 13.0, 6.0, 6.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1484375, -12.6785888671875, -12.208740234375, -11.7388916015625, -11.26904296875, -10.7991943359375, -10.329345703125, -9.8594970703125, -9.3896484375, -8.9197998046875, -8.449951171875, -7.9801025390625, -7.51025390625, -7.0404052734375, -6.570556640625, -6.1007080078125, -5.630859375, -5.1610107421875, -4.691162109375, -4.2213134765625, -3.75146484375, -3.2816162109375, -2.811767578125, -2.3419189453125, -1.8720703125, -1.4022216796875, -0.932373046875, -0.4625244140625, 0.00732421875, 0.4771728515625, 0.947021484375, 1.4168701171875, 1.88671875, 2.3565673828125, 2.826416015625, 3.2962646484375, 3.76611328125, 4.2359619140625, 4.705810546875, 5.1756591796875, 5.6455078125, 6.1153564453125, 6.585205078125, 7.0550537109375, 7.52490234375, 7.9947509765625, 8.464599609375, 8.9344482421875, 9.404296875, 9.8741455078125, 10.343994140625, 10.8138427734375, 11.28369140625, 11.7535400390625, 12.223388671875, 12.6932373046875, 13.1630859375, 13.6329345703125, 14.102783203125, 14.5726318359375, 15.04248046875, 15.5123291015625, 15.982177734375, 16.4520263671875, 16.921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 7.0, 15.0, 24.0, 48.0, 62.0, 100.0, 146.0, 183.0, 138.0, 101.0, 67.0, 41.0, 29.0, 16.0, 12.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.6975555419922, -159.95765686035156, -155.2177734375, -150.47787475585938, -145.73797607421875, -140.99807739257812, -136.2581787109375, -131.51829528808594, -126.77839660644531, -122.03849792480469, -117.2986068725586, -112.5587158203125, -107.81881713867188, -103.07891845703125, -98.33902740478516, -93.59913635253906, -88.85923767089844, -84.11933898925781, -79.37944793701172, -74.63955688476562, -69.899658203125, -65.15975952148438, -60.41986846923828, -55.67997360229492, -50.94007873535156, -46.2001838684082, -41.460289001464844, -36.720394134521484, -31.980499267578125, -27.240604400634766, -22.500709533691406, -17.760814666748047, -13.020904541015625, -8.281009674072266, -3.5411148071289062, 1.1987800598144531, 5.9386749267578125, 10.678569793701172, 15.418464660644531, 20.15835952758789, 24.89825439453125, 29.63814926147461, 34.37804412841797, 39.11793899536133, 43.85783386230469, 48.59772872924805, 53.337623596191406, 58.077518463134766, 62.817413330078125, 67.55731201171875, 72.29720306396484, 77.03709411621094, 81.77699279785156, 86.51689147949219, 91.25678253173828, 95.99667358398438, 100.736572265625, 105.47647094726562, 110.21636199951172, 114.95625305175781, 119.69615173339844, 124.43605041503906, 129.17593383789062, 133.91583251953125, 138.65573120117188]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 6.0, 10.0, 14.0, 7.0, 12.0, 14.0, 11.0, 19.0, 22.0, 18.0, 20.0, 26.0, 31.0, 26.0, 33.0, 34.0, 39.0, 40.0, 43.0, 41.0, 40.0, 36.0, 46.0, 39.0, 38.0, 27.0, 34.0, 29.0, 31.0, 32.0, 24.0, 19.0, 25.0, 7.0, 15.0, 18.0, 9.0, 13.0, 9.0, 13.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-53.023902893066406, -51.3731689453125, -49.722434997558594, -48.07170104980469, -46.42096710205078, -44.770233154296875, -43.11949920654297, -41.46876525878906, -39.818031311035156, -38.16729736328125, -36.516563415527344, -34.86582946777344, -33.21509552001953, -31.564361572265625, -29.91362953186035, -28.262895584106445, -26.612163543701172, -24.961429595947266, -23.31069564819336, -21.659961700439453, -20.009227752685547, -18.35849380493164, -16.707761764526367, -15.057027816772461, -13.406293869018555, -11.755559921264648, -10.104825973510742, -8.454092979431152, -6.803359031677246, -5.15262508392334, -3.50189208984375, -1.8511581420898438, -0.2004241943359375, 1.4503095149993896, 3.101043224334717, 4.751776695251465, 6.402510643005371, 8.053244590759277, 9.703977584838867, 11.354711532592773, 13.00544548034668, 14.656179428100586, 16.306913375854492, 17.957645416259766, 19.608379364013672, 21.259113311767578, 22.909847259521484, 24.56058120727539, 26.211315155029297, 27.862049102783203, 29.51278305053711, 31.163516998291016, 32.81425094604492, 34.46498489379883, 36.11571502685547, 37.766448974609375, 39.41718292236328, 41.06791687011719, 42.718650817871094, 44.369384765625, 46.020118713378906, 47.67085266113281, 49.32158660888672, 50.972320556640625, 52.62305450439453]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 18.0, 16.0, 20.0, 45.0, 51.0, 100.0, 150.0, 239.0, 472.0, 875.0, 1992.0, 4451.0, 11528.0, 32583.0, 103283.0, 377490.0, 364283.0, 99754.0, 31566.0, 11278.0, 4400.0, 1939.0, 934.0, 451.0, 243.0, 134.0, 83.0, 62.0, 40.0, 22.0, 17.0, 14.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.56005859375, -48.0576171875, -46.55517578125, -45.052734375, -43.55029296875, -42.0478515625, -40.54541015625, -39.04296875, -37.54052734375, -36.0380859375, -34.53564453125, -33.033203125, -31.53076171875, -30.0283203125, -28.52587890625, -27.0234375, -25.52099609375, -24.0185546875, -22.51611328125, -21.013671875, -19.51123046875, -18.0087890625, -16.50634765625, -15.00390625, -13.50146484375, -11.9990234375, -10.49658203125, -8.994140625, -7.49169921875, -5.9892578125, -4.48681640625, -2.984375, -1.48193359375, 0.0205078125, 1.52294921875, 3.025390625, 4.52783203125, 6.0302734375, 7.53271484375, 9.03515625, 10.53759765625, 12.0400390625, 13.54248046875, 15.044921875, 16.54736328125, 18.0498046875, 19.55224609375, 21.0546875, 22.55712890625, 24.0595703125, 25.56201171875, 27.064453125, 28.56689453125, 30.0693359375, 31.57177734375, 33.07421875, 34.57666015625, 36.0791015625, 37.58154296875, 39.083984375, 40.58642578125, 42.0888671875, 43.59130859375, 45.09375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 10.0, 12.0, 15.0, 17.0, 12.0, 25.0, 24.0, 34.0, 42.0, 35.0, 42.0, 35.0, 50.0, 62.0, 49.0, 55.0, 62.0, 53.0, 52.0, 43.0, 45.0, 45.0, 30.0, 24.0, 25.0, 15.0, 16.0, 13.0, 11.0, 5.0, 9.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.82806396484375, -5.6287841796875, -5.42950439453125, -5.230224609375, -5.03094482421875, -4.8316650390625, -4.63238525390625, -4.43310546875, -4.23382568359375, -4.0345458984375, -3.83526611328125, -3.635986328125, -3.43670654296875, -3.2374267578125, -3.03814697265625, -2.8388671875, -2.63958740234375, -2.4403076171875, -2.24102783203125, -2.041748046875, -1.84246826171875, -1.6431884765625, -1.44390869140625, -1.24462890625, -1.04534912109375, -0.8460693359375, -0.64678955078125, -0.447509765625, -0.24822998046875, -0.0489501953125, 0.15032958984375, 0.349609375, 0.54888916015625, 0.7481689453125, 0.94744873046875, 1.146728515625, 1.34600830078125, 1.5452880859375, 1.74456787109375, 1.94384765625, 2.14312744140625, 2.3424072265625, 2.54168701171875, 2.740966796875, 2.94024658203125, 3.1395263671875, 3.33880615234375, 3.5380859375, 3.73736572265625, 3.9366455078125, 4.13592529296875, 4.335205078125, 4.53448486328125, 4.7337646484375, 4.93304443359375, 5.13232421875, 5.33160400390625, 5.5308837890625, 5.73016357421875, 5.929443359375, 6.12872314453125, 6.3280029296875, 6.52728271484375, 6.7265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 11.0, 11.0, 18.0, 27.0, 39.0, 68.0, 86.0, 157.0, 246.0, 444.0, 778.0, 1293.0, 2520.0, 5012.0, 11777.0, 30295.0, 85781.0, 274777.0, 423919.0, 134443.0, 45696.0, 16878.0, 7022.0, 3297.0, 1684.0, 914.0, 537.0, 302.0, 175.0, 133.0, 65.0, 43.0, 30.0, 25.0, 13.0, 18.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.125, -30.98583984375, -29.8466796875, -28.70751953125, -27.568359375, -26.42919921875, -25.2900390625, -24.15087890625, -23.01171875, -21.87255859375, -20.7333984375, -19.59423828125, -18.455078125, -17.31591796875, -16.1767578125, -15.03759765625, -13.8984375, -12.75927734375, -11.6201171875, -10.48095703125, -9.341796875, -8.20263671875, -7.0634765625, -5.92431640625, -4.78515625, -3.64599609375, -2.5068359375, -1.36767578125, -0.228515625, 0.91064453125, 2.0498046875, 3.18896484375, 4.328125, 5.46728515625, 6.6064453125, 7.74560546875, 8.884765625, 10.02392578125, 11.1630859375, 12.30224609375, 13.44140625, 14.58056640625, 15.7197265625, 16.85888671875, 17.998046875, 19.13720703125, 20.2763671875, 21.41552734375, 22.5546875, 23.69384765625, 24.8330078125, 25.97216796875, 27.111328125, 28.25048828125, 29.3896484375, 30.52880859375, 31.66796875, 32.80712890625, 33.9462890625, 35.08544921875, 36.224609375, 37.36376953125, 38.5029296875, 39.64208984375, 40.78125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 5.0, 15.0, 12.0, 20.0, 23.0, 21.0, 27.0, 34.0, 39.0, 40.0, 48.0, 38.0, 64.0, 43.0, 64.0, 59.0, 58.0, 57.0, 35.0, 42.0, 35.0, 29.0, 30.0, 29.0, 25.0, 19.0, 23.0, 9.0, 11.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.10595703125, -27.0556640625, -26.00537109375, -24.955078125, -23.90478515625, -22.8544921875, -21.80419921875, -20.75390625, -19.70361328125, -18.6533203125, -17.60302734375, -16.552734375, -15.50244140625, -14.4521484375, -13.40185546875, -12.3515625, -11.30126953125, -10.2509765625, -9.20068359375, -8.150390625, -7.10009765625, -6.0498046875, -4.99951171875, -3.94921875, -2.89892578125, -1.8486328125, -0.79833984375, 0.251953125, 1.30224609375, 2.3525390625, 3.40283203125, 4.453125, 5.50341796875, 6.5537109375, 7.60400390625, 8.654296875, 9.70458984375, 10.7548828125, 11.80517578125, 12.85546875, 13.90576171875, 14.9560546875, 16.00634765625, 17.056640625, 18.10693359375, 19.1572265625, 20.20751953125, 21.2578125, 22.30810546875, 23.3583984375, 24.40869140625, 25.458984375, 26.50927734375, 27.5595703125, 28.60986328125, 29.66015625, 30.71044921875, 31.7607421875, 32.81103515625, 33.861328125, 34.91162109375, 35.9619140625, 37.01220703125, 38.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 15.0, 28.0, 45.0, 76.0, 95.0, 171.0, 326.0, 594.0, 1271.0, 2672.0, 6970.0, 26457.0, 216110.0, 685800.0, 84330.0, 14701.0, 4837.0, 1957.0, 948.0, 495.0, 262.0, 138.0, 86.0, 59.0, 44.0, 10.0, 12.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.390625, -30.387939453125, -29.38525390625, -28.382568359375, -27.3798828125, -26.377197265625, -25.37451171875, -24.371826171875, -23.369140625, -22.366455078125, -21.36376953125, -20.361083984375, -19.3583984375, -18.355712890625, -17.35302734375, -16.350341796875, -15.34765625, -14.344970703125, -13.34228515625, -12.339599609375, -11.3369140625, -10.334228515625, -9.33154296875, -8.328857421875, -7.326171875, -6.323486328125, -5.32080078125, -4.318115234375, -3.3154296875, -2.312744140625, -1.31005859375, -0.307373046875, 0.6953125, 1.697998046875, 2.70068359375, 3.703369140625, 4.7060546875, 5.708740234375, 6.71142578125, 7.714111328125, 8.716796875, 9.719482421875, 10.72216796875, 11.724853515625, 12.7275390625, 13.730224609375, 14.73291015625, 15.735595703125, 16.73828125, 17.740966796875, 18.74365234375, 19.746337890625, 20.7490234375, 21.751708984375, 22.75439453125, 23.757080078125, 24.759765625, 25.762451171875, 26.76513671875, 27.767822265625, 28.7705078125, 29.773193359375, 30.77587890625, 31.778564453125, 32.78125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 20.0, 30.0, 73.0, 165.0, 293.0, 226.0, 82.0, 39.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01534271240234375, -0.014990806579589844, -0.014638900756835938, -0.014286994934082031, -0.013935089111328125, -0.013583183288574219, -0.013231277465820312, -0.012879371643066406, -0.0125274658203125, -0.012175559997558594, -0.011823654174804688, -0.011471748352050781, -0.011119842529296875, -0.010767936706542969, -0.010416030883789062, -0.010064125061035156, -0.00971221923828125, -0.009360313415527344, -0.009008407592773438, -0.008656501770019531, -0.008304595947265625, -0.007952690124511719, -0.0076007843017578125, -0.007248878479003906, -0.00689697265625, -0.006545066833496094, -0.0061931610107421875, -0.005841255187988281, -0.005489349365234375, -0.005137443542480469, -0.0047855377197265625, -0.004433631896972656, -0.00408172607421875, -0.0037298202514648438, -0.0033779144287109375, -0.0030260086059570312, -0.002674102783203125, -0.0023221969604492188, -0.0019702911376953125, -0.0016183853149414062, -0.0012664794921875, -0.0009145736694335938, -0.0005626678466796875, -0.00021076202392578125, 0.000141143798828125, 0.0004930496215820312, 0.0008449554443359375, 0.0011968612670898438, 0.00154876708984375, 0.0019006729125976562, 0.0022525787353515625, 0.0026044845581054688, 0.002956390380859375, 0.0033082962036132812, 0.0036602020263671875, 0.004012107849121094, 0.004364013671875, 0.004715919494628906, 0.0050678253173828125, 0.005419731140136719, 0.005771636962890625, 0.006123542785644531, 0.0064754486083984375, 0.006827354431152344, 0.00717926025390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 7.0, 10.0, 8.0, 18.0, 26.0, 29.0, 32.0, 66.0, 96.0, 219.0, 483.0, 1273.0, 4264.0, 18873.0, 207185.0, 753871.0, 49893.0, 8553.0, 2228.0, 759.0, 293.0, 133.0, 84.0, 47.0, 31.0, 16.0, 21.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0830078125, -37.791015625, -36.4990234375, -35.20703125, -33.9150390625, -32.623046875, -31.3310546875, -30.0390625, -28.7470703125, -27.455078125, -26.1630859375, -24.87109375, -23.5791015625, -22.287109375, -20.9951171875, -19.703125, -18.4111328125, -17.119140625, -15.8271484375, -14.53515625, -13.2431640625, -11.951171875, -10.6591796875, -9.3671875, -8.0751953125, -6.783203125, -5.4912109375, -4.19921875, -2.9072265625, -1.615234375, -0.3232421875, 0.96875, 2.2607421875, 3.552734375, 4.8447265625, 6.13671875, 7.4287109375, 8.720703125, 10.0126953125, 11.3046875, 12.5966796875, 13.888671875, 15.1806640625, 16.47265625, 17.7646484375, 19.056640625, 20.3486328125, 21.640625, 22.9326171875, 24.224609375, 25.5166015625, 26.80859375, 28.1005859375, 29.392578125, 30.6845703125, 31.9765625, 33.2685546875, 34.560546875, 35.8525390625, 37.14453125, 38.4365234375, 39.728515625, 41.0205078125, 42.3125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 15.0, 28.0, 38.0, 84.0, 139.0, 147.0, 182.0, 128.0, 69.0, 59.0, 29.0, 14.0, 18.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.1529541015625, -12.376220703125, -11.5994873046875, -10.82275390625, -10.0460205078125, -9.269287109375, -8.4925537109375, -7.7158203125, -6.9390869140625, -6.162353515625, -5.3856201171875, -4.60888671875, -3.8321533203125, -3.055419921875, -2.2786865234375, -1.501953125, -0.7252197265625, 0.051513671875, 0.8282470703125, 1.60498046875, 2.3817138671875, 3.158447265625, 3.9351806640625, 4.7119140625, 5.4886474609375, 6.265380859375, 7.0421142578125, 7.81884765625, 8.5955810546875, 9.372314453125, 10.1490478515625, 10.92578125, 11.7025146484375, 12.479248046875, 13.2559814453125, 14.03271484375, 14.8094482421875, 15.586181640625, 16.3629150390625, 17.1396484375, 17.9163818359375, 18.693115234375, 19.4698486328125, 20.24658203125, 21.0233154296875, 21.800048828125, 22.5767822265625, 23.353515625, 24.1302490234375, 24.906982421875, 25.6837158203125, 26.46044921875, 27.2371826171875, 28.013916015625, 28.7906494140625, 29.5673828125, 30.3441162109375, 31.120849609375, 31.8975830078125, 32.67431640625, 33.4510498046875, 34.227783203125, 35.0045166015625, 35.78125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 10.0, 8.0, 16.0, 34.0, 43.0, 55.0, 71.0, 94.0, 113.0, 138.0, 103.0, 88.0, 76.0, 50.0, 24.0, 18.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.0894775390625, -247.854736328125, -239.6199951171875, -231.38525390625, -223.15049743652344, -214.91575622558594, -206.68101501464844, -198.44627380371094, -190.21151733398438, -181.97677612304688, -173.74203491210938, -165.50729370117188, -157.2725372314453, -149.0377960205078, -140.8030548095703, -132.5683135986328, -124.33357238769531, -116.09883117675781, -107.86408233642578, -99.62934112548828, -91.39459228515625, -83.15985107421875, -74.92510986328125, -66.69036865234375, -58.45561981201172, -50.22087478637695, -41.98612976074219, -33.75138854980469, -25.516643524169922, -17.281898498535156, -9.047157287597656, -0.8124122619628906, 7.422332763671875, 15.657076835632324, 23.891820907592773, 32.126564025878906, 40.36130905151367, 48.59605407714844, 56.83079528808594, 65.06553649902344, 73.30028533935547, 81.53502655029297, 89.769775390625, 98.0045166015625, 106.2392578125, 114.47400665283203, 122.70874786376953, 130.94349670410156, 139.17823791503906, 147.41297912597656, 155.64772033691406, 163.88247680664062, 172.11721801757812, 180.35195922851562, 188.58670043945312, 196.82144165039062, 205.05618286132812, 213.29092407226562, 221.52566528320312, 229.76040649414062, 237.9951629638672, 246.2299041748047, 254.4646453857422, 262.69940185546875, 270.93414306640625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 10.0, 10.0, 17.0, 12.0, 19.0, 22.0, 26.0, 30.0, 23.0, 23.0, 35.0, 26.0, 34.0, 38.0, 43.0, 48.0, 46.0, 39.0, 42.0, 40.0, 41.0, 30.0, 43.0, 29.0, 27.0, 45.0, 21.0, 21.0, 15.0, 20.0, 15.0, 15.0, 13.0, 18.0, 5.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.3483428955078, -152.33303833007812, -147.31773376464844, -142.3024139404297, -137.287109375, -132.2718048095703, -127.25650024414062, -122.24119567871094, -117.22588348388672, -112.21057891845703, -107.19526672363281, -102.17996215820312, -97.16465759277344, -92.14934539794922, -87.13404083251953, -82.11872863769531, -77.10342407226562, -72.08811950683594, -67.07280731201172, -62.05750274658203, -57.04219436645508, -52.026885986328125, -47.01158142089844, -41.996273040771484, -36.98096466064453, -31.965656280517578, -26.950349807739258, -21.935043334960938, -16.919734954833984, -11.904426574707031, -6.889120101928711, -1.8738136291503906, 3.1414947509765625, 8.1568021774292, 13.172109603881836, 18.187416076660156, 23.20272445678711, 28.218032836914062, 33.23333740234375, 38.2486457824707, 43.263954162597656, 48.27926254272461, 53.29457092285156, 58.30987548828125, 63.3251838684082, 68.34049224853516, 73.35579681396484, 78.37110900878906, 83.38641357421875, 88.40171813964844, 93.41703033447266, 98.43233489990234, 103.44764709472656, 108.46295166015625, 113.47825622558594, 118.49356079101562, 123.50887298583984, 128.52418518066406, 133.53948974609375, 138.55479431152344, 143.57009887695312, 148.58541870117188, 153.60072326660156, 158.61602783203125, 163.63133239746094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 8.0, 9.0, 7.0, 13.0, 11.0, 19.0, 31.0, 36.0, 50.0, 63.0, 90.0, 127.0, 200.0, 297.0, 451.0, 627.0, 1018.0, 1594.0, 2755.0, 4804.0, 9020.0, 18885.0, 47462.0, 182228.0, 3613362.0, 215585.0, 52137.0, 20819.0, 9798.0, 5069.0, 2837.0, 1707.0, 1064.0, 676.0, 420.0, 292.0, 216.0, 158.0, 97.0, 72.0, 42.0, 42.0, 27.0, 17.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -36.98388671875, -35.8115234375, -34.63916015625, -33.466796875, -32.29443359375, -31.1220703125, -29.94970703125, -28.77734375, -27.60498046875, -26.4326171875, -25.26025390625, -24.087890625, -22.91552734375, -21.7431640625, -20.57080078125, -19.3984375, -18.22607421875, -17.0537109375, -15.88134765625, -14.708984375, -13.53662109375, -12.3642578125, -11.19189453125, -10.01953125, -8.84716796875, -7.6748046875, -6.50244140625, -5.330078125, -4.15771484375, -2.9853515625, -1.81298828125, -0.640625, 0.53173828125, 1.7041015625, 2.87646484375, 4.048828125, 5.22119140625, 6.3935546875, 7.56591796875, 8.73828125, 9.91064453125, 11.0830078125, 12.25537109375, 13.427734375, 14.60009765625, 15.7724609375, 16.94482421875, 18.1171875, 19.28955078125, 20.4619140625, 21.63427734375, 22.806640625, 23.97900390625, 25.1513671875, 26.32373046875, 27.49609375, 28.66845703125, 29.8408203125, 31.01318359375, 32.185546875, 33.35791015625, 34.5302734375, 35.70263671875, 36.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 7.0, 13.0, 11.0, 19.0, 26.0, 22.0, 33.0, 30.0, 41.0, 50.0, 63.0, 67.0, 46.0, 70.0, 62.0, 56.0, 57.0, 49.0, 40.0, 40.0, 44.0, 23.0, 20.0, 17.0, 22.0, 17.0, 6.0, 12.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.83197021484375, -7.5858154296875, -7.33966064453125, -7.093505859375, -6.84735107421875, -6.6011962890625, -6.35504150390625, -6.10888671875, -5.86273193359375, -5.6165771484375, -5.37042236328125, -5.124267578125, -4.87811279296875, -4.6319580078125, -4.38580322265625, -4.1396484375, -3.89349365234375, -3.6473388671875, -3.40118408203125, -3.155029296875, -2.90887451171875, -2.6627197265625, -2.41656494140625, -2.17041015625, -1.92425537109375, -1.6781005859375, -1.43194580078125, -1.185791015625, -0.93963623046875, -0.6934814453125, -0.44732666015625, -0.201171875, 0.04498291015625, 0.2911376953125, 0.53729248046875, 0.783447265625, 1.02960205078125, 1.2757568359375, 1.52191162109375, 1.76806640625, 2.01422119140625, 2.2603759765625, 2.50653076171875, 2.752685546875, 2.99884033203125, 3.2449951171875, 3.49114990234375, 3.7373046875, 3.98345947265625, 4.2296142578125, 4.47576904296875, 4.721923828125, 4.96807861328125, 5.2142333984375, 5.46038818359375, 5.70654296875, 5.95269775390625, 6.1988525390625, 6.44500732421875, 6.691162109375, 6.93731689453125, 7.1834716796875, 7.42962646484375, 7.67578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 13.0, 11.0, 16.0, 14.0, 14.0, 29.0, 41.0, 40.0, 59.0, 70.0, 128.0, 173.0, 301.0, 532.0, 1241.0, 3288.0, 10633.0, 49090.0, 1468107.0, 2592680.0, 50599.0, 11171.0, 3273.0, 1282.0, 554.0, 280.0, 169.0, 122.0, 73.0, 54.0, 48.0, 39.0, 26.0, 17.0, 16.0, 16.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.125, -80.4443359375, -77.763671875, -75.0830078125, -72.40234375, -69.7216796875, -67.041015625, -64.3603515625, -61.6796875, -58.9990234375, -56.318359375, -53.6376953125, -50.95703125, -48.2763671875, -45.595703125, -42.9150390625, -40.234375, -37.5537109375, -34.873046875, -32.1923828125, -29.51171875, -26.8310546875, -24.150390625, -21.4697265625, -18.7890625, -16.1083984375, -13.427734375, -10.7470703125, -8.06640625, -5.3857421875, -2.705078125, -0.0244140625, 2.65625, 5.3369140625, 8.017578125, 10.6982421875, 13.37890625, 16.0595703125, 18.740234375, 21.4208984375, 24.1015625, 26.7822265625, 29.462890625, 32.1435546875, 34.82421875, 37.5048828125, 40.185546875, 42.8662109375, 45.546875, 48.2275390625, 50.908203125, 53.5888671875, 56.26953125, 58.9501953125, 61.630859375, 64.3115234375, 66.9921875, 69.6728515625, 72.353515625, 75.0341796875, 77.71484375, 80.3955078125, 83.076171875, 85.7568359375, 88.4375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 9.0, 15.0, 22.0, 36.0, 48.0, 114.0, 301.0, 2643.0, 532.0, 168.0, 80.0, 34.0, 30.0, 19.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.84375, -46.74853515625, -45.6533203125, -44.55810546875, -43.462890625, -42.36767578125, -41.2724609375, -40.17724609375, -39.08203125, -37.98681640625, -36.8916015625, -35.79638671875, -34.701171875, -33.60595703125, -32.5107421875, -31.41552734375, -30.3203125, -29.22509765625, -28.1298828125, -27.03466796875, -25.939453125, -24.84423828125, -23.7490234375, -22.65380859375, -21.55859375, -20.46337890625, -19.3681640625, -18.27294921875, -17.177734375, -16.08251953125, -14.9873046875, -13.89208984375, -12.796875, -11.70166015625, -10.6064453125, -9.51123046875, -8.416015625, -7.32080078125, -6.2255859375, -5.13037109375, -4.03515625, -2.93994140625, -1.8447265625, -0.74951171875, 0.345703125, 1.44091796875, 2.5361328125, 3.63134765625, 4.7265625, 5.82177734375, 6.9169921875, 8.01220703125, 9.107421875, 10.20263671875, 11.2978515625, 12.39306640625, 13.48828125, 14.58349609375, 15.6787109375, 16.77392578125, 17.869140625, 18.96435546875, 20.0595703125, 21.15478515625, 22.25]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 12.0, 14.0, 10.0, 38.0, 45.0, 49.0, 88.0, 87.0, 132.0, 132.0, 101.0, 83.0, 56.0, 39.0, 29.0, 18.0, 12.0, 9.0, 11.0, 6.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.51214599609375, -140.02114868164062, -136.53013610839844, -133.03912353515625, -129.54812622070312, -126.05712127685547, -122.56611633300781, -119.07511138916016, -115.5841064453125, -112.09310150146484, -108.60209655761719, -105.11109161376953, -101.62008666992188, -98.12908172607422, -94.63807678222656, -91.1470718383789, -87.65606689453125, -84.1650619506836, -80.67405700683594, -77.18305206298828, -73.69204711914062, -70.20104217529297, -66.71003723144531, -63.219032287597656, -59.72802734375, -56.237022399902344, -52.74601745605469, -49.25501251220703, -45.764007568359375, -42.27300262451172, -38.78199768066406, -35.290992736816406, -31.79998779296875, -28.308982849121094, -24.817977905273438, -21.32697296142578, -17.835968017578125, -14.344963073730469, -10.853958129882812, -7.362953186035156, -3.8719482421875, -0.38094329833984375, 3.1100616455078125, 6.601066589355469, 10.092071533203125, 13.583076477050781, 17.074081420898438, 20.565086364746094, 24.05609130859375, 27.547096252441406, 31.038101196289062, 34.52910614013672, 38.020111083984375, 41.51111602783203, 45.00212097167969, 48.493125915527344, 51.984130859375, 55.475135803222656, 58.96614074707031, 62.45714569091797, 65.94815063476562, 69.43915557861328, 72.93016052246094, 76.4211654663086, 79.91217041015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 15.0, 15.0, 25.0, 15.0, 27.0, 41.0, 39.0, 51.0, 42.0, 58.0, 64.0, 70.0, 62.0, 68.0, 66.0, 66.0, 57.0, 49.0, 36.0, 35.0, 28.0, 17.0, 16.0, 13.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.21607971191406, -96.05860137939453, -92.901123046875, -89.74364471435547, -86.58616638183594, -83.4286880493164, -80.27120971679688, -77.11373138427734, -73.95625305175781, -70.79877471923828, -67.64129638671875, -64.48381805419922, -61.32633972167969, -58.168861389160156, -55.011383056640625, -51.853904724121094, -48.69643020629883, -45.5389518737793, -42.381473541259766, -39.223995208740234, -36.0665168762207, -32.90903854370117, -29.751562118530273, -26.594083786010742, -23.43660545349121, -20.27912712097168, -17.12164878845215, -13.964171409606934, -10.806693077087402, -7.649214744567871, -4.491737365722656, -1.334259033203125, 1.8232192993164062, 4.9806976318359375, 8.138175964355469, 11.295653343200684, 14.453131675720215, 17.610610961914062, 20.76808738708496, 23.925565719604492, 27.083044052124023, 30.240522384643555, 33.39799880981445, 36.555477142333984, 39.712955474853516, 42.87043380737305, 46.02791213989258, 49.18539047241211, 52.34286880493164, 55.50034713745117, 58.6578254699707, 61.815303802490234, 64.9727783203125, 68.13025665283203, 71.28773498535156, 74.4452133178711, 77.60269165039062, 80.76016998291016, 83.91764831542969, 87.07512664794922, 90.23260498046875, 93.39008331298828, 96.54756164550781, 99.70503997802734, 102.86251831054688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 13.0, 11.0, 20.0, 47.0, 38.0, 95.0, 120.0, 194.0, 309.0, 632.0, 1120.0, 2051.0, 3879.0, 7826.0, 16601.0, 36770.0, 86855.0, 226346.0, 385835.0, 162083.0, 64195.0, 27732.0, 12814.0, 6045.0, 3060.0, 1581.0, 916.0, 533.0, 293.0, 183.0, 120.0, 78.0, 52.0, 27.0, 23.0, 17.0, 11.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.46826171875, -31.2802734375, -30.09228515625, -28.904296875, -27.71630859375, -26.5283203125, -25.34033203125, -24.15234375, -22.96435546875, -21.7763671875, -20.58837890625, -19.400390625, -18.21240234375, -17.0244140625, -15.83642578125, -14.6484375, -13.46044921875, -12.2724609375, -11.08447265625, -9.896484375, -8.70849609375, -7.5205078125, -6.33251953125, -5.14453125, -3.95654296875, -2.7685546875, -1.58056640625, -0.392578125, 0.79541015625, 1.9833984375, 3.17138671875, 4.359375, 5.54736328125, 6.7353515625, 7.92333984375, 9.111328125, 10.29931640625, 11.4873046875, 12.67529296875, 13.86328125, 15.05126953125, 16.2392578125, 17.42724609375, 18.615234375, 19.80322265625, 20.9912109375, 22.17919921875, 23.3671875, 24.55517578125, 25.7431640625, 26.93115234375, 28.119140625, 29.30712890625, 30.4951171875, 31.68310546875, 32.87109375, 34.05908203125, 35.2470703125, 36.43505859375, 37.623046875, 38.81103515625, 39.9990234375, 41.18701171875, 42.375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 4.0, 10.0, 12.0, 6.0, 13.0, 12.0, 19.0, 21.0, 18.0, 20.0, 31.0, 27.0, 36.0, 55.0, 45.0, 36.0, 42.0, 43.0, 55.0, 48.0, 46.0, 42.0, 49.0, 43.0, 21.0, 24.0, 32.0, 25.0, 24.0, 25.0, 20.0, 17.0, 13.0, 13.0, 13.0, 10.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3046875, -6.10009765625, -5.8955078125, -5.69091796875, -5.486328125, -5.28173828125, -5.0771484375, -4.87255859375, -4.66796875, -4.46337890625, -4.2587890625, -4.05419921875, -3.849609375, -3.64501953125, -3.4404296875, -3.23583984375, -3.03125, -2.82666015625, -2.6220703125, -2.41748046875, -2.212890625, -2.00830078125, -1.8037109375, -1.59912109375, -1.39453125, -1.18994140625, -0.9853515625, -0.78076171875, -0.576171875, -0.37158203125, -0.1669921875, 0.03759765625, 0.2421875, 0.44677734375, 0.6513671875, 0.85595703125, 1.060546875, 1.26513671875, 1.4697265625, 1.67431640625, 1.87890625, 2.08349609375, 2.2880859375, 2.49267578125, 2.697265625, 2.90185546875, 3.1064453125, 3.31103515625, 3.515625, 3.72021484375, 3.9248046875, 4.12939453125, 4.333984375, 4.53857421875, 4.7431640625, 4.94775390625, 5.15234375, 5.35693359375, 5.5615234375, 5.76611328125, 5.970703125, 6.17529296875, 6.3798828125, 6.58447265625, 6.7890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 11.0, 11.0, 18.0, 14.0, 36.0, 49.0, 81.0, 110.0, 161.0, 220.0, 394.0, 569.0, 976.0, 1602.0, 2919.0, 5879.0, 11430.0, 24759.0, 56053.0, 139399.0, 357677.0, 266490.0, 100040.0, 41257.0, 18713.0, 9083.0, 4582.0, 2376.0, 1395.0, 795.0, 483.0, 324.0, 215.0, 131.0, 87.0, 59.0, 45.0, 25.0, 22.0, 11.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.609375, -25.74609375, -24.8828125, -24.01953125, -23.15625, -22.29296875, -21.4296875, -20.56640625, -19.703125, -18.83984375, -17.9765625, -17.11328125, -16.25, -15.38671875, -14.5234375, -13.66015625, -12.796875, -11.93359375, -11.0703125, -10.20703125, -9.34375, -8.48046875, -7.6171875, -6.75390625, -5.890625, -5.02734375, -4.1640625, -3.30078125, -2.4375, -1.57421875, -0.7109375, 0.15234375, 1.015625, 1.87890625, 2.7421875, 3.60546875, 4.46875, 5.33203125, 6.1953125, 7.05859375, 7.921875, 8.78515625, 9.6484375, 10.51171875, 11.375, 12.23828125, 13.1015625, 13.96484375, 14.828125, 15.69140625, 16.5546875, 17.41796875, 18.28125, 19.14453125, 20.0078125, 20.87109375, 21.734375, 22.59765625, 23.4609375, 24.32421875, 25.1875, 26.05078125, 26.9140625, 27.77734375, 28.640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 3.0, 11.0, 14.0, 19.0, 15.0, 18.0, 22.0, 28.0, 30.0, 35.0, 46.0, 41.0, 53.0, 39.0, 42.0, 51.0, 49.0, 61.0, 35.0, 40.0, 43.0, 36.0, 36.0, 37.0, 24.0, 30.0, 13.0, 24.0, 16.0, 11.0, 16.0, 9.0, 13.0, 7.0, 8.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.81982421875, -24.8583984375, -23.89697265625, -22.935546875, -21.97412109375, -21.0126953125, -20.05126953125, -19.08984375, -18.12841796875, -17.1669921875, -16.20556640625, -15.244140625, -14.28271484375, -13.3212890625, -12.35986328125, -11.3984375, -10.43701171875, -9.4755859375, -8.51416015625, -7.552734375, -6.59130859375, -5.6298828125, -4.66845703125, -3.70703125, -2.74560546875, -1.7841796875, -0.82275390625, 0.138671875, 1.10009765625, 2.0615234375, 3.02294921875, 3.984375, 4.94580078125, 5.9072265625, 6.86865234375, 7.830078125, 8.79150390625, 9.7529296875, 10.71435546875, 11.67578125, 12.63720703125, 13.5986328125, 14.56005859375, 15.521484375, 16.48291015625, 17.4443359375, 18.40576171875, 19.3671875, 20.32861328125, 21.2900390625, 22.25146484375, 23.212890625, 24.17431640625, 25.1357421875, 26.09716796875, 27.05859375, 28.02001953125, 28.9814453125, 29.94287109375, 30.904296875, 31.86572265625, 32.8271484375, 33.78857421875, 34.75]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 10.0, 22.0, 19.0, 31.0, 54.0, 100.0, 145.0, 242.0, 357.0, 595.0, 1008.0, 1992.0, 4135.0, 11513.0, 45642.0, 296493.0, 556064.0, 97893.0, 19912.0, 6309.0, 2714.0, 1291.0, 774.0, 473.0, 306.0, 178.0, 99.0, 56.0, 41.0, 25.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.0, -27.267333984375, -26.53466796875, -25.802001953125, -25.0693359375, -24.336669921875, -23.60400390625, -22.871337890625, -22.138671875, -21.406005859375, -20.67333984375, -19.940673828125, -19.2080078125, -18.475341796875, -17.74267578125, -17.010009765625, -16.27734375, -15.544677734375, -14.81201171875, -14.079345703125, -13.3466796875, -12.614013671875, -11.88134765625, -11.148681640625, -10.416015625, -9.683349609375, -8.95068359375, -8.218017578125, -7.4853515625, -6.752685546875, -6.02001953125, -5.287353515625, -4.5546875, -3.822021484375, -3.08935546875, -2.356689453125, -1.6240234375, -0.891357421875, -0.15869140625, 0.573974609375, 1.306640625, 2.039306640625, 2.77197265625, 3.504638671875, 4.2373046875, 4.969970703125, 5.70263671875, 6.435302734375, 7.16796875, 7.900634765625, 8.63330078125, 9.365966796875, 10.0986328125, 10.831298828125, 11.56396484375, 12.296630859375, 13.029296875, 13.761962890625, 14.49462890625, 15.227294921875, 15.9599609375, 16.692626953125, 17.42529296875, 18.157958984375, 18.890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 28.0, 54.0, 120.0, 286.0, 256.0, 122.0, 43.0, 16.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139617919921875, -0.01358342170715332, -0.01320505142211914, -0.012826681137084961, -0.012448310852050781, -0.012069940567016602, -0.011691570281982422, -0.011313199996948242, -0.010934829711914062, -0.010556459426879883, -0.010178089141845703, -0.009799718856811523, -0.009421348571777344, -0.009042978286743164, -0.008664608001708984, -0.008286237716674805, -0.007907867431640625, -0.007529497146606445, -0.007151126861572266, -0.006772756576538086, -0.006394386291503906, -0.0060160160064697266, -0.005637645721435547, -0.005259275436401367, -0.0048809051513671875, -0.004502534866333008, -0.004124164581298828, -0.0037457942962646484, -0.0033674240112304688, -0.002989053726196289, -0.0026106834411621094, -0.0022323131561279297, -0.00185394287109375, -0.0014755725860595703, -0.0010972023010253906, -0.0007188320159912109, -0.00034046173095703125, 3.790855407714844e-05, 0.0004162788391113281, 0.0007946491241455078, 0.0011730194091796875, 0.0015513896942138672, 0.0019297599792480469, 0.0023081302642822266, 0.0026865005493164062, 0.003064870834350586, 0.0034432411193847656, 0.0038216114044189453, 0.004199981689453125, 0.004578351974487305, 0.004956722259521484, 0.005335092544555664, 0.005713462829589844, 0.0060918331146240234, 0.006470203399658203, 0.006848573684692383, 0.0072269439697265625, 0.007605314254760742, 0.007983684539794922, 0.008362054824829102, 0.008740425109863281, 0.009118795394897461, 0.00949716567993164, 0.00987553596496582, 0.01025390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 10.0, 17.0, 24.0, 21.0, 42.0, 49.0, 68.0, 107.0, 162.0, 242.0, 459.0, 813.0, 1766.0, 4330.0, 16814.0, 130442.0, 738636.0, 129846.0, 16230.0, 4549.0, 1814.0, 903.0, 446.0, 240.0, 160.0, 117.0, 58.0, 49.0, 46.0, 26.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.53125, -28.56298828125, -27.5947265625, -26.62646484375, -25.658203125, -24.68994140625, -23.7216796875, -22.75341796875, -21.78515625, -20.81689453125, -19.8486328125, -18.88037109375, -17.912109375, -16.94384765625, -15.9755859375, -15.00732421875, -14.0390625, -13.07080078125, -12.1025390625, -11.13427734375, -10.166015625, -9.19775390625, -8.2294921875, -7.26123046875, -6.29296875, -5.32470703125, -4.3564453125, -3.38818359375, -2.419921875, -1.45166015625, -0.4833984375, 0.48486328125, 1.453125, 2.42138671875, 3.3896484375, 4.35791015625, 5.326171875, 6.29443359375, 7.2626953125, 8.23095703125, 9.19921875, 10.16748046875, 11.1357421875, 12.10400390625, 13.072265625, 14.04052734375, 15.0087890625, 15.97705078125, 16.9453125, 17.91357421875, 18.8818359375, 19.85009765625, 20.818359375, 21.78662109375, 22.7548828125, 23.72314453125, 24.69140625, 25.65966796875, 26.6279296875, 27.59619140625, 28.564453125, 29.53271484375, 30.5009765625, 31.46923828125, 32.4375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 17.0, 51.0, 68.0, 112.0, 185.0, 184.0, 132.0, 95.0, 60.0, 38.0, 8.0, 11.0, 4.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.59375, -28.77490234375, -27.9560546875, -27.13720703125, -26.318359375, -25.49951171875, -24.6806640625, -23.86181640625, -23.04296875, -22.22412109375, -21.4052734375, -20.58642578125, -19.767578125, -18.94873046875, -18.1298828125, -17.31103515625, -16.4921875, -15.67333984375, -14.8544921875, -14.03564453125, -13.216796875, -12.39794921875, -11.5791015625, -10.76025390625, -9.94140625, -9.12255859375, -8.3037109375, -7.48486328125, -6.666015625, -5.84716796875, -5.0283203125, -4.20947265625, -3.390625, -2.57177734375, -1.7529296875, -0.93408203125, -0.115234375, 0.70361328125, 1.5224609375, 2.34130859375, 3.16015625, 3.97900390625, 4.7978515625, 5.61669921875, 6.435546875, 7.25439453125, 8.0732421875, 8.89208984375, 9.7109375, 10.52978515625, 11.3486328125, 12.16748046875, 12.986328125, 13.80517578125, 14.6240234375, 15.44287109375, 16.26171875, 17.08056640625, 17.8994140625, 18.71826171875, 19.537109375, 20.35595703125, 21.1748046875, 21.99365234375, 22.8125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 19.0, 66.0, 165.0, 291.0, 257.0, 131.0, 56.0, 12.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-947.981201171875, -928.575439453125, -909.1696166992188, -889.7638549804688, -870.3580322265625, -850.9522705078125, -831.5465087890625, -812.1406860351562, -792.7349243164062, -773.3291625976562, -753.92333984375, -734.517578125, -715.1117553710938, -695.7059936523438, -676.3001708984375, -656.8944091796875, -637.4886474609375, -618.0828857421875, -598.6770629882812, -579.2713012695312, -559.865478515625, -540.459716796875, -521.053955078125, -501.64813232421875, -482.2423095703125, -462.8365173339844, -443.43072509765625, -424.02496337890625, -404.6191711425781, -385.21337890625, -365.8075866699219, -346.40179443359375, -326.9960021972656, -307.5902099609375, -288.1844177246094, -268.77862548828125, -249.37286376953125, -229.96707153320312, -210.561279296875, -191.15550231933594, -171.7497100830078, -152.3439178466797, -132.93814086914062, -113.5323486328125, -94.1265640258789, -74.72077941894531, -55.31498718261719, -35.909210205078125, -16.50341796875, 2.9023685455322266, 22.308155059814453, 41.71394348144531, 61.119728088378906, 80.5255126953125, 99.93130493164062, 119.33708190917969, 138.7428741455078, 158.14866638183594, 177.554443359375, 196.96023559570312, 216.36602783203125, 235.7718048095703, 255.17759704589844, 274.5833740234375, 293.9891662597656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 13.0, 7.0, 8.0, 7.0, 13.0, 11.0, 20.0, 24.0, 29.0, 24.0, 39.0, 35.0, 39.0, 35.0, 47.0, 47.0, 49.0, 30.0, 40.0, 37.0, 56.0, 37.0, 34.0, 45.0, 35.0, 36.0, 29.0, 36.0, 16.0, 12.0, 20.0, 17.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-176.2188262939453, -171.19631958007812, -166.17381286621094, -161.15130615234375, -156.12879943847656, -151.10629272460938, -146.0837860107422, -141.061279296875, -136.0387725830078, -131.01626586914062, -125.99375915527344, -120.97125244140625, -115.94874572753906, -110.92623901367188, -105.90373229980469, -100.8812255859375, -95.85871124267578, -90.8362045288086, -85.8136978149414, -80.79119110107422, -75.76868438720703, -70.74617767333984, -65.72366333007812, -60.7011604309082, -55.678653717041016, -50.65614700317383, -45.63364028930664, -40.61112976074219, -35.588623046875, -30.566118240356445, -25.543609619140625, -20.521102905273438, -15.49859619140625, -10.476089477539062, -5.453581809997559, -0.4310741424560547, 4.591432571411133, 9.61393928527832, 14.63644790649414, 19.658954620361328, 24.681461334228516, 29.703968048095703, 34.72647476196289, 39.748985290527344, 44.77149200439453, 49.79399871826172, 54.816505432128906, 59.839012145996094, 64.86151885986328, 69.88402557373047, 74.90653228759766, 79.92903900146484, 84.95154571533203, 89.97405242919922, 94.99656677246094, 100.01907348632812, 105.04158020019531, 110.0640869140625, 115.08659362792969, 120.10910034179688, 125.13160705566406, 130.15411376953125, 135.17662048339844, 140.19912719726562, 145.2216339111328]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 4.0, 15.0, 18.0, 28.0, 28.0, 46.0, 59.0, 81.0, 106.0, 170.0, 214.0, 322.0, 530.0, 711.0, 1206.0, 1961.0, 3306.0, 5875.0, 12223.0, 31335.0, 117355.0, 3529191.0, 389619.0, 60109.0, 19977.0, 8690.0, 4462.0, 2496.0, 1453.0, 957.0, 543.0, 381.0, 260.0, 173.0, 123.0, 67.0, 67.0, 39.0, 26.0, 17.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-45.15625, -43.73486328125, -42.3134765625, -40.89208984375, -39.470703125, -38.04931640625, -36.6279296875, -35.20654296875, -33.78515625, -32.36376953125, -30.9423828125, -29.52099609375, -28.099609375, -26.67822265625, -25.2568359375, -23.83544921875, -22.4140625, -20.99267578125, -19.5712890625, -18.14990234375, -16.728515625, -15.30712890625, -13.8857421875, -12.46435546875, -11.04296875, -9.62158203125, -8.2001953125, -6.77880859375, -5.357421875, -3.93603515625, -2.5146484375, -1.09326171875, 0.328125, 1.74951171875, 3.1708984375, 4.59228515625, 6.013671875, 7.43505859375, 8.8564453125, 10.27783203125, 11.69921875, 13.12060546875, 14.5419921875, 15.96337890625, 17.384765625, 18.80615234375, 20.2275390625, 21.64892578125, 23.0703125, 24.49169921875, 25.9130859375, 27.33447265625, 28.755859375, 30.17724609375, 31.5986328125, 33.02001953125, 34.44140625, 35.86279296875, 37.2841796875, 38.70556640625, 40.126953125, 41.54833984375, 42.9697265625, 44.39111328125, 45.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 12.0, 25.0, 20.0, 29.0, 25.0, 23.0, 39.0, 36.0, 42.0, 66.0, 46.0, 40.0, 59.0, 41.0, 48.0, 45.0, 44.0, 44.0, 32.0, 32.0, 39.0, 35.0, 24.0, 29.0, 20.0, 13.0, 16.0, 10.0, 11.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.94921875, -7.73040771484375, -7.5115966796875, -7.29278564453125, -7.073974609375, -6.85516357421875, -6.6363525390625, -6.41754150390625, -6.19873046875, -5.97991943359375, -5.7611083984375, -5.54229736328125, -5.323486328125, -5.10467529296875, -4.8858642578125, -4.66705322265625, -4.4482421875, -4.22943115234375, -4.0106201171875, -3.79180908203125, -3.572998046875, -3.35418701171875, -3.1353759765625, -2.91656494140625, -2.69775390625, -2.47894287109375, -2.2601318359375, -2.04132080078125, -1.822509765625, -1.60369873046875, -1.3848876953125, -1.16607666015625, -0.947265625, -0.72845458984375, -0.5096435546875, -0.29083251953125, -0.072021484375, 0.14678955078125, 0.3656005859375, 0.58441162109375, 0.80322265625, 1.02203369140625, 1.2408447265625, 1.45965576171875, 1.678466796875, 1.89727783203125, 2.1160888671875, 2.33489990234375, 2.5537109375, 2.77252197265625, 2.9913330078125, 3.21014404296875, 3.428955078125, 3.64776611328125, 3.8665771484375, 4.08538818359375, 4.30419921875, 4.52301025390625, 4.7418212890625, 4.96063232421875, 5.179443359375, 5.39825439453125, 5.6170654296875, 5.83587646484375, 6.0546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 20.0, 17.0, 21.0, 30.0, 33.0, 37.0, 42.0, 45.0, 67.0, 69.0, 108.0, 148.0, 224.0, 339.0, 544.0, 1037.0, 2258.0, 5027.0, 15493.0, 74735.0, 2946855.0, 1061756.0, 62012.0, 13734.0, 4771.0, 2027.0, 1060.0, 559.0, 305.0, 231.0, 164.0, 104.0, 87.0, 55.0, 50.0, 41.0, 27.0, 25.0, 30.0, 17.0, 12.0, 11.0, 10.0, 7.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-71.875, -69.7578125, -67.640625, -65.5234375, -63.40625, -61.2890625, -59.171875, -57.0546875, -54.9375, -52.8203125, -50.703125, -48.5859375, -46.46875, -44.3515625, -42.234375, -40.1171875, -38.0, -35.8828125, -33.765625, -31.6484375, -29.53125, -27.4140625, -25.296875, -23.1796875, -21.0625, -18.9453125, -16.828125, -14.7109375, -12.59375, -10.4765625, -8.359375, -6.2421875, -4.125, -2.0078125, 0.109375, 2.2265625, 4.34375, 6.4609375, 8.578125, 10.6953125, 12.8125, 14.9296875, 17.046875, 19.1640625, 21.28125, 23.3984375, 25.515625, 27.6328125, 29.75, 31.8671875, 33.984375, 36.1015625, 38.21875, 40.3359375, 42.453125, 44.5703125, 46.6875, 48.8046875, 50.921875, 53.0390625, 55.15625, 57.2734375, 59.390625, 61.5078125, 63.625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 14.0, 5.0, 19.0, 62.0, 100.0, 195.0, 649.0, 2325.0, 380.0, 150.0, 63.0, 39.0, 23.0, 19.0, 9.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.184814453125, -42.02587890625, -40.866943359375, -39.7080078125, -38.549072265625, -37.39013671875, -36.231201171875, -35.072265625, -33.913330078125, -32.75439453125, -31.595458984375, -30.4365234375, -29.277587890625, -28.11865234375, -26.959716796875, -25.80078125, -24.641845703125, -23.48291015625, -22.323974609375, -21.1650390625, -20.006103515625, -18.84716796875, -17.688232421875, -16.529296875, -15.370361328125, -14.21142578125, -13.052490234375, -11.8935546875, -10.734619140625, -9.57568359375, -8.416748046875, -7.2578125, -6.098876953125, -4.93994140625, -3.781005859375, -2.6220703125, -1.463134765625, -0.30419921875, 0.854736328125, 2.013671875, 3.172607421875, 4.33154296875, 5.490478515625, 6.6494140625, 7.808349609375, 8.96728515625, 10.126220703125, 11.28515625, 12.444091796875, 13.60302734375, 14.761962890625, 15.9208984375, 17.079833984375, 18.23876953125, 19.397705078125, 20.556640625, 21.715576171875, 22.87451171875, 24.033447265625, 25.1923828125, 26.351318359375, 27.51025390625, 28.669189453125, 29.828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 14.0, 34.0, 70.0, 136.0, 209.0, 219.0, 156.0, 77.0, 37.0, 23.0, 15.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.14600372314453, -97.03350067138672, -88.9209976196289, -80.8084945678711, -72.69599151611328, -64.58348846435547, -56.470985412597656, -48.358482360839844, -40.24597930908203, -32.13347625732422, -24.020973205566406, -15.908470153808594, -7.795967102050781, 0.31653594970703125, 8.429039001464844, 16.541542053222656, 24.65404510498047, 32.76654815673828, 40.879051208496094, 48.991554260253906, 57.10405731201172, 65.21656036376953, 73.32906341552734, 81.44156646728516, 89.55406951904297, 97.66657257080078, 105.7790756225586, 113.8915786743164, 122.00408172607422, 130.1165771484375, 138.22909545898438, 146.34158325195312, 154.4541015625, 162.5666046142578, 170.67910766601562, 178.79161071777344, 186.90411376953125, 195.01661682128906, 203.12911987304688, 211.2416229248047, 219.3541259765625, 227.4666290283203, 235.57913208007812, 243.69163513183594, 251.80413818359375, 259.9166259765625, 268.0291442871094, 276.14166259765625, 284.254150390625, 292.36663818359375, 300.4791564941406, 308.5916748046875, 316.70416259765625, 324.816650390625, 332.9291687011719, 341.04168701171875, 349.1541748046875, 357.26666259765625, 365.3791809082031, 373.49169921875, 381.60418701171875, 389.7166748046875, 397.8291931152344, 405.94171142578125, 414.05419921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 3.0, 10.0, 7.0, 9.0, 11.0, 13.0, 18.0, 23.0, 29.0, 17.0, 30.0, 21.0, 33.0, 31.0, 32.0, 31.0, 42.0, 44.0, 38.0, 51.0, 40.0, 45.0, 33.0, 40.0, 40.0, 25.0, 25.0, 34.0, 24.0, 23.0, 21.0, 16.0, 18.0, 14.0, 15.0, 25.0, 10.0, 14.0, 5.0, 13.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-72.34542083740234, -70.24555206298828, -68.14569091796875, -66.04582214355469, -63.94595718383789, -61.846092224121094, -59.74622344970703, -57.646358489990234, -55.54649353027344, -53.44662857055664, -51.346763610839844, -49.24689483642578, -47.147029876708984, -45.04716491699219, -42.947296142578125, -40.84743118286133, -38.74756622314453, -36.647701263427734, -34.54783630371094, -32.447967529296875, -30.348102569580078, -28.24823760986328, -26.14837074279785, -24.048503875732422, -21.948638916015625, -19.848773956298828, -17.7489070892334, -15.649041175842285, -13.549175262451172, -11.449309349060059, -9.349443435668945, -7.249577522277832, -5.149715423583984, -3.049849510192871, -0.9499835968017578, 1.1498823165893555, 3.2497482299804688, 5.349614143371582, 7.449480056762695, 9.549345970153809, 11.649211883544922, 13.749077796936035, 15.848943710327148, 17.948810577392578, 20.048675537109375, 22.148540496826172, 24.2484073638916, 26.34827423095703, 28.448139190673828, 30.548004150390625, 32.64787292480469, 34.747737884521484, 36.84760284423828, 38.94746780395508, 41.047332763671875, 43.14720153808594, 45.247066497802734, 47.34693145751953, 49.446800231933594, 51.54666519165039, 53.64653015136719, 55.746395111083984, 57.84626007080078, 59.946128845214844, 62.04599380493164]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 13.0, 14.0, 38.0, 39.0, 57.0, 92.0, 141.0, 185.0, 389.0, 544.0, 919.0, 1722.0, 3140.0, 6254.0, 13382.0, 32580.0, 91712.0, 397513.0, 358154.0, 85201.0, 30840.0, 12652.0, 5942.0, 2985.0, 1615.0, 900.0, 539.0, 348.0, 222.0, 131.0, 73.0, 65.0, 36.0, 28.0, 23.0, 15.0, 14.0, 7.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.78125, -40.43212890625, -39.0830078125, -37.73388671875, -36.384765625, -35.03564453125, -33.6865234375, -32.33740234375, -30.98828125, -29.63916015625, -28.2900390625, -26.94091796875, -25.591796875, -24.24267578125, -22.8935546875, -21.54443359375, -20.1953125, -18.84619140625, -17.4970703125, -16.14794921875, -14.798828125, -13.44970703125, -12.1005859375, -10.75146484375, -9.40234375, -8.05322265625, -6.7041015625, -5.35498046875, -4.005859375, -2.65673828125, -1.3076171875, 0.04150390625, 1.390625, 2.73974609375, 4.0888671875, 5.43798828125, 6.787109375, 8.13623046875, 9.4853515625, 10.83447265625, 12.18359375, 13.53271484375, 14.8818359375, 16.23095703125, 17.580078125, 18.92919921875, 20.2783203125, 21.62744140625, 22.9765625, 24.32568359375, 25.6748046875, 27.02392578125, 28.373046875, 29.72216796875, 31.0712890625, 32.42041015625, 33.76953125, 35.11865234375, 36.4677734375, 37.81689453125, 39.166015625, 40.51513671875, 41.8642578125, 43.21337890625, 44.5625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 10.0, 5.0, 13.0, 13.0, 26.0, 22.0, 28.0, 39.0, 36.0, 38.0, 44.0, 49.0, 40.0, 57.0, 46.0, 45.0, 47.0, 42.0, 41.0, 48.0, 40.0, 38.0, 28.0, 24.0, 32.0, 18.0, 28.0, 9.0, 16.0, 11.0, 13.0, 6.0, 11.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.5390625, -7.31964111328125, -7.1002197265625, -6.88079833984375, -6.661376953125, -6.44195556640625, -6.2225341796875, -6.00311279296875, -5.78369140625, -5.56427001953125, -5.3448486328125, -5.12542724609375, -4.906005859375, -4.68658447265625, -4.4671630859375, -4.24774169921875, -4.0283203125, -3.80889892578125, -3.5894775390625, -3.37005615234375, -3.150634765625, -2.93121337890625, -2.7117919921875, -2.49237060546875, -2.27294921875, -2.05352783203125, -1.8341064453125, -1.61468505859375, -1.395263671875, -1.17584228515625, -0.9564208984375, -0.73699951171875, -0.517578125, -0.29815673828125, -0.0787353515625, 0.14068603515625, 0.360107421875, 0.57952880859375, 0.7989501953125, 1.01837158203125, 1.23779296875, 1.45721435546875, 1.6766357421875, 1.89605712890625, 2.115478515625, 2.33489990234375, 2.5543212890625, 2.77374267578125, 2.9931640625, 3.21258544921875, 3.4320068359375, 3.65142822265625, 3.870849609375, 4.09027099609375, 4.3096923828125, 4.52911376953125, 4.74853515625, 4.96795654296875, 5.1873779296875, 5.40679931640625, 5.626220703125, 5.84564208984375, 6.0650634765625, 6.28448486328125, 6.50390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 6.0, 6.0, 15.0, 8.0, 27.0, 25.0, 47.0, 53.0, 80.0, 131.0, 220.0, 326.0, 483.0, 768.0, 1352.0, 2267.0, 4538.0, 10369.0, 30607.0, 123809.0, 600582.0, 201603.0, 44520.0, 13989.0, 5652.0, 2858.0, 1597.0, 952.0, 608.0, 328.0, 214.0, 142.0, 98.0, 75.0, 49.0, 29.0, 24.0, 25.0, 11.0, 8.0, 8.0, 7.0, 9.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-42.46875, -41.16796875, -39.8671875, -38.56640625, -37.265625, -35.96484375, -34.6640625, -33.36328125, -32.0625, -30.76171875, -29.4609375, -28.16015625, -26.859375, -25.55859375, -24.2578125, -22.95703125, -21.65625, -20.35546875, -19.0546875, -17.75390625, -16.453125, -15.15234375, -13.8515625, -12.55078125, -11.25, -9.94921875, -8.6484375, -7.34765625, -6.046875, -4.74609375, -3.4453125, -2.14453125, -0.84375, 0.45703125, 1.7578125, 3.05859375, 4.359375, 5.66015625, 6.9609375, 8.26171875, 9.5625, 10.86328125, 12.1640625, 13.46484375, 14.765625, 16.06640625, 17.3671875, 18.66796875, 19.96875, 21.26953125, 22.5703125, 23.87109375, 25.171875, 26.47265625, 27.7734375, 29.07421875, 30.375, 31.67578125, 32.9765625, 34.27734375, 35.578125, 36.87890625, 38.1796875, 39.48046875, 40.78125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 12.0, 9.0, 22.0, 17.0, 28.0, 29.0, 52.0, 48.0, 45.0, 31.0, 72.0, 51.0, 69.0, 62.0, 60.0, 58.0, 42.0, 44.0, 52.0, 34.0, 36.0, 26.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.515625, -30.291259765625, -29.06689453125, -27.842529296875, -26.6181640625, -25.393798828125, -24.16943359375, -22.945068359375, -21.720703125, -20.496337890625, -19.27197265625, -18.047607421875, -16.8232421875, -15.598876953125, -14.37451171875, -13.150146484375, -11.92578125, -10.701416015625, -9.47705078125, -8.252685546875, -7.0283203125, -5.803955078125, -4.57958984375, -3.355224609375, -2.130859375, -0.906494140625, 0.31787109375, 1.542236328125, 2.7666015625, 3.990966796875, 5.21533203125, 6.439697265625, 7.6640625, 8.888427734375, 10.11279296875, 11.337158203125, 12.5615234375, 13.785888671875, 15.01025390625, 16.234619140625, 17.458984375, 18.683349609375, 19.90771484375, 21.132080078125, 22.3564453125, 23.580810546875, 24.80517578125, 26.029541015625, 27.25390625, 28.478271484375, 29.70263671875, 30.927001953125, 32.1513671875, 33.375732421875, 34.60009765625, 35.824462890625, 37.048828125, 38.273193359375, 39.49755859375, 40.721923828125, 41.9462890625, 43.170654296875, 44.39501953125, 45.619384765625, 46.84375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 14.0, 13.0, 19.0, 23.0, 47.0, 48.0, 101.0, 114.0, 182.0, 330.0, 524.0, 978.0, 1976.0, 4405.0, 11937.0, 41592.0, 286570.0, 591956.0, 77240.0, 18320.0, 6445.0, 2655.0, 1274.0, 715.0, 393.0, 239.0, 126.0, 82.0, 63.0, 42.0, 38.0, 20.0, 18.0, 14.0, 5.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.796875, -21.074951171875, -20.35302734375, -19.631103515625, -18.9091796875, -18.187255859375, -17.46533203125, -16.743408203125, -16.021484375, -15.299560546875, -14.57763671875, -13.855712890625, -13.1337890625, -12.411865234375, -11.68994140625, -10.968017578125, -10.24609375, -9.524169921875, -8.80224609375, -8.080322265625, -7.3583984375, -6.636474609375, -5.91455078125, -5.192626953125, -4.470703125, -3.748779296875, -3.02685546875, -2.304931640625, -1.5830078125, -0.861083984375, -0.13916015625, 0.582763671875, 1.3046875, 2.026611328125, 2.74853515625, 3.470458984375, 4.1923828125, 4.914306640625, 5.63623046875, 6.358154296875, 7.080078125, 7.802001953125, 8.52392578125, 9.245849609375, 9.9677734375, 10.689697265625, 11.41162109375, 12.133544921875, 12.85546875, 13.577392578125, 14.29931640625, 15.021240234375, 15.7431640625, 16.465087890625, 17.18701171875, 17.908935546875, 18.630859375, 19.352783203125, 20.07470703125, 20.796630859375, 21.5185546875, 22.240478515625, 22.96240234375, 23.684326171875, 24.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 18.0, 19.0, 64.0, 180.0, 400.0, 180.0, 60.0, 26.0, 17.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.018890380859375, -0.01849287748336792, -0.01809537410736084, -0.01769787073135376, -0.01730036735534668, -0.0169028639793396, -0.01650536060333252, -0.01610785722732544, -0.01571035385131836, -0.01531285047531128, -0.0149153470993042, -0.01451784372329712, -0.014120340347290039, -0.013722836971282959, -0.013325333595275879, -0.012927830219268799, -0.012530326843261719, -0.012132823467254639, -0.011735320091247559, -0.011337816715240479, -0.010940313339233398, -0.010542809963226318, -0.010145306587219238, -0.009747803211212158, -0.009350299835205078, -0.008952796459197998, -0.008555293083190918, -0.008157789707183838, -0.007760286331176758, -0.007362782955169678, -0.006965279579162598, -0.006567776203155518, -0.0061702728271484375, -0.005772769451141357, -0.005375266075134277, -0.004977762699127197, -0.004580259323120117, -0.004182755947113037, -0.003785252571105957, -0.003387749195098877, -0.002990245819091797, -0.002592742443084717, -0.0021952390670776367, -0.0017977356910705566, -0.0014002323150634766, -0.0010027289390563965, -0.0006052255630493164, -0.00020772218704223633, 0.00018978118896484375, 0.0005872845649719238, 0.000984787940979004, 0.001382291316986084, 0.001779794692993164, 0.002177298069000244, 0.0025748014450073242, 0.0029723048210144043, 0.0033698081970214844, 0.0037673115730285645, 0.0041648149490356445, 0.004562318325042725, 0.004959821701049805, 0.005357325077056885, 0.005754828453063965, 0.006152331829071045, 0.006549835205078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 11.0, 20.0, 30.0, 32.0, 63.0, 72.0, 134.0, 242.0, 374.0, 670.0, 1150.0, 2310.0, 5140.0, 13539.0, 44681.0, 276872.0, 581807.0, 85428.0, 21361.0, 7818.0, 3175.0, 1603.0, 806.0, 471.0, 266.0, 146.0, 110.0, 76.0, 32.0, 24.0, 26.0, 19.0, 11.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.5615234375, -17.966796875, -17.3720703125, -16.77734375, -16.1826171875, -15.587890625, -14.9931640625, -14.3984375, -13.8037109375, -13.208984375, -12.6142578125, -12.01953125, -11.4248046875, -10.830078125, -10.2353515625, -9.640625, -9.0458984375, -8.451171875, -7.8564453125, -7.26171875, -6.6669921875, -6.072265625, -5.4775390625, -4.8828125, -4.2880859375, -3.693359375, -3.0986328125, -2.50390625, -1.9091796875, -1.314453125, -0.7197265625, -0.125, 0.4697265625, 1.064453125, 1.6591796875, 2.25390625, 2.8486328125, 3.443359375, 4.0380859375, 4.6328125, 5.2275390625, 5.822265625, 6.4169921875, 7.01171875, 7.6064453125, 8.201171875, 8.7958984375, 9.390625, 9.9853515625, 10.580078125, 11.1748046875, 11.76953125, 12.3642578125, 12.958984375, 13.5537109375, 14.1484375, 14.7431640625, 15.337890625, 15.9326171875, 16.52734375, 17.1220703125, 17.716796875, 18.3115234375, 18.90625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 19.0, 35.0, 55.0, 62.0, 92.0, 119.0, 108.0, 106.0, 87.0, 79.0, 53.0, 29.0, 19.0, 14.0, 12.0, 13.0, 6.0, 4.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-18.21875, -17.7586669921875, -17.298583984375, -16.8385009765625, -16.37841796875, -15.9183349609375, -15.458251953125, -14.9981689453125, -14.5380859375, -14.0780029296875, -13.617919921875, -13.1578369140625, -12.69775390625, -12.2376708984375, -11.777587890625, -11.3175048828125, -10.857421875, -10.3973388671875, -9.937255859375, -9.4771728515625, -9.01708984375, -8.5570068359375, -8.096923828125, -7.6368408203125, -7.1767578125, -6.7166748046875, -6.256591796875, -5.7965087890625, -5.33642578125, -4.8763427734375, -4.416259765625, -3.9561767578125, -3.49609375, -3.0360107421875, -2.575927734375, -2.1158447265625, -1.65576171875, -1.1956787109375, -0.735595703125, -0.2755126953125, 0.1845703125, 0.6446533203125, 1.104736328125, 1.5648193359375, 2.02490234375, 2.4849853515625, 2.945068359375, 3.4051513671875, 3.865234375, 4.3253173828125, 4.785400390625, 5.2454833984375, 5.70556640625, 6.1656494140625, 6.625732421875, 7.0858154296875, 7.5458984375, 8.0059814453125, 8.466064453125, 8.9261474609375, 9.38623046875, 9.8463134765625, 10.306396484375, 10.7664794921875, 11.2265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 16.0, 25.0, 46.0, 65.0, 113.0, 128.0, 141.0, 135.0, 114.0, 72.0, 66.0, 23.0, 25.0, 13.0, 10.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.1841735839844, -294.5325622558594, -284.8809814453125, -275.2293701171875, -265.5777587890625, -255.92616271972656, -246.27456665039062, -236.62295532226562, -226.9713592529297, -217.31976318359375, -207.66815185546875, -198.0165557861328, -188.36495971679688, -178.71334838867188, -169.06175231933594, -159.41015625, -149.758544921875, -140.10694885253906, -130.45533752441406, -120.80374145507812, -111.15213775634766, -101.50053405761719, -91.84893798828125, -82.19733428955078, -72.54573059082031, -62.894126892089844, -53.24252700805664, -43.59092712402344, -33.93932342529297, -24.2877197265625, -14.636119842529297, -4.984519958496094, 4.667083740234375, 14.318685531616211, 23.970287322998047, 33.62188720703125, 43.27349090576172, 52.92509460449219, 62.57669448852539, 72.2282943725586, 81.87989807128906, 91.53150177001953, 101.18310546875, 110.83470153808594, 120.4863052368164, 130.13790893554688, 139.7895050048828, 149.44110107421875, 159.09271240234375, 168.7443084716797, 178.3959197998047, 188.04751586914062, 197.69912719726562, 207.35072326660156, 217.0023193359375, 226.6539306640625, 236.30552673339844, 245.95712280273438, 255.60873413085938, 265.2603454589844, 274.91192626953125, 284.56353759765625, 294.21514892578125, 303.8667297363281, 313.5183410644531]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 10.0, 8.0, 5.0, 13.0, 17.0, 19.0, 18.0, 35.0, 16.0, 22.0, 35.0, 33.0, 49.0, 43.0, 34.0, 42.0, 41.0, 51.0, 40.0, 41.0, 41.0, 40.0, 42.0, 42.0, 34.0, 26.0, 34.0, 26.0, 22.0, 15.0, 17.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 8.0, 3.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-171.1358642578125, -166.36476135253906, -161.59365844726562, -156.8225555419922, -152.05145263671875, -147.28036499023438, -142.50926208496094, -137.7381591796875, -132.96705627441406, -128.19595336914062, -123.42485046386719, -118.65375518798828, -113.88265228271484, -109.1115493774414, -104.3404541015625, -99.56935119628906, -94.79824829101562, -90.02714538574219, -85.25604248046875, -80.48494720458984, -75.7138442993164, -70.94274139404297, -66.17164611816406, -61.400543212890625, -56.62944030761719, -51.85833740234375, -47.08723831176758, -42.316139221191406, -37.54503631591797, -32.77393341064453, -28.00283432006836, -23.231735229492188, -18.460617065429688, -13.689516067504883, -8.918415069580078, -4.147314071655273, 0.6237869262695312, 5.394887924194336, 10.16598892211914, 14.937088012695312, 19.70819091796875, 24.479291915893555, 29.25039291381836, 34.02149200439453, 38.79259490966797, 43.563697814941406, 48.33479690551758, 53.10589599609375, 57.87699890136719, 62.648101806640625, 67.41920471191406, 72.19029998779297, 76.9614028930664, 81.73250579833984, 86.50360107421875, 91.27470397949219, 96.04580688476562, 100.81690979003906, 105.5880126953125, 110.3591079711914, 115.13021087646484, 119.90131378173828, 124.67240905761719, 129.44351196289062, 134.21461486816406]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 2.0, 6.0, 6.0, 17.0, 15.0, 34.0, 36.0, 52.0, 81.0, 103.0, 154.0, 253.0, 404.0, 669.0, 1215.0, 2237.0, 4708.0, 10735.0, 32251.0, 236190.0, 3794677.0, 77477.0, 18548.0, 7120.0, 3282.0, 1661.0, 873.0, 549.0, 342.0, 218.0, 125.0, 86.0, 39.0, 38.0, 26.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.25, -74.2041015625, -72.158203125, -70.1123046875, -68.06640625, -66.0205078125, -63.974609375, -61.9287109375, -59.8828125, -57.8369140625, -55.791015625, -53.7451171875, -51.69921875, -49.6533203125, -47.607421875, -45.5615234375, -43.515625, -41.4697265625, -39.423828125, -37.3779296875, -35.33203125, -33.2861328125, -31.240234375, -29.1943359375, -27.1484375, -25.1025390625, -23.056640625, -21.0107421875, -18.96484375, -16.9189453125, -14.873046875, -12.8271484375, -10.78125, -8.7353515625, -6.689453125, -4.6435546875, -2.59765625, -0.5517578125, 1.494140625, 3.5400390625, 5.5859375, 7.6318359375, 9.677734375, 11.7236328125, 13.76953125, 15.8154296875, 17.861328125, 19.9072265625, 21.953125, 23.9990234375, 26.044921875, 28.0908203125, 30.13671875, 32.1826171875, 34.228515625, 36.2744140625, 38.3203125, 40.3662109375, 42.412109375, 44.4580078125, 46.50390625, 48.5498046875, 50.595703125, 52.6416015625, 54.6875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 14.0, 15.0, 8.0, 17.0, 15.0, 20.0, 34.0, 39.0, 42.0, 46.0, 44.0, 57.0, 58.0, 36.0, 51.0, 45.0, 42.0, 52.0, 44.0, 55.0, 46.0, 33.0, 37.0, 29.0, 23.0, 14.0, 24.0, 11.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0523681640625, -7.792236328125, -7.5321044921875, -7.27197265625, -7.0118408203125, -6.751708984375, -6.4915771484375, -6.2314453125, -5.9713134765625, -5.711181640625, -5.4510498046875, -5.19091796875, -4.9307861328125, -4.670654296875, -4.4105224609375, -4.150390625, -3.8902587890625, -3.630126953125, -3.3699951171875, -3.10986328125, -2.8497314453125, -2.589599609375, -2.3294677734375, -2.0693359375, -1.8092041015625, -1.549072265625, -1.2889404296875, -1.02880859375, -0.7686767578125, -0.508544921875, -0.2484130859375, 0.01171875, 0.2718505859375, 0.531982421875, 0.7921142578125, 1.05224609375, 1.3123779296875, 1.572509765625, 1.8326416015625, 2.0927734375, 2.3529052734375, 2.613037109375, 2.8731689453125, 3.13330078125, 3.3934326171875, 3.653564453125, 3.9136962890625, 4.173828125, 4.4339599609375, 4.694091796875, 4.9542236328125, 5.21435546875, 5.4744873046875, 5.734619140625, 5.9947509765625, 6.2548828125, 6.5150146484375, 6.775146484375, 7.0352783203125, 7.29541015625, 7.5555419921875, 7.815673828125, 8.0758056640625, 8.3359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 16.0, 18.0, 22.0, 21.0, 45.0, 53.0, 76.0, 140.0, 200.0, 342.0, 569.0, 1052.0, 2346.0, 6104.0, 20481.0, 143394.0, 3863223.0, 125591.0, 19523.0, 6054.0, 2356.0, 1124.0, 582.0, 323.0, 181.0, 146.0, 78.0, 52.0, 33.0, 22.0, 18.0, 14.0, 15.0, 7.0, 5.0, 5.0, 7.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-91.8125, -89.1494140625, -86.486328125, -83.8232421875, -81.16015625, -78.4970703125, -75.833984375, -73.1708984375, -70.5078125, -67.8447265625, -65.181640625, -62.5185546875, -59.85546875, -57.1923828125, -54.529296875, -51.8662109375, -49.203125, -46.5400390625, -43.876953125, -41.2138671875, -38.55078125, -35.8876953125, -33.224609375, -30.5615234375, -27.8984375, -25.2353515625, -22.572265625, -19.9091796875, -17.24609375, -14.5830078125, -11.919921875, -9.2568359375, -6.59375, -3.9306640625, -1.267578125, 1.3955078125, 4.05859375, 6.7216796875, 9.384765625, 12.0478515625, 14.7109375, 17.3740234375, 20.037109375, 22.7001953125, 25.36328125, 28.0263671875, 30.689453125, 33.3525390625, 36.015625, 38.6787109375, 41.341796875, 44.0048828125, 46.66796875, 49.3310546875, 51.994140625, 54.6572265625, 57.3203125, 59.9833984375, 62.646484375, 65.3095703125, 67.97265625, 70.6357421875, 73.298828125, 75.9619140625, 78.625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 17.0, 30.0, 33.0, 92.0, 223.0, 988.0, 2253.0, 228.0, 84.0, 33.0, 25.0, 14.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.994140625, -47.80078125, -46.607421875, -45.4140625, -44.220703125, -43.02734375, -41.833984375, -40.640625, -39.447265625, -38.25390625, -37.060546875, -35.8671875, -34.673828125, -33.48046875, -32.287109375, -31.09375, -29.900390625, -28.70703125, -27.513671875, -26.3203125, -25.126953125, -23.93359375, -22.740234375, -21.546875, -20.353515625, -19.16015625, -17.966796875, -16.7734375, -15.580078125, -14.38671875, -13.193359375, -12.0, -10.806640625, -9.61328125, -8.419921875, -7.2265625, -6.033203125, -4.83984375, -3.646484375, -2.453125, -1.259765625, -0.06640625, 1.126953125, 2.3203125, 3.513671875, 4.70703125, 5.900390625, 7.09375, 8.287109375, 9.48046875, 10.673828125, 11.8671875, 13.060546875, 14.25390625, 15.447265625, 16.640625, 17.833984375, 19.02734375, 20.220703125, 21.4140625, 22.607421875, 23.80078125, 24.994140625, 26.1875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 17.0, 36.0, 105.0, 272.0, 328.0, 171.0, 46.0, 15.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-497.5877380371094, -486.80401611328125, -476.0202941894531, -465.236572265625, -454.4528503417969, -443.66912841796875, -432.88543701171875, -422.1017150878906, -411.3179931640625, -400.5342712402344, -389.75054931640625, -378.9668273925781, -368.18310546875, -357.3994140625, -346.61566162109375, -335.83197021484375, -325.0482177734375, -314.2644958496094, -303.48077392578125, -292.6970520019531, -281.913330078125, -271.129638671875, -260.34588623046875, -249.56219482421875, -238.77847290039062, -227.9947509765625, -217.21102905273438, -206.42730712890625, -195.6436004638672, -184.85987854003906, -174.07615661621094, -163.29244995117188, -152.5087432861328, -141.7250213623047, -130.94129943847656, -120.15758514404297, -109.37387084960938, -98.59014892578125, -87.80642700195312, -77.02271270751953, -66.2389907836914, -55.45527267456055, -44.67155456542969, -33.88783264160156, -23.104114532470703, -12.320396423339844, -1.5366744995117188, 9.247039794921875, 20.03076171875, 30.81447982788086, 41.59819793701172, 52.381919860839844, 63.1656379699707, 73.94935607910156, 84.73307800292969, 95.51679229736328, 106.3005142211914, 117.08423614501953, 127.86795043945312, 138.65167236328125, 149.43539428710938, 160.2191162109375, 171.00283813476562, 181.7865447998047, 192.5702667236328]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 13.0, 21.0, 9.0, 19.0, 22.0, 30.0, 34.0, 40.0, 40.0, 40.0, 49.0, 54.0, 50.0, 54.0, 49.0, 46.0, 46.0, 42.0, 47.0, 43.0, 39.0, 31.0, 23.0, 26.0, 24.0, 20.0, 9.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.95223999023438, -70.51971435546875, -68.0871810913086, -65.65465545654297, -63.22212600708008, -60.78959655761719, -58.35707092285156, -55.92454147338867, -53.49201202392578, -51.05948257446289, -48.626953125, -46.194427490234375, -43.761898040771484, -41.329368591308594, -38.89684295654297, -36.46431350708008, -34.03178405761719, -31.599254608154297, -29.16672706604004, -26.73419952392578, -24.30167007446289, -21.869140625, -19.436613082885742, -17.004085540771484, -14.571556091308594, -12.13902759552002, -9.706499099731445, -7.273970603942871, -4.841442108154297, -2.4089136123657227, 0.023614883422851562, 2.4561424255371094, 4.888671875, 7.321200370788574, 9.753728866577148, 12.186257362365723, 14.618785858154297, 17.051315307617188, 19.483842849731445, 21.916370391845703, 24.348899841308594, 26.781429290771484, 29.213956832885742, 31.646484375, 34.07901382446289, 36.51154327392578, 38.944068908691406, 41.3765983581543, 43.80912780761719, 46.24165725708008, 48.67418670654297, 51.106712341308594, 53.539241790771484, 55.971771240234375, 58.404296875, 60.83682632446289, 63.26935577392578, 65.7018814086914, 68.13441467285156, 70.56694030761719, 72.99946594238281, 75.43199920654297, 77.8645248413086, 80.29705810546875, 82.72958374023438]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 0.0, 1.0, 10.0, 12.0, 19.0, 15.0, 22.0, 49.0, 55.0, 91.0, 116.0, 187.0, 273.0, 346.0, 558.0, 885.0, 1421.0, 2339.0, 3864.0, 6781.0, 13252.0, 26668.0, 57851.0, 145256.0, 408541.0, 224001.0, 81783.0, 35703.0, 17219.0, 8670.0, 4855.0, 2850.0, 1689.0, 1037.0, 685.0, 437.0, 310.0, 192.0, 131.0, 108.0, 79.0, 46.0, 42.0, 36.0, 29.0, 13.0, 6.0, 10.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-27.3125, -26.501953125, -25.69140625, -24.880859375, -24.0703125, -23.259765625, -22.44921875, -21.638671875, -20.828125, -20.017578125, -19.20703125, -18.396484375, -17.5859375, -16.775390625, -15.96484375, -15.154296875, -14.34375, -13.533203125, -12.72265625, -11.912109375, -11.1015625, -10.291015625, -9.48046875, -8.669921875, -7.859375, -7.048828125, -6.23828125, -5.427734375, -4.6171875, -3.806640625, -2.99609375, -2.185546875, -1.375, -0.564453125, 0.24609375, 1.056640625, 1.8671875, 2.677734375, 3.48828125, 4.298828125, 5.109375, 5.919921875, 6.73046875, 7.541015625, 8.3515625, 9.162109375, 9.97265625, 10.783203125, 11.59375, 12.404296875, 13.21484375, 14.025390625, 14.8359375, 15.646484375, 16.45703125, 17.267578125, 18.078125, 18.888671875, 19.69921875, 20.509765625, 21.3203125, 22.130859375, 22.94140625, 23.751953125, 24.5625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 18.0, 24.0, 14.0, 25.0, 34.0, 25.0, 39.0, 33.0, 39.0, 31.0, 25.0, 36.0, 47.0, 37.0, 43.0, 46.0, 42.0, 43.0, 40.0, 29.0, 33.0, 30.0, 30.0, 23.0, 25.0, 24.0, 19.0, 12.0, 8.0, 14.0, 9.0, 5.0, 9.0, 6.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-7.71875, -7.4967041015625, -7.274658203125, -7.0526123046875, -6.83056640625, -6.6085205078125, -6.386474609375, -6.1644287109375, -5.9423828125, -5.7203369140625, -5.498291015625, -5.2762451171875, -5.05419921875, -4.8321533203125, -4.610107421875, -4.3880615234375, -4.166015625, -3.9439697265625, -3.721923828125, -3.4998779296875, -3.27783203125, -3.0557861328125, -2.833740234375, -2.6116943359375, -2.3896484375, -2.1676025390625, -1.945556640625, -1.7235107421875, -1.50146484375, -1.2794189453125, -1.057373046875, -0.8353271484375, -0.61328125, -0.3912353515625, -0.169189453125, 0.0528564453125, 0.27490234375, 0.4969482421875, 0.718994140625, 0.9410400390625, 1.1630859375, 1.3851318359375, 1.607177734375, 1.8292236328125, 2.05126953125, 2.2733154296875, 2.495361328125, 2.7174072265625, 2.939453125, 3.1614990234375, 3.383544921875, 3.6055908203125, 3.82763671875, 4.0496826171875, 4.271728515625, 4.4937744140625, 4.7158203125, 4.9378662109375, 5.159912109375, 5.3819580078125, 5.60400390625, 5.8260498046875, 6.048095703125, 6.2701416015625, 6.4921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 17.0, 19.0, 27.0, 35.0, 53.0, 76.0, 126.0, 191.0, 293.0, 533.0, 895.0, 1561.0, 2923.0, 6259.0, 15001.0, 41950.0, 175214.0, 624114.0, 122420.0, 33123.0, 12354.0, 5306.0, 2652.0, 1330.0, 740.0, 480.0, 289.0, 167.0, 128.0, 69.0, 54.0, 34.0, 21.0, 15.0, 18.0, 12.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-43.71875, -42.40966796875, -41.1005859375, -39.79150390625, -38.482421875, -37.17333984375, -35.8642578125, -34.55517578125, -33.24609375, -31.93701171875, -30.6279296875, -29.31884765625, -28.009765625, -26.70068359375, -25.3916015625, -24.08251953125, -22.7734375, -21.46435546875, -20.1552734375, -18.84619140625, -17.537109375, -16.22802734375, -14.9189453125, -13.60986328125, -12.30078125, -10.99169921875, -9.6826171875, -8.37353515625, -7.064453125, -5.75537109375, -4.4462890625, -3.13720703125, -1.828125, -0.51904296875, 0.7900390625, 2.09912109375, 3.408203125, 4.71728515625, 6.0263671875, 7.33544921875, 8.64453125, 9.95361328125, 11.2626953125, 12.57177734375, 13.880859375, 15.18994140625, 16.4990234375, 17.80810546875, 19.1171875, 20.42626953125, 21.7353515625, 23.04443359375, 24.353515625, 25.66259765625, 26.9716796875, 28.28076171875, 29.58984375, 30.89892578125, 32.2080078125, 33.51708984375, 34.826171875, 36.13525390625, 37.4443359375, 38.75341796875, 40.0625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 4.0, 9.0, 10.0, 19.0, 19.0, 31.0, 32.0, 40.0, 55.0, 53.0, 55.0, 59.0, 67.0, 74.0, 63.0, 64.0, 61.0, 42.0, 47.0, 33.0, 26.0, 29.0, 22.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.46875, -48.88427734375, -47.2998046875, -45.71533203125, -44.130859375, -42.54638671875, -40.9619140625, -39.37744140625, -37.79296875, -36.20849609375, -34.6240234375, -33.03955078125, -31.455078125, -29.87060546875, -28.2861328125, -26.70166015625, -25.1171875, -23.53271484375, -21.9482421875, -20.36376953125, -18.779296875, -17.19482421875, -15.6103515625, -14.02587890625, -12.44140625, -10.85693359375, -9.2724609375, -7.68798828125, -6.103515625, -4.51904296875, -2.9345703125, -1.35009765625, 0.234375, 1.81884765625, 3.4033203125, 4.98779296875, 6.572265625, 8.15673828125, 9.7412109375, 11.32568359375, 12.91015625, 14.49462890625, 16.0791015625, 17.66357421875, 19.248046875, 20.83251953125, 22.4169921875, 24.00146484375, 25.5859375, 27.17041015625, 28.7548828125, 30.33935546875, 31.923828125, 33.50830078125, 35.0927734375, 36.67724609375, 38.26171875, 39.84619140625, 41.4306640625, 43.01513671875, 44.599609375, 46.18408203125, 47.7685546875, 49.35302734375, 50.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 17.0, 21.0, 33.0, 35.0, 37.0, 65.0, 82.0, 155.0, 231.0, 393.0, 631.0, 1192.0, 2055.0, 4010.0, 8994.0, 24223.0, 95114.0, 565868.0, 269306.0, 48105.0, 14957.0, 6213.0, 2909.0, 1560.0, 849.0, 531.0, 295.0, 202.0, 147.0, 88.0, 51.0, 47.0, 30.0, 18.0, 9.0, 13.0, 12.0, 6.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.171875, -18.604248046875, -18.03662109375, -17.468994140625, -16.9013671875, -16.333740234375, -15.76611328125, -15.198486328125, -14.630859375, -14.063232421875, -13.49560546875, -12.927978515625, -12.3603515625, -11.792724609375, -11.22509765625, -10.657470703125, -10.08984375, -9.522216796875, -8.95458984375, -8.386962890625, -7.8193359375, -7.251708984375, -6.68408203125, -6.116455078125, -5.548828125, -4.981201171875, -4.41357421875, -3.845947265625, -3.2783203125, -2.710693359375, -2.14306640625, -1.575439453125, -1.0078125, -0.440185546875, 0.12744140625, 0.695068359375, 1.2626953125, 1.830322265625, 2.39794921875, 2.965576171875, 3.533203125, 4.100830078125, 4.66845703125, 5.236083984375, 5.8037109375, 6.371337890625, 6.93896484375, 7.506591796875, 8.07421875, 8.641845703125, 9.20947265625, 9.777099609375, 10.3447265625, 10.912353515625, 11.47998046875, 12.047607421875, 12.615234375, 13.182861328125, 13.75048828125, 14.318115234375, 14.8857421875, 15.453369140625, 16.02099609375, 16.588623046875, 17.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 13.0, 14.0, 15.0, 40.0, 81.0, 342.0, 316.0, 81.0, 27.0, 25.0, 16.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013065934181213379, -0.012681245803833008, -0.012296557426452637, -0.011911869049072266, -0.011527180671691895, -0.011142492294311523, -0.010757803916931152, -0.010373115539550781, -0.00998842716217041, -0.009603738784790039, -0.009219050407409668, -0.008834362030029297, -0.008449673652648926, -0.008064985275268555, -0.007680296897888184, -0.0072956085205078125, -0.006910920143127441, -0.00652623176574707, -0.006141543388366699, -0.005756855010986328, -0.005372166633605957, -0.004987478256225586, -0.004602789878845215, -0.004218101501464844, -0.0038334131240844727, -0.0034487247467041016, -0.0030640363693237305, -0.0026793479919433594, -0.0022946596145629883, -0.0019099712371826172, -0.001525282859802246, -0.001140594482421875, -0.0007559061050415039, -0.0003712177276611328, 1.3470649719238281e-05, 0.0003981590270996094, 0.0007828474044799805, 0.0011675357818603516, 0.0015522241592407227, 0.0019369125366210938, 0.002321600914001465, 0.002706289291381836, 0.003090977668762207, 0.003475666046142578, 0.0038603544235229492, 0.00424504280090332, 0.004629731178283691, 0.0050144195556640625, 0.005399107933044434, 0.005783796310424805, 0.006168484687805176, 0.006553173065185547, 0.006937861442565918, 0.007322549819946289, 0.00770723819732666, 0.008091926574707031, 0.008476614952087402, 0.008861303329467773, 0.009245991706848145, 0.009630680084228516, 0.010015368461608887, 0.010400056838989258, 0.010784745216369629, 0.01116943359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 20.0, 35.0, 53.0, 54.0, 109.0, 163.0, 319.0, 557.0, 1103.0, 2364.0, 6106.0, 19826.0, 98932.0, 732409.0, 148827.0, 24762.0, 7344.0, 2849.0, 1210.0, 640.0, 338.0, 205.0, 107.0, 58.0, 43.0, 31.0, 16.0, 10.0, 15.0, 9.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.53564453125, -25.7900390625, -25.04443359375, -24.298828125, -23.55322265625, -22.8076171875, -22.06201171875, -21.31640625, -20.57080078125, -19.8251953125, -19.07958984375, -18.333984375, -17.58837890625, -16.8427734375, -16.09716796875, -15.3515625, -14.60595703125, -13.8603515625, -13.11474609375, -12.369140625, -11.62353515625, -10.8779296875, -10.13232421875, -9.38671875, -8.64111328125, -7.8955078125, -7.14990234375, -6.404296875, -5.65869140625, -4.9130859375, -4.16748046875, -3.421875, -2.67626953125, -1.9306640625, -1.18505859375, -0.439453125, 0.30615234375, 1.0517578125, 1.79736328125, 2.54296875, 3.28857421875, 4.0341796875, 4.77978515625, 5.525390625, 6.27099609375, 7.0166015625, 7.76220703125, 8.5078125, 9.25341796875, 9.9990234375, 10.74462890625, 11.490234375, 12.23583984375, 12.9814453125, 13.72705078125, 14.47265625, 15.21826171875, 15.9638671875, 16.70947265625, 17.455078125, 18.20068359375, 18.9462890625, 19.69189453125, 20.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 11.0, 13.0, 37.0, 52.0, 69.0, 82.0, 133.0, 130.0, 119.0, 94.0, 63.0, 44.0, 32.0, 20.0, 13.0, 12.0, 5.0, 10.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.796875, -18.202392578125, -17.60791015625, -17.013427734375, -16.4189453125, -15.824462890625, -15.22998046875, -14.635498046875, -14.041015625, -13.446533203125, -12.85205078125, -12.257568359375, -11.6630859375, -11.068603515625, -10.47412109375, -9.879638671875, -9.28515625, -8.690673828125, -8.09619140625, -7.501708984375, -6.9072265625, -6.312744140625, -5.71826171875, -5.123779296875, -4.529296875, -3.934814453125, -3.34033203125, -2.745849609375, -2.1513671875, -1.556884765625, -0.96240234375, -0.367919921875, 0.2265625, 0.821044921875, 1.41552734375, 2.010009765625, 2.6044921875, 3.198974609375, 3.79345703125, 4.387939453125, 4.982421875, 5.576904296875, 6.17138671875, 6.765869140625, 7.3603515625, 7.954833984375, 8.54931640625, 9.143798828125, 9.73828125, 10.332763671875, 10.92724609375, 11.521728515625, 12.1162109375, 12.710693359375, 13.30517578125, 13.899658203125, 14.494140625, 15.088623046875, 15.68310546875, 16.277587890625, 16.8720703125, 17.466552734375, 18.06103515625, 18.655517578125, 19.25]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 23.0, 67.0, 177.0, 331.0, 236.0, 110.0, 47.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.3223876953125, -163.19183349609375, -142.061279296875, -120.93071746826172, -99.80016326904297, -78.66960906982422, -57.53904724121094, -36.40849304199219, -15.277938842773438, 5.852617263793945, 26.983173370361328, 48.113731384277344, 69.2442855834961, 90.37483978271484, 111.50540161132812, 132.63595581054688, 153.76651000976562, 174.89706420898438, 196.02761840820312, 217.15817260742188, 238.28872680664062, 259.4192810058594, 280.54986572265625, 301.680419921875, 322.81097412109375, 343.9415283203125, 365.07208251953125, 386.20263671875, 407.33319091796875, 428.4637451171875, 449.59429931640625, 470.724853515625, 491.85540771484375, 512.9859619140625, 534.1165161132812, 555.2470703125, 576.3776245117188, 597.5081787109375, 618.6387329101562, 639.769287109375, 660.8998413085938, 682.0303955078125, 703.1609497070312, 724.29150390625, 745.4220581054688, 766.5526123046875, 787.6831665039062, 808.813720703125, 829.9443359375, 851.0748901367188, 872.2054443359375, 893.3359985351562, 914.466552734375, 935.5971069335938, 956.7276611328125, 977.8582153320312, 998.98876953125, 1020.1193237304688, 1041.2498779296875, 1062.3804931640625, 1083.510986328125, 1104.6416015625, 1125.7720947265625, 1146.9027099609375, 1168.033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 8.0, 6.0, 7.0, 7.0, 10.0, 18.0, 13.0, 14.0, 19.0, 21.0, 25.0, 24.0, 24.0, 25.0, 34.0, 39.0, 38.0, 29.0, 38.0, 37.0, 42.0, 36.0, 48.0, 44.0, 36.0, 34.0, 38.0, 38.0, 31.0, 28.0, 19.0, 21.0, 20.0, 22.0, 16.0, 13.0, 15.0, 5.0, 10.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-159.8803253173828, -154.90208435058594, -149.92385864257812, -144.94561767578125, -139.96737670898438, -134.9891357421875, -130.01089477539062, -125.03266906738281, -120.05442810058594, -115.07618713378906, -110.09795379638672, -105.11972045898438, -100.1414794921875, -95.16323852539062, -90.18500518798828, -85.20677185058594, -80.22853088378906, -75.25028991699219, -70.27205657958984, -65.2938232421875, -60.315582275390625, -55.337345123291016, -50.359107971191406, -45.3808708190918, -40.40263366699219, -35.42439651489258, -30.44615936279297, -25.46792221069336, -20.48968505859375, -15.51144790649414, -10.533210754394531, -5.554973602294922, -0.57672119140625, 4.401515960693359, 9.379753112792969, 14.357990264892578, 19.336227416992188, 24.314464569091797, 29.292701721191406, 34.270938873291016, 39.249176025390625, 44.227413177490234, 49.205650329589844, 54.18388748168945, 59.16212463378906, 64.14036560058594, 69.11859893798828, 74.09683227539062, 79.0750732421875, 84.05331420898438, 89.03154754638672, 94.00978088378906, 98.98802185058594, 103.96626281738281, 108.94449615478516, 113.9227294921875, 118.90097045898438, 123.87921142578125, 128.85745239257812, 133.83567810058594, 138.8139190673828, 143.7921600341797, 148.7703857421875, 153.74862670898438, 158.72686767578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 4.0, 12.0, 16.0, 27.0, 27.0, 34.0, 65.0, 74.0, 101.0, 114.0, 178.0, 248.0, 347.0, 444.0, 705.0, 1101.0, 1795.0, 3163.0, 5883.0, 12140.0, 30468.0, 109577.0, 3737310.0, 213040.0, 43991.0, 16193.0, 7428.0, 3729.0, 2175.0, 1313.0, 772.0, 504.0, 341.0, 258.0, 185.0, 122.0, 89.0, 71.0, 52.0, 33.0, 37.0, 13.0, 17.0, 8.0, 11.0, 9.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0], "bins": [-66.375, -64.3427734375, -62.310546875, -60.2783203125, -58.24609375, -56.2138671875, -54.181640625, -52.1494140625, -50.1171875, -48.0849609375, -46.052734375, -44.0205078125, -41.98828125, -39.9560546875, -37.923828125, -35.8916015625, -33.859375, -31.8271484375, -29.794921875, -27.7626953125, -25.73046875, -23.6982421875, -21.666015625, -19.6337890625, -17.6015625, -15.5693359375, -13.537109375, -11.5048828125, -9.47265625, -7.4404296875, -5.408203125, -3.3759765625, -1.34375, 0.6884765625, 2.720703125, 4.7529296875, 6.78515625, 8.8173828125, 10.849609375, 12.8818359375, 14.9140625, 16.9462890625, 18.978515625, 21.0107421875, 23.04296875, 25.0751953125, 27.107421875, 29.1396484375, 31.171875, 33.2041015625, 35.236328125, 37.2685546875, 39.30078125, 41.3330078125, 43.365234375, 45.3974609375, 47.4296875, 49.4619140625, 51.494140625, 53.5263671875, 55.55859375, 57.5908203125, 59.623046875, 61.6552734375, 63.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 7.0, 5.0, 6.0, 7.0, 8.0, 10.0, 15.0, 8.0, 19.0, 23.0, 14.0, 28.0, 28.0, 32.0, 28.0, 32.0, 38.0, 29.0, 34.0, 39.0, 42.0, 39.0, 41.0, 38.0, 46.0, 39.0, 53.0, 36.0, 32.0, 32.0, 29.0, 23.0, 19.0, 16.0, 19.0, 17.0, 9.0, 15.0, 8.0, 9.0, 10.0, 1.0, 5.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.39453125, -7.16351318359375, -6.9324951171875, -6.70147705078125, -6.470458984375, -6.23944091796875, -6.0084228515625, -5.77740478515625, -5.54638671875, -5.31536865234375, -5.0843505859375, -4.85333251953125, -4.622314453125, -4.39129638671875, -4.1602783203125, -3.92926025390625, -3.6982421875, -3.46722412109375, -3.2362060546875, -3.00518798828125, -2.774169921875, -2.54315185546875, -2.3121337890625, -2.08111572265625, -1.85009765625, -1.61907958984375, -1.3880615234375, -1.15704345703125, -0.926025390625, -0.69500732421875, -0.4639892578125, -0.23297119140625, -0.001953125, 0.22906494140625, 0.4600830078125, 0.69110107421875, 0.922119140625, 1.15313720703125, 1.3841552734375, 1.61517333984375, 1.84619140625, 2.07720947265625, 2.3082275390625, 2.53924560546875, 2.770263671875, 3.00128173828125, 3.2322998046875, 3.46331787109375, 3.6943359375, 3.92535400390625, 4.1563720703125, 4.38739013671875, 4.618408203125, 4.84942626953125, 5.0804443359375, 5.31146240234375, 5.54248046875, 5.77349853515625, 6.0045166015625, 6.23553466796875, 6.466552734375, 6.69757080078125, 6.9285888671875, 7.15960693359375, 7.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 12.0, 11.0, 9.0, 17.0, 22.0, 22.0, 32.0, 52.0, 51.0, 68.0, 76.0, 120.0, 124.0, 186.0, 193.0, 262.0, 342.0, 426.0, 610.0, 895.0, 1483.0, 3126.0, 7892.0, 27869.0, 238192.0, 3801709.0, 82641.0, 16205.0, 5064.0, 2206.0, 1211.0, 705.0, 529.0, 404.0, 281.0, 258.0, 211.0, 172.0, 114.0, 108.0, 82.0, 75.0, 49.0, 38.0, 39.0, 19.0, 24.0, 14.0, 12.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-105.0, -101.6455078125, -98.291015625, -94.9365234375, -91.58203125, -88.2275390625, -84.873046875, -81.5185546875, -78.1640625, -74.8095703125, -71.455078125, -68.1005859375, -64.74609375, -61.3916015625, -58.037109375, -54.6826171875, -51.328125, -47.9736328125, -44.619140625, -41.2646484375, -37.91015625, -34.5556640625, -31.201171875, -27.8466796875, -24.4921875, -21.1376953125, -17.783203125, -14.4287109375, -11.07421875, -7.7197265625, -4.365234375, -1.0107421875, 2.34375, 5.6982421875, 9.052734375, 12.4072265625, 15.76171875, 19.1162109375, 22.470703125, 25.8251953125, 29.1796875, 32.5341796875, 35.888671875, 39.2431640625, 42.59765625, 45.9521484375, 49.306640625, 52.6611328125, 56.015625, 59.3701171875, 62.724609375, 66.0791015625, 69.43359375, 72.7880859375, 76.142578125, 79.4970703125, 82.8515625, 86.2060546875, 89.560546875, 92.9150390625, 96.26953125, 99.6240234375, 102.978515625, 106.3330078125, 109.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 9.0, 15.0, 26.0, 49.0, 139.0, 553.0, 2870.0, 263.0, 68.0, 32.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.90625, -59.986328125, -58.06640625, -56.146484375, -54.2265625, -52.306640625, -50.38671875, -48.466796875, -46.546875, -44.626953125, -42.70703125, -40.787109375, -38.8671875, -36.947265625, -35.02734375, -33.107421875, -31.1875, -29.267578125, -27.34765625, -25.427734375, -23.5078125, -21.587890625, -19.66796875, -17.748046875, -15.828125, -13.908203125, -11.98828125, -10.068359375, -8.1484375, -6.228515625, -4.30859375, -2.388671875, -0.46875, 1.451171875, 3.37109375, 5.291015625, 7.2109375, 9.130859375, 11.05078125, 12.970703125, 14.890625, 16.810546875, 18.73046875, 20.650390625, 22.5703125, 24.490234375, 26.41015625, 28.330078125, 30.25, 32.169921875, 34.08984375, 36.009765625, 37.9296875, 39.849609375, 41.76953125, 43.689453125, 45.609375, 47.529296875, 49.44921875, 51.369140625, 53.2890625, 55.208984375, 57.12890625, 59.048828125, 60.96875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 34.0, 33.0, 53.0, 68.0, 108.0, 120.0, 160.0, 122.0, 75.0, 53.0, 40.0, 22.0, 15.0, 21.0, 6.0, 8.0, 9.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.16546630859375, -134.84486389160156, -128.52427673339844, -122.20367431640625, -115.8830795288086, -109.56248474121094, -103.24188232421875, -96.9212875366211, -90.60069274902344, -84.28009796142578, -77.95950317382812, -71.63890075683594, -65.31830596923828, -58.997711181640625, -52.6771125793457, -46.35651397705078, -40.035919189453125, -33.71532440185547, -27.394725799560547, -21.074129104614258, -14.753532409667969, -8.43293571472168, -2.1123390197753906, 4.208259582519531, 10.528854370117188, 16.849451065063477, 23.170047760009766, 29.490644454956055, 35.811241149902344, 42.1318359375, 48.45243453979492, 54.773033142089844, 61.0936279296875, 67.41422271728516, 73.73481750488281, 80.055419921875, 86.37601470947266, 92.69660949707031, 99.0172119140625, 105.33780670166016, 111.65840148925781, 117.97899627685547, 124.29959106445312, 130.6201934814453, 136.9407958984375, 143.26138305664062, 149.5819854736328, 155.902587890625, 162.22317504882812, 168.5437774658203, 174.86436462402344, 181.18496704101562, 187.50555419921875, 193.82615661621094, 200.14675903320312, 206.46734619140625, 212.78794860839844, 219.10855102539062, 225.42913818359375, 231.74974060058594, 238.07034301757812, 244.39093017578125, 250.71153259277344, 257.0321350097656, 263.35272216796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 5.0, 18.0, 13.0, 13.0, 19.0, 24.0, 19.0, 27.0, 21.0, 36.0, 30.0, 21.0, 37.0, 36.0, 41.0, 37.0, 34.0, 43.0, 49.0, 41.0, 33.0, 44.0, 43.0, 34.0, 35.0, 42.0, 14.0, 20.0, 28.0, 25.0, 22.0, 14.0, 7.0, 9.0, 10.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-112.75352478027344, -109.40979766845703, -106.06607055664062, -102.72233581542969, -99.37860870361328, -96.03488159179688, -92.69115447998047, -89.34742736816406, -86.00369262695312, -82.65996551513672, -79.31623840332031, -75.97250366210938, -72.62877655029297, -69.28504943847656, -65.94132232666016, -62.597591400146484, -59.25386428833008, -55.91013717651367, -52.56640625, -49.222679138183594, -45.87894821166992, -42.535221099853516, -39.191490173339844, -35.84776306152344, -32.50403594970703, -29.160306930541992, -25.816577911376953, -22.472850799560547, -19.129119873046875, -15.785392761230469, -12.44166374206543, -9.09793472290039, -5.754203796386719, -2.410475015640259, 0.9332537651062012, 4.276982307434082, 7.620711326599121, 10.964439392089844, 14.308168411254883, 17.651897430419922, 20.99562644958496, 24.33935546875, 27.68308448791504, 31.026813507080078, 34.370540618896484, 37.714271545410156, 41.05799865722656, 44.40172576904297, 47.74545669555664, 51.08918380737305, 54.43291473388672, 57.776641845703125, 61.1203727722168, 64.46409606933594, 67.80783081054688, 71.15155792236328, 74.49528503417969, 77.8390121459961, 81.1827392578125, 84.52647399902344, 87.87020111083984, 91.21392822265625, 94.55765533447266, 97.90138244628906, 101.2451171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 21.0, 26.0, 33.0, 42.0, 53.0, 68.0, 125.0, 172.0, 234.0, 355.0, 505.0, 739.0, 1173.0, 1824.0, 3011.0, 5414.0, 10012.0, 20681.0, 47120.0, 127742.0, 426942.0, 256452.0, 79960.0, 32147.0, 15191.0, 7546.0, 4119.0, 2426.0, 1442.0, 937.0, 609.0, 428.0, 262.0, 192.0, 134.0, 104.0, 80.0, 63.0, 35.0, 26.0, 14.0, 18.0, 9.0, 11.0, 9.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-44.8125, -43.40234375, -41.9921875, -40.58203125, -39.171875, -37.76171875, -36.3515625, -34.94140625, -33.53125, -32.12109375, -30.7109375, -29.30078125, -27.890625, -26.48046875, -25.0703125, -23.66015625, -22.25, -20.83984375, -19.4296875, -18.01953125, -16.609375, -15.19921875, -13.7890625, -12.37890625, -10.96875, -9.55859375, -8.1484375, -6.73828125, -5.328125, -3.91796875, -2.5078125, -1.09765625, 0.3125, 1.72265625, 3.1328125, 4.54296875, 5.953125, 7.36328125, 8.7734375, 10.18359375, 11.59375, 13.00390625, 14.4140625, 15.82421875, 17.234375, 18.64453125, 20.0546875, 21.46484375, 22.875, 24.28515625, 25.6953125, 27.10546875, 28.515625, 29.92578125, 31.3359375, 32.74609375, 34.15625, 35.56640625, 36.9765625, 38.38671875, 39.796875, 41.20703125, 42.6171875, 44.02734375, 45.4375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 6.0, 13.0, 17.0, 15.0, 18.0, 25.0, 31.0, 23.0, 29.0, 29.0, 43.0, 35.0, 44.0, 43.0, 46.0, 44.0, 49.0, 48.0, 41.0, 51.0, 35.0, 28.0, 33.0, 39.0, 26.0, 29.0, 19.0, 16.0, 24.0, 13.0, 12.0, 12.0, 9.0, 6.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-11.2734375, -10.94287109375, -10.6123046875, -10.28173828125, -9.951171875, -9.62060546875, -9.2900390625, -8.95947265625, -8.62890625, -8.29833984375, -7.9677734375, -7.63720703125, -7.306640625, -6.97607421875, -6.6455078125, -6.31494140625, -5.984375, -5.65380859375, -5.3232421875, -4.99267578125, -4.662109375, -4.33154296875, -4.0009765625, -3.67041015625, -3.33984375, -3.00927734375, -2.6787109375, -2.34814453125, -2.017578125, -1.68701171875, -1.3564453125, -1.02587890625, -0.6953125, -0.36474609375, -0.0341796875, 0.29638671875, 0.626953125, 0.95751953125, 1.2880859375, 1.61865234375, 1.94921875, 2.27978515625, 2.6103515625, 2.94091796875, 3.271484375, 3.60205078125, 3.9326171875, 4.26318359375, 4.59375, 4.92431640625, 5.2548828125, 5.58544921875, 5.916015625, 6.24658203125, 6.5771484375, 6.90771484375, 7.23828125, 7.56884765625, 7.8994140625, 8.22998046875, 8.560546875, 8.89111328125, 9.2216796875, 9.55224609375, 9.8828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 15.0, 21.0, 28.0, 47.0, 79.0, 131.0, 243.0, 387.0, 662.0, 1286.0, 2535.0, 5259.0, 13111.0, 42051.0, 224656.0, 618690.0, 98678.0, 24367.0, 8476.0, 3707.0, 1805.0, 987.0, 531.0, 293.0, 170.0, 121.0, 76.0, 49.0, 22.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -64.56005859375, -62.6201171875, -60.68017578125, -58.740234375, -56.80029296875, -54.8603515625, -52.92041015625, -50.98046875, -49.04052734375, -47.1005859375, -45.16064453125, -43.220703125, -41.28076171875, -39.3408203125, -37.40087890625, -35.4609375, -33.52099609375, -31.5810546875, -29.64111328125, -27.701171875, -25.76123046875, -23.8212890625, -21.88134765625, -19.94140625, -18.00146484375, -16.0615234375, -14.12158203125, -12.181640625, -10.24169921875, -8.3017578125, -6.36181640625, -4.421875, -2.48193359375, -0.5419921875, 1.39794921875, 3.337890625, 5.27783203125, 7.2177734375, 9.15771484375, 11.09765625, 13.03759765625, 14.9775390625, 16.91748046875, 18.857421875, 20.79736328125, 22.7373046875, 24.67724609375, 26.6171875, 28.55712890625, 30.4970703125, 32.43701171875, 34.376953125, 36.31689453125, 38.2568359375, 40.19677734375, 42.13671875, 44.07666015625, 46.0166015625, 47.95654296875, 49.896484375, 51.83642578125, 53.7763671875, 55.71630859375, 57.65625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 6.0, 11.0, 12.0, 9.0, 19.0, 19.0, 21.0, 27.0, 30.0, 32.0, 42.0, 42.0, 56.0, 53.0, 45.0, 68.0, 59.0, 42.0, 46.0, 47.0, 44.0, 39.0, 39.0, 27.0, 24.0, 24.0, 20.0, 18.0, 13.0, 13.0, 7.0, 7.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.09375, -50.39453125, -48.6953125, -46.99609375, -45.296875, -43.59765625, -41.8984375, -40.19921875, -38.5, -36.80078125, -35.1015625, -33.40234375, -31.703125, -30.00390625, -28.3046875, -26.60546875, -24.90625, -23.20703125, -21.5078125, -19.80859375, -18.109375, -16.41015625, -14.7109375, -13.01171875, -11.3125, -9.61328125, -7.9140625, -6.21484375, -4.515625, -2.81640625, -1.1171875, 0.58203125, 2.28125, 3.98046875, 5.6796875, 7.37890625, 9.078125, 10.77734375, 12.4765625, 14.17578125, 15.875, 17.57421875, 19.2734375, 20.97265625, 22.671875, 24.37109375, 26.0703125, 27.76953125, 29.46875, 31.16796875, 32.8671875, 34.56640625, 36.265625, 37.96484375, 39.6640625, 41.36328125, 43.0625, 44.76171875, 46.4609375, 48.16015625, 49.859375, 51.55859375, 53.2578125, 54.95703125, 56.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 7.0, 9.0, 22.0, 23.0, 38.0, 37.0, 85.0, 135.0, 221.0, 368.0, 607.0, 1275.0, 2579.0, 5967.0, 16613.0, 65817.0, 520756.0, 360916.0, 49515.0, 13646.0, 5040.0, 2290.0, 1118.0, 594.0, 346.0, 203.0, 101.0, 71.0, 49.0, 37.0, 26.0, 10.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.53125, -24.7783203125, -24.025390625, -23.2724609375, -22.51953125, -21.7666015625, -21.013671875, -20.2607421875, -19.5078125, -18.7548828125, -18.001953125, -17.2490234375, -16.49609375, -15.7431640625, -14.990234375, -14.2373046875, -13.484375, -12.7314453125, -11.978515625, -11.2255859375, -10.47265625, -9.7197265625, -8.966796875, -8.2138671875, -7.4609375, -6.7080078125, -5.955078125, -5.2021484375, -4.44921875, -3.6962890625, -2.943359375, -2.1904296875, -1.4375, -0.6845703125, 0.068359375, 0.8212890625, 1.57421875, 2.3271484375, 3.080078125, 3.8330078125, 4.5859375, 5.3388671875, 6.091796875, 6.8447265625, 7.59765625, 8.3505859375, 9.103515625, 9.8564453125, 10.609375, 11.3623046875, 12.115234375, 12.8681640625, 13.62109375, 14.3740234375, 15.126953125, 15.8798828125, 16.6328125, 17.3857421875, 18.138671875, 18.8916015625, 19.64453125, 20.3974609375, 21.150390625, 21.9033203125, 22.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 18.0, 19.0, 40.0, 91.0, 280.0, 274.0, 121.0, 57.0, 33.0, 16.0, 16.0, 4.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00972747802734375, -0.009354829788208008, -0.008982181549072266, -0.008609533309936523, -0.008236885070800781, -0.007864236831665039, -0.007491588592529297, -0.007118940353393555, -0.0067462921142578125, -0.00637364387512207, -0.006000995635986328, -0.005628347396850586, -0.005255699157714844, -0.0048830509185791016, -0.004510402679443359, -0.004137754440307617, -0.003765106201171875, -0.003392457962036133, -0.0030198097229003906, -0.0026471614837646484, -0.0022745132446289062, -0.001901865005493164, -0.0015292167663574219, -0.0011565685272216797, -0.0007839202880859375, -0.0004112720489501953, -3.8623809814453125e-05, 0.00033402442932128906, 0.0007066726684570312, 0.0010793209075927734, 0.0014519691467285156, 0.0018246173858642578, 0.002197265625, 0.002569913864135742, 0.0029425621032714844, 0.0033152103424072266, 0.0036878585815429688, 0.004060506820678711, 0.004433155059814453, 0.004805803298950195, 0.0051784515380859375, 0.00555109977722168, 0.005923748016357422, 0.006296396255493164, 0.006669044494628906, 0.0070416927337646484, 0.007414340972900391, 0.007786989212036133, 0.008159637451171875, 0.008532285690307617, 0.00890493392944336, 0.009277582168579102, 0.009650230407714844, 0.010022878646850586, 0.010395526885986328, 0.01076817512512207, 0.011140823364257812, 0.011513471603393555, 0.011886119842529297, 0.012258768081665039, 0.012631416320800781, 0.013004064559936523, 0.013376712799072266, 0.013749361038208008, 0.01412200927734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 11.0, 14.0, 28.0, 34.0, 52.0, 82.0, 136.0, 173.0, 303.0, 423.0, 689.0, 1074.0, 2022.0, 3475.0, 6974.0, 16102.0, 47111.0, 206575.0, 550518.0, 148252.0, 37211.0, 13483.0, 6035.0, 3118.0, 1740.0, 1033.0, 654.0, 397.0, 241.0, 165.0, 127.0, 89.0, 49.0, 37.0, 31.0, 14.0, 13.0, 8.0, 6.0, 8.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.9375, -18.35302734375, -17.7685546875, -17.18408203125, -16.599609375, -16.01513671875, -15.4306640625, -14.84619140625, -14.26171875, -13.67724609375, -13.0927734375, -12.50830078125, -11.923828125, -11.33935546875, -10.7548828125, -10.17041015625, -9.5859375, -9.00146484375, -8.4169921875, -7.83251953125, -7.248046875, -6.66357421875, -6.0791015625, -5.49462890625, -4.91015625, -4.32568359375, -3.7412109375, -3.15673828125, -2.572265625, -1.98779296875, -1.4033203125, -0.81884765625, -0.234375, 0.35009765625, 0.9345703125, 1.51904296875, 2.103515625, 2.68798828125, 3.2724609375, 3.85693359375, 4.44140625, 5.02587890625, 5.6103515625, 6.19482421875, 6.779296875, 7.36376953125, 7.9482421875, 8.53271484375, 9.1171875, 9.70166015625, 10.2861328125, 10.87060546875, 11.455078125, 12.03955078125, 12.6240234375, 13.20849609375, 13.79296875, 14.37744140625, 14.9619140625, 15.54638671875, 16.130859375, 16.71533203125, 17.2998046875, 17.88427734375, 18.46875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 7.0, 11.0, 17.0, 12.0, 24.0, 28.0, 32.0, 41.0, 75.0, 60.0, 83.0, 110.0, 92.0, 91.0, 66.0, 55.0, 33.0, 27.0, 21.0, 16.0, 13.0, 15.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.890625, -16.352783203125, -15.81494140625, -15.277099609375, -14.7392578125, -14.201416015625, -13.66357421875, -13.125732421875, -12.587890625, -12.050048828125, -11.51220703125, -10.974365234375, -10.4365234375, -9.898681640625, -9.36083984375, -8.822998046875, -8.28515625, -7.747314453125, -7.20947265625, -6.671630859375, -6.1337890625, -5.595947265625, -5.05810546875, -4.520263671875, -3.982421875, -3.444580078125, -2.90673828125, -2.368896484375, -1.8310546875, -1.293212890625, -0.75537109375, -0.217529296875, 0.3203125, 0.858154296875, 1.39599609375, 1.933837890625, 2.4716796875, 3.009521484375, 3.54736328125, 4.085205078125, 4.623046875, 5.160888671875, 5.69873046875, 6.236572265625, 6.7744140625, 7.312255859375, 7.85009765625, 8.387939453125, 8.92578125, 9.463623046875, 10.00146484375, 10.539306640625, 11.0771484375, 11.614990234375, 12.15283203125, 12.690673828125, 13.228515625, 13.766357421875, 14.30419921875, 14.842041015625, 15.3798828125, 15.917724609375, 16.45556640625, 16.993408203125, 17.53125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 19.0, 18.0, 32.0, 62.0, 82.0, 160.0, 174.0, 143.0, 119.0, 72.0, 47.0, 33.0, 22.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.1904907226562, -577.7869262695312, -562.38330078125, -546.979736328125, -531.5761108398438, -516.1725463867188, -500.7689514160156, -485.3653564453125, -469.9617614746094, -454.55816650390625, -439.1545715332031, -423.7509765625, -408.347412109375, -392.9438171386719, -377.54022216796875, -362.1366271972656, -346.7330322265625, -331.3294372558594, -315.92584228515625, -300.52227783203125, -285.1186828613281, -269.715087890625, -254.31149291992188, -238.90789794921875, -223.50433349609375, -208.10073852539062, -192.69715881347656, -177.29356384277344, -161.8899688720703, -146.48638916015625, -131.08279418945312, -115.67919921875, -100.27560424804688, -84.87201690673828, -69.46842193603516, -54.06483459472656, -38.6612434387207, -23.257652282714844, -7.85406494140625, 7.549530029296875, 22.95311737060547, 38.35670852661133, 53.76029968261719, 69.16388702392578, 84.56747436523438, 99.9710693359375, 115.3746566772461, 130.77825927734375, 146.1818389892578, 161.58543395996094, 176.989013671875, 192.39260864257812, 207.79620361328125, 223.19979858398438, 238.60337829589844, 254.00697326660156, 269.4105529785156, 284.81414794921875, 300.2177429199219, 315.621337890625, 331.02490234375, 346.4284973144531, 361.83209228515625, 377.2356872558594, 392.6392822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 9.0, 8.0, 11.0, 17.0, 17.0, 19.0, 17.0, 38.0, 20.0, 20.0, 27.0, 35.0, 43.0, 48.0, 51.0, 44.0, 38.0, 42.0, 41.0, 51.0, 48.0, 47.0, 44.0, 33.0, 43.0, 28.0, 20.0, 19.0, 21.0, 10.0, 19.0, 9.0, 12.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-284.66607666015625, -276.7821350097656, -268.898193359375, -261.0142517089844, -253.1302947998047, -245.24635314941406, -237.36241149902344, -229.4784698486328, -221.59451293945312, -213.7105712890625, -205.82662963867188, -197.94268798828125, -190.05873107910156, -182.17478942871094, -174.2908477783203, -166.4069061279297, -158.52296447753906, -150.63902282714844, -142.7550811767578, -134.87112426757812, -126.9871826171875, -119.10324096679688, -111.21929931640625, -103.33535766601562, -95.45140838623047, -87.56746673583984, -79.68351745605469, -71.79957580566406, -63.91563034057617, -56.03168487548828, -48.147743225097656, -40.263797760009766, -32.379852294921875, -24.495906829833984, -16.611963272094727, -8.728019714355469, -0.8440742492675781, 7.0398712158203125, 14.923812866210938, 22.807758331298828, 30.69170379638672, 38.57564926147461, 46.4595947265625, 54.343536376953125, 62.227481842041016, 70.1114273071289, 77.99536895751953, 85.87931823730469, 93.76325988769531, 101.64720153808594, 109.5311508178711, 117.41509246826172, 125.29904174804688, 133.1829833984375, 141.06692504882812, 148.95086669921875, 156.83480834960938, 164.71875, 172.60269165039062, 180.48663330078125, 188.37059020996094, 196.25453186035156, 204.1384735107422, 212.0224151611328, 219.9063720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 7.0, 9.0, 8.0, 15.0, 23.0, 22.0, 35.0, 45.0, 52.0, 85.0, 110.0, 134.0, 202.0, 229.0, 343.0, 510.0, 735.0, 1082.0, 1665.0, 2543.0, 4464.0, 8500.0, 18487.0, 48152.0, 238041.0, 3690454.0, 115384.0, 33001.0, 13288.0, 6541.0, 3623.0, 2087.0, 1295.0, 946.0, 593.0, 393.0, 315.0, 226.0, 171.0, 101.0, 80.0, 69.0, 47.0, 46.0, 29.0, 19.0, 19.0, 13.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-66.375, -64.3212890625, -62.267578125, -60.2138671875, -58.16015625, -56.1064453125, -54.052734375, -51.9990234375, -49.9453125, -47.8916015625, -45.837890625, -43.7841796875, -41.73046875, -39.6767578125, -37.623046875, -35.5693359375, -33.515625, -31.4619140625, -29.408203125, -27.3544921875, -25.30078125, -23.2470703125, -21.193359375, -19.1396484375, -17.0859375, -15.0322265625, -12.978515625, -10.9248046875, -8.87109375, -6.8173828125, -4.763671875, -2.7099609375, -0.65625, 1.3974609375, 3.451171875, 5.5048828125, 7.55859375, 9.6123046875, 11.666015625, 13.7197265625, 15.7734375, 17.8271484375, 19.880859375, 21.9345703125, 23.98828125, 26.0419921875, 28.095703125, 30.1494140625, 32.203125, 34.2568359375, 36.310546875, 38.3642578125, 40.41796875, 42.4716796875, 44.525390625, 46.5791015625, 48.6328125, 50.6865234375, 52.740234375, 54.7939453125, 56.84765625, 58.9013671875, 60.955078125, 63.0087890625, 65.0625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 3.0, 8.0, 10.0, 14.0, 16.0, 15.0, 17.0, 23.0, 34.0, 40.0, 28.0, 27.0, 38.0, 44.0, 40.0, 50.0, 40.0, 48.0, 42.0, 49.0, 44.0, 41.0, 36.0, 40.0, 32.0, 25.0, 32.0, 26.0, 15.0, 25.0, 20.0, 14.0, 10.0, 8.0, 8.0, 13.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.5899658203125, -9.258056640625, -8.9261474609375, -8.59423828125, -8.2623291015625, -7.930419921875, -7.5985107421875, -7.2666015625, -6.9346923828125, -6.602783203125, -6.2708740234375, -5.93896484375, -5.6070556640625, -5.275146484375, -4.9432373046875, -4.611328125, -4.2794189453125, -3.947509765625, -3.6156005859375, -3.28369140625, -2.9517822265625, -2.619873046875, -2.2879638671875, -1.9560546875, -1.6241455078125, -1.292236328125, -0.9603271484375, -0.62841796875, -0.2965087890625, 0.035400390625, 0.3673095703125, 0.69921875, 1.0311279296875, 1.363037109375, 1.6949462890625, 2.02685546875, 2.3587646484375, 2.690673828125, 3.0225830078125, 3.3544921875, 3.6864013671875, 4.018310546875, 4.3502197265625, 4.68212890625, 5.0140380859375, 5.345947265625, 5.6778564453125, 6.009765625, 6.3416748046875, 6.673583984375, 7.0054931640625, 7.33740234375, 7.6693115234375, 8.001220703125, 8.3331298828125, 8.6650390625, 8.9969482421875, 9.328857421875, 9.6607666015625, 9.99267578125, 10.3245849609375, 10.656494140625, 10.9884033203125, 11.3203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 8.0, 15.0, 14.0, 25.0, 21.0, 27.0, 34.0, 36.0, 59.0, 70.0, 99.0, 127.0, 214.0, 348.0, 589.0, 1016.0, 2219.0, 6018.0, 26854.0, 1659761.0, 2458543.0, 27167.0, 6051.0, 2233.0, 1064.0, 569.0, 329.0, 180.0, 142.0, 105.0, 77.0, 59.0, 41.0, 34.0, 26.0, 20.0, 21.0, 11.0, 7.0, 9.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-200.375, -194.650390625, -188.92578125, -183.201171875, -177.4765625, -171.751953125, -166.02734375, -160.302734375, -154.578125, -148.853515625, -143.12890625, -137.404296875, -131.6796875, -125.955078125, -120.23046875, -114.505859375, -108.78125, -103.056640625, -97.33203125, -91.607421875, -85.8828125, -80.158203125, -74.43359375, -68.708984375, -62.984375, -57.259765625, -51.53515625, -45.810546875, -40.0859375, -34.361328125, -28.63671875, -22.912109375, -17.1875, -11.462890625, -5.73828125, -0.013671875, 5.7109375, 11.435546875, 17.16015625, 22.884765625, 28.609375, 34.333984375, 40.05859375, 45.783203125, 51.5078125, 57.232421875, 62.95703125, 68.681640625, 74.40625, 80.130859375, 85.85546875, 91.580078125, 97.3046875, 103.029296875, 108.75390625, 114.478515625, 120.203125, 125.927734375, 131.65234375, 137.376953125, 143.1015625, 148.826171875, 154.55078125, 160.275390625, 166.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 16.0, 36.0, 108.0, 500.0, 3073.0, 213.0, 65.0, 22.0, 11.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.375, -126.8740234375, -123.373046875, -119.8720703125, -116.37109375, -112.8701171875, -109.369140625, -105.8681640625, -102.3671875, -98.8662109375, -95.365234375, -91.8642578125, -88.36328125, -84.8623046875, -81.361328125, -77.8603515625, -74.359375, -70.8583984375, -67.357421875, -63.8564453125, -60.35546875, -56.8544921875, -53.353515625, -49.8525390625, -46.3515625, -42.8505859375, -39.349609375, -35.8486328125, -32.34765625, -28.8466796875, -25.345703125, -21.8447265625, -18.34375, -14.8427734375, -11.341796875, -7.8408203125, -4.33984375, -0.8388671875, 2.662109375, 6.1630859375, 9.6640625, 13.1650390625, 16.666015625, 20.1669921875, 23.66796875, 27.1689453125, 30.669921875, 34.1708984375, 37.671875, 41.1728515625, 44.673828125, 48.1748046875, 51.67578125, 55.1767578125, 58.677734375, 62.1787109375, 65.6796875, 69.1806640625, 72.681640625, 76.1826171875, 79.68359375, 83.1845703125, 86.685546875, 90.1865234375, 93.6875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 29.0, 55.0, 49.0, 116.0, 150.0, 180.0, 135.0, 83.0, 64.0, 28.0, 27.0, 18.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-574.7474365234375, -563.2962646484375, -551.8450927734375, -540.3939819335938, -528.9428100585938, -517.4916381835938, -506.04046630859375, -494.58929443359375, -483.1381530761719, -471.6869812011719, -460.23583984375, -448.78466796875, -437.33349609375, -425.8823547363281, -414.4311828613281, -402.98004150390625, -391.52886962890625, -380.07769775390625, -368.6265563964844, -357.1753845214844, -345.7242431640625, -334.2730712890625, -322.8218994140625, -311.3707275390625, -299.9195861816406, -288.4684143066406, -277.01727294921875, -265.56610107421875, -254.1149444580078, -242.66378784179688, -231.21261596679688, -219.76145935058594, -208.310302734375, -196.85914611816406, -185.40798950195312, -173.95681762695312, -162.5056610107422, -151.05450439453125, -139.60333251953125, -128.1521759033203, -116.70101928710938, -105.24986267089844, -93.79869842529297, -82.3475341796875, -70.89637756347656, -59.44521713256836, -47.994056701660156, -36.54289245605469, -25.09173583984375, -13.640575408935547, -2.1894149780273438, 9.26174545288086, 20.712905883789062, 32.164066314697266, 43.61522674560547, 55.06639099121094, 66.51754760742188, 77.96870422363281, 89.41986846923828, 100.87103271484375, 112.32218933105469, 123.77334594726562, 135.22451782226562, 146.67567443847656, 158.1268310546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0, 7.0, 10.0, 5.0, 7.0, 10.0, 10.0, 16.0, 10.0, 16.0, 17.0, 22.0, 26.0, 25.0, 25.0, 31.0, 38.0, 27.0, 30.0, 43.0, 52.0, 34.0, 41.0, 40.0, 52.0, 39.0, 37.0, 43.0, 53.0, 24.0, 24.0, 33.0, 28.0, 15.0, 18.0, 17.0, 13.0, 9.0, 13.0, 5.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-137.32858276367188, -132.5045166015625, -127.68045806884766, -122.85639190673828, -118.03233337402344, -113.20826721191406, -108.38420104980469, -103.56013488769531, -98.73607635498047, -93.9120101928711, -89.08795166015625, -84.26388549804688, -79.4398193359375, -74.61576080322266, -69.79169464111328, -64.96763610839844, -60.14356994628906, -55.31950759887695, -50.495445251464844, -45.67137908935547, -40.84731674194336, -36.02325439453125, -31.199190139770508, -26.375125885009766, -21.551063537597656, -16.727001190185547, -11.902936935424805, -7.078873634338379, -2.254810333251953, 2.5692520141601562, 7.393316268920898, 12.21738052368164, 17.04144287109375, 21.86550521850586, 26.6895694732666, 31.513633728027344, 36.33769607543945, 41.16175842285156, 45.98582458496094, 50.80988693237305, 55.633949279785156, 60.458011627197266, 65.28207397460938, 70.10614013671875, 74.93020629882812, 79.75426483154297, 84.57833099365234, 89.40238952636719, 94.22645568847656, 99.05052185058594, 103.87458038330078, 108.69864654541016, 113.522705078125, 118.34677124023438, 123.17083740234375, 127.99490356445312, 132.8189697265625, 137.64303588867188, 142.46710205078125, 147.29115295410156, 152.11521911621094, 156.9392852783203, 161.7633514404297, 166.58741760253906, 171.41146850585938]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 15.0, 13.0, 20.0, 20.0, 30.0, 47.0, 57.0, 77.0, 109.0, 143.0, 200.0, 260.0, 384.0, 548.0, 902.0, 1465.0, 2783.0, 5954.0, 14397.0, 44557.0, 181452.0, 533318.0, 187892.0, 45758.0, 14840.0, 6142.0, 2835.0, 1556.0, 848.0, 526.0, 372.0, 281.0, 185.0, 135.0, 93.0, 79.0, 63.0, 43.0, 27.0, 27.0, 18.0, 13.0, 14.0, 9.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -62.5673828125, -60.447265625, -58.3271484375, -56.20703125, -54.0869140625, -51.966796875, -49.8466796875, -47.7265625, -45.6064453125, -43.486328125, -41.3662109375, -39.24609375, -37.1259765625, -35.005859375, -32.8857421875, -30.765625, -28.6455078125, -26.525390625, -24.4052734375, -22.28515625, -20.1650390625, -18.044921875, -15.9248046875, -13.8046875, -11.6845703125, -9.564453125, -7.4443359375, -5.32421875, -3.2041015625, -1.083984375, 1.0361328125, 3.15625, 5.2763671875, 7.396484375, 9.5166015625, 11.63671875, 13.7568359375, 15.876953125, 17.9970703125, 20.1171875, 22.2373046875, 24.357421875, 26.4775390625, 28.59765625, 30.7177734375, 32.837890625, 34.9580078125, 37.078125, 39.1982421875, 41.318359375, 43.4384765625, 45.55859375, 47.6787109375, 49.798828125, 51.9189453125, 54.0390625, 56.1591796875, 58.279296875, 60.3994140625, 62.51953125, 64.6396484375, 66.759765625, 68.8798828125, 71.0]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 11.0, 18.0, 18.0, 25.0, 26.0, 25.0, 31.0, 37.0, 33.0, 36.0, 49.0, 46.0, 43.0, 59.0, 46.0, 40.0, 48.0, 46.0, 41.0, 29.0, 28.0, 36.0, 19.0, 27.0, 24.0, 19.0, 26.0, 10.0, 14.0, 7.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.734375, -13.307373046875, -12.88037109375, -12.453369140625, -12.0263671875, -11.599365234375, -11.17236328125, -10.745361328125, -10.318359375, -9.891357421875, -9.46435546875, -9.037353515625, -8.6103515625, -8.183349609375, -7.75634765625, -7.329345703125, -6.90234375, -6.475341796875, -6.04833984375, -5.621337890625, -5.1943359375, -4.767333984375, -4.34033203125, -3.913330078125, -3.486328125, -3.059326171875, -2.63232421875, -2.205322265625, -1.7783203125, -1.351318359375, -0.92431640625, -0.497314453125, -0.0703125, 0.356689453125, 0.78369140625, 1.210693359375, 1.6376953125, 2.064697265625, 2.49169921875, 2.918701171875, 3.345703125, 3.772705078125, 4.19970703125, 4.626708984375, 5.0537109375, 5.480712890625, 5.90771484375, 6.334716796875, 6.76171875, 7.188720703125, 7.61572265625, 8.042724609375, 8.4697265625, 8.896728515625, 9.32373046875, 9.750732421875, 10.177734375, 10.604736328125, 11.03173828125, 11.458740234375, 11.8857421875, 12.312744140625, 12.73974609375, 13.166748046875, 13.59375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 12.0, 8.0, 15.0, 13.0, 28.0, 30.0, 30.0, 52.0, 74.0, 82.0, 120.0, 188.0, 248.0, 320.0, 471.0, 752.0, 1245.0, 2312.0, 4969.0, 17254.0, 133697.0, 756982.0, 104769.0, 14629.0, 4547.0, 2116.0, 1174.0, 732.0, 487.0, 333.0, 229.0, 148.0, 109.0, 101.0, 71.0, 53.0, 42.0, 22.0, 22.0, 12.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-117.75, -114.33203125, -110.9140625, -107.49609375, -104.078125, -100.66015625, -97.2421875, -93.82421875, -90.40625, -86.98828125, -83.5703125, -80.15234375, -76.734375, -73.31640625, -69.8984375, -66.48046875, -63.0625, -59.64453125, -56.2265625, -52.80859375, -49.390625, -45.97265625, -42.5546875, -39.13671875, -35.71875, -32.30078125, -28.8828125, -25.46484375, -22.046875, -18.62890625, -15.2109375, -11.79296875, -8.375, -4.95703125, -1.5390625, 1.87890625, 5.296875, 8.71484375, 12.1328125, 15.55078125, 18.96875, 22.38671875, 25.8046875, 29.22265625, 32.640625, 36.05859375, 39.4765625, 42.89453125, 46.3125, 49.73046875, 53.1484375, 56.56640625, 59.984375, 63.40234375, 66.8203125, 70.23828125, 73.65625, 77.07421875, 80.4921875, 83.91015625, 87.328125, 90.74609375, 94.1640625, 97.58203125, 101.0]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 7.0, 11.0, 18.0, 20.0, 32.0, 51.0, 61.0, 52.0, 79.0, 83.0, 89.0, 87.0, 80.0, 54.0, 62.0, 56.0, 39.0, 30.0, 27.0, 21.0, 7.0, 9.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.1875, -105.3994140625, -101.611328125, -97.8232421875, -94.03515625, -90.2470703125, -86.458984375, -82.6708984375, -78.8828125, -75.0947265625, -71.306640625, -67.5185546875, -63.73046875, -59.9423828125, -56.154296875, -52.3662109375, -48.578125, -44.7900390625, -41.001953125, -37.2138671875, -33.42578125, -29.6376953125, -25.849609375, -22.0615234375, -18.2734375, -14.4853515625, -10.697265625, -6.9091796875, -3.12109375, 0.6669921875, 4.455078125, 8.2431640625, 12.03125, 15.8193359375, 19.607421875, 23.3955078125, 27.18359375, 30.9716796875, 34.759765625, 38.5478515625, 42.3359375, 46.1240234375, 49.912109375, 53.7001953125, 57.48828125, 61.2763671875, 65.064453125, 68.8525390625, 72.640625, 76.4287109375, 80.216796875, 84.0048828125, 87.79296875, 91.5810546875, 95.369140625, 99.1572265625, 102.9453125, 106.7333984375, 110.521484375, 114.3095703125, 118.09765625, 121.8857421875, 125.673828125, 129.4619140625, 133.25]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 2.0, 6.0, 18.0, 20.0, 28.0, 50.0, 64.0, 98.0, 111.0, 168.0, 224.0, 300.0, 457.0, 697.0, 1009.0, 1563.0, 2407.0, 4398.0, 13033.0, 260732.0, 729620.0, 20205.0, 5289.0, 2718.0, 1759.0, 1078.0, 746.0, 512.0, 365.0, 266.0, 170.0, 119.0, 82.0, 55.0, 49.0, 30.0, 29.0, 18.0, 18.0, 9.0, 10.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.75, -81.05859375, -78.3671875, -75.67578125, -72.984375, -70.29296875, -67.6015625, -64.91015625, -62.21875, -59.52734375, -56.8359375, -54.14453125, -51.453125, -48.76171875, -46.0703125, -43.37890625, -40.6875, -37.99609375, -35.3046875, -32.61328125, -29.921875, -27.23046875, -24.5390625, -21.84765625, -19.15625, -16.46484375, -13.7734375, -11.08203125, -8.390625, -5.69921875, -3.0078125, -0.31640625, 2.375, 5.06640625, 7.7578125, 10.44921875, 13.140625, 15.83203125, 18.5234375, 21.21484375, 23.90625, 26.59765625, 29.2890625, 31.98046875, 34.671875, 37.36328125, 40.0546875, 42.74609375, 45.4375, 48.12890625, 50.8203125, 53.51171875, 56.203125, 58.89453125, 61.5859375, 64.27734375, 66.96875, 69.66015625, 72.3515625, 75.04296875, 77.734375, 80.42578125, 83.1171875, 85.80859375, 88.5]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 17.0, 76.0, 309.0, 448.0, 100.0, 21.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0355224609375, -0.03444957733154297, -0.03337669372558594, -0.032303810119628906, -0.031230926513671875, -0.030158042907714844, -0.029085159301757812, -0.02801227569580078, -0.02693939208984375, -0.02586650848388672, -0.024793624877929688, -0.023720741271972656, -0.022647857666015625, -0.021574974060058594, -0.020502090454101562, -0.01942920684814453, -0.0183563232421875, -0.01728343963623047, -0.016210556030273438, -0.015137672424316406, -0.014064788818359375, -0.012991905212402344, -0.011919021606445312, -0.010846138000488281, -0.00977325439453125, -0.008700370788574219, -0.0076274871826171875, -0.006554603576660156, -0.005481719970703125, -0.004408836364746094, -0.0033359527587890625, -0.0022630691528320312, -0.001190185546875, -0.00011730194091796875, 0.0009555816650390625, 0.0020284652709960938, 0.003101348876953125, 0.004174232482910156, 0.0052471160888671875, 0.006319999694824219, 0.00739288330078125, 0.008465766906738281, 0.009538650512695312, 0.010611534118652344, 0.011684417724609375, 0.012757301330566406, 0.013830184936523438, 0.014903068542480469, 0.0159759521484375, 0.01704883575439453, 0.018121719360351562, 0.019194602966308594, 0.020267486572265625, 0.021340370178222656, 0.022413253784179688, 0.02348613739013672, 0.02455902099609375, 0.02563190460205078, 0.026704788208007812, 0.027777671813964844, 0.028850555419921875, 0.029923439025878906, 0.030996322631835938, 0.03206920623779297, 0.03314208984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 23.0, 18.0, 23.0, 32.0, 63.0, 79.0, 137.0, 261.0, 443.0, 792.0, 1540.0, 2902.0, 6596.0, 39430.0, 929007.0, 53086.0, 7391.0, 3085.0, 1625.0, 861.0, 419.0, 283.0, 165.0, 88.0, 55.0, 45.0, 19.0, 14.0, 16.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.1875, -95.9404296875, -92.693359375, -89.4462890625, -86.19921875, -82.9521484375, -79.705078125, -76.4580078125, -73.2109375, -69.9638671875, -66.716796875, -63.4697265625, -60.22265625, -56.9755859375, -53.728515625, -50.4814453125, -47.234375, -43.9873046875, -40.740234375, -37.4931640625, -34.24609375, -30.9990234375, -27.751953125, -24.5048828125, -21.2578125, -18.0107421875, -14.763671875, -11.5166015625, -8.26953125, -5.0224609375, -1.775390625, 1.4716796875, 4.71875, 7.9658203125, 11.212890625, 14.4599609375, 17.70703125, 20.9541015625, 24.201171875, 27.4482421875, 30.6953125, 33.9423828125, 37.189453125, 40.4365234375, 43.68359375, 46.9306640625, 50.177734375, 53.4248046875, 56.671875, 59.9189453125, 63.166015625, 66.4130859375, 69.66015625, 72.9072265625, 76.154296875, 79.4013671875, 82.6484375, 85.8955078125, 89.142578125, 92.3896484375, 95.63671875, 98.8837890625, 102.130859375, 105.3779296875, 108.625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 6.0, 5.0, 19.0, 35.0, 60.0, 133.0, 267.0, 243.0, 98.0, 47.0, 27.0, 15.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.6875, -65.072265625, -62.45703125, -59.841796875, -57.2265625, -54.611328125, -51.99609375, -49.380859375, -46.765625, -44.150390625, -41.53515625, -38.919921875, -36.3046875, -33.689453125, -31.07421875, -28.458984375, -25.84375, -23.228515625, -20.61328125, -17.998046875, -15.3828125, -12.767578125, -10.15234375, -7.537109375, -4.921875, -2.306640625, 0.30859375, 2.923828125, 5.5390625, 8.154296875, 10.76953125, 13.384765625, 16.0, 18.615234375, 21.23046875, 23.845703125, 26.4609375, 29.076171875, 31.69140625, 34.306640625, 36.921875, 39.537109375, 42.15234375, 44.767578125, 47.3828125, 49.998046875, 52.61328125, 55.228515625, 57.84375, 60.458984375, 63.07421875, 65.689453125, 68.3046875, 70.919921875, 73.53515625, 76.150390625, 78.765625, 81.380859375, 83.99609375, 86.611328125, 89.2265625, 91.841796875, 94.45703125, 97.072265625, 99.6875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 5.0, 13.0, 9.0, 17.0, 18.0, 23.0, 30.0, 44.0, 65.0, 76.0, 80.0, 98.0, 89.0, 90.0, 88.0, 64.0, 48.0, 28.0, 19.0, 20.0, 17.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-592.8483276367188, -576.5643310546875, -560.2803955078125, -543.9963989257812, -527.7124633789062, -511.428466796875, -495.1445007324219, -478.86053466796875, -462.5765380859375, -446.2925720214844, -430.00860595703125, -413.724609375, -397.4406433105469, -381.15667724609375, -364.8727111816406, -348.5887451171875, -332.3047790527344, -316.02081298828125, -299.7368469238281, -283.452880859375, -267.16888427734375, -250.88491821289062, -234.6009521484375, -218.31698608398438, -202.0330047607422, -185.74903869628906, -169.46505737304688, -153.18109130859375, -136.89712524414062, -120.61314392089844, -104.32917785644531, -88.04520416259766, -71.76119995117188, -55.47722625732422, -39.19325637817383, -22.909286499023438, -6.625312805175781, 9.658660888671875, 25.942626953125, 42.226600646972656, 58.51057434082031, 74.79454803466797, 91.07852172851562, 107.36248779296875, 123.6464614868164, 139.93043518066406, 156.2144012451172, 172.49838256835938, 188.7823486328125, 205.06631469726562, 221.3502960205078, 237.63426208496094, 253.91824340820312, 270.20220947265625, 286.4861755371094, 302.7701416015625, 319.05413818359375, 335.3381042480469, 351.6220703125, 367.90606689453125, 384.1900329589844, 400.4739990234375, 416.7579650878906, 433.04193115234375, 449.3258972167969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 5.0, 4.0, 7.0, 5.0, 13.0, 8.0, 8.0, 11.0, 15.0, 17.0, 25.0, 23.0, 27.0, 27.0, 29.0, 23.0, 35.0, 48.0, 27.0, 42.0, 48.0, 50.0, 37.0, 48.0, 32.0, 54.0, 38.0, 28.0, 30.0, 29.0, 17.0, 29.0, 24.0, 23.0, 9.0, 16.0, 15.0, 18.0, 11.0, 10.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-379.4832763671875, -368.2763671875, -357.0694274902344, -345.8625183105469, -334.6556091308594, -323.44866943359375, -312.24176025390625, -301.03485107421875, -289.82794189453125, -278.62103271484375, -267.4140930175781, -256.2071838378906, -245.00027465820312, -233.79335021972656, -222.58642578125, -211.3795166015625, -200.17257690429688, -188.9656524658203, -177.7587432861328, -166.55181884765625, -155.34490966796875, -144.1379852294922, -132.93106079101562, -121.7241439819336, -110.51722717285156, -99.31031036376953, -88.1033935546875, -76.89646911621094, -65.6895523071289, -54.482635498046875, -43.27571105957031, -32.06879425048828, -20.86187744140625, -9.654958724975586, 1.5519599914550781, 12.758880615234375, 23.965797424316406, 35.17271423339844, 46.379638671875, 57.58655548095703, 68.79347229003906, 80.0003890991211, 91.20730590820312, 102.41423034667969, 113.62114715576172, 124.82806396484375, 136.0349884033203, 147.24191284179688, 158.44882202148438, 169.65574645996094, 180.86265563964844, 192.069580078125, 203.2764892578125, 214.48341369628906, 225.69033813476562, 236.89724731445312, 248.1041717529297, 259.31109619140625, 270.51800537109375, 281.72491455078125, 292.9318542480469, 304.1387634277344, 315.345703125, 326.5526123046875, 337.759521484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 12.0, 19.0, 38.0, 46.0, 59.0, 76.0, 165.0, 201.0, 338.0, 578.0, 979.0, 1901.0, 4742.0, 22472.0, 4143452.0, 11966.0, 3424.0, 1537.0, 823.0, 519.0, 281.0, 185.0, 123.0, 87.0, 58.0, 41.0, 22.0, 19.0, 15.0, 10.0, 7.0, 13.0, 3.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-204.5, -198.71484375, -192.9296875, -187.14453125, -181.359375, -175.57421875, -169.7890625, -164.00390625, -158.21875, -152.43359375, -146.6484375, -140.86328125, -135.078125, -129.29296875, -123.5078125, -117.72265625, -111.9375, -106.15234375, -100.3671875, -94.58203125, -88.796875, -83.01171875, -77.2265625, -71.44140625, -65.65625, -59.87109375, -54.0859375, -48.30078125, -42.515625, -36.73046875, -30.9453125, -25.16015625, -19.375, -13.58984375, -7.8046875, -2.01953125, 3.765625, 9.55078125, 15.3359375, 21.12109375, 26.90625, 32.69140625, 38.4765625, 44.26171875, 50.046875, 55.83203125, 61.6171875, 67.40234375, 73.1875, 78.97265625, 84.7578125, 90.54296875, 96.328125, 102.11328125, 107.8984375, 113.68359375, 119.46875, 125.25390625, 131.0390625, 136.82421875, 142.609375, 148.39453125, 154.1796875, 159.96484375, 165.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 13.0, 16.0, 16.0, 21.0, 22.0, 30.0, 33.0, 34.0, 36.0, 39.0, 52.0, 51.0, 30.0, 53.0, 54.0, 47.0, 60.0, 43.0, 45.0, 37.0, 34.0, 27.0, 28.0, 24.0, 28.0, 25.0, 15.0, 15.0, 7.0, 14.0, 6.0, 11.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.421875, -16.885498046875, -16.34912109375, -15.812744140625, -15.2763671875, -14.739990234375, -14.20361328125, -13.667236328125, -13.130859375, -12.594482421875, -12.05810546875, -11.521728515625, -10.9853515625, -10.448974609375, -9.91259765625, -9.376220703125, -8.83984375, -8.303466796875, -7.76708984375, -7.230712890625, -6.6943359375, -6.157958984375, -5.62158203125, -5.085205078125, -4.548828125, -4.012451171875, -3.47607421875, -2.939697265625, -2.4033203125, -1.866943359375, -1.33056640625, -0.794189453125, -0.2578125, 0.278564453125, 0.81494140625, 1.351318359375, 1.8876953125, 2.424072265625, 2.96044921875, 3.496826171875, 4.033203125, 4.569580078125, 5.10595703125, 5.642333984375, 6.1787109375, 6.715087890625, 7.25146484375, 7.787841796875, 8.32421875, 8.860595703125, 9.39697265625, 9.933349609375, 10.4697265625, 11.006103515625, 11.54248046875, 12.078857421875, 12.615234375, 13.151611328125, 13.68798828125, 14.224365234375, 14.7607421875, 15.297119140625, 15.83349609375, 16.369873046875, 16.90625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 26.0, 28.0, 33.0, 60.0, 70.0, 102.0, 125.0, 171.0, 242.0, 310.0, 458.0, 800.0, 1671.0, 4978.0, 73170.0, 4100556.0, 6623.0, 2044.0, 863.0, 516.0, 348.0, 251.0, 224.0, 140.0, 112.0, 96.0, 60.0, 60.0, 34.0, 27.0, 24.0, 13.0, 10.0, 4.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-217.0, -207.9921875, -198.984375, -189.9765625, -180.96875, -171.9609375, -162.953125, -153.9453125, -144.9375, -135.9296875, -126.921875, -117.9140625, -108.90625, -99.8984375, -90.890625, -81.8828125, -72.875, -63.8671875, -54.859375, -45.8515625, -36.84375, -27.8359375, -18.828125, -9.8203125, -0.8125, 8.1953125, 17.203125, 26.2109375, 35.21875, 44.2265625, 53.234375, 62.2421875, 71.25, 80.2578125, 89.265625, 98.2734375, 107.28125, 116.2890625, 125.296875, 134.3046875, 143.3125, 152.3203125, 161.328125, 170.3359375, 179.34375, 188.3515625, 197.359375, 206.3671875, 215.375, 224.3828125, 233.390625, 242.3984375, 251.40625, 260.4140625, 269.421875, 278.4296875, 287.4375, 296.4453125, 305.453125, 314.4609375, 323.46875, 332.4765625, 341.484375, 350.4921875, 359.5]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 14.0, 46.0, 3904.0, 67.0, 17.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.1875, -35.67626953125, -34.1650390625, -32.65380859375, -31.142578125, -29.63134765625, -28.1201171875, -26.60888671875, -25.09765625, -23.58642578125, -22.0751953125, -20.56396484375, -19.052734375, -17.54150390625, -16.0302734375, -14.51904296875, -13.0078125, -11.49658203125, -9.9853515625, -8.47412109375, -6.962890625, -5.45166015625, -3.9404296875, -2.42919921875, -0.91796875, 0.59326171875, 2.1044921875, 3.61572265625, 5.126953125, 6.63818359375, 8.1494140625, 9.66064453125, 11.171875, 12.68310546875, 14.1943359375, 15.70556640625, 17.216796875, 18.72802734375, 20.2392578125, 21.75048828125, 23.26171875, 24.77294921875, 26.2841796875, 27.79541015625, 29.306640625, 30.81787109375, 32.3291015625, 33.84033203125, 35.3515625, 36.86279296875, 38.3740234375, 39.88525390625, 41.396484375, 42.90771484375, 44.4189453125, 45.93017578125, 47.44140625, 48.95263671875, 50.4638671875, 51.97509765625, 53.486328125, 54.99755859375, 56.5087890625, 58.02001953125, 59.53125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 13.0, 19.0, 42.0, 78.0, 149.0, 204.0, 179.0, 118.0, 65.0, 46.0, 24.0, 29.0, 10.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.42698669433594, -235.44906616210938, -228.4711456298828, -221.49322509765625, -214.51528930664062, -207.53738403320312, -200.5594482421875, -193.58152770996094, -186.60360717773438, -179.6256866455078, -172.64776611328125, -165.6698455810547, -158.69192504882812, -151.7139892578125, -144.73606872558594, -137.75814819335938, -130.7802276611328, -123.80230712890625, -116.82438659667969, -109.8464584350586, -102.86853790283203, -95.89061737060547, -88.91268920898438, -81.93476867675781, -74.95684814453125, -67.97892761230469, -61.00100326538086, -54.02307891845703, -47.04515838623047, -40.067237854003906, -33.08931350708008, -26.11138916015625, -19.13348388671875, -12.155561447143555, -5.177639007568359, 1.800283432006836, 8.778205871582031, 15.756126403808594, 22.734050750732422, 29.71197509765625, 36.68989562988281, 43.667816162109375, 50.6457405090332, 57.62366485595703, 64.6015853881836, 71.57950592041016, 78.55743408203125, 85.53535461425781, 92.51327514648438, 99.49119567871094, 106.4691162109375, 113.4470443725586, 120.42496490478516, 127.40288543701172, 134.3808135986328, 141.35873413085938, 148.33665466308594, 155.3145751953125, 162.29249572753906, 169.27041625976562, 176.24835205078125, 183.22625732421875, 190.20419311523438, 197.18211364746094, 204.1600341796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 6.0, 9.0, 5.0, 12.0, 8.0, 8.0, 18.0, 16.0, 18.0, 21.0, 17.0, 22.0, 22.0, 28.0, 41.0, 37.0, 36.0, 33.0, 42.0, 31.0, 33.0, 36.0, 36.0, 25.0, 36.0, 28.0, 31.0, 29.0, 26.0, 27.0, 24.0, 28.0, 24.0, 22.0, 19.0, 15.0, 16.0, 27.0, 14.0, 13.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-63.00270080566406, -60.92894744873047, -58.855194091796875, -56.78144073486328, -54.70768737792969, -52.633934020996094, -50.5601806640625, -48.486427307128906, -46.41267395019531, -44.33892059326172, -42.265167236328125, -40.19141387939453, -38.11766052246094, -36.043907165527344, -33.97015380859375, -31.896400451660156, -29.822647094726562, -27.74889373779297, -25.675140380859375, -23.60138702392578, -21.527633666992188, -19.453880310058594, -17.380126953125, -15.306373596191406, -13.232620239257812, -11.158866882324219, -9.085113525390625, -7.011360168457031, -4.9376068115234375, -2.8638534545898438, -0.79010009765625, 1.2836532592773438, 3.3574066162109375, 5.431159973144531, 7.504913330078125, 9.578666687011719, 11.652420043945312, 13.726173400878906, 15.7999267578125, 17.873680114746094, 19.947433471679688, 22.02118682861328, 24.094940185546875, 26.16869354248047, 28.242446899414062, 30.316200256347656, 32.38995361328125, 34.463706970214844, 36.53746032714844, 38.61121368408203, 40.684967041015625, 42.75872039794922, 44.83247375488281, 46.906227111816406, 48.97998046875, 51.053733825683594, 53.12748718261719, 55.20124053955078, 57.274993896484375, 59.34874725341797, 61.42250061035156, 63.496253967285156, 65.57000732421875, 67.64376068115234, 69.71751403808594]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 15.0, 29.0, 21.0, 29.0, 41.0, 65.0, 89.0, 108.0, 142.0, 201.0, 338.0, 427.0, 677.0, 954.0, 1601.0, 2399.0, 3761.0, 6436.0, 11525.0, 21453.0, 42702.0, 92380.0, 226267.0, 339518.0, 157975.0, 67463.0, 31586.0, 16665.0, 9002.0, 5279.0, 3232.0, 2043.0, 1310.0, 870.0, 574.0, 369.0, 318.0, 200.0, 135.0, 89.0, 66.0, 52.0, 29.0, 26.0, 16.0, 25.0, 14.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-48.4375, -46.89013671875, -45.3427734375, -43.79541015625, -42.248046875, -40.70068359375, -39.1533203125, -37.60595703125, -36.05859375, -34.51123046875, -32.9638671875, -31.41650390625, -29.869140625, -28.32177734375, -26.7744140625, -25.22705078125, -23.6796875, -22.13232421875, -20.5849609375, -19.03759765625, -17.490234375, -15.94287109375, -14.3955078125, -12.84814453125, -11.30078125, -9.75341796875, -8.2060546875, -6.65869140625, -5.111328125, -3.56396484375, -2.0166015625, -0.46923828125, 1.078125, 2.62548828125, 4.1728515625, 5.72021484375, 7.267578125, 8.81494140625, 10.3623046875, 11.90966796875, 13.45703125, 15.00439453125, 16.5517578125, 18.09912109375, 19.646484375, 21.19384765625, 22.7412109375, 24.28857421875, 25.8359375, 27.38330078125, 28.9306640625, 30.47802734375, 32.025390625, 33.57275390625, 35.1201171875, 36.66748046875, 38.21484375, 39.76220703125, 41.3095703125, 42.85693359375, 44.404296875, 45.95166015625, 47.4990234375, 49.04638671875, 50.59375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 13.0, 9.0, 7.0, 12.0, 22.0, 12.0, 21.0, 33.0, 34.0, 43.0, 44.0, 59.0, 53.0, 52.0, 50.0, 53.0, 53.0, 57.0, 35.0, 44.0, 34.0, 33.0, 32.0, 28.0, 19.0, 18.0, 18.0, 20.0, 25.0, 12.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.125, -20.435302734375, -19.74560546875, -19.055908203125, -18.3662109375, -17.676513671875, -16.98681640625, -16.297119140625, -15.607421875, -14.917724609375, -14.22802734375, -13.538330078125, -12.8486328125, -12.158935546875, -11.46923828125, -10.779541015625, -10.08984375, -9.400146484375, -8.71044921875, -8.020751953125, -7.3310546875, -6.641357421875, -5.95166015625, -5.261962890625, -4.572265625, -3.882568359375, -3.19287109375, -2.503173828125, -1.8134765625, -1.123779296875, -0.43408203125, 0.255615234375, 0.9453125, 1.635009765625, 2.32470703125, 3.014404296875, 3.7041015625, 4.393798828125, 5.08349609375, 5.773193359375, 6.462890625, 7.152587890625, 7.84228515625, 8.531982421875, 9.2216796875, 9.911376953125, 10.60107421875, 11.290771484375, 11.98046875, 12.670166015625, 13.35986328125, 14.049560546875, 14.7392578125, 15.428955078125, 16.11865234375, 16.808349609375, 17.498046875, 18.187744140625, 18.87744140625, 19.567138671875, 20.2568359375, 20.946533203125, 21.63623046875, 22.325927734375, 23.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 10.0, 21.0, 10.0, 23.0, 32.0, 65.0, 83.0, 172.0, 321.0, 479.0, 1048.0, 2382.0, 5725.0, 15785.0, 57909.0, 360688.0, 500628.0, 72490.0, 18831.0, 6627.0, 2598.0, 1261.0, 584.0, 296.0, 181.0, 122.0, 53.0, 43.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3125, -90.8291015625, -87.345703125, -83.8623046875, -80.37890625, -76.8955078125, -73.412109375, -69.9287109375, -66.4453125, -62.9619140625, -59.478515625, -55.9951171875, -52.51171875, -49.0283203125, -45.544921875, -42.0615234375, -38.578125, -35.0947265625, -31.611328125, -28.1279296875, -24.64453125, -21.1611328125, -17.677734375, -14.1943359375, -10.7109375, -7.2275390625, -3.744140625, -0.2607421875, 3.22265625, 6.7060546875, 10.189453125, 13.6728515625, 17.15625, 20.6396484375, 24.123046875, 27.6064453125, 31.08984375, 34.5732421875, 38.056640625, 41.5400390625, 45.0234375, 48.5068359375, 51.990234375, 55.4736328125, 58.95703125, 62.4404296875, 65.923828125, 69.4072265625, 72.890625, 76.3740234375, 79.857421875, 83.3408203125, 86.82421875, 90.3076171875, 93.791015625, 97.2744140625, 100.7578125, 104.2412109375, 107.724609375, 111.2080078125, 114.69140625, 118.1748046875, 121.658203125, 125.1416015625, 128.625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 19.0, 17.0, 25.0, 30.0, 21.0, 40.0, 47.0, 41.0, 37.0, 59.0, 60.0, 49.0, 45.0, 60.0, 69.0, 56.0, 53.0, 35.0, 39.0, 29.0, 41.0, 21.0, 15.0, 14.0, 9.0, 16.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.375, -110.953125, -106.53125, -102.109375, -97.6875, -93.265625, -88.84375, -84.421875, -80.0, -75.578125, -71.15625, -66.734375, -62.3125, -57.890625, -53.46875, -49.046875, -44.625, -40.203125, -35.78125, -31.359375, -26.9375, -22.515625, -18.09375, -13.671875, -9.25, -4.828125, -0.40625, 4.015625, 8.4375, 12.859375, 17.28125, 21.703125, 26.125, 30.546875, 34.96875, 39.390625, 43.8125, 48.234375, 52.65625, 57.078125, 61.5, 65.921875, 70.34375, 74.765625, 79.1875, 83.609375, 88.03125, 92.453125, 96.875, 101.296875, 105.71875, 110.140625, 114.5625, 118.984375, 123.40625, 127.828125, 132.25, 136.671875, 141.09375, 145.515625, 149.9375, 154.359375, 158.78125, 163.203125, 167.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 21.0, 32.0, 36.0, 60.0, 88.0, 135.0, 205.0, 317.0, 487.0, 760.0, 1308.0, 2339.0, 4898.0, 12149.0, 43821.0, 447540.0, 466531.0, 44751.0, 12244.0, 4868.0, 2347.0, 1378.0, 775.0, 442.0, 321.0, 173.0, 155.0, 108.0, 66.0, 42.0, 44.0, 19.0, 16.0, 13.0, 7.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.59375, -52.8330078125, -51.072265625, -49.3115234375, -47.55078125, -45.7900390625, -44.029296875, -42.2685546875, -40.5078125, -38.7470703125, -36.986328125, -35.2255859375, -33.46484375, -31.7041015625, -29.943359375, -28.1826171875, -26.421875, -24.6611328125, -22.900390625, -21.1396484375, -19.37890625, -17.6181640625, -15.857421875, -14.0966796875, -12.3359375, -10.5751953125, -8.814453125, -7.0537109375, -5.29296875, -3.5322265625, -1.771484375, -0.0107421875, 1.75, 3.5107421875, 5.271484375, 7.0322265625, 8.79296875, 10.5537109375, 12.314453125, 14.0751953125, 15.8359375, 17.5966796875, 19.357421875, 21.1181640625, 22.87890625, 24.6396484375, 26.400390625, 28.1611328125, 29.921875, 31.6826171875, 33.443359375, 35.2041015625, 36.96484375, 38.7255859375, 40.486328125, 42.2470703125, 44.0078125, 45.7685546875, 47.529296875, 49.2900390625, 51.05078125, 52.8115234375, 54.572265625, 56.3330078125, 58.09375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 19.0, 23.0, 34.0, 58.0, 78.0, 99.0, 131.0, 120.0, 108.0, 76.0, 51.0, 40.0, 25.0, 13.0, 26.0, 13.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01082611083984375, -0.01050722599029541, -0.01018834114074707, -0.00986945629119873, -0.00955057144165039, -0.00923168659210205, -0.008912801742553711, -0.008593916893005371, -0.008275032043457031, -0.007956147193908691, -0.0076372623443603516, -0.007318377494812012, -0.006999492645263672, -0.006680607795715332, -0.006361722946166992, -0.006042838096618652, -0.0057239532470703125, -0.005405068397521973, -0.005086183547973633, -0.004767298698425293, -0.004448413848876953, -0.004129528999328613, -0.0038106441497802734, -0.0034917593002319336, -0.0031728744506835938, -0.002853989601135254, -0.002535104751586914, -0.0022162199020385742, -0.0018973350524902344, -0.0015784502029418945, -0.0012595653533935547, -0.0009406805038452148, -0.000621795654296875, -0.00030291080474853516, 1.5974044799804688e-05, 0.00033485889434814453, 0.0006537437438964844, 0.0009726285934448242, 0.001291513442993164, 0.001610398292541504, 0.0019292831420898438, 0.0022481679916381836, 0.0025670528411865234, 0.0028859376907348633, 0.003204822540283203, 0.003523707389831543, 0.003842592239379883, 0.004161477088928223, 0.0044803619384765625, 0.004799246788024902, 0.005118131637573242, 0.005437016487121582, 0.005755901336669922, 0.006074786186218262, 0.0063936710357666016, 0.006712555885314941, 0.007031440734863281, 0.007350325584411621, 0.007669210433959961, 0.0079880952835083, 0.00830698013305664, 0.00862586498260498, 0.00894474983215332, 0.00926363468170166, 0.00958251953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 17.0, 38.0, 64.0, 101.0, 148.0, 348.0, 757.0, 1928.0, 7195.0, 44423.0, 837202.0, 137676.0, 13348.0, 3145.0, 1113.0, 454.0, 242.0, 100.0, 83.0, 42.0, 28.0, 21.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.8125, -102.7626953125, -99.712890625, -96.6630859375, -93.61328125, -90.5634765625, -87.513671875, -84.4638671875, -81.4140625, -78.3642578125, -75.314453125, -72.2646484375, -69.21484375, -66.1650390625, -63.115234375, -60.0654296875, -57.015625, -53.9658203125, -50.916015625, -47.8662109375, -44.81640625, -41.7666015625, -38.716796875, -35.6669921875, -32.6171875, -29.5673828125, -26.517578125, -23.4677734375, -20.41796875, -17.3681640625, -14.318359375, -11.2685546875, -8.21875, -5.1689453125, -2.119140625, 0.9306640625, 3.98046875, 7.0302734375, 10.080078125, 13.1298828125, 16.1796875, 19.2294921875, 22.279296875, 25.3291015625, 28.37890625, 31.4287109375, 34.478515625, 37.5283203125, 40.578125, 43.6279296875, 46.677734375, 49.7275390625, 52.77734375, 55.8271484375, 58.876953125, 61.9267578125, 64.9765625, 68.0263671875, 71.076171875, 74.1259765625, 77.17578125, 80.2255859375, 83.275390625, 86.3251953125, 89.375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 12.0, 16.0, 31.0, 51.0, 88.0, 141.0, 196.0, 171.0, 109.0, 57.0, 28.0, 23.0, 17.0, 9.0, 12.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-113.9375, -111.3330078125, -108.728515625, -106.1240234375, -103.51953125, -100.9150390625, -98.310546875, -95.7060546875, -93.1015625, -90.4970703125, -87.892578125, -85.2880859375, -82.68359375, -80.0791015625, -77.474609375, -74.8701171875, -72.265625, -69.6611328125, -67.056640625, -64.4521484375, -61.84765625, -59.2431640625, -56.638671875, -54.0341796875, -51.4296875, -48.8251953125, -46.220703125, -43.6162109375, -41.01171875, -38.4072265625, -35.802734375, -33.1982421875, -30.59375, -27.9892578125, -25.384765625, -22.7802734375, -20.17578125, -17.5712890625, -14.966796875, -12.3623046875, -9.7578125, -7.1533203125, -4.548828125, -1.9443359375, 0.66015625, 3.2646484375, 5.869140625, 8.4736328125, 11.078125, 13.6826171875, 16.287109375, 18.8916015625, 21.49609375, 24.1005859375, 26.705078125, 29.3095703125, 31.9140625, 34.5185546875, 37.123046875, 39.7275390625, 42.33203125, 44.9365234375, 47.541015625, 50.1455078125, 52.75]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 21.0, 27.0, 49.0, 58.0, 83.0, 134.0, 152.0, 152.0, 110.0, 73.0, 56.0, 34.0, 13.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-520.7315063476562, -487.66729736328125, -454.60308837890625, -421.53887939453125, -388.47467041015625, -355.41046142578125, -322.3462829589844, -289.2820739746094, -256.2178649902344, -223.15365600585938, -190.08944702148438, -157.02525329589844, -123.96104431152344, -90.89683532714844, -57.8326416015625, -24.7684326171875, 8.2957763671875, 41.359981536865234, 74.42418670654297, 107.48838806152344, 140.55259704589844, 173.61680603027344, 206.68099975585938, 239.74520874023438, 272.8094177246094, 305.8736267089844, 338.9378356933594, 372.00201416015625, 405.06622314453125, 438.13043212890625, 471.19464111328125, 504.25885009765625, 537.322998046875, 570.38720703125, 603.451416015625, 636.515625, 669.579833984375, 702.64404296875, 735.708251953125, 768.7724609375, 801.836669921875, 834.90087890625, 867.965087890625, 901.029296875, 934.093505859375, 967.15771484375, 1000.221923828125, 1033.2861328125, 1066.350341796875, 1099.41455078125, 1132.478759765625, 1165.54296875, 1198.607177734375, 1231.67138671875, 1264.735595703125, 1297.7998046875, 1330.8638916015625, 1363.9281005859375, 1396.9923095703125, 1430.0565185546875, 1463.1207275390625, 1496.1849365234375, 1529.2491455078125, 1562.3133544921875, 1595.3775634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 1.0, 7.0, 6.0, 11.0, 12.0, 13.0, 13.0, 16.0, 22.0, 20.0, 18.0, 22.0, 22.0, 25.0, 33.0, 42.0, 33.0, 39.0, 33.0, 38.0, 56.0, 40.0, 45.0, 40.0, 33.0, 31.0, 32.0, 41.0, 27.0, 32.0, 20.0, 18.0, 21.0, 25.0, 22.0, 12.0, 11.0, 14.0, 7.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-495.1510009765625, -478.4688720703125, -461.7867431640625, -445.1046142578125, -428.4224853515625, -411.7403564453125, -395.0581970214844, -378.3760681152344, -361.6939392089844, -345.0118103027344, -328.3296813964844, -311.6475524902344, -294.96539306640625, -278.28326416015625, -261.60113525390625, -244.91900634765625, -228.23687744140625, -211.55474853515625, -194.87261962890625, -178.1904754638672, -161.5083465576172, -144.8262176513672, -128.14407348632812, -111.46194458007812, -94.77981567382812, -78.09768676757812, -61.415550231933594, -44.73341751098633, -28.051284790039062, -11.369155883789062, 5.312980651855469, 21.9951171875, 38.67718505859375, 55.359317779541016, 72.04145050048828, 88.72358703613281, 105.40571594238281, 122.08784484863281, 138.76998901367188, 155.45211791992188, 172.13424682617188, 188.81637573242188, 205.49850463867188, 222.18064880371094, 238.86277770996094, 255.54490661621094, 272.22705078125, 288.9091796875, 305.59130859375, 322.2734375, 338.95556640625, 355.6376953125, 372.31982421875, 389.001953125, 405.6841125488281, 422.3662414550781, 439.0483703613281, 455.7304992675781, 472.4126281738281, 489.0947570800781, 505.77691650390625, 522.4590454101562, 539.1411743164062, 555.8233032226562, 572.5054321289062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 16.0, 13.0, 32.0, 30.0, 74.0, 95.0, 128.0, 173.0, 250.0, 429.0, 611.0, 999.0, 1661.0, 3899.0, 27188.0, 4144708.0, 7958.0, 2359.0, 1242.0, 792.0, 535.0, 332.0, 260.0, 145.0, 95.0, 81.0, 55.0, 32.0, 23.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-259.5, -252.71484375, -245.9296875, -239.14453125, -232.359375, -225.57421875, -218.7890625, -212.00390625, -205.21875, -198.43359375, -191.6484375, -184.86328125, -178.078125, -171.29296875, -164.5078125, -157.72265625, -150.9375, -144.15234375, -137.3671875, -130.58203125, -123.796875, -117.01171875, -110.2265625, -103.44140625, -96.65625, -89.87109375, -83.0859375, -76.30078125, -69.515625, -62.73046875, -55.9453125, -49.16015625, -42.375, -35.58984375, -28.8046875, -22.01953125, -15.234375, -8.44921875, -1.6640625, 5.12109375, 11.90625, 18.69140625, 25.4765625, 32.26171875, 39.046875, 45.83203125, 52.6171875, 59.40234375, 66.1875, 72.97265625, 79.7578125, 86.54296875, 93.328125, 100.11328125, 106.8984375, 113.68359375, 120.46875, 127.25390625, 134.0390625, 140.82421875, 147.609375, 154.39453125, 161.1796875, 167.96484375, 174.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 15.0, 20.0, 25.0, 15.0, 26.0, 33.0, 39.0, 47.0, 44.0, 42.0, 54.0, 55.0, 56.0, 53.0, 57.0, 44.0, 43.0, 55.0, 42.0, 41.0, 31.0, 28.0, 28.0, 14.0, 16.0, 14.0, 13.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.772216796875, -19.99755859375, -19.222900390625, -18.4482421875, -17.673583984375, -16.89892578125, -16.124267578125, -15.349609375, -14.574951171875, -13.80029296875, -13.025634765625, -12.2509765625, -11.476318359375, -10.70166015625, -9.927001953125, -9.15234375, -8.377685546875, -7.60302734375, -6.828369140625, -6.0537109375, -5.279052734375, -4.50439453125, -3.729736328125, -2.955078125, -2.180419921875, -1.40576171875, -0.631103515625, 0.1435546875, 0.918212890625, 1.69287109375, 2.467529296875, 3.2421875, 4.016845703125, 4.79150390625, 5.566162109375, 6.3408203125, 7.115478515625, 7.89013671875, 8.664794921875, 9.439453125, 10.214111328125, 10.98876953125, 11.763427734375, 12.5380859375, 13.312744140625, 14.08740234375, 14.862060546875, 15.63671875, 16.411376953125, 17.18603515625, 17.960693359375, 18.7353515625, 19.510009765625, 20.28466796875, 21.059326171875, 21.833984375, 22.608642578125, 23.38330078125, 24.157958984375, 24.9326171875, 25.707275390625, 26.48193359375, 27.256591796875, 28.03125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 9.0, 9.0, 15.0, 18.0, 22.0, 36.0, 45.0, 41.0, 85.0, 102.0, 172.0, 281.0, 551.0, 1349.0, 3994.0, 22458.0, 4147232.0, 12589.0, 2977.0, 1049.0, 433.0, 262.0, 151.0, 99.0, 68.0, 56.0, 49.0, 31.0, 21.0, 21.0, 10.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.01171875, -291.0234375, -282.03515625, -273.046875, -264.05859375, -255.0703125, -246.08203125, -237.09375, -228.10546875, -219.1171875, -210.12890625, -201.140625, -192.15234375, -183.1640625, -174.17578125, -165.1875, -156.19921875, -147.2109375, -138.22265625, -129.234375, -120.24609375, -111.2578125, -102.26953125, -93.28125, -84.29296875, -75.3046875, -66.31640625, -57.328125, -48.33984375, -39.3515625, -30.36328125, -21.375, -12.38671875, -3.3984375, 5.58984375, 14.578125, 23.56640625, 32.5546875, 41.54296875, 50.53125, 59.51953125, 68.5078125, 77.49609375, 86.484375, 95.47265625, 104.4609375, 113.44921875, 122.4375, 131.42578125, 140.4140625, 149.40234375, 158.390625, 167.37890625, 176.3671875, 185.35546875, 194.34375, 203.33203125, 212.3203125, 221.30859375, 230.296875, 239.28515625, 248.2734375, 257.26171875, 266.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 45.0, 3845.0, 123.0, 15.0, 12.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -73.22314453125, -71.3837890625, -69.54443359375, -67.705078125, -65.86572265625, -64.0263671875, -62.18701171875, -60.34765625, -58.50830078125, -56.6689453125, -54.82958984375, -52.990234375, -51.15087890625, -49.3115234375, -47.47216796875, -45.6328125, -43.79345703125, -41.9541015625, -40.11474609375, -38.275390625, -36.43603515625, -34.5966796875, -32.75732421875, -30.91796875, -29.07861328125, -27.2392578125, -25.39990234375, -23.560546875, -21.72119140625, -19.8818359375, -18.04248046875, -16.203125, -14.36376953125, -12.5244140625, -10.68505859375, -8.845703125, -7.00634765625, -5.1669921875, -3.32763671875, -1.48828125, 0.35107421875, 2.1904296875, 4.02978515625, 5.869140625, 7.70849609375, 9.5478515625, 11.38720703125, 13.2265625, 15.06591796875, 16.9052734375, 18.74462890625, 20.583984375, 22.42333984375, 24.2626953125, 26.10205078125, 27.94140625, 29.78076171875, 31.6201171875, 33.45947265625, 35.298828125, 37.13818359375, 38.9775390625, 40.81689453125, 42.65625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 5.0, 6.0, 13.0, 14.0, 22.0, 23.0, 17.0, 42.0, 44.0, 59.0, 69.0, 78.0, 95.0, 96.0, 77.0, 72.0, 73.0, 48.0, 43.0, 22.0, 19.0, 10.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-117.26155090332031, -114.4413070678711, -111.62106323242188, -108.80081939697266, -105.98057556152344, -103.16033172607422, -100.340087890625, -97.51983642578125, -94.69960021972656, -91.87935638427734, -89.05911254882812, -86.2388687133789, -83.41862487792969, -80.59838104248047, -77.77813720703125, -74.9578857421875, -72.13764190673828, -69.31739807128906, -66.49715423583984, -63.676910400390625, -60.856666564941406, -58.03642272949219, -55.2161750793457, -52.395931243896484, -49.575687408447266, -46.75544357299805, -43.93519973754883, -41.114952087402344, -38.294708251953125, -35.474464416503906, -32.65422058105469, -29.83397674560547, -27.013736724853516, -24.193492889404297, -21.373249053955078, -18.553003311157227, -15.732759475708008, -12.912515640258789, -10.092269897460938, -7.272026062011719, -4.4517822265625, -1.631537914276123, 1.188706398010254, 4.008951187133789, 6.829195022583008, 9.649438858032227, 12.469684600830078, 15.289928436279297, 18.110172271728516, 20.930416107177734, 23.750659942626953, 26.570905685424805, 29.391149520874023, 32.211395263671875, 35.031639099121094, 37.85188293457031, 40.67212677001953, 43.49237060546875, 46.31261444091797, 49.13285827636719, 51.953102111816406, 54.773345947265625, 57.59359359741211, 60.41383743286133, 63.23408126831055]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 22.0, 14.0, 23.0, 31.0, 29.0, 37.0, 32.0, 39.0, 31.0, 44.0, 47.0, 56.0, 49.0, 53.0, 50.0, 45.0, 46.0, 38.0, 35.0, 46.0, 31.0, 30.0, 22.0, 8.0, 14.0, 16.0, 21.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-85.15863037109375, -82.89708709716797, -80.63554382324219, -78.3740005493164, -76.11245727539062, -73.85091400146484, -71.58937072753906, -69.32783508300781, -67.0662841796875, -64.80474090576172, -62.54319763183594, -60.281654357910156, -58.020111083984375, -55.758567810058594, -53.49702835083008, -51.2354850769043, -48.97394561767578, -46.71240234375, -44.45085906982422, -42.18931579589844, -39.927772521972656, -37.666229248046875, -35.40468978881836, -33.14314651489258, -30.881603240966797, -28.620059967041016, -26.358516693115234, -24.096975326538086, -21.835432052612305, -19.573888778686523, -17.312347412109375, -15.050804138183594, -12.789268493652344, -10.527725219726562, -8.266182899475098, -6.004640102386475, -3.7430973052978516, -1.4815540313720703, 0.7799882888793945, 3.0415306091308594, 5.303073883056641, 7.564616680145264, 9.826159477233887, 12.087701797485352, 14.349245071411133, 16.610788345336914, 18.872329711914062, 21.133872985839844, 23.395416259765625, 25.656959533691406, 27.918502807617188, 30.180044174194336, 32.44158935546875, 34.70313262939453, 36.96467208862305, 39.22621536254883, 41.48775863647461, 43.74930191040039, 46.01084518432617, 48.27238845825195, 50.53392791748047, 52.79547119140625, 55.05701446533203, 57.31855773925781, 59.580101013183594]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 13.0, 11.0, 15.0, 42.0, 47.0, 72.0, 87.0, 138.0, 188.0, 281.0, 457.0, 721.0, 1123.0, 1815.0, 2907.0, 5179.0, 9397.0, 18051.0, 37886.0, 87937.0, 229442.0, 362427.0, 163511.0, 65109.0, 29188.0, 14100.0, 7503.0, 4252.0, 2509.0, 1451.0, 906.0, 597.0, 391.0, 263.0, 175.0, 112.0, 74.0, 48.0, 27.0, 22.0, 23.0, 13.0, 10.0, 14.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.7314453125, -52.119140625, -50.5068359375, -48.89453125, -47.2822265625, -45.669921875, -44.0576171875, -42.4453125, -40.8330078125, -39.220703125, -37.6083984375, -35.99609375, -34.3837890625, -32.771484375, -31.1591796875, -29.546875, -27.9345703125, -26.322265625, -24.7099609375, -23.09765625, -21.4853515625, -19.873046875, -18.2607421875, -16.6484375, -15.0361328125, -13.423828125, -11.8115234375, -10.19921875, -8.5869140625, -6.974609375, -5.3623046875, -3.75, -2.1376953125, -0.525390625, 1.0869140625, 2.69921875, 4.3115234375, 5.923828125, 7.5361328125, 9.1484375, 10.7607421875, 12.373046875, 13.9853515625, 15.59765625, 17.2099609375, 18.822265625, 20.4345703125, 22.046875, 23.6591796875, 25.271484375, 26.8837890625, 28.49609375, 30.1083984375, 31.720703125, 33.3330078125, 34.9453125, 36.5576171875, 38.169921875, 39.7822265625, 41.39453125, 43.0068359375, 44.619140625, 46.2314453125, 47.84375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 1.0, 8.0, 6.0, 12.0, 14.0, 9.0, 10.0, 17.0, 19.0, 26.0, 29.0, 45.0, 42.0, 52.0, 38.0, 44.0, 45.0, 57.0, 54.0, 64.0, 46.0, 39.0, 31.0, 52.0, 36.0, 32.0, 39.0, 35.0, 21.0, 14.0, 13.0, 12.0, 13.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.25, -25.45751953125, -24.6650390625, -23.87255859375, -23.080078125, -22.28759765625, -21.4951171875, -20.70263671875, -19.91015625, -19.11767578125, -18.3251953125, -17.53271484375, -16.740234375, -15.94775390625, -15.1552734375, -14.36279296875, -13.5703125, -12.77783203125, -11.9853515625, -11.19287109375, -10.400390625, -9.60791015625, -8.8154296875, -8.02294921875, -7.23046875, -6.43798828125, -5.6455078125, -4.85302734375, -4.060546875, -3.26806640625, -2.4755859375, -1.68310546875, -0.890625, -0.09814453125, 0.6943359375, 1.48681640625, 2.279296875, 3.07177734375, 3.8642578125, 4.65673828125, 5.44921875, 6.24169921875, 7.0341796875, 7.82666015625, 8.619140625, 9.41162109375, 10.2041015625, 10.99658203125, 11.7890625, 12.58154296875, 13.3740234375, 14.16650390625, 14.958984375, 15.75146484375, 16.5439453125, 17.33642578125, 18.12890625, 18.92138671875, 19.7138671875, 20.50634765625, 21.298828125, 22.09130859375, 22.8837890625, 23.67626953125, 24.46875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 16.0, 14.0, 24.0, 44.0, 43.0, 75.0, 107.0, 172.0, 338.0, 609.0, 1128.0, 2532.0, 6139.0, 17477.0, 65167.0, 406382.0, 447755.0, 70184.0, 18651.0, 6380.0, 2559.0, 1233.0, 581.0, 316.0, 204.0, 119.0, 92.0, 42.0, 31.0, 28.0, 21.0, 15.0, 8.0, 3.0, 10.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.75, -95.84765625, -92.9453125, -90.04296875, -87.140625, -84.23828125, -81.3359375, -78.43359375, -75.53125, -72.62890625, -69.7265625, -66.82421875, -63.921875, -61.01953125, -58.1171875, -55.21484375, -52.3125, -49.41015625, -46.5078125, -43.60546875, -40.703125, -37.80078125, -34.8984375, -31.99609375, -29.09375, -26.19140625, -23.2890625, -20.38671875, -17.484375, -14.58203125, -11.6796875, -8.77734375, -5.875, -2.97265625, -0.0703125, 2.83203125, 5.734375, 8.63671875, 11.5390625, 14.44140625, 17.34375, 20.24609375, 23.1484375, 26.05078125, 28.953125, 31.85546875, 34.7578125, 37.66015625, 40.5625, 43.46484375, 46.3671875, 49.26953125, 52.171875, 55.07421875, 57.9765625, 60.87890625, 63.78125, 66.68359375, 69.5859375, 72.48828125, 75.390625, 78.29296875, 81.1953125, 84.09765625, 87.0]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 7.0, 12.0, 8.0, 11.0, 13.0, 11.0, 19.0, 22.0, 28.0, 29.0, 19.0, 30.0, 29.0, 40.0, 33.0, 41.0, 47.0, 51.0, 47.0, 44.0, 44.0, 38.0, 41.0, 40.0, 45.0, 32.0, 32.0, 35.0, 25.0, 27.0, 15.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.0, -90.6435546875, -87.287109375, -83.9306640625, -80.57421875, -77.2177734375, -73.861328125, -70.5048828125, -67.1484375, -63.7919921875, -60.435546875, -57.0791015625, -53.72265625, -50.3662109375, -47.009765625, -43.6533203125, -40.296875, -36.9404296875, -33.583984375, -30.2275390625, -26.87109375, -23.5146484375, -20.158203125, -16.8017578125, -13.4453125, -10.0888671875, -6.732421875, -3.3759765625, -0.01953125, 3.3369140625, 6.693359375, 10.0498046875, 13.40625, 16.7626953125, 20.119140625, 23.4755859375, 26.83203125, 30.1884765625, 33.544921875, 36.9013671875, 40.2578125, 43.6142578125, 46.970703125, 50.3271484375, 53.68359375, 57.0400390625, 60.396484375, 63.7529296875, 67.109375, 70.4658203125, 73.822265625, 77.1787109375, 80.53515625, 83.8916015625, 87.248046875, 90.6044921875, 93.9609375, 97.3173828125, 100.673828125, 104.0302734375, 107.38671875, 110.7431640625, 114.099609375, 117.4560546875, 120.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 13.0, 17.0, 32.0, 33.0, 60.0, 104.0, 189.0, 337.0, 693.0, 1532.0, 4421.0, 23280.0, 697940.0, 298463.0, 15371.0, 3467.0, 1261.0, 574.0, 317.0, 164.0, 90.0, 45.0, 50.0, 24.0, 27.0, 13.0, 8.0, 8.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.125, -70.40625, -67.6875, -64.96875, -62.25, -59.53125, -56.8125, -54.09375, -51.375, -48.65625, -45.9375, -43.21875, -40.5, -37.78125, -35.0625, -32.34375, -29.625, -26.90625, -24.1875, -21.46875, -18.75, -16.03125, -13.3125, -10.59375, -7.875, -5.15625, -2.4375, 0.28125, 3.0, 5.71875, 8.4375, 11.15625, 13.875, 16.59375, 19.3125, 22.03125, 24.75, 27.46875, 30.1875, 32.90625, 35.625, 38.34375, 41.0625, 43.78125, 46.5, 49.21875, 51.9375, 54.65625, 57.375, 60.09375, 62.8125, 65.53125, 68.25, 70.96875, 73.6875, 76.40625, 79.125, 81.84375, 84.5625, 87.28125, 90.0, 92.71875, 95.4375, 98.15625, 100.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 7.0, 6.0, 16.0, 22.0, 25.0, 61.0, 104.0, 192.0, 216.0, 159.0, 71.0, 37.0, 22.0, 14.0, 10.0, 9.0, 13.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155792236328125, -0.014987468719482422, -0.014395713806152344, -0.013803958892822266, -0.013212203979492188, -0.01262044906616211, -0.012028694152832031, -0.011436939239501953, -0.010845184326171875, -0.010253429412841797, -0.009661674499511719, -0.00906991958618164, -0.008478164672851562, -0.007886409759521484, -0.007294654846191406, -0.006702899932861328, -0.00611114501953125, -0.005519390106201172, -0.004927635192871094, -0.004335880279541016, -0.0037441253662109375, -0.0031523704528808594, -0.0025606155395507812, -0.001968860626220703, -0.001377105712890625, -0.0007853507995605469, -0.00019359588623046875, 0.0003981590270996094, 0.0009899139404296875, 0.0015816688537597656, 0.0021734237670898438, 0.002765178680419922, 0.00335693359375, 0.003948688507080078, 0.004540443420410156, 0.005132198333740234, 0.0057239532470703125, 0.006315708160400391, 0.006907463073730469, 0.007499217987060547, 0.008090972900390625, 0.008682727813720703, 0.009274482727050781, 0.00986623764038086, 0.010457992553710938, 0.011049747467041016, 0.011641502380371094, 0.012233257293701172, 0.01282501220703125, 0.013416767120361328, 0.014008522033691406, 0.014600276947021484, 0.015192031860351562, 0.01578378677368164, 0.01637554168701172, 0.016967296600341797, 0.017559051513671875, 0.018150806427001953, 0.01874256134033203, 0.01933431625366211, 0.019926071166992188, 0.020517826080322266, 0.021109580993652344, 0.021701335906982422, 0.0222930908203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 17.0, 20.0, 42.0, 63.0, 92.0, 145.0, 195.0, 384.0, 813.0, 1713.0, 4588.0, 17902.0, 167810.0, 773531.0, 64947.0, 10360.0, 3176.0, 1266.0, 612.0, 300.0, 202.0, 109.0, 78.0, 48.0, 34.0, 20.0, 14.0, 13.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.4375, -70.38671875, -68.3359375, -66.28515625, -64.234375, -62.18359375, -60.1328125, -58.08203125, -56.03125, -53.98046875, -51.9296875, -49.87890625, -47.828125, -45.77734375, -43.7265625, -41.67578125, -39.625, -37.57421875, -35.5234375, -33.47265625, -31.421875, -29.37109375, -27.3203125, -25.26953125, -23.21875, -21.16796875, -19.1171875, -17.06640625, -15.015625, -12.96484375, -10.9140625, -8.86328125, -6.8125, -4.76171875, -2.7109375, -0.66015625, 1.390625, 3.44140625, 5.4921875, 7.54296875, 9.59375, 11.64453125, 13.6953125, 15.74609375, 17.796875, 19.84765625, 21.8984375, 23.94921875, 26.0, 28.05078125, 30.1015625, 32.15234375, 34.203125, 36.25390625, 38.3046875, 40.35546875, 42.40625, 44.45703125, 46.5078125, 48.55859375, 50.609375, 52.66015625, 54.7109375, 56.76171875, 58.8125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 31.0, 41.0, 54.0, 88.0, 120.0, 135.0, 143.0, 111.0, 87.0, 44.0, 31.0, 27.0, 15.0, 8.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.94580078125, -61.1416015625, -59.33740234375, -57.533203125, -55.72900390625, -53.9248046875, -52.12060546875, -50.31640625, -48.51220703125, -46.7080078125, -44.90380859375, -43.099609375, -41.29541015625, -39.4912109375, -37.68701171875, -35.8828125, -34.07861328125, -32.2744140625, -30.47021484375, -28.666015625, -26.86181640625, -25.0576171875, -23.25341796875, -21.44921875, -19.64501953125, -17.8408203125, -16.03662109375, -14.232421875, -12.42822265625, -10.6240234375, -8.81982421875, -7.015625, -5.21142578125, -3.4072265625, -1.60302734375, 0.201171875, 2.00537109375, 3.8095703125, 5.61376953125, 7.41796875, 9.22216796875, 11.0263671875, 12.83056640625, 14.634765625, 16.43896484375, 18.2431640625, 20.04736328125, 21.8515625, 23.65576171875, 25.4599609375, 27.26416015625, 29.068359375, 30.87255859375, 32.6767578125, 34.48095703125, 36.28515625, 38.08935546875, 39.8935546875, 41.69775390625, 43.501953125, 45.30615234375, 47.1103515625, 48.91455078125, 50.71875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 15.0, 18.0, 36.0, 44.0, 43.0, 51.0, 98.0, 95.0, 101.0, 91.0, 92.0, 78.0, 63.0, 46.0, 34.0, 21.0, 13.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-396.11224365234375, -376.8864440917969, -357.66064453125, -338.4348449707031, -319.20904541015625, -299.9832763671875, -280.7574768066406, -261.53167724609375, -242.30587768554688, -223.080078125, -203.85427856445312, -184.6284942626953, -165.40269470214844, -146.17689514160156, -126.95110321044922, -107.72531127929688, -88.49951171875, -69.27371215820312, -50.04792022705078, -30.822124481201172, -11.596328735351562, 7.6294708251953125, 26.855262756347656, 46.0810546875, 65.30685424804688, 84.53265380859375, 103.7584457397461, 122.98423767089844, 142.2100372314453, 161.4358367919922, 180.66162109375, 199.88742065429688, 219.1131591796875, 238.33895874023438, 257.56475830078125, 276.7905578613281, 296.016357421875, 315.24212646484375, 334.4679260253906, 353.6937255859375, 372.9195251464844, 392.14532470703125, 411.3711242675781, 430.596923828125, 449.82269287109375, 469.04852294921875, 488.2742919921875, 507.5000915527344, 526.7258911132812, 545.95166015625, 565.177490234375, 584.4032592773438, 603.6290893554688, 622.8548583984375, 642.0806884765625, 661.3064575195312, 680.5322265625, 699.7579956054688, 718.9838256835938, 738.2095947265625, 757.4354248046875, 776.6611938476562, 795.8870239257812, 815.11279296875, 834.338623046875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 8.0, 2.0, 9.0, 8.0, 10.0, 16.0, 12.0, 13.0, 29.0, 23.0, 20.0, 30.0, 29.0, 42.0, 54.0, 62.0, 55.0, 62.0, 63.0, 51.0, 41.0, 45.0, 37.0, 39.0, 32.0, 29.0, 33.0, 32.0, 18.0, 20.0, 21.0, 6.0, 10.0, 10.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-692.869384765625, -673.8358764648438, -654.8023681640625, -635.7688598632812, -616.7353515625, -597.7017822265625, -578.6682739257812, -559.634765625, -540.6012573242188, -521.5677490234375, -502.53424072265625, -483.5007019042969, -464.4671936035156, -445.4336853027344, -426.400146484375, -407.36663818359375, -388.3331298828125, -369.29962158203125, -350.26611328125, -331.2325744628906, -312.1990661621094, -293.1655578613281, -274.13201904296875, -255.0985107421875, -236.06500244140625, -217.031494140625, -197.9979705810547, -178.96444702148438, -159.93093872070312, -140.89743041992188, -121.86390686035156, -102.83038330078125, -83.79693603515625, -64.76342010498047, -45.72990417480469, -26.696388244628906, -7.662872314453125, 11.370643615722656, 30.404159545898438, 49.43768310546875, 68.47119140625, 87.50470733642578, 106.53822326660156, 125.57173919677734, 144.60525512695312, 163.63876342773438, 182.6722869873047, 201.705810546875, 220.73931884765625, 239.7728271484375, 258.80633544921875, 277.8398742675781, 296.8733825683594, 315.9068908691406, 334.9404296875, 353.97393798828125, 373.0074462890625, 392.04095458984375, 411.074462890625, 430.1080017089844, 449.1415100097656, 468.1750183105469, 487.20855712890625, 506.2420654296875, 525.2755737304688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 10.0, 5.0, 13.0, 15.0, 15.0, 35.0, 26.0, 41.0, 51.0, 76.0, 92.0, 143.0, 216.0, 303.0, 408.0, 613.0, 886.0, 1517.0, 3404.0, 4144988.0, 34143.0, 3026.0, 1384.0, 912.0, 586.0, 386.0, 272.0, 223.0, 139.0, 96.0, 64.0, 49.0, 46.0, 36.0, 21.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -201.564453125, -195.25390625, -188.943359375, -182.6328125, -176.322265625, -170.01171875, -163.701171875, -157.390625, -151.080078125, -144.76953125, -138.458984375, -132.1484375, -125.837890625, -119.52734375, -113.216796875, -106.90625, -100.595703125, -94.28515625, -87.974609375, -81.6640625, -75.353515625, -69.04296875, -62.732421875, -56.421875, -50.111328125, -43.80078125, -37.490234375, -31.1796875, -24.869140625, -18.55859375, -12.248046875, -5.9375, 0.373046875, 6.68359375, 12.994140625, 19.3046875, 25.615234375, 31.92578125, 38.236328125, 44.546875, 50.857421875, 57.16796875, 63.478515625, 69.7890625, 76.099609375, 82.41015625, 88.720703125, 95.03125, 101.341796875, 107.65234375, 113.962890625, 120.2734375, 126.583984375, 132.89453125, 139.205078125, 145.515625, 151.826171875, 158.13671875, 164.447265625, 170.7578125, 177.068359375, 183.37890625, 189.689453125, 196.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 7.0, 3.0, 8.0, 10.0, 6.0, 7.0, 12.0, 15.0, 16.0, 15.0, 19.0, 27.0, 26.0, 37.0, 55.0, 47.0, 43.0, 52.0, 49.0, 57.0, 58.0, 48.0, 59.0, 43.0, 44.0, 39.0, 29.0, 32.0, 26.0, 21.0, 21.0, 14.0, 12.0, 12.0, 8.0, 9.0, 2.0, 8.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.140625, -24.371337890625, -23.60205078125, -22.832763671875, -22.0634765625, -21.294189453125, -20.52490234375, -19.755615234375, -18.986328125, -18.217041015625, -17.44775390625, -16.678466796875, -15.9091796875, -15.139892578125, -14.37060546875, -13.601318359375, -12.83203125, -12.062744140625, -11.29345703125, -10.524169921875, -9.7548828125, -8.985595703125, -8.21630859375, -7.447021484375, -6.677734375, -5.908447265625, -5.13916015625, -4.369873046875, -3.6005859375, -2.831298828125, -2.06201171875, -1.292724609375, -0.5234375, 0.245849609375, 1.01513671875, 1.784423828125, 2.5537109375, 3.322998046875, 4.09228515625, 4.861572265625, 5.630859375, 6.400146484375, 7.16943359375, 7.938720703125, 8.7080078125, 9.477294921875, 10.24658203125, 11.015869140625, 11.78515625, 12.554443359375, 13.32373046875, 14.093017578125, 14.8623046875, 15.631591796875, 16.40087890625, 17.170166015625, 17.939453125, 18.708740234375, 19.47802734375, 20.247314453125, 21.0166015625, 21.785888671875, 22.55517578125, 23.324462890625, 24.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 12.0, 22.0, 30.0, 34.0, 48.0, 69.0, 103.0, 154.0, 294.0, 551.0, 1736.0, 4138771.0, 49561.0, 1542.0, 545.0, 271.0, 161.0, 104.0, 76.0, 37.0, 33.0, 28.0, 19.0, 15.0, 7.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-543.0, -522.859375, -502.71875, -482.578125, -462.4375, -442.296875, -422.15625, -402.015625, -381.875, -361.734375, -341.59375, -321.453125, -301.3125, -281.171875, -261.03125, -240.890625, -220.75, -200.609375, -180.46875, -160.328125, -140.1875, -120.046875, -99.90625, -79.765625, -59.625, -39.484375, -19.34375, 0.796875, 20.9375, 41.078125, 61.21875, 81.359375, 101.5, 121.640625, 141.78125, 161.921875, 182.0625, 202.203125, 222.34375, 242.484375, 262.625, 282.765625, 302.90625, 323.046875, 343.1875, 363.328125, 383.46875, 403.609375, 423.75, 443.890625, 464.03125, 484.171875, 504.3125, 524.453125, 544.59375, 564.734375, 584.875, 605.015625, 625.15625, 645.296875, 665.4375, 685.578125, 705.71875, 725.859375, 746.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 3915.0, 140.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.125, -143.701171875, -140.27734375, -136.853515625, -133.4296875, -130.005859375, -126.58203125, -123.158203125, -119.734375, -116.310546875, -112.88671875, -109.462890625, -106.0390625, -102.615234375, -99.19140625, -95.767578125, -92.34375, -88.919921875, -85.49609375, -82.072265625, -78.6484375, -75.224609375, -71.80078125, -68.376953125, -64.953125, -61.529296875, -58.10546875, -54.681640625, -51.2578125, -47.833984375, -44.41015625, -40.986328125, -37.5625, -34.138671875, -30.71484375, -27.291015625, -23.8671875, -20.443359375, -17.01953125, -13.595703125, -10.171875, -6.748046875, -3.32421875, 0.099609375, 3.5234375, 6.947265625, 10.37109375, 13.794921875, 17.21875, 20.642578125, 24.06640625, 27.490234375, 30.9140625, 34.337890625, 37.76171875, 41.185546875, 44.609375, 48.033203125, 51.45703125, 54.880859375, 58.3046875, 61.728515625, 65.15234375, 68.576171875, 72.0]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 6.0, 17.0, 19.0, 32.0, 48.0, 43.0, 86.0, 114.0, 133.0, 130.0, 99.0, 66.0, 48.0, 42.0, 22.0, 22.0, 10.0, 11.0, 8.0, 6.0, 10.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.56886291503906, -217.20550537109375, -211.84214782714844, -206.47879028320312, -201.1154327392578, -195.7520751953125, -190.38870239257812, -185.0253448486328, -179.6619873046875, -174.2986297607422, -168.93527221679688, -163.57191467285156, -158.20855712890625, -152.84518432617188, -147.48184204101562, -142.11846923828125, -136.755126953125, -131.3917694091797, -126.02841186523438, -120.66505432128906, -115.30168914794922, -109.9383316040039, -104.5749740600586, -99.21160888671875, -93.84825134277344, -88.48489379882812, -83.12153625488281, -77.7581787109375, -72.39481353759766, -67.03145599365234, -61.66809844970703, -56.30473709106445, -50.941368103027344, -45.57801055908203, -40.21464920043945, -34.85129165649414, -29.487932205200195, -24.12457275390625, -18.761215209960938, -13.39785385131836, -8.034496307373047, -2.6711373329162598, 2.6922216415405273, 8.055580139160156, 13.418939590454102, 18.782299041748047, 24.14565658569336, 29.509017944335938, 34.87237548828125, 40.23573303222656, 45.59909439086914, 50.96245193481445, 56.32581329345703, 61.689170837402344, 67.05252838134766, 72.4158935546875, 77.77925109863281, 83.14260864257812, 88.50596618652344, 93.86932373046875, 99.2326889038086, 104.5960464477539, 109.95940399169922, 115.32276916503906, 120.68611907958984]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 8.0, 9.0, 13.0, 16.0, 18.0, 23.0, 26.0, 19.0, 41.0, 37.0, 38.0, 31.0, 42.0, 24.0, 45.0, 46.0, 45.0, 31.0, 43.0, 42.0, 41.0, 35.0, 42.0, 42.0, 35.0, 35.0, 21.0, 15.0, 25.0, 19.0, 14.0, 13.0, 6.0, 16.0, 9.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.53889465332031, -94.59437561035156, -91.64986419677734, -88.70535278320312, -85.76083374023438, -82.81631469726562, -79.8718032836914, -76.92729187011719, -73.98277282714844, -71.03825378417969, -68.09374237060547, -65.14923095703125, -62.2047119140625, -59.260196685791016, -56.31568145751953, -53.37116622924805, -50.42665100097656, -47.48213577270508, -44.537620544433594, -41.59310531616211, -38.648590087890625, -35.70407485961914, -32.759559631347656, -29.815044403076172, -26.870529174804688, -23.926013946533203, -20.98149871826172, -18.036983489990234, -15.09246826171875, -12.147953033447266, -9.203437805175781, -6.258922576904297, -3.3144149780273438, -0.3698997497558594, 2.574615478515625, 5.519130706787109, 8.463645935058594, 11.408161163330078, 14.352676391601562, 17.297191619873047, 20.24170684814453, 23.186222076416016, 26.1307373046875, 29.075252532958984, 32.01976776123047, 34.96428298950195, 37.90879821777344, 40.85331344604492, 43.797828674316406, 46.74234390258789, 49.686859130859375, 52.63137435913086, 55.575889587402344, 58.52040481567383, 61.46492004394531, 64.40943908691406, 67.35395050048828, 70.2984619140625, 73.24298095703125, 76.1875, 79.13201141357422, 82.07652282714844, 85.02104187011719, 87.96556091308594, 90.91007232666016]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 8.0, 13.0, 12.0, 29.0, 36.0, 40.0, 83.0, 120.0, 168.0, 260.0, 455.0, 656.0, 1120.0, 1944.0, 3521.0, 7036.0, 14993.0, 36168.0, 104460.0, 436203.0, 308132.0, 78669.0, 28624.0, 12394.0, 5929.0, 3082.0, 1730.0, 1012.0, 581.0, 370.0, 228.0, 148.0, 119.0, 75.0, 41.0, 25.0, 16.0, 12.0, 13.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6875, -67.2744140625, -64.861328125, -62.4482421875, -60.03515625, -57.6220703125, -55.208984375, -52.7958984375, -50.3828125, -47.9697265625, -45.556640625, -43.1435546875, -40.73046875, -38.3173828125, -35.904296875, -33.4912109375, -31.078125, -28.6650390625, -26.251953125, -23.8388671875, -21.42578125, -19.0126953125, -16.599609375, -14.1865234375, -11.7734375, -9.3603515625, -6.947265625, -4.5341796875, -2.12109375, 0.2919921875, 2.705078125, 5.1181640625, 7.53125, 9.9443359375, 12.357421875, 14.7705078125, 17.18359375, 19.5966796875, 22.009765625, 24.4228515625, 26.8359375, 29.2490234375, 31.662109375, 34.0751953125, 36.48828125, 38.9013671875, 41.314453125, 43.7275390625, 46.140625, 48.5537109375, 50.966796875, 53.3798828125, 55.79296875, 58.2060546875, 60.619140625, 63.0322265625, 65.4453125, 67.8583984375, 70.271484375, 72.6845703125, 75.09765625, 77.5107421875, 79.923828125, 82.3369140625, 84.75]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 5.0, 15.0, 13.0, 22.0, 18.0, 28.0, 22.0, 26.0, 32.0, 47.0, 47.0, 39.0, 46.0, 59.0, 49.0, 60.0, 67.0, 54.0, 39.0, 52.0, 24.0, 32.0, 38.0, 21.0, 26.0, 10.0, 21.0, 16.0, 15.0, 5.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68994140625, -28.6923828125, -27.69482421875, -26.697265625, -25.69970703125, -24.7021484375, -23.70458984375, -22.70703125, -21.70947265625, -20.7119140625, -19.71435546875, -18.716796875, -17.71923828125, -16.7216796875, -15.72412109375, -14.7265625, -13.72900390625, -12.7314453125, -11.73388671875, -10.736328125, -9.73876953125, -8.7412109375, -7.74365234375, -6.74609375, -5.74853515625, -4.7509765625, -3.75341796875, -2.755859375, -1.75830078125, -0.7607421875, 0.23681640625, 1.234375, 2.23193359375, 3.2294921875, 4.22705078125, 5.224609375, 6.22216796875, 7.2197265625, 8.21728515625, 9.21484375, 10.21240234375, 11.2099609375, 12.20751953125, 13.205078125, 14.20263671875, 15.2001953125, 16.19775390625, 17.1953125, 18.19287109375, 19.1904296875, 20.18798828125, 21.185546875, 22.18310546875, 23.1806640625, 24.17822265625, 25.17578125, 26.17333984375, 27.1708984375, 28.16845703125, 29.166015625, 30.16357421875, 31.1611328125, 32.15869140625, 33.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 13.0, 12.0, 17.0, 25.0, 29.0, 37.0, 62.0, 89.0, 155.0, 264.0, 549.0, 926.0, 1937.0, 4807.0, 15551.0, 73487.0, 655937.0, 245219.0, 34374.0, 8898.0, 3110.0, 1382.0, 672.0, 351.0, 225.0, 134.0, 89.0, 60.0, 35.0, 24.0, 21.0, 19.0, 11.0, 3.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.875, -112.4443359375, -109.013671875, -105.5830078125, -102.15234375, -98.7216796875, -95.291015625, -91.8603515625, -88.4296875, -84.9990234375, -81.568359375, -78.1376953125, -74.70703125, -71.2763671875, -67.845703125, -64.4150390625, -60.984375, -57.5537109375, -54.123046875, -50.6923828125, -47.26171875, -43.8310546875, -40.400390625, -36.9697265625, -33.5390625, -30.1083984375, -26.677734375, -23.2470703125, -19.81640625, -16.3857421875, -12.955078125, -9.5244140625, -6.09375, -2.6630859375, 0.767578125, 4.1982421875, 7.62890625, 11.0595703125, 14.490234375, 17.9208984375, 21.3515625, 24.7822265625, 28.212890625, 31.6435546875, 35.07421875, 38.5048828125, 41.935546875, 45.3662109375, 48.796875, 52.2275390625, 55.658203125, 59.0888671875, 62.51953125, 65.9501953125, 69.380859375, 72.8115234375, 76.2421875, 79.6728515625, 83.103515625, 86.5341796875, 89.96484375, 93.3955078125, 96.826171875, 100.2568359375, 103.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 7.0, 1.0, 12.0, 15.0, 16.0, 12.0, 20.0, 28.0, 29.0, 35.0, 28.0, 32.0, 37.0, 36.0, 36.0, 45.0, 42.0, 46.0, 43.0, 39.0, 46.0, 41.0, 42.0, 35.0, 32.0, 45.0, 27.0, 25.0, 16.0, 20.0, 18.0, 12.0, 14.0, 14.0, 10.0, 6.0, 6.0, 1.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.5625, -110.857421875, -107.15234375, -103.447265625, -99.7421875, -96.037109375, -92.33203125, -88.626953125, -84.921875, -81.216796875, -77.51171875, -73.806640625, -70.1015625, -66.396484375, -62.69140625, -58.986328125, -55.28125, -51.576171875, -47.87109375, -44.166015625, -40.4609375, -36.755859375, -33.05078125, -29.345703125, -25.640625, -21.935546875, -18.23046875, -14.525390625, -10.8203125, -7.115234375, -3.41015625, 0.294921875, 4.0, 7.705078125, 11.41015625, 15.115234375, 18.8203125, 22.525390625, 26.23046875, 29.935546875, 33.640625, 37.345703125, 41.05078125, 44.755859375, 48.4609375, 52.166015625, 55.87109375, 59.576171875, 63.28125, 66.986328125, 70.69140625, 74.396484375, 78.1015625, 81.806640625, 85.51171875, 89.216796875, 92.921875, 96.626953125, 100.33203125, 104.037109375, 107.7421875, 111.447265625, 115.15234375, 118.857421875, 122.5625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 26.0, 17.0, 29.0, 59.0, 93.0, 225.0, 418.0, 1028.0, 2686.0, 9029.0, 46864.0, 627948.0, 318052.0, 31470.0, 6813.0, 2169.0, 768.0, 346.0, 183.0, 96.0, 62.0, 39.0, 27.0, 21.0, 12.0, 11.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.96875, -61.1640625, -59.359375, -57.5546875, -55.75, -53.9453125, -52.140625, -50.3359375, -48.53125, -46.7265625, -44.921875, -43.1171875, -41.3125, -39.5078125, -37.703125, -35.8984375, -34.09375, -32.2890625, -30.484375, -28.6796875, -26.875, -25.0703125, -23.265625, -21.4609375, -19.65625, -17.8515625, -16.046875, -14.2421875, -12.4375, -10.6328125, -8.828125, -7.0234375, -5.21875, -3.4140625, -1.609375, 0.1953125, 2.0, 3.8046875, 5.609375, 7.4140625, 9.21875, 11.0234375, 12.828125, 14.6328125, 16.4375, 18.2421875, 20.046875, 21.8515625, 23.65625, 25.4609375, 27.265625, 29.0703125, 30.875, 32.6796875, 34.484375, 36.2890625, 38.09375, 39.8984375, 41.703125, 43.5078125, 45.3125, 47.1171875, 48.921875, 50.7265625, 52.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 21.0, 21.0, 52.0, 102.0, 161.0, 224.0, 168.0, 101.0, 43.0, 28.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008453369140625, -0.007940053939819336, -0.007426738739013672, -0.006913423538208008, -0.006400108337402344, -0.00588679313659668, -0.005373477935791016, -0.0048601627349853516, -0.0043468475341796875, -0.0038335323333740234, -0.0033202171325683594, -0.0028069019317626953, -0.0022935867309570312, -0.0017802715301513672, -0.0012669563293457031, -0.0007536411285400391, -0.000240325927734375, 0.00027298927307128906, 0.0007863044738769531, 0.0012996196746826172, 0.0018129348754882812, 0.0023262500762939453, 0.0028395652770996094, 0.0033528804779052734, 0.0038661956787109375, 0.0043795108795166016, 0.004892826080322266, 0.00540614128112793, 0.005919456481933594, 0.006432771682739258, 0.006946086883544922, 0.007459402084350586, 0.00797271728515625, 0.008486032485961914, 0.008999347686767578, 0.009512662887573242, 0.010025978088378906, 0.01053929328918457, 0.011052608489990234, 0.011565923690795898, 0.012079238891601562, 0.012592554092407227, 0.01310586929321289, 0.013619184494018555, 0.014132499694824219, 0.014645814895629883, 0.015159130096435547, 0.01567244529724121, 0.016185760498046875, 0.01669907569885254, 0.017212390899658203, 0.017725706100463867, 0.01823902130126953, 0.018752336502075195, 0.01926565170288086, 0.019778966903686523, 0.020292282104492188, 0.02080559730529785, 0.021318912506103516, 0.02183222770690918, 0.022345542907714844, 0.022858858108520508, 0.023372173309326172, 0.023885488510131836, 0.0243988037109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 11.0, 7.0, 16.0, 23.0, 30.0, 41.0, 57.0, 85.0, 171.0, 277.0, 595.0, 1451.0, 4780.0, 22783.0, 224477.0, 723785.0, 56615.0, 9112.0, 2385.0, 853.0, 413.0, 210.0, 116.0, 65.0, 56.0, 31.0, 34.0, 20.0, 14.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.5625, -72.318359375, -70.07421875, -67.830078125, -65.5859375, -63.341796875, -61.09765625, -58.853515625, -56.609375, -54.365234375, -52.12109375, -49.876953125, -47.6328125, -45.388671875, -43.14453125, -40.900390625, -38.65625, -36.412109375, -34.16796875, -31.923828125, -29.6796875, -27.435546875, -25.19140625, -22.947265625, -20.703125, -18.458984375, -16.21484375, -13.970703125, -11.7265625, -9.482421875, -7.23828125, -4.994140625, -2.75, -0.505859375, 1.73828125, 3.982421875, 6.2265625, 8.470703125, 10.71484375, 12.958984375, 15.203125, 17.447265625, 19.69140625, 21.935546875, 24.1796875, 26.423828125, 28.66796875, 30.912109375, 33.15625, 35.400390625, 37.64453125, 39.888671875, 42.1328125, 44.376953125, 46.62109375, 48.865234375, 51.109375, 53.353515625, 55.59765625, 57.841796875, 60.0859375, 62.330078125, 64.57421875, 66.818359375, 69.0625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 12.0, 28.0, 31.0, 49.0, 58.0, 76.0, 124.0, 175.0, 138.0, 82.0, 69.0, 36.0, 34.0, 21.0, 17.0, 12.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84375, -50.58740234375, -48.3310546875, -46.07470703125, -43.818359375, -41.56201171875, -39.3056640625, -37.04931640625, -34.79296875, -32.53662109375, -30.2802734375, -28.02392578125, -25.767578125, -23.51123046875, -21.2548828125, -18.99853515625, -16.7421875, -14.48583984375, -12.2294921875, -9.97314453125, -7.716796875, -5.46044921875, -3.2041015625, -0.94775390625, 1.30859375, 3.56494140625, 5.8212890625, 8.07763671875, 10.333984375, 12.59033203125, 14.8466796875, 17.10302734375, 19.359375, 21.61572265625, 23.8720703125, 26.12841796875, 28.384765625, 30.64111328125, 32.8974609375, 35.15380859375, 37.41015625, 39.66650390625, 41.9228515625, 44.17919921875, 46.435546875, 48.69189453125, 50.9482421875, 53.20458984375, 55.4609375, 57.71728515625, 59.9736328125, 62.22998046875, 64.486328125, 66.74267578125, 68.9990234375, 71.25537109375, 73.51171875, 75.76806640625, 78.0244140625, 80.28076171875, 82.537109375, 84.79345703125, 87.0498046875, 89.30615234375, 91.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 17.0, 18.0, 64.0, 118.0, 210.0, 243.0, 153.0, 82.0, 43.0, 20.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-997.660888671875, -950.6033935546875, -903.5459594726562, -856.488525390625, -809.4310302734375, -762.37353515625, -715.3161010742188, -668.2586669921875, -621.201171875, -574.1436767578125, -527.0862426757812, -480.0287780761719, -432.9713134765625, -385.9138488769531, -338.85638427734375, -291.7989196777344, -244.741455078125, -197.68399047851562, -150.62652587890625, -103.56906127929688, -56.5115966796875, -9.454132080078125, 37.60333251953125, 84.66079711914062, 131.71826171875, 178.77572631835938, 225.83319091796875, 272.8906555175781, 319.9481201171875, 367.0055847167969, 414.06304931640625, 461.1205139160156, 508.177978515625, 555.2354736328125, 602.2929077148438, 649.350341796875, 696.4078369140625, 743.46533203125, 790.5227661132812, 837.5802001953125, 884.6376953125, 931.6951904296875, 978.7526245117188, 1025.81005859375, 1072.8675537109375, 1119.925048828125, 1166.982421875, 1214.0399169921875, 1261.097412109375, 1308.1549072265625, 1355.21240234375, 1402.269775390625, 1449.3272705078125, 1496.384765625, 1543.442138671875, 1590.4996337890625, 1637.55712890625, 1684.6146240234375, 1731.672119140625, 1778.7294921875, 1825.7869873046875, 1872.844482421875, 1919.90185546875, 1966.9593505859375, 2014.016845703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 11.0, 17.0, 16.0, 16.0, 22.0, 29.0, 46.0, 38.0, 35.0, 51.0, 54.0, 55.0, 74.0, 53.0, 57.0, 51.0, 51.0, 51.0, 35.0, 41.0, 30.0, 28.0, 19.0, 14.0, 17.0, 14.0, 15.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-650.7698364257812, -627.1006469726562, -603.4314575195312, -579.76220703125, -556.093017578125, -532.423828125, -508.754638671875, -485.08544921875, -461.416259765625, -437.7470703125, -414.0778503417969, -390.4086608886719, -366.7394714355469, -343.07025146484375, -319.40106201171875, -295.73187255859375, -272.0626525878906, -248.39344787597656, -224.72425842285156, -201.0550537109375, -177.3858642578125, -153.71665954589844, -130.04745483398438, -106.37826538085938, -82.70906066894531, -59.03986358642578, -35.370662689208984, -11.701461791992188, 11.967735290527344, 35.636932373046875, 59.30613708496094, 82.97532653808594, 106.64453125, 130.31373596191406, 153.98292541503906, 177.65213012695312, 201.32131958007812, 224.9905242919922, 248.65972900390625, 272.32891845703125, 295.99810791015625, 319.66729736328125, 343.3365173339844, 367.0057067871094, 390.6748962402344, 414.3441162109375, 438.0133056640625, 461.6824951171875, 485.3517150878906, 509.0209045410156, 532.6901245117188, 556.3593139648438, 580.0285034179688, 603.6976928710938, 627.366943359375, 651.0361328125, 674.705322265625, 698.37451171875, 722.043701171875, 745.712890625, 769.3821411132812, 793.0513305664062, 816.7205200195312, 840.3897094726562, 864.0588989257812]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 7.0, 1.0, 9.0, 9.0, 18.0, 14.0, 21.0, 30.0, 48.0, 62.0, 99.0, 123.0, 166.0, 310.0, 427.0, 631.0, 984.0, 1486.0, 2689.0, 5530.0, 23555.0, 4129707.0, 17038.0, 4707.0, 2421.0, 1419.0, 900.0, 601.0, 392.0, 276.0, 176.0, 131.0, 93.0, 50.0, 47.0, 37.0, 22.0, 18.0, 12.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -151.71875, -146.5625, -141.40625, -136.25, -131.09375, -125.9375, -120.78125, -115.625, -110.46875, -105.3125, -100.15625, -95.0, -89.84375, -84.6875, -79.53125, -74.375, -69.21875, -64.0625, -58.90625, -53.75, -48.59375, -43.4375, -38.28125, -33.125, -27.96875, -22.8125, -17.65625, -12.5, -7.34375, -2.1875, 2.96875, 8.125, 13.28125, 18.4375, 23.59375, 28.75, 33.90625, 39.0625, 44.21875, 49.375, 54.53125, 59.6875, 64.84375, 70.0, 75.15625, 80.3125, 85.46875, 90.625, 95.78125, 100.9375, 106.09375, 111.25, 116.40625, 121.5625, 126.71875, 131.875, 137.03125, 142.1875, 147.34375, 152.5, 157.65625, 162.8125, 167.96875, 173.125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 28.0, 28.0, 23.0, 38.0, 56.0, 65.0, 60.0, 73.0, 69.0, 82.0, 84.0, 63.0, 65.0, 59.0, 33.0, 38.0, 21.0, 13.0, 12.0, 16.0, 14.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.84375, -49.47705078125, -48.1103515625, -46.74365234375, -45.376953125, -44.01025390625, -42.6435546875, -41.27685546875, -39.91015625, -38.54345703125, -37.1767578125, -35.81005859375, -34.443359375, -33.07666015625, -31.7099609375, -30.34326171875, -28.9765625, -27.60986328125, -26.2431640625, -24.87646484375, -23.509765625, -22.14306640625, -20.7763671875, -19.40966796875, -18.04296875, -16.67626953125, -15.3095703125, -13.94287109375, -12.576171875, -11.20947265625, -9.8427734375, -8.47607421875, -7.109375, -5.74267578125, -4.3759765625, -3.00927734375, -1.642578125, -0.27587890625, 1.0908203125, 2.45751953125, 3.82421875, 5.19091796875, 6.5576171875, 7.92431640625, 9.291015625, 10.65771484375, 12.0244140625, 13.39111328125, 14.7578125, 16.12451171875, 17.4912109375, 18.85791015625, 20.224609375, 21.59130859375, 22.9580078125, 24.32470703125, 25.69140625, 27.05810546875, 28.4248046875, 29.79150390625, 31.158203125, 32.52490234375, 33.8916015625, 35.25830078125, 36.625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 19.0, 13.0, 25.0, 39.0, 49.0, 62.0, 136.0, 160.0, 237.0, 348.0, 527.0, 973.0, 1594.0, 3073.0, 7426.0, 42505.0, 4103301.0, 21736.0, 5681.0, 2643.0, 1387.0, 791.0, 500.0, 303.0, 239.0, 153.0, 105.0, 84.0, 48.0, 29.0, 32.0, 21.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-204.75, -198.79296875, -192.8359375, -186.87890625, -180.921875, -174.96484375, -169.0078125, -163.05078125, -157.09375, -151.13671875, -145.1796875, -139.22265625, -133.265625, -127.30859375, -121.3515625, -115.39453125, -109.4375, -103.48046875, -97.5234375, -91.56640625, -85.609375, -79.65234375, -73.6953125, -67.73828125, -61.78125, -55.82421875, -49.8671875, -43.91015625, -37.953125, -31.99609375, -26.0390625, -20.08203125, -14.125, -8.16796875, -2.2109375, 3.74609375, 9.703125, 15.66015625, 21.6171875, 27.57421875, 33.53125, 39.48828125, 45.4453125, 51.40234375, 57.359375, 63.31640625, 69.2734375, 75.23046875, 81.1875, 87.14453125, 93.1015625, 99.05859375, 105.015625, 110.97265625, 116.9296875, 122.88671875, 128.84375, 134.80078125, 140.7578125, 146.71484375, 152.671875, 158.62890625, 164.5859375, 170.54296875, 176.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 8.0, 9.0, 17.0, 16.0, 45.0, 167.0, 3643.0, 101.0, 24.0, 15.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9375, -59.7529296875, -57.568359375, -55.3837890625, -53.19921875, -51.0146484375, -48.830078125, -46.6455078125, -44.4609375, -42.2763671875, -40.091796875, -37.9072265625, -35.72265625, -33.5380859375, -31.353515625, -29.1689453125, -26.984375, -24.7998046875, -22.615234375, -20.4306640625, -18.24609375, -16.0615234375, -13.876953125, -11.6923828125, -9.5078125, -7.3232421875, -5.138671875, -2.9541015625, -0.76953125, 1.4150390625, 3.599609375, 5.7841796875, 7.96875, 10.1533203125, 12.337890625, 14.5224609375, 16.70703125, 18.8916015625, 21.076171875, 23.2607421875, 25.4453125, 27.6298828125, 29.814453125, 31.9990234375, 34.18359375, 36.3681640625, 38.552734375, 40.7373046875, 42.921875, 45.1064453125, 47.291015625, 49.4755859375, 51.66015625, 53.8447265625, 56.029296875, 58.2138671875, 60.3984375, 62.5830078125, 64.767578125, 66.9521484375, 69.13671875, 71.3212890625, 73.505859375, 75.6904296875, 77.875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 20.0, 39.0, 63.0, 92.0, 139.0, 163.0, 148.0, 98.0, 77.0, 39.0, 22.0, 17.0, 11.0, 9.0, 4.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.9148712158203, -219.68553161621094, -211.45620727539062, -203.22686767578125, -194.99752807617188, -186.7681884765625, -178.5388641357422, -170.3095245361328, -162.0802001953125, -153.85086059570312, -145.6215362548828, -137.39219665527344, -129.16285705566406, -120.93352508544922, -112.70419311523438, -104.474853515625, -96.24551391601562, -88.01618194580078, -79.7868423461914, -71.55751037597656, -63.32817459106445, -55.098838806152344, -46.8695068359375, -38.64017105102539, -30.41083526611328, -22.181499481201172, -13.952165603637695, -5.722831726074219, 2.5065040588378906, 10.73583984375, 18.965171813964844, 27.194507598876953, 35.423858642578125, 43.653194427490234, 51.882530212402344, 60.11186218261719, 68.34120178222656, 76.5705337524414, 84.79986572265625, 93.02920532226562, 101.25853729248047, 109.48786926269531, 117.71720886230469, 125.94654083251953, 134.17587280273438, 142.40521240234375, 150.63455200195312, 158.86387634277344, 167.0932159423828, 175.3225555419922, 183.5518798828125, 191.78121948242188, 200.01055908203125, 208.23989868164062, 216.46922302246094, 224.6985626220703, 232.92788696289062, 241.1572265625, 249.3865509033203, 257.61590576171875, 265.84521484375, 274.0745544433594, 282.30389404296875, 290.5332336425781, 298.7625732421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 9.0, 8.0, 7.0, 7.0, 14.0, 10.0, 15.0, 15.0, 23.0, 27.0, 29.0, 23.0, 35.0, 28.0, 44.0, 40.0, 42.0, 35.0, 41.0, 50.0, 45.0, 42.0, 34.0, 43.0, 32.0, 38.0, 20.0, 26.0, 39.0, 23.0, 27.0, 24.0, 15.0, 12.0, 12.0, 9.0, 17.0, 8.0, 6.0, 7.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-113.14628601074219, -109.76753997802734, -106.3887939453125, -103.01004791259766, -99.63130187988281, -96.25255584716797, -92.87380981445312, -89.49507141113281, -86.11631774902344, -82.7375717163086, -79.35882568359375, -75.9800796508789, -72.60133361816406, -69.22258758544922, -65.84384155273438, -62.4650993347168, -59.08635711669922, -55.707611083984375, -52.32886505126953, -48.95011901855469, -45.571372985839844, -42.192626953125, -38.81388473510742, -35.43513870239258, -32.056392669677734, -28.67764663696289, -25.298900604248047, -21.920156478881836, -18.541410446166992, -15.162664413452148, -11.783920288085938, -8.405174255371094, -5.02642822265625, -1.6476826667785645, 1.731062889099121, 5.109807968139648, 8.488554000854492, 11.867300033569336, 15.246044158935547, 18.62479019165039, 22.003536224365234, 25.382282257080078, 28.761028289794922, 32.1397705078125, 35.518516540527344, 38.89726257324219, 42.27600860595703, 45.654754638671875, 49.03350067138672, 52.41224670410156, 55.790992736816406, 59.16973876953125, 62.548484802246094, 65.92723083496094, 69.30596923828125, 72.68472290039062, 76.06346130371094, 79.44220733642578, 82.82095336914062, 86.19969940185547, 89.57844543457031, 92.95719146728516, 96.3359375, 99.71467590332031, 103.09342956542969]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 4.0, 1.0, 8.0, 8.0, 10.0, 7.0, 21.0, 26.0, 46.0, 68.0, 114.0, 132.0, 246.0, 402.0, 577.0, 1010.0, 1768.0, 3204.0, 6171.0, 13491.0, 31657.0, 85384.0, 290007.0, 418524.0, 119461.0, 42063.0, 17301.0, 7821.0, 3927.0, 2047.0, 1157.0, 688.0, 405.0, 266.0, 191.0, 102.0, 67.0, 51.0, 33.0, 29.0, 21.0, 9.0, 12.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0, -84.20703125, -81.4140625, -78.62109375, -75.828125, -73.03515625, -70.2421875, -67.44921875, -64.65625, -61.86328125, -59.0703125, -56.27734375, -53.484375, -50.69140625, -47.8984375, -45.10546875, -42.3125, -39.51953125, -36.7265625, -33.93359375, -31.140625, -28.34765625, -25.5546875, -22.76171875, -19.96875, -17.17578125, -14.3828125, -11.58984375, -8.796875, -6.00390625, -3.2109375, -0.41796875, 2.375, 5.16796875, 7.9609375, 10.75390625, 13.546875, 16.33984375, 19.1328125, 21.92578125, 24.71875, 27.51171875, 30.3046875, 33.09765625, 35.890625, 38.68359375, 41.4765625, 44.26953125, 47.0625, 49.85546875, 52.6484375, 55.44140625, 58.234375, 61.02734375, 63.8203125, 66.61328125, 69.40625, 72.19921875, 74.9921875, 77.78515625, 80.578125, 83.37109375, 86.1640625, 88.95703125, 91.75]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 11.0, 19.0, 17.0, 21.0, 27.0, 38.0, 28.0, 46.0, 68.0, 70.0, 77.0, 70.0, 69.0, 67.0, 73.0, 64.0, 37.0, 42.0, 25.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.96875, -43.560546875, -42.15234375, -40.744140625, -39.3359375, -37.927734375, -36.51953125, -35.111328125, -33.703125, -32.294921875, -30.88671875, -29.478515625, -28.0703125, -26.662109375, -25.25390625, -23.845703125, -22.4375, -21.029296875, -19.62109375, -18.212890625, -16.8046875, -15.396484375, -13.98828125, -12.580078125, -11.171875, -9.763671875, -8.35546875, -6.947265625, -5.5390625, -4.130859375, -2.72265625, -1.314453125, 0.09375, 1.501953125, 2.91015625, 4.318359375, 5.7265625, 7.134765625, 8.54296875, 9.951171875, 11.359375, 12.767578125, 14.17578125, 15.583984375, 16.9921875, 18.400390625, 19.80859375, 21.216796875, 22.625, 24.033203125, 25.44140625, 26.849609375, 28.2578125, 29.666015625, 31.07421875, 32.482421875, 33.890625, 35.298828125, 36.70703125, 38.115234375, 39.5234375, 40.931640625, 42.33984375, 43.748046875, 45.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 13.0, 10.0, 20.0, 18.0, 37.0, 45.0, 58.0, 104.0, 107.0, 167.0, 274.0, 381.0, 663.0, 1053.0, 1913.0, 3780.0, 8094.0, 21816.0, 72238.0, 386025.0, 432949.0, 78114.0, 23096.0, 8738.0, 3879.0, 1925.0, 1072.0, 600.0, 428.0, 285.0, 195.0, 115.0, 98.0, 60.0, 41.0, 30.0, 26.0, 18.0, 17.0, 5.0, 6.0, 7.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0], "bins": [-102.6875, -99.755859375, -96.82421875, -93.892578125, -90.9609375, -88.029296875, -85.09765625, -82.166015625, -79.234375, -76.302734375, -73.37109375, -70.439453125, -67.5078125, -64.576171875, -61.64453125, -58.712890625, -55.78125, -52.849609375, -49.91796875, -46.986328125, -44.0546875, -41.123046875, -38.19140625, -35.259765625, -32.328125, -29.396484375, -26.46484375, -23.533203125, -20.6015625, -17.669921875, -14.73828125, -11.806640625, -8.875, -5.943359375, -3.01171875, -0.080078125, 2.8515625, 5.783203125, 8.71484375, 11.646484375, 14.578125, 17.509765625, 20.44140625, 23.373046875, 26.3046875, 29.236328125, 32.16796875, 35.099609375, 38.03125, 40.962890625, 43.89453125, 46.826171875, 49.7578125, 52.689453125, 55.62109375, 58.552734375, 61.484375, 64.416015625, 67.34765625, 70.279296875, 73.2109375, 76.142578125, 79.07421875, 82.005859375, 84.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 8.0, 12.0, 15.0, 17.0, 19.0, 22.0, 37.0, 41.0, 47.0, 38.0, 53.0, 50.0, 52.0, 57.0, 77.0, 66.0, 47.0, 46.0, 41.0, 50.0, 39.0, 27.0, 32.0, 23.0, 20.0, 15.0, 10.0, 8.0, 7.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.125, -187.783203125, -182.44140625, -177.099609375, -171.7578125, -166.416015625, -161.07421875, -155.732421875, -150.390625, -145.048828125, -139.70703125, -134.365234375, -129.0234375, -123.681640625, -118.33984375, -112.998046875, -107.65625, -102.314453125, -96.97265625, -91.630859375, -86.2890625, -80.947265625, -75.60546875, -70.263671875, -64.921875, -59.580078125, -54.23828125, -48.896484375, -43.5546875, -38.212890625, -32.87109375, -27.529296875, -22.1875, -16.845703125, -11.50390625, -6.162109375, -0.8203125, 4.521484375, 9.86328125, 15.205078125, 20.546875, 25.888671875, 31.23046875, 36.572265625, 41.9140625, 47.255859375, 52.59765625, 57.939453125, 63.28125, 68.623046875, 73.96484375, 79.306640625, 84.6484375, 89.990234375, 95.33203125, 100.673828125, 106.015625, 111.357421875, 116.69921875, 122.041015625, 127.3828125, 132.724609375, 138.06640625, 143.408203125, 148.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 4.0, 7.0, 12.0, 19.0, 31.0, 49.0, 72.0, 157.0, 356.0, 1101.0, 4598.0, 47778.0, 954694.0, 34049.0, 3931.0, 984.0, 352.0, 158.0, 68.0, 38.0, 30.0, 18.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.65625, -97.8125, -93.96875, -90.125, -86.28125, -82.4375, -78.59375, -74.75, -70.90625, -67.0625, -63.21875, -59.375, -55.53125, -51.6875, -47.84375, -44.0, -40.15625, -36.3125, -32.46875, -28.625, -24.78125, -20.9375, -17.09375, -13.25, -9.40625, -5.5625, -1.71875, 2.125, 5.96875, 9.8125, 13.65625, 17.5, 21.34375, 25.1875, 29.03125, 32.875, 36.71875, 40.5625, 44.40625, 48.25, 52.09375, 55.9375, 59.78125, 63.625, 67.46875, 71.3125, 75.15625, 79.0, 82.84375, 86.6875, 90.53125, 94.375, 98.21875, 102.0625, 105.90625, 109.75, 113.59375, 117.4375, 121.28125, 125.125, 128.96875, 132.8125, 136.65625, 140.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 25.0, 22.0, 23.0, 39.0, 53.0, 84.0, 144.0, 212.0, 159.0, 80.0, 46.0, 20.0, 19.0, 15.0, 12.0, 5.0, 9.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0136566162109375, -0.013141870498657227, -0.012627124786376953, -0.01211237907409668, -0.011597633361816406, -0.011082887649536133, -0.01056814193725586, -0.010053396224975586, -0.009538650512695312, -0.009023904800415039, -0.008509159088134766, -0.007994413375854492, -0.007479667663574219, -0.006964921951293945, -0.006450176239013672, -0.0059354305267333984, -0.005420684814453125, -0.0049059391021728516, -0.004391193389892578, -0.0038764476776123047, -0.0033617019653320312, -0.002846956253051758, -0.0023322105407714844, -0.001817464828491211, -0.0013027191162109375, -0.0007879734039306641, -0.0002732276916503906, 0.0002415180206298828, 0.0007562637329101562, 0.0012710094451904297, 0.0017857551574707031, 0.0023005008697509766, 0.00281524658203125, 0.0033299922943115234, 0.003844738006591797, 0.00435948371887207, 0.004874229431152344, 0.005388975143432617, 0.005903720855712891, 0.006418466567993164, 0.0069332122802734375, 0.007447957992553711, 0.007962703704833984, 0.008477449417114258, 0.008992195129394531, 0.009506940841674805, 0.010021686553955078, 0.010536432266235352, 0.011051177978515625, 0.011565923690795898, 0.012080669403076172, 0.012595415115356445, 0.013110160827636719, 0.013624906539916992, 0.014139652252197266, 0.014654397964477539, 0.015169143676757812, 0.015683889389038086, 0.01619863510131836, 0.016713380813598633, 0.017228126525878906, 0.01774287223815918, 0.018257617950439453, 0.018772363662719727, 0.019287109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 8.0, 5.0, 4.0, 5.0, 17.0, 23.0, 25.0, 42.0, 60.0, 93.0, 161.0, 293.0, 466.0, 1076.0, 2846.0, 12254.0, 205873.0, 795902.0, 22184.0, 4280.0, 1433.0, 650.0, 323.0, 179.0, 103.0, 83.0, 43.0, 28.0, 25.0, 22.0, 14.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-104.0625, -100.611328125, -97.16015625, -93.708984375, -90.2578125, -86.806640625, -83.35546875, -79.904296875, -76.453125, -73.001953125, -69.55078125, -66.099609375, -62.6484375, -59.197265625, -55.74609375, -52.294921875, -48.84375, -45.392578125, -41.94140625, -38.490234375, -35.0390625, -31.587890625, -28.13671875, -24.685546875, -21.234375, -17.783203125, -14.33203125, -10.880859375, -7.4296875, -3.978515625, -0.52734375, 2.923828125, 6.375, 9.826171875, 13.27734375, 16.728515625, 20.1796875, 23.630859375, 27.08203125, 30.533203125, 33.984375, 37.435546875, 40.88671875, 44.337890625, 47.7890625, 51.240234375, 54.69140625, 58.142578125, 61.59375, 65.044921875, 68.49609375, 71.947265625, 75.3984375, 78.849609375, 82.30078125, 85.751953125, 89.203125, 92.654296875, 96.10546875, 99.556640625, 103.0078125, 106.458984375, 109.91015625, 113.361328125, 116.8125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 11.0, 11.0, 17.0, 24.0, 50.0, 90.0, 220.0, 257.0, 151.0, 67.0, 34.0, 19.0, 20.0, 13.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.375, -86.943359375, -83.51171875, -80.080078125, -76.6484375, -73.216796875, -69.78515625, -66.353515625, -62.921875, -59.490234375, -56.05859375, -52.626953125, -49.1953125, -45.763671875, -42.33203125, -38.900390625, -35.46875, -32.037109375, -28.60546875, -25.173828125, -21.7421875, -18.310546875, -14.87890625, -11.447265625, -8.015625, -4.583984375, -1.15234375, 2.279296875, 5.7109375, 9.142578125, 12.57421875, 16.005859375, 19.4375, 22.869140625, 26.30078125, 29.732421875, 33.1640625, 36.595703125, 40.02734375, 43.458984375, 46.890625, 50.322265625, 53.75390625, 57.185546875, 60.6171875, 64.048828125, 67.48046875, 70.912109375, 74.34375, 77.775390625, 81.20703125, 84.638671875, 88.0703125, 91.501953125, 94.93359375, 98.365234375, 101.796875, 105.228515625, 108.66015625, 112.091796875, 115.5234375, 118.955078125, 122.38671875, 125.818359375, 129.25]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 30.0, 157.0, 447.0, 263.0, 67.0, 22.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1050.192626953125, -941.7163696289062, -833.2401123046875, -724.7638549804688, -616.28759765625, -507.81134033203125, -399.3350830078125, -290.85882568359375, -182.382568359375, -73.90631103515625, 34.5699462890625, 143.04620361328125, 251.5224609375, 359.99871826171875, 468.4749755859375, 576.9512329101562, 685.427490234375, 793.9037475585938, 902.3800048828125, 1010.8562622070312, 1119.33251953125, 1227.808837890625, 1336.2850341796875, 1444.76123046875, 1553.237548828125, 1661.7138671875, 1770.1900634765625, 1878.666259765625, 1987.142578125, 2095.618896484375, 2204.09521484375, 2312.5712890625, 2421.04736328125, 2529.523681640625, 2638.0, 2746.47607421875, 2854.952392578125, 2963.4287109375, 3071.90478515625, 3180.381103515625, 3288.857421875, 3397.333740234375, 3505.81005859375, 3614.2861328125, 3722.762451171875, 3831.23876953125, 3939.71484375, 4048.191162109375, 4156.66748046875, 4265.1435546875, 4373.6201171875, 4482.09619140625, 4590.572265625, 4699.048828125, 4807.52490234375, 4916.00146484375, 5024.4775390625, 5132.95361328125, 5241.43017578125, 5349.90625, 5458.3828125, 5566.85888671875, 5675.3349609375, 5783.8115234375, 5892.28759765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 3.0, 8.0, 8.0, 14.0, 9.0, 11.0, 13.0, 22.0, 26.0, 24.0, 36.0, 27.0, 32.0, 37.0, 39.0, 40.0, 54.0, 43.0, 53.0, 55.0, 37.0, 55.0, 40.0, 46.0, 37.0, 42.0, 30.0, 30.0, 17.0, 26.0, 17.0, 16.0, 10.0, 12.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-621.1695556640625, -600.2647705078125, -579.3599853515625, -558.4552001953125, -537.5504150390625, -516.6456298828125, -495.7408447265625, -474.8360595703125, -453.9312744140625, -433.0264892578125, -412.1217041015625, -391.2169189453125, -370.3121337890625, -349.4073486328125, -328.5025634765625, -307.5977783203125, -286.6929626464844, -265.7881774902344, -244.88339233398438, -223.97860717773438, -203.07382202148438, -182.16903686523438, -161.2642364501953, -140.3594512939453, -119.45466613769531, -98.54988098144531, -77.64509582519531, -56.74030303955078, -35.83551788330078, -14.930732727050781, 5.97406005859375, 26.87884521484375, 47.78363037109375, 68.68841552734375, 89.59320068359375, 110.49799346923828, 131.40277099609375, 152.30755615234375, 173.2123565673828, 194.1171417236328, 215.0219268798828, 235.9267120361328, 256.8315124511719, 277.7362976074219, 298.6410827636719, 319.5458679199219, 340.4506530761719, 361.3554382324219, 382.2602233886719, 403.1650085449219, 424.0697937011719, 444.9745788574219, 465.8793640136719, 486.7841491699219, 507.68896484375, 528.59375, 549.49853515625, 570.4033203125, 591.30810546875, 612.212890625, 633.11767578125, 654.0224609375, 674.92724609375, 695.83203125, 716.73681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 15.0, 13.0, 20.0, 27.0, 46.0, 64.0, 72.0, 125.0, 127.0, 188.0, 252.0, 357.0, 524.0, 766.0, 1063.0, 1690.0, 2684.0, 4578.0, 8676.0, 19378.0, 65604.0, 903120.0, 2988755.0, 141421.0, 28522.0, 11413.0, 5606.0, 3251.0, 1884.0, 1180.0, 837.0, 533.0, 412.0, 267.0, 195.0, 158.0, 105.0, 96.0, 60.0, 57.0, 45.0, 25.0, 15.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.9375, -68.5068359375, -66.076171875, -63.6455078125, -61.21484375, -58.7841796875, -56.353515625, -53.9228515625, -51.4921875, -49.0615234375, -46.630859375, -44.2001953125, -41.76953125, -39.3388671875, -36.908203125, -34.4775390625, -32.046875, -29.6162109375, -27.185546875, -24.7548828125, -22.32421875, -19.8935546875, -17.462890625, -15.0322265625, -12.6015625, -10.1708984375, -7.740234375, -5.3095703125, -2.87890625, -0.4482421875, 1.982421875, 4.4130859375, 6.84375, 9.2744140625, 11.705078125, 14.1357421875, 16.56640625, 18.9970703125, 21.427734375, 23.8583984375, 26.2890625, 28.7197265625, 31.150390625, 33.5810546875, 36.01171875, 38.4423828125, 40.873046875, 43.3037109375, 45.734375, 48.1650390625, 50.595703125, 53.0263671875, 55.45703125, 57.8876953125, 60.318359375, 62.7490234375, 65.1796875, 67.6103515625, 70.041015625, 72.4716796875, 74.90234375, 77.3330078125, 79.763671875, 82.1943359375, 84.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 7.0, 14.0, 28.0, 17.0, 25.0, 40.0, 39.0, 45.0, 61.0, 68.0, 77.0, 75.0, 76.0, 78.0, 68.0, 63.0, 44.0, 36.0, 32.0, 25.0, 12.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -33.60693359375, -32.1826171875, -30.75830078125, -29.333984375, -27.90966796875, -26.4853515625, -25.06103515625, -23.63671875, -22.21240234375, -20.7880859375, -19.36376953125, -17.939453125, -16.51513671875, -15.0908203125, -13.66650390625, -12.2421875, -10.81787109375, -9.3935546875, -7.96923828125, -6.544921875, -5.12060546875, -3.6962890625, -2.27197265625, -0.84765625, 0.57666015625, 2.0009765625, 3.42529296875, 4.849609375, 6.27392578125, 7.6982421875, 9.12255859375, 10.546875, 11.97119140625, 13.3955078125, 14.81982421875, 16.244140625, 17.66845703125, 19.0927734375, 20.51708984375, 21.94140625, 23.36572265625, 24.7900390625, 26.21435546875, 27.638671875, 29.06298828125, 30.4873046875, 31.91162109375, 33.3359375, 34.76025390625, 36.1845703125, 37.60888671875, 39.033203125, 40.45751953125, 41.8818359375, 43.30615234375, 44.73046875, 46.15478515625, 47.5791015625, 49.00341796875, 50.427734375, 51.85205078125, 53.2763671875, 54.70068359375, 56.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 11.0, 6.0, 8.0, 13.0, 20.0, 16.0, 41.0, 73.0, 88.0, 162.0, 246.0, 428.0, 781.0, 1588.0, 3545.0, 8788.0, 25957.0, 110839.0, 3336524.0, 621263.0, 56466.0, 16364.0, 5971.0, 2408.0, 1174.0, 613.0, 348.0, 210.0, 111.0, 79.0, 38.0, 37.0, 16.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.875, -98.337890625, -94.80078125, -91.263671875, -87.7265625, -84.189453125, -80.65234375, -77.115234375, -73.578125, -70.041015625, -66.50390625, -62.966796875, -59.4296875, -55.892578125, -52.35546875, -48.818359375, -45.28125, -41.744140625, -38.20703125, -34.669921875, -31.1328125, -27.595703125, -24.05859375, -20.521484375, -16.984375, -13.447265625, -9.91015625, -6.373046875, -2.8359375, 0.701171875, 4.23828125, 7.775390625, 11.3125, 14.849609375, 18.38671875, 21.923828125, 25.4609375, 28.998046875, 32.53515625, 36.072265625, 39.609375, 43.146484375, 46.68359375, 50.220703125, 53.7578125, 57.294921875, 60.83203125, 64.369140625, 67.90625, 71.443359375, 74.98046875, 78.517578125, 82.0546875, 85.591796875, 89.12890625, 92.666015625, 96.203125, 99.740234375, 103.27734375, 106.814453125, 110.3515625, 113.888671875, 117.42578125, 120.962890625, 124.5]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 11.0, 24.0, 24.0, 36.0, 37.0, 63.0, 102.0, 205.0, 526.0, 1404.0, 898.0, 321.0, 132.0, 76.0, 41.0, 30.0, 17.0, 23.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -136.6904296875, -132.755859375, -128.8212890625, -124.88671875, -120.9521484375, -117.017578125, -113.0830078125, -109.1484375, -105.2138671875, -101.279296875, -97.3447265625, -93.41015625, -89.4755859375, -85.541015625, -81.6064453125, -77.671875, -73.7373046875, -69.802734375, -65.8681640625, -61.93359375, -57.9990234375, -54.064453125, -50.1298828125, -46.1953125, -42.2607421875, -38.326171875, -34.3916015625, -30.45703125, -26.5224609375, -22.587890625, -18.6533203125, -14.71875, -10.7841796875, -6.849609375, -2.9150390625, 1.01953125, 4.9541015625, 8.888671875, 12.8232421875, 16.7578125, 20.6923828125, 24.626953125, 28.5615234375, 32.49609375, 36.4306640625, 40.365234375, 44.2998046875, 48.234375, 52.1689453125, 56.103515625, 60.0380859375, 63.97265625, 67.9072265625, 71.841796875, 75.7763671875, 79.7109375, 83.6455078125, 87.580078125, 91.5146484375, 95.44921875, 99.3837890625, 103.318359375, 107.2529296875, 111.1875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 20.0, 25.0, 51.0, 106.0, 196.0, 292.0, 181.0, 62.0, 26.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1828.8466796875, -1782.648193359375, -1736.44970703125, -1690.251220703125, -1644.052734375, -1597.854248046875, -1551.65576171875, -1505.457275390625, -1459.2587890625, -1413.060302734375, -1366.86181640625, -1320.663330078125, -1274.46484375, -1228.266357421875, -1182.06787109375, -1135.869384765625, -1089.6710205078125, -1043.4725341796875, -997.2740478515625, -951.0755615234375, -904.8770751953125, -858.6785888671875, -812.4801635742188, -766.2816772460938, -720.0831909179688, -673.8847045898438, -627.6862182617188, -581.48779296875, -535.289306640625, -489.0907897949219, -442.892333984375, -396.69384765625, -350.495361328125, -304.296875, -258.098388671875, -211.89993286132812, -165.70144653320312, -119.50296020507812, -73.30450439453125, -27.10601806640625, 19.09246826171875, 65.29094696044922, 111.48942565917969, 157.68789672851562, 203.88638305664062, 250.08486938476562, 296.2833251953125, 342.4818115234375, 388.6802978515625, 434.8787841796875, 481.0772705078125, 527.2757568359375, 573.4742431640625, 619.6727294921875, 665.8711547851562, 712.0696411132812, 758.2681274414062, 804.4666137695312, 850.6651000976562, 896.863525390625, 943.06201171875, 989.260498046875, 1035.458984375, 1081.657470703125, 1127.85595703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 17.0, 23.0, 20.0, 16.0, 19.0, 25.0, 28.0, 32.0, 31.0, 31.0, 40.0, 42.0, 42.0, 39.0, 37.0, 46.0, 50.0, 33.0, 42.0, 44.0, 44.0, 43.0, 25.0, 29.0, 35.0, 22.0, 23.0, 10.0, 13.0, 9.0, 13.0, 8.0, 11.0, 10.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-447.6067810058594, -433.94354248046875, -420.28033447265625, -406.61712646484375, -392.9538879394531, -379.2906494140625, -365.62744140625, -351.9642333984375, -338.3009948730469, -324.63775634765625, -310.97454833984375, -297.31134033203125, -283.6481018066406, -269.98486328125, -256.3216552734375, -242.65843200683594, -228.99520874023438, -215.3319854736328, -201.66876220703125, -188.0055389404297, -174.34231567382812, -160.67909240722656, -147.015869140625, -133.35264587402344, -119.68942260742188, -106.02619934082031, -92.36297607421875, -78.69975280761719, -65.03652954101562, -51.37330627441406, -37.7100830078125, -24.046859741210938, -10.38360595703125, 3.2796173095703125, 16.942840576171875, 30.606063842773438, 44.269287109375, 57.93251037597656, 71.59573364257812, 85.25895690917969, 98.92218017578125, 112.58540344238281, 126.24862670898438, 139.91184997558594, 153.5750732421875, 167.23829650878906, 180.90151977539062, 194.5647430419922, 208.22796630859375, 221.8911895751953, 235.55441284179688, 249.21763610839844, 262.880859375, 276.5440673828125, 290.2073059082031, 303.87054443359375, 317.53375244140625, 331.19696044921875, 344.8601989746094, 358.5234375, 372.1866455078125, 385.849853515625, 399.5130920410156, 413.17633056640625, 426.83953857421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 10.0, 10.0, 17.0, 14.0, 30.0, 47.0, 67.0, 89.0, 143.0, 223.0, 329.0, 457.0, 697.0, 978.0, 1595.0, 2476.0, 4149.0, 6958.0, 12624.0, 24743.0, 53562.0, 140373.0, 394937.0, 243737.0, 83951.0, 35681.0, 17201.0, 9233.0, 5166.0, 3165.0, 2007.0, 1241.0, 863.0, 518.0, 368.0, 261.0, 187.0, 129.0, 102.0, 62.0, 40.0, 33.0, 22.0, 19.0, 13.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-71.875, -69.7451171875, -67.615234375, -65.4853515625, -63.35546875, -61.2255859375, -59.095703125, -56.9658203125, -54.8359375, -52.7060546875, -50.576171875, -48.4462890625, -46.31640625, -44.1865234375, -42.056640625, -39.9267578125, -37.796875, -35.6669921875, -33.537109375, -31.4072265625, -29.27734375, -27.1474609375, -25.017578125, -22.8876953125, -20.7578125, -18.6279296875, -16.498046875, -14.3681640625, -12.23828125, -10.1083984375, -7.978515625, -5.8486328125, -3.71875, -1.5888671875, 0.541015625, 2.6708984375, 4.80078125, 6.9306640625, 9.060546875, 11.1904296875, 13.3203125, 15.4501953125, 17.580078125, 19.7099609375, 21.83984375, 23.9697265625, 26.099609375, 28.2294921875, 30.359375, 32.4892578125, 34.619140625, 36.7490234375, 38.87890625, 41.0087890625, 43.138671875, 45.2685546875, 47.3984375, 49.5283203125, 51.658203125, 53.7880859375, 55.91796875, 58.0478515625, 60.177734375, 62.3076171875, 64.4375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 15.0, 19.0, 22.0, 23.0, 28.0, 32.0, 46.0, 49.0, 45.0, 60.0, 69.0, 58.0, 64.0, 72.0, 49.0, 54.0, 50.0, 37.0, 33.0, 35.0, 20.0, 21.0, 19.0, 19.0, 11.0, 6.0, 1.0, 4.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.630859375, -30.35546875, -29.080078125, -27.8046875, -26.529296875, -25.25390625, -23.978515625, -22.703125, -21.427734375, -20.15234375, -18.876953125, -17.6015625, -16.326171875, -15.05078125, -13.775390625, -12.5, -11.224609375, -9.94921875, -8.673828125, -7.3984375, -6.123046875, -4.84765625, -3.572265625, -2.296875, -1.021484375, 0.25390625, 1.529296875, 2.8046875, 4.080078125, 5.35546875, 6.630859375, 7.90625, 9.181640625, 10.45703125, 11.732421875, 13.0078125, 14.283203125, 15.55859375, 16.833984375, 18.109375, 19.384765625, 20.66015625, 21.935546875, 23.2109375, 24.486328125, 25.76171875, 27.037109375, 28.3125, 29.587890625, 30.86328125, 32.138671875, 33.4140625, 34.689453125, 35.96484375, 37.240234375, 38.515625, 39.791015625, 41.06640625, 42.341796875, 43.6171875, 44.892578125, 46.16796875, 47.443359375, 48.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 11.0, 18.0, 18.0, 29.0, 35.0, 51.0, 67.0, 108.0, 202.0, 293.0, 433.0, 809.0, 1624.0, 3957.0, 12396.0, 60986.0, 732676.0, 197690.0, 25240.0, 6758.0, 2447.0, 1122.0, 594.0, 314.0, 219.0, 121.0, 97.0, 67.0, 46.0, 28.0, 25.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-161.625, -156.689453125, -151.75390625, -146.818359375, -141.8828125, -136.947265625, -132.01171875, -127.076171875, -122.140625, -117.205078125, -112.26953125, -107.333984375, -102.3984375, -97.462890625, -92.52734375, -87.591796875, -82.65625, -77.720703125, -72.78515625, -67.849609375, -62.9140625, -57.978515625, -53.04296875, -48.107421875, -43.171875, -38.236328125, -33.30078125, -28.365234375, -23.4296875, -18.494140625, -13.55859375, -8.623046875, -3.6875, 1.248046875, 6.18359375, 11.119140625, 16.0546875, 20.990234375, 25.92578125, 30.861328125, 35.796875, 40.732421875, 45.66796875, 50.603515625, 55.5390625, 60.474609375, 65.41015625, 70.345703125, 75.28125, 80.216796875, 85.15234375, 90.087890625, 95.0234375, 99.958984375, 104.89453125, 109.830078125, 114.765625, 119.701171875, 124.63671875, 129.572265625, 134.5078125, 139.443359375, 144.37890625, 149.314453125, 154.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 9.0, 6.0, 9.0, 13.0, 16.0, 23.0, 26.0, 32.0, 31.0, 34.0, 45.0, 42.0, 35.0, 34.0, 55.0, 50.0, 49.0, 42.0, 54.0, 52.0, 47.0, 42.0, 32.0, 35.0, 36.0, 21.0, 21.0, 19.0, 9.0, 9.0, 8.0, 9.0, 8.0, 4.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-184.875, -180.048828125, -175.22265625, -170.396484375, -165.5703125, -160.744140625, -155.91796875, -151.091796875, -146.265625, -141.439453125, -136.61328125, -131.787109375, -126.9609375, -122.134765625, -117.30859375, -112.482421875, -107.65625, -102.830078125, -98.00390625, -93.177734375, -88.3515625, -83.525390625, -78.69921875, -73.873046875, -69.046875, -64.220703125, -59.39453125, -54.568359375, -49.7421875, -44.916015625, -40.08984375, -35.263671875, -30.4375, -25.611328125, -20.78515625, -15.958984375, -11.1328125, -6.306640625, -1.48046875, 3.345703125, 8.171875, 12.998046875, 17.82421875, 22.650390625, 27.4765625, 32.302734375, 37.12890625, 41.955078125, 46.78125, 51.607421875, 56.43359375, 61.259765625, 66.0859375, 70.912109375, 75.73828125, 80.564453125, 85.390625, 90.216796875, 95.04296875, 99.869140625, 104.6953125, 109.521484375, 114.34765625, 119.173828125, 124.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 7.0, 11.0, 17.0, 13.0, 32.0, 41.0, 65.0, 119.0, 186.0, 320.0, 610.0, 1194.0, 2696.0, 6509.0, 21063.0, 134098.0, 761233.0, 93140.0, 16884.0, 5457.0, 2407.0, 1097.0, 512.0, 289.0, 207.0, 124.0, 71.0, 43.0, 33.0, 17.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -42.7568359375, -41.138671875, -39.5205078125, -37.90234375, -36.2841796875, -34.666015625, -33.0478515625, -31.4296875, -29.8115234375, -28.193359375, -26.5751953125, -24.95703125, -23.3388671875, -21.720703125, -20.1025390625, -18.484375, -16.8662109375, -15.248046875, -13.6298828125, -12.01171875, -10.3935546875, -8.775390625, -7.1572265625, -5.5390625, -3.9208984375, -2.302734375, -0.6845703125, 0.93359375, 2.5517578125, 4.169921875, 5.7880859375, 7.40625, 9.0244140625, 10.642578125, 12.2607421875, 13.87890625, 15.4970703125, 17.115234375, 18.7333984375, 20.3515625, 21.9697265625, 23.587890625, 25.2060546875, 26.82421875, 28.4423828125, 30.060546875, 31.6787109375, 33.296875, 34.9150390625, 36.533203125, 38.1513671875, 39.76953125, 41.3876953125, 43.005859375, 44.6240234375, 46.2421875, 47.8603515625, 49.478515625, 51.0966796875, 52.71484375, 54.3330078125, 55.951171875, 57.5693359375, 59.1875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 16.0, 18.0, 34.0, 37.0, 61.0, 100.0, 120.0, 187.0, 144.0, 89.0, 51.0, 45.0, 16.0, 11.0, 10.0, 11.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018157958984375, -0.017614126205444336, -0.017070293426513672, -0.016526460647583008, -0.015982627868652344, -0.01543879508972168, -0.014894962310791016, -0.014351129531860352, -0.013807296752929688, -0.013263463973999023, -0.01271963119506836, -0.012175798416137695, -0.011631965637207031, -0.011088132858276367, -0.010544300079345703, -0.010000467300415039, -0.009456634521484375, -0.008912801742553711, -0.008368968963623047, -0.007825136184692383, -0.007281303405761719, -0.006737470626831055, -0.006193637847900391, -0.0056498050689697266, -0.0051059722900390625, -0.0045621395111083984, -0.004018306732177734, -0.0034744739532470703, -0.0029306411743164062, -0.002386808395385742, -0.0018429756164550781, -0.001299142837524414, -0.00075531005859375, -0.00021147727966308594, 0.0003323554992675781, 0.0008761882781982422, 0.0014200210571289062, 0.0019638538360595703, 0.0025076866149902344, 0.0030515193939208984, 0.0035953521728515625, 0.0041391849517822266, 0.004683017730712891, 0.005226850509643555, 0.005770683288574219, 0.006314516067504883, 0.006858348846435547, 0.007402181625366211, 0.007946014404296875, 0.008489847183227539, 0.009033679962158203, 0.009577512741088867, 0.010121345520019531, 0.010665178298950195, 0.01120901107788086, 0.011752843856811523, 0.012296676635742188, 0.012840509414672852, 0.013384342193603516, 0.01392817497253418, 0.014472007751464844, 0.015015840530395508, 0.015559673309326172, 0.016103506088256836, 0.0166473388671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 10.0, 12.0, 14.0, 20.0, 29.0, 42.0, 56.0, 81.0, 126.0, 201.0, 353.0, 647.0, 1119.0, 2386.0, 6094.0, 19918.0, 113039.0, 726313.0, 143128.0, 22680.0, 6694.0, 2646.0, 1288.0, 631.0, 363.0, 221.0, 137.0, 95.0, 59.0, 38.0, 29.0, 22.0, 11.0, 18.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0, -43.57373046875, -42.1474609375, -40.72119140625, -39.294921875, -37.86865234375, -36.4423828125, -35.01611328125, -33.58984375, -32.16357421875, -30.7373046875, -29.31103515625, -27.884765625, -26.45849609375, -25.0322265625, -23.60595703125, -22.1796875, -20.75341796875, -19.3271484375, -17.90087890625, -16.474609375, -15.04833984375, -13.6220703125, -12.19580078125, -10.76953125, -9.34326171875, -7.9169921875, -6.49072265625, -5.064453125, -3.63818359375, -2.2119140625, -0.78564453125, 0.640625, 2.06689453125, 3.4931640625, 4.91943359375, 6.345703125, 7.77197265625, 9.1982421875, 10.62451171875, 12.05078125, 13.47705078125, 14.9033203125, 16.32958984375, 17.755859375, 19.18212890625, 20.6083984375, 22.03466796875, 23.4609375, 24.88720703125, 26.3134765625, 27.73974609375, 29.166015625, 30.59228515625, 32.0185546875, 33.44482421875, 34.87109375, 36.29736328125, 37.7236328125, 39.14990234375, 40.576171875, 42.00244140625, 43.4287109375, 44.85498046875, 46.28125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 6.0, 12.0, 16.0, 12.0, 15.0, 23.0, 47.0, 50.0, 60.0, 75.0, 82.0, 77.0, 91.0, 74.0, 80.0, 56.0, 55.0, 41.0, 25.0, 15.0, 13.0, 10.0, 10.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-48.1875, -46.85107421875, -45.5146484375, -44.17822265625, -42.841796875, -41.50537109375, -40.1689453125, -38.83251953125, -37.49609375, -36.15966796875, -34.8232421875, -33.48681640625, -32.150390625, -30.81396484375, -29.4775390625, -28.14111328125, -26.8046875, -25.46826171875, -24.1318359375, -22.79541015625, -21.458984375, -20.12255859375, -18.7861328125, -17.44970703125, -16.11328125, -14.77685546875, -13.4404296875, -12.10400390625, -10.767578125, -9.43115234375, -8.0947265625, -6.75830078125, -5.421875, -4.08544921875, -2.7490234375, -1.41259765625, -0.076171875, 1.26025390625, 2.5966796875, 3.93310546875, 5.26953125, 6.60595703125, 7.9423828125, 9.27880859375, 10.615234375, 11.95166015625, 13.2880859375, 14.62451171875, 15.9609375, 17.29736328125, 18.6337890625, 19.97021484375, 21.306640625, 22.64306640625, 23.9794921875, 25.31591796875, 26.65234375, 27.98876953125, 29.3251953125, 30.66162109375, 31.998046875, 33.33447265625, 34.6708984375, 36.00732421875, 37.34375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 12.0, 8.0, 9.0, 28.0, 52.0, 59.0, 93.0, 138.0, 155.0, 150.0, 87.0, 72.0, 51.0, 28.0, 20.0, 16.0, 7.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-859.085205078125, -830.8626708984375, -802.6400756835938, -774.4175415039062, -746.1949462890625, -717.972412109375, -689.7498779296875, -661.52734375, -633.3047485351562, -605.0822143554688, -576.859619140625, -548.6370849609375, -520.41455078125, -492.19195556640625, -463.96942138671875, -435.7468566894531, -407.5242919921875, -379.3017272949219, -351.07916259765625, -322.85662841796875, -294.6340637207031, -266.4114990234375, -238.18894958496094, -209.96640014648438, -181.74383544921875, -153.52127075195312, -125.29872131347656, -97.07616424560547, -68.85360717773438, -40.63104248046875, -12.408493041992188, 15.814056396484375, 44.03662109375, 72.2591781616211, 100.48173522949219, 128.70428466796875, 156.92684936523438, 185.1494140625, 213.37196350097656, 241.59451293945312, 269.81707763671875, 298.0396423339844, 326.26220703125, 354.4847412109375, 382.7073059082031, 410.92987060546875, 439.15240478515625, 467.3749694824219, 495.5975341796875, 523.820068359375, 552.0426635742188, 580.2651977539062, 608.48779296875, 636.7103271484375, 664.932861328125, 693.1553955078125, 721.3779907226562, 749.6005249023438, 777.8231201171875, 806.045654296875, 834.2681884765625, 862.4907836914062, 890.7133178710938, 918.9359130859375, 947.158447265625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 14.0, 13.0, 21.0, 24.0, 23.0, 20.0, 23.0, 29.0, 29.0, 41.0, 47.0, 66.0, 55.0, 65.0, 48.0, 56.0, 49.0, 35.0, 35.0, 31.0, 31.0, 35.0, 32.0, 29.0, 19.0, 14.0, 18.0, 9.0, 8.0, 10.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.265380859375, -602.0185546875, -582.7717895507812, -563.5249633789062, -544.2781372070312, -525.0313110351562, -505.7845458984375, -486.5377197265625, -467.2908935546875, -448.0440979003906, -428.7972717285156, -409.55047607421875, -390.30364990234375, -371.0568542480469, -351.81005859375, -332.563232421875, -313.3164367675781, -294.06964111328125, -274.82281494140625, -255.57601928710938, -236.32919311523438, -217.0823974609375, -197.83558654785156, -178.58877563476562, -159.3419647216797, -140.09515380859375, -120.84834289550781, -101.6015396118164, -82.35472869873047, -63.10791778564453, -43.861114501953125, -24.614303588867188, -5.36749267578125, 13.879316329956055, 33.12612533569336, 52.37293243408203, 71.61974334716797, 90.8665542602539, 110.11335754394531, 129.36016845703125, 148.6069793701172, 167.85379028320312, 187.10060119628906, 206.347412109375, 225.59420776367188, 244.84103393554688, 264.08782958984375, 283.33465576171875, 302.5814514160156, 321.8282470703125, 341.0750732421875, 360.3218688964844, 379.5686950683594, 398.81549072265625, 418.06231689453125, 437.3091125488281, 456.555908203125, 475.8027038574219, 495.0495300292969, 514.2963256835938, 533.5431518554688, 552.7899780273438, 572.0367431640625, 591.2835693359375, 610.5303955078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 16.0, 12.0, 16.0, 27.0, 31.0, 35.0, 61.0, 127.0, 247.0, 494.0, 1273.0, 3488.0, 13045.0, 183165.0, 3873333.0, 102921.0, 10835.0, 3048.0, 1105.0, 462.0, 213.0, 104.0, 59.0, 21.0, 37.0, 18.0, 11.0, 9.0, 11.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-122.125, -118.2392578125, -114.353515625, -110.4677734375, -106.58203125, -102.6962890625, -98.810546875, -94.9248046875, -91.0390625, -87.1533203125, -83.267578125, -79.3818359375, -75.49609375, -71.6103515625, -67.724609375, -63.8388671875, -59.953125, -56.0673828125, -52.181640625, -48.2958984375, -44.41015625, -40.5244140625, -36.638671875, -32.7529296875, -28.8671875, -24.9814453125, -21.095703125, -17.2099609375, -13.32421875, -9.4384765625, -5.552734375, -1.6669921875, 2.21875, 6.1044921875, 9.990234375, 13.8759765625, 17.76171875, 21.6474609375, 25.533203125, 29.4189453125, 33.3046875, 37.1904296875, 41.076171875, 44.9619140625, 48.84765625, 52.7333984375, 56.619140625, 60.5048828125, 64.390625, 68.2763671875, 72.162109375, 76.0478515625, 79.93359375, 83.8193359375, 87.705078125, 91.5908203125, 95.4765625, 99.3623046875, 103.248046875, 107.1337890625, 111.01953125, 114.9052734375, 118.791015625, 122.6767578125, 126.5625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 6.0, 13.0, 8.0, 9.0, 9.0, 19.0, 15.0, 21.0, 16.0, 29.0, 40.0, 37.0, 40.0, 55.0, 47.0, 44.0, 73.0, 69.0, 63.0, 42.0, 56.0, 55.0, 45.0, 27.0, 25.0, 24.0, 12.0, 18.0, 20.0, 15.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.15625, -36.99853515625, -35.8408203125, -34.68310546875, -33.525390625, -32.36767578125, -31.2099609375, -30.05224609375, -28.89453125, -27.73681640625, -26.5791015625, -25.42138671875, -24.263671875, -23.10595703125, -21.9482421875, -20.79052734375, -19.6328125, -18.47509765625, -17.3173828125, -16.15966796875, -15.001953125, -13.84423828125, -12.6865234375, -11.52880859375, -10.37109375, -9.21337890625, -8.0556640625, -6.89794921875, -5.740234375, -4.58251953125, -3.4248046875, -2.26708984375, -1.109375, 0.04833984375, 1.2060546875, 2.36376953125, 3.521484375, 4.67919921875, 5.8369140625, 6.99462890625, 8.15234375, 9.31005859375, 10.4677734375, 11.62548828125, 12.783203125, 13.94091796875, 15.0986328125, 16.25634765625, 17.4140625, 18.57177734375, 19.7294921875, 20.88720703125, 22.044921875, 23.20263671875, 24.3603515625, 25.51806640625, 26.67578125, 27.83349609375, 28.9912109375, 30.14892578125, 31.306640625, 32.46435546875, 33.6220703125, 34.77978515625, 35.9375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 6.0, 15.0, 27.0, 30.0, 49.0, 86.0, 122.0, 233.0, 298.0, 488.0, 780.0, 1290.0, 2312.0, 4807.0, 11148.0, 31970.0, 148658.0, 2966738.0, 910060.0, 77751.0, 21124.0, 7936.0, 3680.0, 1825.0, 1062.0, 615.0, 399.0, 237.0, 162.0, 118.0, 64.0, 54.0, 38.0, 30.0, 13.0, 11.0, 9.0, 2.0, 8.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.75, -80.1494140625, -77.548828125, -74.9482421875, -72.34765625, -69.7470703125, -67.146484375, -64.5458984375, -61.9453125, -59.3447265625, -56.744140625, -54.1435546875, -51.54296875, -48.9423828125, -46.341796875, -43.7412109375, -41.140625, -38.5400390625, -35.939453125, -33.3388671875, -30.73828125, -28.1376953125, -25.537109375, -22.9365234375, -20.3359375, -17.7353515625, -15.134765625, -12.5341796875, -9.93359375, -7.3330078125, -4.732421875, -2.1318359375, 0.46875, 3.0693359375, 5.669921875, 8.2705078125, 10.87109375, 13.4716796875, 16.072265625, 18.6728515625, 21.2734375, 23.8740234375, 26.474609375, 29.0751953125, 31.67578125, 34.2763671875, 36.876953125, 39.4775390625, 42.078125, 44.6787109375, 47.279296875, 49.8798828125, 52.48046875, 55.0810546875, 57.681640625, 60.2822265625, 62.8828125, 65.4833984375, 68.083984375, 70.6845703125, 73.28515625, 75.8857421875, 78.486328125, 81.0869140625, 83.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 4.0, 11.0, 21.0, 22.0, 23.0, 59.0, 82.0, 155.0, 335.0, 823.0, 1243.0, 640.0, 276.0, 137.0, 81.0, 44.0, 24.0, 26.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.6875, -102.2119140625, -98.736328125, -95.2607421875, -91.78515625, -88.3095703125, -84.833984375, -81.3583984375, -77.8828125, -74.4072265625, -70.931640625, -67.4560546875, -63.98046875, -60.5048828125, -57.029296875, -53.5537109375, -50.078125, -46.6025390625, -43.126953125, -39.6513671875, -36.17578125, -32.7001953125, -29.224609375, -25.7490234375, -22.2734375, -18.7978515625, -15.322265625, -11.8466796875, -8.37109375, -4.8955078125, -1.419921875, 2.0556640625, 5.53125, 9.0068359375, 12.482421875, 15.9580078125, 19.43359375, 22.9091796875, 26.384765625, 29.8603515625, 33.3359375, 36.8115234375, 40.287109375, 43.7626953125, 47.23828125, 50.7138671875, 54.189453125, 57.6650390625, 61.140625, 64.6162109375, 68.091796875, 71.5673828125, 75.04296875, 78.5185546875, 81.994140625, 85.4697265625, 88.9453125, 92.4208984375, 95.896484375, 99.3720703125, 102.84765625, 106.3232421875, 109.798828125, 113.2744140625, 116.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 19.0, 10.0, 50.0, 68.0, 102.0, 115.0, 147.0, 147.0, 109.0, 66.0, 49.0, 31.0, 20.0, 9.0, 10.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-392.81005859375, -373.8019104003906, -354.7937316894531, -335.78558349609375, -316.77740478515625, -297.7692565917969, -278.7611083984375, -259.7529296875, -240.74478149414062, -221.7366180419922, -202.72845458984375, -183.72030639648438, -164.71214294433594, -145.7039794921875, -126.6958236694336, -107.68766784667969, -88.67950439453125, -69.67134094238281, -50.663185119628906, -31.655025482177734, -12.646865844726562, 6.361297607421875, 25.36945343017578, 44.37760925292969, 63.385772705078125, 82.39393615722656, 101.40209197998047, 120.41024780273438, 139.4184112548828, 158.42657470703125, 177.43472290039062, 196.44288635253906, 215.45111083984375, 234.4592742919922, 253.46743774414062, 272.4755859375, 291.4837646484375, 310.4919128417969, 329.50006103515625, 348.50823974609375, 367.5163879394531, 386.5245361328125, 405.53271484375, 424.5408630371094, 443.54901123046875, 462.55718994140625, 481.5653381347656, 500.573486328125, 519.5816650390625, 538.58984375, 557.5979614257812, 576.6061401367188, 595.6143188476562, 614.6224365234375, 633.630615234375, 652.6387939453125, 671.64697265625, 690.6551513671875, 709.6632690429688, 728.6714477539062, 747.6796264648438, 766.687744140625, 785.6959228515625, 804.7041015625, 823.7122192382812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 11.0, 17.0, 17.0, 22.0, 29.0, 13.0, 31.0, 30.0, 30.0, 38.0, 44.0, 41.0, 46.0, 36.0, 51.0, 42.0, 44.0, 49.0, 33.0, 52.0, 36.0, 39.0, 32.0, 25.0, 20.0, 26.0, 21.0, 20.0, 14.0, 13.0, 12.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-320.2158508300781, -309.3950500488281, -298.57427978515625, -287.75347900390625, -276.93267822265625, -266.11187744140625, -255.2910919189453, -244.47030639648438, -233.64950561523438, -222.82870483398438, -212.00791931152344, -201.1871337890625, -190.3663330078125, -179.5455322265625, -168.72474670410156, -157.90396118164062, -147.08316040039062, -136.26235961914062, -125.44157409667969, -114.62078094482422, -103.79998779296875, -92.97919464111328, -82.15840148925781, -71.33760833740234, -60.516815185546875, -49.696022033691406, -38.87522888183594, -28.05443572998047, -17.233642578125, -6.412849426269531, 4.4079437255859375, 15.228736877441406, 26.049560546875, 36.87035369873047, 47.69114685058594, 58.511940002441406, 69.33273315429688, 80.15352630615234, 90.97431945800781, 101.79511260986328, 112.61590576171875, 123.43669891357422, 134.2574920654297, 145.07827758789062, 155.89907836914062, 166.71987915039062, 177.54066467285156, 188.3614501953125, 199.1822509765625, 210.0030517578125, 220.82383728027344, 231.64462280273438, 242.46542358398438, 253.28622436523438, 264.10699462890625, 274.92779541015625, 285.74859619140625, 296.56939697265625, 307.39019775390625, 318.2109680175781, 329.0317687988281, 339.8525695800781, 350.67333984375, 361.494140625, 372.31494140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 18.0, 9.0, 16.0, 18.0, 37.0, 39.0, 69.0, 111.0, 158.0, 223.0, 382.0, 528.0, 934.0, 1588.0, 2943.0, 5377.0, 11101.0, 25030.0, 63904.0, 186270.0, 446536.0, 189974.0, 64009.0, 25402.0, 11251.0, 5460.0, 2900.0, 1689.0, 941.0, 571.0, 337.0, 238.0, 121.0, 102.0, 68.0, 53.0, 24.0, 35.0, 15.0, 17.0, 10.0, 4.0, 9.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-70.1875, -68.0283203125, -65.869140625, -63.7099609375, -61.55078125, -59.3916015625, -57.232421875, -55.0732421875, -52.9140625, -50.7548828125, -48.595703125, -46.4365234375, -44.27734375, -42.1181640625, -39.958984375, -37.7998046875, -35.640625, -33.4814453125, -31.322265625, -29.1630859375, -27.00390625, -24.8447265625, -22.685546875, -20.5263671875, -18.3671875, -16.2080078125, -14.048828125, -11.8896484375, -9.73046875, -7.5712890625, -5.412109375, -3.2529296875, -1.09375, 1.0654296875, 3.224609375, 5.3837890625, 7.54296875, 9.7021484375, 11.861328125, 14.0205078125, 16.1796875, 18.3388671875, 20.498046875, 22.6572265625, 24.81640625, 26.9755859375, 29.134765625, 31.2939453125, 33.453125, 35.6123046875, 37.771484375, 39.9306640625, 42.08984375, 44.2490234375, 46.408203125, 48.5673828125, 50.7265625, 52.8857421875, 55.044921875, 57.2041015625, 59.36328125, 61.5224609375, 63.681640625, 65.8408203125, 68.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 14.0, 16.0, 12.0, 12.0, 19.0, 16.0, 25.0, 29.0, 24.0, 34.0, 34.0, 37.0, 37.0, 37.0, 52.0, 39.0, 50.0, 57.0, 39.0, 52.0, 47.0, 48.0, 40.0, 24.0, 34.0, 21.0, 25.0, 12.0, 25.0, 9.0, 13.0, 15.0, 9.0, 4.0, 4.0, 6.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.542236328125, -29.47509765625, -28.407958984375, -27.3408203125, -26.273681640625, -25.20654296875, -24.139404296875, -23.072265625, -22.005126953125, -20.93798828125, -19.870849609375, -18.8037109375, -17.736572265625, -16.66943359375, -15.602294921875, -14.53515625, -13.468017578125, -12.40087890625, -11.333740234375, -10.2666015625, -9.199462890625, -8.13232421875, -7.065185546875, -5.998046875, -4.930908203125, -3.86376953125, -2.796630859375, -1.7294921875, -0.662353515625, 0.40478515625, 1.471923828125, 2.5390625, 3.606201171875, 4.67333984375, 5.740478515625, 6.8076171875, 7.874755859375, 8.94189453125, 10.009033203125, 11.076171875, 12.143310546875, 13.21044921875, 14.277587890625, 15.3447265625, 16.411865234375, 17.47900390625, 18.546142578125, 19.61328125, 20.680419921875, 21.74755859375, 22.814697265625, 23.8818359375, 24.948974609375, 26.01611328125, 27.083251953125, 28.150390625, 29.217529296875, 30.28466796875, 31.351806640625, 32.4189453125, 33.486083984375, 34.55322265625, 35.620361328125, 36.6875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 16.0, 17.0, 21.0, 30.0, 54.0, 79.0, 112.0, 196.0, 361.0, 715.0, 1601.0, 4388.0, 16287.0, 90939.0, 754227.0, 147165.0, 22667.0, 5823.0, 2027.0, 840.0, 400.0, 208.0, 137.0, 76.0, 44.0, 29.0, 26.0, 7.0, 17.0, 13.0, 3.0, 9.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.25, -134.3828125, -129.515625, -124.6484375, -119.78125, -114.9140625, -110.046875, -105.1796875, -100.3125, -95.4453125, -90.578125, -85.7109375, -80.84375, -75.9765625, -71.109375, -66.2421875, -61.375, -56.5078125, -51.640625, -46.7734375, -41.90625, -37.0390625, -32.171875, -27.3046875, -22.4375, -17.5703125, -12.703125, -7.8359375, -2.96875, 1.8984375, 6.765625, 11.6328125, 16.5, 21.3671875, 26.234375, 31.1015625, 35.96875, 40.8359375, 45.703125, 50.5703125, 55.4375, 60.3046875, 65.171875, 70.0390625, 74.90625, 79.7734375, 84.640625, 89.5078125, 94.375, 99.2421875, 104.109375, 108.9765625, 113.84375, 118.7109375, 123.578125, 128.4453125, 133.3125, 138.1796875, 143.046875, 147.9140625, 152.78125, 157.6484375, 162.515625, 167.3828125, 172.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 9.0, 11.0, 14.0, 15.0, 25.0, 20.0, 34.0, 30.0, 52.0, 48.0, 43.0, 38.0, 43.0, 48.0, 52.0, 57.0, 63.0, 50.0, 42.0, 44.0, 45.0, 33.0, 28.0, 24.0, 23.0, 18.0, 12.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.25, -158.201171875, -153.15234375, -148.103515625, -143.0546875, -138.005859375, -132.95703125, -127.908203125, -122.859375, -117.810546875, -112.76171875, -107.712890625, -102.6640625, -97.615234375, -92.56640625, -87.517578125, -82.46875, -77.419921875, -72.37109375, -67.322265625, -62.2734375, -57.224609375, -52.17578125, -47.126953125, -42.078125, -37.029296875, -31.98046875, -26.931640625, -21.8828125, -16.833984375, -11.78515625, -6.736328125, -1.6875, 3.361328125, 8.41015625, 13.458984375, 18.5078125, 23.556640625, 28.60546875, 33.654296875, 38.703125, 43.751953125, 48.80078125, 53.849609375, 58.8984375, 63.947265625, 68.99609375, 74.044921875, 79.09375, 84.142578125, 89.19140625, 94.240234375, 99.2890625, 104.337890625, 109.38671875, 114.435546875, 119.484375, 124.533203125, 129.58203125, 134.630859375, 139.6796875, 144.728515625, 149.77734375, 154.826171875, 159.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 16.0, 24.0, 28.0, 58.0, 75.0, 122.0, 223.0, 394.0, 691.0, 1554.0, 3915.0, 12000.0, 61114.0, 719539.0, 211415.0, 25690.0, 6857.0, 2371.0, 1126.0, 533.0, 334.0, 172.0, 110.0, 57.0, 32.0, 20.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.875, -77.5771484375, -75.279296875, -72.9814453125, -70.68359375, -68.3857421875, -66.087890625, -63.7900390625, -61.4921875, -59.1943359375, -56.896484375, -54.5986328125, -52.30078125, -50.0029296875, -47.705078125, -45.4072265625, -43.109375, -40.8115234375, -38.513671875, -36.2158203125, -33.91796875, -31.6201171875, -29.322265625, -27.0244140625, -24.7265625, -22.4287109375, -20.130859375, -17.8330078125, -15.53515625, -13.2373046875, -10.939453125, -8.6416015625, -6.34375, -4.0458984375, -1.748046875, 0.5498046875, 2.84765625, 5.1455078125, 7.443359375, 9.7412109375, 12.0390625, 14.3369140625, 16.634765625, 18.9326171875, 21.23046875, 23.5283203125, 25.826171875, 28.1240234375, 30.421875, 32.7197265625, 35.017578125, 37.3154296875, 39.61328125, 41.9111328125, 44.208984375, 46.5068359375, 48.8046875, 51.1025390625, 53.400390625, 55.6982421875, 57.99609375, 60.2939453125, 62.591796875, 64.8896484375, 67.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 13.0, 24.0, 50.0, 91.0, 247.0, 291.0, 128.0, 50.0, 31.0, 17.0, 15.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.054443359375, -0.053238868713378906, -0.05203437805175781, -0.05082988739013672, -0.049625396728515625, -0.04842090606689453, -0.04721641540527344, -0.046011924743652344, -0.04480743408203125, -0.043602943420410156, -0.04239845275878906, -0.04119396209716797, -0.039989471435546875, -0.03878498077392578, -0.03758049011230469, -0.036375999450683594, -0.0351715087890625, -0.033967018127441406, -0.03276252746582031, -0.03155803680419922, -0.030353546142578125, -0.02914905548095703, -0.027944564819335938, -0.026740074157714844, -0.02553558349609375, -0.024331092834472656, -0.023126602172851562, -0.02192211151123047, -0.020717620849609375, -0.01951313018798828, -0.018308639526367188, -0.017104148864746094, -0.015899658203125, -0.014695167541503906, -0.013490676879882812, -0.012286186218261719, -0.011081695556640625, -0.009877204895019531, -0.008672714233398438, -0.007468223571777344, -0.00626373291015625, -0.005059242248535156, -0.0038547515869140625, -0.0026502609252929688, -0.001445770263671875, -0.00024127960205078125, 0.0009632110595703125, 0.0021677017211914062, 0.0033721923828125, 0.004576683044433594, 0.0057811737060546875, 0.006985664367675781, 0.008190155029296875, 0.009394645690917969, 0.010599136352539062, 0.011803627014160156, 0.01300811767578125, 0.014212608337402344, 0.015417098999023438, 0.01662158966064453, 0.017826080322265625, 0.01903057098388672, 0.020235061645507812, 0.021439552307128906, 0.02264404296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 15.0, 24.0, 22.0, 41.0, 78.0, 107.0, 172.0, 365.0, 668.0, 1350.0, 3169.0, 8856.0, 35408.0, 241637.0, 650614.0, 80703.0, 16169.0, 5056.0, 2012.0, 971.0, 439.0, 253.0, 154.0, 74.0, 54.0, 28.0, 18.0, 20.0, 18.0, 11.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.25, -50.52197265625, -48.7939453125, -47.06591796875, -45.337890625, -43.60986328125, -41.8818359375, -40.15380859375, -38.42578125, -36.69775390625, -34.9697265625, -33.24169921875, -31.513671875, -29.78564453125, -28.0576171875, -26.32958984375, -24.6015625, -22.87353515625, -21.1455078125, -19.41748046875, -17.689453125, -15.96142578125, -14.2333984375, -12.50537109375, -10.77734375, -9.04931640625, -7.3212890625, -5.59326171875, -3.865234375, -2.13720703125, -0.4091796875, 1.31884765625, 3.046875, 4.77490234375, 6.5029296875, 8.23095703125, 9.958984375, 11.68701171875, 13.4150390625, 15.14306640625, 16.87109375, 18.59912109375, 20.3271484375, 22.05517578125, 23.783203125, 25.51123046875, 27.2392578125, 28.96728515625, 30.6953125, 32.42333984375, 34.1513671875, 35.87939453125, 37.607421875, 39.33544921875, 41.0634765625, 42.79150390625, 44.51953125, 46.24755859375, 47.9755859375, 49.70361328125, 51.431640625, 53.15966796875, 54.8876953125, 56.61572265625, 58.34375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 11.0, 17.0, 13.0, 32.0, 48.0, 43.0, 79.0, 65.0, 98.0, 108.0, 92.0, 91.0, 67.0, 66.0, 36.0, 25.0, 17.0, 15.0, 20.0, 9.0, 3.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.15234375, -58.2421875, -56.33203125, -54.421875, -52.51171875, -50.6015625, -48.69140625, -46.78125, -44.87109375, -42.9609375, -41.05078125, -39.140625, -37.23046875, -35.3203125, -33.41015625, -31.5, -29.58984375, -27.6796875, -25.76953125, -23.859375, -21.94921875, -20.0390625, -18.12890625, -16.21875, -14.30859375, -12.3984375, -10.48828125, -8.578125, -6.66796875, -4.7578125, -2.84765625, -0.9375, 0.97265625, 2.8828125, 4.79296875, 6.703125, 8.61328125, 10.5234375, 12.43359375, 14.34375, 16.25390625, 18.1640625, 20.07421875, 21.984375, 23.89453125, 25.8046875, 27.71484375, 29.625, 31.53515625, 33.4453125, 35.35546875, 37.265625, 39.17578125, 41.0859375, 42.99609375, 44.90625, 46.81640625, 48.7265625, 50.63671875, 52.546875, 54.45703125, 56.3671875, 58.27734375, 60.1875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 21.0, 64.0, 191.0, 314.0, 216.0, 108.0, 40.0, 19.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1606.042724609375, -1551.7738037109375, -1497.5048828125, -1443.2359619140625, -1388.967041015625, -1334.6981201171875, -1280.42919921875, -1226.1602783203125, -1171.891357421875, -1117.6224365234375, -1063.353515625, -1009.0845947265625, -954.815673828125, -900.5467529296875, -846.27783203125, -792.0089111328125, -737.739990234375, -683.4710693359375, -629.2021484375, -574.9332275390625, -520.664306640625, -466.3953857421875, -412.12646484375, -357.8575439453125, -303.588623046875, -249.3197021484375, -195.05078125, -140.7818603515625, -86.512939453125, -32.2440185546875, 22.02490234375, 76.2938232421875, 130.5628662109375, 184.831787109375, 239.1007080078125, 293.36962890625, 347.6385498046875, 401.907470703125, 456.1763916015625, 510.4453125, 564.7142333984375, 618.983154296875, 673.2520751953125, 727.52099609375, 781.7899169921875, 836.058837890625, 890.3277587890625, 944.5966796875, 998.8656005859375, 1053.134521484375, 1107.4034423828125, 1161.67236328125, 1215.9412841796875, 1270.210205078125, 1324.4791259765625, 1378.748046875, 1433.0169677734375, 1487.285888671875, 1541.5548095703125, 1595.82373046875, 1650.0926513671875, 1704.361572265625, 1758.6304931640625, 1812.8994140625, 1867.1683349609375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 11.0, 7.0, 6.0, 15.0, 10.0, 17.0, 13.0, 20.0, 22.0, 31.0, 20.0, 29.0, 38.0, 27.0, 42.0, 42.0, 37.0, 41.0, 59.0, 52.0, 49.0, 32.0, 39.0, 39.0, 38.0, 34.0, 29.0, 21.0, 31.0, 20.0, 16.0, 18.0, 15.0, 12.0, 20.0, 8.0, 8.0, 11.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-614.193115234375, -596.7333374023438, -579.2735595703125, -561.8137817382812, -544.35400390625, -526.8941650390625, -509.43438720703125, -491.974609375, -474.51483154296875, -457.0550537109375, -439.59527587890625, -422.1354675292969, -404.6756896972656, -387.2159118652344, -369.756103515625, -352.29632568359375, -334.8365478515625, -317.37677001953125, -299.9169921875, -282.4571838378906, -264.9974060058594, -247.53762817382812, -230.0778350830078, -212.6180419921875, -195.15826416015625, -177.698486328125, -160.2386932373047, -142.77890014648438, -125.31912231445312, -107.85933685302734, -90.39955139160156, -72.93976593017578, -55.47998046875, -38.02019500732422, -20.560409545898438, -3.1006240844726562, 14.359161376953125, 31.818946838378906, 49.27873229980469, 66.73851776123047, 84.19830322265625, 101.65808868408203, 119.11787414550781, 136.57766723632812, 154.03744506835938, 171.49722290039062, 188.95701599121094, 206.41680908203125, 223.8765869140625, 241.33636474609375, 258.796142578125, 276.2559509277344, 293.7157287597656, 311.1755065917969, 328.63531494140625, 346.0950927734375, 363.55487060546875, 381.0146484375, 398.47442626953125, 415.9342346191406, 433.3940124511719, 450.8537902832031, 468.3135986328125, 485.77337646484375, 503.233154296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 7.0, 9.0, 6.0, 7.0, 19.0, 21.0, 25.0, 44.0, 60.0, 80.0, 107.0, 156.0, 262.0, 406.0, 633.0, 1064.0, 1674.0, 3061.0, 5722.0, 11498.0, 26539.0, 83376.0, 341821.0, 1637369.0, 1615702.0, 337040.0, 79085.0, 25243.0, 10819.0, 5333.0, 2781.0, 1573.0, 938.0, 618.0, 404.0, 215.0, 151.0, 105.0, 82.0, 65.0, 47.0, 36.0, 18.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0], "bins": [-42.125, -40.80810546875, -39.4912109375, -38.17431640625, -36.857421875, -35.54052734375, -34.2236328125, -32.90673828125, -31.58984375, -30.27294921875, -28.9560546875, -27.63916015625, -26.322265625, -25.00537109375, -23.6884765625, -22.37158203125, -21.0546875, -19.73779296875, -18.4208984375, -17.10400390625, -15.787109375, -14.47021484375, -13.1533203125, -11.83642578125, -10.51953125, -9.20263671875, -7.8857421875, -6.56884765625, -5.251953125, -3.93505859375, -2.6181640625, -1.30126953125, 0.015625, 1.33251953125, 2.6494140625, 3.96630859375, 5.283203125, 6.60009765625, 7.9169921875, 9.23388671875, 10.55078125, 11.86767578125, 13.1845703125, 14.50146484375, 15.818359375, 17.13525390625, 18.4521484375, 19.76904296875, 21.0859375, 22.40283203125, 23.7197265625, 25.03662109375, 26.353515625, 27.67041015625, 28.9873046875, 30.30419921875, 31.62109375, 32.93798828125, 34.2548828125, 35.57177734375, 36.888671875, 38.20556640625, 39.5224609375, 40.83935546875, 42.15625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 3.0, 6.0, 6.0, 12.0, 18.0, 20.0, 15.0, 26.0, 18.0, 39.0, 22.0, 31.0, 38.0, 32.0, 64.0, 44.0, 45.0, 59.0, 60.0, 44.0, 49.0, 48.0, 50.0, 36.0, 38.0, 25.0, 20.0, 23.0, 13.0, 15.0, 16.0, 17.0, 8.0, 10.0, 7.0, 4.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.859375, -26.784912109375, -25.71044921875, -24.635986328125, -23.5615234375, -22.487060546875, -21.41259765625, -20.338134765625, -19.263671875, -18.189208984375, -17.11474609375, -16.040283203125, -14.9658203125, -13.891357421875, -12.81689453125, -11.742431640625, -10.66796875, -9.593505859375, -8.51904296875, -7.444580078125, -6.3701171875, -5.295654296875, -4.22119140625, -3.146728515625, -2.072265625, -0.997802734375, 0.07666015625, 1.151123046875, 2.2255859375, 3.300048828125, 4.37451171875, 5.448974609375, 6.5234375, 7.597900390625, 8.67236328125, 9.746826171875, 10.8212890625, 11.895751953125, 12.97021484375, 14.044677734375, 15.119140625, 16.193603515625, 17.26806640625, 18.342529296875, 19.4169921875, 20.491455078125, 21.56591796875, 22.640380859375, 23.71484375, 24.789306640625, 25.86376953125, 26.938232421875, 28.0126953125, 29.087158203125, 30.16162109375, 31.236083984375, 32.310546875, 33.385009765625, 34.45947265625, 35.533935546875, 36.6083984375, 37.682861328125, 38.75732421875, 39.831787109375, 40.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 9.0, 18.0, 31.0, 29.0, 72.0, 75.0, 119.0, 190.0, 308.0, 521.0, 940.0, 1683.0, 3561.0, 8626.0, 26466.0, 109246.0, 1789763.0, 2092117.0, 118253.0, 26661.0, 8451.0, 3434.0, 1606.0, 804.0, 471.0, 279.0, 157.0, 124.0, 85.0, 39.0, 46.0, 19.0, 15.0, 10.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.9375, -99.72265625, -96.5078125, -93.29296875, -90.078125, -86.86328125, -83.6484375, -80.43359375, -77.21875, -74.00390625, -70.7890625, -67.57421875, -64.359375, -61.14453125, -57.9296875, -54.71484375, -51.5, -48.28515625, -45.0703125, -41.85546875, -38.640625, -35.42578125, -32.2109375, -28.99609375, -25.78125, -22.56640625, -19.3515625, -16.13671875, -12.921875, -9.70703125, -6.4921875, -3.27734375, -0.0625, 3.15234375, 6.3671875, 9.58203125, 12.796875, 16.01171875, 19.2265625, 22.44140625, 25.65625, 28.87109375, 32.0859375, 35.30078125, 38.515625, 41.73046875, 44.9453125, 48.16015625, 51.375, 54.58984375, 57.8046875, 61.01953125, 64.234375, 67.44921875, 70.6640625, 73.87890625, 77.09375, 80.30859375, 83.5234375, 86.73828125, 89.953125, 93.16796875, 96.3828125, 99.59765625, 102.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 11.0, 9.0, 21.0, 28.0, 31.0, 53.0, 72.0, 75.0, 164.0, 383.0, 800.0, 1065.0, 599.0, 291.0, 159.0, 89.0, 74.0, 38.0, 25.0, 19.0, 16.0, 6.0, 8.0, 11.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.5, -138.08984375, -133.6796875, -129.26953125, -124.859375, -120.44921875, -116.0390625, -111.62890625, -107.21875, -102.80859375, -98.3984375, -93.98828125, -89.578125, -85.16796875, -80.7578125, -76.34765625, -71.9375, -67.52734375, -63.1171875, -58.70703125, -54.296875, -49.88671875, -45.4765625, -41.06640625, -36.65625, -32.24609375, -27.8359375, -23.42578125, -19.015625, -14.60546875, -10.1953125, -5.78515625, -1.375, 3.03515625, 7.4453125, 11.85546875, 16.265625, 20.67578125, 25.0859375, 29.49609375, 33.90625, 38.31640625, 42.7265625, 47.13671875, 51.546875, 55.95703125, 60.3671875, 64.77734375, 69.1875, 73.59765625, 78.0078125, 82.41796875, 86.828125, 91.23828125, 95.6484375, 100.05859375, 104.46875, 108.87890625, 113.2890625, 117.69921875, 122.109375, 126.51953125, 130.9296875, 135.33984375, 139.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 14.0, 14.0, 30.0, 91.0, 173.0, 246.0, 216.0, 128.0, 40.0, 26.0, 10.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2329.535888671875, -2277.539794921875, -2225.54345703125, -2173.54736328125, -2121.55126953125, -2069.554931640625, -2017.558837890625, -1965.5626220703125, -1913.56640625, -1861.5701904296875, -1809.5740966796875, -1757.577880859375, -1705.5816650390625, -1653.58544921875, -1601.58935546875, -1549.5931396484375, -1497.5970458984375, -1445.600830078125, -1393.604736328125, -1341.6085205078125, -1289.6123046875, -1237.6162109375, -1185.6199951171875, -1133.623779296875, -1081.627685546875, -1029.6314697265625, -977.6353149414062, -925.63916015625, -873.6429443359375, -821.6467895507812, -769.650634765625, -717.6544189453125, -665.6580810546875, -613.6619262695312, -561.6657104492188, -509.6695556640625, -457.6733703613281, -405.67718505859375, -353.6810302734375, -301.6848449707031, -249.68865966796875, -197.69247436523438, -145.69630432128906, -93.70013427734375, -41.703948974609375, 10.292236328125, 62.28839111328125, 114.28457641601562, 166.28076171875, 218.27694702148438, 270.27313232421875, 322.269287109375, 374.2654724121094, 426.26165771484375, 478.2578125, 530.2540283203125, 582.2501831054688, 634.246337890625, 686.2425537109375, 738.2387084960938, 790.23486328125, 842.2310791015625, 894.2272338867188, 946.223388671875, 998.2196044921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 9.0, 7.0, 6.0, 15.0, 20.0, 30.0, 23.0, 26.0, 31.0, 33.0, 34.0, 44.0, 41.0, 62.0, 55.0, 64.0, 39.0, 57.0, 31.0, 52.0, 34.0, 33.0, 41.0, 29.0, 32.0, 23.0, 22.0, 22.0, 17.0, 14.0, 5.0, 12.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-600.299560546875, -582.5486450195312, -564.7977294921875, -547.0468139648438, -529.2958984375, -511.54498291015625, -493.7940673828125, -476.04315185546875, -458.292236328125, -440.54132080078125, -422.7904052734375, -405.03948974609375, -387.28857421875, -369.53765869140625, -351.7867431640625, -334.03582763671875, -316.2848815917969, -298.5339660644531, -280.7830505371094, -263.0321350097656, -245.28121948242188, -227.53030395507812, -209.7793731689453, -192.02845764160156, -174.2775421142578, -156.52662658691406, -138.7757110595703, -121.02478790283203, -103.27387237548828, -85.52295684814453, -67.77203369140625, -50.0211181640625, -32.27020263671875, -14.519285202026367, 3.2316322326660156, 20.98255157470703, 38.73346710205078, 56.48438262939453, 74.23530578613281, 91.98622131347656, 109.73713684082031, 127.48805236816406, 145.2389678955078, 162.98989868164062, 180.74081420898438, 198.49172973632812, 216.24264526367188, 233.99356079101562, 251.74447631835938, 269.4953918457031, 287.2463073730469, 304.9972229003906, 322.7481384277344, 340.4990539550781, 358.25, 376.00091552734375, 393.7518310546875, 411.50274658203125, 429.253662109375, 447.00457763671875, 464.7554931640625, 482.50640869140625, 500.25732421875, 518.0082397460938, 535.7591552734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 12.0, 17.0, 14.0, 30.0, 49.0, 60.0, 92.0, 118.0, 166.0, 324.0, 546.0, 795.0, 1369.0, 2291.0, 3907.0, 6995.0, 12940.0, 25408.0, 50653.0, 106499.0, 238442.0, 313772.0, 145050.0, 67864.0, 33471.0, 16497.0, 9029.0, 5049.0, 2811.0, 1649.0, 953.0, 635.0, 332.0, 257.0, 139.0, 104.0, 54.0, 47.0, 36.0, 34.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.875, -54.083984375, -52.29296875, -50.501953125, -48.7109375, -46.919921875, -45.12890625, -43.337890625, -41.546875, -39.755859375, -37.96484375, -36.173828125, -34.3828125, -32.591796875, -30.80078125, -29.009765625, -27.21875, -25.427734375, -23.63671875, -21.845703125, -20.0546875, -18.263671875, -16.47265625, -14.681640625, -12.890625, -11.099609375, -9.30859375, -7.517578125, -5.7265625, -3.935546875, -2.14453125, -0.353515625, 1.4375, 3.228515625, 5.01953125, 6.810546875, 8.6015625, 10.392578125, 12.18359375, 13.974609375, 15.765625, 17.556640625, 19.34765625, 21.138671875, 22.9296875, 24.720703125, 26.51171875, 28.302734375, 30.09375, 31.884765625, 33.67578125, 35.466796875, 37.2578125, 39.048828125, 40.83984375, 42.630859375, 44.421875, 46.212890625, 48.00390625, 49.794921875, 51.5859375, 53.376953125, 55.16796875, 56.958984375, 58.75]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 13.0, 11.0, 13.0, 15.0, 20.0, 28.0, 24.0, 34.0, 41.0, 42.0, 49.0, 57.0, 52.0, 54.0, 50.0, 50.0, 57.0, 44.0, 57.0, 39.0, 27.0, 35.0, 35.0, 28.0, 13.0, 24.0, 17.0, 11.0, 12.0, 11.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.5625, -47.31103515625, -46.0595703125, -44.80810546875, -43.556640625, -42.30517578125, -41.0537109375, -39.80224609375, -38.55078125, -37.29931640625, -36.0478515625, -34.79638671875, -33.544921875, -32.29345703125, -31.0419921875, -29.79052734375, -28.5390625, -27.28759765625, -26.0361328125, -24.78466796875, -23.533203125, -22.28173828125, -21.0302734375, -19.77880859375, -18.52734375, -17.27587890625, -16.0244140625, -14.77294921875, -13.521484375, -12.27001953125, -11.0185546875, -9.76708984375, -8.515625, -7.26416015625, -6.0126953125, -4.76123046875, -3.509765625, -2.25830078125, -1.0068359375, 0.24462890625, 1.49609375, 2.74755859375, 3.9990234375, 5.25048828125, 6.501953125, 7.75341796875, 9.0048828125, 10.25634765625, 11.5078125, 12.75927734375, 14.0107421875, 15.26220703125, 16.513671875, 17.76513671875, 19.0166015625, 20.26806640625, 21.51953125, 22.77099609375, 24.0224609375, 25.27392578125, 26.525390625, 27.77685546875, 29.0283203125, 30.27978515625, 31.53125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 13.0, 11.0, 13.0, 22.0, 52.0, 38.0, 64.0, 100.0, 165.0, 239.0, 413.0, 740.0, 1487.0, 3644.0, 12819.0, 96721.0, 809573.0, 102051.0, 13321.0, 3666.0, 1458.0, 720.0, 419.0, 281.0, 158.0, 108.0, 70.0, 57.0, 37.0, 18.0, 18.0, 20.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-254.75, -248.134765625, -241.51953125, -234.904296875, -228.2890625, -221.673828125, -215.05859375, -208.443359375, -201.828125, -195.212890625, -188.59765625, -181.982421875, -175.3671875, -168.751953125, -162.13671875, -155.521484375, -148.90625, -142.291015625, -135.67578125, -129.060546875, -122.4453125, -115.830078125, -109.21484375, -102.599609375, -95.984375, -89.369140625, -82.75390625, -76.138671875, -69.5234375, -62.908203125, -56.29296875, -49.677734375, -43.0625, -36.447265625, -29.83203125, -23.216796875, -16.6015625, -9.986328125, -3.37109375, 3.244140625, 9.859375, 16.474609375, 23.08984375, 29.705078125, 36.3203125, 42.935546875, 49.55078125, 56.166015625, 62.78125, 69.396484375, 76.01171875, 82.626953125, 89.2421875, 95.857421875, 102.47265625, 109.087890625, 115.703125, 122.318359375, 128.93359375, 135.548828125, 142.1640625, 148.779296875, 155.39453125, 162.009765625, 168.625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 4.0, 14.0, 16.0, 22.0, 24.0, 19.0, 24.0, 45.0, 40.0, 47.0, 46.0, 58.0, 65.0, 66.0, 56.0, 52.0, 61.0, 32.0, 42.0, 42.0, 32.0, 38.0, 27.0, 27.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-266.25, -259.634765625, -253.01953125, -246.404296875, -239.7890625, -233.173828125, -226.55859375, -219.943359375, -213.328125, -206.712890625, -200.09765625, -193.482421875, -186.8671875, -180.251953125, -173.63671875, -167.021484375, -160.40625, -153.791015625, -147.17578125, -140.560546875, -133.9453125, -127.330078125, -120.71484375, -114.099609375, -107.484375, -100.869140625, -94.25390625, -87.638671875, -81.0234375, -74.408203125, -67.79296875, -61.177734375, -54.5625, -47.947265625, -41.33203125, -34.716796875, -28.1015625, -21.486328125, -14.87109375, -8.255859375, -1.640625, 4.974609375, 11.58984375, 18.205078125, 24.8203125, 31.435546875, 38.05078125, 44.666015625, 51.28125, 57.896484375, 64.51171875, 71.126953125, 77.7421875, 84.357421875, 90.97265625, 97.587890625, 104.203125, 110.818359375, 117.43359375, 124.048828125, 130.6640625, 137.279296875, 143.89453125, 150.509765625, 157.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 12.0, 11.0, 22.0, 29.0, 34.0, 62.0, 103.0, 184.0, 314.0, 617.0, 1452.0, 3601.0, 10910.0, 43443.0, 256964.0, 628947.0, 75842.0, 17024.0, 5188.0, 1950.0, 816.0, 424.0, 218.0, 123.0, 87.0, 45.0, 49.0, 24.0, 11.0, 10.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -33.82177734375, -32.3623046875, -30.90283203125, -29.443359375, -27.98388671875, -26.5244140625, -25.06494140625, -23.60546875, -22.14599609375, -20.6865234375, -19.22705078125, -17.767578125, -16.30810546875, -14.8486328125, -13.38916015625, -11.9296875, -10.47021484375, -9.0107421875, -7.55126953125, -6.091796875, -4.63232421875, -3.1728515625, -1.71337890625, -0.25390625, 1.20556640625, 2.6650390625, 4.12451171875, 5.583984375, 7.04345703125, 8.5029296875, 9.96240234375, 11.421875, 12.88134765625, 14.3408203125, 15.80029296875, 17.259765625, 18.71923828125, 20.1787109375, 21.63818359375, 23.09765625, 24.55712890625, 26.0166015625, 27.47607421875, 28.935546875, 30.39501953125, 31.8544921875, 33.31396484375, 34.7734375, 36.23291015625, 37.6923828125, 39.15185546875, 40.611328125, 42.07080078125, 43.5302734375, 44.98974609375, 46.44921875, 47.90869140625, 49.3681640625, 50.82763671875, 52.287109375, 53.74658203125, 55.2060546875, 56.66552734375, 58.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 25.0, 24.0, 28.0, 33.0, 40.0, 57.0, 84.0, 91.0, 121.0, 98.0, 88.0, 57.0, 51.0, 32.0, 34.0, 18.0, 16.0, 15.0, 10.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017974853515625, -0.017531633377075195, -0.01708841323852539, -0.016645193099975586, -0.01620197296142578, -0.015758752822875977, -0.015315532684326172, -0.014872312545776367, -0.014429092407226562, -0.013985872268676758, -0.013542652130126953, -0.013099431991577148, -0.012656211853027344, -0.012212991714477539, -0.011769771575927734, -0.01132655143737793, -0.010883331298828125, -0.01044011116027832, -0.009996891021728516, -0.009553670883178711, -0.009110450744628906, -0.008667230606079102, -0.008224010467529297, -0.007780790328979492, -0.0073375701904296875, -0.006894350051879883, -0.006451129913330078, -0.0060079097747802734, -0.005564689636230469, -0.005121469497680664, -0.004678249359130859, -0.004235029220581055, -0.00379180908203125, -0.0033485889434814453, -0.0029053688049316406, -0.002462148666381836, -0.0020189285278320312, -0.0015757083892822266, -0.0011324882507324219, -0.0006892681121826172, -0.0002460479736328125, 0.0001971721649169922, 0.0006403923034667969, 0.0010836124420166016, 0.0015268325805664062, 0.001970052719116211, 0.0024132728576660156, 0.0028564929962158203, 0.003299713134765625, 0.0037429332733154297, 0.004186153411865234, 0.004629373550415039, 0.005072593688964844, 0.0055158138275146484, 0.005959033966064453, 0.006402254104614258, 0.0068454742431640625, 0.007288694381713867, 0.007731914520263672, 0.008175134658813477, 0.008618354797363281, 0.009061574935913086, 0.00950479507446289, 0.009948015213012695, 0.0103912353515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 10.0, 24.0, 27.0, 69.0, 77.0, 131.0, 208.0, 472.0, 994.0, 2513.0, 8960.0, 59805.0, 787034.0, 164473.0, 17237.0, 3867.0, 1355.0, 590.0, 291.0, 147.0, 82.0, 58.0, 34.0, 22.0, 17.0, 9.0, 10.0, 10.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.0625, -74.96240234375, -72.8623046875, -70.76220703125, -68.662109375, -66.56201171875, -64.4619140625, -62.36181640625, -60.26171875, -58.16162109375, -56.0615234375, -53.96142578125, -51.861328125, -49.76123046875, -47.6611328125, -45.56103515625, -43.4609375, -41.36083984375, -39.2607421875, -37.16064453125, -35.060546875, -32.96044921875, -30.8603515625, -28.76025390625, -26.66015625, -24.56005859375, -22.4599609375, -20.35986328125, -18.259765625, -16.15966796875, -14.0595703125, -11.95947265625, -9.859375, -7.75927734375, -5.6591796875, -3.55908203125, -1.458984375, 0.64111328125, 2.7412109375, 4.84130859375, 6.94140625, 9.04150390625, 11.1416015625, 13.24169921875, 15.341796875, 17.44189453125, 19.5419921875, 21.64208984375, 23.7421875, 25.84228515625, 27.9423828125, 30.04248046875, 32.142578125, 34.24267578125, 36.3427734375, 38.44287109375, 40.54296875, 42.64306640625, 44.7431640625, 46.84326171875, 48.943359375, 51.04345703125, 53.1435546875, 55.24365234375, 57.34375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 9.0, 10.0, 16.0, 14.0, 21.0, 21.0, 29.0, 26.0, 39.0, 48.0, 43.0, 37.0, 54.0, 74.0, 76.0, 59.0, 58.0, 54.0, 36.0, 34.0, 30.0, 28.0, 19.0, 25.0, 19.0, 22.0, 5.0, 8.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.5625, -38.36669921875, -37.1708984375, -35.97509765625, -34.779296875, -33.58349609375, -32.3876953125, -31.19189453125, -29.99609375, -28.80029296875, -27.6044921875, -26.40869140625, -25.212890625, -24.01708984375, -22.8212890625, -21.62548828125, -20.4296875, -19.23388671875, -18.0380859375, -16.84228515625, -15.646484375, -14.45068359375, -13.2548828125, -12.05908203125, -10.86328125, -9.66748046875, -8.4716796875, -7.27587890625, -6.080078125, -4.88427734375, -3.6884765625, -2.49267578125, -1.296875, -0.10107421875, 1.0947265625, 2.29052734375, 3.486328125, 4.68212890625, 5.8779296875, 7.07373046875, 8.26953125, 9.46533203125, 10.6611328125, 11.85693359375, 13.052734375, 14.24853515625, 15.4443359375, 16.64013671875, 17.8359375, 19.03173828125, 20.2275390625, 21.42333984375, 22.619140625, 23.81494140625, 25.0107421875, 26.20654296875, 27.40234375, 28.59814453125, 29.7939453125, 30.98974609375, 32.185546875, 33.38134765625, 34.5771484375, 35.77294921875, 36.96875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 13.0, 39.0, 50.0, 150.0, 268.0, 217.0, 139.0, 64.0, 26.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-973.2877197265625, -928.6898803710938, -884.092041015625, -839.4942626953125, -794.8963623046875, -750.298583984375, -705.7007446289062, -661.1029052734375, -616.5050659179688, -571.9072265625, -527.3093872070312, -482.7115783691406, -438.1137390136719, -393.5158996582031, -348.9180908203125, -304.32025146484375, -259.722412109375, -215.12457275390625, -170.52674865722656, -125.92892456054688, -81.33108520507812, -36.733245849609375, 7.86456298828125, 52.46240234375, 97.06024169921875, 141.6580810546875, 186.2559051513672, 230.85372924804688, 275.4515686035156, 320.0494079589844, 364.647216796875, 409.24505615234375, 453.843017578125, 498.44085693359375, 543.0386962890625, 587.636474609375, 632.234375, 676.8321533203125, 721.4299926757812, 766.02783203125, 810.6256713867188, 855.2235107421875, 899.8213500976562, 944.419189453125, 989.0169677734375, 1033.6148681640625, 1078.212646484375, 1122.810546875, 1167.4083251953125, 1212.006103515625, 1256.60400390625, 1301.2017822265625, 1345.7996826171875, 1390.3974609375, 1434.995361328125, 1479.5931396484375, 1524.19091796875, 1568.7886962890625, 1613.3865966796875, 1657.984375, 1702.582275390625, 1747.1800537109375, 1791.77783203125, 1836.375732421875, 1880.9736328125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 11.0, 19.0, 14.0, 21.0, 25.0, 28.0, 32.0, 27.0, 26.0, 36.0, 35.0, 48.0, 67.0, 62.0, 69.0, 50.0, 43.0, 51.0, 36.0, 30.0, 26.0, 29.0, 18.0, 21.0, 23.0, 17.0, 15.0, 8.0, 20.0, 11.0, 6.0, 3.0, 3.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-561.072265625, -540.8294067382812, -520.5864868164062, -500.3436279296875, -480.1007385253906, -459.85784912109375, -439.614990234375, -419.3721008300781, -399.12921142578125, -378.8863220214844, -358.6434326171875, -338.40057373046875, -318.1576843261719, -297.914794921875, -277.67193603515625, -257.4290466308594, -237.1861572265625, -216.94326782226562, -196.7003936767578, -176.45751953125, -156.21463012695312, -135.97174072265625, -115.72886657714844, -95.48599243164062, -75.24310302734375, -55.000221252441406, -34.75733947753906, -14.514457702636719, 5.728424072265625, 25.97130584716797, 46.21418762207031, 66.45706176757812, 86.69989013671875, 106.9427719116211, 127.18565368652344, 147.42852783203125, 167.67141723632812, 187.914306640625, 208.1571807861328, 228.40005493164062, 248.6429443359375, 268.8858337402344, 289.12872314453125, 309.37158203125, 329.6144714355469, 349.85736083984375, 370.1002197265625, 390.3431091308594, 410.58599853515625, 430.8288879394531, 451.07177734375, 471.31463623046875, 491.5575256347656, 511.8004150390625, 532.0432739257812, 552.2861328125, 572.529052734375, 592.7719116210938, 613.0148315429688, 633.2576904296875, 653.5006103515625, 673.7434692382812, 693.986328125, 714.229248046875, 734.4721069335938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 21.0, 38.0, 53.0, 117.0, 191.0, 393.0, 774.0, 1571.0, 3257.0, 7061.0, 17521.0, 59584.0, 312803.0, 1805955.0, 1642431.0, 263033.0, 51539.0, 15667.0, 6471.0, 2728.0, 1406.0, 691.0, 403.0, 231.0, 124.0, 82.0, 41.0, 26.0, 20.0, 9.0, 11.0, 6.0, 6.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.15771484375, -29.5966796875, -28.03564453125, -26.474609375, -24.91357421875, -23.3525390625, -21.79150390625, -20.23046875, -18.66943359375, -17.1083984375, -15.54736328125, -13.986328125, -12.42529296875, -10.8642578125, -9.30322265625, -7.7421875, -6.18115234375, -4.6201171875, -3.05908203125, -1.498046875, 0.06298828125, 1.6240234375, 3.18505859375, 4.74609375, 6.30712890625, 7.8681640625, 9.42919921875, 10.990234375, 12.55126953125, 14.1123046875, 15.67333984375, 17.234375, 18.79541015625, 20.3564453125, 21.91748046875, 23.478515625, 25.03955078125, 26.6005859375, 28.16162109375, 29.72265625, 31.28369140625, 32.8447265625, 34.40576171875, 35.966796875, 37.52783203125, 39.0888671875, 40.64990234375, 42.2109375, 43.77197265625, 45.3330078125, 46.89404296875, 48.455078125, 50.01611328125, 51.5771484375, 53.13818359375, 54.69921875, 56.26025390625, 57.8212890625, 59.38232421875, 60.943359375, 62.50439453125, 64.0654296875, 65.62646484375, 67.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 6.0, 17.0, 11.0, 22.0, 39.0, 46.0, 52.0, 62.0, 64.0, 73.0, 87.0, 85.0, 81.0, 65.0, 73.0, 51.0, 49.0, 33.0, 31.0, 9.0, 18.0, 15.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -41.71484375, -39.7421875, -37.76953125, -35.796875, -33.82421875, -31.8515625, -29.87890625, -27.90625, -25.93359375, -23.9609375, -21.98828125, -20.015625, -18.04296875, -16.0703125, -14.09765625, -12.125, -10.15234375, -8.1796875, -6.20703125, -4.234375, -2.26171875, -0.2890625, 1.68359375, 3.65625, 5.62890625, 7.6015625, 9.57421875, 11.546875, 13.51953125, 15.4921875, 17.46484375, 19.4375, 21.41015625, 23.3828125, 25.35546875, 27.328125, 29.30078125, 31.2734375, 33.24609375, 35.21875, 37.19140625, 39.1640625, 41.13671875, 43.109375, 45.08203125, 47.0546875, 49.02734375, 51.0, 52.97265625, 54.9453125, 56.91796875, 58.890625, 60.86328125, 62.8359375, 64.80859375, 66.78125, 68.75390625, 70.7265625, 72.69921875, 74.671875, 76.64453125, 78.6171875, 80.58984375, 82.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 7.0, 14.0, 19.0, 26.0, 42.0, 75.0, 114.0, 251.0, 429.0, 1048.0, 2956.0, 10096.0, 46659.0, 449647.0, 3437692.0, 203525.0, 29860.0, 7354.0, 2427.0, 1007.0, 428.0, 241.0, 142.0, 85.0, 50.0, 32.0, 20.0, 9.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.4375, -106.9169921875, -103.396484375, -99.8759765625, -96.35546875, -92.8349609375, -89.314453125, -85.7939453125, -82.2734375, -78.7529296875, -75.232421875, -71.7119140625, -68.19140625, -64.6708984375, -61.150390625, -57.6298828125, -54.109375, -50.5888671875, -47.068359375, -43.5478515625, -40.02734375, -36.5068359375, -32.986328125, -29.4658203125, -25.9453125, -22.4248046875, -18.904296875, -15.3837890625, -11.86328125, -8.3427734375, -4.822265625, -1.3017578125, 2.21875, 5.7392578125, 9.259765625, 12.7802734375, 16.30078125, 19.8212890625, 23.341796875, 26.8623046875, 30.3828125, 33.9033203125, 37.423828125, 40.9443359375, 44.46484375, 47.9853515625, 51.505859375, 55.0263671875, 58.546875, 62.0673828125, 65.587890625, 69.1083984375, 72.62890625, 76.1494140625, 79.669921875, 83.1904296875, 86.7109375, 90.2314453125, 93.751953125, 97.2724609375, 100.79296875, 104.3134765625, 107.833984375, 111.3544921875, 114.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 5.0, 9.0, 19.0, 21.0, 25.0, 28.0, 47.0, 51.0, 59.0, 100.0, 156.0, 253.0, 423.0, 632.0, 684.0, 568.0, 335.0, 198.0, 121.0, 72.0, 53.0, 38.0, 34.0, 25.0, 28.0, 12.0, 12.0, 12.0, 7.0, 7.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-85.125, -82.220703125, -79.31640625, -76.412109375, -73.5078125, -70.603515625, -67.69921875, -64.794921875, -61.890625, -58.986328125, -56.08203125, -53.177734375, -50.2734375, -47.369140625, -44.46484375, -41.560546875, -38.65625, -35.751953125, -32.84765625, -29.943359375, -27.0390625, -24.134765625, -21.23046875, -18.326171875, -15.421875, -12.517578125, -9.61328125, -6.708984375, -3.8046875, -0.900390625, 2.00390625, 4.908203125, 7.8125, 10.716796875, 13.62109375, 16.525390625, 19.4296875, 22.333984375, 25.23828125, 28.142578125, 31.046875, 33.951171875, 36.85546875, 39.759765625, 42.6640625, 45.568359375, 48.47265625, 51.376953125, 54.28125, 57.185546875, 60.08984375, 62.994140625, 65.8984375, 68.802734375, 71.70703125, 74.611328125, 77.515625, 80.419921875, 83.32421875, 86.228515625, 89.1328125, 92.037109375, 94.94140625, 97.845703125, 100.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 19.0, 21.0, 72.0, 162.0, 287.0, 236.0, 117.0, 51.0, 17.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1917.255126953125, -1866.497802734375, -1815.7403564453125, -1764.9830322265625, -1714.2257080078125, -1663.46826171875, -1612.7109375, -1561.95361328125, -1511.1961669921875, -1460.4388427734375, -1409.681396484375, -1358.924072265625, -1308.166748046875, -1257.4093017578125, -1206.6519775390625, -1155.89453125, -1105.13720703125, -1054.3798828125, -1003.6224975585938, -952.8651123046875, -902.1077270507812, -851.350341796875, -800.593017578125, -749.8356323242188, -699.078369140625, -648.3209838867188, -597.5636596679688, -546.8062744140625, -496.04888916015625, -445.2915344238281, -394.5341796875, -343.77679443359375, -293.0194091796875, -242.2620391845703, -191.50466918945312, -140.747314453125, -89.98994445800781, -39.232574462890625, 11.5247802734375, 62.28216552734375, 113.03952026367188, 163.79689025878906, 214.55426025390625, 265.3116149902344, 316.0689697265625, 366.82635498046875, 417.5837097167969, 468.3410949707031, 519.0984497070312, 569.8558349609375, 620.6131591796875, 671.3705444335938, 722.1279296875, 772.88525390625, 823.6426391601562, 874.4000244140625, 925.1573486328125, 975.9147338867188, 1026.672119140625, 1077.429443359375, 1128.186767578125, 1178.9442138671875, 1229.7015380859375, 1280.458984375, 1331.21630859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 7.0, 10.0, 12.0, 14.0, 16.0, 24.0, 29.0, 31.0, 24.0, 36.0, 42.0, 49.0, 58.0, 46.0, 63.0, 52.0, 41.0, 51.0, 52.0, 39.0, 33.0, 29.0, 30.0, 29.0, 34.0, 18.0, 26.0, 19.0, 23.0, 7.0, 3.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-502.78564453125, -487.50390625, -472.22216796875, -456.9404296875, -441.6586608886719, -426.3769226074219, -411.0951843261719, -395.8134460449219, -380.53167724609375, -365.24993896484375, -349.96820068359375, -334.68646240234375, -319.4046936035156, -304.1229553222656, -288.8412170410156, -273.5594787597656, -258.2777404785156, -242.99600219726562, -227.71424865722656, -212.43251037597656, -197.1507568359375, -181.8690185546875, -166.5872802734375, -151.3055419921875, -136.02378845214844, -120.7420425415039, -105.46029663085938, -90.17855834960938, -74.89681243896484, -59.61506652832031, -44.33332824707031, -29.05158233642578, -13.76983642578125, 1.5119075775146484, 16.793651580810547, 32.07539367675781, 47.357139587402344, 62.638885498046875, 77.92062377929688, 93.2023696899414, 108.48411560058594, 123.76586151123047, 139.047607421875, 154.329345703125, 169.611083984375, 184.89283752441406, 200.17457580566406, 215.45632934570312, 230.73806762695312, 246.01980590820312, 261.3015441894531, 276.58331298828125, 291.86505126953125, 307.14678955078125, 322.42852783203125, 337.71026611328125, 352.99200439453125, 368.27374267578125, 383.55548095703125, 398.83721923828125, 414.1189880371094, 429.4007263183594, 444.6824645996094, 459.9642028808594, 475.2459716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 1.0, 11.0, 10.0, 21.0, 45.0, 65.0, 110.0, 201.0, 360.0, 700.0, 1504.0, 3167.0, 7517.0, 20044.0, 58044.0, 204418.0, 502920.0, 169535.0, 50151.0, 17278.0, 6808.0, 2922.0, 1303.0, 670.0, 337.0, 162.0, 104.0, 53.0, 24.0, 38.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5, -83.748046875, -80.99609375, -78.244140625, -75.4921875, -72.740234375, -69.98828125, -67.236328125, -64.484375, -61.732421875, -58.98046875, -56.228515625, -53.4765625, -50.724609375, -47.97265625, -45.220703125, -42.46875, -39.716796875, -36.96484375, -34.212890625, -31.4609375, -28.708984375, -25.95703125, -23.205078125, -20.453125, -17.701171875, -14.94921875, -12.197265625, -9.4453125, -6.693359375, -3.94140625, -1.189453125, 1.5625, 4.314453125, 7.06640625, 9.818359375, 12.5703125, 15.322265625, 18.07421875, 20.826171875, 23.578125, 26.330078125, 29.08203125, 31.833984375, 34.5859375, 37.337890625, 40.08984375, 42.841796875, 45.59375, 48.345703125, 51.09765625, 53.849609375, 56.6015625, 59.353515625, 62.10546875, 64.857421875, 67.609375, 70.361328125, 73.11328125, 75.865234375, 78.6171875, 81.369140625, 84.12109375, 86.873046875, 89.625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 12.0, 13.0, 23.0, 28.0, 25.0, 63.0, 64.0, 68.0, 78.0, 84.0, 93.0, 67.0, 76.0, 80.0, 61.0, 33.0, 34.0, 39.0, 19.0, 19.0, 8.0, 7.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.875, -50.72265625, -48.5703125, -46.41796875, -44.265625, -42.11328125, -39.9609375, -37.80859375, -35.65625, -33.50390625, -31.3515625, -29.19921875, -27.046875, -24.89453125, -22.7421875, -20.58984375, -18.4375, -16.28515625, -14.1328125, -11.98046875, -9.828125, -7.67578125, -5.5234375, -3.37109375, -1.21875, 0.93359375, 3.0859375, 5.23828125, 7.390625, 9.54296875, 11.6953125, 13.84765625, 16.0, 18.15234375, 20.3046875, 22.45703125, 24.609375, 26.76171875, 28.9140625, 31.06640625, 33.21875, 35.37109375, 37.5234375, 39.67578125, 41.828125, 43.98046875, 46.1328125, 48.28515625, 50.4375, 52.58984375, 54.7421875, 56.89453125, 59.046875, 61.19921875, 63.3515625, 65.50390625, 67.65625, 69.80859375, 71.9609375, 74.11328125, 76.265625, 78.41796875, 80.5703125, 82.72265625, 84.875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 17.0, 22.0, 52.0, 53.0, 83.0, 165.0, 271.0, 515.0, 915.0, 2230.0, 7789.0, 47481.0, 743147.0, 217415.0, 20791.0, 4375.0, 1484.0, 744.0, 380.0, 225.0, 114.0, 79.0, 66.0, 30.0, 24.0, 19.0, 10.0, 7.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -150.548828125, -144.22265625, -137.896484375, -131.5703125, -125.244140625, -118.91796875, -112.591796875, -106.265625, -99.939453125, -93.61328125, -87.287109375, -80.9609375, -74.634765625, -68.30859375, -61.982421875, -55.65625, -49.330078125, -43.00390625, -36.677734375, -30.3515625, -24.025390625, -17.69921875, -11.373046875, -5.046875, 1.279296875, 7.60546875, 13.931640625, 20.2578125, 26.583984375, 32.91015625, 39.236328125, 45.5625, 51.888671875, 58.21484375, 64.541015625, 70.8671875, 77.193359375, 83.51953125, 89.845703125, 96.171875, 102.498046875, 108.82421875, 115.150390625, 121.4765625, 127.802734375, 134.12890625, 140.455078125, 146.78125, 153.107421875, 159.43359375, 165.759765625, 172.0859375, 178.412109375, 184.73828125, 191.064453125, 197.390625, 203.716796875, 210.04296875, 216.369140625, 222.6953125, 229.021484375, 235.34765625, 241.673828125, 248.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 22.0, 35.0, 50.0, 64.0, 68.0, 99.0, 93.0, 101.0, 95.0, 86.0, 66.0, 53.0, 46.0, 22.0, 23.0, 19.0, 14.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.75, -260.83984375, -250.9296875, -241.01953125, -231.109375, -221.19921875, -211.2890625, -201.37890625, -191.46875, -181.55859375, -171.6484375, -161.73828125, -151.828125, -141.91796875, -132.0078125, -122.09765625, -112.1875, -102.27734375, -92.3671875, -82.45703125, -72.546875, -62.63671875, -52.7265625, -42.81640625, -32.90625, -22.99609375, -13.0859375, -3.17578125, 6.734375, 16.64453125, 26.5546875, 36.46484375, 46.375, 56.28515625, 66.1953125, 76.10546875, 86.015625, 95.92578125, 105.8359375, 115.74609375, 125.65625, 135.56640625, 145.4765625, 155.38671875, 165.296875, 175.20703125, 185.1171875, 195.02734375, 204.9375, 214.84765625, 224.7578125, 234.66796875, 244.578125, 254.48828125, 264.3984375, 274.30859375, 284.21875, 294.12890625, 304.0390625, 313.94921875, 323.859375, 333.76953125, 343.6796875, 353.58984375, 363.5]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 12.0, 17.0, 35.0, 49.0, 67.0, 81.0, 144.0, 263.0, 405.0, 666.0, 1376.0, 2832.0, 6746.0, 18861.0, 71853.0, 575286.0, 293068.0, 51585.0, 14607.0, 5568.0, 2364.0, 1095.0, 582.0, 364.0, 223.0, 115.0, 76.0, 46.0, 45.0, 22.0, 25.0, 20.0, 14.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.5625, -41.1845703125, -39.806640625, -38.4287109375, -37.05078125, -35.6728515625, -34.294921875, -32.9169921875, -31.5390625, -30.1611328125, -28.783203125, -27.4052734375, -26.02734375, -24.6494140625, -23.271484375, -21.8935546875, -20.515625, -19.1376953125, -17.759765625, -16.3818359375, -15.00390625, -13.6259765625, -12.248046875, -10.8701171875, -9.4921875, -8.1142578125, -6.736328125, -5.3583984375, -3.98046875, -2.6025390625, -1.224609375, 0.1533203125, 1.53125, 2.9091796875, 4.287109375, 5.6650390625, 7.04296875, 8.4208984375, 9.798828125, 11.1767578125, 12.5546875, 13.9326171875, 15.310546875, 16.6884765625, 18.06640625, 19.4443359375, 20.822265625, 22.2001953125, 23.578125, 24.9560546875, 26.333984375, 27.7119140625, 29.08984375, 30.4677734375, 31.845703125, 33.2236328125, 34.6015625, 35.9794921875, 37.357421875, 38.7353515625, 40.11328125, 41.4912109375, 42.869140625, 44.2470703125, 45.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 7.0, 9.0, 11.0, 9.0, 13.0, 22.0, 20.0, 36.0, 55.0, 87.0, 135.0, 127.0, 138.0, 99.0, 66.0, 39.0, 36.0, 20.0, 10.0, 13.0, 6.0, 5.0, 8.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0214691162109375, -0.02088308334350586, -0.02029705047607422, -0.019711017608642578, -0.019124984741210938, -0.018538951873779297, -0.017952919006347656, -0.017366886138916016, -0.016780853271484375, -0.016194820404052734, -0.015608787536621094, -0.015022754669189453, -0.014436721801757812, -0.013850688934326172, -0.013264656066894531, -0.01267862319946289, -0.01209259033203125, -0.01150655746459961, -0.010920524597167969, -0.010334491729736328, -0.009748458862304688, -0.009162425994873047, -0.008576393127441406, -0.007990360260009766, -0.007404327392578125, -0.006818294525146484, -0.006232261657714844, -0.005646228790283203, -0.0050601959228515625, -0.004474163055419922, -0.0038881301879882812, -0.0033020973205566406, -0.002716064453125, -0.0021300315856933594, -0.0015439987182617188, -0.0009579658508300781, -0.0003719329833984375, 0.00021409988403320312, 0.0008001327514648438, 0.0013861656188964844, 0.001972198486328125, 0.0025582313537597656, 0.0031442642211914062, 0.003730297088623047, 0.0043163299560546875, 0.004902362823486328, 0.005488395690917969, 0.006074428558349609, 0.00666046142578125, 0.007246494293212891, 0.007832527160644531, 0.008418560028076172, 0.009004592895507812, 0.009590625762939453, 0.010176658630371094, 0.010762691497802734, 0.011348724365234375, 0.011934757232666016, 0.012520790100097656, 0.013106822967529297, 0.013692855834960938, 0.014278888702392578, 0.014864921569824219, 0.01545095443725586, 0.0160369873046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 16.0, 12.0, 26.0, 38.0, 49.0, 80.0, 101.0, 147.0, 211.0, 361.0, 651.0, 1292.0, 2624.0, 6720.0, 20560.0, 86577.0, 606980.0, 253168.0, 46984.0, 12940.0, 4531.0, 1974.0, 1009.0, 535.0, 301.0, 176.0, 147.0, 103.0, 65.0, 43.0, 35.0, 32.0, 15.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.71875, -34.43408203125, -33.1494140625, -31.86474609375, -30.580078125, -29.29541015625, -28.0107421875, -26.72607421875, -25.44140625, -24.15673828125, -22.8720703125, -21.58740234375, -20.302734375, -19.01806640625, -17.7333984375, -16.44873046875, -15.1640625, -13.87939453125, -12.5947265625, -11.31005859375, -10.025390625, -8.74072265625, -7.4560546875, -6.17138671875, -4.88671875, -3.60205078125, -2.3173828125, -1.03271484375, 0.251953125, 1.53662109375, 2.8212890625, 4.10595703125, 5.390625, 6.67529296875, 7.9599609375, 9.24462890625, 10.529296875, 11.81396484375, 13.0986328125, 14.38330078125, 15.66796875, 16.95263671875, 18.2373046875, 19.52197265625, 20.806640625, 22.09130859375, 23.3759765625, 24.66064453125, 25.9453125, 27.22998046875, 28.5146484375, 29.79931640625, 31.083984375, 32.36865234375, 33.6533203125, 34.93798828125, 36.22265625, 37.50732421875, 38.7919921875, 40.07666015625, 41.361328125, 42.64599609375, 43.9306640625, 45.21533203125, 46.5]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 5.0, 12.0, 15.0, 15.0, 25.0, 31.0, 33.0, 29.0, 35.0, 42.0, 55.0, 54.0, 59.0, 65.0, 77.0, 60.0, 62.0, 40.0, 33.0, 45.0, 29.0, 23.0, 13.0, 20.0, 21.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.40625, -27.4072265625, -26.408203125, -25.4091796875, -24.41015625, -23.4111328125, -22.412109375, -21.4130859375, -20.4140625, -19.4150390625, -18.416015625, -17.4169921875, -16.41796875, -15.4189453125, -14.419921875, -13.4208984375, -12.421875, -11.4228515625, -10.423828125, -9.4248046875, -8.42578125, -7.4267578125, -6.427734375, -5.4287109375, -4.4296875, -3.4306640625, -2.431640625, -1.4326171875, -0.43359375, 0.5654296875, 1.564453125, 2.5634765625, 3.5625, 4.5615234375, 5.560546875, 6.5595703125, 7.55859375, 8.5576171875, 9.556640625, 10.5556640625, 11.5546875, 12.5537109375, 13.552734375, 14.5517578125, 15.55078125, 16.5498046875, 17.548828125, 18.5478515625, 19.546875, 20.5458984375, 21.544921875, 22.5439453125, 23.54296875, 24.5419921875, 25.541015625, 26.5400390625, 27.5390625, 28.5380859375, 29.537109375, 30.5361328125, 31.53515625, 32.5341796875, 33.533203125, 34.5322265625, 35.53125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 11.0, 18.0, 39.0, 75.0, 119.0, 186.0, 248.0, 123.0, 64.0, 39.0, 23.0, 19.0, 10.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1224.50927734375, -1190.79345703125, -1157.07763671875, -1123.3616943359375, -1089.6458740234375, -1055.9300537109375, -1022.2142333984375, -988.4984130859375, -954.7825317382812, -921.0667114257812, -887.350830078125, -853.635009765625, -819.919189453125, -786.2033081054688, -752.4874877929688, -718.7716064453125, -685.0557861328125, -651.3399658203125, -617.6240844726562, -583.9082641601562, -550.1923828125, -516.4765625, -482.7607421875, -449.0448913574219, -415.32904052734375, -381.6131896972656, -347.8973388671875, -314.1815185546875, -280.4656677246094, -246.74981689453125, -213.0339813232422, -179.31814575195312, -145.60223388671875, -111.88639068603516, -78.17054748535156, -44.45470428466797, -10.738861083984375, 22.97698974609375, 56.69282531738281, 90.40866088867188, 124.12451171875, 157.84036254882812, 191.5561981201172, 225.27203369140625, 258.9878845214844, 292.7037353515625, 326.4195556640625, 360.1354064941406, 393.85125732421875, 427.5671081542969, 461.282958984375, 494.998779296875, 528.714599609375, 562.4304809570312, 596.1463012695312, 629.8621826171875, 663.5780029296875, 697.2938232421875, 731.0097045898438, 764.7255249023438, 798.44140625, 832.1572265625, 865.873046875, 899.5888671875, 933.3047485351562]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 8.0, 8.0, 22.0, 16.0, 15.0, 13.0, 19.0, 22.0, 17.0, 29.0, 27.0, 38.0, 37.0, 36.0, 42.0, 69.0, 82.0, 74.0, 56.0, 50.0, 52.0, 32.0, 26.0, 35.0, 33.0, 22.0, 20.0, 18.0, 11.0, 19.0, 6.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.338134765625, -599.2092895507812, -577.0805053710938, -554.95166015625, -532.8228149414062, -510.6940002441406, -488.565185546875, -466.43634033203125, -444.3075256347656, -422.1787109375, -400.04986572265625, -377.9210510253906, -355.792236328125, -333.66339111328125, -311.5345764160156, -289.40576171875, -267.27691650390625, -245.14808654785156, -223.01925659179688, -200.89044189453125, -178.76161193847656, -156.63278198242188, -134.50396728515625, -112.37513732910156, -90.24630737304688, -68.11747741699219, -45.98865509033203, -23.859832763671875, -1.7310028076171875, 20.3978271484375, 42.526641845703125, 64.65547180175781, 86.78436279296875, 108.91319274902344, 131.04202270507812, 153.17083740234375, 175.29966735839844, 197.42849731445312, 219.55731201171875, 241.68614196777344, 263.8149719238281, 285.94378662109375, 308.0726318359375, 330.2014465332031, 352.33026123046875, 374.4591064453125, 396.5879211425781, 418.71673583984375, 440.8455810546875, 462.9743957519531, 485.1032409667969, 507.2320556640625, 529.3609008789062, 551.48974609375, 573.6185302734375, 595.7473754882812, 617.876220703125, 640.0050659179688, 662.1338500976562, 684.2626953125, 706.3915405273438, 728.5203857421875, 750.649169921875, 772.7780151367188, 794.9067993164062]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 10.0, 21.0, 30.0, 35.0, 57.0, 99.0, 146.0, 226.0, 394.0, 706.0, 1249.0, 2478.0, 5664.0, 15421.0, 67333.0, 658834.0, 2894341.0, 470632.0, 53549.0, 13219.0, 4880.0, 2151.0, 1158.0, 591.0, 387.0, 193.0, 152.0, 95.0, 67.0, 40.0, 31.0, 21.0, 12.0, 8.0, 10.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.4375, -63.287109375, -61.13671875, -58.986328125, -56.8359375, -54.685546875, -52.53515625, -50.384765625, -48.234375, -46.083984375, -43.93359375, -41.783203125, -39.6328125, -37.482421875, -35.33203125, -33.181640625, -31.03125, -28.880859375, -26.73046875, -24.580078125, -22.4296875, -20.279296875, -18.12890625, -15.978515625, -13.828125, -11.677734375, -9.52734375, -7.376953125, -5.2265625, -3.076171875, -0.92578125, 1.224609375, 3.375, 5.525390625, 7.67578125, 9.826171875, 11.9765625, 14.126953125, 16.27734375, 18.427734375, 20.578125, 22.728515625, 24.87890625, 27.029296875, 29.1796875, 31.330078125, 33.48046875, 35.630859375, 37.78125, 39.931640625, 42.08203125, 44.232421875, 46.3828125, 48.533203125, 50.68359375, 52.833984375, 54.984375, 57.134765625, 59.28515625, 61.435546875, 63.5859375, 65.736328125, 67.88671875, 70.037109375, 72.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 14.0, 11.0, 11.0, 16.0, 22.0, 31.0, 45.0, 51.0, 44.0, 49.0, 59.0, 67.0, 60.0, 63.0, 75.0, 58.0, 55.0, 37.0, 45.0, 49.0, 25.0, 25.0, 20.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.875, -52.3740234375, -50.873046875, -49.3720703125, -47.87109375, -46.3701171875, -44.869140625, -43.3681640625, -41.8671875, -40.3662109375, -38.865234375, -37.3642578125, -35.86328125, -34.3623046875, -32.861328125, -31.3603515625, -29.859375, -28.3583984375, -26.857421875, -25.3564453125, -23.85546875, -22.3544921875, -20.853515625, -19.3525390625, -17.8515625, -16.3505859375, -14.849609375, -13.3486328125, -11.84765625, -10.3466796875, -8.845703125, -7.3447265625, -5.84375, -4.3427734375, -2.841796875, -1.3408203125, 0.16015625, 1.6611328125, 3.162109375, 4.6630859375, 6.1640625, 7.6650390625, 9.166015625, 10.6669921875, 12.16796875, 13.6689453125, 15.169921875, 16.6708984375, 18.171875, 19.6728515625, 21.173828125, 22.6748046875, 24.17578125, 25.6767578125, 27.177734375, 28.6787109375, 30.1796875, 31.6806640625, 33.181640625, 34.6826171875, 36.18359375, 37.6845703125, 39.185546875, 40.6865234375, 42.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 16.0, 25.0, 32.0, 47.0, 73.0, 106.0, 153.0, 236.0, 440.0, 1419.0, 21920.0, 4090630.0, 75264.0, 2581.0, 611.0, 238.0, 156.0, 120.0, 63.0, 51.0, 41.0, 20.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-364.75, -353.57421875, -342.3984375, -331.22265625, -320.046875, -308.87109375, -297.6953125, -286.51953125, -275.34375, -264.16796875, -252.9921875, -241.81640625, -230.640625, -219.46484375, -208.2890625, -197.11328125, -185.9375, -174.76171875, -163.5859375, -152.41015625, -141.234375, -130.05859375, -118.8828125, -107.70703125, -96.53125, -85.35546875, -74.1796875, -63.00390625, -51.828125, -40.65234375, -29.4765625, -18.30078125, -7.125, 4.05078125, 15.2265625, 26.40234375, 37.578125, 48.75390625, 59.9296875, 71.10546875, 82.28125, 93.45703125, 104.6328125, 115.80859375, 126.984375, 138.16015625, 149.3359375, 160.51171875, 171.6875, 182.86328125, 194.0390625, 205.21484375, 216.390625, 227.56640625, 238.7421875, 249.91796875, 261.09375, 272.26953125, 283.4453125, 294.62109375, 305.796875, 316.97265625, 328.1484375, 339.32421875, 350.5]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 28.0, 48.0, 118.0, 335.0, 1260.0, 1639.0, 409.0, 128.0, 43.0, 24.0, 16.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.0, -282.71484375, -274.4296875, -266.14453125, -257.859375, -249.57421875, -241.2890625, -233.00390625, -224.71875, -216.43359375, -208.1484375, -199.86328125, -191.578125, -183.29296875, -175.0078125, -166.72265625, -158.4375, -150.15234375, -141.8671875, -133.58203125, -125.296875, -117.01171875, -108.7265625, -100.44140625, -92.15625, -83.87109375, -75.5859375, -67.30078125, -59.015625, -50.73046875, -42.4453125, -34.16015625, -25.875, -17.58984375, -9.3046875, -1.01953125, 7.265625, 15.55078125, 23.8359375, 32.12109375, 40.40625, 48.69140625, 56.9765625, 65.26171875, 73.546875, 81.83203125, 90.1171875, 98.40234375, 106.6875, 114.97265625, 123.2578125, 131.54296875, 139.828125, 148.11328125, 156.3984375, 164.68359375, 172.96875, 181.25390625, 189.5390625, 197.82421875, 206.109375, 214.39453125, 222.6796875, 230.96484375, 239.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 30.0, 58.0, 85.0, 193.0, 276.0, 188.0, 72.0, 34.0, 17.0, 13.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1509.131591796875, -1458.294921875, -1407.4583740234375, -1356.6217041015625, -1305.78515625, -1254.948486328125, -1204.11181640625, -1153.2752685546875, -1102.4385986328125, -1051.6019287109375, -1000.765380859375, -949.9287109375, -899.0921020507812, -848.2554931640625, -797.4188842773438, -746.582275390625, -695.7456665039062, -644.9090576171875, -594.0724487304688, -543.23583984375, -492.399169921875, -441.56256103515625, -390.7259521484375, -339.8893127441406, -289.0527038574219, -238.21607971191406, -187.37945556640625, -136.5428466796875, -85.70622253417969, -34.869598388671875, 15.967010498046875, 66.80364990234375, 117.6402587890625, 168.4768829345703, 219.31350708007812, 270.1501159667969, 320.98675537109375, 371.8233642578125, 422.65997314453125, 473.4966125488281, 524.333251953125, 575.1698608398438, 626.0064697265625, 676.8431396484375, 727.6797485351562, 778.516357421875, 829.3529663085938, 880.1895751953125, 931.0261840820312, 981.86279296875, 1032.699462890625, 1083.5360107421875, 1134.3726806640625, 1185.209228515625, 1236.0458984375, 1286.882568359375, 1337.7191162109375, 1388.5557861328125, 1439.392333984375, 1490.22900390625, 1541.0655517578125, 1591.9022216796875, 1642.73876953125, 1693.575439453125, 1744.412109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 11.0, 9.0, 8.0, 20.0, 27.0, 27.0, 25.0, 36.0, 45.0, 41.0, 49.0, 52.0, 56.0, 55.0, 53.0, 60.0, 56.0, 60.0, 54.0, 44.0, 35.0, 36.0, 33.0, 22.0, 21.0, 16.0, 16.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2180786132812, -570.8192138671875, -552.4203491210938, -534.0214233398438, -515.62255859375, -497.22369384765625, -478.8248291015625, -460.42596435546875, -442.0270690917969, -423.6282043457031, -405.22930908203125, -386.8304443359375, -368.43157958984375, -350.0326843261719, -331.6338195800781, -313.23492431640625, -294.8360595703125, -276.43719482421875, -258.0382995605469, -239.63943481445312, -221.2405548095703, -202.8416748046875, -184.44281005859375, -166.04393005371094, -147.64505004882812, -129.2461700439453, -110.84729766845703, -92.44842529296875, -74.04954528808594, -55.650665283203125, -37.251792907714844, -18.852920532226562, -0.4541015625, 17.944774627685547, 36.343650817871094, 54.74252700805664, 73.14140319824219, 91.540283203125, 109.93915557861328, 128.33802795410156, 146.73690795898438, 165.1357879638672, 183.53466796875, 201.93353271484375, 220.33241271972656, 238.73129272460938, 257.1301574707031, 275.529052734375, 293.92791748046875, 312.3267822265625, 330.7256774902344, 349.1245422363281, 367.5234375, 385.92230224609375, 404.3211669921875, 422.72003173828125, 441.1189270019531, 459.5177917480469, 477.91668701171875, 496.3155517578125, 514.7144165039062, 533.11328125, 551.51220703125, 569.9110717773438, 588.3099365234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 11.0, 14.0, 28.0, 35.0, 65.0, 75.0, 104.0, 173.0, 264.0, 381.0, 675.0, 1009.0, 1639.0, 2715.0, 4614.0, 8333.0, 15642.0, 30873.0, 64199.0, 143086.0, 292468.0, 254336.0, 117494.0, 53493.0, 25908.0, 13289.0, 7105.0, 4119.0, 2413.0, 1435.0, 900.0, 555.0, 354.0, 256.0, 177.0, 119.0, 55.0, 44.0, 26.0, 20.0, 13.0, 9.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-44.46875, -43.1162109375, -41.763671875, -40.4111328125, -39.05859375, -37.7060546875, -36.353515625, -35.0009765625, -33.6484375, -32.2958984375, -30.943359375, -29.5908203125, -28.23828125, -26.8857421875, -25.533203125, -24.1806640625, -22.828125, -21.4755859375, -20.123046875, -18.7705078125, -17.41796875, -16.0654296875, -14.712890625, -13.3603515625, -12.0078125, -10.6552734375, -9.302734375, -7.9501953125, -6.59765625, -5.2451171875, -3.892578125, -2.5400390625, -1.1875, 0.1650390625, 1.517578125, 2.8701171875, 4.22265625, 5.5751953125, 6.927734375, 8.2802734375, 9.6328125, 10.9853515625, 12.337890625, 13.6904296875, 15.04296875, 16.3955078125, 17.748046875, 19.1005859375, 20.453125, 21.8056640625, 23.158203125, 24.5107421875, 25.86328125, 27.2158203125, 28.568359375, 29.9208984375, 31.2734375, 32.6259765625, 33.978515625, 35.3310546875, 36.68359375, 38.0361328125, 39.388671875, 40.7412109375, 42.09375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 12.0, 10.0, 13.0, 19.0, 23.0, 37.0, 35.0, 50.0, 48.0, 57.0, 55.0, 51.0, 62.0, 53.0, 59.0, 56.0, 61.0, 50.0, 36.0, 36.0, 30.0, 26.0, 22.0, 26.0, 6.0, 18.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.15625, -53.5771484375, -51.998046875, -50.4189453125, -48.83984375, -47.2607421875, -45.681640625, -44.1025390625, -42.5234375, -40.9443359375, -39.365234375, -37.7861328125, -36.20703125, -34.6279296875, -33.048828125, -31.4697265625, -29.890625, -28.3115234375, -26.732421875, -25.1533203125, -23.57421875, -21.9951171875, -20.416015625, -18.8369140625, -17.2578125, -15.6787109375, -14.099609375, -12.5205078125, -10.94140625, -9.3623046875, -7.783203125, -6.2041015625, -4.625, -3.0458984375, -1.466796875, 0.1123046875, 1.69140625, 3.2705078125, 4.849609375, 6.4287109375, 8.0078125, 9.5869140625, 11.166015625, 12.7451171875, 14.32421875, 15.9033203125, 17.482421875, 19.0615234375, 20.640625, 22.2197265625, 23.798828125, 25.3779296875, 26.95703125, 28.5361328125, 30.115234375, 31.6943359375, 33.2734375, 34.8525390625, 36.431640625, 38.0107421875, 39.58984375, 41.1689453125, 42.748046875, 44.3271484375, 45.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 19.0, 22.0, 21.0, 46.0, 83.0, 199.0, 442.0, 1152.0, 3208.0, 11024.0, 54963.0, 610550.0, 314279.0, 39696.0, 8518.0, 2588.0, 927.0, 388.0, 181.0, 85.0, 46.0, 35.0, 25.0, 12.0, 3.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0, -116.814453125, -112.62890625, -108.443359375, -104.2578125, -100.072265625, -95.88671875, -91.701171875, -87.515625, -83.330078125, -79.14453125, -74.958984375, -70.7734375, -66.587890625, -62.40234375, -58.216796875, -54.03125, -49.845703125, -45.66015625, -41.474609375, -37.2890625, -33.103515625, -28.91796875, -24.732421875, -20.546875, -16.361328125, -12.17578125, -7.990234375, -3.8046875, 0.380859375, 4.56640625, 8.751953125, 12.9375, 17.123046875, 21.30859375, 25.494140625, 29.6796875, 33.865234375, 38.05078125, 42.236328125, 46.421875, 50.607421875, 54.79296875, 58.978515625, 63.1640625, 67.349609375, 71.53515625, 75.720703125, 79.90625, 84.091796875, 88.27734375, 92.462890625, 96.6484375, 100.833984375, 105.01953125, 109.205078125, 113.390625, 117.576171875, 121.76171875, 125.947265625, 130.1328125, 134.318359375, 138.50390625, 142.689453125, 146.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 9.0, 8.0, 13.0, 28.0, 28.0, 38.0, 32.0, 46.0, 45.0, 51.0, 64.0, 58.0, 52.0, 62.0, 78.0, 46.0, 48.0, 44.0, 43.0, 28.0, 32.0, 36.0, 13.0, 22.0, 6.0, 12.0, 5.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-200.125, -194.01171875, -187.8984375, -181.78515625, -175.671875, -169.55859375, -163.4453125, -157.33203125, -151.21875, -145.10546875, -138.9921875, -132.87890625, -126.765625, -120.65234375, -114.5390625, -108.42578125, -102.3125, -96.19921875, -90.0859375, -83.97265625, -77.859375, -71.74609375, -65.6328125, -59.51953125, -53.40625, -47.29296875, -41.1796875, -35.06640625, -28.953125, -22.83984375, -16.7265625, -10.61328125, -4.5, 1.61328125, 7.7265625, 13.83984375, 19.953125, 26.06640625, 32.1796875, 38.29296875, 44.40625, 50.51953125, 56.6328125, 62.74609375, 68.859375, 74.97265625, 81.0859375, 87.19921875, 93.3125, 99.42578125, 105.5390625, 111.65234375, 117.765625, 123.87890625, 129.9921875, 136.10546875, 142.21875, 148.33203125, 154.4453125, 160.55859375, 166.671875, 172.78515625, 178.8984375, 185.01171875, 191.125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 12.0, 21.0, 21.0, 41.0, 54.0, 109.0, 205.0, 425.0, 997.0, 2590.0, 8855.0, 35096.0, 166522.0, 641214.0, 148259.0, 31623.0, 8108.0, 2548.0, 961.0, 383.0, 212.0, 103.0, 58.0, 37.0, 24.0, 17.0, 15.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.1875, -30.226806640625, -29.26611328125, -28.305419921875, -27.3447265625, -26.384033203125, -25.42333984375, -24.462646484375, -23.501953125, -22.541259765625, -21.58056640625, -20.619873046875, -19.6591796875, -18.698486328125, -17.73779296875, -16.777099609375, -15.81640625, -14.855712890625, -13.89501953125, -12.934326171875, -11.9736328125, -11.012939453125, -10.05224609375, -9.091552734375, -8.130859375, -7.170166015625, -6.20947265625, -5.248779296875, -4.2880859375, -3.327392578125, -2.36669921875, -1.406005859375, -0.4453125, 0.515380859375, 1.47607421875, 2.436767578125, 3.3974609375, 4.358154296875, 5.31884765625, 6.279541015625, 7.240234375, 8.200927734375, 9.16162109375, 10.122314453125, 11.0830078125, 12.043701171875, 13.00439453125, 13.965087890625, 14.92578125, 15.886474609375, 16.84716796875, 17.807861328125, 18.7685546875, 19.729248046875, 20.68994140625, 21.650634765625, 22.611328125, 23.572021484375, 24.53271484375, 25.493408203125, 26.4541015625, 27.414794921875, 28.37548828125, 29.336181640625, 30.296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 10.0, 13.0, 13.0, 19.0, 25.0, 33.0, 36.0, 53.0, 61.0, 74.0, 72.0, 81.0, 94.0, 71.0, 76.0, 44.0, 54.0, 28.0, 27.0, 26.0, 15.0, 9.0, 9.0, 8.0, 7.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010815560817718506, -0.010530352592468262, -0.010245144367218018, -0.009959936141967773, -0.00967472791671753, -0.009389519691467285, -0.009104311466217041, -0.008819103240966797, -0.008533895015716553, -0.008248686790466309, -0.007963478565216064, -0.00767827033996582, -0.007393062114715576, -0.007107853889465332, -0.006822645664215088, -0.006537437438964844, -0.0062522292137146, -0.0059670209884643555, -0.005681812763214111, -0.005396604537963867, -0.005111396312713623, -0.004826188087463379, -0.004540979862213135, -0.004255771636962891, -0.0039705634117126465, -0.0036853551864624023, -0.003400146961212158, -0.003114938735961914, -0.00282973051071167, -0.0025445222854614258, -0.0022593140602111816, -0.0019741058349609375, -0.0016888976097106934, -0.0014036893844604492, -0.001118481159210205, -0.0008332729339599609, -0.0005480647087097168, -0.00026285648345947266, 2.2351741790771484e-05, 0.0003075599670410156, 0.0005927681922912598, 0.0008779764175415039, 0.001163184642791748, 0.0014483928680419922, 0.0017336010932922363, 0.0020188093185424805, 0.0023040175437927246, 0.0025892257690429688, 0.002874433994293213, 0.003159642219543457, 0.003444850444793701, 0.0037300586700439453, 0.0040152668952941895, 0.004300475120544434, 0.004585683345794678, 0.004870891571044922, 0.005156099796295166, 0.00544130802154541, 0.005726516246795654, 0.0060117244720458984, 0.006296932697296143, 0.006582140922546387, 0.006867349147796631, 0.007152557373046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 9.0, 25.0, 38.0, 82.0, 141.0, 243.0, 581.0, 1483.0, 4299.0, 16100.0, 77608.0, 567917.0, 306886.0, 55340.0, 12047.0, 3483.0, 1236.0, 516.0, 239.0, 118.0, 57.0, 32.0, 23.0, 14.0, 6.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.125, -27.0390625, -25.953125, -24.8671875, -23.78125, -22.6953125, -21.609375, -20.5234375, -19.4375, -18.3515625, -17.265625, -16.1796875, -15.09375, -14.0078125, -12.921875, -11.8359375, -10.75, -9.6640625, -8.578125, -7.4921875, -6.40625, -5.3203125, -4.234375, -3.1484375, -2.0625, -0.9765625, 0.109375, 1.1953125, 2.28125, 3.3671875, 4.453125, 5.5390625, 6.625, 7.7109375, 8.796875, 9.8828125, 10.96875, 12.0546875, 13.140625, 14.2265625, 15.3125, 16.3984375, 17.484375, 18.5703125, 19.65625, 20.7421875, 21.828125, 22.9140625, 24.0, 25.0859375, 26.171875, 27.2578125, 28.34375, 29.4296875, 30.515625, 31.6015625, 32.6875, 33.7734375, 34.859375, 35.9453125, 37.03125, 38.1171875, 39.203125, 40.2890625, 41.375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 13.0, 13.0, 18.0, 28.0, 35.0, 42.0, 61.0, 65.0, 80.0, 70.0, 73.0, 96.0, 53.0, 76.0, 48.0, 50.0, 34.0, 39.0, 20.0, 23.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-42.21875, -41.120361328125, -40.02197265625, -38.923583984375, -37.8251953125, -36.726806640625, -35.62841796875, -34.530029296875, -33.431640625, -32.333251953125, -31.23486328125, -30.136474609375, -29.0380859375, -27.939697265625, -26.84130859375, -25.742919921875, -24.64453125, -23.546142578125, -22.44775390625, -21.349365234375, -20.2509765625, -19.152587890625, -18.05419921875, -16.955810546875, -15.857421875, -14.759033203125, -13.66064453125, -12.562255859375, -11.4638671875, -10.365478515625, -9.26708984375, -8.168701171875, -7.0703125, -5.971923828125, -4.87353515625, -3.775146484375, -2.6767578125, -1.578369140625, -0.47998046875, 0.618408203125, 1.716796875, 2.815185546875, 3.91357421875, 5.011962890625, 6.1103515625, 7.208740234375, 8.30712890625, 9.405517578125, 10.50390625, 11.602294921875, 12.70068359375, 13.799072265625, 14.8974609375, 15.995849609375, 17.09423828125, 18.192626953125, 19.291015625, 20.389404296875, 21.48779296875, 22.586181640625, 23.6845703125, 24.782958984375, 25.88134765625, 26.979736328125, 28.078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 25.0, 56.0, 139.0, 359.0, 263.0, 79.0, 40.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1960.0020751953125, -1916.3197021484375, -1872.637451171875, -1828.955078125, -1785.272705078125, -1741.5904541015625, -1697.9080810546875, -1654.225830078125, -1610.54345703125, -1566.861083984375, -1523.1788330078125, -1479.4964599609375, -1435.8140869140625, -1392.1318359375, -1348.449462890625, -1304.76708984375, -1261.084716796875, -1217.40234375, -1173.7200927734375, -1130.0377197265625, -1086.3553466796875, -1042.673095703125, -998.99072265625, -955.3084106445312, -911.6260986328125, -867.9437866210938, -824.2614135742188, -780.5791015625, -736.8967895507812, -693.2144775390625, -649.5321044921875, -605.8497924804688, -562.16748046875, -518.4851684570312, -474.8028259277344, -431.1204833984375, -387.43817138671875, -343.7558288574219, -300.073486328125, -256.39117431640625, -212.70883178710938, -169.02650451660156, -125.34416961669922, -81.66183471679688, -37.97950744628906, 5.70281982421875, 49.385162353515625, 93.06747436523438, 136.74981689453125, 180.43214416503906, 224.11447143554688, 267.79681396484375, 311.4791259765625, 355.1614685058594, 398.84381103515625, 442.526123046875, 486.2084655761719, 529.8908081054688, 573.5731201171875, 617.2554931640625, 660.9378051757812, 704.6201171875, 748.302490234375, 791.9847412109375, 835.6671142578125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 13.0, 9.0, 16.0, 17.0, 12.0, 22.0, 24.0, 25.0, 25.0, 30.0, 37.0, 45.0, 50.0, 79.0, 71.0, 82.0, 48.0, 40.0, 38.0, 35.0, 24.0, 34.0, 17.0, 28.0, 22.0, 20.0, 17.0, 13.0, 8.0, 16.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-676.45458984375, -656.978515625, -637.5025024414062, -618.0264282226562, -598.5504150390625, -579.0743408203125, -559.5983276367188, -540.1222534179688, -520.646240234375, -501.1701965332031, -481.69415283203125, -462.2181091308594, -442.7420654296875, -423.2659912109375, -403.7899475097656, -384.31390380859375, -364.83782958984375, -345.3617858886719, -325.8857421875, -306.4096984863281, -286.93365478515625, -267.45758056640625, -247.98153686523438, -228.5054931640625, -209.02944946289062, -189.55340576171875, -170.07736206054688, -150.60130310058594, -131.12525939941406, -111.64921569824219, -92.17316436767578, -72.69711303710938, -53.2210693359375, -33.74502182006836, -14.268974304199219, 5.207073211669922, 24.683120727539062, 44.15916442871094, 63.635215759277344, 83.11126708984375, 102.58731079101562, 122.0633544921875, 141.53939819335938, 161.0154571533203, 180.4915008544922, 199.96754455566406, 219.443603515625, 238.91964721679688, 258.39569091796875, 277.8717346191406, 297.3477783203125, 316.8238220214844, 336.29986572265625, 355.77593994140625, 375.2519836425781, 394.72802734375, 414.2040710449219, 433.68011474609375, 453.1561584472656, 472.6322021484375, 492.1082763671875, 511.58428955078125, 531.0603637695312, 550.536376953125, 570.012451171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 4.0, 8.0, 8.0, 16.0, 17.0, 18.0, 25.0, 35.0, 40.0, 75.0, 140.0, 292.0, 961.0, 3287.0, 16414.0, 305575.0, 3542003.0, 303306.0, 16907.0, 3377.0, 988.0, 350.0, 147.0, 59.0, 47.0, 32.0, 28.0, 21.0, 14.0, 9.0, 18.0, 13.0, 6.0, 3.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.5625, -105.1162109375, -101.669921875, -98.2236328125, -94.77734375, -91.3310546875, -87.884765625, -84.4384765625, -80.9921875, -77.5458984375, -74.099609375, -70.6533203125, -67.20703125, -63.7607421875, -60.314453125, -56.8681640625, -53.421875, -49.9755859375, -46.529296875, -43.0830078125, -39.63671875, -36.1904296875, -32.744140625, -29.2978515625, -25.8515625, -22.4052734375, -18.958984375, -15.5126953125, -12.06640625, -8.6201171875, -5.173828125, -1.7275390625, 1.71875, 5.1650390625, 8.611328125, 12.0576171875, 15.50390625, 18.9501953125, 22.396484375, 25.8427734375, 29.2890625, 32.7353515625, 36.181640625, 39.6279296875, 43.07421875, 46.5205078125, 49.966796875, 53.4130859375, 56.859375, 60.3056640625, 63.751953125, 67.1982421875, 70.64453125, 74.0908203125, 77.537109375, 80.9833984375, 84.4296875, 87.8759765625, 91.322265625, 94.7685546875, 98.21484375, 101.6611328125, 105.107421875, 108.5537109375, 112.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 0.0, 4.0, 7.0, 6.0, 4.0, 9.0, 10.0, 11.0, 6.0, 16.0, 12.0, 15.0, 19.0, 24.0, 29.0, 39.0, 44.0, 42.0, 46.0, 52.0, 49.0, 33.0, 40.0, 53.0, 51.0, 41.0, 32.0, 47.0, 34.0, 39.0, 32.0, 25.0, 19.0, 24.0, 10.0, 14.0, 16.0, 13.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.51806640625, -38.2548828125, -36.99169921875, -35.728515625, -34.46533203125, -33.2021484375, -31.93896484375, -30.67578125, -29.41259765625, -28.1494140625, -26.88623046875, -25.623046875, -24.35986328125, -23.0966796875, -21.83349609375, -20.5703125, -19.30712890625, -18.0439453125, -16.78076171875, -15.517578125, -14.25439453125, -12.9912109375, -11.72802734375, -10.46484375, -9.20166015625, -7.9384765625, -6.67529296875, -5.412109375, -4.14892578125, -2.8857421875, -1.62255859375, -0.359375, 0.90380859375, 2.1669921875, 3.43017578125, 4.693359375, 5.95654296875, 7.2197265625, 8.48291015625, 9.74609375, 11.00927734375, 12.2724609375, 13.53564453125, 14.798828125, 16.06201171875, 17.3251953125, 18.58837890625, 19.8515625, 21.11474609375, 22.3779296875, 23.64111328125, 24.904296875, 26.16748046875, 27.4306640625, 28.69384765625, 29.95703125, 31.22021484375, 32.4833984375, 33.74658203125, 35.009765625, 36.27294921875, 37.5361328125, 38.79931640625, 40.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 12.0, 16.0, 68.0, 110.0, 256.0, 855.0, 13677.0, 4151282.0, 26451.0, 1022.0, 281.0, 128.0, 55.0, 37.0, 19.0, 14.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-430.25, -416.17578125, -402.1015625, -388.02734375, -373.953125, -359.87890625, -345.8046875, -331.73046875, -317.65625, -303.58203125, -289.5078125, -275.43359375, -261.359375, -247.28515625, -233.2109375, -219.13671875, -205.0625, -190.98828125, -176.9140625, -162.83984375, -148.765625, -134.69140625, -120.6171875, -106.54296875, -92.46875, -78.39453125, -64.3203125, -50.24609375, -36.171875, -22.09765625, -8.0234375, 6.05078125, 20.125, 34.19921875, 48.2734375, 62.34765625, 76.421875, 90.49609375, 104.5703125, 118.64453125, 132.71875, 146.79296875, 160.8671875, 174.94140625, 189.015625, 203.08984375, 217.1640625, 231.23828125, 245.3125, 259.38671875, 273.4609375, 287.53515625, 301.609375, 315.68359375, 329.7578125, 343.83203125, 357.90625, 371.98046875, 386.0546875, 400.12890625, 414.203125, 428.27734375, 442.3515625, 456.42578125, 470.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 12.0, 29.0, 47.0, 99.0, 396.0, 1714.0, 1348.0, 284.0, 81.0, 35.0, 13.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.25, -254.7265625, -246.203125, -237.6796875, -229.15625, -220.6328125, -212.109375, -203.5859375, -195.0625, -186.5390625, -178.015625, -169.4921875, -160.96875, -152.4453125, -143.921875, -135.3984375, -126.875, -118.3515625, -109.828125, -101.3046875, -92.78125, -84.2578125, -75.734375, -67.2109375, -58.6875, -50.1640625, -41.640625, -33.1171875, -24.59375, -16.0703125, -7.546875, 0.9765625, 9.5, 18.0234375, 26.546875, 35.0703125, 43.59375, 52.1171875, 60.640625, 69.1640625, 77.6875, 86.2109375, 94.734375, 103.2578125, 111.78125, 120.3046875, 128.828125, 137.3515625, 145.875, 154.3984375, 162.921875, 171.4453125, 179.96875, 188.4921875, 197.015625, 205.5390625, 214.0625, 222.5859375, 231.109375, 239.6328125, 248.15625, 256.6796875, 265.203125, 273.7265625, 282.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 17.0, 19.0, 15.0, 41.0, 43.0, 80.0, 132.0, 179.0, 143.0, 113.0, 99.0, 37.0, 29.0, 14.0, 12.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-973.7903442382812, -947.4930419921875, -921.1957397460938, -894.8983764648438, -868.60107421875, -842.3037719726562, -816.0064697265625, -789.7091064453125, -763.4118041992188, -737.114501953125, -710.8171997070312, -684.5198364257812, -658.2225341796875, -631.9252319335938, -605.6279296875, -579.33056640625, -553.0333251953125, -526.7360229492188, -500.4386901855469, -474.1413879394531, -447.84405517578125, -421.5467529296875, -395.24945068359375, -368.9521179199219, -342.65478515625, -316.35748291015625, -290.0601501464844, -263.7628479003906, -237.46551513671875, -211.168212890625, -184.8708953857422, -158.57357788085938, -132.2762451171875, -105.97892761230469, -79.68161010742188, -53.384300231933594, -27.08698272705078, -0.7896728515625, 25.507644653320312, 51.804962158203125, 78.10227966308594, 104.39959716796875, 130.69691467285156, 156.99423217773438, 183.29153442382812, 209.58885192871094, 235.88616943359375, 262.1834716796875, 288.4808044433594, 314.7781066894531, 341.075439453125, 367.37274169921875, 393.6700744628906, 419.9673767089844, 446.26470947265625, 472.56201171875, 498.85931396484375, 525.1566162109375, 551.4539184570312, 577.7512817382812, 604.048583984375, 630.3458862304688, 656.6431884765625, 682.9405517578125, 709.2378540039062]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 9.0, 9.0, 14.0, 17.0, 11.0, 27.0, 30.0, 29.0, 26.0, 33.0, 33.0, 28.0, 34.0, 32.0, 49.0, 47.0, 42.0, 41.0, 44.0, 31.0, 42.0, 32.0, 35.0, 34.0, 16.0, 29.0, 24.0, 17.0, 17.0, 20.0, 17.0, 22.0, 9.0, 16.0, 9.0, 3.0, 12.0, 7.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-434.8672180175781, -421.15618896484375, -407.44512939453125, -393.73406982421875, -380.0230407714844, -366.31201171875, -352.6009521484375, -338.889892578125, -325.1788635253906, -311.46783447265625, -297.75677490234375, -284.04571533203125, -270.3346862792969, -256.6236572265625, -242.91259765625, -229.20155334472656, -215.49050903320312, -201.7794647216797, -188.06842041015625, -174.3573760986328, -160.64633178710938, -146.93528747558594, -133.2242431640625, -119.51319885253906, -105.80215454101562, -92.09111022949219, -78.38006591796875, -64.66902160644531, -50.957977294921875, -37.24693298339844, -23.535888671875, -9.824844360351562, 3.88623046875, 17.597274780273438, 31.308319091796875, 45.01936340332031, 58.73040771484375, 72.44145202636719, 86.15249633789062, 99.86354064941406, 113.5745849609375, 127.28562927246094, 140.99667358398438, 154.7077178955078, 168.41876220703125, 182.1298065185547, 195.84085083007812, 209.55189514160156, 223.262939453125, 236.97398376464844, 250.68502807617188, 264.39605712890625, 278.10711669921875, 291.81817626953125, 305.5292053222656, 319.240234375, 332.9512939453125, 346.662353515625, 360.3733825683594, 374.08441162109375, 387.79547119140625, 401.50653076171875, 415.2175598144531, 428.9285888671875, 442.6396484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 12.0, 18.0, 39.0, 44.0, 75.0, 81.0, 129.0, 229.0, 304.0, 489.0, 780.0, 1186.0, 2012.0, 3341.0, 5522.0, 9790.0, 17678.0, 32318.0, 63723.0, 126578.0, 251100.0, 258932.0, 132386.0, 65143.0, 33902.0, 18071.0, 10081.0, 5697.0, 3385.0, 1981.0, 1295.0, 723.0, 512.0, 324.0, 213.0, 149.0, 78.0, 67.0, 49.0, 29.0, 23.0, 17.0, 15.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.71875, -39.48583984375, -38.2529296875, -37.02001953125, -35.787109375, -34.55419921875, -33.3212890625, -32.08837890625, -30.85546875, -29.62255859375, -28.3896484375, -27.15673828125, -25.923828125, -24.69091796875, -23.4580078125, -22.22509765625, -20.9921875, -19.75927734375, -18.5263671875, -17.29345703125, -16.060546875, -14.82763671875, -13.5947265625, -12.36181640625, -11.12890625, -9.89599609375, -8.6630859375, -7.43017578125, -6.197265625, -4.96435546875, -3.7314453125, -2.49853515625, -1.265625, -0.03271484375, 1.2001953125, 2.43310546875, 3.666015625, 4.89892578125, 6.1318359375, 7.36474609375, 8.59765625, 9.83056640625, 11.0634765625, 12.29638671875, 13.529296875, 14.76220703125, 15.9951171875, 17.22802734375, 18.4609375, 19.69384765625, 20.9267578125, 22.15966796875, 23.392578125, 24.62548828125, 25.8583984375, 27.09130859375, 28.32421875, 29.55712890625, 30.7900390625, 32.02294921875, 33.255859375, 34.48876953125, 35.7216796875, 36.95458984375, 38.1875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 3.0, 8.0, 3.0, 9.0, 10.0, 13.0, 9.0, 18.0, 19.0, 24.0, 33.0, 46.0, 39.0, 43.0, 43.0, 59.0, 70.0, 60.0, 34.0, 46.0, 47.0, 48.0, 44.0, 42.0, 44.0, 23.0, 35.0, 22.0, 20.0, 23.0, 15.0, 12.0, 11.0, 5.0, 4.0, 7.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.34375, -51.77734375, -50.2109375, -48.64453125, -47.078125, -45.51171875, -43.9453125, -42.37890625, -40.8125, -39.24609375, -37.6796875, -36.11328125, -34.546875, -32.98046875, -31.4140625, -29.84765625, -28.28125, -26.71484375, -25.1484375, -23.58203125, -22.015625, -20.44921875, -18.8828125, -17.31640625, -15.75, -14.18359375, -12.6171875, -11.05078125, -9.484375, -7.91796875, -6.3515625, -4.78515625, -3.21875, -1.65234375, -0.0859375, 1.48046875, 3.046875, 4.61328125, 6.1796875, 7.74609375, 9.3125, 10.87890625, 12.4453125, 14.01171875, 15.578125, 17.14453125, 18.7109375, 20.27734375, 21.84375, 23.41015625, 24.9765625, 26.54296875, 28.109375, 29.67578125, 31.2421875, 32.80859375, 34.375, 35.94140625, 37.5078125, 39.07421875, 40.640625, 42.20703125, 43.7734375, 45.33984375, 46.90625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 5.0, 12.0, 6.0, 13.0, 23.0, 39.0, 36.0, 80.0, 89.0, 161.0, 250.0, 583.0, 1471.0, 5413.0, 27802.0, 334125.0, 635496.0, 33660.0, 6214.0, 1670.0, 606.0, 305.0, 148.0, 92.0, 62.0, 53.0, 34.0, 31.0, 13.0, 13.0, 12.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-135.375, -129.970703125, -124.56640625, -119.162109375, -113.7578125, -108.353515625, -102.94921875, -97.544921875, -92.140625, -86.736328125, -81.33203125, -75.927734375, -70.5234375, -65.119140625, -59.71484375, -54.310546875, -48.90625, -43.501953125, -38.09765625, -32.693359375, -27.2890625, -21.884765625, -16.48046875, -11.076171875, -5.671875, -0.267578125, 5.13671875, 10.541015625, 15.9453125, 21.349609375, 26.75390625, 32.158203125, 37.5625, 42.966796875, 48.37109375, 53.775390625, 59.1796875, 64.583984375, 69.98828125, 75.392578125, 80.796875, 86.201171875, 91.60546875, 97.009765625, 102.4140625, 107.818359375, 113.22265625, 118.626953125, 124.03125, 129.435546875, 134.83984375, 140.244140625, 145.6484375, 151.052734375, 156.45703125, 161.861328125, 167.265625, 172.669921875, 178.07421875, 183.478515625, 188.8828125, 194.287109375, 199.69140625, 205.095703125, 210.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 15.0, 13.0, 13.0, 13.0, 24.0, 26.0, 24.0, 50.0, 50.0, 66.0, 67.0, 88.0, 77.0, 89.0, 91.0, 62.0, 44.0, 45.0, 28.0, 28.0, 21.0, 10.0, 9.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.625, -192.599609375, -183.57421875, -174.548828125, -165.5234375, -156.498046875, -147.47265625, -138.447265625, -129.421875, -120.396484375, -111.37109375, -102.345703125, -93.3203125, -84.294921875, -75.26953125, -66.244140625, -57.21875, -48.193359375, -39.16796875, -30.142578125, -21.1171875, -12.091796875, -3.06640625, 5.958984375, 14.984375, 24.009765625, 33.03515625, 42.060546875, 51.0859375, 60.111328125, 69.13671875, 78.162109375, 87.1875, 96.212890625, 105.23828125, 114.263671875, 123.2890625, 132.314453125, 141.33984375, 150.365234375, 159.390625, 168.416015625, 177.44140625, 186.466796875, 195.4921875, 204.517578125, 213.54296875, 222.568359375, 231.59375, 240.619140625, 249.64453125, 258.669921875, 267.6953125, 276.720703125, 285.74609375, 294.771484375, 303.796875, 312.822265625, 321.84765625, 330.873046875, 339.8984375, 348.923828125, 357.94921875, 366.974609375, 376.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 11.0, 13.0, 14.0, 20.0, 32.0, 39.0, 62.0, 121.0, 214.0, 341.0, 627.0, 1413.0, 3518.0, 10588.0, 41838.0, 304161.0, 612761.0, 52904.0, 12517.0, 4137.0, 1586.0, 690.0, 382.0, 196.0, 108.0, 74.0, 58.0, 29.0, 15.0, 23.0, 13.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.8125, -31.6435546875, -30.474609375, -29.3056640625, -28.13671875, -26.9677734375, -25.798828125, -24.6298828125, -23.4609375, -22.2919921875, -21.123046875, -19.9541015625, -18.78515625, -17.6162109375, -16.447265625, -15.2783203125, -14.109375, -12.9404296875, -11.771484375, -10.6025390625, -9.43359375, -8.2646484375, -7.095703125, -5.9267578125, -4.7578125, -3.5888671875, -2.419921875, -1.2509765625, -0.08203125, 1.0869140625, 2.255859375, 3.4248046875, 4.59375, 5.7626953125, 6.931640625, 8.1005859375, 9.26953125, 10.4384765625, 11.607421875, 12.7763671875, 13.9453125, 15.1142578125, 16.283203125, 17.4521484375, 18.62109375, 19.7900390625, 20.958984375, 22.1279296875, 23.296875, 24.4658203125, 25.634765625, 26.8037109375, 27.97265625, 29.1416015625, 30.310546875, 31.4794921875, 32.6484375, 33.8173828125, 34.986328125, 36.1552734375, 37.32421875, 38.4931640625, 39.662109375, 40.8310546875, 42.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 15.0, 24.0, 26.0, 15.0, 44.0, 47.0, 74.0, 105.0, 135.0, 132.0, 97.0, 71.0, 60.0, 32.0, 19.0, 27.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.01139974594116211, -0.011004447937011719, -0.010609149932861328, -0.010213851928710938, -0.009818553924560547, -0.009423255920410156, -0.009027957916259766, -0.008632659912109375, -0.008237361907958984, -0.007842063903808594, -0.007446765899658203, -0.0070514678955078125, -0.006656169891357422, -0.006260871887207031, -0.005865573883056641, -0.00547027587890625, -0.005074977874755859, -0.004679679870605469, -0.004284381866455078, -0.0038890838623046875, -0.003493785858154297, -0.0030984878540039062, -0.0027031898498535156, -0.002307891845703125, -0.0019125938415527344, -0.0015172958374023438, -0.0011219978332519531, -0.0007266998291015625, -0.0003314018249511719, 6.389617919921875e-05, 0.0004591941833496094, 0.0008544921875, 0.0012497901916503906, 0.0016450881958007812, 0.002040386199951172, 0.0024356842041015625, 0.002830982208251953, 0.0032262802124023438, 0.0036215782165527344, 0.004016876220703125, 0.004412174224853516, 0.004807472229003906, 0.005202770233154297, 0.0055980682373046875, 0.005993366241455078, 0.006388664245605469, 0.006783962249755859, 0.00717926025390625, 0.007574558258056641, 0.007969856262207031, 0.008365154266357422, 0.008760452270507812, 0.009155750274658203, 0.009551048278808594, 0.009946346282958984, 0.010341644287109375, 0.010736942291259766, 0.011132240295410156, 0.011527538299560547, 0.011922836303710938, 0.012318134307861328, 0.012713432312011719, 0.01310873031616211, 0.0135040283203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 1.0, 2.0, 12.0, 6.0, 15.0, 26.0, 28.0, 28.0, 63.0, 93.0, 166.0, 300.0, 635.0, 1521.0, 4640.0, 18892.0, 126188.0, 789077.0, 85903.0, 14515.0, 3888.0, 1334.0, 538.0, 265.0, 164.0, 93.0, 54.0, 29.0, 24.0, 25.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.34375, -46.89697265625, -45.4501953125, -44.00341796875, -42.556640625, -41.10986328125, -39.6630859375, -38.21630859375, -36.76953125, -35.32275390625, -33.8759765625, -32.42919921875, -30.982421875, -29.53564453125, -28.0888671875, -26.64208984375, -25.1953125, -23.74853515625, -22.3017578125, -20.85498046875, -19.408203125, -17.96142578125, -16.5146484375, -15.06787109375, -13.62109375, -12.17431640625, -10.7275390625, -9.28076171875, -7.833984375, -6.38720703125, -4.9404296875, -3.49365234375, -2.046875, -0.60009765625, 0.8466796875, 2.29345703125, 3.740234375, 5.18701171875, 6.6337890625, 8.08056640625, 9.52734375, 10.97412109375, 12.4208984375, 13.86767578125, 15.314453125, 16.76123046875, 18.2080078125, 19.65478515625, 21.1015625, 22.54833984375, 23.9951171875, 25.44189453125, 26.888671875, 28.33544921875, 29.7822265625, 31.22900390625, 32.67578125, 34.12255859375, 35.5693359375, 37.01611328125, 38.462890625, 39.90966796875, 41.3564453125, 42.80322265625, 44.25]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 7.0, 14.0, 17.0, 40.0, 59.0, 81.0, 122.0, 143.0, 127.0, 110.0, 81.0, 48.0, 26.0, 32.0, 13.0, 17.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.09375, -61.37841796875, -59.6630859375, -57.94775390625, -56.232421875, -54.51708984375, -52.8017578125, -51.08642578125, -49.37109375, -47.65576171875, -45.9404296875, -44.22509765625, -42.509765625, -40.79443359375, -39.0791015625, -37.36376953125, -35.6484375, -33.93310546875, -32.2177734375, -30.50244140625, -28.787109375, -27.07177734375, -25.3564453125, -23.64111328125, -21.92578125, -20.21044921875, -18.4951171875, -16.77978515625, -15.064453125, -13.34912109375, -11.6337890625, -9.91845703125, -8.203125, -6.48779296875, -4.7724609375, -3.05712890625, -1.341796875, 0.37353515625, 2.0888671875, 3.80419921875, 5.51953125, 7.23486328125, 8.9501953125, 10.66552734375, 12.380859375, 14.09619140625, 15.8115234375, 17.52685546875, 19.2421875, 20.95751953125, 22.6728515625, 24.38818359375, 26.103515625, 27.81884765625, 29.5341796875, 31.24951171875, 32.96484375, 34.68017578125, 36.3955078125, 38.11083984375, 39.826171875, 41.54150390625, 43.2568359375, 44.97216796875, 46.6875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 16.0, 34.0, 122.0, 327.0, 355.0, 95.0, 28.0, 15.0, 8.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2877.7158203125, -2820.189453125, -2762.663330078125, -2705.136962890625, -2647.61083984375, -2590.08447265625, -2532.55810546875, -2475.031982421875, -2417.505615234375, -2359.979248046875, -2302.453125, -2244.9267578125, -2187.400634765625, -2129.874267578125, -2072.34814453125, -2014.82177734375, -1957.295654296875, -1899.7694091796875, -1842.2431640625, -1784.716796875, -1727.1905517578125, -1669.664306640625, -1612.1380615234375, -1554.61181640625, -1497.08544921875, -1439.5592041015625, -1382.032958984375, -1324.506591796875, -1266.9803466796875, -1209.4541015625, -1151.9278564453125, -1094.401611328125, -1036.87548828125, -979.3492431640625, -921.8229370117188, -864.2966918945312, -806.7704467773438, -749.244140625, -691.7178955078125, -634.191650390625, -576.665283203125, -519.1390380859375, -461.6127624511719, -404.08648681640625, -346.56024169921875, -289.0339660644531, -231.5076904296875, -173.9814453125, -116.4552001953125, -58.92893600463867, -1.4026718139648438, 56.12359619140625, 113.64985656738281, 171.17611694335938, 228.702392578125, 286.2286376953125, 343.7549133300781, 401.28118896484375, 458.80743408203125, 516.333740234375, 573.8599853515625, 631.38623046875, 688.9124755859375, 746.438720703125, 803.9650268554688]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 7.0, 10.0, 4.0, 5.0, 8.0, 10.0, 13.0, 10.0, 17.0, 28.0, 25.0, 24.0, 35.0, 44.0, 39.0, 57.0, 65.0, 84.0, 89.0, 61.0, 45.0, 28.0, 29.0, 28.0, 23.0, 22.0, 26.0, 21.0, 23.0, 6.0, 14.0, 18.0, 10.0, 10.0, 4.0, 10.0, 7.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-648.345947265625, -626.691162109375, -605.036376953125, -583.3815307617188, -561.7267456054688, -540.0719604492188, -518.4171752929688, -496.7623596191406, -475.1075439453125, -453.4527587890625, -431.7979431152344, -410.1431579589844, -388.48834228515625, -366.83355712890625, -345.17877197265625, -323.5239562988281, -301.8691711425781, -280.2143859863281, -258.5595703125, -236.90478515625, -215.24996948242188, -193.59518432617188, -171.9403839111328, -150.28558349609375, -128.6307830810547, -106.97598266601562, -85.32118225097656, -63.66638946533203, -42.01158905029297, -20.356788635253906, 1.298004150390625, 22.952804565429688, 44.60760498046875, 66.26240539550781, 87.91720581054688, 109.5719985961914, 131.226806640625, 152.881591796875, 174.53639221191406, 196.19119262695312, 217.8459930419922, 239.50079345703125, 261.15557861328125, 282.8103942871094, 304.4651794433594, 326.1199951171875, 347.7747802734375, 369.4295654296875, 391.0843811035156, 412.7391662597656, 434.39398193359375, 456.04876708984375, 477.7035827636719, 499.3583679199219, 521.01318359375, 542.66796875, 564.32275390625, 585.9775390625, 607.63232421875, 629.2871704101562, 650.9419555664062, 672.5967407226562, 694.2515258789062, 715.9063720703125, 737.5611572265625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 25.0, 28.0, 51.0, 66.0, 85.0, 132.0, 210.0, 365.0, 555.0, 950.0, 1709.0, 3113.0, 6487.0, 17084.0, 59253.0, 238813.0, 1040822.0, 2042804.0, 584813.0, 135691.0, 36909.0, 12663.0, 5464.0, 2679.0, 1407.0, 781.0, 483.0, 262.0, 193.0, 129.0, 78.0, 51.0, 29.0, 24.0, 17.0, 6.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.34375, -40.94677734375, -39.5498046875, -38.15283203125, -36.755859375, -35.35888671875, -33.9619140625, -32.56494140625, -31.16796875, -29.77099609375, -28.3740234375, -26.97705078125, -25.580078125, -24.18310546875, -22.7861328125, -21.38916015625, -19.9921875, -18.59521484375, -17.1982421875, -15.80126953125, -14.404296875, -13.00732421875, -11.6103515625, -10.21337890625, -8.81640625, -7.41943359375, -6.0224609375, -4.62548828125, -3.228515625, -1.83154296875, -0.4345703125, 0.96240234375, 2.359375, 3.75634765625, 5.1533203125, 6.55029296875, 7.947265625, 9.34423828125, 10.7412109375, 12.13818359375, 13.53515625, 14.93212890625, 16.3291015625, 17.72607421875, 19.123046875, 20.52001953125, 21.9169921875, 23.31396484375, 24.7109375, 26.10791015625, 27.5048828125, 28.90185546875, 30.298828125, 31.69580078125, 33.0927734375, 34.48974609375, 35.88671875, 37.28369140625, 38.6806640625, 40.07763671875, 41.474609375, 42.87158203125, 44.2685546875, 45.66552734375, 47.0625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 17.0, 23.0, 23.0, 24.0, 29.0, 35.0, 33.0, 49.0, 69.0, 51.0, 57.0, 62.0, 46.0, 60.0, 54.0, 45.0, 39.0, 52.0, 32.0, 34.0, 26.0, 26.0, 15.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0], "bins": [-73.375, -71.57470703125, -69.7744140625, -67.97412109375, -66.173828125, -64.37353515625, -62.5732421875, -60.77294921875, -58.97265625, -57.17236328125, -55.3720703125, -53.57177734375, -51.771484375, -49.97119140625, -48.1708984375, -46.37060546875, -44.5703125, -42.77001953125, -40.9697265625, -39.16943359375, -37.369140625, -35.56884765625, -33.7685546875, -31.96826171875, -30.16796875, -28.36767578125, -26.5673828125, -24.76708984375, -22.966796875, -21.16650390625, -19.3662109375, -17.56591796875, -15.765625, -13.96533203125, -12.1650390625, -10.36474609375, -8.564453125, -6.76416015625, -4.9638671875, -3.16357421875, -1.36328125, 0.43701171875, 2.2373046875, 4.03759765625, 5.837890625, 7.63818359375, 9.4384765625, 11.23876953125, 13.0390625, 14.83935546875, 16.6396484375, 18.43994140625, 20.240234375, 22.04052734375, 23.8408203125, 25.64111328125, 27.44140625, 29.24169921875, 31.0419921875, 32.84228515625, 34.642578125, 36.44287109375, 38.2431640625, 40.04345703125, 41.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 32.0, 41.0, 76.0, 114.0, 282.0, 916.0, 3407.0, 21011.0, 777702.0, 3343801.0, 39599.0, 5129.0, 1233.0, 413.0, 225.0, 98.0, 52.0, 38.0, 19.0, 15.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.75, -178.3671875, -172.984375, -167.6015625, -162.21875, -156.8359375, -151.453125, -146.0703125, -140.6875, -135.3046875, -129.921875, -124.5390625, -119.15625, -113.7734375, -108.390625, -103.0078125, -97.625, -92.2421875, -86.859375, -81.4765625, -76.09375, -70.7109375, -65.328125, -59.9453125, -54.5625, -49.1796875, -43.796875, -38.4140625, -33.03125, -27.6484375, -22.265625, -16.8828125, -11.5, -6.1171875, -0.734375, 4.6484375, 10.03125, 15.4140625, 20.796875, 26.1796875, 31.5625, 36.9453125, 42.328125, 47.7109375, 53.09375, 58.4765625, 63.859375, 69.2421875, 74.625, 80.0078125, 85.390625, 90.7734375, 96.15625, 101.5390625, 106.921875, 112.3046875, 117.6875, 123.0703125, 128.453125, 133.8359375, 139.21875, 144.6015625, 149.984375, 155.3671875, 160.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 6.0, 6.0, 10.0, 19.0, 13.0, 22.0, 20.0, 33.0, 62.0, 102.0, 176.0, 298.0, 557.0, 804.0, 730.0, 533.0, 287.0, 148.0, 69.0, 55.0, 37.0, 24.0, 14.0, 9.0, 13.0, 5.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.3125, -101.9169921875, -98.521484375, -95.1259765625, -91.73046875, -88.3349609375, -84.939453125, -81.5439453125, -78.1484375, -74.7529296875, -71.357421875, -67.9619140625, -64.56640625, -61.1708984375, -57.775390625, -54.3798828125, -50.984375, -47.5888671875, -44.193359375, -40.7978515625, -37.40234375, -34.0068359375, -30.611328125, -27.2158203125, -23.8203125, -20.4248046875, -17.029296875, -13.6337890625, -10.23828125, -6.8427734375, -3.447265625, -0.0517578125, 3.34375, 6.7392578125, 10.134765625, 13.5302734375, 16.92578125, 20.3212890625, 23.716796875, 27.1123046875, 30.5078125, 33.9033203125, 37.298828125, 40.6943359375, 44.08984375, 47.4853515625, 50.880859375, 54.2763671875, 57.671875, 61.0673828125, 64.462890625, 67.8583984375, 71.25390625, 74.6494140625, 78.044921875, 81.4404296875, 84.8359375, 88.2314453125, 91.626953125, 95.0224609375, 98.41796875, 101.8134765625, 105.208984375, 108.6044921875, 112.0]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 19.0, 30.0, 55.0, 109.0, 190.0, 241.0, 157.0, 100.0, 45.0, 19.0, 7.0, 2.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-859.0454711914062, -828.9410400390625, -798.8365478515625, -768.7321166992188, -738.627685546875, -708.523193359375, -678.4187622070312, -648.3143310546875, -618.2098388671875, -588.1054077148438, -558.0009155273438, -527.896484375, -497.79205322265625, -467.6875915527344, -437.5831298828125, -407.47869873046875, -377.374267578125, -347.2698059082031, -317.1653747558594, -287.0609130859375, -256.95648193359375, -226.85202026367188, -196.74755859375, -166.6431121826172, -136.53866577148438, -106.43421936035156, -76.32976531982422, -46.225311279296875, -16.120864868164062, 13.98358154296875, 44.088043212890625, 74.19248962402344, 104.2969970703125, 134.4014434814453, 164.50588989257812, 194.6103515625, 224.7147979736328, 254.81924438476562, 284.9237060546875, 315.02813720703125, 345.1325988769531, 375.237060546875, 405.34149169921875, 435.4459533691406, 465.5504150390625, 495.65484619140625, 525.75927734375, 555.86376953125, 585.9682006835938, 616.0726318359375, 646.1771240234375, 676.2815551757812, 706.385986328125, 736.490478515625, 766.5949096679688, 796.6993408203125, 826.8038330078125, 856.9082641601562, 887.0127563476562, 917.1171875, 947.2216186523438, 977.3260498046875, 1007.4305419921875, 1037.5350341796875, 1067.639404296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 15.0, 24.0, 16.0, 18.0, 31.0, 33.0, 50.0, 37.0, 42.0, 48.0, 53.0, 48.0, 49.0, 53.0, 50.0, 48.0, 43.0, 65.0, 35.0, 44.0, 38.0, 28.0, 23.0, 17.0, 19.0, 15.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-440.7887268066406, -425.0470886230469, -409.3054504394531, -393.5638122558594, -377.8221740722656, -362.0805358886719, -346.3388671875, -330.59722900390625, -314.8555908203125, -299.11395263671875, -283.372314453125, -267.63067626953125, -251.8890380859375, -236.14739990234375, -220.40574645996094, -204.6641082763672, -188.9224853515625, -173.18084716796875, -157.439208984375, -141.69757080078125, -125.95592498779297, -110.21428680419922, -94.47264099121094, -78.73100280761719, -62.98936462402344, -47.24772644042969, -31.506084442138672, -15.764442443847656, -0.02280426025390625, 15.718833923339844, 31.460479736328125, 47.202117919921875, 62.94378662109375, 78.6854248046875, 94.42706298828125, 110.16870880126953, 125.91034698486328, 141.6519775390625, 157.3936309814453, 173.13526916503906, 188.8769073486328, 204.61854553222656, 220.3601837158203, 236.10183715820312, 251.84347534179688, 267.5851135253906, 283.3267517089844, 299.0683898925781, 314.8100280761719, 330.5516662597656, 346.2933044433594, 362.0349426269531, 377.7765808105469, 393.5182189941406, 409.2598876953125, 425.00152587890625, 440.7431640625, 456.48480224609375, 472.2264404296875, 487.96807861328125, 503.709716796875, 519.4513549804688, 535.1929931640625, 550.9346313476562, 566.67626953125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 27.0, 36.0, 58.0, 78.0, 138.0, 187.0, 306.0, 449.0, 800.0, 1376.0, 2526.0, 4567.0, 9098.0, 18610.0, 42402.0, 103074.0, 271164.0, 348178.0, 140545.0, 56135.0, 24609.0, 11449.0, 5588.0, 3022.0, 1602.0, 954.0, 560.0, 349.0, 240.0, 142.0, 86.0, 66.0, 50.0, 22.0, 19.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.75, -56.978515625, -55.20703125, -53.435546875, -51.6640625, -49.892578125, -48.12109375, -46.349609375, -44.578125, -42.806640625, -41.03515625, -39.263671875, -37.4921875, -35.720703125, -33.94921875, -32.177734375, -30.40625, -28.634765625, -26.86328125, -25.091796875, -23.3203125, -21.548828125, -19.77734375, -18.005859375, -16.234375, -14.462890625, -12.69140625, -10.919921875, -9.1484375, -7.376953125, -5.60546875, -3.833984375, -2.0625, -0.291015625, 1.48046875, 3.251953125, 5.0234375, 6.794921875, 8.56640625, 10.337890625, 12.109375, 13.880859375, 15.65234375, 17.423828125, 19.1953125, 20.966796875, 22.73828125, 24.509765625, 26.28125, 28.052734375, 29.82421875, 31.595703125, 33.3671875, 35.138671875, 36.91015625, 38.681640625, 40.453125, 42.224609375, 43.99609375, 45.767578125, 47.5390625, 49.310546875, 51.08203125, 52.853515625, 54.625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 19.0, 19.0, 18.0, 21.0, 32.0, 24.0, 37.0, 37.0, 55.0, 55.0, 57.0, 45.0, 55.0, 58.0, 48.0, 44.0, 45.0, 49.0, 38.0, 24.0, 28.0, 29.0, 23.0, 17.0, 11.0, 16.0, 10.0, 12.0, 7.0, 4.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0], "bins": [-68.6875, -66.98583984375, -65.2841796875, -63.58251953125, -61.880859375, -60.17919921875, -58.4775390625, -56.77587890625, -55.07421875, -53.37255859375, -51.6708984375, -49.96923828125, -48.267578125, -46.56591796875, -44.8642578125, -43.16259765625, -41.4609375, -39.75927734375, -38.0576171875, -36.35595703125, -34.654296875, -32.95263671875, -31.2509765625, -29.54931640625, -27.84765625, -26.14599609375, -24.4443359375, -22.74267578125, -21.041015625, -19.33935546875, -17.6376953125, -15.93603515625, -14.234375, -12.53271484375, -10.8310546875, -9.12939453125, -7.427734375, -5.72607421875, -4.0244140625, -2.32275390625, -0.62109375, 1.08056640625, 2.7822265625, 4.48388671875, 6.185546875, 7.88720703125, 9.5888671875, 11.29052734375, 12.9921875, 14.69384765625, 16.3955078125, 18.09716796875, 19.798828125, 21.50048828125, 23.2021484375, 24.90380859375, 26.60546875, 28.30712890625, 30.0087890625, 31.71044921875, 33.412109375, 35.11376953125, 36.8154296875, 38.51708984375, 40.21875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 12.0, 22.0, 23.0, 32.0, 47.0, 85.0, 132.0, 194.0, 368.0, 804.0, 2162.0, 9157.0, 91163.0, 880387.0, 53946.0, 6795.0, 1668.0, 646.0, 349.0, 179.0, 118.0, 60.0, 42.0, 41.0, 19.0, 26.0, 14.0, 13.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.625, -163.435546875, -157.24609375, -151.056640625, -144.8671875, -138.677734375, -132.48828125, -126.298828125, -120.109375, -113.919921875, -107.73046875, -101.541015625, -95.3515625, -89.162109375, -82.97265625, -76.783203125, -70.59375, -64.404296875, -58.21484375, -52.025390625, -45.8359375, -39.646484375, -33.45703125, -27.267578125, -21.078125, -14.888671875, -8.69921875, -2.509765625, 3.6796875, 9.869140625, 16.05859375, 22.248046875, 28.4375, 34.626953125, 40.81640625, 47.005859375, 53.1953125, 59.384765625, 65.57421875, 71.763671875, 77.953125, 84.142578125, 90.33203125, 96.521484375, 102.7109375, 108.900390625, 115.08984375, 121.279296875, 127.46875, 133.658203125, 139.84765625, 146.037109375, 152.2265625, 158.416015625, 164.60546875, 170.794921875, 176.984375, 183.173828125, 189.36328125, 195.552734375, 201.7421875, 207.931640625, 214.12109375, 220.310546875, 226.5]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 23.0, 19.0, 29.0, 23.0, 27.0, 35.0, 41.0, 34.0, 64.0, 52.0, 71.0, 83.0, 64.0, 76.0, 53.0, 45.0, 47.0, 37.0, 32.0, 31.0, 16.0, 20.0, 11.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-241.5, -234.46875, -227.4375, -220.40625, -213.375, -206.34375, -199.3125, -192.28125, -185.25, -178.21875, -171.1875, -164.15625, -157.125, -150.09375, -143.0625, -136.03125, -129.0, -121.96875, -114.9375, -107.90625, -100.875, -93.84375, -86.8125, -79.78125, -72.75, -65.71875, -58.6875, -51.65625, -44.625, -37.59375, -30.5625, -23.53125, -16.5, -9.46875, -2.4375, 4.59375, 11.625, 18.65625, 25.6875, 32.71875, 39.75, 46.78125, 53.8125, 60.84375, 67.875, 74.90625, 81.9375, 88.96875, 96.0, 103.03125, 110.0625, 117.09375, 124.125, 131.15625, 138.1875, 145.21875, 152.25, 159.28125, 166.3125, 173.34375, 180.375, 187.40625, 194.4375, 201.46875, 208.5]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 5.0, 9.0, 15.0, 21.0, 27.0, 50.0, 57.0, 88.0, 113.0, 174.0, 279.0, 461.0, 828.0, 1501.0, 3027.0, 7033.0, 18222.0, 58683.0, 254086.0, 589384.0, 75960.0, 22405.0, 8397.0, 3659.0, 1674.0, 939.0, 527.0, 335.0, 172.0, 127.0, 86.0, 53.0, 39.0, 24.0, 16.0, 21.0, 15.0, 12.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.921875, -20.226806640625, -19.53173828125, -18.836669921875, -18.1416015625, -17.446533203125, -16.75146484375, -16.056396484375, -15.361328125, -14.666259765625, -13.97119140625, -13.276123046875, -12.5810546875, -11.885986328125, -11.19091796875, -10.495849609375, -9.80078125, -9.105712890625, -8.41064453125, -7.715576171875, -7.0205078125, -6.325439453125, -5.63037109375, -4.935302734375, -4.240234375, -3.545166015625, -2.85009765625, -2.155029296875, -1.4599609375, -0.764892578125, -0.06982421875, 0.625244140625, 1.3203125, 2.015380859375, 2.71044921875, 3.405517578125, 4.1005859375, 4.795654296875, 5.49072265625, 6.185791015625, 6.880859375, 7.575927734375, 8.27099609375, 8.966064453125, 9.6611328125, 10.356201171875, 11.05126953125, 11.746337890625, 12.44140625, 13.136474609375, 13.83154296875, 14.526611328125, 15.2216796875, 15.916748046875, 16.61181640625, 17.306884765625, 18.001953125, 18.697021484375, 19.39208984375, 20.087158203125, 20.7822265625, 21.477294921875, 22.17236328125, 22.867431640625, 23.5625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 19.0, 25.0, 37.0, 67.0, 78.0, 144.0, 195.0, 155.0, 77.0, 60.0, 45.0, 33.0, 14.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020669221878051758, -0.020143985748291016, -0.019618749618530273, -0.01909351348876953, -0.01856827735900879, -0.018043041229248047, -0.017517805099487305, -0.016992568969726562, -0.01646733283996582, -0.015942096710205078, -0.015416860580444336, -0.014891624450683594, -0.014366388320922852, -0.01384115219116211, -0.013315916061401367, -0.012790679931640625, -0.012265443801879883, -0.01174020767211914, -0.011214971542358398, -0.010689735412597656, -0.010164499282836914, -0.009639263153076172, -0.00911402702331543, -0.008588790893554688, -0.008063554763793945, -0.007538318634033203, -0.007013082504272461, -0.006487846374511719, -0.0059626102447509766, -0.005437374114990234, -0.004912137985229492, -0.00438690185546875, -0.003861665725708008, -0.0033364295959472656, -0.0028111934661865234, -0.0022859573364257812, -0.001760721206665039, -0.0012354850769042969, -0.0007102489471435547, -0.0001850128173828125, 0.0003402233123779297, 0.0008654594421386719, 0.001390695571899414, 0.0019159317016601562, 0.0024411678314208984, 0.0029664039611816406, 0.003491640090942383, 0.004016876220703125, 0.004542112350463867, 0.005067348480224609, 0.0055925846099853516, 0.006117820739746094, 0.006643056869506836, 0.007168292999267578, 0.00769352912902832, 0.008218765258789062, 0.008744001388549805, 0.009269237518310547, 0.009794473648071289, 0.010319709777832031, 0.010844945907592773, 0.011370182037353516, 0.011895418167114258, 0.012420654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 9.0, 13.0, 19.0, 18.0, 31.0, 37.0, 37.0, 56.0, 101.0, 168.0, 303.0, 627.0, 1320.0, 3608.0, 12718.0, 62919.0, 677294.0, 239679.0, 36555.0, 8240.0, 2547.0, 1050.0, 503.0, 241.0, 154.0, 104.0, 46.0, 35.0, 28.0, 14.0, 16.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.8125, -29.8134765625, -28.814453125, -27.8154296875, -26.81640625, -25.8173828125, -24.818359375, -23.8193359375, -22.8203125, -21.8212890625, -20.822265625, -19.8232421875, -18.82421875, -17.8251953125, -16.826171875, -15.8271484375, -14.828125, -13.8291015625, -12.830078125, -11.8310546875, -10.83203125, -9.8330078125, -8.833984375, -7.8349609375, -6.8359375, -5.8369140625, -4.837890625, -3.8388671875, -2.83984375, -1.8408203125, -0.841796875, 0.1572265625, 1.15625, 2.1552734375, 3.154296875, 4.1533203125, 5.15234375, 6.1513671875, 7.150390625, 8.1494140625, 9.1484375, 10.1474609375, 11.146484375, 12.1455078125, 13.14453125, 14.1435546875, 15.142578125, 16.1416015625, 17.140625, 18.1396484375, 19.138671875, 20.1376953125, 21.13671875, 22.1357421875, 23.134765625, 24.1337890625, 25.1328125, 26.1318359375, 27.130859375, 28.1298828125, 29.12890625, 30.1279296875, 31.126953125, 32.1259765625, 33.125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 2.0, 7.0, 3.0, 1.0, 10.0, 10.0, 14.0, 13.0, 12.0, 17.0, 26.0, 27.0, 41.0, 37.0, 48.0, 69.0, 61.0, 86.0, 68.0, 71.0, 66.0, 33.0, 59.0, 31.0, 26.0, 20.0, 20.0, 17.0, 7.0, 18.0, 11.0, 11.0, 6.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-25.78125, -25.071533203125, -24.36181640625, -23.652099609375, -22.9423828125, -22.232666015625, -21.52294921875, -20.813232421875, -20.103515625, -19.393798828125, -18.68408203125, -17.974365234375, -17.2646484375, -16.554931640625, -15.84521484375, -15.135498046875, -14.42578125, -13.716064453125, -13.00634765625, -12.296630859375, -11.5869140625, -10.877197265625, -10.16748046875, -9.457763671875, -8.748046875, -8.038330078125, -7.32861328125, -6.618896484375, -5.9091796875, -5.199462890625, -4.48974609375, -3.780029296875, -3.0703125, -2.360595703125, -1.65087890625, -0.941162109375, -0.2314453125, 0.478271484375, 1.18798828125, 1.897705078125, 2.607421875, 3.317138671875, 4.02685546875, 4.736572265625, 5.4462890625, 6.156005859375, 6.86572265625, 7.575439453125, 8.28515625, 8.994873046875, 9.70458984375, 10.414306640625, 11.1240234375, 11.833740234375, 12.54345703125, 13.253173828125, 13.962890625, 14.672607421875, 15.38232421875, 16.092041015625, 16.8017578125, 17.511474609375, 18.22119140625, 18.930908203125, 19.640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 12.0, 9.0, 42.0, 77.0, 236.0, 414.0, 117.0, 49.0, 21.0, 14.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1807.1153564453125, -1763.2694091796875, -1719.423583984375, -1675.57763671875, -1631.7318115234375, -1587.8858642578125, -1544.0400390625, -1500.194091796875, -1456.34814453125, -1412.502197265625, -1368.6563720703125, -1324.8104248046875, -1280.964599609375, -1237.11865234375, -1193.272705078125, -1149.4268798828125, -1105.5810546875, -1061.735107421875, -1017.8892822265625, -974.0433349609375, -930.1974487304688, -886.3515625, -842.5056762695312, -798.6597900390625, -754.8138427734375, -710.9679565429688, -667.1220703125, -623.276123046875, -579.4302368164062, -535.5843505859375, -491.73846435546875, -447.8925476074219, -404.046630859375, -360.20074462890625, -316.3548278808594, -272.5089416503906, -228.6630401611328, -184.817138671875, -140.97125244140625, -97.12533569335938, -53.279449462890625, -9.433551788330078, 34.41234588623047, 78.25823974609375, 122.10414123535156, 165.95004272460938, 209.79592895507812, 253.641845703125, 297.48773193359375, 341.3336181640625, 385.1795349121094, 429.0254211425781, 472.871337890625, 516.7172241210938, 560.5631103515625, 604.4090576171875, 648.2548828125, 692.1007690429688, 735.9466552734375, 779.7926025390625, 823.6384887695312, 867.484375, 911.3302612304688, 955.1761474609375, 999.0220947265625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 17.0, 9.0, 24.0, 24.0, 26.0, 36.0, 30.0, 49.0, 53.0, 115.0, 125.0, 82.0, 37.0, 44.0, 36.0, 26.0, 21.0, 22.0, 17.0, 21.0, 22.0, 22.0, 17.0, 10.0, 6.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-632.9547119140625, -612.6290283203125, -592.3033447265625, -571.9777221679688, -551.6520385742188, -531.3263549804688, -511.00067138671875, -490.67498779296875, -470.3493347167969, -450.0236511230469, -429.697998046875, -409.372314453125, -389.046630859375, -368.7209777832031, -348.3952941894531, -328.06964111328125, -307.74395751953125, -287.41827392578125, -267.0926208496094, -246.76693725585938, -226.44126892089844, -206.1156005859375, -185.7899169921875, -165.46424865722656, -145.13858032226562, -124.81291198730469, -104.48723602294922, -84.16156005859375, -63.83589172363281, -43.510223388671875, -23.184547424316406, -2.8588714599609375, 17.46685791015625, 37.79253005981445, 58.118202209472656, 78.44387817382812, 98.76954650878906, 119.09521484375, 139.4208984375, 159.74656677246094, 180.07223510742188, 200.3979034423828, 220.72357177734375, 241.04925537109375, 261.37493896484375, 281.7005920410156, 302.0262756347656, 322.3519287109375, 342.6776123046875, 363.0032958984375, 383.3289489746094, 403.6546325683594, 423.98028564453125, 444.30596923828125, 464.63165283203125, 484.95733642578125, 505.2829895019531, 525.608642578125, 545.934326171875, 566.260009765625, 586.585693359375, 606.911376953125, 627.2369995117188, 647.5626831054688, 667.8883666992188]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 9.0, 7.0, 16.0, 16.0, 25.0, 28.0, 36.0, 55.0, 56.0, 84.0, 117.0, 209.0, 348.0, 828.0, 2119.0, 6248.0, 26011.0, 224688.0, 2481273.0, 1324648.0, 104568.0, 15733.0, 4217.0, 1441.0, 622.0, 275.0, 174.0, 115.0, 74.0, 55.0, 41.0, 37.0, 27.0, 18.0, 10.0, 15.0, 9.0, 4.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-111.375, -107.876953125, -104.37890625, -100.880859375, -97.3828125, -93.884765625, -90.38671875, -86.888671875, -83.390625, -79.892578125, -76.39453125, -72.896484375, -69.3984375, -65.900390625, -62.40234375, -58.904296875, -55.40625, -51.908203125, -48.41015625, -44.912109375, -41.4140625, -37.916015625, -34.41796875, -30.919921875, -27.421875, -23.923828125, -20.42578125, -16.927734375, -13.4296875, -9.931640625, -6.43359375, -2.935546875, 0.5625, 4.060546875, 7.55859375, 11.056640625, 14.5546875, 18.052734375, 21.55078125, 25.048828125, 28.546875, 32.044921875, 35.54296875, 39.041015625, 42.5390625, 46.037109375, 49.53515625, 53.033203125, 56.53125, 60.029296875, 63.52734375, 67.025390625, 70.5234375, 74.021484375, 77.51953125, 81.017578125, 84.515625, 88.013671875, 91.51171875, 95.009765625, 98.5078125, 102.005859375, 105.50390625, 109.001953125, 112.5]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 10.0, 11.0, 15.0, 15.0, 22.0, 25.0, 27.0, 34.0, 32.0, 39.0, 42.0, 50.0, 54.0, 50.0, 59.0, 40.0, 49.0, 54.0, 43.0, 44.0, 39.0, 34.0, 32.0, 25.0, 28.0, 28.0, 16.0, 11.0, 11.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-59.875, -58.33349609375, -56.7919921875, -55.25048828125, -53.708984375, -52.16748046875, -50.6259765625, -49.08447265625, -47.54296875, -46.00146484375, -44.4599609375, -42.91845703125, -41.376953125, -39.83544921875, -38.2939453125, -36.75244140625, -35.2109375, -33.66943359375, -32.1279296875, -30.58642578125, -29.044921875, -27.50341796875, -25.9619140625, -24.42041015625, -22.87890625, -21.33740234375, -19.7958984375, -18.25439453125, -16.712890625, -15.17138671875, -13.6298828125, -12.08837890625, -10.546875, -9.00537109375, -7.4638671875, -5.92236328125, -4.380859375, -2.83935546875, -1.2978515625, 0.24365234375, 1.78515625, 3.32666015625, 4.8681640625, 6.40966796875, 7.951171875, 9.49267578125, 11.0341796875, 12.57568359375, 14.1171875, 15.65869140625, 17.2001953125, 18.74169921875, 20.283203125, 21.82470703125, 23.3662109375, 24.90771484375, 26.44921875, 27.99072265625, 29.5322265625, 31.07373046875, 32.615234375, 34.15673828125, 35.6982421875, 37.23974609375, 38.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 10.0, 24.0, 69.0, 150.0, 387.0, 1692.0, 37562.0, 4146052.0, 6997.0, 890.0, 274.0, 97.0, 35.0, 18.0, 10.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-565.5, -544.015625, -522.53125, -501.046875, -479.5625, -458.078125, -436.59375, -415.109375, -393.625, -372.140625, -350.65625, -329.171875, -307.6875, -286.203125, -264.71875, -243.234375, -221.75, -200.265625, -178.78125, -157.296875, -135.8125, -114.328125, -92.84375, -71.359375, -49.875, -28.390625, -6.90625, 14.578125, 36.0625, 57.546875, 79.03125, 100.515625, 122.0, 143.484375, 164.96875, 186.453125, 207.9375, 229.421875, 250.90625, 272.390625, 293.875, 315.359375, 336.84375, 358.328125, 379.8125, 401.296875, 422.78125, 444.265625, 465.75, 487.234375, 508.71875, 530.203125, 551.6875, 573.171875, 594.65625, 616.140625, 637.625, 659.109375, 680.59375, 702.078125, 723.5625, 745.046875, 766.53125, 788.015625, 809.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 14.0, 21.0, 65.0, 149.0, 355.0, 1118.0, 1555.0, 514.0, 156.0, 74.0, 37.0, 13.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.75, -452.5625, -440.375, -428.1875, -416.0, -403.8125, -391.625, -379.4375, -367.25, -355.0625, -342.875, -330.6875, -318.5, -306.3125, -294.125, -281.9375, -269.75, -257.5625, -245.375, -233.1875, -221.0, -208.8125, -196.625, -184.4375, -172.25, -160.0625, -147.875, -135.6875, -123.5, -111.3125, -99.125, -86.9375, -74.75, -62.5625, -50.375, -38.1875, -26.0, -13.8125, -1.625, 10.5625, 22.75, 34.9375, 47.125, 59.3125, 71.5, 83.6875, 95.875, 108.0625, 120.25, 132.4375, 144.625, 156.8125, 169.0, 181.1875, 193.375, 205.5625, 217.75, 229.9375, 242.125, 254.3125, 266.5, 278.6875, 290.875, 303.0625, 315.25]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 19.0, 16.0, 35.0, 52.0, 103.0, 142.0, 201.0, 148.0, 109.0, 68.0, 35.0, 20.0, 9.0, 7.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1939.178466796875, -1887.5079345703125, -1835.8372802734375, -1784.166748046875, -1732.49609375, -1680.8255615234375, -1629.155029296875, -1577.484375, -1525.813720703125, -1474.1431884765625, -1422.4725341796875, -1370.802001953125, -1319.13134765625, -1267.4608154296875, -1215.790283203125, -1164.11962890625, -1112.4490966796875, -1060.778564453125, -1009.10791015625, -957.4373779296875, -905.7667236328125, -854.09619140625, -802.4255981445312, -750.7550048828125, -699.0844116210938, -647.413818359375, -595.7432250976562, -544.0726318359375, -492.4020690917969, -440.7314758300781, -389.0609130859375, -337.39031982421875, -285.7197265625, -234.04913330078125, -182.37855529785156, -130.70797729492188, -79.03738403320312, -27.366790771484375, 24.30377197265625, 75.974365234375, 127.64495849609375, 179.3155517578125, 230.9861297607422, 282.6567077636719, 334.3273010253906, 385.9978942871094, 437.66845703125, 489.33905029296875, 541.0096435546875, 592.6802368164062, 644.350830078125, 696.0213623046875, 747.6920166015625, 799.362548828125, 851.0331420898438, 902.7037353515625, 954.3743286132812, 1006.044921875, 1057.7154541015625, 1109.3861083984375, 1161.056640625, 1212.727294921875, 1264.3978271484375, 1316.068359375, 1367.739013671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 8.0, 13.0, 10.0, 22.0, 22.0, 24.0, 28.0, 22.0, 30.0, 33.0, 33.0, 33.0, 34.0, 41.0, 40.0, 47.0, 53.0, 66.0, 48.0, 43.0, 38.0, 37.0, 34.0, 42.0, 28.0, 34.0, 15.0, 19.0, 13.0, 13.0, 16.0, 13.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-781.1297607421875, -758.0313110351562, -734.9329223632812, -711.83447265625, -688.736083984375, -665.6376342773438, -642.5391845703125, -619.4407958984375, -596.3423461914062, -573.243896484375, -550.1455078125, -527.0470581054688, -503.9486389160156, -480.8502197265625, -457.7518005371094, -434.65338134765625, -411.5549621582031, -388.45654296875, -365.3581237792969, -342.25970458984375, -319.1612548828125, -296.0628356933594, -272.96441650390625, -249.86598205566406, -226.76756286621094, -203.6691436767578, -180.57070922851562, -157.4722900390625, -134.37387084960938, -111.27543640136719, -88.17701721191406, -65.07858276367188, -41.98016357421875, -18.881738662719727, 4.216686248779297, 27.315109252929688, 50.413536071777344, 73.511962890625, 96.61038208007812, 119.70881652832031, 142.80723571777344, 165.90565490722656, 189.00408935546875, 212.10250854492188, 235.200927734375, 258.29937744140625, 281.39776611328125, 304.4962158203125, 327.5946350097656, 350.69305419921875, 373.7914733886719, 396.889892578125, 419.98834228515625, 443.0867614746094, 466.1851806640625, 489.28363037109375, 512.3820190429688, 535.48046875, 558.578857421875, 581.6773071289062, 604.7756958007812, 627.8741455078125, 650.9725341796875, 674.0709838867188, 697.16943359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 31.0, 27.0, 48.0, 62.0, 106.0, 124.0, 222.0, 322.0, 622.0, 1028.0, 1813.0, 3528.0, 7278.0, 15554.0, 37922.0, 107503.0, 451320.0, 288742.0, 78191.0, 29003.0, 12470.0, 5844.0, 2893.0, 1543.0, 880.0, 523.0, 268.0, 203.0, 141.0, 81.0, 54.0, 39.0, 32.0, 23.0, 16.0, 8.0, 13.0, 6.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.6875, -81.2158203125, -78.744140625, -76.2724609375, -73.80078125, -71.3291015625, -68.857421875, -66.3857421875, -63.9140625, -61.4423828125, -58.970703125, -56.4990234375, -54.02734375, -51.5556640625, -49.083984375, -46.6123046875, -44.140625, -41.6689453125, -39.197265625, -36.7255859375, -34.25390625, -31.7822265625, -29.310546875, -26.8388671875, -24.3671875, -21.8955078125, -19.423828125, -16.9521484375, -14.48046875, -12.0087890625, -9.537109375, -7.0654296875, -4.59375, -2.1220703125, 0.349609375, 2.8212890625, 5.29296875, 7.7646484375, 10.236328125, 12.7080078125, 15.1796875, 17.6513671875, 20.123046875, 22.5947265625, 25.06640625, 27.5380859375, 30.009765625, 32.4814453125, 34.953125, 37.4248046875, 39.896484375, 42.3681640625, 44.83984375, 47.3115234375, 49.783203125, 52.2548828125, 54.7265625, 57.1982421875, 59.669921875, 62.1416015625, 64.61328125, 67.0849609375, 69.556640625, 72.0283203125, 74.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 3.0, 6.0, 14.0, 21.0, 14.0, 13.0, 27.0, 21.0, 28.0, 31.0, 38.0, 45.0, 53.0, 41.0, 54.0, 46.0, 62.0, 53.0, 46.0, 38.0, 42.0, 43.0, 32.0, 33.0, 17.0, 23.0, 25.0, 20.0, 18.0, 12.0, 9.0, 13.0, 9.0, 3.0, 4.0, 2.0, 9.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-66.5, -64.57373046875, -62.6474609375, -60.72119140625, -58.794921875, -56.86865234375, -54.9423828125, -53.01611328125, -51.08984375, -49.16357421875, -47.2373046875, -45.31103515625, -43.384765625, -41.45849609375, -39.5322265625, -37.60595703125, -35.6796875, -33.75341796875, -31.8271484375, -29.90087890625, -27.974609375, -26.04833984375, -24.1220703125, -22.19580078125, -20.26953125, -18.34326171875, -16.4169921875, -14.49072265625, -12.564453125, -10.63818359375, -8.7119140625, -6.78564453125, -4.859375, -2.93310546875, -1.0068359375, 0.91943359375, 2.845703125, 4.77197265625, 6.6982421875, 8.62451171875, 10.55078125, 12.47705078125, 14.4033203125, 16.32958984375, 18.255859375, 20.18212890625, 22.1083984375, 24.03466796875, 25.9609375, 27.88720703125, 29.8134765625, 31.73974609375, 33.666015625, 35.59228515625, 37.5185546875, 39.44482421875, 41.37109375, 43.29736328125, 45.2236328125, 47.14990234375, 49.076171875, 51.00244140625, 52.9287109375, 54.85498046875, 56.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 12.0, 10.0, 13.0, 21.0, 39.0, 48.0, 88.0, 142.0, 308.0, 646.0, 1701.0, 7088.0, 68428.0, 932271.0, 30940.0, 4485.0, 1218.0, 533.0, 256.0, 114.0, 62.0, 42.0, 29.0, 12.0, 18.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.75, -178.125, -170.5, -162.875, -155.25, -147.625, -140.0, -132.375, -124.75, -117.125, -109.5, -101.875, -94.25, -86.625, -79.0, -71.375, -63.75, -56.125, -48.5, -40.875, -33.25, -25.625, -18.0, -10.375, -2.75, 4.875, 12.5, 20.125, 27.75, 35.375, 43.0, 50.625, 58.25, 65.875, 73.5, 81.125, 88.75, 96.375, 104.0, 111.625, 119.25, 126.875, 134.5, 142.125, 149.75, 157.375, 165.0, 172.625, 180.25, 187.875, 195.5, 203.125, 210.75, 218.375, 226.0, 233.625, 241.25, 248.875, 256.5, 264.125, 271.75, 279.375, 287.0, 294.625, 302.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 17.0, 14.0, 17.0, 20.0, 25.0, 33.0, 36.0, 39.0, 51.0, 80.0, 92.0, 101.0, 91.0, 59.0, 46.0, 45.0, 33.0, 33.0, 24.0, 25.0, 16.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-417.25, -405.46875, -393.6875, -381.90625, -370.125, -358.34375, -346.5625, -334.78125, -323.0, -311.21875, -299.4375, -287.65625, -275.875, -264.09375, -252.3125, -240.53125, -228.75, -216.96875, -205.1875, -193.40625, -181.625, -169.84375, -158.0625, -146.28125, -134.5, -122.71875, -110.9375, -99.15625, -87.375, -75.59375, -63.8125, -52.03125, -40.25, -28.46875, -16.6875, -4.90625, 6.875, 18.65625, 30.4375, 42.21875, 54.0, 65.78125, 77.5625, 89.34375, 101.125, 112.90625, 124.6875, 136.46875, 148.25, 160.03125, 171.8125, 183.59375, 195.375, 207.15625, 218.9375, 230.71875, 242.5, 254.28125, 266.0625, 277.84375, 289.625, 301.40625, 313.1875, 324.96875, 336.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 19.0, 16.0, 32.0, 78.0, 92.0, 158.0, 370.0, 902.0, 2263.0, 7338.0, 33057.0, 809606.0, 166564.0, 20274.0, 5012.0, 1574.0, 617.0, 265.0, 127.0, 67.0, 54.0, 20.0, 15.0, 7.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5625, -51.3359375, -50.109375, -48.8828125, -47.65625, -46.4296875, -45.203125, -43.9765625, -42.75, -41.5234375, -40.296875, -39.0703125, -37.84375, -36.6171875, -35.390625, -34.1640625, -32.9375, -31.7109375, -30.484375, -29.2578125, -28.03125, -26.8046875, -25.578125, -24.3515625, -23.125, -21.8984375, -20.671875, -19.4453125, -18.21875, -16.9921875, -15.765625, -14.5390625, -13.3125, -12.0859375, -10.859375, -9.6328125, -8.40625, -7.1796875, -5.953125, -4.7265625, -3.5, -2.2734375, -1.046875, 0.1796875, 1.40625, 2.6328125, 3.859375, 5.0859375, 6.3125, 7.5390625, 8.765625, 9.9921875, 11.21875, 12.4453125, 13.671875, 14.8984375, 16.125, 17.3515625, 18.578125, 19.8046875, 21.03125, 22.2578125, 23.484375, 24.7109375, 25.9375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 10.0, 8.0, 8.0, 7.0, 11.0, 19.0, 26.0, 34.0, 36.0, 53.0, 82.0, 98.0, 121.0, 116.0, 95.0, 74.0, 38.0, 23.0, 21.0, 24.0, 14.0, 9.0, 14.0, 4.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01104736328125, -0.010699152946472168, -0.010350942611694336, -0.010002732276916504, -0.009654521942138672, -0.00930631160736084, -0.008958101272583008, -0.008609890937805176, -0.008261680603027344, -0.007913470268249512, -0.00756525993347168, -0.007217049598693848, -0.006868839263916016, -0.006520628929138184, -0.0061724185943603516, -0.0058242082595825195, -0.0054759979248046875, -0.0051277875900268555, -0.0047795772552490234, -0.004431366920471191, -0.004083156585693359, -0.0037349462509155273, -0.0033867359161376953, -0.0030385255813598633, -0.0026903152465820312, -0.0023421049118041992, -0.001993894577026367, -0.0016456842422485352, -0.0012974739074707031, -0.0009492635726928711, -0.0006010532379150391, -0.00025284290313720703, 9.5367431640625e-05, 0.00044357776641845703, 0.0007917881011962891, 0.001139998435974121, 0.0014882087707519531, 0.0018364191055297852, 0.002184629440307617, 0.0025328397750854492, 0.0028810501098632812, 0.0032292604446411133, 0.0035774707794189453, 0.003925681114196777, 0.004273891448974609, 0.004622101783752441, 0.0049703121185302734, 0.0053185224533081055, 0.0056667327880859375, 0.0060149431228637695, 0.0063631534576416016, 0.006711363792419434, 0.007059574127197266, 0.007407784461975098, 0.00775599479675293, 0.008104205131530762, 0.008452415466308594, 0.008800625801086426, 0.009148836135864258, 0.00949704647064209, 0.009845256805419922, 0.010193467140197754, 0.010541677474975586, 0.010889887809753418, 0.01123809814453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 15.0, 20.0, 36.0, 46.0, 58.0, 87.0, 152.0, 253.0, 553.0, 939.0, 2434.0, 7566.0, 33010.0, 778010.0, 195343.0, 21129.0, 5362.0, 1823.0, 790.0, 405.0, 201.0, 99.0, 61.0, 51.0, 23.0, 20.0, 7.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.01953125, -31.9140625, -30.80859375, -29.703125, -28.59765625, -27.4921875, -26.38671875, -25.28125, -24.17578125, -23.0703125, -21.96484375, -20.859375, -19.75390625, -18.6484375, -17.54296875, -16.4375, -15.33203125, -14.2265625, -13.12109375, -12.015625, -10.91015625, -9.8046875, -8.69921875, -7.59375, -6.48828125, -5.3828125, -4.27734375, -3.171875, -2.06640625, -0.9609375, 0.14453125, 1.25, 2.35546875, 3.4609375, 4.56640625, 5.671875, 6.77734375, 7.8828125, 8.98828125, 10.09375, 11.19921875, 12.3046875, 13.41015625, 14.515625, 15.62109375, 16.7265625, 17.83203125, 18.9375, 20.04296875, 21.1484375, 22.25390625, 23.359375, 24.46484375, 25.5703125, 26.67578125, 27.78125, 28.88671875, 29.9921875, 31.09765625, 32.203125, 33.30859375, 34.4140625, 35.51953125, 36.625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 5.0, 12.0, 7.0, 6.0, 11.0, 15.0, 11.0, 18.0, 21.0, 41.0, 55.0, 52.0, 87.0, 89.0, 103.0, 106.0, 80.0, 66.0, 42.0, 36.0, 27.0, 18.0, 17.0, 17.0, 12.0, 4.0, 6.0, 6.0, 4.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65625, -41.46826171875, -40.2802734375, -39.09228515625, -37.904296875, -36.71630859375, -35.5283203125, -34.34033203125, -33.15234375, -31.96435546875, -30.7763671875, -29.58837890625, -28.400390625, -27.21240234375, -26.0244140625, -24.83642578125, -23.6484375, -22.46044921875, -21.2724609375, -20.08447265625, -18.896484375, -17.70849609375, -16.5205078125, -15.33251953125, -14.14453125, -12.95654296875, -11.7685546875, -10.58056640625, -9.392578125, -8.20458984375, -7.0166015625, -5.82861328125, -4.640625, -3.45263671875, -2.2646484375, -1.07666015625, 0.111328125, 1.29931640625, 2.4873046875, 3.67529296875, 4.86328125, 6.05126953125, 7.2392578125, 8.42724609375, 9.615234375, 10.80322265625, 11.9912109375, 13.17919921875, 14.3671875, 15.55517578125, 16.7431640625, 17.93115234375, 19.119140625, 20.30712890625, 21.4951171875, 22.68310546875, 23.87109375, 25.05908203125, 26.2470703125, 27.43505859375, 28.623046875, 29.81103515625, 30.9990234375, 32.18701171875, 33.375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 17.0, 28.0, 57.0, 99.0, 455.0, 192.0, 59.0, 44.0, 15.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2002.5418701171875, -1953.463134765625, -1904.3843994140625, -1855.3056640625, -1806.2269287109375, -1757.148193359375, -1708.0694580078125, -1658.99072265625, -1609.9119873046875, -1560.833251953125, -1511.7545166015625, -1462.67578125, -1413.5970458984375, -1364.518310546875, -1315.4395751953125, -1266.36083984375, -1217.2821044921875, -1168.203369140625, -1119.1246337890625, -1070.0458984375, -1020.9671630859375, -971.888427734375, -922.8096923828125, -873.73095703125, -824.6522216796875, -775.573486328125, -726.4947509765625, -677.416015625, -628.3372802734375, -579.258544921875, -530.1798095703125, -481.10107421875, -432.0224609375, -382.9437255859375, -333.864990234375, -284.7862548828125, -235.70751953125, -186.6287841796875, -137.550048828125, -88.4713134765625, -39.392578125, 9.6861572265625, 58.764892578125, 107.8436279296875, 156.92236328125, 206.0010986328125, 255.079833984375, 304.1585693359375, 353.2373046875, 402.3160400390625, 451.394775390625, 500.4735107421875, 549.55224609375, 598.6309814453125, 647.709716796875, 696.7884521484375, 745.8671875, 794.9459228515625, 844.024658203125, 893.1033935546875, 942.18212890625, 991.2608642578125, 1040.339599609375, 1089.4183349609375, 1138.4970703125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 13.0, 4.0, 8.0, 10.0, 12.0, 16.0, 17.0, 20.0, 13.0, 24.0, 27.0, 27.0, 34.0, 62.0, 179.0, 214.0, 79.0, 38.0, 32.0, 30.0, 19.0, 20.0, 18.0, 16.0, 5.0, 8.0, 11.0, 5.0, 8.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-811.7107543945312, -781.8485107421875, -751.9862060546875, -722.1239624023438, -692.26171875, -662.3994750976562, -632.5372314453125, -602.6749267578125, -572.8126831054688, -542.950439453125, -513.088134765625, -483.22589111328125, -453.3636474609375, -423.50140380859375, -393.6391296386719, -363.77685546875, -333.91461181640625, -304.0523681640625, -274.1900939941406, -244.3278350830078, -214.465576171875, -184.6033172607422, -154.74105834960938, -124.87879943847656, -95.01654052734375, -65.15428161621094, -35.292022705078125, -5.4297637939453125, 24.4324951171875, 54.29475402832031, 84.15701293945312, 114.01927185058594, 143.881591796875, 173.7438507080078, 203.60610961914062, 233.46836853027344, 263.33062744140625, 293.19287109375, 323.0551452636719, 352.91741943359375, 382.7796630859375, 412.64190673828125, 442.5041809082031, 472.366455078125, 502.22869873046875, 532.0909423828125, 561.9532470703125, 591.8154907226562, 621.677734375, 651.5399780273438, 681.4022216796875, 711.2645263671875, 741.1267700195312, 770.989013671875, 800.851318359375, 830.7135620117188, 860.5758056640625, 890.4380493164062, 920.30029296875, 950.16259765625, 980.0248413085938, 1009.8870849609375, 1039.7493896484375, 1069.611572265625, 1099.473876953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 5.0, 3.0, 7.0, 10.0, 10.0, 12.0, 13.0, 17.0, 19.0, 22.0, 25.0, 36.0, 45.0, 55.0, 124.0, 196.0, 76.0, 62.0, 37.0, 29.0, 37.0, 26.0, 20.0, 26.0, 16.0, 15.0, 10.0, 11.0, 6.0, 2.0, 7.0, 2.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.5625, -46.3974609375, -44.232421875, -42.0673828125, -39.90234375, -37.7373046875, -35.572265625, -33.4072265625, -31.2421875, -29.0771484375, -26.912109375, -24.7470703125, -22.58203125, -20.4169921875, -18.251953125, -16.0869140625, -13.921875, -11.7568359375, -9.591796875, -7.4267578125, -5.26171875, -3.0966796875, -0.931640625, 1.2333984375, 3.3984375, 5.5634765625, 7.728515625, 9.8935546875, 12.05859375, 14.2236328125, 16.388671875, 18.5537109375, 20.71875, 22.8837890625, 25.048828125, 27.2138671875, 29.37890625, 31.5439453125, 33.708984375, 35.8740234375, 38.0390625, 40.2041015625, 42.369140625, 44.5341796875, 46.69921875, 48.8642578125, 51.029296875, 53.1943359375, 55.359375, 57.5244140625, 59.689453125, 61.8544921875, 64.01953125, 66.1845703125, 68.349609375, 70.5146484375, 72.6796875, 74.8447265625, 77.009765625, 79.1748046875, 81.33984375, 83.5048828125, 85.669921875, 87.8349609375, 90.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 10.0, 11.0, 6.0, 13.0, 15.0, 21.0, 24.0, 24.0, 60.0, 106.0, 167.0, 336.0, 721.0, 2171.0, 9514.0, 8327996.0, 40952.0, 4274.0, 1166.0, 470.0, 171.0, 114.0, 63.0, 54.0, 25.0, 16.0, 10.0, 14.0, 6.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-537.6149291992188, -522.1497192382812, -506.6845397949219, -491.2193603515625, -475.754150390625, -460.2889709472656, -444.8237609863281, -429.35858154296875, -413.89337158203125, -398.4281921386719, -382.9629821777344, -367.497802734375, -352.0325927734375, -336.5674133300781, -321.1022033691406, -305.63702392578125, -290.17181396484375, -274.7066345214844, -259.2414245605469, -243.77622985839844, -228.31103515625, -212.84585571289062, -197.38064575195312, -181.91546630859375, -166.45028686523438, -150.98509216308594, -135.5198974609375, -120.05470275878906, -104.58950805664062, -89.12432098388672, -73.65912628173828, -58.193931579589844, -42.728729248046875, -27.263534545898438, -11.798341751098633, 3.666851043701172, 19.13204574584961, 34.59723663330078, 50.06243133544922, 65.52762603759766, 80.9928207397461, 96.45801544189453, 111.92321014404297, 127.38839721679688, 142.8535919189453, 158.31878662109375, 173.7839813232422, 189.24917602539062, 204.71437072753906, 220.1795654296875, 235.64476013183594, 251.10995483398438, 266.57513427734375, 282.04034423828125, 297.5055236816406, 312.9707336425781, 328.4359130859375, 343.9010925292969, 359.3663024902344, 374.83148193359375, 390.29669189453125, 405.7618713378906, 421.2270812988281, 436.6922607421875, 452.157470703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 4.0, 7.0, 3.0, 5.0, 5.0, 7.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.5076904296875, -359.2933044433594, -345.07891845703125, -330.8645324707031, -316.650146484375, -302.4357604980469, -288.22137451171875, -274.0069885253906, -259.7926025390625, -245.57821655273438, -231.36383056640625, -217.14944458007812, -202.93505859375, -188.72067260742188, -174.50628662109375, -160.29190063476562, -146.07752990722656, -131.86314392089844, -117.64875793457031, -103.43437194824219, -89.21998596191406, -75.00560760498047, -60.791221618652344, -46.57683563232422, -32.362449645996094, -18.14806365966797, -3.9336795806884766, 10.280704498291016, 24.49509048461914, 38.70947265625, 52.923858642578125, 67.13824462890625, 81.35263061523438, 95.5670166015625, 109.78140258789062, 123.99578857421875, 138.21017456054688, 152.424560546875, 166.63894653320312, 180.85333251953125, 195.06771850585938, 209.2821044921875, 223.49649047851562, 237.71087646484375, 251.92526245117188, 266.1396484375, 280.3540344238281, 294.56842041015625, 308.78277587890625, 322.9971618652344, 337.2115478515625, 351.4259338378906, 365.64031982421875, 379.8547058105469, 394.069091796875, 408.2834777832031, 422.49786376953125, 436.7122497558594, 450.9266357421875, 465.1410217285156, 479.35540771484375, 493.5697937011719, 507.7841796875, 521.99853515625, 536.2129516601562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 10.0, 9.0, 16.0, 16.0, 30.0, 31.0, 40.0, 51.0, 60.0, 56.0, 62.0, 80.0, 77.0, 71.0, 64.0, 55.0, 40.0, 38.0, 41.0, 28.0, 24.0, 26.0, 13.0, 20.0, 6.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.3623046875, -35.849609375, -34.3369140625, -32.82421875, -31.3115234375, -29.798828125, -28.2861328125, -26.7734375, -25.2607421875, -23.748046875, -22.2353515625, -20.72265625, -19.2099609375, -17.697265625, -16.1845703125, -14.671875, -13.1591796875, -11.646484375, -10.1337890625, -8.62109375, -7.1083984375, -5.595703125, -4.0830078125, -2.5703125, -1.0576171875, 0.455078125, 1.9677734375, 3.48046875, 4.9931640625, 6.505859375, 8.0185546875, 9.53125, 11.0439453125, 12.556640625, 14.0693359375, 15.58203125, 17.0947265625, 18.607421875, 20.1201171875, 21.6328125, 23.1455078125, 24.658203125, 26.1708984375, 27.68359375, 29.1962890625, 30.708984375, 32.2216796875, 33.734375, 35.2470703125, 36.759765625, 38.2724609375, 39.78515625, 41.2978515625, 42.810546875, 44.3232421875, 45.8359375, 47.3486328125, 48.861328125, 50.3740234375, 51.88671875, 53.3994140625, 54.912109375, 56.4248046875, 57.9375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 5.0, 4.0, 8.0, 19.0, 16.0, 23.0, 41.0, 72.0, 102.0, 153.0, 257.0, 493.0, 731.0, 1441.0, 2833.0, 6169.0, 14143.0, 35592.0, 97478.0, 189860.0, 106797.0, 39414.0, 15538.0, 6551.0, 3153.0, 1453.0, 776.0, 477.0, 249.0, 163.0, 92.0, 53.0, 32.0, 25.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-409.25, -398.3515625, -387.453125, -376.5546875, -365.65625, -354.7578125, -343.859375, -332.9609375, -322.0625, -311.1640625, -300.265625, -289.3671875, -278.46875, -267.5703125, -256.671875, -245.7734375, -234.875, -223.9765625, -213.078125, -202.1796875, -191.28125, -180.3828125, -169.484375, -158.5859375, -147.6875, -136.7890625, -125.890625, -114.9921875, -104.09375, -93.1953125, -82.296875, -71.3984375, -60.5, -49.6015625, -38.703125, -27.8046875, -16.90625, -6.0078125, 4.890625, 15.7890625, 26.6875, 37.5859375, 48.484375, 59.3828125, 70.28125, 81.1796875, 92.078125, 102.9765625, 113.875, 124.7734375, 135.671875, 146.5703125, 157.46875, 168.3671875, 179.265625, 190.1640625, 201.0625, 211.9609375, 222.859375, 233.7578125, 244.65625, 255.5546875, 266.453125, 277.3515625, 288.25]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 29.0, 23.0, 29.0, 36.0, 31.0, 51.0, 45.0, 54.0, 62.0, 53.0, 68.0, 51.0, 59.0, 64.0, 53.0, 40.0, 35.0, 28.0, 23.0, 13.0, 17.0, 18.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.19921875, -54.1484375, -52.09765625, -50.046875, -47.99609375, -45.9453125, -43.89453125, -41.84375, -39.79296875, -37.7421875, -35.69140625, -33.640625, -31.58984375, -29.5390625, -27.48828125, -25.4375, -23.38671875, -21.3359375, -19.28515625, -17.234375, -15.18359375, -13.1328125, -11.08203125, -9.03125, -6.98046875, -4.9296875, -2.87890625, -0.828125, 1.22265625, 3.2734375, 5.32421875, 7.375, 9.42578125, 11.4765625, 13.52734375, 15.578125, 17.62890625, 19.6796875, 21.73046875, 23.78125, 25.83203125, 27.8828125, 29.93359375, 31.984375, 34.03515625, 36.0859375, 38.13671875, 40.1875, 42.23828125, 44.2890625, 46.33984375, 48.390625, 50.44140625, 52.4921875, 54.54296875, 56.59375, 58.64453125, 60.6953125, 62.74609375, 64.796875, 66.84765625, 68.8984375, 70.94921875, 73.0]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 14.0, 22.0, 34.0, 64.0, 56.0, 68.0, 47.0, 50.0, 31.0, 14.0, 17.0, 11.0, 8.0, 9.0, 6.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.912353515625, -344.955322265625, -332.998291015625, -321.041259765625, -309.0841979980469, -297.1271667480469, -285.1701354980469, -273.2131042480469, -261.2560729980469, -249.29904174804688, -237.3419952392578, -225.3849639892578, -213.4279327392578, -201.47088623046875, -189.51385498046875, -177.55682373046875, -165.5997772216797, -153.6427459716797, -141.68569946289062, -129.72866821289062, -117.77163696289062, -105.8145980834961, -93.85755920410156, -81.90052795410156, -69.94348907470703, -57.986454010009766, -46.0294189453125, -34.07238006591797, -22.115345001220703, -10.158309936523438, 1.7987289428710938, 13.755760192871094, 25.712799072265625, 37.66983413696289, 49.626869201660156, 61.58390808105469, 73.54093933105469, 85.49797821044922, 97.45501708984375, 109.41204833984375, 121.36908721923828, 133.3261260986328, 145.2831573486328, 157.24020385742188, 169.19723510742188, 181.15426635742188, 193.11129760742188, 205.06832885742188, 217.02537536621094, 228.98240661621094, 240.939453125, 252.896484375, 264.853515625, 276.810546875, 288.767578125, 300.724609375, 312.6816711425781, 324.6387023925781, 336.5957336425781, 348.55279541015625, 360.50982666015625, 372.46685791015625, 384.42388916015625, 396.38092041015625, 408.33795166015625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 6.0, 6.0, 3.0, 5.0, 2.0, 9.0, 12.0, 21.0, 67.0, 87.0, 89.0, 53.0, 39.0, 17.0, 11.0, 10.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-300.09393310546875, -287.365966796875, -274.63800048828125, -261.9100646972656, -249.18209838867188, -236.45413208007812, -223.72616577148438, -210.9982147216797, -198.270263671875, -185.54229736328125, -172.81434631347656, -160.0863800048828, -147.35842895507812, -134.63046264648438, -121.90250396728516, -109.17454528808594, -96.44657897949219, -83.71862030029297, -70.99066162109375, -58.262699127197266, -45.53474044799805, -32.80678176879883, -20.078819274902344, -7.350860595703125, 5.377098083496094, 18.105056762695312, 30.833017349243164, 43.560977935791016, 56.288936614990234, 69.01689147949219, 81.74485778808594, 94.47281646728516, 107.20077514648438, 119.9287338256836, 132.6566925048828, 145.38465881347656, 158.11260986328125, 170.840576171875, 183.56854248046875, 196.29649353027344, 209.02444458007812, 221.75241088867188, 234.48036193847656, 247.2083282470703, 259.936279296875, 272.66424560546875, 285.3922119140625, 298.12017822265625, 310.84814453125, 323.57611083984375, 336.3040771484375, 349.0320129394531, 361.7599792480469, 374.4879455566406, 387.2159118652344, 399.94384765625, 412.67181396484375, 425.3997802734375, 438.12774658203125, 450.8556823730469, 463.5836486816406, 476.3116149902344, 489.0395812988281, 501.76751708984375, 514.4954833984375]}, "eval/loss": 0.6976933479309082, "eval/wer": 0.12308607695358985, "eval/runtime": 636.3851, "eval/samples_per_second": 4.152, "eval/steps_per_second": 0.52, "train/train_runtime": 134751.1179, "train/train_samples_per_second": 5.295, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 1.8353804810692644} \ No newline at end of file +{"train/loss": 0.2868, "train/learning_rate": 1.1267605633802817e-08, "train/epoch": 25.0, "train/global_step": 22300, "_runtime": 135763, "_timestamp": 1648277107, "_step": 22315, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 7.0, 6.0, 24.0, 16.0, 17.0, 28.0, 27.0, 41.0, 41.0, 57.0, 59.0, 69.0, 82.0, 96.0, 86.0, 78.0, 58.0, 45.0, 38.0, 26.0, 29.0, 15.0, 12.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-151.30198669433594, -147.59866333007812, -143.8953399658203, -140.1920166015625, -136.4886932373047, -132.78536987304688, -129.08204650878906, -125.37871551513672, -121.6753921508789, -117.9720687866211, -114.26874542236328, -110.56542205810547, -106.86209106445312, -103.15876770019531, -99.4554443359375, -95.75212097167969, -92.04879760742188, -88.34547424316406, -84.64215087890625, -80.93882751464844, -77.23550415039062, -73.53218078613281, -69.82884979248047, -66.12552642822266, -62.422203063964844, -58.71887969970703, -55.01555633544922, -51.31222915649414, -47.60890579223633, -43.905582427978516, -40.20225524902344, -36.498931884765625, -32.795616149902344, -29.09229278564453, -25.388967514038086, -21.68564224243164, -17.982318878173828, -14.278995513916016, -10.57567024230957, -6.872344970703125, -3.1690216064453125, 0.5343027114868164, 4.237627029418945, 7.940951347351074, 11.644275665283203, 15.347599029541016, 19.05092430114746, 22.754249572753906, 26.45757293701172, 30.16089630126953, 33.864219665527344, 37.56754684448242, 41.270870208740234, 44.97419357299805, 48.677520751953125, 52.38084411621094, 56.08416748046875, 59.78749084472656, 63.490814208984375, 67.19413757324219, 70.8974609375, 74.60078430175781, 78.30411529541016, 82.00743865966797, 85.71076202392578]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 5.0, 9.0, 6.0, 9.0, 9.0, 17.0, 11.0, 20.0, 22.0, 17.0, 22.0, 27.0, 28.0, 41.0, 43.0, 41.0, 38.0, 29.0, 37.0, 41.0, 42.0, 39.0, 49.0, 32.0, 36.0, 39.0, 43.0, 36.0, 28.0, 21.0, 19.0, 23.0, 23.0, 17.0, 19.0, 14.0, 11.0, 9.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-68.2059097290039, -65.8742904663086, -63.54267501831055, -61.2110595703125, -58.87944030761719, -56.54782485961914, -54.216209411621094, -51.88459014892578, -49.552974700927734, -47.22135925292969, -44.889739990234375, -42.55812454223633, -40.22650909423828, -37.89488983154297, -35.56327438354492, -33.231658935546875, -30.900039672851562, -28.568422317504883, -26.236804962158203, -23.905189514160156, -21.573572158813477, -19.241954803466797, -16.91033935546875, -14.57872200012207, -12.24710464477539, -9.915487289428711, -7.583870887756348, -5.252254009246826, -2.9206371307373047, -0.589019775390625, 1.7425966262817383, 4.074213027954102, 6.4058380126953125, 8.737455368041992, 11.069071769714355, 13.400688171386719, 15.732305526733398, 18.063922882080078, 20.395538330078125, 22.727155685424805, 25.058773040771484, 27.390390396118164, 29.722007751464844, 32.05362319946289, 34.38523864746094, 36.71685791015625, 39.0484733581543, 41.380088806152344, 43.711708068847656, 46.0433235168457, 48.374942779541016, 50.70655822753906, 53.038177490234375, 55.36979293823242, 57.70140838623047, 60.03302764892578, 62.36464309692383, 64.69625854492188, 67.02787780761719, 69.3594970703125, 71.69110870361328, 74.0227279663086, 76.3543472290039, 78.68595886230469, 81.017578125]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 12.0, 18.0, 28.0, 29.0, 53.0, 108.0, 107.0, 163.0, 256.0, 330.0, 564.0, 776.0, 1236.0, 1872.0, 3065.0, 4669.0, 7626.0, 12886.0, 22633.0, 41141.0, 80592.0, 188661.0, 947081.0, 2287244.0, 348355.0, 115935.0, 55682.0, 29584.0, 16883.0, 9812.0, 5959.0, 3823.0, 2390.0, 1520.0, 1027.0, 673.0, 441.0, 317.0, 229.0, 154.0, 100.0, 75.0, 41.0, 39.0, 20.0, 21.0, 11.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-244.5, -236.67578125, -228.8515625, -221.02734375, -213.203125, -205.37890625, -197.5546875, -189.73046875, -181.90625, -174.08203125, -166.2578125, -158.43359375, -150.609375, -142.78515625, -134.9609375, -127.13671875, -119.3125, -111.48828125, -103.6640625, -95.83984375, -88.015625, -80.19140625, -72.3671875, -64.54296875, -56.71875, -48.89453125, -41.0703125, -33.24609375, -25.421875, -17.59765625, -9.7734375, -1.94921875, 5.875, 13.69921875, 21.5234375, 29.34765625, 37.171875, 44.99609375, 52.8203125, 60.64453125, 68.46875, 76.29296875, 84.1171875, 91.94140625, 99.765625, 107.58984375, 115.4140625, 123.23828125, 131.0625, 138.88671875, 146.7109375, 154.53515625, 162.359375, 170.18359375, 178.0078125, 185.83203125, 193.65625, 201.48046875, 209.3046875, 217.12890625, 224.953125, 232.77734375, 240.6015625, 248.42578125, 256.25]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 5.0, 15.0, 13.0, 16.0, 16.0, 22.0, 22.0, 35.0, 32.0, 24.0, 40.0, 39.0, 38.0, 48.0, 53.0, 53.0, 38.0, 57.0, 37.0, 41.0, 35.0, 37.0, 40.0, 33.0, 40.0, 27.0, 18.0, 25.0, 19.0, 18.0, 10.0, 14.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.5, -73.923828125, -71.34765625, -68.771484375, -66.1953125, -63.619140625, -61.04296875, -58.466796875, -55.890625, -53.314453125, -50.73828125, -48.162109375, -45.5859375, -43.009765625, -40.43359375, -37.857421875, -35.28125, -32.705078125, -30.12890625, -27.552734375, -24.9765625, -22.400390625, -19.82421875, -17.248046875, -14.671875, -12.095703125, -9.51953125, -6.943359375, -4.3671875, -1.791015625, 0.78515625, 3.361328125, 5.9375, 8.513671875, 11.08984375, 13.666015625, 16.2421875, 18.818359375, 21.39453125, 23.970703125, 26.546875, 29.123046875, 31.69921875, 34.275390625, 36.8515625, 39.427734375, 42.00390625, 44.580078125, 47.15625, 49.732421875, 52.30859375, 54.884765625, 57.4609375, 60.037109375, 62.61328125, 65.189453125, 67.765625, 70.341796875, 72.91796875, 75.494140625, 78.0703125, 80.646484375, 83.22265625, 85.798828125, 88.375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 20.0, 13.0, 26.0, 36.0, 60.0, 61.0, 107.0, 158.0, 234.0, 376.0, 559.0, 822.0, 1219.0, 1891.0, 2835.0, 4483.0, 6999.0, 11484.0, 18649.0, 30897.0, 51990.0, 92909.0, 172017.0, 372599.0, 1327744.0, 1326657.0, 371097.0, 172183.0, 92267.0, 52629.0, 30890.0, 18748.0, 11327.0, 7083.0, 4602.0, 2971.0, 1872.0, 1273.0, 849.0, 554.0, 355.0, 248.0, 153.0, 111.0, 74.0, 40.0, 28.0, 33.0, 17.0, 10.0, 14.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-139.5, -135.0, -130.5, -126.0, -121.5, -117.0, -112.5, -108.0, -103.5, -99.0, -94.5, -90.0, -85.5, -81.0, -76.5, -72.0, -67.5, -63.0, -58.5, -54.0, -49.5, -45.0, -40.5, -36.0, -31.5, -27.0, -22.5, -18.0, -13.5, -9.0, -4.5, 0.0, 4.5, 9.0, 13.5, 18.0, 22.5, 27.0, 31.5, 36.0, 40.5, 45.0, 49.5, 54.0, 58.5, 63.0, 67.5, 72.0, 76.5, 81.0, 85.5, 90.0, 94.5, 99.0, 103.5, 108.0, 112.5, 117.0, 121.5, 126.0, 130.5, 135.0, 139.5, 144.0, 148.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 10.0, 14.0, 13.0, 21.0, 25.0, 29.0, 37.0, 45.0, 39.0, 60.0, 77.0, 63.0, 91.0, 122.0, 121.0, 154.0, 196.0, 273.0, 395.0, 473.0, 384.0, 271.0, 196.0, 160.0, 122.0, 113.0, 95.0, 72.0, 69.0, 50.0, 55.0, 37.0, 27.0, 33.0, 22.0, 22.0, 19.0, 15.0, 6.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.5, -37.1904296875, -35.880859375, -34.5712890625, -33.26171875, -31.9521484375, -30.642578125, -29.3330078125, -28.0234375, -26.7138671875, -25.404296875, -24.0947265625, -22.78515625, -21.4755859375, -20.166015625, -18.8564453125, -17.546875, -16.2373046875, -14.927734375, -13.6181640625, -12.30859375, -10.9990234375, -9.689453125, -8.3798828125, -7.0703125, -5.7607421875, -4.451171875, -3.1416015625, -1.83203125, -0.5224609375, 0.787109375, 2.0966796875, 3.40625, 4.7158203125, 6.025390625, 7.3349609375, 8.64453125, 9.9541015625, 11.263671875, 12.5732421875, 13.8828125, 15.1923828125, 16.501953125, 17.8115234375, 19.12109375, 20.4306640625, 21.740234375, 23.0498046875, 24.359375, 25.6689453125, 26.978515625, 28.2880859375, 29.59765625, 30.9072265625, 32.216796875, 33.5263671875, 34.8359375, 36.1455078125, 37.455078125, 38.7646484375, 40.07421875, 41.3837890625, 42.693359375, 44.0029296875, 45.3125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 9.0, 10.0, 12.0, 17.0, 13.0, 20.0, 25.0, 30.0, 36.0, 38.0, 49.0, 56.0, 69.0, 71.0, 65.0, 79.0, 60.0, 48.0, 52.0, 39.0, 31.0, 24.0, 20.0, 18.0, 16.0, 11.0, 11.0, 12.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.65741729736328, -107.41815948486328, -104.17890930175781, -100.93965148925781, -97.70040130615234, -94.46114349365234, -91.22189331054688, -87.98263549804688, -84.7433853149414, -81.5041275024414, -78.26487731933594, -75.02561950683594, -71.78636932373047, -68.54711151123047, -65.307861328125, -62.068603515625, -58.829349517822266, -55.59009552001953, -52.3508415222168, -49.11158752441406, -45.87233352661133, -42.633079528808594, -39.393821716308594, -36.154571533203125, -32.915313720703125, -29.67605972290039, -26.436805725097656, -23.197551727294922, -19.958297729492188, -16.71904182434082, -13.479787826538086, -10.240533828735352, -7.00128173828125, -3.7620275020599365, -0.522773265838623, 2.7164812088012695, 5.955735206604004, 9.194990158081055, 12.434244155883789, 15.673498153686523, 18.912752151489258, 22.152006149291992, 25.391260147094727, 28.630516052246094, 31.869770050048828, 35.10902404785156, 38.3482780456543, 41.58753204345703, 44.826786041259766, 48.0660400390625, 51.305294036865234, 54.54454803466797, 57.7838020324707, 61.02305603027344, 64.26231384277344, 67.5015640258789, 70.7408218383789, 73.9800796508789, 77.21932983398438, 80.45858764648438, 83.69783782958984, 86.93709564208984, 90.17634582519531, 93.41560363769531, 96.65485382080078]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 8.0, 6.0, 13.0, 15.0, 16.0, 26.0, 25.0, 34.0, 25.0, 30.0, 30.0, 37.0, 28.0, 49.0, 48.0, 43.0, 34.0, 41.0, 42.0, 50.0, 34.0, 32.0, 41.0, 42.0, 37.0, 29.0, 22.0, 22.0, 21.0, 22.0, 16.0, 17.0, 9.0, 16.0, 8.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-101.45652770996094, -98.67851257324219, -95.9004898071289, -93.12247467041016, -90.34445190429688, -87.56643676757812, -84.78842163085938, -82.0103988647461, -79.23237609863281, -76.45436096191406, -73.67633819580078, -70.89832305908203, -68.12030029296875, -65.34228515625, -62.564266204833984, -59.78624725341797, -57.00823211669922, -54.2302131652832, -51.45219421386719, -48.67417907714844, -45.896156311035156, -43.118141174316406, -40.34012222290039, -37.562103271484375, -34.78408432006836, -32.006065368652344, -29.228046417236328, -26.450029373168945, -23.67201042175293, -20.893991470336914, -18.11597442626953, -15.337955474853516, -12.559944152832031, -9.781925201416016, -7.003907203674316, -4.225889205932617, -1.4478702545166016, 1.330148696899414, 4.108165740966797, 6.8861846923828125, 9.664203643798828, 12.442222595214844, 15.220240592956543, 17.998258590698242, 20.776277542114258, 23.554296493530273, 26.332313537597656, 29.110332489013672, 31.888351440429688, 34.6663703918457, 37.44438934326172, 40.22240447998047, 43.00042724609375, 45.7784423828125, 48.556461334228516, 51.33448028564453, 54.11249923706055, 56.89051818847656, 59.66853713989258, 62.446556091308594, 65.22457122802734, 68.00259399414062, 70.78060913085938, 73.55862426757812, 76.3366470336914]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 9.0, 26.0, 24.0, 39.0, 48.0, 84.0, 112.0, 173.0, 247.0, 394.0, 600.0, 972.0, 1362.0, 2078.0, 3369.0, 5550.0, 9380.0, 15744.0, 27919.0, 51158.0, 97672.0, 192739.0, 285786.0, 164591.0, 83739.0, 44649.0, 24379.0, 13724.0, 8155.0, 5048.0, 3137.0, 2009.0, 1239.0, 806.0, 506.0, 340.0, 213.0, 175.0, 123.0, 72.0, 50.0, 37.0, 24.0, 14.0, 15.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-136.375, -132.1640625, -127.953125, -123.7421875, -119.53125, -115.3203125, -111.109375, -106.8984375, -102.6875, -98.4765625, -94.265625, -90.0546875, -85.84375, -81.6328125, -77.421875, -73.2109375, -69.0, -64.7890625, -60.578125, -56.3671875, -52.15625, -47.9453125, -43.734375, -39.5234375, -35.3125, -31.1015625, -26.890625, -22.6796875, -18.46875, -14.2578125, -10.046875, -5.8359375, -1.625, 2.5859375, 6.796875, 11.0078125, 15.21875, 19.4296875, 23.640625, 27.8515625, 32.0625, 36.2734375, 40.484375, 44.6953125, 48.90625, 53.1171875, 57.328125, 61.5390625, 65.75, 69.9609375, 74.171875, 78.3828125, 82.59375, 86.8046875, 91.015625, 95.2265625, 99.4375, 103.6484375, 107.859375, 112.0703125, 116.28125, 120.4921875, 124.703125, 128.9140625, 133.125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 8.0, 8.0, 18.0, 17.0, 18.0, 25.0, 28.0, 28.0, 36.0, 27.0, 40.0, 37.0, 43.0, 51.0, 56.0, 49.0, 43.0, 38.0, 38.0, 37.0, 35.0, 36.0, 46.0, 27.0, 27.0, 29.0, 15.0, 22.0, 27.0, 11.0, 17.0, 9.0, 14.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-101.3125, -98.515625, -95.71875, -92.921875, -90.125, -87.328125, -84.53125, -81.734375, -78.9375, -76.140625, -73.34375, -70.546875, -67.75, -64.953125, -62.15625, -59.359375, -56.5625, -53.765625, -50.96875, -48.171875, -45.375, -42.578125, -39.78125, -36.984375, -34.1875, -31.390625, -28.59375, -25.796875, -23.0, -20.203125, -17.40625, -14.609375, -11.8125, -9.015625, -6.21875, -3.421875, -0.625, 2.171875, 4.96875, 7.765625, 10.5625, 13.359375, 16.15625, 18.953125, 21.75, 24.546875, 27.34375, 30.140625, 32.9375, 35.734375, 38.53125, 41.328125, 44.125, 46.921875, 49.71875, 52.515625, 55.3125, 58.109375, 60.90625, 63.703125, 66.5, 69.296875, 72.09375, 74.890625, 77.6875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 10.0, 7.0, 13.0, 19.0, 24.0, 34.0, 45.0, 66.0, 85.0, 112.0, 158.0, 243.0, 334.0, 523.0, 690.0, 988.0, 1460.0, 2228.0, 3397.0, 5229.0, 8498.0, 14213.0, 24711.0, 45831.0, 94309.0, 216723.0, 322761.0, 151198.0, 68890.0, 35120.0, 19395.0, 11253.0, 6939.0, 4341.0, 2797.0, 1896.0, 1244.0, 798.0, 608.0, 414.0, 270.0, 184.0, 124.0, 102.0, 74.0, 62.0, 41.0, 31.0, 19.0, 10.0, 9.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 4.0], "bins": [-166.0, -160.859375, -155.71875, -150.578125, -145.4375, -140.296875, -135.15625, -130.015625, -124.875, -119.734375, -114.59375, -109.453125, -104.3125, -99.171875, -94.03125, -88.890625, -83.75, -78.609375, -73.46875, -68.328125, -63.1875, -58.046875, -52.90625, -47.765625, -42.625, -37.484375, -32.34375, -27.203125, -22.0625, -16.921875, -11.78125, -6.640625, -1.5, 3.640625, 8.78125, 13.921875, 19.0625, 24.203125, 29.34375, 34.484375, 39.625, 44.765625, 49.90625, 55.046875, 60.1875, 65.328125, 70.46875, 75.609375, 80.75, 85.890625, 91.03125, 96.171875, 101.3125, 106.453125, 111.59375, 116.734375, 121.875, 127.015625, 132.15625, 137.296875, 142.4375, 147.578125, 152.71875, 157.859375, 163.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 10.0, 19.0, 18.0, 21.0, 16.0, 20.0, 21.0, 24.0, 28.0, 34.0, 32.0, 41.0, 50.0, 37.0, 50.0, 44.0, 42.0, 44.0, 38.0, 52.0, 42.0, 51.0, 31.0, 39.0, 32.0, 18.0, 23.0, 11.0, 24.0, 16.0, 6.0, 12.0, 12.0, 6.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.21875, -57.23388671875, -55.2490234375, -53.26416015625, -51.279296875, -49.29443359375, -47.3095703125, -45.32470703125, -43.33984375, -41.35498046875, -39.3701171875, -37.38525390625, -35.400390625, -33.41552734375, -31.4306640625, -29.44580078125, -27.4609375, -25.47607421875, -23.4912109375, -21.50634765625, -19.521484375, -17.53662109375, -15.5517578125, -13.56689453125, -11.58203125, -9.59716796875, -7.6123046875, -5.62744140625, -3.642578125, -1.65771484375, 0.3271484375, 2.31201171875, 4.296875, 6.28173828125, 8.2666015625, 10.25146484375, 12.236328125, 14.22119140625, 16.2060546875, 18.19091796875, 20.17578125, 22.16064453125, 24.1455078125, 26.13037109375, 28.115234375, 30.10009765625, 32.0849609375, 34.06982421875, 36.0546875, 38.03955078125, 40.0244140625, 42.00927734375, 43.994140625, 45.97900390625, 47.9638671875, 49.94873046875, 51.93359375, 53.91845703125, 55.9033203125, 57.88818359375, 59.873046875, 61.85791015625, 63.8427734375, 65.82763671875, 67.8125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 6.0, 16.0, 10.0, 16.0, 17.0, 25.0, 34.0, 50.0, 68.0, 106.0, 120.0, 207.0, 333.0, 490.0, 827.0, 1416.0, 2519.0, 5305.0, 14173.0, 68530.0, 698566.0, 211555.0, 27635.0, 8116.0, 3588.0, 1828.0, 1113.0, 652.0, 415.0, 286.0, 164.0, 112.0, 81.0, 50.0, 35.0, 36.0, 16.0, 13.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-159.875, -155.13671875, -150.3984375, -145.66015625, -140.921875, -136.18359375, -131.4453125, -126.70703125, -121.96875, -117.23046875, -112.4921875, -107.75390625, -103.015625, -98.27734375, -93.5390625, -88.80078125, -84.0625, -79.32421875, -74.5859375, -69.84765625, -65.109375, -60.37109375, -55.6328125, -50.89453125, -46.15625, -41.41796875, -36.6796875, -31.94140625, -27.203125, -22.46484375, -17.7265625, -12.98828125, -8.25, -3.51171875, 1.2265625, 5.96484375, 10.703125, 15.44140625, 20.1796875, 24.91796875, 29.65625, 34.39453125, 39.1328125, 43.87109375, 48.609375, 53.34765625, 58.0859375, 62.82421875, 67.5625, 72.30078125, 77.0390625, 81.77734375, 86.515625, 91.25390625, 95.9921875, 100.73046875, 105.46875, 110.20703125, 114.9453125, 119.68359375, 124.421875, 129.16015625, 133.8984375, 138.63671875, 143.375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 15.0, 17.0, 22.0, 48.0, 69.0, 143.0, 243.0, 187.0, 101.0, 54.0, 45.0, 15.0, 18.0, 6.0, 6.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007694244384765625, -0.007286727428436279, -0.006879210472106934, -0.006471693515777588, -0.006064176559448242, -0.0056566596031188965, -0.005249142646789551, -0.004841625690460205, -0.004434108734130859, -0.004026591777801514, -0.003619074821472168, -0.0032115578651428223, -0.0028040409088134766, -0.002396523952484131, -0.001989006996154785, -0.0015814900398254395, -0.0011739730834960938, -0.000766456127166748, -0.00035893917083740234, 4.857778549194336e-05, 0.00045609474182128906, 0.0008636116981506348, 0.0012711286544799805, 0.0016786456108093262, 0.002086162567138672, 0.0024936795234680176, 0.0029011964797973633, 0.003308713436126709, 0.0037162303924560547, 0.0041237473487854, 0.004531264305114746, 0.004938781261444092, 0.0053462982177734375, 0.005753815174102783, 0.006161332130432129, 0.006568849086761475, 0.00697636604309082, 0.007383882999420166, 0.007791399955749512, 0.008198916912078857, 0.008606433868408203, 0.009013950824737549, 0.009421467781066895, 0.00982898473739624, 0.010236501693725586, 0.010644018650054932, 0.011051535606384277, 0.011459052562713623, 0.011866569519042969, 0.012274086475372314, 0.01268160343170166, 0.013089120388031006, 0.013496637344360352, 0.013904154300689697, 0.014311671257019043, 0.014719188213348389, 0.015126705169677734, 0.01553422212600708, 0.015941739082336426, 0.01634925603866577, 0.016756772994995117, 0.017164289951324463, 0.01757180690765381, 0.017979323863983154, 0.0183868408203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 5.0, 9.0, 10.0, 16.0, 20.0, 31.0, 37.0, 58.0, 74.0, 94.0, 134.0, 155.0, 234.0, 334.0, 498.0, 635.0, 947.0, 1422.0, 2075.0, 3224.0, 5257.0, 9635.0, 17862.0, 37229.0, 86105.0, 228337.0, 372032.0, 157571.0, 61598.0, 27801.0, 14210.0, 7636.0, 4549.0, 2787.0, 1787.0, 1180.0, 863.0, 599.0, 406.0, 295.0, 219.0, 142.0, 127.0, 84.0, 67.0, 48.0, 41.0, 31.0, 10.0, 13.0, 5.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-60.75, -58.8701171875, -56.990234375, -55.1103515625, -53.23046875, -51.3505859375, -49.470703125, -47.5908203125, -45.7109375, -43.8310546875, -41.951171875, -40.0712890625, -38.19140625, -36.3115234375, -34.431640625, -32.5517578125, -30.671875, -28.7919921875, -26.912109375, -25.0322265625, -23.15234375, -21.2724609375, -19.392578125, -17.5126953125, -15.6328125, -13.7529296875, -11.873046875, -9.9931640625, -8.11328125, -6.2333984375, -4.353515625, -2.4736328125, -0.59375, 1.2861328125, 3.166015625, 5.0458984375, 6.92578125, 8.8056640625, 10.685546875, 12.5654296875, 14.4453125, 16.3251953125, 18.205078125, 20.0849609375, 21.96484375, 23.8447265625, 25.724609375, 27.6044921875, 29.484375, 31.3642578125, 33.244140625, 35.1240234375, 37.00390625, 38.8837890625, 40.763671875, 42.6435546875, 44.5234375, 46.4033203125, 48.283203125, 50.1630859375, 52.04296875, 53.9228515625, 55.802734375, 57.6826171875, 59.5625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 3.0, 13.0, 13.0, 15.0, 23.0, 27.0, 25.0, 44.0, 70.0, 45.0, 71.0, 79.0, 96.0, 93.0, 78.0, 59.0, 47.0, 30.0, 30.0, 28.0, 22.0, 17.0, 15.0, 9.0, 4.0, 12.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.265625, -19.658203125, -19.05078125, -18.443359375, -17.8359375, -17.228515625, -16.62109375, -16.013671875, -15.40625, -14.798828125, -14.19140625, -13.583984375, -12.9765625, -12.369140625, -11.76171875, -11.154296875, -10.546875, -9.939453125, -9.33203125, -8.724609375, -8.1171875, -7.509765625, -6.90234375, -6.294921875, -5.6875, -5.080078125, -4.47265625, -3.865234375, -3.2578125, -2.650390625, -2.04296875, -1.435546875, -0.828125, -0.220703125, 0.38671875, 0.994140625, 1.6015625, 2.208984375, 2.81640625, 3.423828125, 4.03125, 4.638671875, 5.24609375, 5.853515625, 6.4609375, 7.068359375, 7.67578125, 8.283203125, 8.890625, 9.498046875, 10.10546875, 10.712890625, 11.3203125, 11.927734375, 12.53515625, 13.142578125, 13.75, 14.357421875, 14.96484375, 15.572265625, 16.1796875, 16.787109375, 17.39453125, 18.001953125, 18.609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 4.0, 14.0, 8.0, 17.0, 24.0, 13.0, 27.0, 36.0, 35.0, 48.0, 62.0, 71.0, 63.0, 84.0, 88.0, 73.0, 60.0, 51.0, 34.0, 33.0, 36.0, 29.0, 16.0, 17.0, 13.0, 10.0, 8.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-125.12419128417969, -121.61530303955078, -118.10641479492188, -114.5975341796875, -111.0886459350586, -107.57975769042969, -104.07087707519531, -100.5619888305664, -97.0531005859375, -93.5442123413086, -90.03532409667969, -86.52644348144531, -83.0175552368164, -79.5086669921875, -75.99978637695312, -72.49089813232422, -68.98200988769531, -65.4731216430664, -61.964237213134766, -58.455352783203125, -54.94646453857422, -51.43757629394531, -47.92869186401367, -44.41980743408203, -40.910919189453125, -37.40203094482422, -33.89314651489258, -30.384260177612305, -26.87537384033203, -23.366487503051758, -19.857601165771484, -16.34871482849121, -12.839820861816406, -9.330934524536133, -5.822048187255859, -2.313161849975586, 1.1957244873046875, 4.704610824584961, 8.213497161865234, 11.722383499145508, 15.231269836425781, 18.740156173706055, 22.249042510986328, 25.7579288482666, 29.266815185546875, 32.77570343017578, 36.28458786010742, 39.79347229003906, 43.30236053466797, 46.811248779296875, 50.320133209228516, 53.829017639160156, 57.33790588378906, 60.84679412841797, 64.35568237304688, 67.86456298828125, 71.37345123291016, 74.88233947753906, 78.39122009277344, 81.90010833740234, 85.40899658203125, 88.91788482666016, 92.42677307128906, 95.93565368652344, 99.44454193115234]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 5.0, 11.0, 7.0, 8.0, 15.0, 12.0, 26.0, 22.0, 27.0, 34.0, 29.0, 34.0, 38.0, 34.0, 38.0, 43.0, 47.0, 46.0, 32.0, 33.0, 39.0, 44.0, 35.0, 42.0, 38.0, 38.0, 37.0, 26.0, 20.0, 15.0, 22.0, 19.0, 18.0, 9.0, 12.0, 18.0, 8.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-89.54629516601562, -87.0429458618164, -84.53958892822266, -82.03623962402344, -79.53289031982422, -77.029541015625, -74.52618408203125, -72.02283477783203, -69.51948547363281, -67.0161361694336, -64.51277923583984, -62.009429931640625, -59.506080627441406, -57.00272750854492, -54.49937438964844, -51.99602508544922, -49.49266815185547, -46.989315032958984, -44.485965728759766, -41.98261260986328, -39.47926330566406, -36.97591018676758, -34.472557067871094, -31.969205856323242, -29.46585464477539, -26.96250343322754, -24.459152221679688, -21.955799102783203, -19.45244789123535, -16.9490966796875, -14.445744514465332, -11.942392349243164, -9.439041137695312, -6.935689449310303, -4.432337760925293, -1.9289860725402832, 0.5743656158447266, 3.077716827392578, 5.581068992614746, 8.084421157836914, 10.587772369384766, 13.091123580932617, 15.594475746154785, 18.097827911376953, 20.601179122924805, 23.104530334472656, 25.60788345336914, 28.111234664916992, 30.614585876464844, 33.11793899536133, 35.62128829956055, 38.12464141845703, 40.62799072265625, 43.131343841552734, 45.63469696044922, 48.13804626464844, 50.64139938354492, 53.144752502441406, 55.648101806640625, 58.15145492553711, 60.654808044433594, 63.15815734863281, 65.66150665283203, 68.16486358642578, 70.668212890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 32.0, 44.0, 69.0, 95.0, 152.0, 197.0, 315.0, 444.0, 679.0, 994.0, 1504.0, 2203.0, 3243.0, 5054.0, 7190.0, 10846.0, 16108.0, 24199.0, 36866.0, 57281.0, 89018.0, 142174.0, 203276.0, 159389.0, 100229.0, 64158.0, 41377.0, 27044.0, 17762.0, 11889.0, 8055.0, 5426.0, 3711.0, 2378.0, 1686.0, 1085.0, 757.0, 513.0, 335.0, 221.0, 146.0, 128.0, 64.0, 60.0, 34.0, 21.0, 26.0, 4.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0], "bins": [-95.1875, -92.177734375, -89.16796875, -86.158203125, -83.1484375, -80.138671875, -77.12890625, -74.119140625, -71.109375, -68.099609375, -65.08984375, -62.080078125, -59.0703125, -56.060546875, -53.05078125, -50.041015625, -47.03125, -44.021484375, -41.01171875, -38.001953125, -34.9921875, -31.982421875, -28.97265625, -25.962890625, -22.953125, -19.943359375, -16.93359375, -13.923828125, -10.9140625, -7.904296875, -4.89453125, -1.884765625, 1.125, 4.134765625, 7.14453125, 10.154296875, 13.1640625, 16.173828125, 19.18359375, 22.193359375, 25.203125, 28.212890625, 31.22265625, 34.232421875, 37.2421875, 40.251953125, 43.26171875, 46.271484375, 49.28125, 52.291015625, 55.30078125, 58.310546875, 61.3203125, 64.330078125, 67.33984375, 70.349609375, 73.359375, 76.369140625, 79.37890625, 82.388671875, 85.3984375, 88.408203125, 91.41796875, 94.427734375, 97.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 8.0, 12.0, 16.0, 17.0, 24.0, 33.0, 33.0, 28.0, 34.0, 41.0, 28.0, 36.0, 43.0, 54.0, 49.0, 39.0, 39.0, 42.0, 43.0, 46.0, 37.0, 40.0, 35.0, 32.0, 34.0, 19.0, 18.0, 24.0, 15.0, 11.0, 11.0, 8.0, 9.0, 11.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-93.0, -90.3916015625, -87.783203125, -85.1748046875, -82.56640625, -79.9580078125, -77.349609375, -74.7412109375, -72.1328125, -69.5244140625, -66.916015625, -64.3076171875, -61.69921875, -59.0908203125, -56.482421875, -53.8740234375, -51.265625, -48.6572265625, -46.048828125, -43.4404296875, -40.83203125, -38.2236328125, -35.615234375, -33.0068359375, -30.3984375, -27.7900390625, -25.181640625, -22.5732421875, -19.96484375, -17.3564453125, -14.748046875, -12.1396484375, -9.53125, -6.9228515625, -4.314453125, -1.7060546875, 0.90234375, 3.5107421875, 6.119140625, 8.7275390625, 11.3359375, 13.9443359375, 16.552734375, 19.1611328125, 21.76953125, 24.3779296875, 26.986328125, 29.5947265625, 32.203125, 34.8115234375, 37.419921875, 40.0283203125, 42.63671875, 45.2451171875, 47.853515625, 50.4619140625, 53.0703125, 55.6787109375, 58.287109375, 60.8955078125, 63.50390625, 66.1123046875, 68.720703125, 71.3291015625, 73.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 4.0, 5.0, 1.0, 6.0, 12.0, 16.0, 28.0, 31.0, 38.0, 58.0, 82.0, 120.0, 173.0, 260.0, 403.0, 604.0, 816.0, 1255.0, 1846.0, 2711.0, 4182.0, 6623.0, 10072.0, 15696.0, 24913.0, 39863.0, 63703.0, 104523.0, 167050.0, 211371.0, 147841.0, 90886.0, 56324.0, 34853.0, 22104.0, 14053.0, 8968.0, 5694.0, 3752.0, 2427.0, 1642.0, 1098.0, 739.0, 548.0, 323.0, 269.0, 186.0, 138.0, 73.0, 60.0, 35.0, 29.0, 18.0, 14.0, 10.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-129.375, -125.25, -121.125, -117.0, -112.875, -108.75, -104.625, -100.5, -96.375, -92.25, -88.125, -84.0, -79.875, -75.75, -71.625, -67.5, -63.375, -59.25, -55.125, -51.0, -46.875, -42.75, -38.625, -34.5, -30.375, -26.25, -22.125, -18.0, -13.875, -9.75, -5.625, -1.5, 2.625, 6.75, 10.875, 15.0, 19.125, 23.25, 27.375, 31.5, 35.625, 39.75, 43.875, 48.0, 52.125, 56.25, 60.375, 64.5, 68.625, 72.75, 76.875, 81.0, 85.125, 89.25, 93.375, 97.5, 101.625, 105.75, 109.875, 114.0, 118.125, 122.25, 126.375, 130.5, 134.625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 12.0, 9.0, 13.0, 10.0, 11.0, 12.0, 21.0, 18.0, 27.0, 22.0, 30.0, 24.0, 21.0, 35.0, 31.0, 37.0, 57.0, 33.0, 42.0, 56.0, 51.0, 41.0, 28.0, 36.0, 38.0, 43.0, 30.0, 22.0, 34.0, 19.0, 22.0, 18.0, 17.0, 11.0, 13.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.099609375, -42.57421875, -41.048828125, -39.5234375, -37.998046875, -36.47265625, -34.947265625, -33.421875, -31.896484375, -30.37109375, -28.845703125, -27.3203125, -25.794921875, -24.26953125, -22.744140625, -21.21875, -19.693359375, -18.16796875, -16.642578125, -15.1171875, -13.591796875, -12.06640625, -10.541015625, -9.015625, -7.490234375, -5.96484375, -4.439453125, -2.9140625, -1.388671875, 0.13671875, 1.662109375, 3.1875, 4.712890625, 6.23828125, 7.763671875, 9.2890625, 10.814453125, 12.33984375, 13.865234375, 15.390625, 16.916015625, 18.44140625, 19.966796875, 21.4921875, 23.017578125, 24.54296875, 26.068359375, 27.59375, 29.119140625, 30.64453125, 32.169921875, 33.6953125, 35.220703125, 36.74609375, 38.271484375, 39.796875, 41.322265625, 42.84765625, 44.373046875, 45.8984375, 47.423828125, 48.94921875, 50.474609375, 52.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 21.0, 31.0, 36.0, 54.0, 85.0, 103.0, 169.0, 268.0, 396.0, 570.0, 924.0, 1300.0, 1935.0, 2953.0, 4609.0, 7268.0, 11211.0, 18543.0, 31490.0, 56343.0, 112241.0, 248774.0, 274061.0, 125109.0, 61803.0, 33886.0, 20235.0, 11931.0, 7785.0, 4947.0, 3153.0, 2072.0, 1416.0, 915.0, 616.0, 412.0, 300.0, 176.0, 144.0, 93.0, 62.0, 32.0, 26.0, 13.0, 6.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-34.6875, -33.66943359375, -32.6513671875, -31.63330078125, -30.615234375, -29.59716796875, -28.5791015625, -27.56103515625, -26.54296875, -25.52490234375, -24.5068359375, -23.48876953125, -22.470703125, -21.45263671875, -20.4345703125, -19.41650390625, -18.3984375, -17.38037109375, -16.3623046875, -15.34423828125, -14.326171875, -13.30810546875, -12.2900390625, -11.27197265625, -10.25390625, -9.23583984375, -8.2177734375, -7.19970703125, -6.181640625, -5.16357421875, -4.1455078125, -3.12744140625, -2.109375, -1.09130859375, -0.0732421875, 0.94482421875, 1.962890625, 2.98095703125, 3.9990234375, 5.01708984375, 6.03515625, 7.05322265625, 8.0712890625, 9.08935546875, 10.107421875, 11.12548828125, 12.1435546875, 13.16162109375, 14.1796875, 15.19775390625, 16.2158203125, 17.23388671875, 18.251953125, 19.27001953125, 20.2880859375, 21.30615234375, 22.32421875, 23.34228515625, 24.3603515625, 25.37841796875, 26.396484375, 27.41455078125, 28.4326171875, 29.45068359375, 30.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 10.0, 9.0, 30.0, 32.0, 28.0, 68.0, 75.0, 114.0, 170.0, 127.0, 82.0, 69.0, 51.0, 36.0, 17.0, 17.0, 12.0, 4.0, 8.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00492095947265625, -0.0047539472579956055, -0.004586935043334961, -0.004419922828674316, -0.004252910614013672, -0.004085898399353027, -0.003918886184692383, -0.0037518739700317383, -0.0035848617553710938, -0.0034178495407104492, -0.0032508373260498047, -0.00308382511138916, -0.0029168128967285156, -0.002749800682067871, -0.0025827884674072266, -0.002415776252746582, -0.0022487640380859375, -0.002081751823425293, -0.0019147396087646484, -0.001747727394104004, -0.0015807151794433594, -0.0014137029647827148, -0.0012466907501220703, -0.0010796785354614258, -0.0009126663208007812, -0.0007456541061401367, -0.0005786418914794922, -0.00041162967681884766, -0.0002446174621582031, -7.76052474975586e-05, 8.940696716308594e-05, 0.00025641918182373047, 0.000423431396484375, 0.0005904436111450195, 0.0007574558258056641, 0.0009244680404663086, 0.0010914802551269531, 0.0012584924697875977, 0.0014255046844482422, 0.0015925168991088867, 0.0017595291137695312, 0.0019265413284301758, 0.0020935535430908203, 0.002260565757751465, 0.0024275779724121094, 0.002594590187072754, 0.0027616024017333984, 0.002928614616394043, 0.0030956268310546875, 0.003262639045715332, 0.0034296512603759766, 0.003596663475036621, 0.0037636756896972656, 0.00393068790435791, 0.004097700119018555, 0.004264712333679199, 0.004431724548339844, 0.004598736763000488, 0.004765748977661133, 0.004932761192321777, 0.005099773406982422, 0.005266785621643066, 0.005433797836303711, 0.0056008100509643555, 0.005767822265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 10.0, 13.0, 24.0, 26.0, 55.0, 53.0, 79.0, 145.0, 190.0, 284.0, 373.0, 503.0, 686.0, 1005.0, 1281.0, 1882.0, 2659.0, 3780.0, 5578.0, 8129.0, 12536.0, 19250.0, 30144.0, 50059.0, 89445.0, 168913.0, 255632.0, 168325.0, 89393.0, 49738.0, 30067.0, 19065.0, 12491.0, 8205.0, 5482.0, 3802.0, 2599.0, 1838.0, 1351.0, 896.0, 697.0, 541.0, 409.0, 285.0, 199.0, 134.0, 108.0, 58.0, 40.0, 39.0, 26.0, 11.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0], "bins": [-25.578125, -24.791015625, -24.00390625, -23.216796875, -22.4296875, -21.642578125, -20.85546875, -20.068359375, -19.28125, -18.494140625, -17.70703125, -16.919921875, -16.1328125, -15.345703125, -14.55859375, -13.771484375, -12.984375, -12.197265625, -11.41015625, -10.623046875, -9.8359375, -9.048828125, -8.26171875, -7.474609375, -6.6875, -5.900390625, -5.11328125, -4.326171875, -3.5390625, -2.751953125, -1.96484375, -1.177734375, -0.390625, 0.396484375, 1.18359375, 1.970703125, 2.7578125, 3.544921875, 4.33203125, 5.119140625, 5.90625, 6.693359375, 7.48046875, 8.267578125, 9.0546875, 9.841796875, 10.62890625, 11.416015625, 12.203125, 12.990234375, 13.77734375, 14.564453125, 15.3515625, 16.138671875, 16.92578125, 17.712890625, 18.5, 19.287109375, 20.07421875, 20.861328125, 21.6484375, 22.435546875, 23.22265625, 24.009765625, 24.796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 11.0, 5.0, 5.0, 14.0, 13.0, 15.0, 15.0, 28.0, 25.0, 36.0, 30.0, 41.0, 41.0, 49.0, 61.0, 74.0, 63.0, 67.0, 51.0, 67.0, 41.0, 30.0, 23.0, 30.0, 25.0, 25.0, 16.0, 16.0, 20.0, 5.0, 9.0, 3.0, 3.0, 7.0, 4.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.677490234375, -9.38623046875, -9.094970703125, -8.8037109375, -8.512451171875, -8.22119140625, -7.929931640625, -7.638671875, -7.347412109375, -7.05615234375, -6.764892578125, -6.4736328125, -6.182373046875, -5.89111328125, -5.599853515625, -5.30859375, -5.017333984375, -4.72607421875, -4.434814453125, -4.1435546875, -3.852294921875, -3.56103515625, -3.269775390625, -2.978515625, -2.687255859375, -2.39599609375, -2.104736328125, -1.8134765625, -1.522216796875, -1.23095703125, -0.939697265625, -0.6484375, -0.357177734375, -0.06591796875, 0.225341796875, 0.5166015625, 0.807861328125, 1.09912109375, 1.390380859375, 1.681640625, 1.972900390625, 2.26416015625, 2.555419921875, 2.8466796875, 3.137939453125, 3.42919921875, 3.720458984375, 4.01171875, 4.302978515625, 4.59423828125, 4.885498046875, 5.1767578125, 5.468017578125, 5.75927734375, 6.050537109375, 6.341796875, 6.633056640625, 6.92431640625, 7.215576171875, 7.5068359375, 7.798095703125, 8.08935546875, 8.380615234375, 8.671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 17.0, 14.0, 20.0, 25.0, 27.0, 37.0, 40.0, 40.0, 65.0, 77.0, 86.0, 73.0, 80.0, 78.0, 72.0, 46.0, 32.0, 43.0, 30.0, 16.0, 11.0, 12.0, 11.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-133.5307159423828, -129.7549285888672, -125.9791488647461, -122.20336151123047, -118.42757415771484, -114.65179443359375, -110.87600708007812, -107.1002197265625, -103.32443237304688, -99.54864501953125, -95.77286529541016, -91.99707794189453, -88.2212905883789, -84.44551086425781, -80.66972351074219, -76.89393615722656, -73.11815643310547, -69.34236907958984, -65.56658935546875, -61.790802001953125, -58.0150146484375, -54.23923110961914, -50.46344757080078, -46.687660217285156, -42.9118766784668, -39.13609313964844, -35.36030578613281, -31.584522247314453, -27.80873680114746, -24.03295135498047, -20.25716781616211, -16.481382369995117, -12.705589294433594, -8.929803848266602, -5.154019355773926, -1.37823486328125, 2.397550582885742, 6.173336029052734, 9.949119567871094, 13.724905014038086, 17.500690460205078, 21.27647590637207, 25.052261352539062, 28.828044891357422, 32.60382843017578, 36.379615783691406, 40.155399322509766, 43.931182861328125, 47.70697021484375, 51.48275375366211, 55.258541107177734, 59.034324645996094, 62.81011199951172, 66.58589172363281, 70.36167907714844, 74.13746643066406, 77.91325378417969, 81.68904113769531, 85.4648208618164, 89.24060821533203, 93.01639556884766, 96.79217529296875, 100.56796264648438, 104.34375, 108.1195297241211]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 14.0, 8.0, 10.0, 11.0, 18.0, 24.0, 15.0, 20.0, 22.0, 27.0, 35.0, 36.0, 34.0, 40.0, 58.0, 35.0, 50.0, 37.0, 34.0, 32.0, 52.0, 38.0, 48.0, 31.0, 25.0, 35.0, 28.0, 32.0, 17.0, 17.0, 17.0, 14.0, 10.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-87.68623352050781, -85.16998291015625, -82.65373992919922, -80.13748931884766, -77.62124633789062, -75.10499572753906, -72.58875274658203, -70.07250213623047, -67.55625915527344, -65.04000854492188, -62.523765563964844, -60.00751876831055, -57.49127197265625, -54.97502136230469, -52.45877456665039, -49.942527770996094, -47.42627716064453, -44.910030364990234, -42.39378356933594, -39.87753677368164, -37.361289978027344, -34.84503936767578, -32.328792572021484, -29.812545776367188, -27.29629898071289, -24.780052185058594, -22.263805389404297, -19.747556686401367, -17.23130989074707, -14.715063095092773, -12.19881534576416, -9.682567596435547, -7.166313171386719, -4.650065898895264, -2.1338186264038086, 0.3824286460876465, 2.8986759185791016, 5.414922714233398, 7.931170463562012, 10.447418212890625, 12.963665008544922, 15.479911804199219, 17.996158599853516, 20.512407302856445, 23.028654098510742, 25.54490089416504, 28.06114959716797, 30.577396392822266, 33.09364318847656, 35.60988998413086, 38.126136779785156, 40.64238357543945, 43.15863037109375, 45.67488098144531, 48.19112777709961, 50.707374572753906, 53.2236213684082, 55.7398681640625, 58.2561149597168, 60.772361755371094, 63.288612365722656, 65.80485534667969, 68.32110595703125, 70.83735656738281, 73.35359954833984]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 19.0, 14.0, 29.0, 32.0, 55.0, 74.0, 103.0, 119.0, 210.0, 282.0, 412.0, 556.0, 895.0, 1187.0, 1883.0, 2776.0, 4309.0, 6704.0, 10315.0, 17003.0, 28306.0, 48684.0, 88053.0, 187379.0, 630551.0, 1835347.0, 857478.0, 225933.0, 101559.0, 55886.0, 32868.0, 19804.0, 12638.0, 8068.0, 5071.0, 3309.0, 2185.0, 1377.0, 940.0, 616.0, 411.0, 274.0, 193.0, 130.0, 78.0, 56.0, 38.0, 23.0, 8.0, 7.0, 13.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0], "bins": [-133.75, -129.6484375, -125.546875, -121.4453125, -117.34375, -113.2421875, -109.140625, -105.0390625, -100.9375, -96.8359375, -92.734375, -88.6328125, -84.53125, -80.4296875, -76.328125, -72.2265625, -68.125, -64.0234375, -59.921875, -55.8203125, -51.71875, -47.6171875, -43.515625, -39.4140625, -35.3125, -31.2109375, -27.109375, -23.0078125, -18.90625, -14.8046875, -10.703125, -6.6015625, -2.5, 1.6015625, 5.703125, 9.8046875, 13.90625, 18.0078125, 22.109375, 26.2109375, 30.3125, 34.4140625, 38.515625, 42.6171875, 46.71875, 50.8203125, 54.921875, 59.0234375, 63.125, 67.2265625, 71.328125, 75.4296875, 79.53125, 83.6328125, 87.734375, 91.8359375, 95.9375, 100.0390625, 104.140625, 108.2421875, 112.34375, 116.4453125, 120.546875, 124.6484375, 128.75]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 14.0, 11.0, 11.0, 20.0, 20.0, 22.0, 17.0, 32.0, 26.0, 26.0, 38.0, 52.0, 47.0, 46.0, 47.0, 42.0, 46.0, 32.0, 48.0, 42.0, 36.0, 39.0, 33.0, 37.0, 30.0, 24.0, 31.0, 16.0, 16.0, 18.0, 15.0, 9.0, 12.0, 9.0, 2.0, 3.0, 5.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-72.25, -70.15234375, -68.0546875, -65.95703125, -63.859375, -61.76171875, -59.6640625, -57.56640625, -55.46875, -53.37109375, -51.2734375, -49.17578125, -47.078125, -44.98046875, -42.8828125, -40.78515625, -38.6875, -36.58984375, -34.4921875, -32.39453125, -30.296875, -28.19921875, -26.1015625, -24.00390625, -21.90625, -19.80859375, -17.7109375, -15.61328125, -13.515625, -11.41796875, -9.3203125, -7.22265625, -5.125, -3.02734375, -0.9296875, 1.16796875, 3.265625, 5.36328125, 7.4609375, 9.55859375, 11.65625, 13.75390625, 15.8515625, 17.94921875, 20.046875, 22.14453125, 24.2421875, 26.33984375, 28.4375, 30.53515625, 32.6328125, 34.73046875, 36.828125, 38.92578125, 41.0234375, 43.12109375, 45.21875, 47.31640625, 49.4140625, 51.51171875, 53.609375, 55.70703125, 57.8046875, 59.90234375, 62.0]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 19.0, 17.0, 40.0, 50.0, 89.0, 114.0, 193.0, 280.0, 424.0, 602.0, 905.0, 1415.0, 2100.0, 3419.0, 5309.0, 8701.0, 13909.0, 23288.0, 40078.0, 72269.0, 138113.0, 291672.0, 795463.0, 1711127.0, 583313.0, 235998.0, 115113.0, 61729.0, 34852.0, 20393.0, 12335.0, 7590.0, 4657.0, 3061.0, 1885.0, 1269.0, 812.0, 571.0, 349.0, 246.0, 159.0, 101.0, 82.0, 44.0, 29.0, 29.0, 19.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-115.5, -111.931640625, -108.36328125, -104.794921875, -101.2265625, -97.658203125, -94.08984375, -90.521484375, -86.953125, -83.384765625, -79.81640625, -76.248046875, -72.6796875, -69.111328125, -65.54296875, -61.974609375, -58.40625, -54.837890625, -51.26953125, -47.701171875, -44.1328125, -40.564453125, -36.99609375, -33.427734375, -29.859375, -26.291015625, -22.72265625, -19.154296875, -15.5859375, -12.017578125, -8.44921875, -4.880859375, -1.3125, 2.255859375, 5.82421875, 9.392578125, 12.9609375, 16.529296875, 20.09765625, 23.666015625, 27.234375, 30.802734375, 34.37109375, 37.939453125, 41.5078125, 45.076171875, 48.64453125, 52.212890625, 55.78125, 59.349609375, 62.91796875, 66.486328125, 70.0546875, 73.623046875, 77.19140625, 80.759765625, 84.328125, 87.896484375, 91.46484375, 95.033203125, 98.6015625, 102.169921875, 105.73828125, 109.306640625, 112.875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 6.0, 10.0, 9.0, 14.0, 20.0, 19.0, 21.0, 30.0, 34.0, 35.0, 45.0, 62.0, 86.0, 87.0, 117.0, 158.0, 162.0, 239.0, 259.0, 396.0, 427.0, 376.0, 284.0, 231.0, 190.0, 127.0, 121.0, 113.0, 83.0, 68.0, 47.0, 36.0, 32.0, 23.0, 27.0, 12.0, 11.0, 9.0, 8.0, 16.0, 11.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.53125, -34.4033203125, -33.275390625, -32.1474609375, -31.01953125, -29.8916015625, -28.763671875, -27.6357421875, -26.5078125, -25.3798828125, -24.251953125, -23.1240234375, -21.99609375, -20.8681640625, -19.740234375, -18.6123046875, -17.484375, -16.3564453125, -15.228515625, -14.1005859375, -12.97265625, -11.8447265625, -10.716796875, -9.5888671875, -8.4609375, -7.3330078125, -6.205078125, -5.0771484375, -3.94921875, -2.8212890625, -1.693359375, -0.5654296875, 0.5625, 1.6904296875, 2.818359375, 3.9462890625, 5.07421875, 6.2021484375, 7.330078125, 8.4580078125, 9.5859375, 10.7138671875, 11.841796875, 12.9697265625, 14.09765625, 15.2255859375, 16.353515625, 17.4814453125, 18.609375, 19.7373046875, 20.865234375, 21.9931640625, 23.12109375, 24.2490234375, 25.376953125, 26.5048828125, 27.6328125, 28.7607421875, 29.888671875, 31.0166015625, 32.14453125, 33.2724609375, 34.400390625, 35.5283203125, 36.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 5.0, 20.0, 24.0, 27.0, 39.0, 28.0, 41.0, 41.0, 66.0, 80.0, 75.0, 93.0, 101.0, 62.0, 61.0, 46.0, 34.0, 31.0, 28.0, 20.0, 13.0, 13.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-138.45950317382812, -134.84710693359375, -131.2346954345703, -127.6222915649414, -124.0098876953125, -120.3974838256836, -116.78507995605469, -113.17267608642578, -109.56027221679688, -105.94786834716797, -102.33546447753906, -98.72306060791016, -95.11065673828125, -91.49825286865234, -87.88584899902344, -84.27344512939453, -80.66104125976562, -77.04863739013672, -73.43623352050781, -69.8238296508789, -66.21142578125, -62.599021911621094, -58.98661804199219, -55.37421417236328, -51.761810302734375, -48.14940643310547, -44.53700256347656, -40.924598693847656, -37.31219482421875, -33.699790954589844, -30.087387084960938, -26.47498321533203, -22.862579345703125, -19.25017547607422, -15.637771606445312, -12.025367736816406, -8.4129638671875, -4.800559997558594, -1.1881561279296875, 2.4242477416992188, 6.036651611328125, 9.649055480957031, 13.261459350585938, 16.873863220214844, 20.48626708984375, 24.098670959472656, 27.711074829101562, 31.32347869873047, 34.935882568359375, 38.54828643798828, 42.16069030761719, 45.773094177246094, 49.385498046875, 52.997901916503906, 56.61030578613281, 60.22270965576172, 63.835113525390625, 67.44751739501953, 71.05992126464844, 74.67232513427734, 78.28472900390625, 81.89713287353516, 85.50953674316406, 89.12194061279297, 92.73434448242188]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 10.0, 8.0, 7.0, 14.0, 22.0, 21.0, 29.0, 28.0, 23.0, 28.0, 37.0, 30.0, 36.0, 54.0, 43.0, 43.0, 52.0, 48.0, 48.0, 43.0, 36.0, 32.0, 33.0, 30.0, 32.0, 32.0, 30.0, 15.0, 16.0, 16.0, 15.0, 13.0, 11.0, 10.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.64378356933594, -71.24819946289062, -68.85261535644531, -66.45703887939453, -64.06145477294922, -61.665870666503906, -59.270286560058594, -56.87470245361328, -54.479122161865234, -52.08353805541992, -49.687957763671875, -47.29237365722656, -44.89678955078125, -42.5012092590332, -40.10562515258789, -37.710044860839844, -35.31446075439453, -32.91887664794922, -30.523296356201172, -28.12771224975586, -25.73213005065918, -23.3365478515625, -20.940963745117188, -18.545381546020508, -16.149799346923828, -13.754217147827148, -11.358633995056152, -8.963050842285156, -6.567468643188477, -4.171886444091797, -1.7763032913208008, 0.6192798614501953, 3.0148544311523438, 5.410437107086182, 7.8060197830200195, 10.201602935791016, 12.597185134887695, 14.992767333984375, 17.388351440429688, 19.783933639526367, 22.179515838623047, 24.575098037719727, 26.970680236816406, 29.36626434326172, 31.7618465423584, 34.15742874145508, 36.55301284790039, 38.94859313964844, 41.34417724609375, 43.73976135253906, 46.13534164428711, 48.53092575073242, 50.92650604248047, 53.32209014892578, 55.717674255371094, 58.113258361816406, 60.50883865356445, 62.904422760009766, 65.30000305175781, 67.69558715820312, 70.09117126464844, 72.48675537109375, 74.88233184814453, 77.27791595458984, 79.67350006103516]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 14.0, 21.0, 33.0, 41.0, 58.0, 69.0, 122.0, 198.0, 276.0, 397.0, 624.0, 912.0, 1322.0, 1827.0, 2915.0, 4343.0, 6503.0, 9940.0, 15338.0, 23651.0, 36824.0, 58933.0, 93955.0, 150048.0, 202967.0, 160531.0, 101126.0, 62567.0, 39714.0, 25510.0, 16402.0, 10563.0, 6899.0, 4569.0, 3042.0, 2045.0, 1306.0, 932.0, 638.0, 464.0, 291.0, 180.0, 142.0, 113.0, 68.0, 33.0, 22.0, 22.0, 19.0, 6.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-97.5625, -94.47265625, -91.3828125, -88.29296875, -85.203125, -82.11328125, -79.0234375, -75.93359375, -72.84375, -69.75390625, -66.6640625, -63.57421875, -60.484375, -57.39453125, -54.3046875, -51.21484375, -48.125, -45.03515625, -41.9453125, -38.85546875, -35.765625, -32.67578125, -29.5859375, -26.49609375, -23.40625, -20.31640625, -17.2265625, -14.13671875, -11.046875, -7.95703125, -4.8671875, -1.77734375, 1.3125, 4.40234375, 7.4921875, 10.58203125, 13.671875, 16.76171875, 19.8515625, 22.94140625, 26.03125, 29.12109375, 32.2109375, 35.30078125, 38.390625, 41.48046875, 44.5703125, 47.66015625, 50.75, 53.83984375, 56.9296875, 60.01953125, 63.109375, 66.19921875, 69.2890625, 72.37890625, 75.46875, 78.55859375, 81.6484375, 84.73828125, 87.828125, 90.91796875, 94.0078125, 97.09765625, 100.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 1.0, 6.0, 7.0, 8.0, 11.0, 15.0, 14.0, 19.0, 31.0, 25.0, 28.0, 35.0, 26.0, 36.0, 49.0, 52.0, 34.0, 49.0, 52.0, 57.0, 56.0, 36.0, 37.0, 28.0, 43.0, 32.0, 34.0, 33.0, 25.0, 17.0, 17.0, 13.0, 13.0, 11.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5625, -62.53515625, -60.5078125, -58.48046875, -56.453125, -54.42578125, -52.3984375, -50.37109375, -48.34375, -46.31640625, -44.2890625, -42.26171875, -40.234375, -38.20703125, -36.1796875, -34.15234375, -32.125, -30.09765625, -28.0703125, -26.04296875, -24.015625, -21.98828125, -19.9609375, -17.93359375, -15.90625, -13.87890625, -11.8515625, -9.82421875, -7.796875, -5.76953125, -3.7421875, -1.71484375, 0.3125, 2.33984375, 4.3671875, 6.39453125, 8.421875, 10.44921875, 12.4765625, 14.50390625, 16.53125, 18.55859375, 20.5859375, 22.61328125, 24.640625, 26.66796875, 28.6953125, 30.72265625, 32.75, 34.77734375, 36.8046875, 38.83203125, 40.859375, 42.88671875, 44.9140625, 46.94140625, 48.96875, 50.99609375, 53.0234375, 55.05078125, 57.078125, 59.10546875, 61.1328125, 63.16015625, 65.1875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 15.0, 14.0, 26.0, 29.0, 51.0, 71.0, 89.0, 134.0, 204.0, 268.0, 452.0, 605.0, 999.0, 1445.0, 2177.0, 3375.0, 5440.0, 8817.0, 14969.0, 26013.0, 47212.0, 91576.0, 193380.0, 301798.0, 167041.0, 80722.0, 42159.0, 23484.0, 13572.0, 8147.0, 4956.0, 3176.0, 2060.0, 1354.0, 881.0, 593.0, 375.0, 281.0, 208.0, 131.0, 84.0, 70.0, 40.0, 21.0, 16.0, 11.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-169.5, -164.26953125, -159.0390625, -153.80859375, -148.578125, -143.34765625, -138.1171875, -132.88671875, -127.65625, -122.42578125, -117.1953125, -111.96484375, -106.734375, -101.50390625, -96.2734375, -91.04296875, -85.8125, -80.58203125, -75.3515625, -70.12109375, -64.890625, -59.66015625, -54.4296875, -49.19921875, -43.96875, -38.73828125, -33.5078125, -28.27734375, -23.046875, -17.81640625, -12.5859375, -7.35546875, -2.125, 3.10546875, 8.3359375, 13.56640625, 18.796875, 24.02734375, 29.2578125, 34.48828125, 39.71875, 44.94921875, 50.1796875, 55.41015625, 60.640625, 65.87109375, 71.1015625, 76.33203125, 81.5625, 86.79296875, 92.0234375, 97.25390625, 102.484375, 107.71484375, 112.9453125, 118.17578125, 123.40625, 128.63671875, 133.8671875, 139.09765625, 144.328125, 149.55859375, 154.7890625, 160.01953125, 165.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 7.0, 8.0, 14.0, 14.0, 14.0, 25.0, 21.0, 16.0, 27.0, 38.0, 37.0, 28.0, 42.0, 46.0, 37.0, 41.0, 45.0, 43.0, 33.0, 51.0, 34.0, 37.0, 35.0, 34.0, 43.0, 24.0, 22.0, 25.0, 23.0, 13.0, 15.0, 16.0, 12.0, 9.0, 6.0, 8.0, 5.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-56.5625, -54.79833984375, -53.0341796875, -51.27001953125, -49.505859375, -47.74169921875, -45.9775390625, -44.21337890625, -42.44921875, -40.68505859375, -38.9208984375, -37.15673828125, -35.392578125, -33.62841796875, -31.8642578125, -30.10009765625, -28.3359375, -26.57177734375, -24.8076171875, -23.04345703125, -21.279296875, -19.51513671875, -17.7509765625, -15.98681640625, -14.22265625, -12.45849609375, -10.6943359375, -8.93017578125, -7.166015625, -5.40185546875, -3.6376953125, -1.87353515625, -0.109375, 1.65478515625, 3.4189453125, 5.18310546875, 6.947265625, 8.71142578125, 10.4755859375, 12.23974609375, 14.00390625, 15.76806640625, 17.5322265625, 19.29638671875, 21.060546875, 22.82470703125, 24.5888671875, 26.35302734375, 28.1171875, 29.88134765625, 31.6455078125, 33.40966796875, 35.173828125, 36.93798828125, 38.7021484375, 40.46630859375, 42.23046875, 43.99462890625, 45.7587890625, 47.52294921875, 49.287109375, 51.05126953125, 52.8154296875, 54.57958984375, 56.34375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 7.0, 19.0, 22.0, 36.0, 50.0, 72.0, 108.0, 169.0, 198.0, 375.0, 600.0, 883.0, 1375.0, 2328.0, 3837.0, 6596.0, 12337.0, 26910.0, 79133.0, 524016.0, 285298.0, 57454.0, 21479.0, 10566.0, 5634.0, 3358.0, 2069.0, 1290.0, 849.0, 532.0, 327.0, 205.0, 138.0, 82.0, 72.0, 48.0, 25.0, 16.0, 7.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-88.6875, -86.0693359375, -83.451171875, -80.8330078125, -78.21484375, -75.5966796875, -72.978515625, -70.3603515625, -67.7421875, -65.1240234375, -62.505859375, -59.8876953125, -57.26953125, -54.6513671875, -52.033203125, -49.4150390625, -46.796875, -44.1787109375, -41.560546875, -38.9423828125, -36.32421875, -33.7060546875, -31.087890625, -28.4697265625, -25.8515625, -23.2333984375, -20.615234375, -17.9970703125, -15.37890625, -12.7607421875, -10.142578125, -7.5244140625, -4.90625, -2.2880859375, 0.330078125, 2.9482421875, 5.56640625, 8.1845703125, 10.802734375, 13.4208984375, 16.0390625, 18.6572265625, 21.275390625, 23.8935546875, 26.51171875, 29.1298828125, 31.748046875, 34.3662109375, 36.984375, 39.6025390625, 42.220703125, 44.8388671875, 47.45703125, 50.0751953125, 52.693359375, 55.3115234375, 57.9296875, 60.5478515625, 63.166015625, 65.7841796875, 68.40234375, 71.0205078125, 73.638671875, 76.2568359375, 78.875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 19.0, 24.0, 52.0, 98.0, 225.0, 281.0, 89.0, 72.0, 40.0, 12.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012359619140625, -0.011920452117919922, -0.011481285095214844, -0.011042118072509766, -0.010602951049804688, -0.01016378402709961, -0.009724617004394531, -0.009285449981689453, -0.008846282958984375, -0.008407115936279297, -0.007967948913574219, -0.007528781890869141, -0.0070896148681640625, -0.006650447845458984, -0.006211280822753906, -0.005772113800048828, -0.00533294677734375, -0.004893779754638672, -0.004454612731933594, -0.004015445709228516, -0.0035762786865234375, -0.0031371116638183594, -0.0026979446411132812, -0.002258777618408203, -0.001819610595703125, -0.0013804435729980469, -0.0009412765502929688, -0.0005021095275878906, -6.29425048828125e-05, 0.0003762245178222656, 0.0008153915405273438, 0.0012545585632324219, 0.0016937255859375, 0.002132892608642578, 0.0025720596313476562, 0.0030112266540527344, 0.0034503936767578125, 0.0038895606994628906, 0.004328727722167969, 0.004767894744873047, 0.005207061767578125, 0.005646228790283203, 0.006085395812988281, 0.006524562835693359, 0.0069637298583984375, 0.007402896881103516, 0.007842063903808594, 0.008281230926513672, 0.00872039794921875, 0.009159564971923828, 0.009598731994628906, 0.010037899017333984, 0.010477066040039062, 0.01091623306274414, 0.011355400085449219, 0.011794567108154297, 0.012233734130859375, 0.012672901153564453, 0.013112068176269531, 0.01355123519897461, 0.013990402221679688, 0.014429569244384766, 0.014868736267089844, 0.015307903289794922, 0.0157470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 13.0, 11.0, 18.0, 18.0, 37.0, 50.0, 56.0, 118.0, 166.0, 231.0, 381.0, 534.0, 854.0, 1202.0, 1742.0, 2720.0, 4026.0, 5883.0, 9786.0, 17114.0, 32652.0, 81597.0, 320462.0, 393386.0, 92535.0, 35811.0, 17655.0, 10295.0, 6364.0, 4159.0, 2898.0, 1953.0, 1228.0, 845.0, 603.0, 377.0, 224.0, 169.0, 115.0, 84.0, 53.0, 33.0, 31.0, 19.0, 17.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-73.6875, -71.388671875, -69.08984375, -66.791015625, -64.4921875, -62.193359375, -59.89453125, -57.595703125, -55.296875, -52.998046875, -50.69921875, -48.400390625, -46.1015625, -43.802734375, -41.50390625, -39.205078125, -36.90625, -34.607421875, -32.30859375, -30.009765625, -27.7109375, -25.412109375, -23.11328125, -20.814453125, -18.515625, -16.216796875, -13.91796875, -11.619140625, -9.3203125, -7.021484375, -4.72265625, -2.423828125, -0.125, 2.173828125, 4.47265625, 6.771484375, 9.0703125, 11.369140625, 13.66796875, 15.966796875, 18.265625, 20.564453125, 22.86328125, 25.162109375, 27.4609375, 29.759765625, 32.05859375, 34.357421875, 36.65625, 38.955078125, 41.25390625, 43.552734375, 45.8515625, 48.150390625, 50.44921875, 52.748046875, 55.046875, 57.345703125, 59.64453125, 61.943359375, 64.2421875, 66.541015625, 68.83984375, 71.138671875, 73.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 8.0, 6.0, 5.0, 6.0, 13.0, 16.0, 24.0, 29.0, 28.0, 50.0, 63.0, 83.0, 123.0, 141.0, 78.0, 66.0, 46.0, 29.0, 34.0, 30.0, 21.0, 15.0, 8.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.52734375, -17.8203125, -17.11328125, -16.40625, -15.69921875, -14.9921875, -14.28515625, -13.578125, -12.87109375, -12.1640625, -11.45703125, -10.75, -10.04296875, -9.3359375, -8.62890625, -7.921875, -7.21484375, -6.5078125, -5.80078125, -5.09375, -4.38671875, -3.6796875, -2.97265625, -2.265625, -1.55859375, -0.8515625, -0.14453125, 0.5625, 1.26953125, 1.9765625, 2.68359375, 3.390625, 4.09765625, 4.8046875, 5.51171875, 6.21875, 6.92578125, 7.6328125, 8.33984375, 9.046875, 9.75390625, 10.4609375, 11.16796875, 11.875, 12.58203125, 13.2890625, 13.99609375, 14.703125, 15.41015625, 16.1171875, 16.82421875, 17.53125, 18.23828125, 18.9453125, 19.65234375, 20.359375, 21.06640625, 21.7734375, 22.48046875, 23.1875, 23.89453125, 24.6015625, 25.30859375, 26.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 8.0, 10.0, 13.0, 22.0, 28.0, 41.0, 52.0, 77.0, 106.0, 129.0, 123.0, 121.0, 73.0, 54.0, 46.0, 29.0, 23.0, 19.0, 14.0, 8.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.34735107421875, -130.0435333251953, -125.73973083496094, -121.4359130859375, -117.1321029663086, -112.82829284667969, -108.52448272705078, -104.22067260742188, -99.91685485839844, -95.61304473876953, -91.30923461914062, -87.00541687011719, -82.70160675048828, -78.39779663085938, -74.09398651123047, -69.79017639160156, -65.48636627197266, -61.18255615234375, -56.87874221801758, -52.57493209838867, -48.2711181640625, -43.967308044433594, -39.66349792480469, -35.35968780517578, -31.05587387084961, -26.75206184387207, -22.44824981689453, -18.144439697265625, -13.840627670288086, -9.536815643310547, -5.233005523681641, -0.9291934967041016, 3.3746185302734375, 7.678430080413818, 11.9822416305542, 16.286052703857422, 20.58986473083496, 24.8936767578125, 29.197486877441406, 33.50129699707031, 37.805110931396484, 42.10892105102539, 46.41273498535156, 50.71654510498047, 55.020355224609375, 59.32416915893555, 63.62797927856445, 67.93179321289062, 72.23560333251953, 76.53941345214844, 80.84322357177734, 85.14703369140625, 89.45085144042969, 93.7546615600586, 98.0584716796875, 102.3622817993164, 106.66609191894531, 110.96990203857422, 115.27371215820312, 119.57752990722656, 123.88134002685547, 128.18515014648438, 132.48895263671875, 136.7927703857422, 141.09658813476562]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 11.0, 0.0, 2.0, 7.0, 7.0, 10.0, 7.0, 14.0, 14.0, 12.0, 23.0, 32.0, 28.0, 33.0, 34.0, 41.0, 29.0, 42.0, 36.0, 51.0, 47.0, 51.0, 44.0, 39.0, 40.0, 42.0, 30.0, 33.0, 29.0, 30.0, 27.0, 28.0, 22.0, 17.0, 12.0, 16.0, 7.0, 8.0, 14.0, 11.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.6181526184082, -61.656272888183594, -59.694393157958984, -57.732513427734375, -55.770633697509766, -53.808753967285156, -51.84687423706055, -49.88499450683594, -47.92311477661133, -45.96123504638672, -43.99935531616211, -42.0374755859375, -40.07559585571289, -38.11371612548828, -36.15183639526367, -34.18995666503906, -32.22807693481445, -30.266197204589844, -28.304317474365234, -26.342437744140625, -24.380558013916016, -22.418678283691406, -20.456798553466797, -18.494918823242188, -16.533039093017578, -14.571159362792969, -12.60927963256836, -10.64739990234375, -8.68552017211914, -6.723640441894531, -4.761760711669922, -2.7998809814453125, -0.8380050659179688, 1.1238746643066406, 3.08575439453125, 5.047634124755859, 7.009513854980469, 8.971393585205078, 10.933273315429688, 12.895153045654297, 14.857032775878906, 16.818912506103516, 18.780792236328125, 20.742671966552734, 22.704551696777344, 24.666431427001953, 26.628311157226562, 28.590190887451172, 30.55207061767578, 32.51395034790039, 34.475830078125, 36.43770980834961, 38.39958953857422, 40.36146926879883, 42.32334899902344, 44.28522872924805, 46.247108459472656, 48.208988189697266, 50.170867919921875, 52.132747650146484, 54.094627380371094, 56.0565071105957, 58.01838684082031, 59.98026657104492, 61.94214630126953]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 12.0, 16.0, 19.0, 34.0, 46.0, 61.0, 98.0, 141.0, 229.0, 331.0, 459.0, 718.0, 1187.0, 1768.0, 2722.0, 4268.0, 6802.0, 10662.0, 17295.0, 28020.0, 46306.0, 76621.0, 127731.0, 204091.0, 201055.0, 124722.0, 74656.0, 45253.0, 27464.0, 16742.0, 10535.0, 6455.0, 4175.0, 2676.0, 1787.0, 1200.0, 748.0, 482.0, 333.0, 203.0, 138.0, 109.0, 66.0, 41.0, 27.0, 19.0, 10.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0], "bins": [-75.1875, -72.974609375, -70.76171875, -68.548828125, -66.3359375, -64.123046875, -61.91015625, -59.697265625, -57.484375, -55.271484375, -53.05859375, -50.845703125, -48.6328125, -46.419921875, -44.20703125, -41.994140625, -39.78125, -37.568359375, -35.35546875, -33.142578125, -30.9296875, -28.716796875, -26.50390625, -24.291015625, -22.078125, -19.865234375, -17.65234375, -15.439453125, -13.2265625, -11.013671875, -8.80078125, -6.587890625, -4.375, -2.162109375, 0.05078125, 2.263671875, 4.4765625, 6.689453125, 8.90234375, 11.115234375, 13.328125, 15.541015625, 17.75390625, 19.966796875, 22.1796875, 24.392578125, 26.60546875, 28.818359375, 31.03125, 33.244140625, 35.45703125, 37.669921875, 39.8828125, 42.095703125, 44.30859375, 46.521484375, 48.734375, 50.947265625, 53.16015625, 55.373046875, 57.5859375, 59.798828125, 62.01171875, 64.224609375, 66.4375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 1.0, 4.0, 2.0, 5.0, 11.0, 6.0, 10.0, 15.0, 12.0, 26.0, 22.0, 22.0, 30.0, 31.0, 39.0, 41.0, 33.0, 35.0, 47.0, 44.0, 54.0, 45.0, 36.0, 39.0, 48.0, 31.0, 45.0, 40.0, 28.0, 30.0, 23.0, 23.0, 17.0, 20.0, 16.0, 12.0, 9.0, 4.0, 3.0, 12.0, 9.0, 1.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0625, -52.27001953125, -50.4775390625, -48.68505859375, -46.892578125, -45.10009765625, -43.3076171875, -41.51513671875, -39.72265625, -37.93017578125, -36.1376953125, -34.34521484375, -32.552734375, -30.76025390625, -28.9677734375, -27.17529296875, -25.3828125, -23.59033203125, -21.7978515625, -20.00537109375, -18.212890625, -16.42041015625, -14.6279296875, -12.83544921875, -11.04296875, -9.25048828125, -7.4580078125, -5.66552734375, -3.873046875, -2.08056640625, -0.2880859375, 1.50439453125, 3.296875, 5.08935546875, 6.8818359375, 8.67431640625, 10.466796875, 12.25927734375, 14.0517578125, 15.84423828125, 17.63671875, 19.42919921875, 21.2216796875, 23.01416015625, 24.806640625, 26.59912109375, 28.3916015625, 30.18408203125, 31.9765625, 33.76904296875, 35.5615234375, 37.35400390625, 39.146484375, 40.93896484375, 42.7314453125, 44.52392578125, 46.31640625, 48.10888671875, 49.9013671875, 51.69384765625, 53.486328125, 55.27880859375, 57.0712890625, 58.86376953125, 60.65625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 10.0, 9.0, 21.0, 27.0, 31.0, 77.0, 86.0, 131.0, 172.0, 243.0, 413.0, 520.0, 748.0, 1167.0, 1663.0, 2524.0, 3729.0, 5382.0, 8103.0, 12290.0, 19038.0, 29361.0, 46655.0, 74970.0, 124149.0, 192016.0, 191574.0, 124685.0, 75751.0, 46728.0, 29480.0, 18988.0, 12366.0, 8323.0, 5386.0, 3740.0, 2551.0, 1738.0, 1135.0, 827.0, 543.0, 394.0, 262.0, 174.0, 109.0, 87.0, 67.0, 37.0, 33.0, 15.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-99.4375, -96.4248046875, -93.412109375, -90.3994140625, -87.38671875, -84.3740234375, -81.361328125, -78.3486328125, -75.3359375, -72.3232421875, -69.310546875, -66.2978515625, -63.28515625, -60.2724609375, -57.259765625, -54.2470703125, -51.234375, -48.2216796875, -45.208984375, -42.1962890625, -39.18359375, -36.1708984375, -33.158203125, -30.1455078125, -27.1328125, -24.1201171875, -21.107421875, -18.0947265625, -15.08203125, -12.0693359375, -9.056640625, -6.0439453125, -3.03125, -0.0185546875, 2.994140625, 6.0068359375, 9.01953125, 12.0322265625, 15.044921875, 18.0576171875, 21.0703125, 24.0830078125, 27.095703125, 30.1083984375, 33.12109375, 36.1337890625, 39.146484375, 42.1591796875, 45.171875, 48.1845703125, 51.197265625, 54.2099609375, 57.22265625, 60.2353515625, 63.248046875, 66.2607421875, 69.2734375, 72.2861328125, 75.298828125, 78.3115234375, 81.32421875, 84.3369140625, 87.349609375, 90.3623046875, 93.375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 5.0, 5.0, 14.0, 16.0, 16.0, 10.0, 20.0, 25.0, 31.0, 25.0, 25.0, 27.0, 32.0, 32.0, 32.0, 38.0, 38.0, 36.0, 38.0, 37.0, 49.0, 36.0, 22.0, 34.0, 34.0, 35.0, 36.0, 31.0, 26.0, 27.0, 14.0, 18.0, 22.0, 13.0, 11.0, 13.0, 8.0, 9.0, 9.0, 5.0, 13.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-38.84375, -37.69384765625, -36.5439453125, -35.39404296875, -34.244140625, -33.09423828125, -31.9443359375, -30.79443359375, -29.64453125, -28.49462890625, -27.3447265625, -26.19482421875, -25.044921875, -23.89501953125, -22.7451171875, -21.59521484375, -20.4453125, -19.29541015625, -18.1455078125, -16.99560546875, -15.845703125, -14.69580078125, -13.5458984375, -12.39599609375, -11.24609375, -10.09619140625, -8.9462890625, -7.79638671875, -6.646484375, -5.49658203125, -4.3466796875, -3.19677734375, -2.046875, -0.89697265625, 0.2529296875, 1.40283203125, 2.552734375, 3.70263671875, 4.8525390625, 6.00244140625, 7.15234375, 8.30224609375, 9.4521484375, 10.60205078125, 11.751953125, 12.90185546875, 14.0517578125, 15.20166015625, 16.3515625, 17.50146484375, 18.6513671875, 19.80126953125, 20.951171875, 22.10107421875, 23.2509765625, 24.40087890625, 25.55078125, 26.70068359375, 27.8505859375, 29.00048828125, 30.150390625, 31.30029296875, 32.4501953125, 33.60009765625, 34.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 18.0, 9.0, 29.0, 40.0, 58.0, 83.0, 121.0, 165.0, 236.0, 385.0, 528.0, 743.0, 1138.0, 1768.0, 2636.0, 4227.0, 6845.0, 11684.0, 19872.0, 35091.0, 64425.0, 125521.0, 236923.0, 245870.0, 132498.0, 68463.0, 36765.0, 20720.0, 12067.0, 7096.0, 4336.0, 2723.0, 1754.0, 1168.0, 790.0, 518.0, 411.0, 244.0, 169.0, 143.0, 89.0, 61.0, 42.0, 29.0, 19.0, 11.0, 8.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.311279296875, -18.62255859375, -17.933837890625, -17.2451171875, -16.556396484375, -15.86767578125, -15.178955078125, -14.490234375, -13.801513671875, -13.11279296875, -12.424072265625, -11.7353515625, -11.046630859375, -10.35791015625, -9.669189453125, -8.98046875, -8.291748046875, -7.60302734375, -6.914306640625, -6.2255859375, -5.536865234375, -4.84814453125, -4.159423828125, -3.470703125, -2.781982421875, -2.09326171875, -1.404541015625, -0.7158203125, -0.027099609375, 0.66162109375, 1.350341796875, 2.0390625, 2.727783203125, 3.41650390625, 4.105224609375, 4.7939453125, 5.482666015625, 6.17138671875, 6.860107421875, 7.548828125, 8.237548828125, 8.92626953125, 9.614990234375, 10.3037109375, 10.992431640625, 11.68115234375, 12.369873046875, 13.05859375, 13.747314453125, 14.43603515625, 15.124755859375, 15.8134765625, 16.502197265625, 17.19091796875, 17.879638671875, 18.568359375, 19.257080078125, 19.94580078125, 20.634521484375, 21.3232421875, 22.011962890625, 22.70068359375, 23.389404296875, 24.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 10.0, 5.0, 18.0, 17.0, 24.0, 33.0, 38.0, 47.0, 46.0, 65.0, 83.0, 88.0, 95.0, 96.0, 81.0, 41.0, 39.0, 38.0, 21.0, 28.0, 10.0, 10.0, 11.0, 5.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.002114593982696533, -0.0020357370376586914, -0.0019568800926208496, -0.0018780231475830078, -0.001799166202545166, -0.0017203092575073242, -0.0016414523124694824, -0.0015625953674316406, -0.0014837384223937988, -0.001404881477355957, -0.0013260245323181152, -0.0012471675872802734, -0.0011683106422424316, -0.0010894536972045898, -0.001010596752166748, -0.0009317398071289062, -0.0008528828620910645, -0.0007740259170532227, -0.0006951689720153809, -0.0006163120269775391, -0.0005374550819396973, -0.00045859813690185547, -0.00037974119186401367, -0.0003008842468261719, -0.00022202730178833008, -0.00014317035675048828, -6.431341171264648e-05, 1.4543533325195312e-05, 9.340047836303711e-05, 0.0001722574234008789, 0.0002511143684387207, 0.0003299713134765625, 0.0004088282585144043, 0.0004876852035522461, 0.0005665421485900879, 0.0006453990936279297, 0.0007242560386657715, 0.0008031129837036133, 0.0008819699287414551, 0.0009608268737792969, 0.0010396838188171387, 0.0011185407638549805, 0.0011973977088928223, 0.001276254653930664, 0.0013551115989685059, 0.0014339685440063477, 0.0015128254890441895, 0.0015916824340820312, 0.001670539379119873, 0.0017493963241577148, 0.0018282532691955566, 0.0019071102142333984, 0.0019859671592712402, 0.002064824104309082, 0.002143681049346924, 0.0022225379943847656, 0.0023013949394226074, 0.0023802518844604492, 0.002459108829498291, 0.002537965774536133, 0.0026168227195739746, 0.0026956796646118164, 0.002774536609649658, 0.0028533935546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 7.0, 13.0, 19.0, 23.0, 45.0, 47.0, 95.0, 128.0, 153.0, 258.0, 345.0, 489.0, 748.0, 1074.0, 1608.0, 2326.0, 3561.0, 5740.0, 8773.0, 13919.0, 23266.0, 40024.0, 70654.0, 125302.0, 206549.0, 217522.0, 137177.0, 77002.0, 43610.0, 25560.0, 15348.0, 9558.0, 5995.0, 3784.0, 2524.0, 1702.0, 1060.0, 820.0, 524.0, 379.0, 263.0, 162.0, 133.0, 85.0, 68.0, 39.0, 19.0, 16.0, 14.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.34716796875, -17.7568359375, -17.16650390625, -16.576171875, -15.98583984375, -15.3955078125, -14.80517578125, -14.21484375, -13.62451171875, -13.0341796875, -12.44384765625, -11.853515625, -11.26318359375, -10.6728515625, -10.08251953125, -9.4921875, -8.90185546875, -8.3115234375, -7.72119140625, -7.130859375, -6.54052734375, -5.9501953125, -5.35986328125, -4.76953125, -4.17919921875, -3.5888671875, -2.99853515625, -2.408203125, -1.81787109375, -1.2275390625, -0.63720703125, -0.046875, 0.54345703125, 1.1337890625, 1.72412109375, 2.314453125, 2.90478515625, 3.4951171875, 4.08544921875, 4.67578125, 5.26611328125, 5.8564453125, 6.44677734375, 7.037109375, 7.62744140625, 8.2177734375, 8.80810546875, 9.3984375, 9.98876953125, 10.5791015625, 11.16943359375, 11.759765625, 12.35009765625, 12.9404296875, 13.53076171875, 14.12109375, 14.71142578125, 15.3017578125, 15.89208984375, 16.482421875, 17.07275390625, 17.6630859375, 18.25341796875, 18.84375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 9.0, 6.0, 9.0, 10.0, 12.0, 16.0, 24.0, 23.0, 33.0, 28.0, 42.0, 45.0, 56.0, 41.0, 50.0, 68.0, 63.0, 53.0, 54.0, 48.0, 35.0, 50.0, 33.0, 31.0, 17.0, 21.0, 20.0, 21.0, 15.0, 7.0, 14.0, 10.0, 3.0, 6.0, 1.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.57421875, -6.378173828125, -6.18212890625, -5.986083984375, -5.7900390625, -5.593994140625, -5.39794921875, -5.201904296875, -5.005859375, -4.809814453125, -4.61376953125, -4.417724609375, -4.2216796875, -4.025634765625, -3.82958984375, -3.633544921875, -3.4375, -3.241455078125, -3.04541015625, -2.849365234375, -2.6533203125, -2.457275390625, -2.26123046875, -2.065185546875, -1.869140625, -1.673095703125, -1.47705078125, -1.281005859375, -1.0849609375, -0.888916015625, -0.69287109375, -0.496826171875, -0.30078125, -0.104736328125, 0.09130859375, 0.287353515625, 0.4833984375, 0.679443359375, 0.87548828125, 1.071533203125, 1.267578125, 1.463623046875, 1.65966796875, 1.855712890625, 2.0517578125, 2.247802734375, 2.44384765625, 2.639892578125, 2.8359375, 3.031982421875, 3.22802734375, 3.424072265625, 3.6201171875, 3.816162109375, 4.01220703125, 4.208251953125, 4.404296875, 4.600341796875, 4.79638671875, 4.992431640625, 5.1884765625, 5.384521484375, 5.58056640625, 5.776611328125, 5.97265625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 13.0, 12.0, 22.0, 25.0, 37.0, 51.0, 60.0, 85.0, 99.0, 117.0, 96.0, 85.0, 69.0, 73.0, 42.0, 21.0, 25.0, 15.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.57764434814453, -114.96800994873047, -111.35836791992188, -107.74873352050781, -104.13909149169922, -100.52945709228516, -96.91981506347656, -93.3101806640625, -89.7005386352539, -86.09090423583984, -82.48126220703125, -78.87162780761719, -75.2619857788086, -71.65235137939453, -68.04270935058594, -64.43307495117188, -60.82343673706055, -57.21379852294922, -53.60416030883789, -49.99452209472656, -46.384883880615234, -42.775245666503906, -39.165611267089844, -35.55596923828125, -31.946332931518555, -28.336694717407227, -24.7270565032959, -21.117420196533203, -17.507781982421875, -13.898143768310547, -10.288505554199219, -6.678867340087891, -3.0692291259765625, 0.5404088497161865, 4.1500468254089355, 7.7596845626831055, 11.369322776794434, 14.978960037231445, 18.588598251342773, 22.1982364654541, 25.80787467956543, 29.417512893676758, 33.02714920043945, 36.63678741455078, 40.24642562866211, 43.85606384277344, 47.465702056884766, 51.075340270996094, 54.68497848510742, 58.29461669921875, 61.90425491333008, 65.5138931274414, 69.12352752685547, 72.73316955566406, 76.34280395507812, 79.95244598388672, 83.56208038330078, 87.17171478271484, 90.78135681152344, 94.3909912109375, 98.0006332397461, 101.61026763916016, 105.21990966796875, 108.82954406738281, 112.4391860961914]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 0.0, 6.0, 5.0, 3.0, 6.0, 3.0, 7.0, 13.0, 9.0, 16.0, 18.0, 24.0, 15.0, 33.0, 22.0, 26.0, 39.0, 35.0, 32.0, 40.0, 34.0, 34.0, 47.0, 38.0, 48.0, 40.0, 45.0, 41.0, 30.0, 30.0, 35.0, 30.0, 27.0, 19.0, 18.0, 18.0, 19.0, 10.0, 19.0, 10.0, 9.0, 14.0, 6.0, 3.0, 6.0, 1.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-57.111000061035156, -55.35655975341797, -53.60212326049805, -51.84768295288086, -50.09324645996094, -48.33880615234375, -46.58436584472656, -44.82992935180664, -43.07549285888672, -41.32105255126953, -39.56661605834961, -37.81217575073242, -36.0577392578125, -34.30329895019531, -32.548858642578125, -30.794422149658203, -29.039981842041016, -27.28554344177246, -25.531105041503906, -23.77666473388672, -22.022228240966797, -20.26778793334961, -18.513349533081055, -16.7589111328125, -15.004472732543945, -13.25003433227539, -11.495595932006836, -9.741156578063965, -7.98671817779541, -6.2322797775268555, -4.477840423583984, -2.7234020233154297, -0.9689598083496094, 0.7854788303375244, 2.539917469024658, 4.294356346130371, 6.048794746398926, 7.8032331466674805, 9.557672500610352, 11.312110900878906, 13.066549301147461, 14.820987701416016, 16.57542610168457, 18.329864501953125, 20.084304809570312, 21.838741302490234, 23.593181610107422, 25.347620010375977, 27.10205841064453, 28.856496810913086, 30.61093521118164, 32.36537551879883, 34.11981201171875, 35.87425231933594, 37.628692626953125, 39.38312911987305, 41.13756561279297, 42.892005920410156, 44.64644241333008, 46.400882720947266, 48.15531921386719, 49.909759521484375, 51.66419982910156, 53.418636322021484, 55.17307662963867]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 16.0, 16.0, 32.0, 36.0, 49.0, 73.0, 97.0, 135.0, 211.0, 286.0, 393.0, 638.0, 900.0, 1351.0, 1990.0, 3004.0, 4795.0, 7559.0, 12518.0, 21141.0, 37572.0, 70918.0, 163143.0, 560551.0, 1619468.0, 1130163.0, 318665.0, 112459.0, 53638.0, 28960.0, 16505.0, 9773.0, 6069.0, 3795.0, 2525.0, 1560.0, 1126.0, 726.0, 471.0, 320.0, 225.0, 150.0, 92.0, 59.0, 36.0, 22.0, 14.0, 12.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-77.125, -74.6982421875, -72.271484375, -69.8447265625, -67.41796875, -64.9912109375, -62.564453125, -60.1376953125, -57.7109375, -55.2841796875, -52.857421875, -50.4306640625, -48.00390625, -45.5771484375, -43.150390625, -40.7236328125, -38.296875, -35.8701171875, -33.443359375, -31.0166015625, -28.58984375, -26.1630859375, -23.736328125, -21.3095703125, -18.8828125, -16.4560546875, -14.029296875, -11.6025390625, -9.17578125, -6.7490234375, -4.322265625, -1.8955078125, 0.53125, 2.9580078125, 5.384765625, 7.8115234375, 10.23828125, 12.6650390625, 15.091796875, 17.5185546875, 19.9453125, 22.3720703125, 24.798828125, 27.2255859375, 29.65234375, 32.0791015625, 34.505859375, 36.9326171875, 39.359375, 41.7861328125, 44.212890625, 46.6396484375, 49.06640625, 51.4931640625, 53.919921875, 56.3466796875, 58.7734375, 61.2001953125, 63.626953125, 66.0537109375, 68.48046875, 70.9072265625, 73.333984375, 75.7607421875, 78.1875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 3.0, 6.0, 5.0, 15.0, 11.0, 10.0, 13.0, 21.0, 23.0, 20.0, 39.0, 23.0, 24.0, 30.0, 47.0, 29.0, 39.0, 38.0, 51.0, 41.0, 47.0, 43.0, 32.0, 39.0, 51.0, 35.0, 32.0, 26.0, 22.0, 34.0, 19.0, 21.0, 13.0, 11.0, 14.0, 6.0, 14.0, 9.0, 8.0, 1.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-41.5625, -40.2880859375, -39.013671875, -37.7392578125, -36.46484375, -35.1904296875, -33.916015625, -32.6416015625, -31.3671875, -30.0927734375, -28.818359375, -27.5439453125, -26.26953125, -24.9951171875, -23.720703125, -22.4462890625, -21.171875, -19.8974609375, -18.623046875, -17.3486328125, -16.07421875, -14.7998046875, -13.525390625, -12.2509765625, -10.9765625, -9.7021484375, -8.427734375, -7.1533203125, -5.87890625, -4.6044921875, -3.330078125, -2.0556640625, -0.78125, 0.4931640625, 1.767578125, 3.0419921875, 4.31640625, 5.5908203125, 6.865234375, 8.1396484375, 9.4140625, 10.6884765625, 11.962890625, 13.2373046875, 14.51171875, 15.7861328125, 17.060546875, 18.3349609375, 19.609375, 20.8837890625, 22.158203125, 23.4326171875, 24.70703125, 25.9814453125, 27.255859375, 28.5302734375, 29.8046875, 31.0791015625, 32.353515625, 33.6279296875, 34.90234375, 36.1767578125, 37.451171875, 38.7255859375, 40.0]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 6.0, 22.0, 44.0, 50.0, 45.0, 112.0, 149.0, 241.0, 421.0, 634.0, 1011.0, 1682.0, 2706.0, 4563.0, 7833.0, 13554.0, 23477.0, 42373.0, 79959.0, 155866.0, 333833.0, 861504.0, 1540961.0, 601759.0, 252917.0, 122352.0, 64258.0, 35007.0, 19596.0, 11293.0, 6419.0, 3826.0, 2278.0, 1387.0, 856.0, 499.0, 306.0, 181.0, 110.0, 71.0, 35.0, 22.0, 16.0, 19.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.875, -61.6201171875, -59.365234375, -57.1103515625, -54.85546875, -52.6005859375, -50.345703125, -48.0908203125, -45.8359375, -43.5810546875, -41.326171875, -39.0712890625, -36.81640625, -34.5615234375, -32.306640625, -30.0517578125, -27.796875, -25.5419921875, -23.287109375, -21.0322265625, -18.77734375, -16.5224609375, -14.267578125, -12.0126953125, -9.7578125, -7.5029296875, -5.248046875, -2.9931640625, -0.73828125, 1.5166015625, 3.771484375, 6.0263671875, 8.28125, 10.5361328125, 12.791015625, 15.0458984375, 17.30078125, 19.5556640625, 21.810546875, 24.0654296875, 26.3203125, 28.5751953125, 30.830078125, 33.0849609375, 35.33984375, 37.5947265625, 39.849609375, 42.1044921875, 44.359375, 46.6142578125, 48.869140625, 51.1240234375, 53.37890625, 55.6337890625, 57.888671875, 60.1435546875, 62.3984375, 64.6533203125, 66.908203125, 69.1630859375, 71.41796875, 73.6728515625, 75.927734375, 78.1826171875, 80.4375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 13.0, 7.0, 11.0, 22.0, 16.0, 24.0, 36.0, 33.0, 50.0, 59.0, 72.0, 109.0, 104.0, 141.0, 163.0, 200.0, 235.0, 275.0, 336.0, 389.0, 278.0, 230.0, 202.0, 163.0, 149.0, 121.0, 89.0, 78.0, 78.0, 65.0, 55.0, 44.0, 27.0, 39.0, 35.0, 16.0, 17.0, 21.0, 10.0, 10.0, 10.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.4375, -18.8076171875, -18.177734375, -17.5478515625, -16.91796875, -16.2880859375, -15.658203125, -15.0283203125, -14.3984375, -13.7685546875, -13.138671875, -12.5087890625, -11.87890625, -11.2490234375, -10.619140625, -9.9892578125, -9.359375, -8.7294921875, -8.099609375, -7.4697265625, -6.83984375, -6.2099609375, -5.580078125, -4.9501953125, -4.3203125, -3.6904296875, -3.060546875, -2.4306640625, -1.80078125, -1.1708984375, -0.541015625, 0.0888671875, 0.71875, 1.3486328125, 1.978515625, 2.6083984375, 3.23828125, 3.8681640625, 4.498046875, 5.1279296875, 5.7578125, 6.3876953125, 7.017578125, 7.6474609375, 8.27734375, 8.9072265625, 9.537109375, 10.1669921875, 10.796875, 11.4267578125, 12.056640625, 12.6865234375, 13.31640625, 13.9462890625, 14.576171875, 15.2060546875, 15.8359375, 16.4658203125, 17.095703125, 17.7255859375, 18.35546875, 18.9853515625, 19.615234375, 20.2451171875, 20.875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 3.0, 12.0, 9.0, 16.0, 19.0, 30.0, 33.0, 38.0, 38.0, 43.0, 50.0, 67.0, 71.0, 62.0, 75.0, 63.0, 71.0, 43.0, 52.0, 33.0, 36.0, 15.0, 20.0, 20.0, 12.0, 7.0, 8.0, 11.0, 8.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.30702209472656, -55.384098052978516, -53.46117401123047, -51.538246154785156, -49.61532211303711, -47.69239807128906, -45.769474029541016, -43.84654998779297, -41.92362594604492, -40.000701904296875, -38.07777786254883, -36.15485382080078, -34.23192596435547, -32.30900192260742, -30.386077880859375, -28.463153839111328, -26.54022789001465, -24.6173038482666, -22.694377899169922, -20.771453857421875, -18.848529815673828, -16.92560577392578, -15.002679824829102, -13.079755783081055, -11.156830787658691, -9.233905792236328, -7.310981750488281, -5.388056755065918, -3.465132236480713, -1.5422077178955078, 0.38071727752685547, 2.3036413192749023, 4.226566314697266, 6.149490833282471, 8.072415351867676, 9.995340347290039, 11.918264389038086, 13.84118938446045, 15.764114379882812, 17.68703842163086, 19.609962463378906, 21.532886505126953, 23.455812454223633, 25.37873649597168, 27.301660537719727, 29.224586486816406, 31.147510528564453, 33.0704345703125, 34.99336242675781, 36.91628646850586, 38.839210510253906, 40.76213836669922, 42.685062408447266, 44.60798645019531, 46.53091049194336, 48.453834533691406, 50.37675857543945, 52.2996826171875, 54.22260665893555, 56.145530700683594, 58.068458557128906, 59.99138259887695, 61.914306640625, 63.83723068237305, 65.7601547241211]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 6.0, 11.0, 18.0, 18.0, 13.0, 24.0, 20.0, 24.0, 27.0, 38.0, 37.0, 36.0, 45.0, 51.0, 42.0, 38.0, 54.0, 40.0, 36.0, 42.0, 54.0, 31.0, 32.0, 38.0, 24.0, 21.0, 26.0, 25.0, 12.0, 19.0, 18.0, 10.0, 11.0, 9.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.858299255371094, -49.344215393066406, -47.830135345458984, -46.3160514831543, -44.801971435546875, -43.28788757324219, -41.7738037109375, -40.25972366333008, -38.745643615722656, -37.23155975341797, -35.71747970581055, -34.20339584350586, -32.68931579589844, -31.17523193359375, -29.661149978637695, -28.14706802368164, -26.632984161376953, -25.1189022064209, -23.604820251464844, -22.090736389160156, -20.576656341552734, -19.062572479248047, -17.548490524291992, -16.034408569335938, -14.520326614379883, -13.006244659423828, -11.492162704467773, -9.978079795837402, -8.463997840881348, -6.949915885925293, -5.435832977294922, -3.921751022338867, -2.407672882080078, -0.8935906887054443, 0.6204915046691895, 2.1345739364624023, 3.648655891418457, 5.162737846374512, 6.676820755004883, 8.190902709960938, 9.704984664916992, 11.219066619873047, 12.733148574829102, 14.247231483459473, 15.761313438415527, 17.275394439697266, 18.789478302001953, 20.303560256958008, 21.817642211914062, 23.331724166870117, 24.845806121826172, 26.35988998413086, 27.87397003173828, 29.38805389404297, 30.902135848999023, 32.41621780395508, 33.9302978515625, 35.44438171386719, 36.95846176147461, 38.4725456237793, 39.98662567138672, 41.500709533691406, 43.014793395996094, 44.528873443603516, 46.0429573059082]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 8.0, 21.0, 21.0, 23.0, 48.0, 78.0, 113.0, 189.0, 224.0, 338.0, 519.0, 790.0, 1350.0, 1957.0, 3063.0, 4528.0, 7627.0, 12342.0, 20637.0, 35370.0, 61580.0, 108851.0, 192780.0, 241600.0, 150328.0, 84377.0, 48605.0, 28015.0, 16262.0, 9853.0, 6164.0, 3791.0, 2436.0, 1561.0, 1052.0, 683.0, 475.0, 337.0, 178.0, 116.0, 94.0, 63.0, 31.0, 25.0, 18.0, 14.0, 11.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-91.875, -89.1142578125, -86.353515625, -83.5927734375, -80.83203125, -78.0712890625, -75.310546875, -72.5498046875, -69.7890625, -67.0283203125, -64.267578125, -61.5068359375, -58.74609375, -55.9853515625, -53.224609375, -50.4638671875, -47.703125, -44.9423828125, -42.181640625, -39.4208984375, -36.66015625, -33.8994140625, -31.138671875, -28.3779296875, -25.6171875, -22.8564453125, -20.095703125, -17.3349609375, -14.57421875, -11.8134765625, -9.052734375, -6.2919921875, -3.53125, -0.7705078125, 1.990234375, 4.7509765625, 7.51171875, 10.2724609375, 13.033203125, 15.7939453125, 18.5546875, 21.3154296875, 24.076171875, 26.8369140625, 29.59765625, 32.3583984375, 35.119140625, 37.8798828125, 40.640625, 43.4013671875, 46.162109375, 48.9228515625, 51.68359375, 54.4443359375, 57.205078125, 59.9658203125, 62.7265625, 65.4873046875, 68.248046875, 71.0087890625, 73.76953125, 76.5302734375, 79.291015625, 82.0517578125, 84.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 8.0, 8.0, 13.0, 15.0, 20.0, 11.0, 27.0, 28.0, 26.0, 39.0, 38.0, 43.0, 43.0, 48.0, 42.0, 45.0, 40.0, 51.0, 42.0, 44.0, 52.0, 42.0, 25.0, 36.0, 37.0, 24.0, 17.0, 24.0, 16.0, 20.0, 20.0, 9.0, 4.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.40625, -46.970703125, -45.53515625, -44.099609375, -42.6640625, -41.228515625, -39.79296875, -38.357421875, -36.921875, -35.486328125, -34.05078125, -32.615234375, -31.1796875, -29.744140625, -28.30859375, -26.873046875, -25.4375, -24.001953125, -22.56640625, -21.130859375, -19.6953125, -18.259765625, -16.82421875, -15.388671875, -13.953125, -12.517578125, -11.08203125, -9.646484375, -8.2109375, -6.775390625, -5.33984375, -3.904296875, -2.46875, -1.033203125, 0.40234375, 1.837890625, 3.2734375, 4.708984375, 6.14453125, 7.580078125, 9.015625, 10.451171875, 11.88671875, 13.322265625, 14.7578125, 16.193359375, 17.62890625, 19.064453125, 20.5, 21.935546875, 23.37109375, 24.806640625, 26.2421875, 27.677734375, 29.11328125, 30.548828125, 31.984375, 33.419921875, 34.85546875, 36.291015625, 37.7265625, 39.162109375, 40.59765625, 42.033203125, 43.46875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 29.0, 25.0, 36.0, 47.0, 59.0, 82.0, 96.0, 149.0, 241.0, 370.0, 542.0, 787.0, 1130.0, 1924.0, 2850.0, 4670.0, 7648.0, 13094.0, 23282.0, 43363.0, 88525.0, 204858.0, 335954.0, 161347.0, 72189.0, 36215.0, 19474.0, 11242.0, 6723.0, 4017.0, 2615.0, 1654.0, 1033.0, 727.0, 489.0, 344.0, 239.0, 146.0, 111.0, 73.0, 46.0, 29.0, 23.0, 17.0, 11.0, 5.0, 3.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.375, -108.7919921875, -105.208984375, -101.6259765625, -98.04296875, -94.4599609375, -90.876953125, -87.2939453125, -83.7109375, -80.1279296875, -76.544921875, -72.9619140625, -69.37890625, -65.7958984375, -62.212890625, -58.6298828125, -55.046875, -51.4638671875, -47.880859375, -44.2978515625, -40.71484375, -37.1318359375, -33.548828125, -29.9658203125, -26.3828125, -22.7998046875, -19.216796875, -15.6337890625, -12.05078125, -8.4677734375, -4.884765625, -1.3017578125, 2.28125, 5.8642578125, 9.447265625, 13.0302734375, 16.61328125, 20.1962890625, 23.779296875, 27.3623046875, 30.9453125, 34.5283203125, 38.111328125, 41.6943359375, 45.27734375, 48.8603515625, 52.443359375, 56.0263671875, 59.609375, 63.1923828125, 66.775390625, 70.3583984375, 73.94140625, 77.5244140625, 81.107421875, 84.6904296875, 88.2734375, 91.8564453125, 95.439453125, 99.0224609375, 102.60546875, 106.1884765625, 109.771484375, 113.3544921875, 116.9375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 9.0, 13.0, 8.0, 12.0, 19.0, 18.0, 16.0, 24.0, 32.0, 26.0, 31.0, 34.0, 32.0, 41.0, 43.0, 61.0, 38.0, 41.0, 47.0, 46.0, 37.0, 37.0, 47.0, 28.0, 28.0, 22.0, 34.0, 28.0, 18.0, 19.0, 23.0, 15.0, 9.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.234375, -30.186767578125, -29.13916015625, -28.091552734375, -27.0439453125, -25.996337890625, -24.94873046875, -23.901123046875, -22.853515625, -21.805908203125, -20.75830078125, -19.710693359375, -18.6630859375, -17.615478515625, -16.56787109375, -15.520263671875, -14.47265625, -13.425048828125, -12.37744140625, -11.329833984375, -10.2822265625, -9.234619140625, -8.18701171875, -7.139404296875, -6.091796875, -5.044189453125, -3.99658203125, -2.948974609375, -1.9013671875, -0.853759765625, 0.19384765625, 1.241455078125, 2.2890625, 3.336669921875, 4.38427734375, 5.431884765625, 6.4794921875, 7.527099609375, 8.57470703125, 9.622314453125, 10.669921875, 11.717529296875, 12.76513671875, 13.812744140625, 14.8603515625, 15.907958984375, 16.95556640625, 18.003173828125, 19.05078125, 20.098388671875, 21.14599609375, 22.193603515625, 23.2412109375, 24.288818359375, 25.33642578125, 26.384033203125, 27.431640625, 28.479248046875, 29.52685546875, 30.574462890625, 31.6220703125, 32.669677734375, 33.71728515625, 34.764892578125, 35.8125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 8.0, 18.0, 14.0, 20.0, 24.0, 38.0, 41.0, 60.0, 62.0, 81.0, 118.0, 143.0, 222.0, 304.0, 477.0, 764.0, 1324.0, 2672.0, 6039.0, 16609.0, 79438.0, 717217.0, 179517.0, 26755.0, 8286.0, 3492.0, 1826.0, 1043.0, 587.0, 399.0, 267.0, 177.0, 140.0, 83.0, 75.0, 57.0, 34.0, 27.0, 21.0, 16.0, 13.0, 5.0, 9.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.3125, -75.759765625, -73.20703125, -70.654296875, -68.1015625, -65.548828125, -62.99609375, -60.443359375, -57.890625, -55.337890625, -52.78515625, -50.232421875, -47.6796875, -45.126953125, -42.57421875, -40.021484375, -37.46875, -34.916015625, -32.36328125, -29.810546875, -27.2578125, -24.705078125, -22.15234375, -19.599609375, -17.046875, -14.494140625, -11.94140625, -9.388671875, -6.8359375, -4.283203125, -1.73046875, 0.822265625, 3.375, 5.927734375, 8.48046875, 11.033203125, 13.5859375, 16.138671875, 18.69140625, 21.244140625, 23.796875, 26.349609375, 28.90234375, 31.455078125, 34.0078125, 36.560546875, 39.11328125, 41.666015625, 44.21875, 46.771484375, 49.32421875, 51.876953125, 54.4296875, 56.982421875, 59.53515625, 62.087890625, 64.640625, 67.193359375, 69.74609375, 72.298828125, 74.8515625, 77.404296875, 79.95703125, 82.509765625, 85.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 8.0, 14.0, 20.0, 37.0, 92.0, 232.0, 316.0, 142.0, 63.0, 28.0, 9.0, 7.0, 10.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01021575927734375, -0.009941577911376953, -0.009667396545410156, -0.00939321517944336, -0.009119033813476562, -0.008844852447509766, -0.008570671081542969, -0.008296489715576172, -0.008022308349609375, -0.007748126983642578, -0.007473945617675781, -0.007199764251708984, -0.0069255828857421875, -0.006651401519775391, -0.006377220153808594, -0.006103038787841797, -0.005828857421875, -0.005554676055908203, -0.005280494689941406, -0.005006313323974609, -0.0047321319580078125, -0.004457950592041016, -0.004183769226074219, -0.003909587860107422, -0.003635406494140625, -0.003361225128173828, -0.0030870437622070312, -0.0028128623962402344, -0.0025386810302734375, -0.0022644996643066406, -0.0019903182983398438, -0.0017161369323730469, -0.00144195556640625, -0.0011677742004394531, -0.0008935928344726562, -0.0006194114685058594, -0.0003452301025390625, -7.104873657226562e-05, 0.00020313262939453125, 0.0004773139953613281, 0.000751495361328125, 0.0010256767272949219, 0.0012998580932617188, 0.0015740394592285156, 0.0018482208251953125, 0.0021224021911621094, 0.0023965835571289062, 0.002670764923095703, 0.0029449462890625, 0.003219127655029297, 0.0034933090209960938, 0.0037674903869628906, 0.0040416717529296875, 0.004315853118896484, 0.004590034484863281, 0.004864215850830078, 0.005138397216796875, 0.005412578582763672, 0.005686759948730469, 0.005960941314697266, 0.0062351226806640625, 0.006509304046630859, 0.006783485412597656, 0.007057666778564453, 0.00733184814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 7.0, 6.0, 8.0, 12.0, 17.0, 15.0, 23.0, 47.0, 50.0, 89.0, 107.0, 183.0, 270.0, 395.0, 632.0, 1040.0, 1712.0, 2920.0, 5096.0, 10367.0, 26470.0, 111332.0, 599301.0, 219077.0, 40359.0, 13771.0, 6276.0, 3486.0, 2012.0, 1241.0, 727.0, 454.0, 344.0, 253.0, 154.0, 102.0, 54.0, 47.0, 31.0, 21.0, 13.0, 15.0, 6.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-84.25, -81.95263671875, -79.6552734375, -77.35791015625, -75.060546875, -72.76318359375, -70.4658203125, -68.16845703125, -65.87109375, -63.57373046875, -61.2763671875, -58.97900390625, -56.681640625, -54.38427734375, -52.0869140625, -49.78955078125, -47.4921875, -45.19482421875, -42.8974609375, -40.60009765625, -38.302734375, -36.00537109375, -33.7080078125, -31.41064453125, -29.11328125, -26.81591796875, -24.5185546875, -22.22119140625, -19.923828125, -17.62646484375, -15.3291015625, -13.03173828125, -10.734375, -8.43701171875, -6.1396484375, -3.84228515625, -1.544921875, 0.75244140625, 3.0498046875, 5.34716796875, 7.64453125, 9.94189453125, 12.2392578125, 14.53662109375, 16.833984375, 19.13134765625, 21.4287109375, 23.72607421875, 26.0234375, 28.32080078125, 30.6181640625, 32.91552734375, 35.212890625, 37.51025390625, 39.8076171875, 42.10498046875, 44.40234375, 46.69970703125, 48.9970703125, 51.29443359375, 53.591796875, 55.88916015625, 58.1865234375, 60.48388671875, 62.78125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 10.0, 11.0, 18.0, 29.0, 48.0, 76.0, 131.0, 151.0, 144.0, 101.0, 90.0, 43.0, 31.0, 22.0, 13.0, 6.0, 9.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3778076171875, -12.794677734375, -12.2115478515625, -11.62841796875, -11.0452880859375, -10.462158203125, -9.8790283203125, -9.2958984375, -8.7127685546875, -8.129638671875, -7.5465087890625, -6.96337890625, -6.3802490234375, -5.797119140625, -5.2139892578125, -4.630859375, -4.0477294921875, -3.464599609375, -2.8814697265625, -2.29833984375, -1.7152099609375, -1.132080078125, -0.5489501953125, 0.0341796875, 0.6173095703125, 1.200439453125, 1.7835693359375, 2.36669921875, 2.9498291015625, 3.532958984375, 4.1160888671875, 4.69921875, 5.2823486328125, 5.865478515625, 6.4486083984375, 7.03173828125, 7.6148681640625, 8.197998046875, 8.7811279296875, 9.3642578125, 9.9473876953125, 10.530517578125, 11.1136474609375, 11.69677734375, 12.2799072265625, 12.863037109375, 13.4461669921875, 14.029296875, 14.6124267578125, 15.195556640625, 15.7786865234375, 16.36181640625, 16.9449462890625, 17.528076171875, 18.1112060546875, 18.6943359375, 19.2774658203125, 19.860595703125, 20.4437255859375, 21.02685546875, 21.6099853515625, 22.193115234375, 22.7762451171875, 23.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 8.0, 4.0, 8.0, 14.0, 15.0, 19.0, 33.0, 35.0, 46.0, 36.0, 48.0, 55.0, 61.0, 62.0, 59.0, 66.0, 53.0, 55.0, 45.0, 42.0, 28.0, 30.0, 32.0, 22.0, 21.0, 12.0, 16.0, 11.0, 10.0, 3.0, 5.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.002079010009766, -41.50918960571289, -40.016300201416016, -38.523406982421875, -37.030517578125, -35.537628173828125, -34.04473876953125, -32.551849365234375, -31.058958053588867, -29.566068649291992, -28.073177337646484, -26.58028793334961, -25.087398529052734, -23.594507217407227, -22.10161781311035, -20.608726501464844, -19.11583709716797, -17.622947692871094, -16.130056381225586, -14.637166976928711, -13.14427661895752, -11.651386260986328, -10.158496856689453, -8.665606498718262, -7.17271614074707, -5.679825782775879, -4.186935901641846, -2.6940460205078125, -1.201155662536621, 0.2917346954345703, 1.7846240997314453, 3.2775144577026367, 4.770404815673828, 6.2632951736450195, 7.756185054779053, 9.249074935913086, 10.741965293884277, 12.234855651855469, 13.727745056152344, 15.220635414123535, 16.713525772094727, 18.2064151763916, 19.69930648803711, 21.192195892333984, 22.68508529663086, 24.177976608276367, 25.670866012573242, 27.16375732421875, 28.656646728515625, 30.1495361328125, 31.642427444458008, 33.13531494140625, 34.62820816040039, 36.121097564697266, 37.61398696899414, 39.106876373291016, 40.599769592285156, 42.09265899658203, 43.585548400878906, 45.07843780517578, 46.57133102416992, 48.0642204284668, 49.55710983276367, 51.04999923706055, 52.54288864135742]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 4.0, 7.0, 10.0, 13.0, 17.0, 15.0, 14.0, 13.0, 25.0, 22.0, 30.0, 25.0, 43.0, 47.0, 50.0, 32.0, 30.0, 40.0, 38.0, 48.0, 57.0, 38.0, 40.0, 36.0, 35.0, 26.0, 27.0, 26.0, 28.0, 21.0, 17.0, 18.0, 20.0, 13.0, 13.0, 9.0, 8.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-44.74073791503906, -43.462337493896484, -42.18394088745117, -40.905540466308594, -39.627140045166016, -38.34873962402344, -37.070343017578125, -35.79194259643555, -34.51354217529297, -33.23514175415039, -31.956743240356445, -30.6783447265625, -29.399944305419922, -28.121545791625977, -26.84314727783203, -25.564746856689453, -24.28635025024414, -23.007951736450195, -21.729551315307617, -20.451152801513672, -19.172752380371094, -17.89435386657715, -16.615955352783203, -15.337555885314941, -14.05915641784668, -12.780756950378418, -11.502357482910156, -10.223958969116211, -8.94555950164795, -7.6671600341796875, -6.388761043548584, -5.1103620529174805, -3.8319664001464844, -2.5535671710968018, -1.2751679420471191, 0.0032312870025634766, 1.281630516052246, 2.560029983520508, 3.8384289741516113, 5.116827964782715, 6.395227432250977, 7.673626899719238, 8.9520263671875, 10.230424880981445, 11.508824348449707, 12.787223815917969, 14.065622329711914, 15.344021797180176, 16.622421264648438, 17.900819778442383, 19.17922019958496, 20.457618713378906, 21.736019134521484, 23.01441764831543, 24.292816162109375, 25.571216583251953, 26.8496150970459, 28.128013610839844, 29.406414031982422, 30.684812545776367, 31.963211059570312, 33.24161148071289, 34.52001190185547, 35.79840850830078, 37.07680892944336]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 13.0, 10.0, 16.0, 28.0, 43.0, 48.0, 67.0, 146.0, 216.0, 326.0, 473.0, 708.0, 1058.0, 1579.0, 2557.0, 3953.0, 6163.0, 9856.0, 15872.0, 25872.0, 41218.0, 66957.0, 108330.0, 166545.0, 198222.0, 148217.0, 95088.0, 58839.0, 35885.0, 22316.0, 13767.0, 8713.0, 5455.0, 3497.0, 2256.0, 1481.0, 999.0, 567.0, 398.0, 277.0, 159.0, 125.0, 78.0, 51.0, 35.0, 26.0, 23.0, 10.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-50.6875, -49.16796875, -47.6484375, -46.12890625, -44.609375, -43.08984375, -41.5703125, -40.05078125, -38.53125, -37.01171875, -35.4921875, -33.97265625, -32.453125, -30.93359375, -29.4140625, -27.89453125, -26.375, -24.85546875, -23.3359375, -21.81640625, -20.296875, -18.77734375, -17.2578125, -15.73828125, -14.21875, -12.69921875, -11.1796875, -9.66015625, -8.140625, -6.62109375, -5.1015625, -3.58203125, -2.0625, -0.54296875, 0.9765625, 2.49609375, 4.015625, 5.53515625, 7.0546875, 8.57421875, 10.09375, 11.61328125, 13.1328125, 14.65234375, 16.171875, 17.69140625, 19.2109375, 20.73046875, 22.25, 23.76953125, 25.2890625, 26.80859375, 28.328125, 29.84765625, 31.3671875, 32.88671875, 34.40625, 35.92578125, 37.4453125, 38.96484375, 40.484375, 42.00390625, 43.5234375, 45.04296875, 46.5625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 2.0, 6.0, 3.0, 6.0, 3.0, 4.0, 8.0, 11.0, 15.0, 17.0, 14.0, 17.0, 22.0, 22.0, 29.0, 30.0, 44.0, 50.0, 45.0, 32.0, 47.0, 35.0, 45.0, 39.0, 48.0, 40.0, 46.0, 43.0, 36.0, 27.0, 32.0, 29.0, 23.0, 26.0, 17.0, 17.0, 16.0, 10.0, 11.0, 7.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-45.3125, -44.0087890625, -42.705078125, -41.4013671875, -40.09765625, -38.7939453125, -37.490234375, -36.1865234375, -34.8828125, -33.5791015625, -32.275390625, -30.9716796875, -29.66796875, -28.3642578125, -27.060546875, -25.7568359375, -24.453125, -23.1494140625, -21.845703125, -20.5419921875, -19.23828125, -17.9345703125, -16.630859375, -15.3271484375, -14.0234375, -12.7197265625, -11.416015625, -10.1123046875, -8.80859375, -7.5048828125, -6.201171875, -4.8974609375, -3.59375, -2.2900390625, -0.986328125, 0.3173828125, 1.62109375, 2.9248046875, 4.228515625, 5.5322265625, 6.8359375, 8.1396484375, 9.443359375, 10.7470703125, 12.05078125, 13.3544921875, 14.658203125, 15.9619140625, 17.265625, 18.5693359375, 19.873046875, 21.1767578125, 22.48046875, 23.7841796875, 25.087890625, 26.3916015625, 27.6953125, 28.9990234375, 30.302734375, 31.6064453125, 32.91015625, 34.2138671875, 35.517578125, 36.8212890625, 38.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 12.0, 15.0, 14.0, 19.0, 39.0, 52.0, 77.0, 128.0, 202.0, 278.0, 477.0, 827.0, 1381.0, 2356.0, 4108.0, 7529.0, 13944.0, 26707.0, 51895.0, 102817.0, 199559.0, 272697.0, 176477.0, 89715.0, 45059.0, 23886.0, 12478.0, 6841.0, 3775.0, 2056.0, 1217.0, 689.0, 421.0, 286.0, 170.0, 130.0, 66.0, 46.0, 35.0, 22.0, 17.0, 10.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.3125, -68.8017578125, -66.291015625, -63.7802734375, -61.26953125, -58.7587890625, -56.248046875, -53.7373046875, -51.2265625, -48.7158203125, -46.205078125, -43.6943359375, -41.18359375, -38.6728515625, -36.162109375, -33.6513671875, -31.140625, -28.6298828125, -26.119140625, -23.6083984375, -21.09765625, -18.5869140625, -16.076171875, -13.5654296875, -11.0546875, -8.5439453125, -6.033203125, -3.5224609375, -1.01171875, 1.4990234375, 4.009765625, 6.5205078125, 9.03125, 11.5419921875, 14.052734375, 16.5634765625, 19.07421875, 21.5849609375, 24.095703125, 26.6064453125, 29.1171875, 31.6279296875, 34.138671875, 36.6494140625, 39.16015625, 41.6708984375, 44.181640625, 46.6923828125, 49.203125, 51.7138671875, 54.224609375, 56.7353515625, 59.24609375, 61.7568359375, 64.267578125, 66.7783203125, 69.2890625, 71.7998046875, 74.310546875, 76.8212890625, 79.33203125, 81.8427734375, 84.353515625, 86.8642578125, 89.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 14.0, 8.0, 13.0, 11.0, 20.0, 22.0, 32.0, 16.0, 32.0, 30.0, 29.0, 49.0, 37.0, 44.0, 28.0, 49.0, 34.0, 42.0, 49.0, 42.0, 45.0, 40.0, 30.0, 37.0, 29.0, 32.0, 28.0, 28.0, 17.0, 12.0, 17.0, 19.0, 9.0, 14.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -29.06884765625, -28.2001953125, -27.33154296875, -26.462890625, -25.59423828125, -24.7255859375, -23.85693359375, -22.98828125, -22.11962890625, -21.2509765625, -20.38232421875, -19.513671875, -18.64501953125, -17.7763671875, -16.90771484375, -16.0390625, -15.17041015625, -14.3017578125, -13.43310546875, -12.564453125, -11.69580078125, -10.8271484375, -9.95849609375, -9.08984375, -8.22119140625, -7.3525390625, -6.48388671875, -5.615234375, -4.74658203125, -3.8779296875, -3.00927734375, -2.140625, -1.27197265625, -0.4033203125, 0.46533203125, 1.333984375, 2.20263671875, 3.0712890625, 3.93994140625, 4.80859375, 5.67724609375, 6.5458984375, 7.41455078125, 8.283203125, 9.15185546875, 10.0205078125, 10.88916015625, 11.7578125, 12.62646484375, 13.4951171875, 14.36376953125, 15.232421875, 16.10107421875, 16.9697265625, 17.83837890625, 18.70703125, 19.57568359375, 20.4443359375, 21.31298828125, 22.181640625, 23.05029296875, 23.9189453125, 24.78759765625, 25.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 17.0, 23.0, 32.0, 34.0, 54.0, 90.0, 100.0, 143.0, 216.0, 354.0, 463.0, 743.0, 1142.0, 1844.0, 3024.0, 5075.0, 9225.0, 17601.0, 36579.0, 88436.0, 249293.0, 373052.0, 149232.0, 56263.0, 25236.0, 12728.0, 6892.0, 4029.0, 2300.0, 1462.0, 915.0, 591.0, 428.0, 277.0, 178.0, 130.0, 96.0, 85.0, 45.0, 32.0, 24.0, 15.0, 20.0, 10.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.21875, -32.18896484375, -31.1591796875, -30.12939453125, -29.099609375, -28.06982421875, -27.0400390625, -26.01025390625, -24.98046875, -23.95068359375, -22.9208984375, -21.89111328125, -20.861328125, -19.83154296875, -18.8017578125, -17.77197265625, -16.7421875, -15.71240234375, -14.6826171875, -13.65283203125, -12.623046875, -11.59326171875, -10.5634765625, -9.53369140625, -8.50390625, -7.47412109375, -6.4443359375, -5.41455078125, -4.384765625, -3.35498046875, -2.3251953125, -1.29541015625, -0.265625, 0.76416015625, 1.7939453125, 2.82373046875, 3.853515625, 4.88330078125, 5.9130859375, 6.94287109375, 7.97265625, 9.00244140625, 10.0322265625, 11.06201171875, 12.091796875, 13.12158203125, 14.1513671875, 15.18115234375, 16.2109375, 17.24072265625, 18.2705078125, 19.30029296875, 20.330078125, 21.35986328125, 22.3896484375, 23.41943359375, 24.44921875, 25.47900390625, 26.5087890625, 27.53857421875, 28.568359375, 29.59814453125, 30.6279296875, 31.65771484375, 32.6875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 5.0, 11.0, 8.0, 19.0, 19.0, 32.0, 54.0, 90.0, 155.0, 188.0, 154.0, 84.0, 68.0, 45.0, 20.0, 15.0, 16.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004175961017608643, -0.00402987003326416, -0.0038837790489196777, -0.0037376880645751953, -0.003591597080230713, -0.0034455060958862305, -0.003299415111541748, -0.0031533241271972656, -0.003007233142852783, -0.0028611421585083008, -0.0027150511741638184, -0.002568960189819336, -0.0024228692054748535, -0.002276778221130371, -0.0021306872367858887, -0.0019845962524414062, -0.0018385052680969238, -0.0016924142837524414, -0.001546323299407959, -0.0014002323150634766, -0.0012541413307189941, -0.0011080503463745117, -0.0009619593620300293, -0.0008158683776855469, -0.0006697773933410645, -0.000523686408996582, -0.0003775954246520996, -0.0002315044403076172, -8.541345596313477e-05, 6.0677528381347656e-05, 0.00020676851272583008, 0.0003528594970703125, 0.0004989504814147949, 0.0006450414657592773, 0.0007911324501037598, 0.0009372234344482422, 0.0010833144187927246, 0.001229405403137207, 0.0013754963874816895, 0.0015215873718261719, 0.0016676783561706543, 0.0018137693405151367, 0.001959860324859619, 0.0021059513092041016, 0.002252042293548584, 0.0023981332778930664, 0.002544224262237549, 0.0026903152465820312, 0.0028364062309265137, 0.002982497215270996, 0.0031285881996154785, 0.003274679183959961, 0.0034207701683044434, 0.0035668611526489258, 0.003712952136993408, 0.0038590431213378906, 0.004005134105682373, 0.0041512250900268555, 0.004297316074371338, 0.00444340705871582, 0.004589498043060303, 0.004735589027404785, 0.004881680011749268, 0.00502777099609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 8.0, 14.0, 11.0, 13.0, 26.0, 30.0, 63.0, 63.0, 114.0, 164.0, 252.0, 389.0, 645.0, 1053.0, 1819.0, 3290.0, 6125.0, 12201.0, 26035.0, 63161.0, 177763.0, 408843.0, 213376.0, 74138.0, 29930.0, 13580.0, 6827.0, 3600.0, 1919.0, 1156.0, 680.0, 445.0, 282.0, 156.0, 117.0, 70.0, 58.0, 41.0, 31.0, 18.0, 12.0, 10.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-37.5, -36.38330078125, -35.2666015625, -34.14990234375, -33.033203125, -31.91650390625, -30.7998046875, -29.68310546875, -28.56640625, -27.44970703125, -26.3330078125, -25.21630859375, -24.099609375, -22.98291015625, -21.8662109375, -20.74951171875, -19.6328125, -18.51611328125, -17.3994140625, -16.28271484375, -15.166015625, -14.04931640625, -12.9326171875, -11.81591796875, -10.69921875, -9.58251953125, -8.4658203125, -7.34912109375, -6.232421875, -5.11572265625, -3.9990234375, -2.88232421875, -1.765625, -0.64892578125, 0.4677734375, 1.58447265625, 2.701171875, 3.81787109375, 4.9345703125, 6.05126953125, 7.16796875, 8.28466796875, 9.4013671875, 10.51806640625, 11.634765625, 12.75146484375, 13.8681640625, 14.98486328125, 16.1015625, 17.21826171875, 18.3349609375, 19.45166015625, 20.568359375, 21.68505859375, 22.8017578125, 23.91845703125, 25.03515625, 26.15185546875, 27.2685546875, 28.38525390625, 29.501953125, 30.61865234375, 31.7353515625, 32.85205078125, 33.96875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 12.0, 14.0, 24.0, 23.0, 26.0, 42.0, 29.0, 40.0, 65.0, 76.0, 63.0, 70.0, 70.0, 73.0, 68.0, 61.0, 41.0, 25.0, 33.0, 23.0, 18.0, 21.0, 11.0, 15.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.55615234375, -7.2998046875, -7.04345703125, -6.787109375, -6.53076171875, -6.2744140625, -6.01806640625, -5.76171875, -5.50537109375, -5.2490234375, -4.99267578125, -4.736328125, -4.47998046875, -4.2236328125, -3.96728515625, -3.7109375, -3.45458984375, -3.1982421875, -2.94189453125, -2.685546875, -2.42919921875, -2.1728515625, -1.91650390625, -1.66015625, -1.40380859375, -1.1474609375, -0.89111328125, -0.634765625, -0.37841796875, -0.1220703125, 0.13427734375, 0.390625, 0.64697265625, 0.9033203125, 1.15966796875, 1.416015625, 1.67236328125, 1.9287109375, 2.18505859375, 2.44140625, 2.69775390625, 2.9541015625, 3.21044921875, 3.466796875, 3.72314453125, 3.9794921875, 4.23583984375, 4.4921875, 4.74853515625, 5.0048828125, 5.26123046875, 5.517578125, 5.77392578125, 6.0302734375, 6.28662109375, 6.54296875, 6.79931640625, 7.0556640625, 7.31201171875, 7.568359375, 7.82470703125, 8.0810546875, 8.33740234375, 8.59375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 5.0, 10.0, 11.0, 13.0, 20.0, 20.0, 19.0, 26.0, 37.0, 43.0, 48.0, 42.0, 68.0, 51.0, 49.0, 59.0, 66.0, 58.0, 52.0, 40.0, 38.0, 25.0, 32.0, 23.0, 18.0, 17.0, 18.0, 21.0, 9.0, 9.0, 6.0, 6.0, 3.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.66911697387695, -39.29092788696289, -37.912742614746094, -36.53455352783203, -35.15636444091797, -33.778175354003906, -32.399986267089844, -31.021800994873047, -29.643611907958984, -28.265422821044922, -26.887235641479492, -25.509048461914062, -24.130859375, -22.752670288085938, -21.374483108520508, -19.996295928955078, -18.618106842041016, -17.239917755126953, -15.861730575561523, -14.483542442321777, -13.105354309082031, -11.727166175842285, -10.348978042602539, -8.970789909362793, -7.592601776123047, -6.214413642883301, -4.836225509643555, -3.4580373764038086, -2.0798492431640625, -0.7016611099243164, 0.6765270233154297, 2.054715156555176, 3.4329071044921875, 4.811095237731934, 6.18928337097168, 7.567471504211426, 8.945659637451172, 10.323847770690918, 11.702035903930664, 13.08022403717041, 14.458412170410156, 15.836600303649902, 17.21478843688965, 18.592975616455078, 19.97116470336914, 21.349353790283203, 22.727540969848633, 24.105728149414062, 25.483917236328125, 26.862106323242188, 28.240293502807617, 29.618480682373047, 30.99666976928711, 32.37485885620117, 33.75304412841797, 35.13123321533203, 36.509422302246094, 37.887611389160156, 39.26580047607422, 40.643985748291016, 42.02217483520508, 43.40036392211914, 44.77854919433594, 46.15673828125, 47.53492736816406]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 10.0, 10.0, 8.0, 17.0, 16.0, 16.0, 29.0, 21.0, 24.0, 23.0, 35.0, 31.0, 40.0, 50.0, 51.0, 42.0, 45.0, 46.0, 54.0, 43.0, 46.0, 41.0, 34.0, 35.0, 40.0, 22.0, 25.0, 23.0, 18.0, 25.0, 16.0, 12.0, 10.0, 3.0, 11.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09554672241211, -40.7083854675293, -39.321224212646484, -37.934059143066406, -36.546897888183594, -35.15973663330078, -33.77257537841797, -32.385414123535156, -30.998252868652344, -29.61109161376953, -28.223928451538086, -26.836767196655273, -25.44960594177246, -24.062442779541016, -22.675281524658203, -21.28812026977539, -19.900957107543945, -18.513795852661133, -17.126632690429688, -15.739471435546875, -14.352310180664062, -12.965147972106934, -11.577985763549805, -10.190824508666992, -8.803662300109863, -7.416500568389893, -6.029338836669922, -4.642176628112793, -3.2550148963928223, -1.8678531646728516, -0.48069095611572266, 0.9064702987670898, 2.2936325073242188, 3.6807942390441895, 5.06795597076416, 6.455118179321289, 7.84227991104126, 9.22944164276123, 10.61660385131836, 12.003765106201172, 13.3909273147583, 14.77808952331543, 16.165250778198242, 17.552413940429688, 18.9395751953125, 20.326736450195312, 21.713897705078125, 23.101058959960938, 24.488222122192383, 25.875383377075195, 27.26254653930664, 28.649707794189453, 30.036869049072266, 31.424030303955078, 32.811195373535156, 34.19835662841797, 35.58551788330078, 36.972679138183594, 38.359840393066406, 39.74700164794922, 41.1341667175293, 42.52132797241211, 43.90848922729492, 45.295650482177734, 46.68281173706055]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 10.0, 13.0, 22.0, 23.0, 48.0, 59.0, 94.0, 135.0, 196.0, 314.0, 445.0, 676.0, 1100.0, 1742.0, 2935.0, 4821.0, 8480.0, 15336.0, 28358.0, 55106.0, 117470.0, 331195.0, 1103656.0, 1549676.0, 609556.0, 192868.0, 81404.0, 40173.0, 21282.0, 11449.0, 6509.0, 3605.0, 2121.0, 1273.0, 731.0, 509.0, 317.0, 216.0, 112.0, 90.0, 46.0, 44.0, 27.0, 12.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.9375, -58.134765625, -56.33203125, -54.529296875, -52.7265625, -50.923828125, -49.12109375, -47.318359375, -45.515625, -43.712890625, -41.91015625, -40.107421875, -38.3046875, -36.501953125, -34.69921875, -32.896484375, -31.09375, -29.291015625, -27.48828125, -25.685546875, -23.8828125, -22.080078125, -20.27734375, -18.474609375, -16.671875, -14.869140625, -13.06640625, -11.263671875, -9.4609375, -7.658203125, -5.85546875, -4.052734375, -2.25, -0.447265625, 1.35546875, 3.158203125, 4.9609375, 6.763671875, 8.56640625, 10.369140625, 12.171875, 13.974609375, 15.77734375, 17.580078125, 19.3828125, 21.185546875, 22.98828125, 24.791015625, 26.59375, 28.396484375, 30.19921875, 32.001953125, 33.8046875, 35.607421875, 37.41015625, 39.212890625, 41.015625, 42.818359375, 44.62109375, 46.423828125, 48.2265625, 50.029296875, 51.83203125, 53.634765625, 55.4375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 12.0, 17.0, 15.0, 14.0, 26.0, 25.0, 25.0, 31.0, 29.0, 29.0, 39.0, 46.0, 41.0, 34.0, 35.0, 50.0, 27.0, 34.0, 39.0, 54.0, 43.0, 33.0, 31.0, 36.0, 24.0, 14.0, 28.0, 18.0, 11.0, 21.0, 12.0, 19.0, 6.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-34.53125, -33.583251953125, -32.63525390625, -31.687255859375, -30.7392578125, -29.791259765625, -28.84326171875, -27.895263671875, -26.947265625, -25.999267578125, -25.05126953125, -24.103271484375, -23.1552734375, -22.207275390625, -21.25927734375, -20.311279296875, -19.36328125, -18.415283203125, -17.46728515625, -16.519287109375, -15.5712890625, -14.623291015625, -13.67529296875, -12.727294921875, -11.779296875, -10.831298828125, -9.88330078125, -8.935302734375, -7.9873046875, -7.039306640625, -6.09130859375, -5.143310546875, -4.1953125, -3.247314453125, -2.29931640625, -1.351318359375, -0.4033203125, 0.544677734375, 1.49267578125, 2.440673828125, 3.388671875, 4.336669921875, 5.28466796875, 6.232666015625, 7.1806640625, 8.128662109375, 9.07666015625, 10.024658203125, 10.97265625, 11.920654296875, 12.86865234375, 13.816650390625, 14.7646484375, 15.712646484375, 16.66064453125, 17.608642578125, 18.556640625, 19.504638671875, 20.45263671875, 21.400634765625, 22.3486328125, 23.296630859375, 24.24462890625, 25.192626953125, 26.140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 16.0, 24.0, 39.0, 55.0, 68.0, 107.0, 175.0, 254.0, 410.0, 698.0, 1103.0, 1747.0, 2784.0, 4998.0, 8297.0, 15276.0, 28117.0, 53791.0, 110263.0, 241838.0, 597793.0, 1499201.0, 953570.0, 358724.0, 156486.0, 74229.0, 37562.0, 19931.0, 11108.0, 6221.0, 3613.0, 2092.0, 1350.0, 851.0, 535.0, 356.0, 184.0, 131.0, 82.0, 61.0, 47.0, 26.0, 22.0, 16.0, 5.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.90625, -49.13427734375, -47.3623046875, -45.59033203125, -43.818359375, -42.04638671875, -40.2744140625, -38.50244140625, -36.73046875, -34.95849609375, -33.1865234375, -31.41455078125, -29.642578125, -27.87060546875, -26.0986328125, -24.32666015625, -22.5546875, -20.78271484375, -19.0107421875, -17.23876953125, -15.466796875, -13.69482421875, -11.9228515625, -10.15087890625, -8.37890625, -6.60693359375, -4.8349609375, -3.06298828125, -1.291015625, 0.48095703125, 2.2529296875, 4.02490234375, 5.796875, 7.56884765625, 9.3408203125, 11.11279296875, 12.884765625, 14.65673828125, 16.4287109375, 18.20068359375, 19.97265625, 21.74462890625, 23.5166015625, 25.28857421875, 27.060546875, 28.83251953125, 30.6044921875, 32.37646484375, 34.1484375, 35.92041015625, 37.6923828125, 39.46435546875, 41.236328125, 43.00830078125, 44.7802734375, 46.55224609375, 48.32421875, 50.09619140625, 51.8681640625, 53.64013671875, 55.412109375, 57.18408203125, 58.9560546875, 60.72802734375, 62.5]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 18.0, 19.0, 23.0, 24.0, 36.0, 56.0, 59.0, 75.0, 78.0, 99.0, 121.0, 142.0, 207.0, 186.0, 251.0, 314.0, 347.0, 291.0, 305.0, 262.0, 210.0, 149.0, 143.0, 120.0, 89.0, 74.0, 60.0, 44.0, 42.0, 42.0, 25.0, 26.0, 28.0, 16.0, 12.0, 8.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.3671875, -13.8990478515625, -13.430908203125, -12.9627685546875, -12.49462890625, -12.0264892578125, -11.558349609375, -11.0902099609375, -10.6220703125, -10.1539306640625, -9.685791015625, -9.2176513671875, -8.74951171875, -8.2813720703125, -7.813232421875, -7.3450927734375, -6.876953125, -6.4088134765625, -5.940673828125, -5.4725341796875, -5.00439453125, -4.5362548828125, -4.068115234375, -3.5999755859375, -3.1318359375, -2.6636962890625, -2.195556640625, -1.7274169921875, -1.25927734375, -0.7911376953125, -0.322998046875, 0.1451416015625, 0.61328125, 1.0814208984375, 1.549560546875, 2.0177001953125, 2.48583984375, 2.9539794921875, 3.422119140625, 3.8902587890625, 4.3583984375, 4.8265380859375, 5.294677734375, 5.7628173828125, 6.23095703125, 6.6990966796875, 7.167236328125, 7.6353759765625, 8.103515625, 8.5716552734375, 9.039794921875, 9.5079345703125, 9.97607421875, 10.4442138671875, 10.912353515625, 11.3804931640625, 11.8486328125, 12.3167724609375, 12.784912109375, 13.2530517578125, 13.72119140625, 14.1893310546875, 14.657470703125, 15.1256103515625, 15.59375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 5.0, 5.0, 11.0, 17.0, 19.0, 24.0, 26.0, 37.0, 43.0, 56.0, 51.0, 63.0, 54.0, 63.0, 59.0, 68.0, 68.0, 52.0, 56.0, 38.0, 33.0, 25.0, 28.0, 24.0, 17.0, 14.0, 5.0, 3.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03245544433594, -38.56648254394531, -37.10050964355469, -35.63453674316406, -34.16856384277344, -32.70259094238281, -31.236618041992188, -29.770645141601562, -28.304672241210938, -26.838699340820312, -25.372726440429688, -23.906753540039062, -22.440780639648438, -20.974807739257812, -19.508834838867188, -18.042861938476562, -16.576889038085938, -15.110916137695312, -13.644943237304688, -12.178970336914062, -10.712997436523438, -9.247024536132812, -7.7810516357421875, -6.3150787353515625, -4.8491058349609375, -3.3831329345703125, -1.9171600341796875, -0.4511871337890625, 1.0147857666015625, 2.4807586669921875, 3.9467315673828125, 5.4127044677734375, 6.878681182861328, 8.344654083251953, 9.810626983642578, 11.276599884033203, 12.742572784423828, 14.208545684814453, 15.674518585205078, 17.140491485595703, 18.606464385986328, 20.072437286376953, 21.538410186767578, 23.004383087158203, 24.470355987548828, 25.936328887939453, 27.402301788330078, 28.868274688720703, 30.334247589111328, 31.800220489501953, 33.26619338989258, 34.7321662902832, 36.19813919067383, 37.66411209106445, 39.13008499145508, 40.5960578918457, 42.06203079223633, 43.52800369262695, 44.99397659301758, 46.4599494934082, 47.92592239379883, 49.39189529418945, 50.85786819458008, 52.3238410949707, 53.78981399536133]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 14.0, 5.0, 8.0, 12.0, 20.0, 23.0, 22.0, 26.0, 28.0, 21.0, 47.0, 28.0, 37.0, 42.0, 41.0, 40.0, 36.0, 40.0, 34.0, 50.0, 44.0, 35.0, 40.0, 37.0, 39.0, 32.0, 24.0, 23.0, 26.0, 20.0, 14.0, 16.0, 10.0, 15.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.90105438232422, -34.77497482299805, -33.64889907836914, -32.52281951904297, -31.396739959716797, -30.270662307739258, -29.14458465576172, -28.018505096435547, -26.892427444458008, -25.76634979248047, -24.640270233154297, -23.514192581176758, -22.38811492919922, -21.262035369873047, -20.135957717895508, -19.00988006591797, -17.883800506591797, -16.757722854614258, -15.631643295288086, -14.505565643310547, -13.379487037658691, -12.253408432006836, -11.127330780029297, -10.001252174377441, -8.875173568725586, -7.7490949630737305, -6.623016834259033, -5.496938705444336, -4.3708600997924805, -3.244781494140625, -2.1187033653259277, -0.9926252365112305, 0.13345718383789062, 1.259535551071167, 2.3856139183044434, 3.5116922855377197, 4.637770652770996, 5.763849258422852, 6.889927387237549, 8.016005516052246, 9.142084121704102, 10.268162727355957, 11.394241333007812, 12.520318984985352, 13.646397590637207, 14.772476196289062, 15.898553848266602, 17.02463150024414, 18.150711059570312, 19.27678871154785, 20.402868270874023, 21.528945922851562, 22.655025482177734, 23.781103134155273, 24.907180786132812, 26.033260345458984, 27.159337997436523, 28.285415649414062, 29.411495208740234, 30.537572860717773, 31.663650512695312, 32.789730072021484, 33.915809631347656, 35.04188537597656, 36.167964935302734]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 18.0, 20.0, 24.0, 41.0, 65.0, 76.0, 135.0, 206.0, 346.0, 556.0, 969.0, 1730.0, 3159.0, 5925.0, 11661.0, 23425.0, 51624.0, 123203.0, 305118.0, 301255.0, 120544.0, 50393.0, 23352.0, 11430.0, 5922.0, 3120.0, 1717.0, 936.0, 594.0, 345.0, 190.0, 140.0, 95.0, 55.0, 41.0, 29.0, 30.0, 20.0, 8.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-78.25, -75.55078125, -72.8515625, -70.15234375, -67.453125, -64.75390625, -62.0546875, -59.35546875, -56.65625, -53.95703125, -51.2578125, -48.55859375, -45.859375, -43.16015625, -40.4609375, -37.76171875, -35.0625, -32.36328125, -29.6640625, -26.96484375, -24.265625, -21.56640625, -18.8671875, -16.16796875, -13.46875, -10.76953125, -8.0703125, -5.37109375, -2.671875, 0.02734375, 2.7265625, 5.42578125, 8.125, 10.82421875, 13.5234375, 16.22265625, 18.921875, 21.62109375, 24.3203125, 27.01953125, 29.71875, 32.41796875, 35.1171875, 37.81640625, 40.515625, 43.21484375, 45.9140625, 48.61328125, 51.3125, 54.01171875, 56.7109375, 59.41015625, 62.109375, 64.80859375, 67.5078125, 70.20703125, 72.90625, 75.60546875, 78.3046875, 81.00390625, 83.703125, 86.40234375, 89.1015625, 91.80078125, 94.5]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 9.0, 9.0, 4.0, 14.0, 19.0, 18.0, 22.0, 35.0, 28.0, 30.0, 38.0, 36.0, 40.0, 39.0, 44.0, 48.0, 36.0, 42.0, 38.0, 37.0, 50.0, 31.0, 38.0, 49.0, 40.0, 26.0, 23.0, 25.0, 21.0, 19.0, 25.0, 13.0, 9.0, 10.0, 6.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.21875, -35.0673828125, -33.916015625, -32.7646484375, -31.61328125, -30.4619140625, -29.310546875, -28.1591796875, -27.0078125, -25.8564453125, -24.705078125, -23.5537109375, -22.40234375, -21.2509765625, -20.099609375, -18.9482421875, -17.796875, -16.6455078125, -15.494140625, -14.3427734375, -13.19140625, -12.0400390625, -10.888671875, -9.7373046875, -8.5859375, -7.4345703125, -6.283203125, -5.1318359375, -3.98046875, -2.8291015625, -1.677734375, -0.5263671875, 0.625, 1.7763671875, 2.927734375, 4.0791015625, 5.23046875, 6.3818359375, 7.533203125, 8.6845703125, 9.8359375, 10.9873046875, 12.138671875, 13.2900390625, 14.44140625, 15.5927734375, 16.744140625, 17.8955078125, 19.046875, 20.1982421875, 21.349609375, 22.5009765625, 23.65234375, 24.8037109375, 25.955078125, 27.1064453125, 28.2578125, 29.4091796875, 30.560546875, 31.7119140625, 32.86328125, 34.0146484375, 35.166015625, 36.3173828125, 37.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 6.0, 4.0, 10.0, 18.0, 34.0, 45.0, 73.0, 81.0, 133.0, 193.0, 301.0, 470.0, 672.0, 1053.0, 1615.0, 2682.0, 4449.0, 7539.0, 13317.0, 24864.0, 49374.0, 112462.0, 291515.0, 305570.0, 120250.0, 52469.0, 25785.0, 13612.0, 7847.0, 4465.0, 2741.0, 1678.0, 1092.0, 672.0, 489.0, 301.0, 217.0, 149.0, 90.0, 62.0, 42.0, 32.0, 24.0, 17.0, 14.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-77.0625, -74.5791015625, -72.095703125, -69.6123046875, -67.12890625, -64.6455078125, -62.162109375, -59.6787109375, -57.1953125, -54.7119140625, -52.228515625, -49.7451171875, -47.26171875, -44.7783203125, -42.294921875, -39.8115234375, -37.328125, -34.8447265625, -32.361328125, -29.8779296875, -27.39453125, -24.9111328125, -22.427734375, -19.9443359375, -17.4609375, -14.9775390625, -12.494140625, -10.0107421875, -7.52734375, -5.0439453125, -2.560546875, -0.0771484375, 2.40625, 4.8896484375, 7.373046875, 9.8564453125, 12.33984375, 14.8232421875, 17.306640625, 19.7900390625, 22.2734375, 24.7568359375, 27.240234375, 29.7236328125, 32.20703125, 34.6904296875, 37.173828125, 39.6572265625, 42.140625, 44.6240234375, 47.107421875, 49.5908203125, 52.07421875, 54.5576171875, 57.041015625, 59.5244140625, 62.0078125, 64.4912109375, 66.974609375, 69.4580078125, 71.94140625, 74.4248046875, 76.908203125, 79.3916015625, 81.875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 6.0, 5.0, 9.0, 11.0, 15.0, 11.0, 11.0, 13.0, 24.0, 30.0, 20.0, 36.0, 28.0, 34.0, 36.0, 49.0, 43.0, 30.0, 33.0, 54.0, 39.0, 44.0, 42.0, 36.0, 37.0, 39.0, 33.0, 31.0, 25.0, 29.0, 21.0, 23.0, 21.0, 14.0, 12.0, 7.0, 5.0, 5.0, 8.0, 3.0, 7.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.376220703125, -21.64306640625, -20.909912109375, -20.1767578125, -19.443603515625, -18.71044921875, -17.977294921875, -17.244140625, -16.510986328125, -15.77783203125, -15.044677734375, -14.3115234375, -13.578369140625, -12.84521484375, -12.112060546875, -11.37890625, -10.645751953125, -9.91259765625, -9.179443359375, -8.4462890625, -7.713134765625, -6.97998046875, -6.246826171875, -5.513671875, -4.780517578125, -4.04736328125, -3.314208984375, -2.5810546875, -1.847900390625, -1.11474609375, -0.381591796875, 0.3515625, 1.084716796875, 1.81787109375, 2.551025390625, 3.2841796875, 4.017333984375, 4.75048828125, 5.483642578125, 6.216796875, 6.949951171875, 7.68310546875, 8.416259765625, 9.1494140625, 9.882568359375, 10.61572265625, 11.348876953125, 12.08203125, 12.815185546875, 13.54833984375, 14.281494140625, 15.0146484375, 15.747802734375, 16.48095703125, 17.214111328125, 17.947265625, 18.680419921875, 19.41357421875, 20.146728515625, 20.8798828125, 21.613037109375, 22.34619140625, 23.079345703125, 23.8125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 9.0, 14.0, 25.0, 33.0, 27.0, 76.0, 95.0, 135.0, 206.0, 300.0, 502.0, 885.0, 1489.0, 2845.0, 5399.0, 11367.0, 27477.0, 75206.0, 268835.0, 446563.0, 130843.0, 42612.0, 17100.0, 7639.0, 3816.0, 2067.0, 1094.0, 690.0, 412.0, 283.0, 163.0, 103.0, 72.0, 44.0, 40.0, 32.0, 14.0, 10.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-26.375, -25.530517578125, -24.68603515625, -23.841552734375, -22.9970703125, -22.152587890625, -21.30810546875, -20.463623046875, -19.619140625, -18.774658203125, -17.93017578125, -17.085693359375, -16.2412109375, -15.396728515625, -14.55224609375, -13.707763671875, -12.86328125, -12.018798828125, -11.17431640625, -10.329833984375, -9.4853515625, -8.640869140625, -7.79638671875, -6.951904296875, -6.107421875, -5.262939453125, -4.41845703125, -3.573974609375, -2.7294921875, -1.885009765625, -1.04052734375, -0.196044921875, 0.6484375, 1.492919921875, 2.33740234375, 3.181884765625, 4.0263671875, 4.870849609375, 5.71533203125, 6.559814453125, 7.404296875, 8.248779296875, 9.09326171875, 9.937744140625, 10.7822265625, 11.626708984375, 12.47119140625, 13.315673828125, 14.16015625, 15.004638671875, 15.84912109375, 16.693603515625, 17.5380859375, 18.382568359375, 19.22705078125, 20.071533203125, 20.916015625, 21.760498046875, 22.60498046875, 23.449462890625, 24.2939453125, 25.138427734375, 25.98291015625, 26.827392578125, 27.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 11.0, 15.0, 22.0, 15.0, 46.0, 46.0, 57.0, 74.0, 90.0, 106.0, 110.0, 78.0, 76.0, 56.0, 46.0, 32.0, 21.0, 18.0, 9.0, 9.0, 9.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002593994140625, -0.0025217533111572266, -0.002449512481689453, -0.0023772716522216797, -0.0023050308227539062, -0.002232789993286133, -0.0021605491638183594, -0.002088308334350586, -0.0020160675048828125, -0.001943826675415039, -0.0018715858459472656, -0.0017993450164794922, -0.0017271041870117188, -0.0016548633575439453, -0.0015826225280761719, -0.0015103816986083984, -0.001438140869140625, -0.0013659000396728516, -0.0012936592102050781, -0.0012214183807373047, -0.0011491775512695312, -0.0010769367218017578, -0.0010046958923339844, -0.0009324550628662109, -0.0008602142333984375, -0.0007879734039306641, -0.0007157325744628906, -0.0006434917449951172, -0.0005712509155273438, -0.0004990100860595703, -0.0004267692565917969, -0.00035452842712402344, -0.00028228759765625, -0.00021004676818847656, -0.00013780593872070312, -6.556510925292969e-05, 6.67572021484375e-06, 7.891654968261719e-05, 0.00015115737915039062, 0.00022339820861816406, 0.0002956390380859375, 0.00036787986755371094, 0.0004401206970214844, 0.0005123615264892578, 0.0005846023559570312, 0.0006568431854248047, 0.0007290840148925781, 0.0008013248443603516, 0.000873565673828125, 0.0009458065032958984, 0.0010180473327636719, 0.0010902881622314453, 0.0011625289916992188, 0.0012347698211669922, 0.0013070106506347656, 0.001379251480102539, 0.0014514923095703125, 0.001523733139038086, 0.0015959739685058594, 0.0016682147979736328, 0.0017404556274414062, 0.0018126964569091797, 0.0018849372863769531, 0.0019571781158447266, 0.0020294189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 3.0, 10.0, 16.0, 15.0, 36.0, 44.0, 48.0, 94.0, 121.0, 209.0, 281.0, 469.0, 693.0, 1132.0, 1913.0, 3295.0, 6165.0, 12607.0, 26493.0, 62347.0, 157100.0, 336697.0, 254709.0, 103027.0, 42064.0, 18765.0, 8950.0, 4600.0, 2602.0, 1457.0, 867.0, 589.0, 334.0, 245.0, 189.0, 128.0, 65.0, 49.0, 35.0, 29.0, 15.0, 17.0, 12.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.15625, -25.358154296875, -24.56005859375, -23.761962890625, -22.9638671875, -22.165771484375, -21.36767578125, -20.569580078125, -19.771484375, -18.973388671875, -18.17529296875, -17.377197265625, -16.5791015625, -15.781005859375, -14.98291015625, -14.184814453125, -13.38671875, -12.588623046875, -11.79052734375, -10.992431640625, -10.1943359375, -9.396240234375, -8.59814453125, -7.800048828125, -7.001953125, -6.203857421875, -5.40576171875, -4.607666015625, -3.8095703125, -3.011474609375, -2.21337890625, -1.415283203125, -0.6171875, 0.180908203125, 0.97900390625, 1.777099609375, 2.5751953125, 3.373291015625, 4.17138671875, 4.969482421875, 5.767578125, 6.565673828125, 7.36376953125, 8.161865234375, 8.9599609375, 9.758056640625, 10.55615234375, 11.354248046875, 12.15234375, 12.950439453125, 13.74853515625, 14.546630859375, 15.3447265625, 16.142822265625, 16.94091796875, 17.739013671875, 18.537109375, 19.335205078125, 20.13330078125, 20.931396484375, 21.7294921875, 22.527587890625, 23.32568359375, 24.123779296875, 24.921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 13.0, 13.0, 18.0, 25.0, 25.0, 41.0, 46.0, 54.0, 80.0, 67.0, 74.0, 66.0, 85.0, 66.0, 58.0, 59.0, 46.0, 40.0, 26.0, 20.0, 16.0, 15.0, 11.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0093994140625, -7.745361328125, -7.4813232421875, -7.21728515625, -6.9532470703125, -6.689208984375, -6.4251708984375, -6.1611328125, -5.8970947265625, -5.633056640625, -5.3690185546875, -5.10498046875, -4.8409423828125, -4.576904296875, -4.3128662109375, -4.048828125, -3.7847900390625, -3.520751953125, -3.2567138671875, -2.99267578125, -2.7286376953125, -2.464599609375, -2.2005615234375, -1.9365234375, -1.6724853515625, -1.408447265625, -1.1444091796875, -0.88037109375, -0.6163330078125, -0.352294921875, -0.0882568359375, 0.17578125, 0.4398193359375, 0.703857421875, 0.9678955078125, 1.23193359375, 1.4959716796875, 1.760009765625, 2.0240478515625, 2.2880859375, 2.5521240234375, 2.816162109375, 3.0802001953125, 3.34423828125, 3.6082763671875, 3.872314453125, 4.1363525390625, 4.400390625, 4.6644287109375, 4.928466796875, 5.1925048828125, 5.45654296875, 5.7205810546875, 5.984619140625, 6.2486572265625, 6.5126953125, 6.7767333984375, 7.040771484375, 7.3048095703125, 7.56884765625, 7.8328857421875, 8.096923828125, 8.3609619140625, 8.625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 6.0, 7.0, 9.0, 9.0, 14.0, 20.0, 10.0, 20.0, 30.0, 42.0, 38.0, 57.0, 48.0, 57.0, 51.0, 70.0, 56.0, 71.0, 58.0, 70.0, 41.0, 37.0, 40.0, 26.0, 27.0, 13.0, 19.0, 11.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.675437927246094, -33.38908386230469, -32.102725982666016, -30.816370010375977, -29.530014038085938, -28.2436580657959, -26.95730209350586, -25.67094612121582, -24.38459014892578, -23.098234176635742, -21.811878204345703, -20.525522232055664, -19.239166259765625, -17.952810287475586, -16.666454315185547, -15.380098342895508, -14.093742370605469, -12.80738639831543, -11.52103042602539, -10.234674453735352, -8.948318481445312, -7.661962509155273, -6.375606536865234, -5.089250564575195, -3.8028945922851562, -2.516538619995117, -1.2301826477050781, 0.05617332458496094, 1.342529296875, 2.628885269165039, 3.915241241455078, 5.201597213745117, 6.487953186035156, 7.774309158325195, 9.060665130615234, 10.347021102905273, 11.633377075195312, 12.919733047485352, 14.20608901977539, 15.49244499206543, 16.77880096435547, 18.065156936645508, 19.351512908935547, 20.637868881225586, 21.924224853515625, 23.210580825805664, 24.496936798095703, 25.783292770385742, 27.06964874267578, 28.35600471496582, 29.64236068725586, 30.9287166595459, 32.21507263183594, 33.501426696777344, 34.787784576416016, 36.07414245605469, 37.360496520996094, 38.6468505859375, 39.93320846557617, 41.219566345214844, 42.50592041015625, 43.792274475097656, 45.07863235473633, 46.364990234375, 47.651344299316406]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 8.0, 10.0, 9.0, 8.0, 14.0, 17.0, 23.0, 27.0, 20.0, 26.0, 34.0, 41.0, 42.0, 26.0, 35.0, 51.0, 40.0, 32.0, 38.0, 43.0, 55.0, 35.0, 44.0, 44.0, 40.0, 28.0, 25.0, 20.0, 25.0, 28.0, 21.0, 19.0, 13.0, 15.0, 7.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.04462432861328, -32.96225357055664, -31.8798828125, -30.797510147094727, -29.715139389038086, -28.632768630981445, -27.550395965576172, -26.46802520751953, -25.38565444946289, -24.30328369140625, -23.22091293334961, -22.138540267944336, -21.056169509887695, -19.973798751831055, -18.89142608642578, -17.80905532836914, -16.7266845703125, -15.64431381225586, -14.561942100524902, -13.479570388793945, -12.397199630737305, -11.314828872680664, -10.232457160949707, -9.15008544921875, -8.06771469116211, -6.9853434562683105, -5.902972221374512, -4.820600986480713, -3.738229751586914, -2.6558585166931152, -1.5734872817993164, -0.4911160469055176, 0.5912551879882812, 1.67362642288208, 2.755997657775879, 3.8383688926696777, 4.920740127563477, 6.003111362457275, 7.085482597351074, 8.167854309082031, 9.250225067138672, 10.332595825195312, 11.41496753692627, 12.497339248657227, 13.579710006713867, 14.662080764770508, 15.744452476501465, 16.826824188232422, 17.909194946289062, 18.991565704345703, 20.073936462402344, 21.156309127807617, 22.238679885864258, 23.3210506439209, 24.403423309326172, 25.485794067382812, 26.568164825439453, 27.650535583496094, 28.732906341552734, 29.815279006958008, 30.89764976501465, 31.98002052307129, 33.06239318847656, 34.1447639465332, 35.227134704589844]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 18.0, 16.0, 33.0, 47.0, 68.0, 103.0, 146.0, 218.0, 378.0, 606.0, 909.0, 1549.0, 2423.0, 4103.0, 6944.0, 12397.0, 21484.0, 37783.0, 67915.0, 119462.0, 188676.0, 213966.0, 155537.0, 92330.0, 52299.0, 29274.0, 16477.0, 9322.0, 5585.0, 3248.0, 1948.0, 1160.0, 741.0, 491.0, 323.0, 199.0, 119.0, 84.0, 54.0, 39.0, 18.0, 16.0, 17.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-53.96875, -52.4384765625, -50.908203125, -49.3779296875, -47.84765625, -46.3173828125, -44.787109375, -43.2568359375, -41.7265625, -40.1962890625, -38.666015625, -37.1357421875, -35.60546875, -34.0751953125, -32.544921875, -31.0146484375, -29.484375, -27.9541015625, -26.423828125, -24.8935546875, -23.36328125, -21.8330078125, -20.302734375, -18.7724609375, -17.2421875, -15.7119140625, -14.181640625, -12.6513671875, -11.12109375, -9.5908203125, -8.060546875, -6.5302734375, -5.0, -3.4697265625, -1.939453125, -0.4091796875, 1.12109375, 2.6513671875, 4.181640625, 5.7119140625, 7.2421875, 8.7724609375, 10.302734375, 11.8330078125, 13.36328125, 14.8935546875, 16.423828125, 17.9541015625, 19.484375, 21.0146484375, 22.544921875, 24.0751953125, 25.60546875, 27.1357421875, 28.666015625, 30.1962890625, 31.7265625, 33.2568359375, 34.787109375, 36.3173828125, 37.84765625, 39.3779296875, 40.908203125, 42.4384765625, 43.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 5.0, 10.0, 16.0, 19.0, 27.0, 28.0, 26.0, 26.0, 38.0, 47.0, 36.0, 43.0, 33.0, 41.0, 44.0, 33.0, 51.0, 51.0, 57.0, 40.0, 55.0, 43.0, 23.0, 27.0, 27.0, 22.0, 16.0, 24.0, 13.0, 12.0, 14.0, 6.0, 4.0, 4.0, 8.0, 1.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -34.04638671875, -32.9365234375, -31.82666015625, -30.716796875, -29.60693359375, -28.4970703125, -27.38720703125, -26.27734375, -25.16748046875, -24.0576171875, -22.94775390625, -21.837890625, -20.72802734375, -19.6181640625, -18.50830078125, -17.3984375, -16.28857421875, -15.1787109375, -14.06884765625, -12.958984375, -11.84912109375, -10.7392578125, -9.62939453125, -8.51953125, -7.40966796875, -6.2998046875, -5.18994140625, -4.080078125, -2.97021484375, -1.8603515625, -0.75048828125, 0.359375, 1.46923828125, 2.5791015625, 3.68896484375, 4.798828125, 5.90869140625, 7.0185546875, 8.12841796875, 9.23828125, 10.34814453125, 11.4580078125, 12.56787109375, 13.677734375, 14.78759765625, 15.8974609375, 17.00732421875, 18.1171875, 19.22705078125, 20.3369140625, 21.44677734375, 22.556640625, 23.66650390625, 24.7763671875, 25.88623046875, 26.99609375, 28.10595703125, 29.2158203125, 30.32568359375, 31.435546875, 32.54541015625, 33.6552734375, 34.76513671875, 35.875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 17.0, 17.0, 41.0, 58.0, 76.0, 134.0, 211.0, 285.0, 484.0, 700.0, 1100.0, 1754.0, 2741.0, 4315.0, 6872.0, 10901.0, 17583.0, 28749.0, 47217.0, 78003.0, 124260.0, 179172.0, 187472.0, 135345.0, 85541.0, 52170.0, 31567.0, 19417.0, 11903.0, 7394.0, 4760.0, 2883.0, 1908.0, 1218.0, 766.0, 537.0, 323.0, 230.0, 138.0, 91.0, 72.0, 38.0, 34.0, 23.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.5, -48.00439453125, -46.5087890625, -45.01318359375, -43.517578125, -42.02197265625, -40.5263671875, -39.03076171875, -37.53515625, -36.03955078125, -34.5439453125, -33.04833984375, -31.552734375, -30.05712890625, -28.5615234375, -27.06591796875, -25.5703125, -24.07470703125, -22.5791015625, -21.08349609375, -19.587890625, -18.09228515625, -16.5966796875, -15.10107421875, -13.60546875, -12.10986328125, -10.6142578125, -9.11865234375, -7.623046875, -6.12744140625, -4.6318359375, -3.13623046875, -1.640625, -0.14501953125, 1.3505859375, 2.84619140625, 4.341796875, 5.83740234375, 7.3330078125, 8.82861328125, 10.32421875, 11.81982421875, 13.3154296875, 14.81103515625, 16.306640625, 17.80224609375, 19.2978515625, 20.79345703125, 22.2890625, 23.78466796875, 25.2802734375, 26.77587890625, 28.271484375, 29.76708984375, 31.2626953125, 32.75830078125, 34.25390625, 35.74951171875, 37.2451171875, 38.74072265625, 40.236328125, 41.73193359375, 43.2275390625, 44.72314453125, 46.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 4.0, 6.0, 14.0, 20.0, 14.0, 20.0, 16.0, 12.0, 17.0, 19.0, 27.0, 42.0, 39.0, 33.0, 45.0, 33.0, 39.0, 49.0, 49.0, 42.0, 40.0, 40.0, 31.0, 40.0, 34.0, 32.0, 34.0, 25.0, 28.0, 23.0, 22.0, 14.0, 13.0, 19.0, 10.0, 6.0, 5.0, 7.0, 4.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.671875, -19.99560546875, -19.3193359375, -18.64306640625, -17.966796875, -17.29052734375, -16.6142578125, -15.93798828125, -15.26171875, -14.58544921875, -13.9091796875, -13.23291015625, -12.556640625, -11.88037109375, -11.2041015625, -10.52783203125, -9.8515625, -9.17529296875, -8.4990234375, -7.82275390625, -7.146484375, -6.47021484375, -5.7939453125, -5.11767578125, -4.44140625, -3.76513671875, -3.0888671875, -2.41259765625, -1.736328125, -1.06005859375, -0.3837890625, 0.29248046875, 0.96875, 1.64501953125, 2.3212890625, 2.99755859375, 3.673828125, 4.35009765625, 5.0263671875, 5.70263671875, 6.37890625, 7.05517578125, 7.7314453125, 8.40771484375, 9.083984375, 9.76025390625, 10.4365234375, 11.11279296875, 11.7890625, 12.46533203125, 13.1416015625, 13.81787109375, 14.494140625, 15.17041015625, 15.8466796875, 16.52294921875, 17.19921875, 17.87548828125, 18.5517578125, 19.22802734375, 19.904296875, 20.58056640625, 21.2568359375, 21.93310546875, 22.609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 11.0, 16.0, 25.0, 46.0, 60.0, 79.0, 117.0, 177.0, 259.0, 384.0, 605.0, 897.0, 1549.0, 2340.0, 3885.0, 6554.0, 11388.0, 21592.0, 42626.0, 89888.0, 194805.0, 302208.0, 190256.0, 87595.0, 41638.0, 21436.0, 11470.0, 6386.0, 3869.0, 2300.0, 1395.0, 934.0, 590.0, 359.0, 262.0, 166.0, 108.0, 82.0, 48.0, 36.0, 21.0, 30.0, 12.0, 11.0, 3.0, 5.0, 5.0, 0.0, 4.0, 4.0, 0.0, 3.0], "bins": [-18.5, -17.947509765625, -17.39501953125, -16.842529296875, -16.2900390625, -15.737548828125, -15.18505859375, -14.632568359375, -14.080078125, -13.527587890625, -12.97509765625, -12.422607421875, -11.8701171875, -11.317626953125, -10.76513671875, -10.212646484375, -9.66015625, -9.107666015625, -8.55517578125, -8.002685546875, -7.4501953125, -6.897705078125, -6.34521484375, -5.792724609375, -5.240234375, -4.687744140625, -4.13525390625, -3.582763671875, -3.0302734375, -2.477783203125, -1.92529296875, -1.372802734375, -0.8203125, -0.267822265625, 0.28466796875, 0.837158203125, 1.3896484375, 1.942138671875, 2.49462890625, 3.047119140625, 3.599609375, 4.152099609375, 4.70458984375, 5.257080078125, 5.8095703125, 6.362060546875, 6.91455078125, 7.467041015625, 8.01953125, 8.572021484375, 9.12451171875, 9.677001953125, 10.2294921875, 10.781982421875, 11.33447265625, 11.886962890625, 12.439453125, 12.991943359375, 13.54443359375, 14.096923828125, 14.6494140625, 15.201904296875, 15.75439453125, 16.306884765625, 16.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 8.0, 9.0, 15.0, 17.0, 23.0, 47.0, 56.0, 77.0, 99.0, 146.0, 132.0, 97.0, 68.0, 45.0, 29.0, 32.0, 25.0, 14.0, 12.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020694732666015625, -0.00199282169342041, -0.0019161701202392578, -0.0018395185470581055, -0.0017628669738769531, -0.0016862154006958008, -0.0016095638275146484, -0.001532912254333496, -0.0014562606811523438, -0.0013796091079711914, -0.001302957534790039, -0.0012263059616088867, -0.0011496543884277344, -0.001073002815246582, -0.0009963512420654297, -0.0009196996688842773, -0.000843048095703125, -0.0007663965225219727, -0.0006897449493408203, -0.000613093376159668, -0.0005364418029785156, -0.0004597902297973633, -0.00038313865661621094, -0.0003064870834350586, -0.00022983551025390625, -0.0001531839370727539, -7.653236389160156e-05, 1.1920928955078125e-07, 7.677078247070312e-05, 0.00015342235565185547, 0.0002300739288330078, 0.00030672550201416016, 0.0003833770751953125, 0.00046002864837646484, 0.0005366802215576172, 0.0006133317947387695, 0.0006899833679199219, 0.0007666349411010742, 0.0008432865142822266, 0.0009199380874633789, 0.0009965896606445312, 0.0010732412338256836, 0.001149892807006836, 0.0012265443801879883, 0.0013031959533691406, 0.001379847526550293, 0.0014564990997314453, 0.0015331506729125977, 0.00160980224609375, 0.0016864538192749023, 0.0017631053924560547, 0.001839756965637207, 0.0019164085388183594, 0.0019930601119995117, 0.002069711685180664, 0.0021463632583618164, 0.0022230148315429688, 0.002299666404724121, 0.0023763179779052734, 0.0024529695510864258, 0.002529621124267578, 0.0026062726974487305, 0.002682924270629883, 0.002759575843811035, 0.0028362274169921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 7.0, 15.0, 23.0, 31.0, 42.0, 57.0, 88.0, 153.0, 199.0, 312.0, 559.0, 869.0, 1626.0, 2810.0, 5282.0, 9870.0, 20253.0, 43133.0, 96989.0, 217999.0, 318493.0, 179618.0, 79028.0, 35383.0, 16846.0, 8518.0, 4454.0, 2445.0, 1321.0, 796.0, 490.0, 283.0, 174.0, 119.0, 82.0, 51.0, 24.0, 29.0, 23.0, 14.0, 11.0, 12.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.421875, -17.834716796875, -17.24755859375, -16.660400390625, -16.0732421875, -15.486083984375, -14.89892578125, -14.311767578125, -13.724609375, -13.137451171875, -12.55029296875, -11.963134765625, -11.3759765625, -10.788818359375, -10.20166015625, -9.614501953125, -9.02734375, -8.440185546875, -7.85302734375, -7.265869140625, -6.6787109375, -6.091552734375, -5.50439453125, -4.917236328125, -4.330078125, -3.742919921875, -3.15576171875, -2.568603515625, -1.9814453125, -1.394287109375, -0.80712890625, -0.219970703125, 0.3671875, 0.954345703125, 1.54150390625, 2.128662109375, 2.7158203125, 3.302978515625, 3.89013671875, 4.477294921875, 5.064453125, 5.651611328125, 6.23876953125, 6.825927734375, 7.4130859375, 8.000244140625, 8.58740234375, 9.174560546875, 9.76171875, 10.348876953125, 10.93603515625, 11.523193359375, 12.1103515625, 12.697509765625, 13.28466796875, 13.871826171875, 14.458984375, 15.046142578125, 15.63330078125, 16.220458984375, 16.8076171875, 17.394775390625, 17.98193359375, 18.569091796875, 19.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 8.0, 10.0, 9.0, 21.0, 18.0, 27.0, 22.0, 48.0, 32.0, 36.0, 33.0, 43.0, 56.0, 66.0, 66.0, 76.0, 72.0, 43.0, 50.0, 35.0, 31.0, 29.0, 23.0, 23.0, 15.0, 17.0, 11.0, 16.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.6851806640625, -4.550048828125, -4.4149169921875, -4.27978515625, -4.1446533203125, -4.009521484375, -3.8743896484375, -3.7392578125, -3.6041259765625, -3.468994140625, -3.3338623046875, -3.19873046875, -3.0635986328125, -2.928466796875, -2.7933349609375, -2.658203125, -2.5230712890625, -2.387939453125, -2.2528076171875, -2.11767578125, -1.9825439453125, -1.847412109375, -1.7122802734375, -1.5771484375, -1.4420166015625, -1.306884765625, -1.1717529296875, -1.03662109375, -0.9014892578125, -0.766357421875, -0.6312255859375, -0.49609375, -0.3609619140625, -0.225830078125, -0.0906982421875, 0.04443359375, 0.1795654296875, 0.314697265625, 0.4498291015625, 0.5849609375, 0.7200927734375, 0.855224609375, 0.9903564453125, 1.12548828125, 1.2606201171875, 1.395751953125, 1.5308837890625, 1.666015625, 1.8011474609375, 1.936279296875, 2.0714111328125, 2.20654296875, 2.3416748046875, 2.476806640625, 2.6119384765625, 2.7470703125, 2.8822021484375, 3.017333984375, 3.1524658203125, 3.28759765625, 3.4227294921875, 3.557861328125, 3.6929931640625, 3.828125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 7.0, 15.0, 17.0, 21.0, 18.0, 25.0, 22.0, 46.0, 51.0, 50.0, 70.0, 55.0, 73.0, 67.0, 78.0, 55.0, 55.0, 45.0, 41.0, 35.0, 27.0, 29.0, 24.0, 10.0, 16.0, 10.0, 7.0, 6.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.27734375, -35.90780258178711, -34.53826141357422, -33.16872024536133, -31.799179077148438, -30.429637908935547, -29.060096740722656, -27.690555572509766, -26.321014404296875, -24.951473236083984, -23.581932067871094, -22.212390899658203, -20.842849731445312, -19.473308563232422, -18.10376739501953, -16.73422622680664, -15.36468505859375, -13.99514389038086, -12.625602722167969, -11.256061553955078, -9.886520385742188, -8.516979217529297, -7.147438049316406, -5.777896881103516, -4.408355712890625, -3.0388145446777344, -1.6692733764648438, -0.2997322082519531, 1.0698089599609375, 2.439350128173828, 3.8088912963867188, 5.178432464599609, 6.547977447509766, 7.917518615722656, 9.287059783935547, 10.656600952148438, 12.026142120361328, 13.395683288574219, 14.76522445678711, 16.134765625, 17.50430679321289, 18.87384796142578, 20.243389129638672, 21.612930297851562, 22.982471466064453, 24.352012634277344, 25.721553802490234, 27.091094970703125, 28.460636138916016, 29.830177307128906, 31.199718475341797, 32.56925964355469, 33.93880081176758, 35.30834197998047, 36.67788314819336, 38.04742431640625, 39.41696548461914, 40.78650665283203, 42.15604782104492, 43.52558898925781, 44.8951301574707, 46.264671325683594, 47.634212493896484, 49.003753662109375, 50.373294830322266]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 2.0, 4.0, 6.0, 10.0, 12.0, 10.0, 9.0, 18.0, 19.0, 27.0, 33.0, 23.0, 26.0, 27.0, 34.0, 36.0, 32.0, 46.0, 47.0, 40.0, 29.0, 44.0, 40.0, 43.0, 45.0, 28.0, 32.0, 41.0, 38.0, 25.0, 27.0, 24.0, 13.0, 26.0, 18.0, 12.0, 9.0, 6.0, 7.0, 8.0, 5.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-37.34229278564453, -36.2725944519043, -35.20289611816406, -34.13319778442383, -33.063499450683594, -31.993799209594727, -30.924100875854492, -29.854402542114258, -28.78470230102539, -27.715003967285156, -26.645305633544922, -25.575607299804688, -24.50590705871582, -23.436208724975586, -22.36651039123535, -21.296812057495117, -20.227113723754883, -19.15741539001465, -18.087717056274414, -17.018016815185547, -15.948318481445312, -14.878620147705078, -13.808921813964844, -12.73922348022461, -11.669524192810059, -10.599825859069824, -9.530126571655273, -8.460428237915039, -7.3907294273376465, -6.321030616760254, -5.2513322830200195, -4.181633472442627, -3.1119327545166016, -2.042233943939209, -0.9725353717803955, 0.09716320037841797, 1.1668620109558105, 2.236560821533203, 3.3062591552734375, 4.37595796585083, 5.445656776428223, 6.515355587005615, 7.585054397583008, 8.654752731323242, 9.724451065063477, 10.794150352478027, 11.863848686218262, 12.933547973632812, 14.003246307373047, 15.072944641113281, 16.142642974853516, 17.21234130859375, 18.282041549682617, 19.35173988342285, 20.421438217163086, 21.49113655090332, 22.560836791992188, 23.630535125732422, 24.700233459472656, 25.76993179321289, 26.839632034301758, 27.909330368041992, 28.979028701782227, 30.04872703552246, 31.118425369262695]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 15.0, 25.0, 30.0, 40.0, 73.0, 131.0, 176.0, 270.0, 404.0, 613.0, 960.0, 1434.0, 2209.0, 3379.0, 5078.0, 7926.0, 12431.0, 20153.0, 33511.0, 59514.0, 119271.0, 311421.0, 838834.0, 1337144.0, 858503.0, 316341.0, 119757.0, 58782.0, 32842.0, 19275.0, 11914.0, 7573.0, 4867.0, 3185.0, 2064.0, 1387.0, 890.0, 565.0, 411.0, 273.0, 200.0, 143.0, 70.0, 57.0, 44.0, 20.0, 19.0, 10.0, 14.0, 11.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-37.8125, -36.57275390625, -35.3330078125, -34.09326171875, -32.853515625, -31.61376953125, -30.3740234375, -29.13427734375, -27.89453125, -26.65478515625, -25.4150390625, -24.17529296875, -22.935546875, -21.69580078125, -20.4560546875, -19.21630859375, -17.9765625, -16.73681640625, -15.4970703125, -14.25732421875, -13.017578125, -11.77783203125, -10.5380859375, -9.29833984375, -8.05859375, -6.81884765625, -5.5791015625, -4.33935546875, -3.099609375, -1.85986328125, -0.6201171875, 0.61962890625, 1.859375, 3.09912109375, 4.3388671875, 5.57861328125, 6.818359375, 8.05810546875, 9.2978515625, 10.53759765625, 11.77734375, 13.01708984375, 14.2568359375, 15.49658203125, 16.736328125, 17.97607421875, 19.2158203125, 20.45556640625, 21.6953125, 22.93505859375, 24.1748046875, 25.41455078125, 26.654296875, 27.89404296875, 29.1337890625, 30.37353515625, 31.61328125, 32.85302734375, 34.0927734375, 35.33251953125, 36.572265625, 37.81201171875, 39.0517578125, 40.29150390625, 41.53125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 18.0, 15.0, 18.0, 11.0, 24.0, 24.0, 27.0, 33.0, 31.0, 41.0, 33.0, 31.0, 51.0, 41.0, 39.0, 38.0, 40.0, 50.0, 37.0, 33.0, 30.0, 41.0, 31.0, 38.0, 30.0, 29.0, 18.0, 18.0, 17.0, 15.0, 14.0, 12.0, 10.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.47021484375, -26.5810546875, -25.69189453125, -24.802734375, -23.91357421875, -23.0244140625, -22.13525390625, -21.24609375, -20.35693359375, -19.4677734375, -18.57861328125, -17.689453125, -16.80029296875, -15.9111328125, -15.02197265625, -14.1328125, -13.24365234375, -12.3544921875, -11.46533203125, -10.576171875, -9.68701171875, -8.7978515625, -7.90869140625, -7.01953125, -6.13037109375, -5.2412109375, -4.35205078125, -3.462890625, -2.57373046875, -1.6845703125, -0.79541015625, 0.09375, 0.98291015625, 1.8720703125, 2.76123046875, 3.650390625, 4.53955078125, 5.4287109375, 6.31787109375, 7.20703125, 8.09619140625, 8.9853515625, 9.87451171875, 10.763671875, 11.65283203125, 12.5419921875, 13.43115234375, 14.3203125, 15.20947265625, 16.0986328125, 16.98779296875, 17.876953125, 18.76611328125, 19.6552734375, 20.54443359375, 21.43359375, 22.32275390625, 23.2119140625, 24.10107421875, 24.990234375, 25.87939453125, 26.7685546875, 27.65771484375, 28.546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 30.0, 29.0, 43.0, 65.0, 84.0, 174.0, 242.0, 407.0, 668.0, 1123.0, 1861.0, 3152.0, 5618.0, 9926.0, 17822.0, 33271.0, 65933.0, 138641.0, 323027.0, 909416.0, 1632692.0, 601930.0, 232897.0, 104413.0, 50886.0, 26461.0, 14313.0, 7961.0, 4514.0, 2674.0, 1498.0, 940.0, 571.0, 333.0, 238.0, 142.0, 87.0, 55.0, 32.0, 24.0, 20.0, 8.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-53.8125, -52.197265625, -50.58203125, -48.966796875, -47.3515625, -45.736328125, -44.12109375, -42.505859375, -40.890625, -39.275390625, -37.66015625, -36.044921875, -34.4296875, -32.814453125, -31.19921875, -29.583984375, -27.96875, -26.353515625, -24.73828125, -23.123046875, -21.5078125, -19.892578125, -18.27734375, -16.662109375, -15.046875, -13.431640625, -11.81640625, -10.201171875, -8.5859375, -6.970703125, -5.35546875, -3.740234375, -2.125, -0.509765625, 1.10546875, 2.720703125, 4.3359375, 5.951171875, 7.56640625, 9.181640625, 10.796875, 12.412109375, 14.02734375, 15.642578125, 17.2578125, 18.873046875, 20.48828125, 22.103515625, 23.71875, 25.333984375, 26.94921875, 28.564453125, 30.1796875, 31.794921875, 33.41015625, 35.025390625, 36.640625, 38.255859375, 39.87109375, 41.486328125, 43.1015625, 44.716796875, 46.33203125, 47.947265625, 49.5625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 12.0, 20.0, 30.0, 26.0, 39.0, 52.0, 78.0, 87.0, 139.0, 186.0, 265.0, 282.0, 361.0, 485.0, 442.0, 386.0, 290.0, 208.0, 168.0, 105.0, 93.0, 82.0, 40.0, 36.0, 33.0, 34.0, 23.0, 17.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.75, -20.171875, -19.59375, -19.015625, -18.4375, -17.859375, -17.28125, -16.703125, -16.125, -15.546875, -14.96875, -14.390625, -13.8125, -13.234375, -12.65625, -12.078125, -11.5, -10.921875, -10.34375, -9.765625, -9.1875, -8.609375, -8.03125, -7.453125, -6.875, -6.296875, -5.71875, -5.140625, -4.5625, -3.984375, -3.40625, -2.828125, -2.25, -1.671875, -1.09375, -0.515625, 0.0625, 0.640625, 1.21875, 1.796875, 2.375, 2.953125, 3.53125, 4.109375, 4.6875, 5.265625, 5.84375, 6.421875, 7.0, 7.578125, 8.15625, 8.734375, 9.3125, 9.890625, 10.46875, 11.046875, 11.625, 12.203125, 12.78125, 13.359375, 13.9375, 14.515625, 15.09375, 15.671875, 16.25]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 22.0, 13.0, 22.0, 19.0, 33.0, 44.0, 56.0, 49.0, 54.0, 68.0, 65.0, 66.0, 77.0, 54.0, 48.0, 45.0, 45.0, 32.0, 37.0, 19.0, 20.0, 13.0, 7.0, 14.0, 5.0, 8.0, 3.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.2828483581543, -34.0324592590332, -32.78207015991211, -31.53168296813965, -30.281293869018555, -29.03090476989746, -27.780517578125, -26.530128479003906, -25.279739379882812, -24.02935028076172, -22.778961181640625, -21.528573989868164, -20.27818489074707, -19.027795791625977, -17.777408599853516, -16.527019500732422, -15.276630401611328, -14.026241302490234, -12.775853157043457, -11.52546501159668, -10.275075912475586, -9.024686813354492, -7.774298667907715, -6.5239105224609375, -5.273521423339844, -4.023132801055908, -2.7727441787719727, -1.522355556488037, -0.27196693420410156, 0.978421688079834, 2.2288103103637695, 3.479198455810547, 4.729587554931641, 5.979976177215576, 7.230364799499512, 8.480752944946289, 9.731142044067383, 10.981531143188477, 12.231919288635254, 13.482307434082031, 14.732696533203125, 15.983085632324219, 17.233474731445312, 18.483861923217773, 19.734251022338867, 20.98464012145996, 22.235027313232422, 23.485416412353516, 24.73580551147461, 25.986194610595703, 27.236583709716797, 28.486970901489258, 29.73736000061035, 30.987749099731445, 32.238136291503906, 33.488525390625, 34.738914489746094, 35.98930358886719, 37.23969268798828, 38.490081787109375, 39.74047088623047, 40.9908561706543, 42.24124526977539, 43.491634368896484, 44.74202346801758]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 4.0, 4.0, 9.0, 11.0, 18.0, 15.0, 21.0, 21.0, 16.0, 26.0, 22.0, 25.0, 27.0, 29.0, 33.0, 32.0, 35.0, 37.0, 36.0, 43.0, 41.0, 42.0, 27.0, 32.0, 39.0, 48.0, 28.0, 24.0, 42.0, 31.0, 19.0, 17.0, 24.0, 19.0, 15.0, 19.0, 10.0, 10.0, 3.0, 9.0, 10.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.321773529052734, -30.385770797729492, -29.44976806640625, -28.513765335083008, -27.577762603759766, -26.641759872436523, -25.70575714111328, -24.76975440979004, -23.833751678466797, -22.897748947143555, -21.961746215820312, -21.02574348449707, -20.089740753173828, -19.153738021850586, -18.217735290527344, -17.2817325592041, -16.34572982788086, -15.409727096557617, -14.473724365234375, -13.537721633911133, -12.60171890258789, -11.665716171264648, -10.729713439941406, -9.793710708618164, -8.857709884643555, -7.9217071533203125, -6.98570442199707, -6.049701690673828, -5.113698959350586, -4.177696704864502, -3.2416939735412598, -2.3056912422180176, -1.3696880340576172, -0.4336853623390198, 0.5023173093795776, 1.4383199214935303, 2.3743226528167725, 3.3103251457214355, 4.246327877044678, 5.18233060836792, 6.118333339691162, 7.054336071014404, 7.9903388023376465, 8.92634105682373, 9.862343788146973, 10.798346519470215, 11.734349250793457, 12.6703519821167, 13.606354713439941, 14.542357444763184, 15.478360176086426, 16.41436195373535, 17.350364685058594, 18.286367416381836, 19.222370147705078, 20.15837287902832, 21.094375610351562, 22.030378341674805, 22.966381072998047, 23.90238380432129, 24.83838653564453, 25.774389266967773, 26.710391998291016, 27.646394729614258, 28.5823974609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 10.0, 18.0, 18.0, 23.0, 59.0, 69.0, 131.0, 246.0, 431.0, 773.0, 1331.0, 2332.0, 4549.0, 8796.0, 18500.0, 43790.0, 125115.0, 399205.0, 291256.0, 88913.0, 33156.0, 14435.0, 7031.0, 3709.0, 2040.0, 1072.0, 673.0, 362.0, 191.0, 117.0, 63.0, 42.0, 28.0, 16.0, 13.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.625, -80.25390625, -77.8828125, -75.51171875, -73.140625, -70.76953125, -68.3984375, -66.02734375, -63.65625, -61.28515625, -58.9140625, -56.54296875, -54.171875, -51.80078125, -49.4296875, -47.05859375, -44.6875, -42.31640625, -39.9453125, -37.57421875, -35.203125, -32.83203125, -30.4609375, -28.08984375, -25.71875, -23.34765625, -20.9765625, -18.60546875, -16.234375, -13.86328125, -11.4921875, -9.12109375, -6.75, -4.37890625, -2.0078125, 0.36328125, 2.734375, 5.10546875, 7.4765625, 9.84765625, 12.21875, 14.58984375, 16.9609375, 19.33203125, 21.703125, 24.07421875, 26.4453125, 28.81640625, 31.1875, 33.55859375, 35.9296875, 38.30078125, 40.671875, 43.04296875, 45.4140625, 47.78515625, 50.15625, 52.52734375, 54.8984375, 57.26953125, 59.640625, 62.01171875, 64.3828125, 66.75390625, 69.125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 21.0, 12.0, 17.0, 22.0, 14.0, 16.0, 20.0, 20.0, 28.0, 31.0, 39.0, 29.0, 43.0, 41.0, 41.0, 35.0, 37.0, 41.0, 49.0, 30.0, 25.0, 46.0, 36.0, 31.0, 39.0, 34.0, 23.0, 18.0, 12.0, 18.0, 25.0, 11.0, 13.0, 11.0, 11.0, 2.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-31.828125, -30.891845703125, -29.95556640625, -29.019287109375, -28.0830078125, -27.146728515625, -26.21044921875, -25.274169921875, -24.337890625, -23.401611328125, -22.46533203125, -21.529052734375, -20.5927734375, -19.656494140625, -18.72021484375, -17.783935546875, -16.84765625, -15.911376953125, -14.97509765625, -14.038818359375, -13.1025390625, -12.166259765625, -11.22998046875, -10.293701171875, -9.357421875, -8.421142578125, -7.48486328125, -6.548583984375, -5.6123046875, -4.676025390625, -3.73974609375, -2.803466796875, -1.8671875, -0.930908203125, 0.00537109375, 0.941650390625, 1.8779296875, 2.814208984375, 3.75048828125, 4.686767578125, 5.623046875, 6.559326171875, 7.49560546875, 8.431884765625, 9.3681640625, 10.304443359375, 11.24072265625, 12.177001953125, 13.11328125, 14.049560546875, 14.98583984375, 15.922119140625, 16.8583984375, 17.794677734375, 18.73095703125, 19.667236328125, 20.603515625, 21.539794921875, 22.47607421875, 23.412353515625, 24.3486328125, 25.284912109375, 26.22119140625, 27.157470703125, 28.09375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 7.0, 18.0, 25.0, 33.0, 66.0, 93.0, 105.0, 153.0, 232.0, 335.0, 444.0, 695.0, 963.0, 1489.0, 2329.0, 3883.0, 6533.0, 11740.0, 21125.0, 42824.0, 94243.0, 252209.0, 353056.0, 134892.0, 57377.0, 27909.0, 14417.0, 8135.0, 4753.0, 2976.0, 1858.0, 1141.0, 770.0, 495.0, 367.0, 271.0, 165.0, 107.0, 93.0, 51.0, 45.0, 28.0, 24.0, 25.0, 9.0, 9.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-57.90625, -56.0498046875, -54.193359375, -52.3369140625, -50.48046875, -48.6240234375, -46.767578125, -44.9111328125, -43.0546875, -41.1982421875, -39.341796875, -37.4853515625, -35.62890625, -33.7724609375, -31.916015625, -30.0595703125, -28.203125, -26.3466796875, -24.490234375, -22.6337890625, -20.77734375, -18.9208984375, -17.064453125, -15.2080078125, -13.3515625, -11.4951171875, -9.638671875, -7.7822265625, -5.92578125, -4.0693359375, -2.212890625, -0.3564453125, 1.5, 3.3564453125, 5.212890625, 7.0693359375, 8.92578125, 10.7822265625, 12.638671875, 14.4951171875, 16.3515625, 18.2080078125, 20.064453125, 21.9208984375, 23.77734375, 25.6337890625, 27.490234375, 29.3466796875, 31.203125, 33.0595703125, 34.916015625, 36.7724609375, 38.62890625, 40.4853515625, 42.341796875, 44.1982421875, 46.0546875, 47.9111328125, 49.767578125, 51.6240234375, 53.48046875, 55.3369140625, 57.193359375, 59.0498046875, 60.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 4.0, 12.0, 10.0, 12.0, 10.0, 14.0, 14.0, 27.0, 35.0, 27.0, 27.0, 25.0, 33.0, 34.0, 36.0, 35.0, 39.0, 45.0, 46.0, 43.0, 39.0, 39.0, 42.0, 38.0, 39.0, 35.0, 27.0, 29.0, 20.0, 36.0, 22.0, 20.0, 15.0, 11.0, 10.0, 10.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.5, -19.8662109375, -19.232421875, -18.5986328125, -17.96484375, -17.3310546875, -16.697265625, -16.0634765625, -15.4296875, -14.7958984375, -14.162109375, -13.5283203125, -12.89453125, -12.2607421875, -11.626953125, -10.9931640625, -10.359375, -9.7255859375, -9.091796875, -8.4580078125, -7.82421875, -7.1904296875, -6.556640625, -5.9228515625, -5.2890625, -4.6552734375, -4.021484375, -3.3876953125, -2.75390625, -2.1201171875, -1.486328125, -0.8525390625, -0.21875, 0.4150390625, 1.048828125, 1.6826171875, 2.31640625, 2.9501953125, 3.583984375, 4.2177734375, 4.8515625, 5.4853515625, 6.119140625, 6.7529296875, 7.38671875, 8.0205078125, 8.654296875, 9.2880859375, 9.921875, 10.5556640625, 11.189453125, 11.8232421875, 12.45703125, 13.0908203125, 13.724609375, 14.3583984375, 14.9921875, 15.6259765625, 16.259765625, 16.8935546875, 17.52734375, 18.1611328125, 18.794921875, 19.4287109375, 20.0625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 11.0, 21.0, 16.0, 30.0, 40.0, 68.0, 56.0, 100.0, 138.0, 202.0, 278.0, 390.0, 620.0, 882.0, 1305.0, 2034.0, 3204.0, 5279.0, 9869.0, 21683.0, 67695.0, 369025.0, 437182.0, 78303.0, 24045.0, 10669.0, 5643.0, 3262.0, 2040.0, 1345.0, 913.0, 611.0, 424.0, 308.0, 233.0, 182.0, 131.0, 82.0, 74.0, 42.0, 27.0, 20.0, 13.0, 14.0, 12.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.8125, -25.948974609375, -25.08544921875, -24.221923828125, -23.3583984375, -22.494873046875, -21.63134765625, -20.767822265625, -19.904296875, -19.040771484375, -18.17724609375, -17.313720703125, -16.4501953125, -15.586669921875, -14.72314453125, -13.859619140625, -12.99609375, -12.132568359375, -11.26904296875, -10.405517578125, -9.5419921875, -8.678466796875, -7.81494140625, -6.951416015625, -6.087890625, -5.224365234375, -4.36083984375, -3.497314453125, -2.6337890625, -1.770263671875, -0.90673828125, -0.043212890625, 0.8203125, 1.683837890625, 2.54736328125, 3.410888671875, 4.2744140625, 5.137939453125, 6.00146484375, 6.864990234375, 7.728515625, 8.592041015625, 9.45556640625, 10.319091796875, 11.1826171875, 12.046142578125, 12.90966796875, 13.773193359375, 14.63671875, 15.500244140625, 16.36376953125, 17.227294921875, 18.0908203125, 18.954345703125, 19.81787109375, 20.681396484375, 21.544921875, 22.408447265625, 23.27197265625, 24.135498046875, 24.9990234375, 25.862548828125, 26.72607421875, 27.589599609375, 28.453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 4.0, 8.0, 9.0, 22.0, 45.0, 80.0, 138.0, 200.0, 193.0, 116.0, 68.0, 43.0, 28.0, 11.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003154754638671875, -0.0030614733695983887, -0.0029681921005249023, -0.002874910831451416, -0.0027816295623779297, -0.0026883482933044434, -0.002595067024230957, -0.0025017857551574707, -0.0024085044860839844, -0.002315223217010498, -0.0022219419479370117, -0.0021286606788635254, -0.002035379409790039, -0.0019420981407165527, -0.0018488168716430664, -0.00175553560256958, -0.0016622543334960938, -0.0015689730644226074, -0.001475691795349121, -0.0013824105262756348, -0.0012891292572021484, -0.0011958479881286621, -0.0011025667190551758, -0.0010092854499816895, -0.0009160041809082031, -0.0008227229118347168, -0.0007294416427612305, -0.0006361603736877441, -0.0005428791046142578, -0.0004495978355407715, -0.00035631656646728516, -0.00026303529739379883, -0.0001697540283203125, -7.647275924682617e-05, 1.6808509826660156e-05, 0.00011008977890014648, 0.0002033710479736328, 0.00029665231704711914, 0.00038993358612060547, 0.0004832148551940918, 0.0005764961242675781, 0.0006697773933410645, 0.0007630586624145508, 0.0008563399314880371, 0.0009496212005615234, 0.0010429024696350098, 0.001136183738708496, 0.0012294650077819824, 0.0013227462768554688, 0.001416027545928955, 0.0015093088150024414, 0.0016025900840759277, 0.001695871353149414, 0.0017891526222229004, 0.0018824338912963867, 0.001975715160369873, 0.0020689964294433594, 0.0021622776985168457, 0.002255558967590332, 0.0023488402366638184, 0.0024421215057373047, 0.002535402774810791, 0.0026286840438842773, 0.0027219653129577637, 0.00281524658203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 11.0, 25.0, 34.0, 37.0, 61.0, 115.0, 145.0, 222.0, 362.0, 554.0, 903.0, 1332.0, 2044.0, 3206.0, 5177.0, 8702.0, 17189.0, 41884.0, 147818.0, 495454.0, 219652.0, 56002.0, 21168.0, 10435.0, 5876.0, 3680.0, 2288.0, 1525.0, 924.0, 600.0, 401.0, 242.0, 191.0, 110.0, 49.0, 46.0, 25.0, 27.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-32.90625, -31.9560546875, -31.005859375, -30.0556640625, -29.10546875, -28.1552734375, -27.205078125, -26.2548828125, -25.3046875, -24.3544921875, -23.404296875, -22.4541015625, -21.50390625, -20.5537109375, -19.603515625, -18.6533203125, -17.703125, -16.7529296875, -15.802734375, -14.8525390625, -13.90234375, -12.9521484375, -12.001953125, -11.0517578125, -10.1015625, -9.1513671875, -8.201171875, -7.2509765625, -6.30078125, -5.3505859375, -4.400390625, -3.4501953125, -2.5, -1.5498046875, -0.599609375, 0.3505859375, 1.30078125, 2.2509765625, 3.201171875, 4.1513671875, 5.1015625, 6.0517578125, 7.001953125, 7.9521484375, 8.90234375, 9.8525390625, 10.802734375, 11.7529296875, 12.703125, 13.6533203125, 14.603515625, 15.5537109375, 16.50390625, 17.4541015625, 18.404296875, 19.3544921875, 20.3046875, 21.2548828125, 22.205078125, 23.1552734375, 24.10546875, 25.0556640625, 26.005859375, 26.9560546875, 27.90625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 7.0, 10.0, 13.0, 23.0, 30.0, 41.0, 55.0, 89.0, 108.0, 109.0, 96.0, 91.0, 67.0, 57.0, 38.0, 26.0, 17.0, 17.0, 8.0, 11.0, 11.0, 3.0, 8.0, 3.0, 6.0, 4.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-8.8984375, -8.649658203125, -8.40087890625, -8.152099609375, -7.9033203125, -7.654541015625, -7.40576171875, -7.156982421875, -6.908203125, -6.659423828125, -6.41064453125, -6.161865234375, -5.9130859375, -5.664306640625, -5.41552734375, -5.166748046875, -4.91796875, -4.669189453125, -4.42041015625, -4.171630859375, -3.9228515625, -3.674072265625, -3.42529296875, -3.176513671875, -2.927734375, -2.678955078125, -2.43017578125, -2.181396484375, -1.9326171875, -1.683837890625, -1.43505859375, -1.186279296875, -0.9375, -0.688720703125, -0.43994140625, -0.191162109375, 0.0576171875, 0.306396484375, 0.55517578125, 0.803955078125, 1.052734375, 1.301513671875, 1.55029296875, 1.799072265625, 2.0478515625, 2.296630859375, 2.54541015625, 2.794189453125, 3.04296875, 3.291748046875, 3.54052734375, 3.789306640625, 4.0380859375, 4.286865234375, 4.53564453125, 4.784423828125, 5.033203125, 5.281982421875, 5.53076171875, 5.779541015625, 6.0283203125, 6.277099609375, 6.52587890625, 6.774658203125, 7.0234375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 10.0, 15.0, 11.0, 10.0, 20.0, 19.0, 24.0, 34.0, 38.0, 44.0, 58.0, 62.0, 66.0, 58.0, 65.0, 64.0, 58.0, 57.0, 53.0, 39.0, 35.0, 26.0, 25.0, 17.0, 9.0, 14.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.382720947265625, -27.211339950561523, -26.03995704650879, -24.868576049804688, -23.697195053100586, -22.525814056396484, -21.35443115234375, -20.18305015563965, -19.011669158935547, -17.840288162231445, -16.66890525817871, -15.49752426147461, -14.326143264770508, -13.15476131439209, -11.983379364013672, -10.81199836730957, -9.640615463256836, -8.469233512878418, -7.297852516174316, -6.126470565795898, -4.955089092254639, -3.783707618713379, -2.612325668334961, -1.4409446716308594, -0.2695627212524414, 0.9018188714981079, 2.0732004642486572, 3.244582176208496, 4.415963649749756, 5.587345123291016, 6.758727073669434, 7.930108070373535, 9.101490020751953, 10.272871971130371, 11.444252967834473, 12.61563491821289, 13.787015914916992, 14.95839786529541, 16.129779815673828, 17.30116081237793, 18.47254180908203, 19.643922805786133, 20.815305709838867, 21.98668670654297, 23.15806770324707, 24.329448699951172, 25.500831604003906, 26.672212600708008, 27.843595504760742, 29.014976501464844, 30.186359405517578, 31.35774040222168, 32.52912139892578, 33.700504302978516, 34.87188720703125, 36.04326629638672, 37.21464920043945, 38.38603210449219, 39.557411193847656, 40.72879409790039, 41.900177001953125, 43.071556091308594, 44.24293899536133, 45.41432189941406, 46.58570098876953]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 3.0, 8.0, 8.0, 11.0, 12.0, 16.0, 17.0, 13.0, 21.0, 13.0, 31.0, 23.0, 34.0, 36.0, 17.0, 39.0, 30.0, 36.0, 36.0, 42.0, 35.0, 31.0, 45.0, 34.0, 25.0, 27.0, 37.0, 42.0, 33.0, 29.0, 22.0, 21.0, 22.0, 21.0, 22.0, 15.0, 14.0, 13.0, 11.0, 6.0, 12.0, 8.0, 4.0, 7.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-28.52808380126953, -27.666709899902344, -26.80533790588379, -25.9439640045166, -25.082592010498047, -24.22121810913086, -23.359844207763672, -22.498472213745117, -21.63709831237793, -20.775724411010742, -19.914352416992188, -19.052978515625, -18.191606521606445, -17.330232620239258, -16.468860626220703, -15.607486724853516, -14.746113777160645, -13.884740829467773, -13.023367881774902, -12.161994934082031, -11.300621032714844, -10.439248085021973, -9.577875137329102, -8.716501235961914, -7.855128765106201, -6.99375581741333, -6.132382392883301, -5.27100944519043, -4.409636497497559, -3.5482630729675293, -2.686890125274658, -1.825516700744629, -0.9641437530517578, -0.10277062654495239, 0.758602499961853, 1.6199755668640137, 2.481348752975464, 3.342721939086914, 4.204094886779785, 5.0654683113098145, 5.9268412590026855, 6.788214206695557, 7.649587631225586, 8.510960578918457, 9.372333526611328, 10.233707427978516, 11.09507942199707, 11.956453323364258, 12.817826271057129, 13.67919921875, 14.540572166442871, 15.401945114135742, 16.26331901550293, 17.124691009521484, 17.986064910888672, 18.84743881225586, 19.708810806274414, 20.5701847076416, 21.431556701660156, 22.292930603027344, 23.1543025970459, 24.015676498413086, 24.87704849243164, 25.738422393798828, 26.599796295166016]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 7.0, 11.0, 16.0, 13.0, 35.0, 46.0, 55.0, 85.0, 152.0, 186.0, 289.0, 373.0, 546.0, 788.0, 1116.0, 1635.0, 2256.0, 3115.0, 4468.0, 6286.0, 9171.0, 13442.0, 19462.0, 28856.0, 43676.0, 64935.0, 98087.0, 139287.0, 164778.0, 141518.0, 99244.0, 66553.0, 44216.0, 29190.0, 19888.0, 13351.0, 9428.0, 6588.0, 4575.0, 3161.0, 2293.0, 1555.0, 1148.0, 852.0, 533.0, 388.0, 281.0, 191.0, 128.0, 103.0, 63.0, 45.0, 36.0, 17.0, 9.0, 14.0, 5.0, 3.0, 4.0, 4.0, 3.0], "bins": [-29.28125, -28.352294921875, -27.42333984375, -26.494384765625, -25.5654296875, -24.636474609375, -23.70751953125, -22.778564453125, -21.849609375, -20.920654296875, -19.99169921875, -19.062744140625, -18.1337890625, -17.204833984375, -16.27587890625, -15.346923828125, -14.41796875, -13.489013671875, -12.56005859375, -11.631103515625, -10.7021484375, -9.773193359375, -8.84423828125, -7.915283203125, -6.986328125, -6.057373046875, -5.12841796875, -4.199462890625, -3.2705078125, -2.341552734375, -1.41259765625, -0.483642578125, 0.4453125, 1.374267578125, 2.30322265625, 3.232177734375, 4.1611328125, 5.090087890625, 6.01904296875, 6.947998046875, 7.876953125, 8.805908203125, 9.73486328125, 10.663818359375, 11.5927734375, 12.521728515625, 13.45068359375, 14.379638671875, 15.30859375, 16.237548828125, 17.16650390625, 18.095458984375, 19.0244140625, 19.953369140625, 20.88232421875, 21.811279296875, 22.740234375, 23.669189453125, 24.59814453125, 25.527099609375, 26.4560546875, 27.385009765625, 28.31396484375, 29.242919921875, 30.171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 15.0, 12.0, 16.0, 17.0, 11.0, 13.0, 27.0, 19.0, 28.0, 34.0, 36.0, 27.0, 29.0, 43.0, 36.0, 34.0, 32.0, 39.0, 30.0, 44.0, 31.0, 33.0, 29.0, 32.0, 36.0, 39.0, 37.0, 25.0, 26.0, 19.0, 14.0, 21.0, 14.0, 17.0, 11.0, 11.0, 5.0, 9.0, 12.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-27.1875, -26.344970703125, -25.50244140625, -24.659912109375, -23.8173828125, -22.974853515625, -22.13232421875, -21.289794921875, -20.447265625, -19.604736328125, -18.76220703125, -17.919677734375, -17.0771484375, -16.234619140625, -15.39208984375, -14.549560546875, -13.70703125, -12.864501953125, -12.02197265625, -11.179443359375, -10.3369140625, -9.494384765625, -8.65185546875, -7.809326171875, -6.966796875, -6.124267578125, -5.28173828125, -4.439208984375, -3.5966796875, -2.754150390625, -1.91162109375, -1.069091796875, -0.2265625, 0.615966796875, 1.45849609375, 2.301025390625, 3.1435546875, 3.986083984375, 4.82861328125, 5.671142578125, 6.513671875, 7.356201171875, 8.19873046875, 9.041259765625, 9.8837890625, 10.726318359375, 11.56884765625, 12.411376953125, 13.25390625, 14.096435546875, 14.93896484375, 15.781494140625, 16.6240234375, 17.466552734375, 18.30908203125, 19.151611328125, 19.994140625, 20.836669921875, 21.67919921875, 22.521728515625, 23.3642578125, 24.206787109375, 25.04931640625, 25.891845703125, 26.734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 14.0, 10.0, 21.0, 26.0, 50.0, 72.0, 102.0, 174.0, 274.0, 400.0, 641.0, 995.0, 1611.0, 2712.0, 4543.0, 7240.0, 12187.0, 21308.0, 37633.0, 69287.0, 128201.0, 216967.0, 228647.0, 140303.0, 76502.0, 41357.0, 23334.0, 13451.0, 8081.0, 4698.0, 2903.0, 1823.0, 1102.0, 721.0, 402.0, 262.0, 171.0, 103.0, 73.0, 46.0, 35.0, 28.0, 18.0, 13.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-44.53125, -43.05078125, -41.5703125, -40.08984375, -38.609375, -37.12890625, -35.6484375, -34.16796875, -32.6875, -31.20703125, -29.7265625, -28.24609375, -26.765625, -25.28515625, -23.8046875, -22.32421875, -20.84375, -19.36328125, -17.8828125, -16.40234375, -14.921875, -13.44140625, -11.9609375, -10.48046875, -9.0, -7.51953125, -6.0390625, -4.55859375, -3.078125, -1.59765625, -0.1171875, 1.36328125, 2.84375, 4.32421875, 5.8046875, 7.28515625, 8.765625, 10.24609375, 11.7265625, 13.20703125, 14.6875, 16.16796875, 17.6484375, 19.12890625, 20.609375, 22.08984375, 23.5703125, 25.05078125, 26.53125, 28.01171875, 29.4921875, 30.97265625, 32.453125, 33.93359375, 35.4140625, 36.89453125, 38.375, 39.85546875, 41.3359375, 42.81640625, 44.296875, 45.77734375, 47.2578125, 48.73828125, 50.21875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 9.0, 12.0, 10.0, 17.0, 21.0, 19.0, 22.0, 27.0, 36.0, 26.0, 39.0, 48.0, 39.0, 51.0, 42.0, 45.0, 48.0, 36.0, 49.0, 40.0, 51.0, 33.0, 34.0, 38.0, 22.0, 29.0, 18.0, 21.0, 19.0, 14.0, 8.0, 10.0, 11.0, 5.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.3125, -18.662353515625, -18.01220703125, -17.362060546875, -16.7119140625, -16.061767578125, -15.41162109375, -14.761474609375, -14.111328125, -13.461181640625, -12.81103515625, -12.160888671875, -11.5107421875, -10.860595703125, -10.21044921875, -9.560302734375, -8.91015625, -8.260009765625, -7.60986328125, -6.959716796875, -6.3095703125, -5.659423828125, -5.00927734375, -4.359130859375, -3.708984375, -3.058837890625, -2.40869140625, -1.758544921875, -1.1083984375, -0.458251953125, 0.19189453125, 0.842041015625, 1.4921875, 2.142333984375, 2.79248046875, 3.442626953125, 4.0927734375, 4.742919921875, 5.39306640625, 6.043212890625, 6.693359375, 7.343505859375, 7.99365234375, 8.643798828125, 9.2939453125, 9.944091796875, 10.59423828125, 11.244384765625, 11.89453125, 12.544677734375, 13.19482421875, 13.844970703125, 14.4951171875, 15.145263671875, 15.79541015625, 16.445556640625, 17.095703125, 17.745849609375, 18.39599609375, 19.046142578125, 19.6962890625, 20.346435546875, 20.99658203125, 21.646728515625, 22.296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 8.0, 10.0, 27.0, 42.0, 48.0, 88.0, 115.0, 188.0, 281.0, 481.0, 731.0, 1090.0, 1844.0, 3102.0, 5097.0, 9015.0, 15700.0, 28433.0, 52139.0, 98316.0, 183573.0, 255465.0, 179427.0, 96880.0, 51284.0, 28008.0, 15482.0, 8730.0, 5097.0, 3049.0, 1794.0, 1062.0, 676.0, 412.0, 283.0, 192.0, 123.0, 79.0, 65.0, 37.0, 20.0, 18.0, 13.0, 11.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9453125, -12.4908447265625, -12.036376953125, -11.5819091796875, -11.12744140625, -10.6729736328125, -10.218505859375, -9.7640380859375, -9.3095703125, -8.8551025390625, -8.400634765625, -7.9461669921875, -7.49169921875, -7.0372314453125, -6.582763671875, -6.1282958984375, -5.673828125, -5.2193603515625, -4.764892578125, -4.3104248046875, -3.85595703125, -3.4014892578125, -2.947021484375, -2.4925537109375, -2.0380859375, -1.5836181640625, -1.129150390625, -0.6746826171875, -0.22021484375, 0.2342529296875, 0.688720703125, 1.1431884765625, 1.59765625, 2.0521240234375, 2.506591796875, 2.9610595703125, 3.41552734375, 3.8699951171875, 4.324462890625, 4.7789306640625, 5.2333984375, 5.6878662109375, 6.142333984375, 6.5968017578125, 7.05126953125, 7.5057373046875, 7.960205078125, 8.4146728515625, 8.869140625, 9.3236083984375, 9.778076171875, 10.2325439453125, 10.68701171875, 11.1414794921875, 11.595947265625, 12.0504150390625, 12.5048828125, 12.9593505859375, 13.413818359375, 13.8682861328125, 14.32275390625, 14.7772216796875, 15.231689453125, 15.6861572265625, 16.140625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 9.0, 8.0, 16.0, 17.0, 15.0, 22.0, 33.0, 42.0, 37.0, 56.0, 52.0, 68.0, 75.0, 76.0, 75.0, 62.0, 61.0, 49.0, 41.0, 33.0, 31.0, 18.0, 16.0, 17.0, 13.0, 8.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012683868408203125, -0.0012215673923492432, -0.0011747479438781738, -0.0011279284954071045, -0.0010811090469360352, -0.0010342895984649658, -0.0009874701499938965, -0.0009406507015228271, -0.0008938312530517578, -0.0008470118045806885, -0.0008001923561096191, -0.0007533729076385498, -0.0007065534591674805, -0.0006597340106964111, -0.0006129145622253418, -0.0005660951137542725, -0.0005192756652832031, -0.0004724562168121338, -0.00042563676834106445, -0.0003788173198699951, -0.0003319978713989258, -0.00028517842292785645, -0.0002383589744567871, -0.00019153952598571777, -0.00014472007751464844, -9.79006290435791e-05, -5.1081180572509766e-05, -4.26173210144043e-06, 4.2557716369628906e-05, 8.937716484069824e-05, 0.00013619661331176758, 0.00018301606178283691, 0.00022983551025390625, 0.0002766549587249756, 0.0003234744071960449, 0.00037029385566711426, 0.0004171133041381836, 0.00046393275260925293, 0.0005107522010803223, 0.0005575716495513916, 0.0006043910980224609, 0.0006512105464935303, 0.0006980299949645996, 0.0007448494434356689, 0.0007916688919067383, 0.0008384883403778076, 0.000885307788848877, 0.0009321272373199463, 0.0009789466857910156, 0.001025766134262085, 0.0010725855827331543, 0.0011194050312042236, 0.001166224479675293, 0.0012130439281463623, 0.0012598633766174316, 0.001306682825088501, 0.0013535022735595703, 0.0014003217220306396, 0.001447141170501709, 0.0014939606189727783, 0.0015407800674438477, 0.001587599515914917, 0.0016344189643859863, 0.0016812384128570557, 0.001728057861328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 8.0, 8.0, 18.0, 27.0, 28.0, 44.0, 85.0, 130.0, 198.0, 274.0, 434.0, 679.0, 1068.0, 1721.0, 2733.0, 4437.0, 7395.0, 12285.0, 20579.0, 35165.0, 60715.0, 104789.0, 173913.0, 216022.0, 166123.0, 100225.0, 56791.0, 33186.0, 19402.0, 11586.0, 6958.0, 4321.0, 2586.0, 1671.0, 1064.0, 678.0, 425.0, 227.0, 193.0, 116.0, 66.0, 61.0, 46.0, 21.0, 11.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9736328125, -10.587890625, -10.2021484375, -9.81640625, -9.4306640625, -9.044921875, -8.6591796875, -8.2734375, -7.8876953125, -7.501953125, -7.1162109375, -6.73046875, -6.3447265625, -5.958984375, -5.5732421875, -5.1875, -4.8017578125, -4.416015625, -4.0302734375, -3.64453125, -3.2587890625, -2.873046875, -2.4873046875, -2.1015625, -1.7158203125, -1.330078125, -0.9443359375, -0.55859375, -0.1728515625, 0.212890625, 0.5986328125, 0.984375, 1.3701171875, 1.755859375, 2.1416015625, 2.52734375, 2.9130859375, 3.298828125, 3.6845703125, 4.0703125, 4.4560546875, 4.841796875, 5.2275390625, 5.61328125, 5.9990234375, 6.384765625, 6.7705078125, 7.15625, 7.5419921875, 7.927734375, 8.3134765625, 8.69921875, 9.0849609375, 9.470703125, 9.8564453125, 10.2421875, 10.6279296875, 11.013671875, 11.3994140625, 11.78515625, 12.1708984375, 12.556640625, 12.9423828125, 13.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 4.0, 4.0, 10.0, 6.0, 11.0, 12.0, 24.0, 22.0, 25.0, 17.0, 30.0, 35.0, 39.0, 31.0, 41.0, 45.0, 65.0, 54.0, 64.0, 62.0, 52.0, 45.0, 38.0, 41.0, 39.0, 21.0, 18.0, 23.0, 13.0, 15.0, 15.0, 9.0, 9.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-3.482421875, -3.3782958984375, -3.274169921875, -3.1700439453125, -3.06591796875, -2.9617919921875, -2.857666015625, -2.7535400390625, -2.6494140625, -2.5452880859375, -2.441162109375, -2.3370361328125, -2.23291015625, -2.1287841796875, -2.024658203125, -1.9205322265625, -1.81640625, -1.7122802734375, -1.608154296875, -1.5040283203125, -1.39990234375, -1.2957763671875, -1.191650390625, -1.0875244140625, -0.9833984375, -0.8792724609375, -0.775146484375, -0.6710205078125, -0.56689453125, -0.4627685546875, -0.358642578125, -0.2545166015625, -0.150390625, -0.0462646484375, 0.057861328125, 0.1619873046875, 0.26611328125, 0.3702392578125, 0.474365234375, 0.5784912109375, 0.6826171875, 0.7867431640625, 0.890869140625, 0.9949951171875, 1.09912109375, 1.2032470703125, 1.307373046875, 1.4114990234375, 1.515625, 1.6197509765625, 1.723876953125, 1.8280029296875, 1.93212890625, 2.0362548828125, 2.140380859375, 2.2445068359375, 2.3486328125, 2.4527587890625, 2.556884765625, 2.6610107421875, 2.76513671875, 2.8692626953125, 2.973388671875, 3.0775146484375, 3.181640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 2.0, 7.0, 13.0, 11.0, 12.0, 13.0, 24.0, 17.0, 23.0, 29.0, 39.0, 40.0, 58.0, 55.0, 57.0, 61.0, 72.0, 48.0, 47.0, 65.0, 43.0, 50.0, 34.0, 28.0, 20.0, 19.0, 16.0, 18.0, 12.0, 9.0, 10.0, 8.0, 5.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.04131317138672, -32.99440383911133, -31.947498321533203, -30.900588989257812, -29.853681564331055, -28.806774139404297, -27.759864807128906, -26.71295738220215, -25.66604995727539, -24.619142532348633, -23.572235107421875, -22.525325775146484, -21.478418350219727, -20.43151092529297, -19.384601593017578, -18.33769416809082, -17.290786743164062, -16.243879318237305, -15.19697093963623, -14.150062561035156, -13.103155136108398, -12.05624771118164, -11.009339332580566, -9.962430953979492, -8.915523529052734, -7.868615627288818, -6.821707725524902, -5.774799823760986, -4.72789192199707, -3.6809840202331543, -2.6340761184692383, -1.5871682167053223, -0.5402565002441406, 0.5066514015197754, 1.5535593032836914, 2.6004672050476074, 3.6473751068115234, 4.6942830085754395, 5.7411909103393555, 6.7880988121032715, 7.8350067138671875, 8.881914138793945, 9.92882251739502, 10.975730895996094, 12.022638320922852, 13.06954574584961, 14.116454124450684, 15.163362503051758, 16.210269927978516, 17.257177352905273, 18.30408477783203, 19.350994110107422, 20.39790153503418, 21.444808959960938, 22.491718292236328, 23.538625717163086, 24.585533142089844, 25.6324405670166, 26.67934799194336, 27.72625732421875, 28.773164749145508, 29.820072174072266, 30.866981506347656, 31.913888931274414, 32.96079635620117]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 5.0, 5.0, 9.0, 9.0, 7.0, 19.0, 13.0, 18.0, 18.0, 15.0, 17.0, 29.0, 27.0, 29.0, 31.0, 20.0, 28.0, 32.0, 26.0, 42.0, 27.0, 17.0, 32.0, 49.0, 33.0, 37.0, 40.0, 23.0, 34.0, 25.0, 24.0, 25.0, 20.0, 30.0, 12.0, 22.0, 20.0, 26.0, 15.0, 15.0, 16.0, 8.0, 9.0, 12.0, 5.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0], "bins": [-28.643796920776367, -27.812063217163086, -26.980331420898438, -26.148597717285156, -25.316865921020508, -24.485132217407227, -23.653400421142578, -22.821666717529297, -21.989933013916016, -21.158199310302734, -20.326467514038086, -19.494733810424805, -18.663002014160156, -17.831268310546875, -16.999534606933594, -16.167802810668945, -15.336071014404297, -14.504338264465332, -13.672605514526367, -12.840871810913086, -12.009140014648438, -11.177406311035156, -10.345673561096191, -9.513940811157227, -8.682208061218262, -7.850475311279297, -7.018742561340332, -6.187009334564209, -5.355276584625244, -4.523543834686279, -3.6918106079101562, -2.8600778579711914, -2.0283432006835938, -1.1966103315353394, -0.36487746238708496, 0.466855525970459, 1.2985882759094238, 2.1303210258483887, 2.9620542526245117, 3.7937870025634766, 4.625519752502441, 5.457252502441406, 6.288985252380371, 7.120718479156494, 7.952451229095459, 8.784183502197266, 9.615917205810547, 10.447649955749512, 11.279382705688477, 12.111115455627441, 12.942848205566406, 13.774581909179688, 14.606313705444336, 15.438047409057617, 16.269779205322266, 17.101512908935547, 17.933246612548828, 18.76498031616211, 19.596712112426758, 20.42844581604004, 21.260177612304688, 22.09191131591797, 22.92364501953125, 23.7553768157959, 24.587108612060547]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 15.0, 18.0, 16.0, 32.0, 45.0, 67.0, 97.0, 144.0, 213.0, 315.0, 481.0, 736.0, 1097.0, 1604.0, 2505.0, 3557.0, 5300.0, 8082.0, 12363.0, 20033.0, 32894.0, 58627.0, 120909.0, 315600.0, 795236.0, 1258741.0, 883546.0, 370366.0, 141137.0, 64482.0, 36005.0, 21425.0, 13309.0, 8588.0, 5509.0, 3633.0, 2464.0, 1677.0, 1186.0, 796.0, 487.0, 340.0, 211.0, 141.0, 73.0, 64.0, 42.0, 30.0, 20.0, 11.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-33.6875, -32.62060546875, -31.5537109375, -30.48681640625, -29.419921875, -28.35302734375, -27.2861328125, -26.21923828125, -25.15234375, -24.08544921875, -23.0185546875, -21.95166015625, -20.884765625, -19.81787109375, -18.7509765625, -17.68408203125, -16.6171875, -15.55029296875, -14.4833984375, -13.41650390625, -12.349609375, -11.28271484375, -10.2158203125, -9.14892578125, -8.08203125, -7.01513671875, -5.9482421875, -4.88134765625, -3.814453125, -2.74755859375, -1.6806640625, -0.61376953125, 0.453125, 1.52001953125, 2.5869140625, 3.65380859375, 4.720703125, 5.78759765625, 6.8544921875, 7.92138671875, 8.98828125, 10.05517578125, 11.1220703125, 12.18896484375, 13.255859375, 14.32275390625, 15.3896484375, 16.45654296875, 17.5234375, 18.59033203125, 19.6572265625, 20.72412109375, 21.791015625, 22.85791015625, 23.9248046875, 24.99169921875, 26.05859375, 27.12548828125, 28.1923828125, 29.25927734375, 30.326171875, 31.39306640625, 32.4599609375, 33.52685546875, 34.59375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 7.0, 4.0, 6.0, 6.0, 6.0, 6.0, 15.0, 14.0, 17.0, 23.0, 16.0, 19.0, 25.0, 24.0, 21.0, 29.0, 35.0, 22.0, 38.0, 25.0, 48.0, 28.0, 32.0, 37.0, 38.0, 34.0, 38.0, 34.0, 40.0, 28.0, 23.0, 35.0, 23.0, 26.0, 22.0, 25.0, 21.0, 13.0, 23.0, 7.0, 16.0, 9.0, 10.0, 9.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-25.40625, -24.650146484375, -23.89404296875, -23.137939453125, -22.3818359375, -21.625732421875, -20.86962890625, -20.113525390625, -19.357421875, -18.601318359375, -17.84521484375, -17.089111328125, -16.3330078125, -15.576904296875, -14.82080078125, -14.064697265625, -13.30859375, -12.552490234375, -11.79638671875, -11.040283203125, -10.2841796875, -9.528076171875, -8.77197265625, -8.015869140625, -7.259765625, -6.503662109375, -5.74755859375, -4.991455078125, -4.2353515625, -3.479248046875, -2.72314453125, -1.967041015625, -1.2109375, -0.454833984375, 0.30126953125, 1.057373046875, 1.8134765625, 2.569580078125, 3.32568359375, 4.081787109375, 4.837890625, 5.593994140625, 6.35009765625, 7.106201171875, 7.8623046875, 8.618408203125, 9.37451171875, 10.130615234375, 10.88671875, 11.642822265625, 12.39892578125, 13.155029296875, 13.9111328125, 14.667236328125, 15.42333984375, 16.179443359375, 16.935546875, 17.691650390625, 18.44775390625, 19.203857421875, 19.9599609375, 20.716064453125, 21.47216796875, 22.228271484375, 22.984375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 11.0, 17.0, 27.0, 56.0, 66.0, 103.0, 173.0, 291.0, 470.0, 820.0, 1357.0, 2352.0, 4110.0, 7776.0, 14719.0, 29469.0, 61083.0, 137014.0, 346713.0, 1113030.0, 1634558.0, 497543.0, 184335.0, 80031.0, 37476.0, 18831.0, 9749.0, 5255.0, 2876.0, 1600.0, 905.0, 537.0, 319.0, 223.0, 137.0, 83.0, 57.0, 36.0, 19.0, 19.0, 8.0, 9.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.208984375, -49.51171875, -47.814453125, -46.1171875, -44.419921875, -42.72265625, -41.025390625, -39.328125, -37.630859375, -35.93359375, -34.236328125, -32.5390625, -30.841796875, -29.14453125, -27.447265625, -25.75, -24.052734375, -22.35546875, -20.658203125, -18.9609375, -17.263671875, -15.56640625, -13.869140625, -12.171875, -10.474609375, -8.77734375, -7.080078125, -5.3828125, -3.685546875, -1.98828125, -0.291015625, 1.40625, 3.103515625, 4.80078125, 6.498046875, 8.1953125, 9.892578125, 11.58984375, 13.287109375, 14.984375, 16.681640625, 18.37890625, 20.076171875, 21.7734375, 23.470703125, 25.16796875, 26.865234375, 28.5625, 30.259765625, 31.95703125, 33.654296875, 35.3515625, 37.048828125, 38.74609375, 40.443359375, 42.140625, 43.837890625, 45.53515625, 47.232421875, 48.9296875, 50.626953125, 52.32421875, 54.021484375, 55.71875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 4.0, 4.0, 7.0, 14.0, 23.0, 22.0, 25.0, 31.0, 51.0, 65.0, 91.0, 93.0, 105.0, 125.0, 155.0, 248.0, 289.0, 379.0, 457.0, 374.0, 302.0, 253.0, 200.0, 157.0, 115.0, 90.0, 74.0, 61.0, 61.0, 32.0, 33.0, 32.0, 26.0, 16.0, 10.0, 8.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.8853759765625, -11.419189453125, -10.9530029296875, -10.48681640625, -10.0206298828125, -9.554443359375, -9.0882568359375, -8.6220703125, -8.1558837890625, -7.689697265625, -7.2235107421875, -6.75732421875, -6.2911376953125, -5.824951171875, -5.3587646484375, -4.892578125, -4.4263916015625, -3.960205078125, -3.4940185546875, -3.02783203125, -2.5616455078125, -2.095458984375, -1.6292724609375, -1.1630859375, -0.6968994140625, -0.230712890625, 0.2354736328125, 0.70166015625, 1.1678466796875, 1.634033203125, 2.1002197265625, 2.56640625, 3.0325927734375, 3.498779296875, 3.9649658203125, 4.43115234375, 4.8973388671875, 5.363525390625, 5.8297119140625, 6.2958984375, 6.7620849609375, 7.228271484375, 7.6944580078125, 8.16064453125, 8.6268310546875, 9.093017578125, 9.5592041015625, 10.025390625, 10.4915771484375, 10.957763671875, 11.4239501953125, 11.89013671875, 12.3563232421875, 12.822509765625, 13.2886962890625, 13.7548828125, 14.2210693359375, 14.687255859375, 15.1534423828125, 15.61962890625, 16.0858154296875, 16.552001953125, 17.0181884765625, 17.484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 11.0, 3.0, 14.0, 6.0, 5.0, 14.0, 18.0, 16.0, 24.0, 21.0, 34.0, 31.0, 32.0, 50.0, 49.0, 52.0, 54.0, 72.0, 53.0, 65.0, 59.0, 61.0, 46.0, 42.0, 27.0, 24.0, 17.0, 19.0, 11.0, 12.0, 14.0, 7.0, 10.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.91046142578125, -29.837297439575195, -28.76413345336914, -27.690969467163086, -26.61780548095703, -25.54464340209961, -24.471479415893555, -23.3983154296875, -22.325151443481445, -21.25198745727539, -20.178823471069336, -19.10565948486328, -18.03249740600586, -16.959331512451172, -15.88616943359375, -14.813005447387695, -13.73984146118164, -12.666677474975586, -11.593513488769531, -10.520350456237793, -9.447186470031738, -8.374022483825684, -7.300858974456787, -6.227695465087891, -5.154531478881836, -4.081367492675781, -3.0082039833068848, -1.9350402355194092, -0.8618764877319336, 0.2112874984741211, 1.2844510078430176, 2.357614517211914, 3.4307823181152344, 4.503946304321289, 5.5771098136901855, 6.650273323059082, 7.723437309265137, 8.796601295471191, 9.86976432800293, 10.942928314208984, 12.016092300415039, 13.089256286621094, 14.162420272827148, 15.235583305358887, 16.308746337890625, 17.381912231445312, 18.455074310302734, 19.52823829650879, 20.601402282714844, 21.6745662689209, 22.747730255126953, 23.820894241333008, 24.894058227539062, 25.967220306396484, 27.04038429260254, 28.113548278808594, 29.18671226501465, 30.259876251220703, 31.333040237426758, 32.40620422363281, 33.479366302490234, 34.55253219604492, 35.625694274902344, 36.69886016845703, 37.77202224731445]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 8.0, 7.0, 16.0, 16.0, 18.0, 26.0, 20.0, 18.0, 32.0, 23.0, 33.0, 36.0, 31.0, 36.0, 40.0, 39.0, 37.0, 49.0, 37.0, 36.0, 31.0, 37.0, 36.0, 37.0, 31.0, 36.0, 34.0, 20.0, 30.0, 24.0, 19.0, 13.0, 16.0, 15.0, 13.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.769123077392578, -28.83692741394043, -27.90473175048828, -26.972537994384766, -26.040342330932617, -25.10814666748047, -24.17595100402832, -23.243755340576172, -22.311561584472656, -21.379365921020508, -20.44717025756836, -19.514976501464844, -18.582780838012695, -17.650585174560547, -16.7183895111084, -15.78619384765625, -14.853998184204102, -13.921802520751953, -12.989607810974121, -12.057412147521973, -11.12521743774414, -10.193021774291992, -9.260826110839844, -8.328630447387695, -7.396435737609863, -6.464240550994873, -5.532045364379883, -4.599849700927734, -3.667654514312744, -2.735459327697754, -1.8032636642456055, -0.8710684776306152, 0.06112480163574219, 0.993320107460022, 1.9255154132843018, 2.857710838317871, 3.7899060249328613, 4.722101211547852, 5.654296875, 6.58649206161499, 7.5186872482299805, 8.450882911682129, 9.383077621459961, 10.31527328491211, 11.247468948364258, 12.17966365814209, 13.111859321594238, 14.04405403137207, 14.976249694824219, 15.908445358276367, 16.840641021728516, 17.77283477783203, 18.70503044128418, 19.637226104736328, 20.569421768188477, 21.501617431640625, 22.43381118774414, 23.36600685119629, 24.298202514648438, 25.230396270751953, 26.1625919342041, 27.09478759765625, 28.0269832611084, 28.959178924560547, 29.891374588012695]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 13.0, 11.0, 22.0, 39.0, 44.0, 82.0, 108.0, 150.0, 212.0, 312.0, 466.0, 709.0, 1027.0, 1551.0, 2240.0, 3424.0, 5133.0, 7858.0, 12162.0, 19079.0, 29745.0, 48122.0, 78486.0, 127820.0, 192305.0, 189134.0, 123635.0, 75381.0, 46811.0, 29256.0, 18435.0, 11953.0, 7690.0, 5013.0, 3284.0, 2177.0, 1468.0, 995.0, 708.0, 464.0, 338.0, 227.0, 147.0, 89.0, 69.0, 51.0, 26.0, 21.0, 21.0, 9.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.219970703125, -21.50244140625, -20.784912109375, -20.0673828125, -19.349853515625, -18.63232421875, -17.914794921875, -17.197265625, -16.479736328125, -15.76220703125, -15.044677734375, -14.3271484375, -13.609619140625, -12.89208984375, -12.174560546875, -11.45703125, -10.739501953125, -10.02197265625, -9.304443359375, -8.5869140625, -7.869384765625, -7.15185546875, -6.434326171875, -5.716796875, -4.999267578125, -4.28173828125, -3.564208984375, -2.8466796875, -2.129150390625, -1.41162109375, -0.694091796875, 0.0234375, 0.740966796875, 1.45849609375, 2.176025390625, 2.8935546875, 3.611083984375, 4.32861328125, 5.046142578125, 5.763671875, 6.481201171875, 7.19873046875, 7.916259765625, 8.6337890625, 9.351318359375, 10.06884765625, 10.786376953125, 11.50390625, 12.221435546875, 12.93896484375, 13.656494140625, 14.3740234375, 15.091552734375, 15.80908203125, 16.526611328125, 17.244140625, 17.961669921875, 18.67919921875, 19.396728515625, 20.1142578125, 20.831787109375, 21.54931640625, 22.266845703125, 22.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 4.0, 3.0, 7.0, 16.0, 15.0, 16.0, 24.0, 16.0, 26.0, 34.0, 32.0, 24.0, 33.0, 28.0, 39.0, 42.0, 42.0, 40.0, 43.0, 53.0, 39.0, 32.0, 34.0, 33.0, 36.0, 44.0, 36.0, 33.0, 29.0, 26.0, 20.0, 21.0, 10.0, 14.0, 15.0, 10.0, 7.0, 6.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.738037109375, -29.74169921875, -28.745361328125, -27.7490234375, -26.752685546875, -25.75634765625, -24.760009765625, -23.763671875, -22.767333984375, -21.77099609375, -20.774658203125, -19.7783203125, -18.781982421875, -17.78564453125, -16.789306640625, -15.79296875, -14.796630859375, -13.80029296875, -12.803955078125, -11.8076171875, -10.811279296875, -9.81494140625, -8.818603515625, -7.822265625, -6.825927734375, -5.82958984375, -4.833251953125, -3.8369140625, -2.840576171875, -1.84423828125, -0.847900390625, 0.1484375, 1.144775390625, 2.14111328125, 3.137451171875, 4.1337890625, 5.130126953125, 6.12646484375, 7.122802734375, 8.119140625, 9.115478515625, 10.11181640625, 11.108154296875, 12.1044921875, 13.100830078125, 14.09716796875, 15.093505859375, 16.08984375, 17.086181640625, 18.08251953125, 19.078857421875, 20.0751953125, 21.071533203125, 22.06787109375, 23.064208984375, 24.060546875, 25.056884765625, 26.05322265625, 27.049560546875, 28.0458984375, 29.042236328125, 30.03857421875, 31.034912109375, 32.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 17.0, 30.0, 29.0, 48.0, 66.0, 101.0, 153.0, 194.0, 287.0, 423.0, 645.0, 984.0, 1592.0, 2490.0, 3977.0, 6738.0, 11371.0, 20600.0, 38926.0, 80717.0, 185181.0, 327926.0, 191314.0, 83592.0, 40478.0, 20975.0, 11687.0, 6741.0, 3978.0, 2531.0, 1638.0, 1026.0, 648.0, 440.0, 292.0, 208.0, 146.0, 104.0, 71.0, 53.0, 28.0, 26.0, 21.0, 11.0, 8.0, 7.0, 4.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.0625, -35.84814453125, -34.6337890625, -33.41943359375, -32.205078125, -30.99072265625, -29.7763671875, -28.56201171875, -27.34765625, -26.13330078125, -24.9189453125, -23.70458984375, -22.490234375, -21.27587890625, -20.0615234375, -18.84716796875, -17.6328125, -16.41845703125, -15.2041015625, -13.98974609375, -12.775390625, -11.56103515625, -10.3466796875, -9.13232421875, -7.91796875, -6.70361328125, -5.4892578125, -4.27490234375, -3.060546875, -1.84619140625, -0.6318359375, 0.58251953125, 1.796875, 3.01123046875, 4.2255859375, 5.43994140625, 6.654296875, 7.86865234375, 9.0830078125, 10.29736328125, 11.51171875, 12.72607421875, 13.9404296875, 15.15478515625, 16.369140625, 17.58349609375, 18.7978515625, 20.01220703125, 21.2265625, 22.44091796875, 23.6552734375, 24.86962890625, 26.083984375, 27.29833984375, 28.5126953125, 29.72705078125, 30.94140625, 32.15576171875, 33.3701171875, 34.58447265625, 35.798828125, 37.01318359375, 38.2275390625, 39.44189453125, 40.65625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 11.0, 15.0, 10.0, 13.0, 24.0, 25.0, 16.0, 27.0, 43.0, 25.0, 36.0, 32.0, 39.0, 39.0, 48.0, 24.0, 34.0, 43.0, 35.0, 39.0, 36.0, 37.0, 44.0, 40.0, 33.0, 32.0, 31.0, 29.0, 18.0, 12.0, 16.0, 11.0, 6.0, 15.0, 6.0, 5.0, 9.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.578125, -20.93798828125, -20.2978515625, -19.65771484375, -19.017578125, -18.37744140625, -17.7373046875, -17.09716796875, -16.45703125, -15.81689453125, -15.1767578125, -14.53662109375, -13.896484375, -13.25634765625, -12.6162109375, -11.97607421875, -11.3359375, -10.69580078125, -10.0556640625, -9.41552734375, -8.775390625, -8.13525390625, -7.4951171875, -6.85498046875, -6.21484375, -5.57470703125, -4.9345703125, -4.29443359375, -3.654296875, -3.01416015625, -2.3740234375, -1.73388671875, -1.09375, -0.45361328125, 0.1865234375, 0.82666015625, 1.466796875, 2.10693359375, 2.7470703125, 3.38720703125, 4.02734375, 4.66748046875, 5.3076171875, 5.94775390625, 6.587890625, 7.22802734375, 7.8681640625, 8.50830078125, 9.1484375, 9.78857421875, 10.4287109375, 11.06884765625, 11.708984375, 12.34912109375, 12.9892578125, 13.62939453125, 14.26953125, 14.90966796875, 15.5498046875, 16.18994140625, 16.830078125, 17.47021484375, 18.1103515625, 18.75048828125, 19.390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 11.0, 16.0, 30.0, 33.0, 46.0, 58.0, 102.0, 133.0, 184.0, 300.0, 436.0, 713.0, 1143.0, 1894.0, 3376.0, 6278.0, 12230.0, 27807.0, 77434.0, 286475.0, 435226.0, 120734.0, 39262.0, 16287.0, 7794.0, 4218.0, 2442.0, 1354.0, 849.0, 555.0, 361.0, 225.0, 165.0, 104.0, 58.0, 57.0, 33.0, 26.0, 18.0, 19.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.6484375, -15.1466064453125, -14.644775390625, -14.1429443359375, -13.64111328125, -13.1392822265625, -12.637451171875, -12.1356201171875, -11.6337890625, -11.1319580078125, -10.630126953125, -10.1282958984375, -9.62646484375, -9.1246337890625, -8.622802734375, -8.1209716796875, -7.619140625, -7.1173095703125, -6.615478515625, -6.1136474609375, -5.61181640625, -5.1099853515625, -4.608154296875, -4.1063232421875, -3.6044921875, -3.1026611328125, -2.600830078125, -2.0989990234375, -1.59716796875, -1.0953369140625, -0.593505859375, -0.0916748046875, 0.41015625, 0.9119873046875, 1.413818359375, 1.9156494140625, 2.41748046875, 2.9193115234375, 3.421142578125, 3.9229736328125, 4.4248046875, 4.9266357421875, 5.428466796875, 5.9302978515625, 6.43212890625, 6.9339599609375, 7.435791015625, 7.9376220703125, 8.439453125, 8.9412841796875, 9.443115234375, 9.9449462890625, 10.44677734375, 10.9486083984375, 11.450439453125, 11.9522705078125, 12.4541015625, 12.9559326171875, 13.457763671875, 13.9595947265625, 14.46142578125, 14.9632568359375, 15.465087890625, 15.9669189453125, 16.46875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 14.0, 18.0, 35.0, 41.0, 81.0, 87.0, 148.0, 159.0, 115.0, 96.0, 56.0, 37.0, 27.0, 19.0, 13.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018739700317382812, -0.0018118172883987427, -0.001749664545059204, -0.0016875118017196655, -0.001625359058380127, -0.0015632063150405884, -0.0015010535717010498, -0.0014389008283615112, -0.0013767480850219727, -0.001314595341682434, -0.0012524425983428955, -0.001190289855003357, -0.0011281371116638184, -0.0010659843683242798, -0.0010038316249847412, -0.0009416788816452026, -0.0008795261383056641, -0.0008173733949661255, -0.0007552206516265869, -0.0006930679082870483, -0.0006309151649475098, -0.0005687624216079712, -0.0005066096782684326, -0.00044445693492889404, -0.00038230419158935547, -0.0003201514482498169, -0.0002579987049102783, -0.00019584596157073975, -0.00013369321823120117, -7.15404748916626e-05, -9.387731552124023e-06, 5.276501178741455e-05, 0.00011491775512695312, 0.0001770704984664917, 0.00023922324180603027, 0.00030137598514556885, 0.0003635287284851074, 0.000425681471824646, 0.00048783421516418457, 0.0005499869585037231, 0.0006121397018432617, 0.0006742924451828003, 0.0007364451885223389, 0.0007985979318618774, 0.000860750675201416, 0.0009229034185409546, 0.0009850561618804932, 0.0010472089052200317, 0.0011093616485595703, 0.0011715143918991089, 0.0012336671352386475, 0.001295819878578186, 0.0013579726219177246, 0.0014201253652572632, 0.0014822781085968018, 0.0015444308519363403, 0.001606583595275879, 0.0016687363386154175, 0.001730889081954956, 0.0017930418252944946, 0.0018551945686340332, 0.0019173473119735718, 0.0019795000553131104, 0.002041652798652649, 0.0021038055419921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 21.0, 29.0, 45.0, 79.0, 119.0, 134.0, 208.0, 363.0, 427.0, 713.0, 1147.0, 1743.0, 2782.0, 4729.0, 7822.0, 14249.0, 27808.0, 60494.0, 153811.0, 334810.0, 250617.0, 98027.0, 41014.0, 20323.0, 10889.0, 6058.0, 3624.0, 2217.0, 1441.0, 892.0, 603.0, 412.0, 286.0, 174.0, 129.0, 86.0, 62.0, 41.0, 22.0, 25.0, 17.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.21875, -14.781005859375, -14.34326171875, -13.905517578125, -13.4677734375, -13.030029296875, -12.59228515625, -12.154541015625, -11.716796875, -11.279052734375, -10.84130859375, -10.403564453125, -9.9658203125, -9.528076171875, -9.09033203125, -8.652587890625, -8.21484375, -7.777099609375, -7.33935546875, -6.901611328125, -6.4638671875, -6.026123046875, -5.58837890625, -5.150634765625, -4.712890625, -4.275146484375, -3.83740234375, -3.399658203125, -2.9619140625, -2.524169921875, -2.08642578125, -1.648681640625, -1.2109375, -0.773193359375, -0.33544921875, 0.102294921875, 0.5400390625, 0.977783203125, 1.41552734375, 1.853271484375, 2.291015625, 2.728759765625, 3.16650390625, 3.604248046875, 4.0419921875, 4.479736328125, 4.91748046875, 5.355224609375, 5.79296875, 6.230712890625, 6.66845703125, 7.106201171875, 7.5439453125, 7.981689453125, 8.41943359375, 8.857177734375, 9.294921875, 9.732666015625, 10.17041015625, 10.608154296875, 11.0458984375, 11.483642578125, 11.92138671875, 12.359130859375, 12.796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 7.0, 5.0, 7.0, 7.0, 15.0, 16.0, 25.0, 24.0, 34.0, 52.0, 79.0, 63.0, 86.0, 71.0, 88.0, 82.0, 74.0, 61.0, 36.0, 21.0, 28.0, 24.0, 13.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.284912109375, -4.14013671875, -3.995361328125, -3.8505859375, -3.705810546875, -3.56103515625, -3.416259765625, -3.271484375, -3.126708984375, -2.98193359375, -2.837158203125, -2.6923828125, -2.547607421875, -2.40283203125, -2.258056640625, -2.11328125, -1.968505859375, -1.82373046875, -1.678955078125, -1.5341796875, -1.389404296875, -1.24462890625, -1.099853515625, -0.955078125, -0.810302734375, -0.66552734375, -0.520751953125, -0.3759765625, -0.231201171875, -0.08642578125, 0.058349609375, 0.203125, 0.347900390625, 0.49267578125, 0.637451171875, 0.7822265625, 0.927001953125, 1.07177734375, 1.216552734375, 1.361328125, 1.506103515625, 1.65087890625, 1.795654296875, 1.9404296875, 2.085205078125, 2.22998046875, 2.374755859375, 2.51953125, 2.664306640625, 2.80908203125, 2.953857421875, 3.0986328125, 3.243408203125, 3.38818359375, 3.532958984375, 3.677734375, 3.822509765625, 3.96728515625, 4.112060546875, 4.2568359375, 4.401611328125, 4.54638671875, 4.691162109375, 4.8359375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 8.0, 10.0, 7.0, 9.0, 12.0, 15.0, 21.0, 16.0, 23.0, 32.0, 22.0, 34.0, 32.0, 47.0, 54.0, 65.0, 61.0, 70.0, 51.0, 64.0, 43.0, 49.0, 41.0, 37.0, 30.0, 22.0, 23.0, 16.0, 17.0, 9.0, 12.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.662500381469727, -27.651273727416992, -26.64004898071289, -25.628822326660156, -24.617595672607422, -23.606369018554688, -22.595144271850586, -21.58391761779785, -20.57269287109375, -19.561466217041016, -18.550241470336914, -17.53901481628418, -16.527788162231445, -15.516562461853027, -14.50533676147461, -13.494110107421875, -12.48288345336914, -11.471657752990723, -10.460431098937988, -9.44920539855957, -8.437978744506836, -7.426753044128418, -6.41552734375, -5.404301166534424, -4.393074989318848, -3.3818488121032715, -2.3706228733062744, -1.3593969345092773, -0.34817075729370117, 0.663055419921875, 1.674281120300293, 2.685507297515869, 3.696735382080078, 4.707961559295654, 5.7191877365112305, 6.730413436889648, 7.741639614105225, 8.7528657913208, 9.764091491699219, 10.775318145751953, 11.786543846130371, 12.797769546508789, 13.808996200561523, 14.820221900939941, 15.83144760131836, 16.842674255371094, 17.853900909423828, 18.86512565612793, 19.876352310180664, 20.8875789642334, 21.8988037109375, 22.910030364990234, 23.92125701904297, 24.932483673095703, 25.943708419799805, 26.95493507385254, 27.96615982055664, 28.977386474609375, 29.988611221313477, 30.99983787536621, 32.01106262207031, 33.02228927612305, 34.03351593017578, 35.044742584228516, 36.05596923828125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 4.0, 10.0, 8.0, 14.0, 20.0, 23.0, 23.0, 25.0, 23.0, 30.0, 26.0, 27.0, 35.0, 35.0, 43.0, 27.0, 47.0, 38.0, 40.0, 40.0, 30.0, 39.0, 34.0, 42.0, 32.0, 35.0, 36.0, 23.0, 25.0, 32.0, 25.0, 10.0, 16.0, 11.0, 16.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-29.438772201538086, -28.533864974975586, -27.628957748413086, -26.724050521850586, -25.819143295288086, -24.914236068725586, -24.009328842163086, -23.104421615600586, -22.199514389038086, -21.294607162475586, -20.389699935913086, -19.484792709350586, -18.579885482788086, -17.674978256225586, -16.770071029663086, -15.865163803100586, -14.96025562286377, -14.05534839630127, -13.15044116973877, -12.24553394317627, -11.34062671661377, -10.435718536376953, -9.530811309814453, -8.625904083251953, -7.720997333526611, -6.816090106964111, -5.911182880401611, -5.006275177001953, -4.101367950439453, -3.196460723876953, -2.291553497314453, -1.3866462707519531, -0.4817390441894531, 0.42316824197769165, 1.3280755281448364, 2.232982873916626, 3.137890100479126, 4.042797565460205, 4.947704792022705, 5.852612018585205, 6.757519245147705, 7.662426471710205, 8.567334175109863, 9.472241401672363, 10.377148628234863, 11.282055854797363, 12.186963081359863, 13.091870307922363, 13.996777534484863, 14.901684761047363, 15.806591987609863, 16.71150016784668, 17.61640739440918, 18.52131462097168, 19.42622184753418, 20.33112907409668, 21.23603630065918, 22.14094352722168, 23.04585075378418, 23.95075798034668, 24.85566520690918, 25.76057243347168, 26.66547966003418, 27.57038688659668, 28.47529411315918]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 18.0, 46.0, 56.0, 94.0, 118.0, 212.0, 264.0, 460.0, 700.0, 1208.0, 1735.0, 2766.0, 4426.0, 6932.0, 11013.0, 17526.0, 28044.0, 45617.0, 72881.0, 115724.0, 169015.0, 187846.0, 140297.0, 91082.0, 55964.0, 35287.0, 21762.0, 13875.0, 8596.0, 5464.0, 3345.0, 2179.0, 1433.0, 923.0, 568.0, 380.0, 215.0, 152.0, 99.0, 82.0, 50.0, 24.0, 17.0, 10.0, 9.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.71875, -33.6416015625, -32.564453125, -31.4873046875, -30.41015625, -29.3330078125, -28.255859375, -27.1787109375, -26.1015625, -25.0244140625, -23.947265625, -22.8701171875, -21.79296875, -20.7158203125, -19.638671875, -18.5615234375, -17.484375, -16.4072265625, -15.330078125, -14.2529296875, -13.17578125, -12.0986328125, -11.021484375, -9.9443359375, -8.8671875, -7.7900390625, -6.712890625, -5.6357421875, -4.55859375, -3.4814453125, -2.404296875, -1.3271484375, -0.25, 0.8271484375, 1.904296875, 2.9814453125, 4.05859375, 5.1357421875, 6.212890625, 7.2900390625, 8.3671875, 9.4443359375, 10.521484375, 11.5986328125, 12.67578125, 13.7529296875, 14.830078125, 15.9072265625, 16.984375, 18.0615234375, 19.138671875, 20.2158203125, 21.29296875, 22.3701171875, 23.447265625, 24.5244140625, 25.6015625, 26.6787109375, 27.755859375, 28.8330078125, 29.91015625, 30.9873046875, 32.064453125, 33.1416015625, 34.21875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 13.0, 6.0, 9.0, 5.0, 13.0, 15.0, 25.0, 26.0, 14.0, 24.0, 29.0, 25.0, 28.0, 36.0, 41.0, 41.0, 30.0, 31.0, 31.0, 45.0, 51.0, 40.0, 36.0, 31.0, 36.0, 36.0, 46.0, 30.0, 33.0, 22.0, 24.0, 26.0, 19.0, 13.0, 19.0, 16.0, 12.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-31.234375, -30.31689453125, -29.3994140625, -28.48193359375, -27.564453125, -26.64697265625, -25.7294921875, -24.81201171875, -23.89453125, -22.97705078125, -22.0595703125, -21.14208984375, -20.224609375, -19.30712890625, -18.3896484375, -17.47216796875, -16.5546875, -15.63720703125, -14.7197265625, -13.80224609375, -12.884765625, -11.96728515625, -11.0498046875, -10.13232421875, -9.21484375, -8.29736328125, -7.3798828125, -6.46240234375, -5.544921875, -4.62744140625, -3.7099609375, -2.79248046875, -1.875, -0.95751953125, -0.0400390625, 0.87744140625, 1.794921875, 2.71240234375, 3.6298828125, 4.54736328125, 5.46484375, 6.38232421875, 7.2998046875, 8.21728515625, 9.134765625, 10.05224609375, 10.9697265625, 11.88720703125, 12.8046875, 13.72216796875, 14.6396484375, 15.55712890625, 16.474609375, 17.39208984375, 18.3095703125, 19.22705078125, 20.14453125, 21.06201171875, 21.9794921875, 22.89697265625, 23.814453125, 24.73193359375, 25.6494140625, 26.56689453125, 27.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 11.0, 22.0, 26.0, 34.0, 62.0, 101.0, 139.0, 271.0, 411.0, 708.0, 1132.0, 2097.0, 3602.0, 6459.0, 11792.0, 22277.0, 42685.0, 86421.0, 174303.0, 278965.0, 205499.0, 103223.0, 51100.0, 25981.0, 13821.0, 7483.0, 4117.0, 2372.0, 1388.0, 839.0, 453.0, 262.0, 189.0, 104.0, 80.0, 43.0, 28.0, 18.0, 18.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.46875, -47.853515625, -46.23828125, -44.623046875, -43.0078125, -41.392578125, -39.77734375, -38.162109375, -36.546875, -34.931640625, -33.31640625, -31.701171875, -30.0859375, -28.470703125, -26.85546875, -25.240234375, -23.625, -22.009765625, -20.39453125, -18.779296875, -17.1640625, -15.548828125, -13.93359375, -12.318359375, -10.703125, -9.087890625, -7.47265625, -5.857421875, -4.2421875, -2.626953125, -1.01171875, 0.603515625, 2.21875, 3.833984375, 5.44921875, 7.064453125, 8.6796875, 10.294921875, 11.91015625, 13.525390625, 15.140625, 16.755859375, 18.37109375, 19.986328125, 21.6015625, 23.216796875, 24.83203125, 26.447265625, 28.0625, 29.677734375, 31.29296875, 32.908203125, 34.5234375, 36.138671875, 37.75390625, 39.369140625, 40.984375, 42.599609375, 44.21484375, 45.830078125, 47.4453125, 49.060546875, 50.67578125, 52.291015625, 53.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 2.0, 2.0, 9.0, 7.0, 18.0, 13.0, 16.0, 11.0, 23.0, 25.0, 20.0, 31.0, 38.0, 32.0, 35.0, 37.0, 59.0, 52.0, 41.0, 40.0, 53.0, 38.0, 46.0, 49.0, 32.0, 34.0, 35.0, 36.0, 20.0, 16.0, 21.0, 23.0, 17.0, 12.0, 15.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.890625, -20.250732421875, -19.61083984375, -18.970947265625, -18.3310546875, -17.691162109375, -17.05126953125, -16.411376953125, -15.771484375, -15.131591796875, -14.49169921875, -13.851806640625, -13.2119140625, -12.572021484375, -11.93212890625, -11.292236328125, -10.65234375, -10.012451171875, -9.37255859375, -8.732666015625, -8.0927734375, -7.452880859375, -6.81298828125, -6.173095703125, -5.533203125, -4.893310546875, -4.25341796875, -3.613525390625, -2.9736328125, -2.333740234375, -1.69384765625, -1.053955078125, -0.4140625, 0.225830078125, 0.86572265625, 1.505615234375, 2.1455078125, 2.785400390625, 3.42529296875, 4.065185546875, 4.705078125, 5.344970703125, 5.98486328125, 6.624755859375, 7.2646484375, 7.904541015625, 8.54443359375, 9.184326171875, 9.82421875, 10.464111328125, 11.10400390625, 11.743896484375, 12.3837890625, 13.023681640625, 13.66357421875, 14.303466796875, 14.943359375, 15.583251953125, 16.22314453125, 16.863037109375, 17.5029296875, 18.142822265625, 18.78271484375, 19.422607421875, 20.0625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 11.0, 18.0, 26.0, 26.0, 33.0, 54.0, 78.0, 94.0, 117.0, 171.0, 260.0, 353.0, 507.0, 740.0, 1143.0, 1831.0, 3001.0, 5140.0, 9083.0, 18024.0, 37542.0, 85294.0, 206669.0, 336021.0, 190600.0, 78129.0, 34960.0, 16904.0, 8737.0, 4892.0, 2818.0, 1760.0, 1064.0, 706.0, 507.0, 355.0, 244.0, 174.0, 116.0, 105.0, 60.0, 45.0, 37.0, 36.0, 15.0, 11.0, 14.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.59375, -19.91748046875, -19.2412109375, -18.56494140625, -17.888671875, -17.21240234375, -16.5361328125, -15.85986328125, -15.18359375, -14.50732421875, -13.8310546875, -13.15478515625, -12.478515625, -11.80224609375, -11.1259765625, -10.44970703125, -9.7734375, -9.09716796875, -8.4208984375, -7.74462890625, -7.068359375, -6.39208984375, -5.7158203125, -5.03955078125, -4.36328125, -3.68701171875, -3.0107421875, -2.33447265625, -1.658203125, -0.98193359375, -0.3056640625, 0.37060546875, 1.046875, 1.72314453125, 2.3994140625, 3.07568359375, 3.751953125, 4.42822265625, 5.1044921875, 5.78076171875, 6.45703125, 7.13330078125, 7.8095703125, 8.48583984375, 9.162109375, 9.83837890625, 10.5146484375, 11.19091796875, 11.8671875, 12.54345703125, 13.2197265625, 13.89599609375, 14.572265625, 15.24853515625, 15.9248046875, 16.60107421875, 17.27734375, 17.95361328125, 18.6298828125, 19.30615234375, 19.982421875, 20.65869140625, 21.3349609375, 22.01123046875, 22.6875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 10.0, 16.0, 26.0, 33.0, 60.0, 78.0, 90.0, 137.0, 126.0, 108.0, 80.0, 66.0, 36.0, 38.0, 11.0, 19.0, 11.0, 9.0, 7.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0028972625732421875, -0.0028096139430999756, -0.0027219653129577637, -0.0026343166828155518, -0.00254666805267334, -0.002459019422531128, -0.002371370792388916, -0.002283722162246704, -0.002196073532104492, -0.0021084249019622803, -0.0020207762718200684, -0.0019331276416778564, -0.0018454790115356445, -0.0017578303813934326, -0.0016701817512512207, -0.0015825331211090088, -0.0014948844909667969, -0.001407235860824585, -0.001319587230682373, -0.0012319386005401611, -0.0011442899703979492, -0.0010566413402557373, -0.0009689927101135254, -0.0008813440799713135, -0.0007936954498291016, -0.0007060468196868896, -0.0006183981895446777, -0.0005307495594024658, -0.0004431009292602539, -0.000355452299118042, -0.0002678036689758301, -0.00018015503883361816, -9.250640869140625e-05, -4.857778549194336e-06, 8.279085159301758e-05, 0.0001704394817352295, 0.0002580881118774414, 0.0003457367420196533, 0.00043338537216186523, 0.0005210340023040771, 0.0006086826324462891, 0.000696331262588501, 0.0007839798927307129, 0.0008716285228729248, 0.0009592771530151367, 0.0010469257831573486, 0.0011345744132995605, 0.0012222230434417725, 0.0013098716735839844, 0.0013975203037261963, 0.0014851689338684082, 0.0015728175640106201, 0.001660466194152832, 0.001748114824295044, 0.0018357634544372559, 0.0019234120845794678, 0.0020110607147216797, 0.0020987093448638916, 0.0021863579750061035, 0.0022740066051483154, 0.0023616552352905273, 0.0024493038654327393, 0.002536952495574951, 0.002624601125717163, 0.002712249755859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 33.0, 28.0, 38.0, 52.0, 97.0, 146.0, 250.0, 419.0, 661.0, 1118.0, 1947.0, 3390.0, 6399.0, 12480.0, 26415.0, 58982.0, 137365.0, 289205.0, 276118.0, 127457.0, 55422.0, 24742.0, 11874.0, 6008.0, 3260.0, 1867.0, 1044.0, 612.0, 379.0, 219.0, 156.0, 100.0, 77.0, 43.0, 33.0, 17.0, 13.0, 12.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.828125, -19.166259765625, -18.50439453125, -17.842529296875, -17.1806640625, -16.518798828125, -15.85693359375, -15.195068359375, -14.533203125, -13.871337890625, -13.20947265625, -12.547607421875, -11.8857421875, -11.223876953125, -10.56201171875, -9.900146484375, -9.23828125, -8.576416015625, -7.91455078125, -7.252685546875, -6.5908203125, -5.928955078125, -5.26708984375, -4.605224609375, -3.943359375, -3.281494140625, -2.61962890625, -1.957763671875, -1.2958984375, -0.634033203125, 0.02783203125, 0.689697265625, 1.3515625, 2.013427734375, 2.67529296875, 3.337158203125, 3.9990234375, 4.660888671875, 5.32275390625, 5.984619140625, 6.646484375, 7.308349609375, 7.97021484375, 8.632080078125, 9.2939453125, 9.955810546875, 10.61767578125, 11.279541015625, 11.94140625, 12.603271484375, 13.26513671875, 13.927001953125, 14.5888671875, 15.250732421875, 15.91259765625, 16.574462890625, 17.236328125, 17.898193359375, 18.56005859375, 19.221923828125, 19.8837890625, 20.545654296875, 21.20751953125, 21.869384765625, 22.53125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 16.0, 16.0, 17.0, 32.0, 32.0, 35.0, 50.0, 50.0, 66.0, 56.0, 71.0, 79.0, 83.0, 84.0, 57.0, 46.0, 41.0, 32.0, 34.0, 17.0, 13.0, 12.0, 13.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.22869873046875, -4.0355224609375, -3.84234619140625, -3.649169921875, -3.45599365234375, -3.2628173828125, -3.06964111328125, -2.87646484375, -2.68328857421875, -2.4901123046875, -2.29693603515625, -2.103759765625, -1.91058349609375, -1.7174072265625, -1.52423095703125, -1.3310546875, -1.13787841796875, -0.9447021484375, -0.75152587890625, -0.558349609375, -0.36517333984375, -0.1719970703125, 0.02117919921875, 0.21435546875, 0.40753173828125, 0.6007080078125, 0.79388427734375, 0.987060546875, 1.18023681640625, 1.3734130859375, 1.56658935546875, 1.759765625, 1.95294189453125, 2.1461181640625, 2.33929443359375, 2.532470703125, 2.72564697265625, 2.9188232421875, 3.11199951171875, 3.30517578125, 3.49835205078125, 3.6915283203125, 3.88470458984375, 4.077880859375, 4.27105712890625, 4.4642333984375, 4.65740966796875, 4.8505859375, 5.04376220703125, 5.2369384765625, 5.43011474609375, 5.623291015625, 5.81646728515625, 6.0096435546875, 6.20281982421875, 6.39599609375, 6.58917236328125, 6.7823486328125, 6.97552490234375, 7.168701171875, 7.36187744140625, 7.5550537109375, 7.74822998046875, 7.94140625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 5.0, 9.0, 15.0, 20.0, 16.0, 18.0, 30.0, 33.0, 28.0, 41.0, 35.0, 50.0, 45.0, 59.0, 47.0, 49.0, 53.0, 48.0, 64.0, 43.0, 38.0, 43.0, 27.0, 20.0, 19.0, 18.0, 16.0, 22.0, 16.0, 6.0, 5.0, 8.0, 7.0, 3.0, 2.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0], "bins": [-28.101316452026367, -27.175453186035156, -26.249591827392578, -25.323728561401367, -24.397865295410156, -23.472002029418945, -22.546138763427734, -21.620277404785156, -20.694414138793945, -19.768550872802734, -18.842689514160156, -17.916826248168945, -16.990962982177734, -16.065099716186523, -15.139237403869629, -14.213375091552734, -13.287511825561523, -12.361648559570312, -11.435786247253418, -10.509923934936523, -9.584060668945312, -8.658197402954102, -7.732335090637207, -6.806472301483154, -5.880609512329102, -4.954746723175049, -4.028883934020996, -3.1030211448669434, -2.1771583557128906, -1.251295566558838, -0.32543277740478516, 0.6004300117492676, 1.5262908935546875, 2.4521536827087402, 3.378016471862793, 4.303879261016846, 5.229742050170898, 6.155604839324951, 7.081467628479004, 8.007329940795898, 8.93319320678711, 9.85905647277832, 10.784918785095215, 11.71078109741211, 12.63664436340332, 13.562507629394531, 14.488369941711426, 15.41423225402832, 16.34009552001953, 17.265958786010742, 18.191822052001953, 19.11768341064453, 20.043546676635742, 20.969409942626953, 21.89527130126953, 22.821134567260742, 23.746997833251953, 24.672861099243164, 25.598724365234375, 26.524585723876953, 27.450448989868164, 28.376312255859375, 29.302173614501953, 30.228036880493164, 31.153900146484375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 5.0, 11.0, 10.0, 7.0, 19.0, 15.0, 22.0, 17.0, 20.0, 21.0, 26.0, 27.0, 33.0, 35.0, 38.0, 34.0, 30.0, 39.0, 40.0, 28.0, 30.0, 30.0, 36.0, 25.0, 31.0, 40.0, 29.0, 28.0, 35.0, 30.0, 29.0, 27.0, 17.0, 17.0, 17.0, 16.0, 12.0, 6.0, 7.0, 12.0, 5.0, 9.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0], "bins": [-28.420991897583008, -27.608470916748047, -26.795949935913086, -25.983428955078125, -25.170909881591797, -24.358386993408203, -23.545867919921875, -22.733346939086914, -21.920825958251953, -21.108304977416992, -20.29578399658203, -19.48326301574707, -18.67074203491211, -17.85822296142578, -17.04570198059082, -16.23318099975586, -15.420660018920898, -14.608139038085938, -13.795618057250977, -12.983098030090332, -12.170577049255371, -11.35805606842041, -10.545536041259766, -9.733015060424805, -8.920494079589844, -8.107973098754883, -7.29545259475708, -6.482932090759277, -5.670411109924316, -4.8578901290893555, -4.045369625091553, -3.23284912109375, -2.4203262329101562, -1.6078054904937744, -0.7952847480773926, 0.017235994338989258, 0.8297567367553711, 1.642277717590332, 2.4547982215881348, 3.2673187255859375, 4.079839706420898, 4.892360687255859, 5.704881191253662, 6.517401695251465, 7.329922676086426, 8.142443656921387, 8.954963684082031, 9.767484664916992, 10.580005645751953, 11.392526626586914, 12.205047607421875, 13.01756763458252, 13.83008861541748, 14.642609596252441, 15.455129623413086, 16.267650604248047, 17.080171585083008, 17.89269256591797, 18.70521354675293, 19.51773452758789, 20.33025360107422, 21.142776489257812, 21.95529556274414, 22.7678165435791, 23.580337524414062]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 9.0, 7.0, 9.0, 10.0, 14.0, 24.0, 38.0, 45.0, 51.0, 89.0, 155.0, 182.0, 314.0, 412.0, 578.0, 899.0, 1249.0, 1954.0, 2973.0, 4645.0, 6920.0, 10970.0, 17514.0, 29326.0, 52229.0, 108345.0, 295432.0, 852505.0, 1386435.0, 847479.0, 320843.0, 119100.0, 56137.0, 30531.0, 17605.0, 10655.0, 6609.0, 4254.0, 2650.0, 1786.0, 1109.0, 750.0, 483.0, 328.0, 230.0, 147.0, 100.0, 42.0, 44.0, 28.0, 20.0, 13.0, 12.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-38.5625, -37.4453125, -36.328125, -35.2109375, -34.09375, -32.9765625, -31.859375, -30.7421875, -29.625, -28.5078125, -27.390625, -26.2734375, -25.15625, -24.0390625, -22.921875, -21.8046875, -20.6875, -19.5703125, -18.453125, -17.3359375, -16.21875, -15.1015625, -13.984375, -12.8671875, -11.75, -10.6328125, -9.515625, -8.3984375, -7.28125, -6.1640625, -5.046875, -3.9296875, -2.8125, -1.6953125, -0.578125, 0.5390625, 1.65625, 2.7734375, 3.890625, 5.0078125, 6.125, 7.2421875, 8.359375, 9.4765625, 10.59375, 11.7109375, 12.828125, 13.9453125, 15.0625, 16.1796875, 17.296875, 18.4140625, 19.53125, 20.6484375, 21.765625, 22.8828125, 24.0, 25.1171875, 26.234375, 27.3515625, 28.46875, 29.5859375, 30.703125, 31.8203125, 32.9375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 12.0, 18.0, 12.0, 13.0, 12.0, 21.0, 24.0, 30.0, 15.0, 27.0, 29.0, 39.0, 29.0, 37.0, 30.0, 38.0, 39.0, 40.0, 25.0, 40.0, 32.0, 42.0, 45.0, 39.0, 24.0, 30.0, 33.0, 28.0, 29.0, 14.0, 17.0, 12.0, 11.0, 18.0, 18.0, 7.0, 5.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.671875, -24.945556640625, -24.21923828125, -23.492919921875, -22.7666015625, -22.040283203125, -21.31396484375, -20.587646484375, -19.861328125, -19.135009765625, -18.40869140625, -17.682373046875, -16.9560546875, -16.229736328125, -15.50341796875, -14.777099609375, -14.05078125, -13.324462890625, -12.59814453125, -11.871826171875, -11.1455078125, -10.419189453125, -9.69287109375, -8.966552734375, -8.240234375, -7.513916015625, -6.78759765625, -6.061279296875, -5.3349609375, -4.608642578125, -3.88232421875, -3.156005859375, -2.4296875, -1.703369140625, -0.97705078125, -0.250732421875, 0.4755859375, 1.201904296875, 1.92822265625, 2.654541015625, 3.380859375, 4.107177734375, 4.83349609375, 5.559814453125, 6.2861328125, 7.012451171875, 7.73876953125, 8.465087890625, 9.19140625, 9.917724609375, 10.64404296875, 11.370361328125, 12.0966796875, 12.822998046875, 13.54931640625, 14.275634765625, 15.001953125, 15.728271484375, 16.45458984375, 17.180908203125, 17.9072265625, 18.633544921875, 19.35986328125, 20.086181640625, 20.8125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 1.0, 21.0, 33.0, 35.0, 38.0, 64.0, 98.0, 159.0, 226.0, 372.0, 508.0, 879.0, 1303.0, 2175.0, 3481.0, 5669.0, 10039.0, 17643.0, 32848.0, 62899.0, 128569.0, 293018.0, 771625.0, 1628720.0, 708548.0, 271835.0, 121760.0, 59737.0, 30933.0, 16951.0, 9594.0, 5520.0, 3315.0, 2060.0, 1298.0, 781.0, 509.0, 322.0, 235.0, 159.0, 101.0, 77.0, 44.0, 22.0, 22.0, 12.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.09375, -39.74462890625, -38.3955078125, -37.04638671875, -35.697265625, -34.34814453125, -32.9990234375, -31.64990234375, -30.30078125, -28.95166015625, -27.6025390625, -26.25341796875, -24.904296875, -23.55517578125, -22.2060546875, -20.85693359375, -19.5078125, -18.15869140625, -16.8095703125, -15.46044921875, -14.111328125, -12.76220703125, -11.4130859375, -10.06396484375, -8.71484375, -7.36572265625, -6.0166015625, -4.66748046875, -3.318359375, -1.96923828125, -0.6201171875, 0.72900390625, 2.078125, 3.42724609375, 4.7763671875, 6.12548828125, 7.474609375, 8.82373046875, 10.1728515625, 11.52197265625, 12.87109375, 14.22021484375, 15.5693359375, 16.91845703125, 18.267578125, 19.61669921875, 20.9658203125, 22.31494140625, 23.6640625, 25.01318359375, 26.3623046875, 27.71142578125, 29.060546875, 30.40966796875, 31.7587890625, 33.10791015625, 34.45703125, 35.80615234375, 37.1552734375, 38.50439453125, 39.853515625, 41.20263671875, 42.5517578125, 43.90087890625, 45.25]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 9.0, 12.0, 23.0, 30.0, 29.0, 46.0, 41.0, 48.0, 83.0, 96.0, 139.0, 183.0, 247.0, 341.0, 416.0, 466.0, 431.0, 334.0, 267.0, 181.0, 169.0, 107.0, 92.0, 63.0, 56.0, 39.0, 32.0, 24.0, 16.0, 11.0, 16.0, 3.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.953125, -12.466552734375, -11.97998046875, -11.493408203125, -11.0068359375, -10.520263671875, -10.03369140625, -9.547119140625, -9.060546875, -8.573974609375, -8.08740234375, -7.600830078125, -7.1142578125, -6.627685546875, -6.14111328125, -5.654541015625, -5.16796875, -4.681396484375, -4.19482421875, -3.708251953125, -3.2216796875, -2.735107421875, -2.24853515625, -1.761962890625, -1.275390625, -0.788818359375, -0.30224609375, 0.184326171875, 0.6708984375, 1.157470703125, 1.64404296875, 2.130615234375, 2.6171875, 3.103759765625, 3.59033203125, 4.076904296875, 4.5634765625, 5.050048828125, 5.53662109375, 6.023193359375, 6.509765625, 6.996337890625, 7.48291015625, 7.969482421875, 8.4560546875, 8.942626953125, 9.42919921875, 9.915771484375, 10.40234375, 10.888916015625, 11.37548828125, 11.862060546875, 12.3486328125, 12.835205078125, 13.32177734375, 13.808349609375, 14.294921875, 14.781494140625, 15.26806640625, 15.754638671875, 16.2412109375, 16.727783203125, 17.21435546875, 17.700927734375, 18.1875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 6.0, 13.0, 8.0, 19.0, 24.0, 26.0, 35.0, 39.0, 45.0, 54.0, 76.0, 62.0, 67.0, 82.0, 69.0, 73.0, 60.0, 43.0, 32.0, 29.0, 31.0, 15.0, 17.0, 16.0, 7.0, 12.0, 5.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-43.4337272644043, -42.22896194458008, -41.024200439453125, -39.819435119628906, -38.61466979980469, -37.40990447998047, -36.20513916015625, -35.0003776550293, -33.79561233520508, -32.59084701538086, -31.386083602905273, -30.181320190429688, -28.97655487060547, -27.77178955078125, -26.567026138305664, -25.362262725830078, -24.15749740600586, -22.95273208618164, -21.747968673706055, -20.54320526123047, -19.33843994140625, -18.13367462158203, -16.928911209106445, -15.724146842956543, -14.51938247680664, -13.314618110656738, -12.109853744506836, -10.905089378356934, -9.700325012207031, -8.495560646057129, -7.290796279907227, -6.086031913757324, -4.8812713623046875, -3.676506996154785, -2.471742630004883, -1.2669782638549805, -0.062213897705078125, 1.1425504684448242, 2.3473148345947266, 3.552079200744629, 4.756843566894531, 5.961607933044434, 7.166372299194336, 8.371136665344238, 9.57590103149414, 10.780665397644043, 11.985429763793945, 13.190194129943848, 14.39495849609375, 15.599722862243652, 16.804487228393555, 18.00925064086914, 19.21401596069336, 20.418781280517578, 21.623544692993164, 22.82830810546875, 24.03307342529297, 25.237838745117188, 26.442602157592773, 27.64736557006836, 28.852130889892578, 30.056896209716797, 31.261659622192383, 32.46642303466797, 33.67118835449219]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 15.0, 9.0, 8.0, 10.0, 17.0, 18.0, 16.0, 14.0, 23.0, 23.0, 23.0, 26.0, 34.0, 30.0, 37.0, 37.0, 44.0, 41.0, 41.0, 33.0, 51.0, 34.0, 37.0, 36.0, 35.0, 35.0, 25.0, 35.0, 29.0, 19.0, 15.0, 21.0, 22.0, 22.0, 12.0, 16.0, 8.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.403141021728516, -27.558950424194336, -26.714757919311523, -25.870567321777344, -25.026376724243164, -24.182186126708984, -23.337993621826172, -22.493803024291992, -21.649612426757812, -20.805421829223633, -19.96122932434082, -19.11703872680664, -18.27284812927246, -17.42865753173828, -16.58446502685547, -15.740274429321289, -14.896081924438477, -14.05189037322998, -13.2076997756958, -12.363508224487305, -11.519317626953125, -10.675126075744629, -9.830934524536133, -8.986743927001953, -8.142552375793457, -7.298361301422119, -6.454170227050781, -5.609978675842285, -4.765787601470947, -3.9215965270996094, -3.0774049758911133, -2.2332139015197754, -1.3890228271484375, -0.5448316335678101, 0.2993595600128174, 1.1435508728027344, 1.9877419471740723, 2.83193302154541, 3.6761245727539062, 4.520315647125244, 5.364506721496582, 6.20869779586792, 7.052888870239258, 7.897080421447754, 8.74127197265625, 9.58546257019043, 10.429654121398926, 11.273845672607422, 12.118036270141602, 12.962227821350098, 13.806418418884277, 14.650609970092773, 15.494800567626953, 16.338993072509766, 17.183183670043945, 18.027374267578125, 18.871566772460938, 19.715757369995117, 20.55994987487793, 21.40414047241211, 22.24833106994629, 23.09252166748047, 23.93671417236328, 24.78090476989746, 25.62509536743164]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 9.0, 11.0, 27.0, 30.0, 45.0, 62.0, 93.0, 143.0, 210.0, 359.0, 516.0, 911.0, 1582.0, 2843.0, 4881.0, 8905.0, 16162.0, 30746.0, 59894.0, 127007.0, 271466.0, 268490.0, 127189.0, 59912.0, 30562.0, 16110.0, 8726.0, 4836.0, 2793.0, 1533.0, 949.0, 558.0, 335.0, 216.0, 134.0, 102.0, 70.0, 37.0, 23.0, 22.0, 16.0, 16.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -27.927490234375, -26.96435546875, -26.001220703125, -25.0380859375, -24.074951171875, -23.11181640625, -22.148681640625, -21.185546875, -20.222412109375, -19.25927734375, -18.296142578125, -17.3330078125, -16.369873046875, -15.40673828125, -14.443603515625, -13.48046875, -12.517333984375, -11.55419921875, -10.591064453125, -9.6279296875, -8.664794921875, -7.70166015625, -6.738525390625, -5.775390625, -4.812255859375, -3.84912109375, -2.885986328125, -1.9228515625, -0.959716796875, 0.00341796875, 0.966552734375, 1.9296875, 2.892822265625, 3.85595703125, 4.819091796875, 5.7822265625, 6.745361328125, 7.70849609375, 8.671630859375, 9.634765625, 10.597900390625, 11.56103515625, 12.524169921875, 13.4873046875, 14.450439453125, 15.41357421875, 16.376708984375, 17.33984375, 18.302978515625, 19.26611328125, 20.229248046875, 21.1923828125, 22.155517578125, 23.11865234375, 24.081787109375, 25.044921875, 26.008056640625, 26.97119140625, 27.934326171875, 28.8974609375, 29.860595703125, 30.82373046875, 31.786865234375, 32.75]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 7.0, 6.0, 13.0, 17.0, 14.0, 20.0, 7.0, 16.0, 19.0, 26.0, 26.0, 25.0, 34.0, 35.0, 43.0, 31.0, 33.0, 44.0, 46.0, 34.0, 43.0, 41.0, 30.0, 40.0, 35.0, 24.0, 34.0, 29.0, 30.0, 28.0, 16.0, 16.0, 19.0, 15.0, 15.0, 13.0, 19.0, 12.0, 4.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.25, -27.404052734375, -26.55810546875, -25.712158203125, -24.8662109375, -24.020263671875, -23.17431640625, -22.328369140625, -21.482421875, -20.636474609375, -19.79052734375, -18.944580078125, -18.0986328125, -17.252685546875, -16.40673828125, -15.560791015625, -14.71484375, -13.868896484375, -13.02294921875, -12.177001953125, -11.3310546875, -10.485107421875, -9.63916015625, -8.793212890625, -7.947265625, -7.101318359375, -6.25537109375, -5.409423828125, -4.5634765625, -3.717529296875, -2.87158203125, -2.025634765625, -1.1796875, -0.333740234375, 0.51220703125, 1.358154296875, 2.2041015625, 3.050048828125, 3.89599609375, 4.741943359375, 5.587890625, 6.433837890625, 7.27978515625, 8.125732421875, 8.9716796875, 9.817626953125, 10.66357421875, 11.509521484375, 12.35546875, 13.201416015625, 14.04736328125, 14.893310546875, 15.7392578125, 16.585205078125, 17.43115234375, 18.277099609375, 19.123046875, 19.968994140625, 20.81494140625, 21.660888671875, 22.5068359375, 23.352783203125, 24.19873046875, 25.044677734375, 25.890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 8.0, 9.0, 18.0, 35.0, 58.0, 62.0, 100.0, 155.0, 197.0, 352.0, 550.0, 901.0, 1409.0, 2295.0, 3898.0, 6346.0, 11108.0, 20127.0, 39549.0, 87323.0, 226993.0, 363424.0, 152195.0, 63045.0, 30192.0, 15956.0, 8876.0, 5144.0, 3067.0, 1914.0, 1175.0, 754.0, 426.0, 313.0, 199.0, 117.0, 82.0, 55.0, 44.0, 32.0, 20.0, 8.0, 7.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40625, -37.21728515625, -36.0283203125, -34.83935546875, -33.650390625, -32.46142578125, -31.2724609375, -30.08349609375, -28.89453125, -27.70556640625, -26.5166015625, -25.32763671875, -24.138671875, -22.94970703125, -21.7607421875, -20.57177734375, -19.3828125, -18.19384765625, -17.0048828125, -15.81591796875, -14.626953125, -13.43798828125, -12.2490234375, -11.06005859375, -9.87109375, -8.68212890625, -7.4931640625, -6.30419921875, -5.115234375, -3.92626953125, -2.7373046875, -1.54833984375, -0.359375, 0.82958984375, 2.0185546875, 3.20751953125, 4.396484375, 5.58544921875, 6.7744140625, 7.96337890625, 9.15234375, 10.34130859375, 11.5302734375, 12.71923828125, 13.908203125, 15.09716796875, 16.2861328125, 17.47509765625, 18.6640625, 19.85302734375, 21.0419921875, 22.23095703125, 23.419921875, 24.60888671875, 25.7978515625, 26.98681640625, 28.17578125, 29.36474609375, 30.5537109375, 31.74267578125, 32.931640625, 34.12060546875, 35.3095703125, 36.49853515625, 37.6875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 3.0, 8.0, 9.0, 13.0, 19.0, 14.0, 18.0, 21.0, 20.0, 26.0, 33.0, 28.0, 39.0, 38.0, 43.0, 51.0, 46.0, 49.0, 41.0, 44.0, 37.0, 46.0, 35.0, 43.0, 43.0, 32.0, 25.0, 18.0, 29.0, 21.0, 24.0, 15.0, 7.0, 10.0, 9.0, 5.0, 9.0, 4.0, 1.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.0712890625, -19.439453125, -18.8076171875, -18.17578125, -17.5439453125, -16.912109375, -16.2802734375, -15.6484375, -15.0166015625, -14.384765625, -13.7529296875, -13.12109375, -12.4892578125, -11.857421875, -11.2255859375, -10.59375, -9.9619140625, -9.330078125, -8.6982421875, -8.06640625, -7.4345703125, -6.802734375, -6.1708984375, -5.5390625, -4.9072265625, -4.275390625, -3.6435546875, -3.01171875, -2.3798828125, -1.748046875, -1.1162109375, -0.484375, 0.1474609375, 0.779296875, 1.4111328125, 2.04296875, 2.6748046875, 3.306640625, 3.9384765625, 4.5703125, 5.2021484375, 5.833984375, 6.4658203125, 7.09765625, 7.7294921875, 8.361328125, 8.9931640625, 9.625, 10.2568359375, 10.888671875, 11.5205078125, 12.15234375, 12.7841796875, 13.416015625, 14.0478515625, 14.6796875, 15.3115234375, 15.943359375, 16.5751953125, 17.20703125, 17.8388671875, 18.470703125, 19.1025390625, 19.734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 12.0, 9.0, 15.0, 27.0, 36.0, 43.0, 51.0, 87.0, 104.0, 173.0, 254.0, 364.0, 545.0, 845.0, 1400.0, 2192.0, 3773.0, 6596.0, 12241.0, 25278.0, 56288.0, 133764.0, 308554.0, 279554.0, 117789.0, 49360.0, 22486.0, 11294.0, 6004.0, 3468.0, 2095.0, 1365.0, 819.0, 564.0, 373.0, 219.0, 148.0, 104.0, 65.0, 58.0, 33.0, 27.0, 18.0, 13.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0], "bins": [-10.2734375, -9.96142578125, -9.6494140625, -9.33740234375, -9.025390625, -8.71337890625, -8.4013671875, -8.08935546875, -7.77734375, -7.46533203125, -7.1533203125, -6.84130859375, -6.529296875, -6.21728515625, -5.9052734375, -5.59326171875, -5.28125, -4.96923828125, -4.6572265625, -4.34521484375, -4.033203125, -3.72119140625, -3.4091796875, -3.09716796875, -2.78515625, -2.47314453125, -2.1611328125, -1.84912109375, -1.537109375, -1.22509765625, -0.9130859375, -0.60107421875, -0.2890625, 0.02294921875, 0.3349609375, 0.64697265625, 0.958984375, 1.27099609375, 1.5830078125, 1.89501953125, 2.20703125, 2.51904296875, 2.8310546875, 3.14306640625, 3.455078125, 3.76708984375, 4.0791015625, 4.39111328125, 4.703125, 5.01513671875, 5.3271484375, 5.63916015625, 5.951171875, 6.26318359375, 6.5751953125, 6.88720703125, 7.19921875, 7.51123046875, 7.8232421875, 8.13525390625, 8.447265625, 8.75927734375, 9.0712890625, 9.38330078125, 9.6953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 9.0, 11.0, 22.0, 32.0, 29.0, 30.0, 39.0, 51.0, 67.0, 59.0, 75.0, 67.0, 64.0, 58.0, 63.0, 58.0, 43.0, 34.0, 29.0, 26.0, 25.0, 19.0, 18.0, 7.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006732940673828125, -0.0006482452154159546, -0.0006231963634490967, -0.0005981475114822388, -0.0005730986595153809, -0.000548049807548523, -0.000523000955581665, -0.0004979521036148071, -0.0004729032516479492, -0.0004478543996810913, -0.0004228055477142334, -0.0003977566957473755, -0.0003727078437805176, -0.00034765899181365967, -0.00032261013984680176, -0.00029756128787994385, -0.00027251243591308594, -0.00024746358394622803, -0.00022241473197937012, -0.0001973658800125122, -0.0001723170280456543, -0.0001472681760787964, -0.00012221932411193848, -9.717047214508057e-05, -7.212162017822266e-05, -4.7072768211364746e-05, -2.2023916244506836e-05, 3.0249357223510742e-06, 2.8073787689208984e-05, 5.3122639656066895e-05, 7.81714916229248e-05, 0.00010322034358978271, 0.00012826919555664062, 0.00015331804752349854, 0.00017836689949035645, 0.00020341575145721436, 0.00022846460342407227, 0.0002535134553909302, 0.0002785623073577881, 0.000303611159324646, 0.0003286600112915039, 0.0003537088632583618, 0.0003787577152252197, 0.00040380656719207764, 0.00042885541915893555, 0.00045390427112579346, 0.00047895312309265137, 0.0005040019750595093, 0.0005290508270263672, 0.0005540996789932251, 0.000579148530960083, 0.0006041973829269409, 0.0006292462348937988, 0.0006542950868606567, 0.0006793439388275146, 0.0007043927907943726, 0.0007294416427612305, 0.0007544904947280884, 0.0007795393466949463, 0.0008045881986618042, 0.0008296370506286621, 0.00085468590259552, 0.0008797347545623779, 0.0009047836065292358, 0.0009298324584960938]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 26.0, 24.0, 36.0, 49.0, 60.0, 103.0, 155.0, 228.0, 315.0, 487.0, 802.0, 1391.0, 2262.0, 4103.0, 7155.0, 13721.0, 27192.0, 56831.0, 132686.0, 284589.0, 277865.0, 127116.0, 55081.0, 26162.0, 13188.0, 7107.0, 3941.0, 2298.0, 1318.0, 761.0, 459.0, 310.0, 231.0, 143.0, 97.0, 71.0, 37.0, 42.0, 25.0, 19.0, 8.0, 14.0, 11.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.515625, -11.1314697265625, -10.747314453125, -10.3631591796875, -9.97900390625, -9.5948486328125, -9.210693359375, -8.8265380859375, -8.4423828125, -8.0582275390625, -7.674072265625, -7.2899169921875, -6.90576171875, -6.5216064453125, -6.137451171875, -5.7532958984375, -5.369140625, -4.9849853515625, -4.600830078125, -4.2166748046875, -3.83251953125, -3.4483642578125, -3.064208984375, -2.6800537109375, -2.2958984375, -1.9117431640625, -1.527587890625, -1.1434326171875, -0.75927734375, -0.3751220703125, 0.009033203125, 0.3931884765625, 0.77734375, 1.1614990234375, 1.545654296875, 1.9298095703125, 2.31396484375, 2.6981201171875, 3.082275390625, 3.4664306640625, 3.8505859375, 4.2347412109375, 4.618896484375, 5.0030517578125, 5.38720703125, 5.7713623046875, 6.155517578125, 6.5396728515625, 6.923828125, 7.3079833984375, 7.692138671875, 8.0762939453125, 8.46044921875, 8.8446044921875, 9.228759765625, 9.6129150390625, 9.9970703125, 10.3812255859375, 10.765380859375, 11.1495361328125, 11.53369140625, 11.9178466796875, 12.302001953125, 12.6861572265625, 13.0703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 10.0, 7.0, 8.0, 12.0, 7.0, 16.0, 26.0, 23.0, 18.0, 25.0, 44.0, 59.0, 48.0, 67.0, 85.0, 61.0, 74.0, 84.0, 52.0, 43.0, 30.0, 41.0, 33.0, 17.0, 23.0, 12.0, 16.0, 11.0, 8.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7421875, -3.6197509765625, -3.497314453125, -3.3748779296875, -3.25244140625, -3.1300048828125, -3.007568359375, -2.8851318359375, -2.7626953125, -2.6402587890625, -2.517822265625, -2.3953857421875, -2.27294921875, -2.1505126953125, -2.028076171875, -1.9056396484375, -1.783203125, -1.6607666015625, -1.538330078125, -1.4158935546875, -1.29345703125, -1.1710205078125, -1.048583984375, -0.9261474609375, -0.8037109375, -0.6812744140625, -0.558837890625, -0.4364013671875, -0.31396484375, -0.1915283203125, -0.069091796875, 0.0533447265625, 0.17578125, 0.2982177734375, 0.420654296875, 0.5430908203125, 0.66552734375, 0.7879638671875, 0.910400390625, 1.0328369140625, 1.1552734375, 1.2777099609375, 1.400146484375, 1.5225830078125, 1.64501953125, 1.7674560546875, 1.889892578125, 2.0123291015625, 2.134765625, 2.2572021484375, 2.379638671875, 2.5020751953125, 2.62451171875, 2.7469482421875, 2.869384765625, 2.9918212890625, 3.1142578125, 3.2366943359375, 3.359130859375, 3.4815673828125, 3.60400390625, 3.7264404296875, 3.848876953125, 3.9713134765625, 4.09375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 12.0, 16.0, 13.0, 20.0, 24.0, 33.0, 39.0, 33.0, 57.0, 62.0, 73.0, 64.0, 79.0, 70.0, 71.0, 76.0, 45.0, 31.0, 39.0, 22.0, 17.0, 16.0, 20.0, 12.0, 9.0, 7.0, 6.0, 1.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.1654167175293, -42.00754928588867, -40.84968185424805, -39.69181442260742, -38.53395080566406, -37.37608337402344, -36.21821594238281, -35.06034851074219, -33.90248107910156, -32.74461364746094, -31.586746215820312, -30.42888069152832, -29.271013259887695, -28.11314582824707, -26.955280303955078, -25.797412872314453, -24.639545440673828, -23.481678009033203, -22.323810577392578, -21.165945053100586, -20.00807762145996, -18.850210189819336, -17.692344665527344, -16.53447723388672, -15.376609802246094, -14.218742370605469, -13.06087589263916, -11.903009414672852, -10.745141983032227, -9.587274551391602, -8.429408073425293, -7.271541595458984, -6.113676071166992, -4.955809116363525, -3.7979421615600586, -2.640075206756592, -1.482208251953125, -0.3243412971496582, 0.8335256576538086, 1.9913921356201172, 3.149259567260742, 4.307126522064209, 5.464993476867676, 6.622860431671143, 7.780727386474609, 8.938594818115234, 10.096461296081543, 11.254327774047852, 12.412195205688477, 13.570062637329102, 14.72792911529541, 15.885795593261719, 17.043663024902344, 18.20153045654297, 19.359397888183594, 20.517263412475586, 21.67513084411621, 22.832998275756836, 23.990863800048828, 25.148731231689453, 26.306598663330078, 27.464466094970703, 28.622333526611328, 29.78019905090332, 30.938066482543945]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 7.0, 7.0, 17.0, 12.0, 17.0, 20.0, 21.0, 17.0, 22.0, 17.0, 26.0, 32.0, 35.0, 35.0, 40.0, 31.0, 44.0, 47.0, 29.0, 42.0, 45.0, 39.0, 44.0, 37.0, 33.0, 22.0, 29.0, 28.0, 18.0, 21.0, 20.0, 20.0, 24.0, 13.0, 14.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.629261016845703, -25.817188262939453, -25.005117416381836, -24.193044662475586, -23.380971908569336, -22.56890106201172, -21.75682830810547, -20.94475555419922, -20.13268280029297, -19.32061004638672, -18.5085391998291, -17.69646644592285, -16.8843936920166, -16.072322845458984, -15.260250091552734, -14.448177337646484, -13.636106491088867, -12.824034690856934, -12.011961936950684, -11.19989013671875, -10.3878173828125, -9.575745582580566, -8.763673782348633, -7.951601505279541, -7.139529228210449, -6.327456951141357, -5.515384674072266, -4.703312873840332, -3.8912405967712402, -3.0791683197021484, -2.267096519470215, -1.455024242401123, -0.6429519653320312, 0.169120192527771, 0.9811923503875732, 1.793264389038086, 2.6053366661071777, 3.4174089431762695, 4.229480743408203, 5.041553020477295, 5.853625297546387, 6.6656975746154785, 7.47776985168457, 8.289841651916504, 9.101913452148438, 9.913986206054688, 10.726058006286621, 11.538129806518555, 12.350202560424805, 13.162274360656738, 13.974347114562988, 14.786418914794922, 15.598491668701172, 16.410564422607422, 17.22263526916504, 18.03470802307129, 18.846778869628906, 19.658851623535156, 20.470922470092773, 21.282995223999023, 22.095067977905273, 22.90713882446289, 23.71921157836914, 24.53128433227539, 25.34335708618164]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 7.0, 26.0, 29.0, 46.0, 66.0, 94.0, 103.0, 193.0, 275.0, 418.0, 595.0, 867.0, 1227.0, 1786.0, 2693.0, 3842.0, 5901.0, 8841.0, 13363.0, 20522.0, 31955.0, 49995.0, 79080.0, 121049.0, 167738.0, 172279.0, 128502.0, 84280.0, 53910.0, 34106.0, 21931.0, 14165.0, 9448.0, 6216.0, 4192.0, 2840.0, 1916.0, 1252.0, 872.0, 614.0, 428.0, 273.0, 184.0, 155.0, 73.0, 70.0, 44.0, 27.0, 21.0, 12.0, 8.0, 6.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-28.625, -27.703857421875, -26.78271484375, -25.861572265625, -24.9404296875, -24.019287109375, -23.09814453125, -22.177001953125, -21.255859375, -20.334716796875, -19.41357421875, -18.492431640625, -17.5712890625, -16.650146484375, -15.72900390625, -14.807861328125, -13.88671875, -12.965576171875, -12.04443359375, -11.123291015625, -10.2021484375, -9.281005859375, -8.35986328125, -7.438720703125, -6.517578125, -5.596435546875, -4.67529296875, -3.754150390625, -2.8330078125, -1.911865234375, -0.99072265625, -0.069580078125, 0.8515625, 1.772705078125, 2.69384765625, 3.614990234375, 4.5361328125, 5.457275390625, 6.37841796875, 7.299560546875, 8.220703125, 9.141845703125, 10.06298828125, 10.984130859375, 11.9052734375, 12.826416015625, 13.74755859375, 14.668701171875, 15.58984375, 16.510986328125, 17.43212890625, 18.353271484375, 19.2744140625, 20.195556640625, 21.11669921875, 22.037841796875, 22.958984375, 23.880126953125, 24.80126953125, 25.722412109375, 26.6435546875, 27.564697265625, 28.48583984375, 29.406982421875, 30.328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 9.0, 8.0, 13.0, 14.0, 18.0, 14.0, 14.0, 16.0, 30.0, 21.0, 28.0, 31.0, 41.0, 35.0, 34.0, 27.0, 43.0, 41.0, 46.0, 30.0, 51.0, 48.0, 32.0, 36.0, 37.0, 29.0, 28.0, 21.0, 24.0, 19.0, 21.0, 23.0, 16.0, 20.0, 13.0, 12.0, 12.0, 11.0, 3.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.671875, -25.84326171875, -25.0146484375, -24.18603515625, -23.357421875, -22.52880859375, -21.7001953125, -20.87158203125, -20.04296875, -19.21435546875, -18.3857421875, -17.55712890625, -16.728515625, -15.89990234375, -15.0712890625, -14.24267578125, -13.4140625, -12.58544921875, -11.7568359375, -10.92822265625, -10.099609375, -9.27099609375, -8.4423828125, -7.61376953125, -6.78515625, -5.95654296875, -5.1279296875, -4.29931640625, -3.470703125, -2.64208984375, -1.8134765625, -0.98486328125, -0.15625, 0.67236328125, 1.5009765625, 2.32958984375, 3.158203125, 3.98681640625, 4.8154296875, 5.64404296875, 6.47265625, 7.30126953125, 8.1298828125, 8.95849609375, 9.787109375, 10.61572265625, 11.4443359375, 12.27294921875, 13.1015625, 13.93017578125, 14.7587890625, 15.58740234375, 16.416015625, 17.24462890625, 18.0732421875, 18.90185546875, 19.73046875, 20.55908203125, 21.3876953125, 22.21630859375, 23.044921875, 23.87353515625, 24.7021484375, 25.53076171875, 26.359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 10.0, 8.0, 18.0, 15.0, 38.0, 42.0, 73.0, 131.0, 223.0, 293.0, 510.0, 806.0, 1214.0, 1953.0, 2997.0, 4762.0, 7716.0, 12501.0, 20206.0, 33788.0, 58153.0, 101080.0, 168514.0, 218334.0, 168854.0, 101090.0, 57975.0, 33532.0, 20255.0, 12409.0, 7718.0, 4829.0, 3123.0, 2021.0, 1237.0, 783.0, 449.0, 351.0, 193.0, 156.0, 73.0, 48.0, 33.0, 20.0, 10.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.53125, -36.37646484375, -35.2216796875, -34.06689453125, -32.912109375, -31.75732421875, -30.6025390625, -29.44775390625, -28.29296875, -27.13818359375, -25.9833984375, -24.82861328125, -23.673828125, -22.51904296875, -21.3642578125, -20.20947265625, -19.0546875, -17.89990234375, -16.7451171875, -15.59033203125, -14.435546875, -13.28076171875, -12.1259765625, -10.97119140625, -9.81640625, -8.66162109375, -7.5068359375, -6.35205078125, -5.197265625, -4.04248046875, -2.8876953125, -1.73291015625, -0.578125, 0.57666015625, 1.7314453125, 2.88623046875, 4.041015625, 5.19580078125, 6.3505859375, 7.50537109375, 8.66015625, 9.81494140625, 10.9697265625, 12.12451171875, 13.279296875, 14.43408203125, 15.5888671875, 16.74365234375, 17.8984375, 19.05322265625, 20.2080078125, 21.36279296875, 22.517578125, 23.67236328125, 24.8271484375, 25.98193359375, 27.13671875, 28.29150390625, 29.4462890625, 30.60107421875, 31.755859375, 32.91064453125, 34.0654296875, 35.22021484375, 36.375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 7.0, 16.0, 21.0, 19.0, 11.0, 18.0, 18.0, 26.0, 23.0, 25.0, 25.0, 42.0, 26.0, 41.0, 39.0, 35.0, 47.0, 36.0, 38.0, 46.0, 43.0, 28.0, 37.0, 35.0, 39.0, 29.0, 32.0, 29.0, 12.0, 16.0, 20.0, 20.0, 14.0, 9.0, 15.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.75, -17.2158203125, -16.681640625, -16.1474609375, -15.61328125, -15.0791015625, -14.544921875, -14.0107421875, -13.4765625, -12.9423828125, -12.408203125, -11.8740234375, -11.33984375, -10.8056640625, -10.271484375, -9.7373046875, -9.203125, -8.6689453125, -8.134765625, -7.6005859375, -7.06640625, -6.5322265625, -5.998046875, -5.4638671875, -4.9296875, -4.3955078125, -3.861328125, -3.3271484375, -2.79296875, -2.2587890625, -1.724609375, -1.1904296875, -0.65625, -0.1220703125, 0.412109375, 0.9462890625, 1.48046875, 2.0146484375, 2.548828125, 3.0830078125, 3.6171875, 4.1513671875, 4.685546875, 5.2197265625, 5.75390625, 6.2880859375, 6.822265625, 7.3564453125, 7.890625, 8.4248046875, 8.958984375, 9.4931640625, 10.02734375, 10.5615234375, 11.095703125, 11.6298828125, 12.1640625, 12.6982421875, 13.232421875, 13.7666015625, 14.30078125, 14.8349609375, 15.369140625, 15.9033203125, 16.4375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 15.0, 15.0, 29.0, 30.0, 48.0, 65.0, 105.0, 156.0, 208.0, 327.0, 494.0, 727.0, 1156.0, 1781.0, 2919.0, 4789.0, 7852.0, 13825.0, 25051.0, 46071.0, 89734.0, 172152.0, 259253.0, 196347.0, 103955.0, 53728.0, 28562.0, 15783.0, 9036.0, 5321.0, 3257.0, 2043.0, 1243.0, 818.0, 540.0, 357.0, 228.0, 157.0, 107.0, 78.0, 46.0, 42.0, 29.0, 19.0, 16.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-13.296875, -12.88916015625, -12.4814453125, -12.07373046875, -11.666015625, -11.25830078125, -10.8505859375, -10.44287109375, -10.03515625, -9.62744140625, -9.2197265625, -8.81201171875, -8.404296875, -7.99658203125, -7.5888671875, -7.18115234375, -6.7734375, -6.36572265625, -5.9580078125, -5.55029296875, -5.142578125, -4.73486328125, -4.3271484375, -3.91943359375, -3.51171875, -3.10400390625, -2.6962890625, -2.28857421875, -1.880859375, -1.47314453125, -1.0654296875, -0.65771484375, -0.25, 0.15771484375, 0.5654296875, 0.97314453125, 1.380859375, 1.78857421875, 2.1962890625, 2.60400390625, 3.01171875, 3.41943359375, 3.8271484375, 4.23486328125, 4.642578125, 5.05029296875, 5.4580078125, 5.86572265625, 6.2734375, 6.68115234375, 7.0888671875, 7.49658203125, 7.904296875, 8.31201171875, 8.7197265625, 9.12744140625, 9.53515625, 9.94287109375, 10.3505859375, 10.75830078125, 11.166015625, 11.57373046875, 11.9814453125, 12.38916015625, 12.796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 9.0, 10.0, 12.0, 12.0, 15.0, 25.0, 37.0, 52.0, 88.0, 96.0, 128.0, 113.0, 112.0, 87.0, 59.0, 45.0, 27.0, 18.0, 18.0, 12.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017309188842773438, -0.0016647130250930786, -0.0015985071659088135, -0.0015323013067245483, -0.0014660954475402832, -0.001399889588356018, -0.001333683729171753, -0.0012674778699874878, -0.0012012720108032227, -0.0011350661516189575, -0.0010688602924346924, -0.0010026544332504272, -0.0009364485740661621, -0.000870242714881897, -0.0008040368556976318, -0.0007378309965133667, -0.0006716251373291016, -0.0006054192781448364, -0.0005392134189605713, -0.00047300755977630615, -0.000406801700592041, -0.0003405958414077759, -0.00027438998222351074, -0.0002081841230392456, -0.00014197826385498047, -7.577240467071533e-05, -9.566545486450195e-06, 5.663931369781494e-05, 0.00012284517288208008, 0.00018905103206634521, 0.00025525689125061035, 0.0003214627504348755, 0.0003876686096191406, 0.00045387446880340576, 0.0005200803279876709, 0.000586286187171936, 0.0006524920463562012, 0.0007186979055404663, 0.0007849037647247314, 0.0008511096239089966, 0.0009173154830932617, 0.0009835213422775269, 0.001049727201461792, 0.0011159330606460571, 0.0011821389198303223, 0.0012483447790145874, 0.0013145506381988525, 0.0013807564973831177, 0.0014469623565673828, 0.001513168215751648, 0.001579374074935913, 0.0016455799341201782, 0.0017117857933044434, 0.0017779916524887085, 0.0018441975116729736, 0.0019104033708572388, 0.001976609230041504, 0.002042815089225769, 0.002109020948410034, 0.0021752268075942993, 0.0022414326667785645, 0.0023076385259628296, 0.0023738443851470947, 0.00244005024433136, 0.002506256103515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 7.0, 9.0, 16.0, 20.0, 32.0, 45.0, 55.0, 71.0, 96.0, 143.0, 188.0, 267.0, 403.0, 527.0, 760.0, 1043.0, 1682.0, 2420.0, 3479.0, 5413.0, 8295.0, 13206.0, 21171.0, 35188.0, 58665.0, 99786.0, 165383.0, 215301.0, 163863.0, 99056.0, 58414.0, 34835.0, 21127.0, 13155.0, 8088.0, 5241.0, 3455.0, 2332.0, 1590.0, 1065.0, 795.0, 548.0, 359.0, 269.0, 198.0, 138.0, 106.0, 75.0, 62.0, 33.0, 28.0, 23.0, 13.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-10.8515625, -10.5069580078125, -10.162353515625, -9.8177490234375, -9.47314453125, -9.1285400390625, -8.783935546875, -8.4393310546875, -8.0947265625, -7.7501220703125, -7.405517578125, -7.0609130859375, -6.71630859375, -6.3717041015625, -6.027099609375, -5.6824951171875, -5.337890625, -4.9932861328125, -4.648681640625, -4.3040771484375, -3.95947265625, -3.6148681640625, -3.270263671875, -2.9256591796875, -2.5810546875, -2.2364501953125, -1.891845703125, -1.5472412109375, -1.20263671875, -0.8580322265625, -0.513427734375, -0.1688232421875, 0.17578125, 0.5203857421875, 0.864990234375, 1.2095947265625, 1.55419921875, 1.8988037109375, 2.243408203125, 2.5880126953125, 2.9326171875, 3.2772216796875, 3.621826171875, 3.9664306640625, 4.31103515625, 4.6556396484375, 5.000244140625, 5.3448486328125, 5.689453125, 6.0340576171875, 6.378662109375, 6.7232666015625, 7.06787109375, 7.4124755859375, 7.757080078125, 8.1016845703125, 8.4462890625, 8.7908935546875, 9.135498046875, 9.4801025390625, 9.82470703125, 10.1693115234375, 10.513916015625, 10.8585205078125, 11.203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 9.0, 13.0, 14.0, 14.0, 22.0, 25.0, 36.0, 31.0, 25.0, 44.0, 44.0, 45.0, 71.0, 72.0, 70.0, 54.0, 50.0, 56.0, 48.0, 29.0, 35.0, 39.0, 23.0, 26.0, 18.0, 12.0, 12.0, 6.0, 2.0, 5.0, 4.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.0289306640625, -3.885986328125, -3.7430419921875, -3.60009765625, -3.4571533203125, -3.314208984375, -3.1712646484375, -3.0283203125, -2.8853759765625, -2.742431640625, -2.5994873046875, -2.45654296875, -2.3135986328125, -2.170654296875, -2.0277099609375, -1.884765625, -1.7418212890625, -1.598876953125, -1.4559326171875, -1.31298828125, -1.1700439453125, -1.027099609375, -0.8841552734375, -0.7412109375, -0.5982666015625, -0.455322265625, -0.3123779296875, -0.16943359375, -0.0264892578125, 0.116455078125, 0.2593994140625, 0.40234375, 0.5452880859375, 0.688232421875, 0.8311767578125, 0.97412109375, 1.1170654296875, 1.260009765625, 1.4029541015625, 1.5458984375, 1.6888427734375, 1.831787109375, 1.9747314453125, 2.11767578125, 2.2606201171875, 2.403564453125, 2.5465087890625, 2.689453125, 2.8323974609375, 2.975341796875, 3.1182861328125, 3.26123046875, 3.4041748046875, 3.547119140625, 3.6900634765625, 3.8330078125, 3.9759521484375, 4.118896484375, 4.2618408203125, 4.40478515625, 4.5477294921875, 4.690673828125, 4.8336181640625, 4.9765625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 9.0, 10.0, 12.0, 23.0, 14.0, 33.0, 25.0, 34.0, 52.0, 52.0, 51.0, 69.0, 80.0, 69.0, 71.0, 63.0, 56.0, 50.0, 37.0, 38.0, 32.0, 24.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.26683807373047, -42.10720443725586, -40.947574615478516, -39.787940979003906, -38.62831115722656, -37.46867752075195, -36.30904769897461, -35.1494140625, -33.989784240722656, -32.83015060424805, -31.670520782470703, -30.510889053344727, -29.35125732421875, -28.19162368774414, -27.031991958618164, -25.872360229492188, -24.712726593017578, -23.5530948638916, -22.393463134765625, -21.23383140563965, -20.074199676513672, -18.914566040039062, -17.754934310913086, -16.59530258178711, -15.435670852661133, -14.276039123535156, -13.11640739440918, -11.956774711608887, -10.79714298248291, -9.637511253356934, -8.47787857055664, -7.318246841430664, -6.158613204956055, -4.998981475830078, -3.8393492698669434, -2.6797173023223877, -1.520085334777832, -0.36045360565185547, 0.7991786003112793, 1.958810806274414, 3.1184425354003906, 4.278074264526367, 5.437706470489502, 6.597338676452637, 7.756970405578613, 8.91660213470459, 10.076234817504883, 11.23586654663086, 12.395498275756836, 13.555130004882812, 14.714761734008789, 15.874394416809082, 17.034027099609375, 18.19365692138672, 19.353290557861328, 20.512922286987305, 21.67255401611328, 22.832185745239258, 23.991817474365234, 25.15144920349121, 26.311080932617188, 27.470714569091797, 28.630346298217773, 29.78997802734375, 30.949609756469727]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 7.0, 15.0, 15.0, 12.0, 13.0, 27.0, 22.0, 25.0, 26.0, 19.0, 32.0, 35.0, 33.0, 39.0, 49.0, 41.0, 45.0, 39.0, 50.0, 49.0, 36.0, 39.0, 28.0, 31.0, 32.0, 22.0, 32.0, 21.0, 23.0, 24.0, 15.0, 21.0, 14.0, 10.0, 5.0, 10.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-29.358545303344727, -28.471513748168945, -27.584484100341797, -26.697452545166016, -25.810420989990234, -24.923389434814453, -24.036357879638672, -23.149328231811523, -22.262296676635742, -21.37526512145996, -20.488235473632812, -19.60120391845703, -18.71417236328125, -17.82714080810547, -16.940109252929688, -16.05307960510254, -15.166048049926758, -14.279016494750977, -13.391985893249512, -12.504955291748047, -11.617923736572266, -10.730892181396484, -9.84386157989502, -8.956830978393555, -8.069799423217773, -7.18276834487915, -6.295737266540527, -5.408706188201904, -4.521675109863281, -3.634644031524658, -2.747612953186035, -1.860581874847412, -0.9735527038574219, -0.08652162551879883, 0.8005094528198242, 1.6875405311584473, 2.5745716094970703, 3.4616026878356934, 4.348633766174316, 5.2356648445129395, 6.1226959228515625, 7.0097270011901855, 7.896758079528809, 8.783788681030273, 9.670820236206055, 10.557851791381836, 11.4448823928833, 12.331912994384766, 13.218944549560547, 14.105976104736328, 14.993006706237793, 15.880037307739258, 16.76706886291504, 17.65410041809082, 18.54113006591797, 19.42816162109375, 20.31519317626953, 21.202224731445312, 22.089256286621094, 22.976285934448242, 23.863317489624023, 24.750349044799805, 25.637378692626953, 26.524410247802734, 27.411441802978516]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 17.0, 27.0, 44.0, 49.0, 80.0, 122.0, 136.0, 221.0, 345.0, 466.0, 804.0, 1178.0, 1860.0, 3111.0, 5185.0, 8839.0, 15820.0, 30271.0, 62163.0, 154929.0, 539737.0, 1535579.0, 1229159.0, 379015.0, 117786.0, 50151.0, 24996.0, 13398.0, 7456.0, 4337.0, 2628.0, 1590.0, 986.0, 628.0, 387.0, 255.0, 175.0, 120.0, 64.0, 57.0, 34.0, 26.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-49.65625, -48.30908203125, -46.9619140625, -45.61474609375, -44.267578125, -42.92041015625, -41.5732421875, -40.22607421875, -38.87890625, -37.53173828125, -36.1845703125, -34.83740234375, -33.490234375, -32.14306640625, -30.7958984375, -29.44873046875, -28.1015625, -26.75439453125, -25.4072265625, -24.06005859375, -22.712890625, -21.36572265625, -20.0185546875, -18.67138671875, -17.32421875, -15.97705078125, -14.6298828125, -13.28271484375, -11.935546875, -10.58837890625, -9.2412109375, -7.89404296875, -6.546875, -5.19970703125, -3.8525390625, -2.50537109375, -1.158203125, 0.18896484375, 1.5361328125, 2.88330078125, 4.23046875, 5.57763671875, 6.9248046875, 8.27197265625, 9.619140625, 10.96630859375, 12.3134765625, 13.66064453125, 15.0078125, 16.35498046875, 17.7021484375, 19.04931640625, 20.396484375, 21.74365234375, 23.0908203125, 24.43798828125, 25.78515625, 27.13232421875, 28.4794921875, 29.82666015625, 31.173828125, 32.52099609375, 33.8681640625, 35.21533203125, 36.5625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 6.0, 13.0, 15.0, 14.0, 13.0, 19.0, 21.0, 27.0, 29.0, 18.0, 29.0, 36.0, 40.0, 38.0, 37.0, 35.0, 49.0, 48.0, 49.0, 52.0, 43.0, 48.0, 36.0, 28.0, 31.0, 23.0, 21.0, 26.0, 26.0, 16.0, 17.0, 20.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.84375, -25.05224609375, -24.2607421875, -23.46923828125, -22.677734375, -21.88623046875, -21.0947265625, -20.30322265625, -19.51171875, -18.72021484375, -17.9287109375, -17.13720703125, -16.345703125, -15.55419921875, -14.7626953125, -13.97119140625, -13.1796875, -12.38818359375, -11.5966796875, -10.80517578125, -10.013671875, -9.22216796875, -8.4306640625, -7.63916015625, -6.84765625, -6.05615234375, -5.2646484375, -4.47314453125, -3.681640625, -2.89013671875, -2.0986328125, -1.30712890625, -0.515625, 0.27587890625, 1.0673828125, 1.85888671875, 2.650390625, 3.44189453125, 4.2333984375, 5.02490234375, 5.81640625, 6.60791015625, 7.3994140625, 8.19091796875, 8.982421875, 9.77392578125, 10.5654296875, 11.35693359375, 12.1484375, 12.93994140625, 13.7314453125, 14.52294921875, 15.314453125, 16.10595703125, 16.8974609375, 17.68896484375, 18.48046875, 19.27197265625, 20.0634765625, 20.85498046875, 21.646484375, 22.43798828125, 23.2294921875, 24.02099609375, 24.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 9.0, 10.0, 12.0, 14.0, 21.0, 38.0, 55.0, 68.0, 102.0, 154.0, 227.0, 343.0, 557.0, 834.0, 1308.0, 1975.0, 3129.0, 5135.0, 8686.0, 14954.0, 26342.0, 49705.0, 98836.0, 216866.0, 547488.0, 1462841.0, 1051277.0, 377911.0, 159083.0, 75207.0, 38878.0, 21143.0, 12090.0, 7223.0, 4312.0, 2631.0, 1649.0, 1104.0, 711.0, 437.0, 352.0, 192.0, 128.0, 98.0, 43.0, 42.0, 21.0, 24.0, 10.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.46875, -39.1552734375, -37.841796875, -36.5283203125, -35.21484375, -33.9013671875, -32.587890625, -31.2744140625, -29.9609375, -28.6474609375, -27.333984375, -26.0205078125, -24.70703125, -23.3935546875, -22.080078125, -20.7666015625, -19.453125, -18.1396484375, -16.826171875, -15.5126953125, -14.19921875, -12.8857421875, -11.572265625, -10.2587890625, -8.9453125, -7.6318359375, -6.318359375, -5.0048828125, -3.69140625, -2.3779296875, -1.064453125, 0.2490234375, 1.5625, 2.8759765625, 4.189453125, 5.5029296875, 6.81640625, 8.1298828125, 9.443359375, 10.7568359375, 12.0703125, 13.3837890625, 14.697265625, 16.0107421875, 17.32421875, 18.6376953125, 19.951171875, 21.2646484375, 22.578125, 23.8916015625, 25.205078125, 26.5185546875, 27.83203125, 29.1455078125, 30.458984375, 31.7724609375, 33.0859375, 34.3994140625, 35.712890625, 37.0263671875, 38.33984375, 39.6533203125, 40.966796875, 42.2802734375, 43.59375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 14.0, 11.0, 17.0, 17.0, 23.0, 43.0, 51.0, 58.0, 56.0, 94.0, 112.0, 165.0, 217.0, 251.0, 324.0, 411.0, 439.0, 369.0, 310.0, 258.0, 183.0, 139.0, 119.0, 91.0, 60.0, 56.0, 41.0, 26.0, 26.0, 12.0, 18.0, 4.0, 9.0, 6.0, 9.0, 7.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.2232666015625, -12.774658203125, -12.3260498046875, -11.87744140625, -11.4288330078125, -10.980224609375, -10.5316162109375, -10.0830078125, -9.6343994140625, -9.185791015625, -8.7371826171875, -8.28857421875, -7.8399658203125, -7.391357421875, -6.9427490234375, -6.494140625, -6.0455322265625, -5.596923828125, -5.1483154296875, -4.69970703125, -4.2510986328125, -3.802490234375, -3.3538818359375, -2.9052734375, -2.4566650390625, -2.008056640625, -1.5594482421875, -1.11083984375, -0.6622314453125, -0.213623046875, 0.2349853515625, 0.68359375, 1.1322021484375, 1.580810546875, 2.0294189453125, 2.47802734375, 2.9266357421875, 3.375244140625, 3.8238525390625, 4.2724609375, 4.7210693359375, 5.169677734375, 5.6182861328125, 6.06689453125, 6.5155029296875, 6.964111328125, 7.4127197265625, 7.861328125, 8.3099365234375, 8.758544921875, 9.2071533203125, 9.65576171875, 10.1043701171875, 10.552978515625, 11.0015869140625, 11.4501953125, 11.8988037109375, 12.347412109375, 12.7960205078125, 13.24462890625, 13.6932373046875, 14.141845703125, 14.5904541015625, 15.0390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 10.0, 20.0, 22.0, 15.0, 34.0, 47.0, 37.0, 35.0, 70.0, 61.0, 78.0, 71.0, 83.0, 68.0, 68.0, 56.0, 43.0, 35.0, 27.0, 20.0, 18.0, 17.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.255611419677734, -37.085819244384766, -35.91602325439453, -34.74623107910156, -33.57643508911133, -32.40664291381836, -31.236846923828125, -30.067054748535156, -28.897258758544922, -27.72746467590332, -26.55767059326172, -25.387876510620117, -24.218082427978516, -23.048288345336914, -21.878494262695312, -20.708702087402344, -19.538908004760742, -18.36911392211914, -17.19931983947754, -16.029525756835938, -14.859731674194336, -13.689937591552734, -12.52014446258545, -11.350350379943848, -10.180556297302246, -9.010762214660645, -7.840968132019043, -6.6711745262146, -5.501380443572998, -4.3315863609313965, -3.161792755126953, -1.9919986724853516, -0.82220458984375, 0.347589373588562, 1.517383337020874, 2.6871771812438965, 3.856971263885498, 5.0267653465271, 6.196558952331543, 7.3663530349731445, 8.536147117614746, 9.705941200256348, 10.87573528289795, 12.045528411865234, 13.215322494506836, 14.385116577148438, 15.554910659790039, 16.72470474243164, 17.894498825073242, 19.064292907714844, 20.234086990356445, 21.403881072998047, 22.57367515563965, 23.74346923828125, 24.91326141357422, 26.083057403564453, 27.252849578857422, 28.422643661499023, 29.592437744140625, 30.762231826782227, 31.932025909423828, 33.1018180847168, 34.27161407470703, 35.44140625, 36.611202239990234]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 9.0, 18.0, 14.0, 13.0, 23.0, 15.0, 18.0, 28.0, 28.0, 33.0, 25.0, 24.0, 40.0, 31.0, 42.0, 36.0, 35.0, 44.0, 39.0, 44.0, 35.0, 45.0, 43.0, 43.0, 40.0, 27.0, 15.0, 20.0, 36.0, 21.0, 13.0, 14.0, 11.0, 13.0, 11.0, 9.0, 4.0, 4.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.972131729125977, -27.14262580871582, -26.31311798095703, -25.483612060546875, -24.65410614013672, -23.82459831237793, -22.995092391967773, -22.165584564208984, -21.336078643798828, -20.506572723388672, -19.677064895629883, -18.847558975219727, -18.018051147460938, -17.18854522705078, -16.359039306640625, -15.529532432556152, -14.70002555847168, -13.870518684387207, -13.041011810302734, -12.211505889892578, -11.381999015808105, -10.552492141723633, -9.722986221313477, -8.893479347229004, -8.063972473144531, -7.234465599060059, -6.404959201812744, -5.57545280456543, -4.745945930480957, -3.9164390563964844, -3.08693265914917, -2.2574262619018555, -1.4279193878173828, -0.5984127521514893, 0.2310938835144043, 1.0606005191802979, 1.8901071548461914, 2.719614028930664, 3.5491204261779785, 4.378626823425293, 5.208133697509766, 6.037640571594238, 6.867146968841553, 7.696653366088867, 8.52616024017334, 9.355667114257812, 10.185173034667969, 11.014679908752441, 11.844186782836914, 12.673693656921387, 13.50320053100586, 14.332706451416016, 15.162213325500488, 15.991720199584961, 16.821226119995117, 17.650733947753906, 18.480239868164062, 19.30974578857422, 20.139253616333008, 20.968759536743164, 21.798267364501953, 22.62777328491211, 23.457279205322266, 24.286785125732422, 25.11629295349121]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 13.0, 11.0, 40.0, 57.0, 71.0, 112.0, 148.0, 282.0, 403.0, 660.0, 978.0, 1592.0, 2518.0, 3827.0, 6479.0, 10157.0, 17138.0, 29844.0, 54302.0, 104605.0, 210993.0, 273010.0, 154197.0, 76789.0, 41323.0, 23243.0, 13595.0, 8291.0, 5007.0, 3311.0, 2010.0, 1297.0, 789.0, 504.0, 323.0, 213.0, 137.0, 87.0, 62.0, 42.0, 24.0, 23.0, 15.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.4443359375, -22.669921875, -21.8955078125, -21.12109375, -20.3466796875, -19.572265625, -18.7978515625, -18.0234375, -17.2490234375, -16.474609375, -15.7001953125, -14.92578125, -14.1513671875, -13.376953125, -12.6025390625, -11.828125, -11.0537109375, -10.279296875, -9.5048828125, -8.73046875, -7.9560546875, -7.181640625, -6.4072265625, -5.6328125, -4.8583984375, -4.083984375, -3.3095703125, -2.53515625, -1.7607421875, -0.986328125, -0.2119140625, 0.5625, 1.3369140625, 2.111328125, 2.8857421875, 3.66015625, 4.4345703125, 5.208984375, 5.9833984375, 6.7578125, 7.5322265625, 8.306640625, 9.0810546875, 9.85546875, 10.6298828125, 11.404296875, 12.1787109375, 12.953125, 13.7275390625, 14.501953125, 15.2763671875, 16.05078125, 16.8251953125, 17.599609375, 18.3740234375, 19.1484375, 19.9228515625, 20.697265625, 21.4716796875, 22.24609375, 23.0205078125, 23.794921875, 24.5693359375, 25.34375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 11.0, 22.0, 20.0, 16.0, 22.0, 26.0, 21.0, 24.0, 30.0, 41.0, 30.0, 35.0, 51.0, 36.0, 54.0, 46.0, 52.0, 42.0, 34.0, 55.0, 45.0, 33.0, 33.0, 19.0, 19.0, 29.0, 26.0, 17.0, 16.0, 9.0, 10.0, 12.0, 6.0, 2.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.03125, -29.1220703125, -28.212890625, -27.3037109375, -26.39453125, -25.4853515625, -24.576171875, -23.6669921875, -22.7578125, -21.8486328125, -20.939453125, -20.0302734375, -19.12109375, -18.2119140625, -17.302734375, -16.3935546875, -15.484375, -14.5751953125, -13.666015625, -12.7568359375, -11.84765625, -10.9384765625, -10.029296875, -9.1201171875, -8.2109375, -7.3017578125, -6.392578125, -5.4833984375, -4.57421875, -3.6650390625, -2.755859375, -1.8466796875, -0.9375, -0.0283203125, 0.880859375, 1.7900390625, 2.69921875, 3.6083984375, 4.517578125, 5.4267578125, 6.3359375, 7.2451171875, 8.154296875, 9.0634765625, 9.97265625, 10.8818359375, 11.791015625, 12.7001953125, 13.609375, 14.5185546875, 15.427734375, 16.3369140625, 17.24609375, 18.1552734375, 19.064453125, 19.9736328125, 20.8828125, 21.7919921875, 22.701171875, 23.6103515625, 24.51953125, 25.4287109375, 26.337890625, 27.2470703125, 28.15625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 13.0, 8.0, 13.0, 20.0, 31.0, 28.0, 53.0, 81.0, 90.0, 152.0, 198.0, 325.0, 455.0, 632.0, 959.0, 1420.0, 2204.0, 3270.0, 5262.0, 8152.0, 13313.0, 22071.0, 39399.0, 74392.0, 155012.0, 302880.0, 205408.0, 94305.0, 48727.0, 26908.0, 15764.0, 9438.0, 5960.0, 3918.0, 2451.0, 1656.0, 1114.0, 810.0, 521.0, 376.0, 211.0, 150.0, 135.0, 88.0, 62.0, 34.0, 24.0, 24.0, 9.0, 10.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-28.65625, -27.75146484375, -26.8466796875, -25.94189453125, -25.037109375, -24.13232421875, -23.2275390625, -22.32275390625, -21.41796875, -20.51318359375, -19.6083984375, -18.70361328125, -17.798828125, -16.89404296875, -15.9892578125, -15.08447265625, -14.1796875, -13.27490234375, -12.3701171875, -11.46533203125, -10.560546875, -9.65576171875, -8.7509765625, -7.84619140625, -6.94140625, -6.03662109375, -5.1318359375, -4.22705078125, -3.322265625, -2.41748046875, -1.5126953125, -0.60791015625, 0.296875, 1.20166015625, 2.1064453125, 3.01123046875, 3.916015625, 4.82080078125, 5.7255859375, 6.63037109375, 7.53515625, 8.43994140625, 9.3447265625, 10.24951171875, 11.154296875, 12.05908203125, 12.9638671875, 13.86865234375, 14.7734375, 15.67822265625, 16.5830078125, 17.48779296875, 18.392578125, 19.29736328125, 20.2021484375, 21.10693359375, 22.01171875, 22.91650390625, 23.8212890625, 24.72607421875, 25.630859375, 26.53564453125, 27.4404296875, 28.34521484375, 29.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 10.0, 4.0, 12.0, 9.0, 16.0, 18.0, 15.0, 13.0, 23.0, 25.0, 19.0, 26.0, 33.0, 28.0, 26.0, 38.0, 31.0, 30.0, 41.0, 34.0, 44.0, 41.0, 42.0, 39.0, 34.0, 31.0, 35.0, 32.0, 33.0, 34.0, 24.0, 27.0, 19.0, 19.0, 19.0, 10.0, 11.0, 5.0, 14.0, 6.0, 3.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.65625, -14.1484375, -13.640625, -13.1328125, -12.625, -12.1171875, -11.609375, -11.1015625, -10.59375, -10.0859375, -9.578125, -9.0703125, -8.5625, -8.0546875, -7.546875, -7.0390625, -6.53125, -6.0234375, -5.515625, -5.0078125, -4.5, -3.9921875, -3.484375, -2.9765625, -2.46875, -1.9609375, -1.453125, -0.9453125, -0.4375, 0.0703125, 0.578125, 1.0859375, 1.59375, 2.1015625, 2.609375, 3.1171875, 3.625, 4.1328125, 4.640625, 5.1484375, 5.65625, 6.1640625, 6.671875, 7.1796875, 7.6875, 8.1953125, 8.703125, 9.2109375, 9.71875, 10.2265625, 10.734375, 11.2421875, 11.75, 12.2578125, 12.765625, 13.2734375, 13.78125, 14.2890625, 14.796875, 15.3046875, 15.8125, 16.3203125, 16.828125, 17.3359375, 17.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 8.0, 11.0, 24.0, 20.0, 41.0, 68.0, 82.0, 117.0, 197.0, 335.0, 528.0, 909.0, 1559.0, 3005.0, 5702.0, 11659.0, 25370.0, 62858.0, 182163.0, 431196.0, 201097.0, 68036.0, 27710.0, 12551.0, 5988.0, 3102.0, 1697.0, 1001.0, 534.0, 340.0, 224.0, 138.0, 76.0, 56.0, 42.0, 27.0, 33.0, 15.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.70703125, -11.296875, -10.88671875, -10.4765625, -10.06640625, -9.65625, -9.24609375, -8.8359375, -8.42578125, -8.015625, -7.60546875, -7.1953125, -6.78515625, -6.375, -5.96484375, -5.5546875, -5.14453125, -4.734375, -4.32421875, -3.9140625, -3.50390625, -3.09375, -2.68359375, -2.2734375, -1.86328125, -1.453125, -1.04296875, -0.6328125, -0.22265625, 0.1875, 0.59765625, 1.0078125, 1.41796875, 1.828125, 2.23828125, 2.6484375, 3.05859375, 3.46875, 3.87890625, 4.2890625, 4.69921875, 5.109375, 5.51953125, 5.9296875, 6.33984375, 6.75, 7.16015625, 7.5703125, 7.98046875, 8.390625, 8.80078125, 9.2109375, 9.62109375, 10.03125, 10.44140625, 10.8515625, 11.26171875, 11.671875, 12.08203125, 12.4921875, 12.90234375, 13.3125, 13.72265625, 14.1328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 23.0, 41.0, 36.0, 37.0, 66.0, 86.0, 108.0, 89.0, 115.0, 93.0, 50.0, 50.0, 44.0, 35.0, 18.0, 14.0, 20.0, 8.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013818740844726562, -0.0013416856527328491, -0.001301497220993042, -0.0012613087892532349, -0.0012211203575134277, -0.0011809319257736206, -0.0011407434940338135, -0.0011005550622940063, -0.0010603666305541992, -0.001020178198814392, -0.000979989767074585, -0.0009398013353347778, -0.0008996129035949707, -0.0008594244718551636, -0.0008192360401153564, -0.0007790476083755493, -0.0007388591766357422, -0.0006986707448959351, -0.0006584823131561279, -0.0006182938814163208, -0.0005781054496765137, -0.0005379170179367065, -0.0004977285861968994, -0.0004575401544570923, -0.00041735172271728516, -0.00037716329097747803, -0.0003369748592376709, -0.00029678642749786377, -0.00025659799575805664, -0.0002164095640182495, -0.00017622113227844238, -0.00013603270053863525, -9.584426879882812e-05, -5.5655837059020996e-05, -1.5467405319213867e-05, 2.4721026420593262e-05, 6.490945816040039e-05, 0.00010509788990020752, 0.00014528632164001465, 0.00018547475337982178, 0.0002256631851196289, 0.00026585161685943604, 0.00030604004859924316, 0.0003462284803390503, 0.0003864169120788574, 0.00042660534381866455, 0.0004667937755584717, 0.0005069822072982788, 0.0005471706390380859, 0.0005873590707778931, 0.0006275475025177002, 0.0006677359342575073, 0.0007079243659973145, 0.0007481127977371216, 0.0007883012294769287, 0.0008284896612167358, 0.000868678092956543, 0.0009088665246963501, 0.0009490549564361572, 0.0009892433881759644, 0.0010294318199157715, 0.0010696202516555786, 0.0011098086833953857, 0.0011499971151351929, 0.001190185546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 14.0, 16.0, 26.0, 37.0, 40.0, 74.0, 90.0, 161.0, 207.0, 311.0, 472.0, 739.0, 1183.0, 1844.0, 3029.0, 5032.0, 8606.0, 14913.0, 26812.0, 50837.0, 101220.0, 211750.0, 290174.0, 161745.0, 77637.0, 39747.0, 21536.0, 12099.0, 7020.0, 4257.0, 2455.0, 1576.0, 969.0, 662.0, 412.0, 260.0, 186.0, 110.0, 80.0, 62.0, 40.0, 25.0, 17.0, 15.0, 12.0, 9.0, 5.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5703125, -10.209716796875, -9.84912109375, -9.488525390625, -9.1279296875, -8.767333984375, -8.40673828125, -8.046142578125, -7.685546875, -7.324951171875, -6.96435546875, -6.603759765625, -6.2431640625, -5.882568359375, -5.52197265625, -5.161376953125, -4.80078125, -4.440185546875, -4.07958984375, -3.718994140625, -3.3583984375, -2.997802734375, -2.63720703125, -2.276611328125, -1.916015625, -1.555419921875, -1.19482421875, -0.834228515625, -0.4736328125, -0.113037109375, 0.24755859375, 0.608154296875, 0.96875, 1.329345703125, 1.68994140625, 2.050537109375, 2.4111328125, 2.771728515625, 3.13232421875, 3.492919921875, 3.853515625, 4.214111328125, 4.57470703125, 4.935302734375, 5.2958984375, 5.656494140625, 6.01708984375, 6.377685546875, 6.73828125, 7.098876953125, 7.45947265625, 7.820068359375, 8.1806640625, 8.541259765625, 8.90185546875, 9.262451171875, 9.623046875, 9.983642578125, 10.34423828125, 10.704833984375, 11.0654296875, 11.426025390625, 11.78662109375, 12.147216796875, 12.5078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 8.0, 1.0, 7.0, 7.0, 9.0, 10.0, 15.0, 21.0, 29.0, 29.0, 27.0, 38.0, 46.0, 50.0, 67.0, 61.0, 79.0, 60.0, 64.0, 55.0, 61.0, 52.0, 44.0, 37.0, 27.0, 16.0, 17.0, 21.0, 12.0, 10.0, 7.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248046875, -3.131256103515625, -3.01446533203125, -2.897674560546875, -2.7808837890625, -2.664093017578125, -2.54730224609375, -2.430511474609375, -2.313720703125, -2.196929931640625, -2.08013916015625, -1.963348388671875, -1.8465576171875, -1.729766845703125, -1.61297607421875, -1.496185302734375, -1.37939453125, -1.262603759765625, -1.14581298828125, -1.029022216796875, -0.9122314453125, -0.795440673828125, -0.67864990234375, -0.561859130859375, -0.445068359375, -0.328277587890625, -0.21148681640625, -0.094696044921875, 0.0220947265625, 0.138885498046875, 0.25567626953125, 0.372467041015625, 0.4892578125, 0.606048583984375, 0.72283935546875, 0.839630126953125, 0.9564208984375, 1.073211669921875, 1.19000244140625, 1.306793212890625, 1.423583984375, 1.540374755859375, 1.65716552734375, 1.773956298828125, 1.8907470703125, 2.007537841796875, 2.12432861328125, 2.241119384765625, 2.35791015625, 2.474700927734375, 2.59149169921875, 2.708282470703125, 2.8250732421875, 2.941864013671875, 3.05865478515625, 3.175445556640625, 3.292236328125, 3.409027099609375, 3.52581787109375, 3.642608642578125, 3.7593994140625, 3.876190185546875, 3.99298095703125, 4.109771728515625, 4.2265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 12.0, 13.0, 14.0, 19.0, 22.0, 24.0, 32.0, 39.0, 55.0, 54.0, 59.0, 75.0, 83.0, 86.0, 63.0, 61.0, 52.0, 43.0, 40.0, 30.0, 22.0, 19.0, 14.0, 24.0, 16.0, 10.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.25048828125, -36.11517333984375, -34.9798583984375, -33.84454345703125, -32.709228515625, -31.573911666870117, -30.438594818115234, -29.303279876708984, -28.167964935302734, -27.032649993896484, -25.897335052490234, -24.76201820373535, -23.6267032623291, -22.49138832092285, -21.35607147216797, -20.22075653076172, -19.08544158935547, -17.95012664794922, -16.81481170654297, -15.679494857788086, -14.544179916381836, -13.408864974975586, -12.27354907989502, -11.138233184814453, -10.002918243408203, -8.867603302001953, -7.732287406921387, -6.5969719886779785, -5.46165657043457, -4.326341152191162, -3.191025733947754, -2.0557103157043457, -0.9203987121582031, 0.21491670608520508, 1.3502321243286133, 2.4855475425720215, 3.6208629608154297, 4.756178379058838, 5.891493797302246, 7.026809215545654, 8.162124633789062, 9.297439575195312, 10.432755470275879, 11.568071365356445, 12.703386306762695, 13.838701248168945, 14.974017143249512, 16.109333038330078, 17.244647979736328, 18.379962921142578, 19.515277862548828, 20.65059471130371, 21.78590965270996, 22.92122459411621, 24.056541442871094, 25.191856384277344, 26.327171325683594, 27.462486267089844, 28.597801208496094, 29.733118057250977, 30.868432998657227, 32.00374984741211, 33.13906478881836, 34.27437973022461, 35.40969467163086]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 11.0, 11.0, 14.0, 10.0, 14.0, 22.0, 15.0, 15.0, 30.0, 25.0, 21.0, 26.0, 29.0, 34.0, 31.0, 41.0, 42.0, 31.0, 40.0, 43.0, 39.0, 35.0, 40.0, 36.0, 46.0, 45.0, 32.0, 25.0, 19.0, 26.0, 30.0, 17.0, 11.0, 13.0, 15.0, 14.0, 8.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.385093688964844, -25.59136962890625, -24.79764747619629, -24.003923416137695, -23.210201263427734, -22.41647720336914, -21.622753143310547, -20.829030990600586, -20.035308837890625, -19.24158477783203, -18.44786262512207, -17.654138565063477, -16.860416412353516, -16.066692352294922, -15.272969245910645, -14.479246139526367, -13.685522079467773, -12.891798973083496, -12.098075866699219, -11.304351806640625, -10.510629653930664, -9.71690559387207, -8.923182487487793, -8.129459381103516, -7.335736274719238, -6.542013168334961, -5.748290061950684, -4.954566478729248, -4.160843372344971, -3.3671202659606934, -2.573396682739258, -1.7796735763549805, -0.9859504699707031, -0.19222724437713623, 0.6014959812164307, 1.395219326019287, 2.1889424324035645, 2.982665538787842, 3.7763891220092773, 4.570112228393555, 5.363835334777832, 6.157558441162109, 6.951281547546387, 7.745005130767822, 8.538728713989258, 9.332450866699219, 10.126174926757812, 10.91989803314209, 11.713621139526367, 12.507344245910645, 13.301067352294922, 14.094791412353516, 14.888513565063477, 15.68223762512207, 16.47595977783203, 17.269683837890625, 18.06340789794922, 18.857131958007812, 19.650854110717773, 20.444578170776367, 21.238300323486328, 22.032024383544922, 22.825748443603516, 23.619470596313477, 24.413192749023438]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 11.0, 21.0, 15.0, 18.0, 36.0, 66.0, 80.0, 108.0, 156.0, 196.0, 297.0, 463.0, 707.0, 973.0, 1564.0, 2392.0, 3562.0, 5637.0, 9027.0, 14300.0, 23560.0, 39083.0, 66204.0, 111337.0, 173931.0, 204217.0, 153534.0, 94311.0, 55750.0, 32982.0, 19821.0, 12400.0, 7579.0, 4932.0, 3126.0, 2074.0, 1324.0, 880.0, 572.0, 383.0, 306.0, 185.0, 138.0, 83.0, 72.0, 47.0, 29.0, 23.0, 17.0, 17.0, 3.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0], "bins": [-34.59375, -33.52392578125, -32.4541015625, -31.38427734375, -30.314453125, -29.24462890625, -28.1748046875, -27.10498046875, -26.03515625, -24.96533203125, -23.8955078125, -22.82568359375, -21.755859375, -20.68603515625, -19.6162109375, -18.54638671875, -17.4765625, -16.40673828125, -15.3369140625, -14.26708984375, -13.197265625, -12.12744140625, -11.0576171875, -9.98779296875, -8.91796875, -7.84814453125, -6.7783203125, -5.70849609375, -4.638671875, -3.56884765625, -2.4990234375, -1.42919921875, -0.359375, 0.71044921875, 1.7802734375, 2.85009765625, 3.919921875, 4.98974609375, 6.0595703125, 7.12939453125, 8.19921875, 9.26904296875, 10.3388671875, 11.40869140625, 12.478515625, 13.54833984375, 14.6181640625, 15.68798828125, 16.7578125, 17.82763671875, 18.8974609375, 19.96728515625, 21.037109375, 22.10693359375, 23.1767578125, 24.24658203125, 25.31640625, 26.38623046875, 27.4560546875, 28.52587890625, 29.595703125, 30.66552734375, 31.7353515625, 32.80517578125, 33.875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 9.0, 7.0, 15.0, 12.0, 10.0, 21.0, 14.0, 18.0, 24.0, 22.0, 26.0, 24.0, 30.0, 30.0, 42.0, 47.0, 35.0, 43.0, 31.0, 38.0, 38.0, 51.0, 41.0, 46.0, 32.0, 44.0, 32.0, 20.0, 25.0, 19.0, 26.0, 29.0, 19.0, 11.0, 13.0, 10.0, 10.0, 4.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.046875, -26.2158203125, -25.384765625, -24.5537109375, -23.72265625, -22.8916015625, -22.060546875, -21.2294921875, -20.3984375, -19.5673828125, -18.736328125, -17.9052734375, -17.07421875, -16.2431640625, -15.412109375, -14.5810546875, -13.75, -12.9189453125, -12.087890625, -11.2568359375, -10.42578125, -9.5947265625, -8.763671875, -7.9326171875, -7.1015625, -6.2705078125, -5.439453125, -4.6083984375, -3.77734375, -2.9462890625, -2.115234375, -1.2841796875, -0.453125, 0.3779296875, 1.208984375, 2.0400390625, 2.87109375, 3.7021484375, 4.533203125, 5.3642578125, 6.1953125, 7.0263671875, 7.857421875, 8.6884765625, 9.51953125, 10.3505859375, 11.181640625, 12.0126953125, 12.84375, 13.6748046875, 14.505859375, 15.3369140625, 16.16796875, 16.9990234375, 17.830078125, 18.6611328125, 19.4921875, 20.3232421875, 21.154296875, 21.9853515625, 22.81640625, 23.6474609375, 24.478515625, 25.3095703125, 26.140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 10.0, 15.0, 21.0, 42.0, 58.0, 81.0, 104.0, 160.0, 235.0, 336.0, 545.0, 717.0, 1109.0, 1699.0, 2526.0, 3658.0, 5751.0, 8589.0, 13531.0, 21243.0, 33847.0, 54834.0, 89713.0, 140775.0, 185413.0, 171065.0, 117404.0, 72494.0, 44769.0, 27648.0, 17343.0, 11180.0, 7223.0, 4815.0, 3152.0, 2132.0, 1366.0, 905.0, 618.0, 479.0, 311.0, 213.0, 121.0, 90.0, 57.0, 45.0, 34.0, 27.0, 15.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-32.59375, -31.568359375, -30.54296875, -29.517578125, -28.4921875, -27.466796875, -26.44140625, -25.416015625, -24.390625, -23.365234375, -22.33984375, -21.314453125, -20.2890625, -19.263671875, -18.23828125, -17.212890625, -16.1875, -15.162109375, -14.13671875, -13.111328125, -12.0859375, -11.060546875, -10.03515625, -9.009765625, -7.984375, -6.958984375, -5.93359375, -4.908203125, -3.8828125, -2.857421875, -1.83203125, -0.806640625, 0.21875, 1.244140625, 2.26953125, 3.294921875, 4.3203125, 5.345703125, 6.37109375, 7.396484375, 8.421875, 9.447265625, 10.47265625, 11.498046875, 12.5234375, 13.548828125, 14.57421875, 15.599609375, 16.625, 17.650390625, 18.67578125, 19.701171875, 20.7265625, 21.751953125, 22.77734375, 23.802734375, 24.828125, 25.853515625, 26.87890625, 27.904296875, 28.9296875, 29.955078125, 30.98046875, 32.005859375, 33.03125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 11.0, 6.0, 21.0, 14.0, 23.0, 25.0, 25.0, 30.0, 30.0, 25.0, 31.0, 39.0, 36.0, 35.0, 36.0, 42.0, 44.0, 39.0, 43.0, 38.0, 34.0, 35.0, 37.0, 32.0, 26.0, 28.0, 27.0, 24.0, 13.0, 14.0, 12.0, 17.0, 15.0, 13.0, 10.0, 8.0, 5.0, 12.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.515625, -16.00146484375, -15.4873046875, -14.97314453125, -14.458984375, -13.94482421875, -13.4306640625, -12.91650390625, -12.40234375, -11.88818359375, -11.3740234375, -10.85986328125, -10.345703125, -9.83154296875, -9.3173828125, -8.80322265625, -8.2890625, -7.77490234375, -7.2607421875, -6.74658203125, -6.232421875, -5.71826171875, -5.2041015625, -4.68994140625, -4.17578125, -3.66162109375, -3.1474609375, -2.63330078125, -2.119140625, -1.60498046875, -1.0908203125, -0.57666015625, -0.0625, 0.45166015625, 0.9658203125, 1.47998046875, 1.994140625, 2.50830078125, 3.0224609375, 3.53662109375, 4.05078125, 4.56494140625, 5.0791015625, 5.59326171875, 6.107421875, 6.62158203125, 7.1357421875, 7.64990234375, 8.1640625, 8.67822265625, 9.1923828125, 9.70654296875, 10.220703125, 10.73486328125, 11.2490234375, 11.76318359375, 12.27734375, 12.79150390625, 13.3056640625, 13.81982421875, 14.333984375, 14.84814453125, 15.3623046875, 15.87646484375, 16.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 17.0, 26.0, 33.0, 65.0, 92.0, 140.0, 216.0, 314.0, 512.0, 898.0, 1341.0, 2109.0, 3410.0, 5805.0, 10145.0, 18105.0, 34563.0, 71358.0, 154123.0, 275540.0, 236089.0, 117056.0, 54267.0, 27059.0, 14440.0, 8170.0, 4831.0, 2901.0, 1765.0, 1139.0, 721.0, 462.0, 280.0, 197.0, 113.0, 78.0, 50.0, 43.0, 22.0, 7.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.9609375, -12.5535888671875, -12.146240234375, -11.7388916015625, -11.33154296875, -10.9241943359375, -10.516845703125, -10.1094970703125, -9.7021484375, -9.2947998046875, -8.887451171875, -8.4801025390625, -8.07275390625, -7.6654052734375, -7.258056640625, -6.8507080078125, -6.443359375, -6.0360107421875, -5.628662109375, -5.2213134765625, -4.81396484375, -4.4066162109375, -3.999267578125, -3.5919189453125, -3.1845703125, -2.7772216796875, -2.369873046875, -1.9625244140625, -1.55517578125, -1.1478271484375, -0.740478515625, -0.3331298828125, 0.07421875, 0.4815673828125, 0.888916015625, 1.2962646484375, 1.70361328125, 2.1109619140625, 2.518310546875, 2.9256591796875, 3.3330078125, 3.7403564453125, 4.147705078125, 4.5550537109375, 4.96240234375, 5.3697509765625, 5.777099609375, 6.1844482421875, 6.591796875, 6.9991455078125, 7.406494140625, 7.8138427734375, 8.22119140625, 8.6285400390625, 9.035888671875, 9.4432373046875, 9.8505859375, 10.2579345703125, 10.665283203125, 11.0726318359375, 11.47998046875, 11.8873291015625, 12.294677734375, 12.7020263671875, 13.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 8.0, 17.0, 13.0, 18.0, 43.0, 42.0, 65.0, 90.0, 112.0, 137.0, 124.0, 96.0, 63.0, 49.0, 33.0, 21.0, 15.0, 15.0, 8.0, 8.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00164794921875, -0.0015880763530731201, -0.0015282034873962402, -0.0014683306217193604, -0.0014084577560424805, -0.0013485848903656006, -0.0012887120246887207, -0.0012288391590118408, -0.001168966293334961, -0.001109093427658081, -0.0010492205619812012, -0.0009893476963043213, -0.0009294748306274414, -0.0008696019649505615, -0.0008097290992736816, -0.0007498562335968018, -0.0006899833679199219, -0.000630110502243042, -0.0005702376365661621, -0.0005103647708892822, -0.00045049190521240234, -0.00039061903953552246, -0.0003307461738586426, -0.0002708733081817627, -0.0002110004425048828, -0.00015112757682800293, -9.125471115112305e-05, -3.1381845474243164e-05, 2.849102020263672e-05, 8.83638858795166e-05, 0.00014823675155639648, 0.00020810961723327637, 0.00026798248291015625, 0.00032785534858703613, 0.000387728214263916, 0.0004476010799407959, 0.0005074739456176758, 0.0005673468112945557, 0.0006272196769714355, 0.0006870925426483154, 0.0007469654083251953, 0.0008068382740020752, 0.0008667111396789551, 0.000926584005355835, 0.0009864568710327148, 0.0010463297367095947, 0.0011062026023864746, 0.0011660754680633545, 0.0012259483337402344, 0.0012858211994171143, 0.0013456940650939941, 0.001405566930770874, 0.001465439796447754, 0.0015253126621246338, 0.0015851855278015137, 0.0016450583934783936, 0.0017049312591552734, 0.0017648041248321533, 0.0018246769905090332, 0.001884549856185913, 0.001944422721862793, 0.002004295587539673, 0.0020641684532165527, 0.0021240413188934326, 0.0021839141845703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 0.0, 6.0, 5.0, 5.0, 16.0, 26.0, 45.0, 70.0, 112.0, 150.0, 263.0, 365.0, 639.0, 870.0, 1484.0, 2409.0, 3989.0, 6755.0, 12309.0, 23693.0, 48522.0, 105058.0, 219719.0, 289671.0, 172236.0, 79897.0, 37345.0, 18603.0, 10065.0, 5497.0, 3287.0, 2049.0, 1265.0, 732.0, 536.0, 290.0, 204.0, 126.0, 89.0, 61.0, 41.0, 18.0, 15.0, 11.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6737060546875, -11.230224609375, -10.7867431640625, -10.34326171875, -9.8997802734375, -9.456298828125, -9.0128173828125, -8.5693359375, -8.1258544921875, -7.682373046875, -7.2388916015625, -6.79541015625, -6.3519287109375, -5.908447265625, -5.4649658203125, -5.021484375, -4.5780029296875, -4.134521484375, -3.6910400390625, -3.24755859375, -2.8040771484375, -2.360595703125, -1.9171142578125, -1.4736328125, -1.0301513671875, -0.586669921875, -0.1431884765625, 0.30029296875, 0.7437744140625, 1.187255859375, 1.6307373046875, 2.07421875, 2.5177001953125, 2.961181640625, 3.4046630859375, 3.84814453125, 4.2916259765625, 4.735107421875, 5.1785888671875, 5.6220703125, 6.0655517578125, 6.509033203125, 6.9525146484375, 7.39599609375, 7.8394775390625, 8.282958984375, 8.7264404296875, 9.169921875, 9.6134033203125, 10.056884765625, 10.5003662109375, 10.94384765625, 11.3873291015625, 11.830810546875, 12.2742919921875, 12.7177734375, 13.1612548828125, 13.604736328125, 14.0482177734375, 14.49169921875, 14.9351806640625, 15.378662109375, 15.8221435546875, 16.265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 4.0, 11.0, 6.0, 7.0, 6.0, 13.0, 20.0, 16.0, 20.0, 35.0, 27.0, 32.0, 42.0, 37.0, 59.0, 73.0, 57.0, 61.0, 70.0, 66.0, 55.0, 54.0, 42.0, 30.0, 27.0, 25.0, 17.0, 23.0, 14.0, 9.0, 9.0, 8.0, 4.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.93927001953125, -2.8277587890625, -2.71624755859375, -2.604736328125, -2.49322509765625, -2.3817138671875, -2.27020263671875, -2.15869140625, -2.04718017578125, -1.9356689453125, -1.82415771484375, -1.712646484375, -1.60113525390625, -1.4896240234375, -1.37811279296875, -1.2666015625, -1.15509033203125, -1.0435791015625, -0.93206787109375, -0.820556640625, -0.70904541015625, -0.5975341796875, -0.48602294921875, -0.37451171875, -0.26300048828125, -0.1514892578125, -0.03997802734375, 0.071533203125, 0.18304443359375, 0.2945556640625, 0.40606689453125, 0.517578125, 0.62908935546875, 0.7406005859375, 0.85211181640625, 0.963623046875, 1.07513427734375, 1.1866455078125, 1.29815673828125, 1.40966796875, 1.52117919921875, 1.6326904296875, 1.74420166015625, 1.855712890625, 1.96722412109375, 2.0787353515625, 2.19024658203125, 2.3017578125, 2.41326904296875, 2.5247802734375, 2.63629150390625, 2.747802734375, 2.85931396484375, 2.9708251953125, 3.08233642578125, 3.19384765625, 3.30535888671875, 3.4168701171875, 3.52838134765625, 3.639892578125, 3.75140380859375, 3.8629150390625, 3.97442626953125, 4.0859375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 15.0, 16.0, 24.0, 30.0, 36.0, 39.0, 61.0, 60.0, 75.0, 59.0, 88.0, 73.0, 60.0, 71.0, 49.0, 38.0, 42.0, 28.0, 23.0, 26.0, 17.0, 12.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.118370056152344, -42.949161529541016, -41.77995300292969, -40.610748291015625, -39.4415397644043, -38.27233123779297, -37.10312271118164, -35.93391418457031, -34.76470947265625, -33.59550094604492, -32.426292419433594, -31.2570858001709, -30.087879180908203, -28.918670654296875, -27.749462127685547, -26.58025550842285, -25.411046981811523, -24.241838455200195, -23.0726318359375, -21.903423309326172, -20.734216690063477, -19.56500816345215, -18.395801544189453, -17.226593017578125, -16.057384490966797, -14.888176918029785, -13.718969345092773, -12.549760818481445, -11.38055419921875, -10.211345672607422, -9.04213809967041, -7.872930526733398, -6.70372200012207, -5.534514427185059, -4.365306854248047, -3.196098804473877, -2.0268912315368652, -0.8576836585998535, 0.3115243911743164, 1.4807319641113281, 2.64993953704834, 3.8191471099853516, 4.988354682922363, 6.157562732696533, 7.326770305633545, 8.495977401733398, 9.665185928344727, 10.834393501281738, 12.00360107421875, 13.172808647155762, 14.342016220092773, 15.511224746704102, 16.680431365966797, 17.849639892578125, 19.018848419189453, 20.18805503845215, 21.357261657714844, 22.526470184326172, 23.695676803588867, 24.864885330200195, 26.03409194946289, 27.20330047607422, 28.372509002685547, 29.541715621948242, 30.71092414855957]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 10.0, 4.0, 12.0, 15.0, 15.0, 15.0, 15.0, 10.0, 23.0, 24.0, 27.0, 32.0, 32.0, 37.0, 28.0, 38.0, 38.0, 30.0, 21.0, 38.0, 37.0, 43.0, 40.0, 39.0, 41.0, 29.0, 29.0, 31.0, 29.0, 29.0, 24.0, 19.0, 21.0, 12.0, 15.0, 9.0, 10.0, 18.0, 4.0, 5.0, 3.0, 11.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.878774642944336, -24.09693145751953, -23.315088272094727, -22.533245086669922, -21.751399993896484, -20.96955680847168, -20.187713623046875, -19.40587043762207, -18.624027252197266, -17.84218406677246, -17.060340881347656, -16.27849578857422, -15.496652603149414, -14.71480941772461, -13.932966232299805, -13.151123046875, -12.369277954101562, -11.587434768676758, -10.805590629577637, -10.023747444152832, -9.241903305053711, -8.460060119628906, -7.678216934204102, -6.896373271942139, -6.114529609680176, -5.332685947418213, -4.55084228515625, -3.7689990997314453, -2.9871554374694824, -2.2053117752075195, -1.4234685897827148, -0.641624927520752, 0.14022064208984375, 0.9220641851425171, 1.7039077281951904, 2.485751152038574, 3.267594814300537, 4.0494384765625, 4.831281661987305, 5.613125324249268, 6.3949689865112305, 7.176812648773193, 7.958656311035156, 8.740499496459961, 9.522342681884766, 10.304186820983887, 11.086030006408691, 11.867874145507812, 12.649717330932617, 13.431560516357422, 14.213404655456543, 14.995247840881348, 15.777091979980469, 16.558935165405273, 17.340778350830078, 18.122621536254883, 18.904464721679688, 19.686307907104492, 20.468151092529297, 21.249996185302734, 22.03183937072754, 22.813682556152344, 23.59552574157715, 24.377368927001953, 25.15921401977539]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 15.0, 18.0, 23.0, 35.0, 39.0, 69.0, 101.0, 116.0, 158.0, 247.0, 353.0, 500.0, 694.0, 1040.0, 1593.0, 2468.0, 3790.0, 6468.0, 10965.0, 19271.0, 35639.0, 71373.0, 166347.0, 493834.0, 1277056.0, 1271683.0, 500511.0, 175041.0, 73067.0, 35833.0, 18963.0, 10621.0, 6055.0, 3705.0, 2222.0, 1443.0, 931.0, 637.0, 435.0, 261.0, 183.0, 141.0, 104.0, 77.0, 46.0, 27.0, 28.0, 20.0, 7.0, 12.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.53125, -37.36376953125, -36.1962890625, -35.02880859375, -33.861328125, -32.69384765625, -31.5263671875, -30.35888671875, -29.19140625, -28.02392578125, -26.8564453125, -25.68896484375, -24.521484375, -23.35400390625, -22.1865234375, -21.01904296875, -19.8515625, -18.68408203125, -17.5166015625, -16.34912109375, -15.181640625, -14.01416015625, -12.8466796875, -11.67919921875, -10.51171875, -9.34423828125, -8.1767578125, -7.00927734375, -5.841796875, -4.67431640625, -3.5068359375, -2.33935546875, -1.171875, -0.00439453125, 1.1630859375, 2.33056640625, 3.498046875, 4.66552734375, 5.8330078125, 7.00048828125, 8.16796875, 9.33544921875, 10.5029296875, 11.67041015625, 12.837890625, 14.00537109375, 15.1728515625, 16.34033203125, 17.5078125, 18.67529296875, 19.8427734375, 21.01025390625, 22.177734375, 23.34521484375, 24.5126953125, 25.68017578125, 26.84765625, 28.01513671875, 29.1826171875, 30.35009765625, 31.517578125, 32.68505859375, 33.8525390625, 35.02001953125, 36.1875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 6.0, 7.0, 7.0, 4.0, 12.0, 7.0, 19.0, 11.0, 14.0, 17.0, 22.0, 24.0, 23.0, 38.0, 38.0, 30.0, 44.0, 39.0, 30.0, 36.0, 35.0, 34.0, 41.0, 36.0, 48.0, 43.0, 37.0, 43.0, 32.0, 21.0, 22.0, 26.0, 22.0, 21.0, 12.0, 16.0, 14.0, 15.0, 5.0, 16.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.140625, -22.42431640625, -21.7080078125, -20.99169921875, -20.275390625, -19.55908203125, -18.8427734375, -18.12646484375, -17.41015625, -16.69384765625, -15.9775390625, -15.26123046875, -14.544921875, -13.82861328125, -13.1123046875, -12.39599609375, -11.6796875, -10.96337890625, -10.2470703125, -9.53076171875, -8.814453125, -8.09814453125, -7.3818359375, -6.66552734375, -5.94921875, -5.23291015625, -4.5166015625, -3.80029296875, -3.083984375, -2.36767578125, -1.6513671875, -0.93505859375, -0.21875, 0.49755859375, 1.2138671875, 1.93017578125, 2.646484375, 3.36279296875, 4.0791015625, 4.79541015625, 5.51171875, 6.22802734375, 6.9443359375, 7.66064453125, 8.376953125, 9.09326171875, 9.8095703125, 10.52587890625, 11.2421875, 11.95849609375, 12.6748046875, 13.39111328125, 14.107421875, 14.82373046875, 15.5400390625, 16.25634765625, 16.97265625, 17.68896484375, 18.4052734375, 19.12158203125, 19.837890625, 20.55419921875, 21.2705078125, 21.98681640625, 22.703125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 15.0, 14.0, 26.0, 41.0, 67.0, 101.0, 135.0, 247.0, 344.0, 513.0, 820.0, 1189.0, 1870.0, 3061.0, 5018.0, 8260.0, 13816.0, 24881.0, 47202.0, 97556.0, 223215.0, 576722.0, 1513856.0, 1012689.0, 363797.0, 148805.0, 68519.0, 34579.0, 18873.0, 10733.0, 6376.0, 3941.0, 2571.0, 1553.0, 1001.0, 631.0, 426.0, 250.0, 189.0, 136.0, 73.0, 44.0, 33.0, 31.0, 22.0, 13.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-47.34375, -45.98193359375, -44.6201171875, -43.25830078125, -41.896484375, -40.53466796875, -39.1728515625, -37.81103515625, -36.44921875, -35.08740234375, -33.7255859375, -32.36376953125, -31.001953125, -29.64013671875, -28.2783203125, -26.91650390625, -25.5546875, -24.19287109375, -22.8310546875, -21.46923828125, -20.107421875, -18.74560546875, -17.3837890625, -16.02197265625, -14.66015625, -13.29833984375, -11.9365234375, -10.57470703125, -9.212890625, -7.85107421875, -6.4892578125, -5.12744140625, -3.765625, -2.40380859375, -1.0419921875, 0.31982421875, 1.681640625, 3.04345703125, 4.4052734375, 5.76708984375, 7.12890625, 8.49072265625, 9.8525390625, 11.21435546875, 12.576171875, 13.93798828125, 15.2998046875, 16.66162109375, 18.0234375, 19.38525390625, 20.7470703125, 22.10888671875, 23.470703125, 24.83251953125, 26.1943359375, 27.55615234375, 28.91796875, 30.27978515625, 31.6416015625, 33.00341796875, 34.365234375, 35.72705078125, 37.0888671875, 38.45068359375, 39.8125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 14.0, 9.0, 9.0, 21.0, 17.0, 39.0, 46.0, 68.0, 68.0, 84.0, 106.0, 128.0, 204.0, 233.0, 318.0, 367.0, 429.0, 401.0, 344.0, 259.0, 199.0, 167.0, 110.0, 89.0, 63.0, 49.0, 51.0, 29.0, 23.0, 21.0, 23.0, 18.0, 9.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.109375, -13.663818359375, -13.21826171875, -12.772705078125, -12.3271484375, -11.881591796875, -11.43603515625, -10.990478515625, -10.544921875, -10.099365234375, -9.65380859375, -9.208251953125, -8.7626953125, -8.317138671875, -7.87158203125, -7.426025390625, -6.98046875, -6.534912109375, -6.08935546875, -5.643798828125, -5.1982421875, -4.752685546875, -4.30712890625, -3.861572265625, -3.416015625, -2.970458984375, -2.52490234375, -2.079345703125, -1.6337890625, -1.188232421875, -0.74267578125, -0.297119140625, 0.1484375, 0.593994140625, 1.03955078125, 1.485107421875, 1.9306640625, 2.376220703125, 2.82177734375, 3.267333984375, 3.712890625, 4.158447265625, 4.60400390625, 5.049560546875, 5.4951171875, 5.940673828125, 6.38623046875, 6.831787109375, 7.27734375, 7.722900390625, 8.16845703125, 8.614013671875, 9.0595703125, 9.505126953125, 9.95068359375, 10.396240234375, 10.841796875, 11.287353515625, 11.73291015625, 12.178466796875, 12.6240234375, 13.069580078125, 13.51513671875, 13.960693359375, 14.40625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 12.0, 10.0, 24.0, 16.0, 26.0, 29.0, 38.0, 39.0, 40.0, 65.0, 70.0, 90.0, 81.0, 68.0, 73.0, 56.0, 43.0, 44.0, 36.0, 29.0, 27.0, 14.0, 11.0, 6.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.50014877319336, -39.3203010559082, -38.14045715332031, -36.960609436035156, -35.78076171875, -34.600914001464844, -33.42106628417969, -32.2412223815918, -31.06137466430664, -29.881526947021484, -28.70168113708496, -27.521835327148438, -26.34198760986328, -25.162139892578125, -23.9822940826416, -22.802448272705078, -21.622600555419922, -20.442752838134766, -19.262907028198242, -18.08306121826172, -16.903213500976562, -15.723366737365723, -14.543519973754883, -13.363673210144043, -12.183826446533203, -11.003979682922363, -9.824132919311523, -8.644286155700684, -7.464439392089844, -6.284592628479004, -5.104745864868164, -3.924899101257324, -2.7450523376464844, -1.5652055740356445, -0.3853588104248047, 0.7944879531860352, 1.974334716796875, 3.154181480407715, 4.334028244018555, 5.5138750076293945, 6.693721771240234, 7.873568534851074, 9.053415298461914, 10.233262062072754, 11.413108825683594, 12.592955589294434, 13.772802352905273, 14.952649116516113, 16.132495880126953, 17.31234359741211, 18.492189407348633, 19.672035217285156, 20.851882934570312, 22.03173065185547, 23.211576461791992, 24.391422271728516, 25.571269989013672, 26.751117706298828, 27.93096351623535, 29.110809326171875, 30.29065704345703, 31.470504760742188, 32.650352478027344, 33.830196380615234, 35.01004409790039]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 9.0, 5.0, 9.0, 9.0, 7.0, 14.0, 13.0, 19.0, 15.0, 20.0, 22.0, 19.0, 30.0, 39.0, 36.0, 27.0, 26.0, 47.0, 39.0, 43.0, 47.0, 39.0, 28.0, 38.0, 44.0, 42.0, 38.0, 20.0, 32.0, 28.0, 20.0, 29.0, 19.0, 18.0, 16.0, 19.0, 12.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 0.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.00770378112793, -26.189672470092773, -25.37164306640625, -24.553611755371094, -23.735580444335938, -22.917551040649414, -22.099519729614258, -21.281490325927734, -20.463459014892578, -19.645427703857422, -18.8273983001709, -18.009366989135742, -17.19133758544922, -16.373306274414062, -15.555274963378906, -14.737244606018066, -13.919214248657227, -13.101183891296387, -12.283153533935547, -11.46512222290039, -10.64709186553955, -9.829061508178711, -9.011030197143555, -8.192999839782715, -7.374969482421875, -6.556939125061035, -5.738908290863037, -4.920877456665039, -4.102847099304199, -3.2848167419433594, -2.4667859077453613, -1.6487550735473633, -0.8307228088378906, -0.01269221305847168, 0.8053383827209473, 1.6233689785003662, 2.441399574279785, 3.259429931640625, 4.077460765838623, 4.895491600036621, 5.713521957397461, 6.531552314758301, 7.349583148956299, 8.167613983154297, 8.985644340515137, 9.803674697875977, 10.621706008911133, 11.439736366271973, 12.257766723632812, 13.075797080993652, 13.893827438354492, 14.711858749389648, 15.529889106750488, 16.347919464111328, 17.165950775146484, 17.98398208618164, 18.802011489868164, 19.62004280090332, 20.438072204589844, 21.256103515625, 22.074134826660156, 22.89216423034668, 23.710195541381836, 24.52822494506836, 25.346256256103516]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 14.0, 13.0, 21.0, 31.0, 47.0, 50.0, 94.0, 140.0, 221.0, 352.0, 499.0, 779.0, 1235.0, 1989.0, 3218.0, 5306.0, 9033.0, 15735.0, 28390.0, 54843.0, 112559.0, 234187.0, 281370.0, 146667.0, 69528.0, 35559.0, 19205.0, 10934.0, 6299.0, 3764.0, 2385.0, 1457.0, 897.0, 579.0, 408.0, 259.0, 157.0, 115.0, 76.0, 44.0, 33.0, 28.0, 7.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.109375, -23.282958984375, -22.45654296875, -21.630126953125, -20.8037109375, -19.977294921875, -19.15087890625, -18.324462890625, -17.498046875, -16.671630859375, -15.84521484375, -15.018798828125, -14.1923828125, -13.365966796875, -12.53955078125, -11.713134765625, -10.88671875, -10.060302734375, -9.23388671875, -8.407470703125, -7.5810546875, -6.754638671875, -5.92822265625, -5.101806640625, -4.275390625, -3.448974609375, -2.62255859375, -1.796142578125, -0.9697265625, -0.143310546875, 0.68310546875, 1.509521484375, 2.3359375, 3.162353515625, 3.98876953125, 4.815185546875, 5.6416015625, 6.468017578125, 7.29443359375, 8.120849609375, 8.947265625, 9.773681640625, 10.60009765625, 11.426513671875, 12.2529296875, 13.079345703125, 13.90576171875, 14.732177734375, 15.55859375, 16.385009765625, 17.21142578125, 18.037841796875, 18.8642578125, 19.690673828125, 20.51708984375, 21.343505859375, 22.169921875, 22.996337890625, 23.82275390625, 24.649169921875, 25.4755859375, 26.302001953125, 27.12841796875, 27.954833984375, 28.78125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 11.0, 13.0, 13.0, 24.0, 17.0, 18.0, 26.0, 31.0, 30.0, 38.0, 40.0, 51.0, 38.0, 36.0, 47.0, 36.0, 23.0, 50.0, 40.0, 44.0, 35.0, 39.0, 29.0, 37.0, 24.0, 27.0, 22.0, 20.0, 10.0, 18.0, 12.0, 6.0, 4.0, 7.0, 4.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.75, -26.885498046875, -26.02099609375, -25.156494140625, -24.2919921875, -23.427490234375, -22.56298828125, -21.698486328125, -20.833984375, -19.969482421875, -19.10498046875, -18.240478515625, -17.3759765625, -16.511474609375, -15.64697265625, -14.782470703125, -13.91796875, -13.053466796875, -12.18896484375, -11.324462890625, -10.4599609375, -9.595458984375, -8.73095703125, -7.866455078125, -7.001953125, -6.137451171875, -5.27294921875, -4.408447265625, -3.5439453125, -2.679443359375, -1.81494140625, -0.950439453125, -0.0859375, 0.778564453125, 1.64306640625, 2.507568359375, 3.3720703125, 4.236572265625, 5.10107421875, 5.965576171875, 6.830078125, 7.694580078125, 8.55908203125, 9.423583984375, 10.2880859375, 11.152587890625, 12.01708984375, 12.881591796875, 13.74609375, 14.610595703125, 15.47509765625, 16.339599609375, 17.2041015625, 18.068603515625, 18.93310546875, 19.797607421875, 20.662109375, 21.526611328125, 22.39111328125, 23.255615234375, 24.1201171875, 24.984619140625, 25.84912109375, 26.713623046875, 27.578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 11.0, 7.0, 13.0, 15.0, 28.0, 39.0, 53.0, 73.0, 124.0, 139.0, 184.0, 307.0, 413.0, 557.0, 887.0, 1253.0, 1956.0, 3020.0, 4691.0, 7591.0, 12507.0, 21374.0, 38597.0, 73828.0, 161121.0, 316051.0, 203853.0, 90588.0, 45469.0, 25069.0, 14428.0, 8731.0, 5290.0, 3469.0, 2154.0, 1461.0, 974.0, 680.0, 490.0, 294.0, 214.0, 149.0, 113.0, 81.0, 60.0, 42.0, 28.0, 23.0, 11.0, 9.0, 12.0, 11.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-30.71875, -29.747802734375, -28.77685546875, -27.805908203125, -26.8349609375, -25.864013671875, -24.89306640625, -23.922119140625, -22.951171875, -21.980224609375, -21.00927734375, -20.038330078125, -19.0673828125, -18.096435546875, -17.12548828125, -16.154541015625, -15.18359375, -14.212646484375, -13.24169921875, -12.270751953125, -11.2998046875, -10.328857421875, -9.35791015625, -8.386962890625, -7.416015625, -6.445068359375, -5.47412109375, -4.503173828125, -3.5322265625, -2.561279296875, -1.59033203125, -0.619384765625, 0.3515625, 1.322509765625, 2.29345703125, 3.264404296875, 4.2353515625, 5.206298828125, 6.17724609375, 7.148193359375, 8.119140625, 9.090087890625, 10.06103515625, 11.031982421875, 12.0029296875, 12.973876953125, 13.94482421875, 14.915771484375, 15.88671875, 16.857666015625, 17.82861328125, 18.799560546875, 19.7705078125, 20.741455078125, 21.71240234375, 22.683349609375, 23.654296875, 24.625244140625, 25.59619140625, 26.567138671875, 27.5380859375, 28.509033203125, 29.47998046875, 30.450927734375, 31.421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 8.0, 7.0, 7.0, 12.0, 4.0, 21.0, 11.0, 18.0, 15.0, 18.0, 21.0, 23.0, 26.0, 32.0, 28.0, 29.0, 27.0, 41.0, 43.0, 38.0, 36.0, 36.0, 29.0, 37.0, 38.0, 35.0, 39.0, 44.0, 34.0, 29.0, 23.0, 31.0, 20.0, 16.0, 20.0, 20.0, 18.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.03125, -16.510498046875, -15.98974609375, -15.468994140625, -14.9482421875, -14.427490234375, -13.90673828125, -13.385986328125, -12.865234375, -12.344482421875, -11.82373046875, -11.302978515625, -10.7822265625, -10.261474609375, -9.74072265625, -9.219970703125, -8.69921875, -8.178466796875, -7.65771484375, -7.136962890625, -6.6162109375, -6.095458984375, -5.57470703125, -5.053955078125, -4.533203125, -4.012451171875, -3.49169921875, -2.970947265625, -2.4501953125, -1.929443359375, -1.40869140625, -0.887939453125, -0.3671875, 0.153564453125, 0.67431640625, 1.195068359375, 1.7158203125, 2.236572265625, 2.75732421875, 3.278076171875, 3.798828125, 4.319580078125, 4.84033203125, 5.361083984375, 5.8818359375, 6.402587890625, 6.92333984375, 7.444091796875, 7.96484375, 8.485595703125, 9.00634765625, 9.527099609375, 10.0478515625, 10.568603515625, 11.08935546875, 11.610107421875, 12.130859375, 12.651611328125, 13.17236328125, 13.693115234375, 14.2138671875, 14.734619140625, 15.25537109375, 15.776123046875, 16.296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 7.0, 8.0, 8.0, 13.0, 17.0, 16.0, 28.0, 35.0, 69.0, 73.0, 104.0, 153.0, 226.0, 293.0, 494.0, 674.0, 1014.0, 1632.0, 2551.0, 4373.0, 8143.0, 16482.0, 38717.0, 108711.0, 345287.0, 338790.0, 106200.0, 38250.0, 16362.0, 8053.0, 4461.0, 2539.0, 1591.0, 983.0, 680.0, 417.0, 301.0, 231.0, 155.0, 125.0, 86.0, 50.0, 39.0, 29.0, 24.0, 21.0, 11.0, 7.0, 6.0, 10.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.3828125, -11.9957275390625, -11.608642578125, -11.2215576171875, -10.83447265625, -10.4473876953125, -10.060302734375, -9.6732177734375, -9.2861328125, -8.8990478515625, -8.511962890625, -8.1248779296875, -7.73779296875, -7.3507080078125, -6.963623046875, -6.5765380859375, -6.189453125, -5.8023681640625, -5.415283203125, -5.0281982421875, -4.64111328125, -4.2540283203125, -3.866943359375, -3.4798583984375, -3.0927734375, -2.7056884765625, -2.318603515625, -1.9315185546875, -1.54443359375, -1.1573486328125, -0.770263671875, -0.3831787109375, 0.00390625, 0.3909912109375, 0.778076171875, 1.1651611328125, 1.55224609375, 1.9393310546875, 2.326416015625, 2.7135009765625, 3.1005859375, 3.4876708984375, 3.874755859375, 4.2618408203125, 4.64892578125, 5.0360107421875, 5.423095703125, 5.8101806640625, 6.197265625, 6.5843505859375, 6.971435546875, 7.3585205078125, 7.74560546875, 8.1326904296875, 8.519775390625, 8.9068603515625, 9.2939453125, 9.6810302734375, 10.068115234375, 10.4552001953125, 10.84228515625, 11.2293701171875, 11.616455078125, 12.0035400390625, 12.390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 6.0, 6.0, 21.0, 15.0, 22.0, 40.0, 58.0, 85.0, 90.0, 123.0, 131.0, 109.0, 78.0, 62.0, 28.0, 31.0, 16.0, 18.0, 8.0, 17.0, 7.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001354217529296875, -0.0013121068477630615, -0.001269996166229248, -0.0012278854846954346, -0.001185774803161621, -0.0011436641216278076, -0.0011015534400939941, -0.0010594427585601807, -0.0010173320770263672, -0.0009752213954925537, -0.0009331107139587402, -0.0008910000324249268, -0.0008488893508911133, -0.0008067786693572998, -0.0007646679878234863, -0.0007225573062896729, -0.0006804466247558594, -0.0006383359432220459, -0.0005962252616882324, -0.0005541145801544189, -0.0005120038986206055, -0.000469893217086792, -0.0004277825355529785, -0.00038567185401916504, -0.00034356117248535156, -0.0003014504909515381, -0.0002593398094177246, -0.00021722912788391113, -0.00017511844635009766, -0.00013300776481628418, -9.08970832824707e-05, -4.8786401748657227e-05, -6.67572021484375e-06, 3.5434961318969727e-05, 7.75456428527832e-05, 0.00011965632438659668, 0.00016176700592041016, 0.00020387768745422363, 0.0002459883689880371, 0.0002880990505218506, 0.00033020973205566406, 0.00037232041358947754, 0.000414431095123291, 0.0004565417766571045, 0.000498652458190918, 0.0005407631397247314, 0.0005828738212585449, 0.0006249845027923584, 0.0006670951843261719, 0.0007092058658599854, 0.0007513165473937988, 0.0007934272289276123, 0.0008355379104614258, 0.0008776485919952393, 0.0009197592735290527, 0.0009618699550628662, 0.0010039806365966797, 0.0010460913181304932, 0.0010882019996643066, 0.0011303126811981201, 0.0011724233627319336, 0.001214534044265747, 0.0012566447257995605, 0.001298755407333374, 0.0013408660888671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 20.0, 27.0, 35.0, 44.0, 89.0, 104.0, 142.0, 266.0, 381.0, 558.0, 931.0, 1436.0, 2421.0, 4361.0, 8479.0, 18028.0, 42162.0, 110200.0, 302873.0, 337153.0, 129158.0, 47914.0, 20440.0, 9449.0, 4912.0, 2693.0, 1532.0, 945.0, 604.0, 407.0, 256.0, 172.0, 109.0, 79.0, 56.0, 36.0, 31.0, 14.0, 14.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1484375, -14.6904296875, -14.232421875, -13.7744140625, -13.31640625, -12.8583984375, -12.400390625, -11.9423828125, -11.484375, -11.0263671875, -10.568359375, -10.1103515625, -9.65234375, -9.1943359375, -8.736328125, -8.2783203125, -7.8203125, -7.3623046875, -6.904296875, -6.4462890625, -5.98828125, -5.5302734375, -5.072265625, -4.6142578125, -4.15625, -3.6982421875, -3.240234375, -2.7822265625, -2.32421875, -1.8662109375, -1.408203125, -0.9501953125, -0.4921875, -0.0341796875, 0.423828125, 0.8818359375, 1.33984375, 1.7978515625, 2.255859375, 2.7138671875, 3.171875, 3.6298828125, 4.087890625, 4.5458984375, 5.00390625, 5.4619140625, 5.919921875, 6.3779296875, 6.8359375, 7.2939453125, 7.751953125, 8.2099609375, 8.66796875, 9.1259765625, 9.583984375, 10.0419921875, 10.5, 10.9580078125, 11.416015625, 11.8740234375, 12.33203125, 12.7900390625, 13.248046875, 13.7060546875, 14.1640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 13.0, 13.0, 13.0, 20.0, 21.0, 24.0, 36.0, 44.0, 34.0, 69.0, 51.0, 71.0, 79.0, 68.0, 94.0, 59.0, 45.0, 34.0, 38.0, 35.0, 18.0, 27.0, 17.0, 13.0, 10.0, 7.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.673370361328125, -3.55377197265625, -3.434173583984375, -3.3145751953125, -3.194976806640625, -3.07537841796875, -2.955780029296875, -2.836181640625, -2.716583251953125, -2.59698486328125, -2.477386474609375, -2.3577880859375, -2.238189697265625, -2.11859130859375, -1.998992919921875, -1.87939453125, -1.759796142578125, -1.64019775390625, -1.520599365234375, -1.4010009765625, -1.281402587890625, -1.16180419921875, -1.042205810546875, -0.922607421875, -0.803009033203125, -0.68341064453125, -0.563812255859375, -0.4442138671875, -0.324615478515625, -0.20501708984375, -0.085418701171875, 0.0341796875, 0.153778076171875, 0.27337646484375, 0.392974853515625, 0.5125732421875, 0.632171630859375, 0.75177001953125, 0.871368408203125, 0.990966796875, 1.110565185546875, 1.23016357421875, 1.349761962890625, 1.4693603515625, 1.588958740234375, 1.70855712890625, 1.828155517578125, 1.94775390625, 2.067352294921875, 2.18695068359375, 2.306549072265625, 2.4261474609375, 2.545745849609375, 2.66534423828125, 2.784942626953125, 2.904541015625, 3.024139404296875, 3.14373779296875, 3.263336181640625, 3.3829345703125, 3.502532958984375, 3.62213134765625, 3.741729736328125, 3.861328125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 0.0, 4.0, 4.0, 6.0, 12.0, 13.0, 13.0, 18.0, 18.0, 22.0, 25.0, 37.0, 31.0, 47.0, 37.0, 78.0, 67.0, 81.0, 60.0, 73.0, 62.0, 51.0, 45.0, 44.0, 37.0, 21.0, 19.0, 20.0, 13.0, 4.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.11933517456055, -35.052528381347656, -33.98572540283203, -32.91891860961914, -31.85211181640625, -30.78530502319336, -29.7185001373291, -28.651695251464844, -27.584888458251953, -26.518081665039062, -25.451276779174805, -24.384471893310547, -23.317665100097656, -22.250858306884766, -21.184053421020508, -20.11724853515625, -19.05044174194336, -17.98363494873047, -16.91683006286621, -15.850024223327637, -14.783218383789062, -13.716412544250488, -12.649606704711914, -11.58280086517334, -10.515995025634766, -9.449189186096191, -8.382383346557617, -7.315577507019043, -6.248771667480469, -5.1819658279418945, -4.11515998840332, -3.048354148864746, -1.9815483093261719, -0.9147424697875977, 0.15206336975097656, 1.2188692092895508, 2.285675048828125, 3.352480888366699, 4.419286727905273, 5.486092567443848, 6.552898406982422, 7.619704246520996, 8.68651008605957, 9.753315925598145, 10.820121765136719, 11.886927604675293, 12.953733444213867, 14.020539283752441, 15.087345123291016, 16.154151916503906, 17.220956802368164, 18.287761688232422, 19.354568481445312, 20.421375274658203, 21.48818016052246, 22.55498504638672, 23.62179183959961, 24.6885986328125, 25.755403518676758, 26.822208404541016, 27.889015197753906, 28.955821990966797, 30.022626876831055, 31.089431762695312, 32.1562385559082]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 10.0, 10.0, 20.0, 11.0, 15.0, 17.0, 20.0, 28.0, 34.0, 29.0, 29.0, 37.0, 34.0, 42.0, 40.0, 40.0, 43.0, 55.0, 36.0, 35.0, 39.0, 38.0, 44.0, 20.0, 33.0, 28.0, 22.0, 24.0, 20.0, 16.0, 17.0, 17.0, 14.0, 11.0, 6.0, 12.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.12033462524414, -26.297992706298828, -25.47565269470215, -24.65331268310547, -23.830970764160156, -23.008628845214844, -22.186288833618164, -21.363948822021484, -20.541606903076172, -19.71926498413086, -18.89692497253418, -18.0745849609375, -17.252243041992188, -16.429901123046875, -15.607561111450195, -14.7852201461792, -13.962879180908203, -13.140538215637207, -12.318197250366211, -11.495856285095215, -10.673515319824219, -9.851174354553223, -9.028833389282227, -8.20649242401123, -7.384151458740234, -6.561810493469238, -5.739469528198242, -4.917128562927246, -4.09478759765625, -3.272446632385254, -2.450105667114258, -1.6277647018432617, -0.8054256439208984, 0.016915321350097656, 0.8392562866210938, 1.6615972518920898, 2.483938217163086, 3.306279182434082, 4.128620147705078, 4.950961112976074, 5.77330207824707, 6.595643043518066, 7.4179840087890625, 8.240324974060059, 9.062665939331055, 9.88500690460205, 10.707347869873047, 11.529688835144043, 12.352029800415039, 13.174370765686035, 13.996711730957031, 14.819052696228027, 15.641393661499023, 16.463733673095703, 17.286075592041016, 18.108417510986328, 18.930757522583008, 19.753097534179688, 20.575439453125, 21.397781372070312, 22.220121383666992, 23.042461395263672, 23.864803314208984, 24.687145233154297, 25.509485244750977]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 11.0, 23.0, 26.0, 50.0, 61.0, 86.0, 136.0, 185.0, 267.0, 462.0, 668.0, 1018.0, 1528.0, 2482.0, 4022.0, 6486.0, 10565.0, 17866.0, 30177.0, 51644.0, 90415.0, 155859.0, 223901.0, 185500.0, 110358.0, 62959.0, 36558.0, 21603.0, 12812.0, 7783.0, 4844.0, 2892.0, 1879.0, 1202.0, 747.0, 493.0, 330.0, 186.0, 145.0, 105.0, 83.0, 40.0, 25.0, 24.0, 19.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.5, -33.4443359375, -32.388671875, -31.3330078125, -30.27734375, -29.2216796875, -28.166015625, -27.1103515625, -26.0546875, -24.9990234375, -23.943359375, -22.8876953125, -21.83203125, -20.7763671875, -19.720703125, -18.6650390625, -17.609375, -16.5537109375, -15.498046875, -14.4423828125, -13.38671875, -12.3310546875, -11.275390625, -10.2197265625, -9.1640625, -8.1083984375, -7.052734375, -5.9970703125, -4.94140625, -3.8857421875, -2.830078125, -1.7744140625, -0.71875, 0.3369140625, 1.392578125, 2.4482421875, 3.50390625, 4.5595703125, 5.615234375, 6.6708984375, 7.7265625, 8.7822265625, 9.837890625, 10.8935546875, 11.94921875, 13.0048828125, 14.060546875, 15.1162109375, 16.171875, 17.2275390625, 18.283203125, 19.3388671875, 20.39453125, 21.4501953125, 22.505859375, 23.5615234375, 24.6171875, 25.6728515625, 26.728515625, 27.7841796875, 28.83984375, 29.8955078125, 30.951171875, 32.0068359375, 33.0625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 8.0, 7.0, 14.0, 8.0, 7.0, 21.0, 16.0, 21.0, 25.0, 17.0, 31.0, 32.0, 31.0, 32.0, 34.0, 51.0, 50.0, 49.0, 44.0, 49.0, 51.0, 42.0, 39.0, 37.0, 36.0, 30.0, 23.0, 29.0, 21.0, 29.0, 17.0, 16.0, 19.0, 13.0, 10.0, 9.0, 4.0, 9.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.353759765625, -27.45751953125, -26.561279296875, -25.6650390625, -24.768798828125, -23.87255859375, -22.976318359375, -22.080078125, -21.183837890625, -20.28759765625, -19.391357421875, -18.4951171875, -17.598876953125, -16.70263671875, -15.806396484375, -14.91015625, -14.013916015625, -13.11767578125, -12.221435546875, -11.3251953125, -10.428955078125, -9.53271484375, -8.636474609375, -7.740234375, -6.843994140625, -5.94775390625, -5.051513671875, -4.1552734375, -3.259033203125, -2.36279296875, -1.466552734375, -0.5703125, 0.325927734375, 1.22216796875, 2.118408203125, 3.0146484375, 3.910888671875, 4.80712890625, 5.703369140625, 6.599609375, 7.495849609375, 8.39208984375, 9.288330078125, 10.1845703125, 11.080810546875, 11.97705078125, 12.873291015625, 13.76953125, 14.665771484375, 15.56201171875, 16.458251953125, 17.3544921875, 18.250732421875, 19.14697265625, 20.043212890625, 20.939453125, 21.835693359375, 22.73193359375, 23.628173828125, 24.5244140625, 25.420654296875, 26.31689453125, 27.213134765625, 28.109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 16.0, 33.0, 45.0, 72.0, 94.0, 156.0, 214.0, 336.0, 521.0, 774.0, 1145.0, 1670.0, 2568.0, 4167.0, 6660.0, 10820.0, 17870.0, 30627.0, 53721.0, 91574.0, 150177.0, 205882.0, 181913.0, 117987.0, 69567.0, 39868.0, 22959.0, 13917.0, 8489.0, 5319.0, 3217.0, 2074.0, 1349.0, 924.0, 613.0, 412.0, 249.0, 190.0, 109.0, 75.0, 53.0, 45.0, 28.0, 15.0, 5.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.4375, -35.28955078125, -34.1416015625, -32.99365234375, -31.845703125, -30.69775390625, -29.5498046875, -28.40185546875, -27.25390625, -26.10595703125, -24.9580078125, -23.81005859375, -22.662109375, -21.51416015625, -20.3662109375, -19.21826171875, -18.0703125, -16.92236328125, -15.7744140625, -14.62646484375, -13.478515625, -12.33056640625, -11.1826171875, -10.03466796875, -8.88671875, -7.73876953125, -6.5908203125, -5.44287109375, -4.294921875, -3.14697265625, -1.9990234375, -0.85107421875, 0.296875, 1.44482421875, 2.5927734375, 3.74072265625, 4.888671875, 6.03662109375, 7.1845703125, 8.33251953125, 9.48046875, 10.62841796875, 11.7763671875, 12.92431640625, 14.072265625, 15.22021484375, 16.3681640625, 17.51611328125, 18.6640625, 19.81201171875, 20.9599609375, 22.10791015625, 23.255859375, 24.40380859375, 25.5517578125, 26.69970703125, 27.84765625, 28.99560546875, 30.1435546875, 31.29150390625, 32.439453125, 33.58740234375, 34.7353515625, 35.88330078125, 37.03125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 6.0, 7.0, 13.0, 8.0, 13.0, 12.0, 20.0, 26.0, 31.0, 39.0, 29.0, 29.0, 35.0, 44.0, 35.0, 46.0, 32.0, 36.0, 27.0, 40.0, 42.0, 48.0, 37.0, 36.0, 27.0, 30.0, 43.0, 39.0, 27.0, 24.0, 16.0, 15.0, 11.0, 10.0, 5.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.34375, -15.7919921875, -15.240234375, -14.6884765625, -14.13671875, -13.5849609375, -13.033203125, -12.4814453125, -11.9296875, -11.3779296875, -10.826171875, -10.2744140625, -9.72265625, -9.1708984375, -8.619140625, -8.0673828125, -7.515625, -6.9638671875, -6.412109375, -5.8603515625, -5.30859375, -4.7568359375, -4.205078125, -3.6533203125, -3.1015625, -2.5498046875, -1.998046875, -1.4462890625, -0.89453125, -0.3427734375, 0.208984375, 0.7607421875, 1.3125, 1.8642578125, 2.416015625, 2.9677734375, 3.51953125, 4.0712890625, 4.623046875, 5.1748046875, 5.7265625, 6.2783203125, 6.830078125, 7.3818359375, 7.93359375, 8.4853515625, 9.037109375, 9.5888671875, 10.140625, 10.6923828125, 11.244140625, 11.7958984375, 12.34765625, 12.8994140625, 13.451171875, 14.0029296875, 14.5546875, 15.1064453125, 15.658203125, 16.2099609375, 16.76171875, 17.3134765625, 17.865234375, 18.4169921875, 18.96875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 8.0, 14.0, 23.0, 21.0, 44.0, 66.0, 68.0, 122.0, 185.0, 291.0, 395.0, 608.0, 1017.0, 1666.0, 3040.0, 5700.0, 11886.0, 27226.0, 70105.0, 209928.0, 423218.0, 183367.0, 62248.0, 24285.0, 10688.0, 5259.0, 2680.0, 1602.0, 951.0, 580.0, 409.0, 269.0, 171.0, 125.0, 92.0, 60.0, 41.0, 33.0, 20.0, 10.0, 12.0, 6.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.109375, -20.392333984375, -19.67529296875, -18.958251953125, -18.2412109375, -17.524169921875, -16.80712890625, -16.090087890625, -15.373046875, -14.656005859375, -13.93896484375, -13.221923828125, -12.5048828125, -11.787841796875, -11.07080078125, -10.353759765625, -9.63671875, -8.919677734375, -8.20263671875, -7.485595703125, -6.7685546875, -6.051513671875, -5.33447265625, -4.617431640625, -3.900390625, -3.183349609375, -2.46630859375, -1.749267578125, -1.0322265625, -0.315185546875, 0.40185546875, 1.118896484375, 1.8359375, 2.552978515625, 3.27001953125, 3.987060546875, 4.7041015625, 5.421142578125, 6.13818359375, 6.855224609375, 7.572265625, 8.289306640625, 9.00634765625, 9.723388671875, 10.4404296875, 11.157470703125, 11.87451171875, 12.591552734375, 13.30859375, 14.025634765625, 14.74267578125, 15.459716796875, 16.1767578125, 16.893798828125, 17.61083984375, 18.327880859375, 19.044921875, 19.761962890625, 20.47900390625, 21.196044921875, 21.9130859375, 22.630126953125, 23.34716796875, 24.064208984375, 24.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 5.0, 13.0, 10.0, 27.0, 39.0, 54.0, 81.0, 125.0, 201.0, 166.0, 106.0, 57.0, 35.0, 20.0, 16.0, 11.0, 7.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.002658754587173462, -0.0025690197944641113, -0.0024792850017547607, -0.00238955020904541, -0.0022998154163360596, -0.002210080623626709, -0.0021203458309173584, -0.002030611038208008, -0.0019408762454986572, -0.0018511414527893066, -0.001761406660079956, -0.0016716718673706055, -0.0015819370746612549, -0.0014922022819519043, -0.0014024674892425537, -0.0013127326965332031, -0.0012229979038238525, -0.001133263111114502, -0.0010435283184051514, -0.0009537935256958008, -0.0008640587329864502, -0.0007743239402770996, -0.000684589147567749, -0.0005948543548583984, -0.0005051195621490479, -0.00041538476943969727, -0.0003256499767303467, -0.0002359151840209961, -0.0001461803913116455, -5.644559860229492e-05, 3.3289194107055664e-05, 0.00012302398681640625, 0.00021275877952575684, 0.0003024935722351074, 0.000392228364944458, 0.0004819631576538086, 0.0005716979503631592, 0.0006614327430725098, 0.0007511675357818604, 0.0008409023284912109, 0.0009306371212005615, 0.0010203719139099121, 0.0011101067066192627, 0.0011998414993286133, 0.0012895762920379639, 0.0013793110847473145, 0.001469045877456665, 0.0015587806701660156, 0.0016485154628753662, 0.0017382502555847168, 0.0018279850482940674, 0.001917719841003418, 0.0020074546337127686, 0.002097189426422119, 0.0021869242191314697, 0.0022766590118408203, 0.002366393804550171, 0.0024561285972595215, 0.002545863389968872, 0.0026355981826782227, 0.0027253329753875732, 0.002815067768096924, 0.0029048025608062744, 0.002994537353515625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 15.0, 23.0, 38.0, 37.0, 56.0, 79.0, 109.0, 137.0, 188.0, 315.0, 418.0, 631.0, 993.0, 1495.0, 2242.0, 3685.0, 6216.0, 10991.0, 19692.0, 37247.0, 74553.0, 156111.0, 280633.0, 225012.0, 109639.0, 53671.0, 27452.0, 15172.0, 8334.0, 4905.0, 2913.0, 1824.0, 1176.0, 790.0, 548.0, 364.0, 222.0, 167.0, 117.0, 81.0, 62.0, 48.0, 23.0, 33.0, 18.0, 18.0, 9.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0], "bins": [-14.78125, -14.28466796875, -13.7880859375, -13.29150390625, -12.794921875, -12.29833984375, -11.8017578125, -11.30517578125, -10.80859375, -10.31201171875, -9.8154296875, -9.31884765625, -8.822265625, -8.32568359375, -7.8291015625, -7.33251953125, -6.8359375, -6.33935546875, -5.8427734375, -5.34619140625, -4.849609375, -4.35302734375, -3.8564453125, -3.35986328125, -2.86328125, -2.36669921875, -1.8701171875, -1.37353515625, -0.876953125, -0.38037109375, 0.1162109375, 0.61279296875, 1.109375, 1.60595703125, 2.1025390625, 2.59912109375, 3.095703125, 3.59228515625, 4.0888671875, 4.58544921875, 5.08203125, 5.57861328125, 6.0751953125, 6.57177734375, 7.068359375, 7.56494140625, 8.0615234375, 8.55810546875, 9.0546875, 9.55126953125, 10.0478515625, 10.54443359375, 11.041015625, 11.53759765625, 12.0341796875, 12.53076171875, 13.02734375, 13.52392578125, 14.0205078125, 14.51708984375, 15.013671875, 15.51025390625, 16.0068359375, 16.50341796875, 17.0]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 3.0, 4.0, 12.0, 13.0, 10.0, 13.0, 13.0, 23.0, 15.0, 41.0, 32.0, 44.0, 60.0, 53.0, 82.0, 87.0, 80.0, 68.0, 53.0, 40.0, 34.0, 37.0, 26.0, 30.0, 21.0, 21.0, 12.0, 23.0, 12.0, 4.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.97265625, -4.8109130859375, -4.649169921875, -4.4874267578125, -4.32568359375, -4.1639404296875, -4.002197265625, -3.8404541015625, -3.6787109375, -3.5169677734375, -3.355224609375, -3.1934814453125, -3.03173828125, -2.8699951171875, -2.708251953125, -2.5465087890625, -2.384765625, -2.2230224609375, -2.061279296875, -1.8995361328125, -1.73779296875, -1.5760498046875, -1.414306640625, -1.2525634765625, -1.0908203125, -0.9290771484375, -0.767333984375, -0.6055908203125, -0.44384765625, -0.2821044921875, -0.120361328125, 0.0413818359375, 0.203125, 0.3648681640625, 0.526611328125, 0.6883544921875, 0.85009765625, 1.0118408203125, 1.173583984375, 1.3353271484375, 1.4970703125, 1.6588134765625, 1.820556640625, 1.9822998046875, 2.14404296875, 2.3057861328125, 2.467529296875, 2.6292724609375, 2.791015625, 2.9527587890625, 3.114501953125, 3.2762451171875, 3.43798828125, 3.5997314453125, 3.761474609375, 3.9232177734375, 4.0849609375, 4.2467041015625, 4.408447265625, 4.5701904296875, 4.73193359375, 4.8936767578125, 5.055419921875, 5.2171630859375, 5.37890625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 12.0, 14.0, 17.0, 24.0, 30.0, 35.0, 55.0, 40.0, 56.0, 76.0, 90.0, 67.0, 73.0, 64.0, 54.0, 52.0, 43.0, 39.0, 26.0, 20.0, 12.0, 14.0, 10.0, 7.0, 10.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.735443115234375, -35.59249496459961, -34.44954299926758, -33.30659484863281, -32.16364288330078, -31.020694732666016, -29.877744674682617, -28.73479461669922, -27.59184455871582, -26.448894500732422, -25.305944442749023, -24.162994384765625, -23.02004623413086, -21.877094268798828, -20.734146118164062, -19.591196060180664, -18.448246002197266, -17.305295944213867, -16.16234588623047, -15.019396781921387, -13.876446723937988, -12.73349666595459, -11.590547561645508, -10.44759750366211, -9.304647445678711, -8.161697387695312, -7.018747806549072, -5.875798225402832, -4.732848167419434, -3.589898109436035, -2.446948528289795, -1.3039989471435547, -0.16104507446289062, 0.9819047451019287, 2.124854564666748, 3.2678043842315674, 4.410754203796387, 5.553704261779785, 6.696653842926025, 7.839603424072266, 8.982553482055664, 10.125503540039062, 11.268453598022461, 12.411402702331543, 13.554352760314941, 14.69730281829834, 15.840251922607422, 16.98320198059082, 18.12615203857422, 19.269102096557617, 20.412052154541016, 21.555002212524414, 22.697952270507812, 23.840900421142578, 24.983850479125977, 26.126800537109375, 27.269750595092773, 28.412700653076172, 29.55565071105957, 30.69860076904297, 31.841548919677734, 32.984500885009766, 34.12744903564453, 35.27040100097656, 36.41334915161133]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 10.0, 10.0, 7.0, 10.0, 13.0, 13.0, 21.0, 23.0, 26.0, 29.0, 45.0, 35.0, 38.0, 33.0, 31.0, 45.0, 50.0, 40.0, 47.0, 37.0, 37.0, 39.0, 43.0, 43.0, 44.0, 25.0, 32.0, 26.0, 21.0, 29.0, 17.0, 17.0, 14.0, 7.0, 14.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.86671257019043, -25.917133331298828, -24.967554092407227, -24.017974853515625, -23.068397521972656, -22.118816375732422, -21.169239044189453, -20.21965980529785, -19.27008056640625, -18.32050132751465, -17.370922088623047, -16.421342849731445, -15.47176456451416, -14.522185325622559, -13.572607040405273, -12.623027801513672, -11.67344856262207, -10.723869323730469, -9.774290084838867, -8.824711799621582, -7.8751325607299805, -6.925553321838379, -5.9759745597839355, -5.026395797729492, -4.076816558837891, -3.127237558364868, -2.1776585578918457, -1.2280795574188232, -0.2785005569458008, 0.6710786819458008, 1.6206574440002441, 2.5702362060546875, 3.5198135375976562, 4.469392776489258, 5.418971538543701, 6.3685503005981445, 7.318129539489746, 8.267708778381348, 9.217287063598633, 10.166866302490234, 11.116445541381836, 12.066024780273438, 13.015604019165039, 13.965182304382324, 14.914761543273926, 15.864340782165527, 16.813919067382812, 17.763498306274414, 18.713077545166016, 19.662656784057617, 20.61223602294922, 21.56181526184082, 22.511394500732422, 23.46097183227539, 24.410551071166992, 25.360130310058594, 26.309709548950195, 27.259288787841797, 28.2088680267334, 29.158447265625, 30.10802459716797, 31.057605743408203, 32.00718307495117, 32.956764221191406, 33.906341552734375]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 12.0, 18.0, 19.0, 25.0, 44.0, 71.0, 76.0, 118.0, 197.0, 265.0, 390.0, 572.0, 816.0, 1203.0, 1902.0, 2836.0, 4372.0, 7179.0, 11711.0, 20385.0, 37611.0, 77496.0, 183391.0, 533117.0, 1277159.0, 1214469.0, 480743.0, 175517.0, 74058.0, 37242.0, 20494.0, 11794.0, 6987.0, 4307.0, 2668.0, 1668.0, 1178.0, 735.0, 471.0, 308.0, 209.0, 151.0, 91.0, 61.0, 47.0, 39.0, 18.0, 12.0, 8.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.5625, -31.39794921875, -30.2333984375, -29.06884765625, -27.904296875, -26.73974609375, -25.5751953125, -24.41064453125, -23.24609375, -22.08154296875, -20.9169921875, -19.75244140625, -18.587890625, -17.42333984375, -16.2587890625, -15.09423828125, -13.9296875, -12.76513671875, -11.6005859375, -10.43603515625, -9.271484375, -8.10693359375, -6.9423828125, -5.77783203125, -4.61328125, -3.44873046875, -2.2841796875, -1.11962890625, 0.044921875, 1.20947265625, 2.3740234375, 3.53857421875, 4.703125, 5.86767578125, 7.0322265625, 8.19677734375, 9.361328125, 10.52587890625, 11.6904296875, 12.85498046875, 14.01953125, 15.18408203125, 16.3486328125, 17.51318359375, 18.677734375, 19.84228515625, 21.0068359375, 22.17138671875, 23.3359375, 24.50048828125, 25.6650390625, 26.82958984375, 27.994140625, 29.15869140625, 30.3232421875, 31.48779296875, 32.65234375, 33.81689453125, 34.9814453125, 36.14599609375, 37.310546875, 38.47509765625, 39.6396484375, 40.80419921875, 41.96875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 5.0, 11.0, 9.0, 10.0, 18.0, 22.0, 25.0, 26.0, 28.0, 43.0, 47.0, 27.0, 52.0, 35.0, 49.0, 44.0, 51.0, 51.0, 38.0, 32.0, 52.0, 40.0, 39.0, 38.0, 32.0, 19.0, 23.0, 20.0, 34.0, 12.0, 14.0, 14.0, 5.0, 8.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.49072265625, -22.6064453125, -21.72216796875, -20.837890625, -19.95361328125, -19.0693359375, -18.18505859375, -17.30078125, -16.41650390625, -15.5322265625, -14.64794921875, -13.763671875, -12.87939453125, -11.9951171875, -11.11083984375, -10.2265625, -9.34228515625, -8.4580078125, -7.57373046875, -6.689453125, -5.80517578125, -4.9208984375, -4.03662109375, -3.15234375, -2.26806640625, -1.3837890625, -0.49951171875, 0.384765625, 1.26904296875, 2.1533203125, 3.03759765625, 3.921875, 4.80615234375, 5.6904296875, 6.57470703125, 7.458984375, 8.34326171875, 9.2275390625, 10.11181640625, 10.99609375, 11.88037109375, 12.7646484375, 13.64892578125, 14.533203125, 15.41748046875, 16.3017578125, 17.18603515625, 18.0703125, 18.95458984375, 19.8388671875, 20.72314453125, 21.607421875, 22.49169921875, 23.3759765625, 24.26025390625, 25.14453125, 26.02880859375, 26.9130859375, 27.79736328125, 28.681640625, 29.56591796875, 30.4501953125, 31.33447265625, 32.21875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 15.0, 18.0, 12.0, 25.0, 39.0, 65.0, 84.0, 125.0, 159.0, 239.0, 366.0, 577.0, 779.0, 1158.0, 1687.0, 2609.0, 3975.0, 6297.0, 10359.0, 16809.0, 28425.0, 50058.0, 93015.0, 182286.0, 385855.0, 886596.0, 1299613.0, 630591.0, 282965.0, 137642.0, 72103.0, 39403.0, 22726.0, 13624.0, 8399.0, 5280.0, 3483.0, 2263.0, 1458.0, 1006.0, 652.0, 471.0, 317.0, 197.0, 162.0, 101.0, 62.0, 44.0, 27.0, 19.0, 19.0, 14.0, 10.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.25, -36.0966796875, -34.943359375, -33.7900390625, -32.63671875, -31.4833984375, -30.330078125, -29.1767578125, -28.0234375, -26.8701171875, -25.716796875, -24.5634765625, -23.41015625, -22.2568359375, -21.103515625, -19.9501953125, -18.796875, -17.6435546875, -16.490234375, -15.3369140625, -14.18359375, -13.0302734375, -11.876953125, -10.7236328125, -9.5703125, -8.4169921875, -7.263671875, -6.1103515625, -4.95703125, -3.8037109375, -2.650390625, -1.4970703125, -0.34375, 0.8095703125, 1.962890625, 3.1162109375, 4.26953125, 5.4228515625, 6.576171875, 7.7294921875, 8.8828125, 10.0361328125, 11.189453125, 12.3427734375, 13.49609375, 14.6494140625, 15.802734375, 16.9560546875, 18.109375, 19.2626953125, 20.416015625, 21.5693359375, 22.72265625, 23.8759765625, 25.029296875, 26.1826171875, 27.3359375, 28.4892578125, 29.642578125, 30.7958984375, 31.94921875, 33.1025390625, 34.255859375, 35.4091796875, 36.5625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 12.0, 12.0, 14.0, 20.0, 18.0, 26.0, 34.0, 30.0, 38.0, 61.0, 82.0, 105.0, 119.0, 140.0, 189.0, 234.0, 268.0, 330.0, 370.0, 346.0, 281.0, 256.0, 191.0, 164.0, 134.0, 129.0, 88.0, 84.0, 52.0, 44.0, 39.0, 34.0, 28.0, 28.0, 15.0, 13.0, 6.0, 7.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.78125, -12.3785400390625, -11.975830078125, -11.5731201171875, -11.17041015625, -10.7677001953125, -10.364990234375, -9.9622802734375, -9.5595703125, -9.1568603515625, -8.754150390625, -8.3514404296875, -7.94873046875, -7.5460205078125, -7.143310546875, -6.7406005859375, -6.337890625, -5.9351806640625, -5.532470703125, -5.1297607421875, -4.72705078125, -4.3243408203125, -3.921630859375, -3.5189208984375, -3.1162109375, -2.7135009765625, -2.310791015625, -1.9080810546875, -1.50537109375, -1.1026611328125, -0.699951171875, -0.2972412109375, 0.10546875, 0.5081787109375, 0.910888671875, 1.3135986328125, 1.71630859375, 2.1190185546875, 2.521728515625, 2.9244384765625, 3.3271484375, 3.7298583984375, 4.132568359375, 4.5352783203125, 4.93798828125, 5.3406982421875, 5.743408203125, 6.1461181640625, 6.548828125, 6.9515380859375, 7.354248046875, 7.7569580078125, 8.15966796875, 8.5623779296875, 8.965087890625, 9.3677978515625, 9.7705078125, 10.1732177734375, 10.575927734375, 10.9786376953125, 11.38134765625, 11.7840576171875, 12.186767578125, 12.5894775390625, 12.9921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 12.0, 17.0, 15.0, 19.0, 28.0, 37.0, 43.0, 58.0, 71.0, 67.0, 68.0, 61.0, 60.0, 71.0, 71.0, 52.0, 51.0, 33.0, 29.0, 24.0, 21.0, 14.0, 7.0, 12.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9119758605957, -35.81083679199219, -34.709693908691406, -33.60855484008789, -32.507415771484375, -31.406272888183594, -30.305133819580078, -29.20399284362793, -28.10285186767578, -27.001710891723633, -25.900569915771484, -24.79943084716797, -23.69828987121582, -22.597148895263672, -21.496009826660156, -20.394868850708008, -19.29372787475586, -18.19258689880371, -17.091445922851562, -15.990306854248047, -14.889165878295898, -13.78802490234375, -12.686884880065918, -11.585744857788086, -10.484603881835938, -9.383462905883789, -8.282322883605957, -7.181182384490967, -6.080041885375977, -4.978901386260986, -3.877760887145996, -2.776620388031006, -1.6754798889160156, -0.5743393898010254, 0.5268011093139648, 1.627941608428955, 2.7290821075439453, 3.8302226066589355, 4.931363105773926, 6.032503604888916, 7.133644104003906, 8.234785079956055, 9.335925102233887, 10.437065124511719, 11.538206100463867, 12.639347076416016, 13.740487098693848, 14.84162712097168, 15.942768096923828, 17.043909072875977, 18.145050048828125, 19.24618911743164, 20.34733009338379, 21.448471069335938, 22.549610137939453, 23.6507511138916, 24.75189208984375, 25.8530330657959, 26.954174041748047, 28.055313110351562, 29.15645408630371, 30.25759506225586, 31.358734130859375, 32.459877014160156, 33.56101608276367]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 12.0, 9.0, 10.0, 8.0, 18.0, 15.0, 28.0, 21.0, 23.0, 31.0, 32.0, 37.0, 24.0, 32.0, 31.0, 36.0, 45.0, 53.0, 38.0, 37.0, 34.0, 60.0, 27.0, 35.0, 24.0, 29.0, 34.0, 30.0, 20.0, 30.0, 17.0, 25.0, 15.0, 11.0, 10.0, 8.0, 10.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.57047462463379, -25.722055435180664, -24.87363624572754, -24.025217056274414, -23.17679786682129, -22.328378677368164, -21.47995948791504, -20.631540298461914, -19.78312110900879, -18.934701919555664, -18.08628273010254, -17.237863540649414, -16.38944435119629, -15.541025161743164, -14.692605972290039, -13.844186782836914, -12.995767593383789, -12.147348403930664, -11.298929214477539, -10.450510025024414, -9.602090835571289, -8.753671646118164, -7.905252456665039, -7.056833267211914, -6.208414077758789, -5.359994888305664, -4.511575698852539, -3.663156509399414, -2.814737319946289, -1.966318130493164, -1.117898941040039, -0.26947975158691406, 0.5789413452148438, 1.4273605346679688, 2.2757797241210938, 3.1241989135742188, 3.9726181030273438, 4.821037292480469, 5.669456481933594, 6.517875671386719, 7.366294860839844, 8.214714050292969, 9.063133239746094, 9.911552429199219, 10.759971618652344, 11.608390808105469, 12.456809997558594, 13.305229187011719, 14.153648376464844, 15.002067565917969, 15.850486755371094, 16.69890594482422, 17.547325134277344, 18.39574432373047, 19.244163513183594, 20.09258270263672, 20.941001892089844, 21.78942108154297, 22.637840270996094, 23.48625946044922, 24.334678649902344, 25.18309783935547, 26.031517028808594, 26.87993621826172, 27.728355407714844]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 15.0, 16.0, 27.0, 44.0, 45.0, 70.0, 96.0, 143.0, 184.0, 309.0, 418.0, 566.0, 819.0, 1226.0, 1890.0, 2784.0, 4068.0, 6376.0, 9887.0, 15692.0, 24234.0, 39118.0, 65207.0, 112547.0, 192558.0, 222163.0, 138914.0, 79704.0, 47739.0, 29465.0, 18334.0, 11453.0, 7454.0, 4921.0, 3231.0, 2199.0, 1477.0, 956.0, 679.0, 451.0, 321.0, 238.0, 153.0, 100.0, 88.0, 51.0, 31.0, 23.0, 26.0, 16.0, 6.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0], "bins": [-18.453125, -17.8798828125, -17.306640625, -16.7333984375, -16.16015625, -15.5869140625, -15.013671875, -14.4404296875, -13.8671875, -13.2939453125, -12.720703125, -12.1474609375, -11.57421875, -11.0009765625, -10.427734375, -9.8544921875, -9.28125, -8.7080078125, -8.134765625, -7.5615234375, -6.98828125, -6.4150390625, -5.841796875, -5.2685546875, -4.6953125, -4.1220703125, -3.548828125, -2.9755859375, -2.40234375, -1.8291015625, -1.255859375, -0.6826171875, -0.109375, 0.4638671875, 1.037109375, 1.6103515625, 2.18359375, 2.7568359375, 3.330078125, 3.9033203125, 4.4765625, 5.0498046875, 5.623046875, 6.1962890625, 6.76953125, 7.3427734375, 7.916015625, 8.4892578125, 9.0625, 9.6357421875, 10.208984375, 10.7822265625, 11.35546875, 11.9287109375, 12.501953125, 13.0751953125, 13.6484375, 14.2216796875, 14.794921875, 15.3681640625, 15.94140625, 16.5146484375, 17.087890625, 17.6611328125, 18.234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 7.0, 13.0, 6.0, 13.0, 21.0, 26.0, 31.0, 33.0, 31.0, 35.0, 31.0, 31.0, 26.0, 30.0, 36.0, 51.0, 46.0, 38.0, 51.0, 42.0, 50.0, 33.0, 33.0, 27.0, 32.0, 22.0, 29.0, 22.0, 19.0, 15.0, 18.0, 15.0, 11.0, 9.0, 5.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-27.8125, -26.935546875, -26.05859375, -25.181640625, -24.3046875, -23.427734375, -22.55078125, -21.673828125, -20.796875, -19.919921875, -19.04296875, -18.166015625, -17.2890625, -16.412109375, -15.53515625, -14.658203125, -13.78125, -12.904296875, -12.02734375, -11.150390625, -10.2734375, -9.396484375, -8.51953125, -7.642578125, -6.765625, -5.888671875, -5.01171875, -4.134765625, -3.2578125, -2.380859375, -1.50390625, -0.626953125, 0.25, 1.126953125, 2.00390625, 2.880859375, 3.7578125, 4.634765625, 5.51171875, 6.388671875, 7.265625, 8.142578125, 9.01953125, 9.896484375, 10.7734375, 11.650390625, 12.52734375, 13.404296875, 14.28125, 15.158203125, 16.03515625, 16.912109375, 17.7890625, 18.666015625, 19.54296875, 20.419921875, 21.296875, 22.173828125, 23.05078125, 23.927734375, 24.8046875, 25.681640625, 26.55859375, 27.435546875, 28.3125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 15.0, 22.0, 24.0, 53.0, 60.0, 118.0, 158.0, 220.0, 375.0, 620.0, 899.0, 1390.0, 2304.0, 3907.0, 6554.0, 11660.0, 21292.0, 41404.0, 89085.0, 231667.0, 359984.0, 146292.0, 61939.0, 30226.0, 16078.0, 8808.0, 5171.0, 3117.0, 1833.0, 1200.0, 704.0, 448.0, 321.0, 201.0, 122.0, 77.0, 51.0, 40.0, 27.0, 19.0, 20.0, 14.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0], "bins": [-38.0, -36.952392578125, -35.90478515625, -34.857177734375, -33.8095703125, -32.761962890625, -31.71435546875, -30.666748046875, -29.619140625, -28.571533203125, -27.52392578125, -26.476318359375, -25.4287109375, -24.381103515625, -23.33349609375, -22.285888671875, -21.23828125, -20.190673828125, -19.14306640625, -18.095458984375, -17.0478515625, -16.000244140625, -14.95263671875, -13.905029296875, -12.857421875, -11.809814453125, -10.76220703125, -9.714599609375, -8.6669921875, -7.619384765625, -6.57177734375, -5.524169921875, -4.4765625, -3.428955078125, -2.38134765625, -1.333740234375, -0.2861328125, 0.761474609375, 1.80908203125, 2.856689453125, 3.904296875, 4.951904296875, 5.99951171875, 7.047119140625, 8.0947265625, 9.142333984375, 10.18994140625, 11.237548828125, 12.28515625, 13.332763671875, 14.38037109375, 15.427978515625, 16.4755859375, 17.523193359375, 18.57080078125, 19.618408203125, 20.666015625, 21.713623046875, 22.76123046875, 23.808837890625, 24.8564453125, 25.904052734375, 26.95166015625, 27.999267578125, 29.046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 18.0, 11.0, 19.0, 14.0, 19.0, 26.0, 29.0, 15.0, 30.0, 30.0, 40.0, 41.0, 40.0, 42.0, 38.0, 45.0, 44.0, 35.0, 44.0, 34.0, 30.0, 35.0, 31.0, 33.0, 30.0, 27.0, 26.0, 24.0, 19.0, 13.0, 26.0, 13.0, 9.0, 7.0, 7.0, 7.0, 9.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-18.28125, -17.7333984375, -17.185546875, -16.6376953125, -16.08984375, -15.5419921875, -14.994140625, -14.4462890625, -13.8984375, -13.3505859375, -12.802734375, -12.2548828125, -11.70703125, -11.1591796875, -10.611328125, -10.0634765625, -9.515625, -8.9677734375, -8.419921875, -7.8720703125, -7.32421875, -6.7763671875, -6.228515625, -5.6806640625, -5.1328125, -4.5849609375, -4.037109375, -3.4892578125, -2.94140625, -2.3935546875, -1.845703125, -1.2978515625, -0.75, -0.2021484375, 0.345703125, 0.8935546875, 1.44140625, 1.9892578125, 2.537109375, 3.0849609375, 3.6328125, 4.1806640625, 4.728515625, 5.2763671875, 5.82421875, 6.3720703125, 6.919921875, 7.4677734375, 8.015625, 8.5634765625, 9.111328125, 9.6591796875, 10.20703125, 10.7548828125, 11.302734375, 11.8505859375, 12.3984375, 12.9462890625, 13.494140625, 14.0419921875, 14.58984375, 15.1376953125, 15.685546875, 16.2333984375, 16.78125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 14.0, 34.0, 29.0, 69.0, 94.0, 169.0, 303.0, 586.0, 1068.0, 2033.0, 4140.0, 9580.0, 24473.0, 73042.0, 253905.0, 444599.0, 156431.0, 47178.0, 17187.0, 6979.0, 3239.0, 1493.0, 796.0, 451.0, 240.0, 124.0, 88.0, 48.0, 33.0, 32.0, 17.0, 9.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.421875, -10.126708984375, -9.83154296875, -9.536376953125, -9.2412109375, -8.946044921875, -8.65087890625, -8.355712890625, -8.060546875, -7.765380859375, -7.47021484375, -7.175048828125, -6.8798828125, -6.584716796875, -6.28955078125, -5.994384765625, -5.69921875, -5.404052734375, -5.10888671875, -4.813720703125, -4.5185546875, -4.223388671875, -3.92822265625, -3.633056640625, -3.337890625, -3.042724609375, -2.74755859375, -2.452392578125, -2.1572265625, -1.862060546875, -1.56689453125, -1.271728515625, -0.9765625, -0.681396484375, -0.38623046875, -0.091064453125, 0.2041015625, 0.499267578125, 0.79443359375, 1.089599609375, 1.384765625, 1.679931640625, 1.97509765625, 2.270263671875, 2.5654296875, 2.860595703125, 3.15576171875, 3.450927734375, 3.74609375, 4.041259765625, 4.33642578125, 4.631591796875, 4.9267578125, 5.221923828125, 5.51708984375, 5.812255859375, 6.107421875, 6.402587890625, 6.69775390625, 6.992919921875, 7.2880859375, 7.583251953125, 7.87841796875, 8.173583984375, 8.46875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 17.0, 20.0, 32.0, 43.0, 53.0, 82.0, 77.0, 106.0, 96.0, 87.0, 97.0, 87.0, 42.0, 29.0, 25.0, 19.0, 15.0, 15.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005488395690917969, -0.0005241706967353821, -0.0004995018243789673, -0.0004748329520225525, -0.0004501640796661377, -0.0004254952073097229, -0.0004008263349533081, -0.0003761574625968933, -0.0003514885902404785, -0.0003268197178840637, -0.0003021508455276489, -0.00027748197317123413, -0.00025281310081481934, -0.00022814422845840454, -0.00020347535610198975, -0.00017880648374557495, -0.00015413761138916016, -0.00012946873903274536, -0.00010479986667633057, -8.013099431991577e-05, -5.5462121963500977e-05, -3.079324960708618e-05, -6.124377250671387e-06, 1.8544495105743408e-05, 4.32133674621582e-05, 6.7882239818573e-05, 9.255111217498779e-05, 0.00011721998453140259, 0.00014188885688781738, 0.00016655772924423218, 0.00019122660160064697, 0.00021589547395706177, 0.00024056434631347656, 0.00026523321866989136, 0.00028990209102630615, 0.00031457096338272095, 0.00033923983573913574, 0.00036390870809555054, 0.00038857758045196533, 0.0004132464528083801, 0.0004379153251647949, 0.0004625841975212097, 0.0004872530698776245, 0.0005119219422340393, 0.0005365908145904541, 0.0005612596869468689, 0.0005859285593032837, 0.0006105974316596985, 0.0006352663040161133, 0.0006599351763725281, 0.0006846040487289429, 0.0007092729210853577, 0.0007339417934417725, 0.0007586106657981873, 0.000783279538154602, 0.0008079484105110168, 0.0008326172828674316, 0.0008572861552238464, 0.0008819550275802612, 0.000906623899936676, 0.0009312927722930908, 0.0009559616446495056, 0.0009806305170059204, 0.0010052993893623352, 0.00102996826171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 17.0, 17.0, 42.0, 32.0, 50.0, 46.0, 96.0, 141.0, 219.0, 256.0, 487.0, 758.0, 1385.0, 2547.0, 5326.0, 11856.0, 28825.0, 76813.0, 216077.0, 383154.0, 199802.0, 71561.0, 26952.0, 11196.0, 5057.0, 2501.0, 1269.0, 695.0, 453.0, 247.0, 173.0, 141.0, 102.0, 57.0, 41.0, 41.0, 19.0, 22.0, 14.0, 5.0, 10.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-11.6484375, -11.3104248046875, -10.972412109375, -10.6343994140625, -10.29638671875, -9.9583740234375, -9.620361328125, -9.2823486328125, -8.9443359375, -8.6063232421875, -8.268310546875, -7.9302978515625, -7.59228515625, -7.2542724609375, -6.916259765625, -6.5782470703125, -6.240234375, -5.9022216796875, -5.564208984375, -5.2261962890625, -4.88818359375, -4.5501708984375, -4.212158203125, -3.8741455078125, -3.5361328125, -3.1981201171875, -2.860107421875, -2.5220947265625, -2.18408203125, -1.8460693359375, -1.508056640625, -1.1700439453125, -0.83203125, -0.4940185546875, -0.156005859375, 0.1820068359375, 0.52001953125, 0.8580322265625, 1.196044921875, 1.5340576171875, 1.8720703125, 2.2100830078125, 2.548095703125, 2.8861083984375, 3.22412109375, 3.5621337890625, 3.900146484375, 4.2381591796875, 4.576171875, 4.9141845703125, 5.252197265625, 5.5902099609375, 5.92822265625, 6.2662353515625, 6.604248046875, 6.9422607421875, 7.2802734375, 7.6182861328125, 7.956298828125, 8.2943115234375, 8.63232421875, 8.9703369140625, 9.308349609375, 9.6463623046875, 9.984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 0.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 15.0, 29.0, 23.0, 45.0, 44.0, 60.0, 77.0, 71.0, 92.0, 101.0, 71.0, 67.0, 53.0, 36.0, 32.0, 29.0, 21.0, 19.0, 16.0, 11.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.2362060546875, -2.156005859375, -2.0758056640625, -1.99560546875, -1.9154052734375, -1.835205078125, -1.7550048828125, -1.6748046875, -1.5946044921875, -1.514404296875, -1.4342041015625, -1.35400390625, -1.2738037109375, -1.193603515625, -1.1134033203125, -1.033203125, -0.9530029296875, -0.872802734375, -0.7926025390625, -0.71240234375, -0.6322021484375, -0.552001953125, -0.4718017578125, -0.3916015625, -0.3114013671875, -0.231201171875, -0.1510009765625, -0.07080078125, 0.0093994140625, 0.089599609375, 0.1697998046875, 0.25, 0.3302001953125, 0.410400390625, 0.4906005859375, 0.57080078125, 0.6510009765625, 0.731201171875, 0.8114013671875, 0.8916015625, 0.9718017578125, 1.052001953125, 1.1322021484375, 1.21240234375, 1.2926025390625, 1.372802734375, 1.4530029296875, 1.533203125, 1.6134033203125, 1.693603515625, 1.7738037109375, 1.85400390625, 1.9342041015625, 2.014404296875, 2.0946044921875, 2.1748046875, 2.2550048828125, 2.335205078125, 2.4154052734375, 2.49560546875, 2.5758056640625, 2.656005859375, 2.7362060546875, 2.81640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 8.0, 7.0, 17.0, 14.0, 13.0, 25.0, 32.0, 44.0, 44.0, 53.0, 69.0, 70.0, 64.0, 66.0, 56.0, 57.0, 79.0, 63.0, 35.0, 37.0, 31.0, 20.0, 20.0, 15.0, 9.0, 8.0, 10.0, 4.0, 1.0, 7.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.088653564453125, -34.002357482910156, -32.91605758666992, -31.829761505126953, -30.74346351623535, -29.65716552734375, -28.57086944580078, -27.48457145690918, -26.398273468017578, -25.311975479125977, -24.225677490234375, -23.139381408691406, -22.053083419799805, -20.966785430908203, -19.880489349365234, -18.794191360473633, -17.70789337158203, -16.62159538269043, -15.535298347473145, -14.44900131225586, -13.362703323364258, -12.276405334472656, -11.190108299255371, -10.103811264038086, -9.017513275146484, -7.931215763092041, -6.844918251037598, -5.758620738983154, -4.672323226928711, -3.5860257148742676, -2.499728202819824, -1.4134306907653809, -0.3271331787109375, 0.7591643333435059, 1.8454618453979492, 2.9317593574523926, 4.018056869506836, 5.104354381561279, 6.190651893615723, 7.276949405670166, 8.36324691772461, 9.449544906616211, 10.535841941833496, 11.622138977050781, 12.708436965942383, 13.794734954833984, 14.88103199005127, 15.967329025268555, 17.053627014160156, 18.139925003051758, 19.22622299194336, 20.312519073486328, 21.39881706237793, 22.48511505126953, 23.5714111328125, 24.6577091217041, 25.744007110595703, 26.830305099487305, 27.916603088378906, 29.002899169921875, 30.089197158813477, 31.175495147705078, 32.26179122924805, 33.34809112548828, 34.43438720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 10.0, 10.0, 10.0, 16.0, 16.0, 25.0, 18.0, 33.0, 36.0, 31.0, 28.0, 28.0, 29.0, 35.0, 38.0, 41.0, 47.0, 41.0, 38.0, 39.0, 47.0, 40.0, 30.0, 29.0, 24.0, 35.0, 27.0, 25.0, 22.0, 27.0, 17.0, 17.0, 12.0, 7.0, 12.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.153217315673828, -25.315322875976562, -24.477428436279297, -23.639535903930664, -22.8016414642334, -21.963747024536133, -21.1258544921875, -20.287960052490234, -19.45006561279297, -18.612171173095703, -17.774276733398438, -16.936384201049805, -16.09848976135254, -15.260595321655273, -14.422701835632324, -13.584808349609375, -12.74691390991211, -11.909019470214844, -11.071125984191895, -10.233232498168945, -9.39533805847168, -8.557443618774414, -7.719550132751465, -6.881656169891357, -6.04376220703125, -5.205868244171143, -4.367974281311035, -3.5300803184509277, -2.6921863555908203, -1.854292392730713, -1.0163984298706055, -0.17850446701049805, 0.6593914031982422, 1.4972853660583496, 2.335179328918457, 3.1730732917785645, 4.010967254638672, 4.848861217498779, 5.686755180358887, 6.524649143218994, 7.362543106079102, 8.200437545776367, 9.038331031799316, 9.876224517822266, 10.714118957519531, 11.552013397216797, 12.389906883239746, 13.227800369262695, 14.065694808959961, 14.903589248657227, 15.741482734680176, 16.579376220703125, 17.41727066040039, 18.255165100097656, 19.093059539794922, 19.930952072143555, 20.76884651184082, 21.606740951538086, 22.44463348388672, 23.282527923583984, 24.12042236328125, 24.958316802978516, 25.79621124267578, 26.634103775024414, 27.47199821472168]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 6.0, 11.0, 10.0, 30.0, 42.0, 66.0, 77.0, 115.0, 167.0, 243.0, 438.0, 580.0, 929.0, 1464.0, 2248.0, 3696.0, 5803.0, 9707.0, 16143.0, 28077.0, 49471.0, 89902.0, 163310.0, 240956.0, 189486.0, 106744.0, 58149.0, 32629.0, 18789.0, 10990.0, 6740.0, 4184.0, 2607.0, 1676.0, 1039.0, 693.0, 430.0, 300.0, 199.0, 150.0, 75.0, 62.0, 36.0, 20.0, 19.0, 12.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.9375, -35.73193359375, -34.5263671875, -33.32080078125, -32.115234375, -30.90966796875, -29.7041015625, -28.49853515625, -27.29296875, -26.08740234375, -24.8818359375, -23.67626953125, -22.470703125, -21.26513671875, -20.0595703125, -18.85400390625, -17.6484375, -16.44287109375, -15.2373046875, -14.03173828125, -12.826171875, -11.62060546875, -10.4150390625, -9.20947265625, -8.00390625, -6.79833984375, -5.5927734375, -4.38720703125, -3.181640625, -1.97607421875, -0.7705078125, 0.43505859375, 1.640625, 2.84619140625, 4.0517578125, 5.25732421875, 6.462890625, 7.66845703125, 8.8740234375, 10.07958984375, 11.28515625, 12.49072265625, 13.6962890625, 14.90185546875, 16.107421875, 17.31298828125, 18.5185546875, 19.72412109375, 20.9296875, 22.13525390625, 23.3408203125, 24.54638671875, 25.751953125, 26.95751953125, 28.1630859375, 29.36865234375, 30.57421875, 31.77978515625, 32.9853515625, 34.19091796875, 35.396484375, 36.60205078125, 37.8076171875, 39.01318359375, 40.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 14.0, 12.0, 9.0, 10.0, 13.0, 12.0, 19.0, 20.0, 35.0, 35.0, 36.0, 35.0, 29.0, 33.0, 26.0, 41.0, 51.0, 44.0, 48.0, 48.0, 43.0, 30.0, 52.0, 38.0, 24.0, 32.0, 26.0, 27.0, 22.0, 19.0, 27.0, 16.0, 19.0, 14.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.515625, -26.6328125, -25.75, -24.8671875, -23.984375, -23.1015625, -22.21875, -21.3359375, -20.453125, -19.5703125, -18.6875, -17.8046875, -16.921875, -16.0390625, -15.15625, -14.2734375, -13.390625, -12.5078125, -11.625, -10.7421875, -9.859375, -8.9765625, -8.09375, -7.2109375, -6.328125, -5.4453125, -4.5625, -3.6796875, -2.796875, -1.9140625, -1.03125, -0.1484375, 0.734375, 1.6171875, 2.5, 3.3828125, 4.265625, 5.1484375, 6.03125, 6.9140625, 7.796875, 8.6796875, 9.5625, 10.4453125, 11.328125, 12.2109375, 13.09375, 13.9765625, 14.859375, 15.7421875, 16.625, 17.5078125, 18.390625, 19.2734375, 20.15625, 21.0390625, 21.921875, 22.8046875, 23.6875, 24.5703125, 25.453125, 26.3359375, 27.21875, 28.1015625, 28.984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 9.0, 19.0, 30.0, 45.0, 50.0, 80.0, 100.0, 136.0, 198.0, 285.0, 390.0, 628.0, 905.0, 1238.0, 1957.0, 2678.0, 3993.0, 5928.0, 9163.0, 14176.0, 22019.0, 33987.0, 54456.0, 86907.0, 132918.0, 177215.0, 168148.0, 119601.0, 76215.0, 48193.0, 30421.0, 19134.0, 12442.0, 8096.0, 5322.0, 3658.0, 2421.0, 1627.0, 1078.0, 852.0, 543.0, 395.0, 272.0, 189.0, 125.0, 85.0, 65.0, 52.0, 26.0, 31.0, 11.0, 14.0, 8.0, 11.0, 3.0, 1.0, 2.0, 3.0], "bins": [-32.53125, -31.51025390625, -30.4892578125, -29.46826171875, -28.447265625, -27.42626953125, -26.4052734375, -25.38427734375, -24.36328125, -23.34228515625, -22.3212890625, -21.30029296875, -20.279296875, -19.25830078125, -18.2373046875, -17.21630859375, -16.1953125, -15.17431640625, -14.1533203125, -13.13232421875, -12.111328125, -11.09033203125, -10.0693359375, -9.04833984375, -8.02734375, -7.00634765625, -5.9853515625, -4.96435546875, -3.943359375, -2.92236328125, -1.9013671875, -0.88037109375, 0.140625, 1.16162109375, 2.1826171875, 3.20361328125, 4.224609375, 5.24560546875, 6.2666015625, 7.28759765625, 8.30859375, 9.32958984375, 10.3505859375, 11.37158203125, 12.392578125, 13.41357421875, 14.4345703125, 15.45556640625, 16.4765625, 17.49755859375, 18.5185546875, 19.53955078125, 20.560546875, 21.58154296875, 22.6025390625, 23.62353515625, 24.64453125, 25.66552734375, 26.6865234375, 27.70751953125, 28.728515625, 29.74951171875, 30.7705078125, 31.79150390625, 32.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 8.0, 10.0, 19.0, 15.0, 16.0, 22.0, 23.0, 29.0, 35.0, 41.0, 42.0, 44.0, 29.0, 40.0, 57.0, 49.0, 35.0, 46.0, 50.0, 51.0, 44.0, 34.0, 32.0, 36.0, 29.0, 28.0, 18.0, 20.0, 13.0, 10.0, 11.0, 12.0, 8.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.2021484375, -20.560546875, -19.9189453125, -19.27734375, -18.6357421875, -17.994140625, -17.3525390625, -16.7109375, -16.0693359375, -15.427734375, -14.7861328125, -14.14453125, -13.5029296875, -12.861328125, -12.2197265625, -11.578125, -10.9365234375, -10.294921875, -9.6533203125, -9.01171875, -8.3701171875, -7.728515625, -7.0869140625, -6.4453125, -5.8037109375, -5.162109375, -4.5205078125, -3.87890625, -3.2373046875, -2.595703125, -1.9541015625, -1.3125, -0.6708984375, -0.029296875, 0.6123046875, 1.25390625, 1.8955078125, 2.537109375, 3.1787109375, 3.8203125, 4.4619140625, 5.103515625, 5.7451171875, 6.38671875, 7.0283203125, 7.669921875, 8.3115234375, 8.953125, 9.5947265625, 10.236328125, 10.8779296875, 11.51953125, 12.1611328125, 12.802734375, 13.4443359375, 14.0859375, 14.7275390625, 15.369140625, 16.0107421875, 16.65234375, 17.2939453125, 17.935546875, 18.5771484375, 19.21875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 18.0, 23.0, 57.0, 68.0, 127.0, 163.0, 285.0, 440.0, 856.0, 1379.0, 2435.0, 4581.0, 9096.0, 18975.0, 42703.0, 102665.0, 258287.0, 340391.0, 151950.0, 61396.0, 26562.0, 12362.0, 6187.0, 3248.0, 1709.0, 991.0, 584.0, 350.0, 206.0, 124.0, 95.0, 68.0, 50.0, 23.0, 18.0, 13.0, 14.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.21875, -17.61572265625, -17.0126953125, -16.40966796875, -15.806640625, -15.20361328125, -14.6005859375, -13.99755859375, -13.39453125, -12.79150390625, -12.1884765625, -11.58544921875, -10.982421875, -10.37939453125, -9.7763671875, -9.17333984375, -8.5703125, -7.96728515625, -7.3642578125, -6.76123046875, -6.158203125, -5.55517578125, -4.9521484375, -4.34912109375, -3.74609375, -3.14306640625, -2.5400390625, -1.93701171875, -1.333984375, -0.73095703125, -0.1279296875, 0.47509765625, 1.078125, 1.68115234375, 2.2841796875, 2.88720703125, 3.490234375, 4.09326171875, 4.6962890625, 5.29931640625, 5.90234375, 6.50537109375, 7.1083984375, 7.71142578125, 8.314453125, 8.91748046875, 9.5205078125, 10.12353515625, 10.7265625, 11.32958984375, 11.9326171875, 12.53564453125, 13.138671875, 13.74169921875, 14.3447265625, 14.94775390625, 15.55078125, 16.15380859375, 16.7568359375, 17.35986328125, 17.962890625, 18.56591796875, 19.1689453125, 19.77197265625, 20.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 8.0, 5.0, 16.0, 25.0, 60.0, 74.0, 114.0, 131.0, 164.0, 143.0, 92.0, 66.0, 41.0, 16.0, 19.0, 7.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036602020263671875, -0.0035697519779205322, -0.003479301929473877, -0.0033888518810272217, -0.0032984018325805664, -0.003207951784133911, -0.003117501735687256, -0.0030270516872406006, -0.0029366016387939453, -0.00284615159034729, -0.0027557015419006348, -0.0026652514934539795, -0.0025748014450073242, -0.002484351396560669, -0.0023939013481140137, -0.0023034512996673584, -0.002213001251220703, -0.002122551202774048, -0.0020321011543273926, -0.0019416511058807373, -0.001851201057434082, -0.0017607510089874268, -0.0016703009605407715, -0.0015798509120941162, -0.001489400863647461, -0.0013989508152008057, -0.0013085007667541504, -0.0012180507183074951, -0.0011276006698608398, -0.0010371506214141846, -0.0009467005729675293, -0.000856250524520874, -0.0007658004760742188, -0.0006753504276275635, -0.0005849003791809082, -0.0004944503307342529, -0.00040400028228759766, -0.0003135502338409424, -0.0002231001853942871, -0.00013265013694763184, -4.220008850097656e-05, 4.824995994567871e-05, 0.00013870000839233398, 0.00022915005683898926, 0.00031960010528564453, 0.0004100501537322998, 0.0005005002021789551, 0.0005909502506256104, 0.0006814002990722656, 0.0007718503475189209, 0.0008623003959655762, 0.0009527504444122314, 0.0010432004928588867, 0.001133650541305542, 0.0012241005897521973, 0.0013145506381988525, 0.0014050006866455078, 0.001495450735092163, 0.0015859007835388184, 0.0016763508319854736, 0.001766800880432129, 0.0018572509288787842, 0.0019477009773254395, 0.0020381510257720947, 0.00212860107421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 5.0, 3.0, 8.0, 3.0, 6.0, 9.0, 14.0, 13.0, 32.0, 28.0, 41.0, 50.0, 66.0, 105.0, 143.0, 221.0, 266.0, 409.0, 664.0, 898.0, 1542.0, 2628.0, 4467.0, 7893.0, 14613.0, 29231.0, 61383.0, 134249.0, 265373.0, 264964.0, 134512.0, 61556.0, 28974.0, 14741.0, 7833.0, 4357.0, 2545.0, 1601.0, 1011.0, 685.0, 415.0, 292.0, 205.0, 140.0, 94.0, 72.0, 53.0, 43.0, 33.0, 24.0, 7.0, 13.0, 12.0, 10.0, 5.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.484375, -16.93798828125, -16.3916015625, -15.84521484375, -15.298828125, -14.75244140625, -14.2060546875, -13.65966796875, -13.11328125, -12.56689453125, -12.0205078125, -11.47412109375, -10.927734375, -10.38134765625, -9.8349609375, -9.28857421875, -8.7421875, -8.19580078125, -7.6494140625, -7.10302734375, -6.556640625, -6.01025390625, -5.4638671875, -4.91748046875, -4.37109375, -3.82470703125, -3.2783203125, -2.73193359375, -2.185546875, -1.63916015625, -1.0927734375, -0.54638671875, 0.0, 0.54638671875, 1.0927734375, 1.63916015625, 2.185546875, 2.73193359375, 3.2783203125, 3.82470703125, 4.37109375, 4.91748046875, 5.4638671875, 6.01025390625, 6.556640625, 7.10302734375, 7.6494140625, 8.19580078125, 8.7421875, 9.28857421875, 9.8349609375, 10.38134765625, 10.927734375, 11.47412109375, 12.0205078125, 12.56689453125, 13.11328125, 13.65966796875, 14.2060546875, 14.75244140625, 15.298828125, 15.84521484375, 16.3916015625, 16.93798828125, 17.484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 10.0, 8.0, 9.0, 9.0, 17.0, 23.0, 28.0, 40.0, 55.0, 64.0, 68.0, 92.0, 85.0, 91.0, 100.0, 67.0, 47.0, 46.0, 34.0, 16.0, 20.0, 12.0, 20.0, 10.0, 7.0, 8.0, 2.0, 9.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.54296875, -6.33160400390625, -6.1202392578125, -5.90887451171875, -5.697509765625, -5.48614501953125, -5.2747802734375, -5.06341552734375, -4.85205078125, -4.64068603515625, -4.4293212890625, -4.21795654296875, -4.006591796875, -3.79522705078125, -3.5838623046875, -3.37249755859375, -3.1611328125, -2.94976806640625, -2.7384033203125, -2.52703857421875, -2.315673828125, -2.10430908203125, -1.8929443359375, -1.68157958984375, -1.47021484375, -1.25885009765625, -1.0474853515625, -0.83612060546875, -0.624755859375, -0.41339111328125, -0.2020263671875, 0.00933837890625, 0.220703125, 0.43206787109375, 0.6434326171875, 0.85479736328125, 1.066162109375, 1.27752685546875, 1.4888916015625, 1.70025634765625, 1.91162109375, 2.12298583984375, 2.3343505859375, 2.54571533203125, 2.757080078125, 2.96844482421875, 3.1798095703125, 3.39117431640625, 3.6025390625, 3.81390380859375, 4.0252685546875, 4.23663330078125, 4.447998046875, 4.65936279296875, 4.8707275390625, 5.08209228515625, 5.29345703125, 5.50482177734375, 5.7161865234375, 5.92755126953125, 6.138916015625, 6.35028076171875, 6.5616455078125, 6.77301025390625, 6.984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 2.0, 13.0, 9.0, 14.0, 18.0, 29.0, 26.0, 28.0, 38.0, 41.0, 55.0, 38.0, 60.0, 51.0, 69.0, 65.0, 53.0, 62.0, 50.0, 46.0, 40.0, 31.0, 29.0, 24.0, 17.0, 12.0, 17.0, 8.0, 11.0, 3.0, 3.0, 9.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.605167388916016, -27.641395568847656, -26.67762565612793, -25.71385383605957, -24.75008201599121, -23.786312103271484, -22.822540283203125, -21.858768463134766, -20.894996643066406, -19.931224822998047, -18.96745491027832, -18.00368309020996, -17.0399112701416, -16.076141357421875, -15.112369537353516, -14.148597717285156, -13.18482780456543, -12.221056938171387, -11.257285118103027, -10.293514251708984, -9.329742431640625, -8.365971565246582, -7.402200698852539, -6.438429355621338, -5.474658012390137, -4.5108866691589355, -3.5471155643463135, -2.5833444595336914, -1.6195731163024902, -0.6558017730712891, 0.3079690933227539, 1.271740436553955, 2.2355117797851562, 3.1992831230163574, 4.163054466247559, 5.126825332641602, 6.090596675872803, 7.054368019104004, 8.018138885498047, 8.981910705566406, 9.94568157196045, 10.909452438354492, 11.873224258422852, 12.836995124816895, 13.800765991210938, 14.764537811279297, 15.72830867767334, 16.692079544067383, 17.655851364135742, 18.6196231842041, 19.583393096923828, 20.547164916992188, 21.510936737060547, 22.474708557128906, 23.438478469848633, 24.402250289916992, 25.36602020263672, 26.329792022705078, 27.293561935424805, 28.257333755493164, 29.221105575561523, 30.18487548828125, 31.14864730834961, 32.11241912841797, 33.07619094848633]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 9.0, 22.0, 10.0, 17.0, 20.0, 22.0, 35.0, 29.0, 38.0, 34.0, 41.0, 47.0, 31.0, 46.0, 34.0, 47.0, 44.0, 38.0, 49.0, 43.0, 36.0, 33.0, 35.0, 36.0, 37.0, 16.0, 28.0, 20.0, 21.0, 16.0, 8.0, 5.0, 7.0, 2.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.032825469970703, -26.050125122070312, -25.06742286682129, -24.0847225189209, -23.102020263671875, -22.119319915771484, -21.136619567871094, -20.15391731262207, -19.17121696472168, -18.18851661682129, -17.205814361572266, -16.223114013671875, -15.240412712097168, -14.257711410522461, -13.275010108947754, -12.292308807373047, -11.30960750579834, -10.326906204223633, -9.344204902648926, -8.361503601074219, -7.378803253173828, -6.396101951599121, -5.413400650024414, -4.430699825286865, -3.447998523712158, -2.4652974605560303, -1.4825962781906128, -0.4998950958251953, 0.4828059673309326, 1.4655070304870605, 2.4482083320617676, 3.4309091567993164, 4.413610458374023, 5.3963117599487305, 6.379012584686279, 7.361713886260986, 8.344414710998535, 9.327116012573242, 10.30981731414795, 11.292518615722656, 12.275218963623047, 13.257920265197754, 14.240621566772461, 15.223321914672852, 16.206024169921875, 17.188724517822266, 18.171424865722656, 19.15412712097168, 20.136829376220703, 21.119529724121094, 22.102231979370117, 23.084932327270508, 24.06763458251953, 25.050334930419922, 26.033035278320312, 27.015737533569336, 27.998437881469727, 28.981138229370117, 29.96384048461914, 30.94654083251953, 31.929243087768555, 32.91194152832031, 33.89464569091797, 34.87734603881836, 35.86004638671875]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 7.0, 3.0, 14.0, 20.0, 24.0, 55.0, 79.0, 131.0, 167.0, 234.0, 297.0, 439.0, 567.0, 876.0, 1287.0, 1775.0, 2838.0, 4263.0, 6501.0, 10682.0, 17277.0, 29531.0, 53876.0, 107253.0, 249101.0, 647771.0, 1288494.0, 1009853.0, 419475.0, 167094.0, 75940.0, 39902.0, 22446.0, 13199.0, 8167.0, 4925.0, 3263.0, 2065.0, 1430.0, 923.0, 641.0, 424.0, 297.0, 176.0, 131.0, 111.0, 76.0, 45.0, 48.0, 36.0, 23.0, 11.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-32.6875, -31.58935546875, -30.4912109375, -29.39306640625, -28.294921875, -27.19677734375, -26.0986328125, -25.00048828125, -23.90234375, -22.80419921875, -21.7060546875, -20.60791015625, -19.509765625, -18.41162109375, -17.3134765625, -16.21533203125, -15.1171875, -14.01904296875, -12.9208984375, -11.82275390625, -10.724609375, -9.62646484375, -8.5283203125, -7.43017578125, -6.33203125, -5.23388671875, -4.1357421875, -3.03759765625, -1.939453125, -0.84130859375, 0.2568359375, 1.35498046875, 2.453125, 3.55126953125, 4.6494140625, 5.74755859375, 6.845703125, 7.94384765625, 9.0419921875, 10.14013671875, 11.23828125, 12.33642578125, 13.4345703125, 14.53271484375, 15.630859375, 16.72900390625, 17.8271484375, 18.92529296875, 20.0234375, 21.12158203125, 22.2197265625, 23.31787109375, 24.416015625, 25.51416015625, 26.6123046875, 27.71044921875, 28.80859375, 29.90673828125, 31.0048828125, 32.10302734375, 33.201171875, 34.29931640625, 35.3974609375, 36.49560546875, 37.59375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 10.0, 21.0, 21.0, 22.0, 27.0, 31.0, 28.0, 36.0, 29.0, 31.0, 31.0, 45.0, 42.0, 37.0, 49.0, 53.0, 44.0, 45.0, 38.0, 36.0, 40.0, 27.0, 27.0, 38.0, 24.0, 20.0, 20.0, 18.0, 15.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.140625, -22.302490234375, -21.46435546875, -20.626220703125, -19.7880859375, -18.949951171875, -18.11181640625, -17.273681640625, -16.435546875, -15.597412109375, -14.75927734375, -13.921142578125, -13.0830078125, -12.244873046875, -11.40673828125, -10.568603515625, -9.73046875, -8.892333984375, -8.05419921875, -7.216064453125, -6.3779296875, -5.539794921875, -4.70166015625, -3.863525390625, -3.025390625, -2.187255859375, -1.34912109375, -0.510986328125, 0.3271484375, 1.165283203125, 2.00341796875, 2.841552734375, 3.6796875, 4.517822265625, 5.35595703125, 6.194091796875, 7.0322265625, 7.870361328125, 8.70849609375, 9.546630859375, 10.384765625, 11.222900390625, 12.06103515625, 12.899169921875, 13.7373046875, 14.575439453125, 15.41357421875, 16.251708984375, 17.08984375, 17.927978515625, 18.76611328125, 19.604248046875, 20.4423828125, 21.280517578125, 22.11865234375, 22.956787109375, 23.794921875, 24.633056640625, 25.47119140625, 26.309326171875, 27.1474609375, 27.985595703125, 28.82373046875, 29.661865234375, 30.5]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 19.0, 24.0, 42.0, 40.0, 76.0, 111.0, 176.0, 274.0, 433.0, 708.0, 1240.0, 2214.0, 4057.0, 7333.0, 14404.0, 28458.0, 60369.0, 136011.0, 341527.0, 971845.0, 1569859.0, 634232.0, 233085.0, 97480.0, 44507.0, 21347.0, 11012.0, 5792.0, 3156.0, 1812.0, 1018.0, 575.0, 366.0, 210.0, 152.0, 85.0, 70.0, 49.0, 28.0, 17.0, 17.0, 12.0, 8.0, 2.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-50.40625, -48.845703125, -47.28515625, -45.724609375, -44.1640625, -42.603515625, -41.04296875, -39.482421875, -37.921875, -36.361328125, -34.80078125, -33.240234375, -31.6796875, -30.119140625, -28.55859375, -26.998046875, -25.4375, -23.876953125, -22.31640625, -20.755859375, -19.1953125, -17.634765625, -16.07421875, -14.513671875, -12.953125, -11.392578125, -9.83203125, -8.271484375, -6.7109375, -5.150390625, -3.58984375, -2.029296875, -0.46875, 1.091796875, 2.65234375, 4.212890625, 5.7734375, 7.333984375, 8.89453125, 10.455078125, 12.015625, 13.576171875, 15.13671875, 16.697265625, 18.2578125, 19.818359375, 21.37890625, 22.939453125, 24.5, 26.060546875, 27.62109375, 29.181640625, 30.7421875, 32.302734375, 33.86328125, 35.423828125, 36.984375, 38.544921875, 40.10546875, 41.666015625, 43.2265625, 44.787109375, 46.34765625, 47.908203125, 49.46875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 1.0, 2.0, 4.0, 8.0, 8.0, 16.0, 16.0, 16.0, 34.0, 39.0, 48.0, 68.0, 98.0, 106.0, 149.0, 178.0, 220.0, 296.0, 353.0, 381.0, 383.0, 309.0, 315.0, 240.0, 172.0, 138.0, 104.0, 97.0, 58.0, 57.0, 39.0, 27.0, 22.0, 22.0, 15.0, 16.0, 4.0, 12.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.066650390625, -12.58642578125, -12.106201171875, -11.6259765625, -11.145751953125, -10.66552734375, -10.185302734375, -9.705078125, -9.224853515625, -8.74462890625, -8.264404296875, -7.7841796875, -7.303955078125, -6.82373046875, -6.343505859375, -5.86328125, -5.383056640625, -4.90283203125, -4.422607421875, -3.9423828125, -3.462158203125, -2.98193359375, -2.501708984375, -2.021484375, -1.541259765625, -1.06103515625, -0.580810546875, -0.1005859375, 0.379638671875, 0.85986328125, 1.340087890625, 1.8203125, 2.300537109375, 2.78076171875, 3.260986328125, 3.7412109375, 4.221435546875, 4.70166015625, 5.181884765625, 5.662109375, 6.142333984375, 6.62255859375, 7.102783203125, 7.5830078125, 8.063232421875, 8.54345703125, 9.023681640625, 9.50390625, 9.984130859375, 10.46435546875, 10.944580078125, 11.4248046875, 11.905029296875, 12.38525390625, 12.865478515625, 13.345703125, 13.825927734375, 14.30615234375, 14.786376953125, 15.2666015625, 15.746826171875, 16.22705078125, 16.707275390625, 17.1875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 8.0, 15.0, 16.0, 19.0, 18.0, 25.0, 45.0, 37.0, 47.0, 47.0, 55.0, 66.0, 66.0, 72.0, 74.0, 57.0, 52.0, 55.0, 34.0, 33.0, 31.0, 19.0, 13.0, 14.0, 14.0, 13.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.146879196166992, -28.024721145629883, -26.902563095092773, -25.78040313720703, -24.658245086669922, -23.536087036132812, -22.413928985595703, -21.291770935058594, -20.169612884521484, -19.047454833984375, -17.925296783447266, -16.803138732910156, -15.680978775024414, -14.558820724487305, -13.436662673950195, -12.314504623413086, -11.192344665527344, -10.070186614990234, -8.948027610778809, -7.825869560241699, -6.703711032867432, -5.581552505493164, -4.459394454956055, -3.337235927581787, -2.2150774002075195, -1.0929189920425415, 0.029239416122436523, 1.151397705078125, 2.2735562324523926, 3.39571475982666, 4.5178728103637695, 5.640031337738037, 6.762187957763672, 7.8843464851379395, 9.006505012512207, 10.128663063049316, 11.250822067260742, 12.372980117797852, 13.495138168334961, 14.61729621887207, 15.739455223083496, 16.861614227294922, 17.98377227783203, 19.10593032836914, 20.22808837890625, 21.35024642944336, 22.47240447998047, 23.59456443786621, 24.71672248840332, 25.83888053894043, 26.96103858947754, 28.08319854736328, 29.20535659790039, 30.3275146484375, 31.44967269897461, 32.57183074951172, 33.69398880004883, 34.81614685058594, 35.93830490112305, 37.060462951660156, 38.182621002197266, 39.304779052734375, 40.42694091796875, 41.54909896850586, 42.67125701904297]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 10.0, 11.0, 8.0, 23.0, 25.0, 18.0, 34.0, 33.0, 18.0, 30.0, 41.0, 42.0, 46.0, 40.0, 26.0, 41.0, 38.0, 40.0, 44.0, 40.0, 47.0, 50.0, 28.0, 35.0, 39.0, 23.0, 16.0, 16.0, 26.0, 18.0, 18.0, 6.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.92987823486328, -26.966094970703125, -26.00231170654297, -25.03852653503418, -24.074743270874023, -23.110960006713867, -22.14717674255371, -21.183391571044922, -20.219608306884766, -19.25582504272461, -18.292041778564453, -17.328256607055664, -16.364473342895508, -15.400690078735352, -14.436906814575195, -13.473122596740723, -12.509339332580566, -11.54555606842041, -10.581771850585938, -9.617988586425781, -8.654204368591309, -7.690421104431152, -6.726637363433838, -5.762853622436523, -4.799069881439209, -3.8352861404418945, -2.87150239944458, -1.9077188968658447, -0.9439351558685303, 0.019848346710205078, 0.9836320877075195, 1.947415828704834, 2.9111995697021484, 3.874983310699463, 4.838767051696777, 5.802550315856934, 6.766334533691406, 7.7301177978515625, 8.693901062011719, 9.657685279846191, 10.621469497680664, 11.58525276184082, 12.549036979675293, 13.51282024383545, 14.476604461669922, 15.440387725830078, 16.404170989990234, 17.36795425415039, 18.331737518310547, 19.295520782470703, 20.25930404663086, 21.22308921813965, 22.186872482299805, 23.15065574645996, 24.114439010620117, 25.078224182128906, 26.042007446289062, 27.00579071044922, 27.969573974609375, 28.933359146118164, 29.89714241027832, 30.860925674438477, 31.824708938598633, 32.78849411010742, 33.75227737426758]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 6.0, 11.0, 20.0, 33.0, 37.0, 48.0, 70.0, 133.0, 171.0, 260.0, 360.0, 653.0, 899.0, 1351.0, 2044.0, 3177.0, 5166.0, 8392.0, 13912.0, 23654.0, 43074.0, 80186.0, 161704.0, 274271.0, 202797.0, 101878.0, 52046.0, 28734.0, 16783.0, 9815.0, 6058.0, 3768.0, 2376.0, 1610.0, 1025.0, 642.0, 473.0, 293.0, 188.0, 129.0, 79.0, 69.0, 48.0, 33.0, 23.0, 16.0, 12.0, 9.0, 8.0, 4.0, 3.0, 0.0, 2.0], "bins": [-23.453125, -22.776611328125, -22.10009765625, -21.423583984375, -20.7470703125, -20.070556640625, -19.39404296875, -18.717529296875, -18.041015625, -17.364501953125, -16.68798828125, -16.011474609375, -15.3349609375, -14.658447265625, -13.98193359375, -13.305419921875, -12.62890625, -11.952392578125, -11.27587890625, -10.599365234375, -9.9228515625, -9.246337890625, -8.56982421875, -7.893310546875, -7.216796875, -6.540283203125, -5.86376953125, -5.187255859375, -4.5107421875, -3.834228515625, -3.15771484375, -2.481201171875, -1.8046875, -1.128173828125, -0.45166015625, 0.224853515625, 0.9013671875, 1.577880859375, 2.25439453125, 2.930908203125, 3.607421875, 4.283935546875, 4.96044921875, 5.636962890625, 6.3134765625, 6.989990234375, 7.66650390625, 8.343017578125, 9.01953125, 9.696044921875, 10.37255859375, 11.049072265625, 11.7255859375, 12.402099609375, 13.07861328125, 13.755126953125, 14.431640625, 15.108154296875, 15.78466796875, 16.461181640625, 17.1376953125, 17.814208984375, 18.49072265625, 19.167236328125, 19.84375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 7.0, 6.0, 10.0, 7.0, 3.0, 16.0, 17.0, 17.0, 27.0, 25.0, 29.0, 34.0, 22.0, 41.0, 55.0, 43.0, 48.0, 40.0, 42.0, 46.0, 35.0, 48.0, 43.0, 43.0, 36.0, 37.0, 34.0, 33.0, 21.0, 21.0, 17.0, 27.0, 12.0, 9.0, 6.0, 7.0, 3.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.40625, -27.38427734375, -26.3623046875, -25.34033203125, -24.318359375, -23.29638671875, -22.2744140625, -21.25244140625, -20.23046875, -19.20849609375, -18.1865234375, -17.16455078125, -16.142578125, -15.12060546875, -14.0986328125, -13.07666015625, -12.0546875, -11.03271484375, -10.0107421875, -8.98876953125, -7.966796875, -6.94482421875, -5.9228515625, -4.90087890625, -3.87890625, -2.85693359375, -1.8349609375, -0.81298828125, 0.208984375, 1.23095703125, 2.2529296875, 3.27490234375, 4.296875, 5.31884765625, 6.3408203125, 7.36279296875, 8.384765625, 9.40673828125, 10.4287109375, 11.45068359375, 12.47265625, 13.49462890625, 14.5166015625, 15.53857421875, 16.560546875, 17.58251953125, 18.6044921875, 19.62646484375, 20.6484375, 21.67041015625, 22.6923828125, 23.71435546875, 24.736328125, 25.75830078125, 26.7802734375, 27.80224609375, 28.82421875, 29.84619140625, 30.8681640625, 31.89013671875, 32.912109375, 33.93408203125, 34.9560546875, 35.97802734375, 37.0]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 12.0, 18.0, 20.0, 41.0, 40.0, 68.0, 107.0, 152.0, 255.0, 356.0, 562.0, 782.0, 1285.0, 2028.0, 3064.0, 4784.0, 7908.0, 12806.0, 22322.0, 40218.0, 80458.0, 185266.0, 331329.0, 179958.0, 79122.0, 40135.0, 21787.0, 12796.0, 7599.0, 4759.0, 2952.0, 1882.0, 1245.0, 840.0, 552.0, 364.0, 231.0, 168.0, 88.0, 52.0, 46.0, 27.0, 23.0, 13.0, 14.0, 11.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.21875, -28.26025390625, -27.3017578125, -26.34326171875, -25.384765625, -24.42626953125, -23.4677734375, -22.50927734375, -21.55078125, -20.59228515625, -19.6337890625, -18.67529296875, -17.716796875, -16.75830078125, -15.7998046875, -14.84130859375, -13.8828125, -12.92431640625, -11.9658203125, -11.00732421875, -10.048828125, -9.09033203125, -8.1318359375, -7.17333984375, -6.21484375, -5.25634765625, -4.2978515625, -3.33935546875, -2.380859375, -1.42236328125, -0.4638671875, 0.49462890625, 1.453125, 2.41162109375, 3.3701171875, 4.32861328125, 5.287109375, 6.24560546875, 7.2041015625, 8.16259765625, 9.12109375, 10.07958984375, 11.0380859375, 11.99658203125, 12.955078125, 13.91357421875, 14.8720703125, 15.83056640625, 16.7890625, 17.74755859375, 18.7060546875, 19.66455078125, 20.623046875, 21.58154296875, 22.5400390625, 23.49853515625, 24.45703125, 25.41552734375, 26.3740234375, 27.33251953125, 28.291015625, 29.24951171875, 30.2080078125, 31.16650390625, 32.125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 13.0, 10.0, 17.0, 15.0, 16.0, 22.0, 31.0, 22.0, 27.0, 23.0, 38.0, 29.0, 29.0, 50.0, 34.0, 36.0, 44.0, 38.0, 36.0, 38.0, 40.0, 41.0, 38.0, 34.0, 34.0, 29.0, 33.0, 21.0, 17.0, 22.0, 19.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.34375, -18.75244140625, -18.1611328125, -17.56982421875, -16.978515625, -16.38720703125, -15.7958984375, -15.20458984375, -14.61328125, -14.02197265625, -13.4306640625, -12.83935546875, -12.248046875, -11.65673828125, -11.0654296875, -10.47412109375, -9.8828125, -9.29150390625, -8.7001953125, -8.10888671875, -7.517578125, -6.92626953125, -6.3349609375, -5.74365234375, -5.15234375, -4.56103515625, -3.9697265625, -3.37841796875, -2.787109375, -2.19580078125, -1.6044921875, -1.01318359375, -0.421875, 0.16943359375, 0.7607421875, 1.35205078125, 1.943359375, 2.53466796875, 3.1259765625, 3.71728515625, 4.30859375, 4.89990234375, 5.4912109375, 6.08251953125, 6.673828125, 7.26513671875, 7.8564453125, 8.44775390625, 9.0390625, 9.63037109375, 10.2216796875, 10.81298828125, 11.404296875, 11.99560546875, 12.5869140625, 13.17822265625, 13.76953125, 14.36083984375, 14.9521484375, 15.54345703125, 16.134765625, 16.72607421875, 17.3173828125, 17.90869140625, 18.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 9.0, 12.0, 19.0, 28.0, 31.0, 48.0, 83.0, 94.0, 187.0, 297.0, 445.0, 845.0, 1506.0, 2967.0, 5936.0, 13104.0, 30892.0, 81385.0, 233454.0, 394767.0, 175024.0, 62221.0, 24110.0, 10579.0, 4885.0, 2500.0, 1262.0, 744.0, 410.0, 256.0, 147.0, 96.0, 56.0, 44.0, 32.0, 17.0, 16.0, 3.0, 4.0, 7.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.078125, -9.7667236328125, -9.455322265625, -9.1439208984375, -8.83251953125, -8.5211181640625, -8.209716796875, -7.8983154296875, -7.5869140625, -7.2755126953125, -6.964111328125, -6.6527099609375, -6.34130859375, -6.0299072265625, -5.718505859375, -5.4071044921875, -5.095703125, -4.7843017578125, -4.472900390625, -4.1614990234375, -3.85009765625, -3.5386962890625, -3.227294921875, -2.9158935546875, -2.6044921875, -2.2930908203125, -1.981689453125, -1.6702880859375, -1.35888671875, -1.0474853515625, -0.736083984375, -0.4246826171875, -0.11328125, 0.1981201171875, 0.509521484375, 0.8209228515625, 1.13232421875, 1.4437255859375, 1.755126953125, 2.0665283203125, 2.3779296875, 2.6893310546875, 3.000732421875, 3.3121337890625, 3.62353515625, 3.9349365234375, 4.246337890625, 4.5577392578125, 4.869140625, 5.1805419921875, 5.491943359375, 5.8033447265625, 6.11474609375, 6.4261474609375, 6.737548828125, 7.0489501953125, 7.3603515625, 7.6717529296875, 7.983154296875, 8.2945556640625, 8.60595703125, 8.9173583984375, 9.228759765625, 9.5401611328125, 9.8515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 15.0, 17.0, 26.0, 37.0, 47.0, 54.0, 75.0, 50.0, 81.0, 69.0, 90.0, 75.0, 62.0, 55.0, 50.0, 40.0, 28.0, 25.0, 19.0, 14.0, 12.0, 7.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0009746551513671875, -0.0009489357471466064, -0.0009232163429260254, -0.0008974969387054443, -0.0008717775344848633, -0.0008460581302642822, -0.0008203387260437012, -0.0007946193218231201, -0.0007688999176025391, -0.000743180513381958, -0.000717461109161377, -0.0006917417049407959, -0.0006660223007202148, -0.0006403028964996338, -0.0006145834922790527, -0.0005888640880584717, -0.0005631446838378906, -0.0005374252796173096, -0.0005117058753967285, -0.00048598647117614746, -0.0004602670669555664, -0.00043454766273498535, -0.0004088282585144043, -0.00038310885429382324, -0.0003573894500732422, -0.00033167004585266113, -0.0003059506416320801, -0.000280231237411499, -0.00025451183319091797, -0.00022879242897033691, -0.00020307302474975586, -0.0001773536205291748, -0.00015163421630859375, -0.0001259148120880127, -0.00010019540786743164, -7.447600364685059e-05, -4.875659942626953e-05, -2.3037195205688477e-05, 2.682209014892578e-06, 2.8401613235473633e-05, 5.412101745605469e-05, 7.984042167663574e-05, 0.0001055598258972168, 0.00013127923011779785, 0.0001569986343383789, 0.00018271803855895996, 0.00020843744277954102, 0.00023415684700012207, 0.0002598762512207031, 0.0002855956554412842, 0.00031131505966186523, 0.0003370344638824463, 0.00036275386810302734, 0.0003884732723236084, 0.00041419267654418945, 0.0004399120807647705, 0.00046563148498535156, 0.0004913508892059326, 0.0005170702934265137, 0.0005427896976470947, 0.0005685091018676758, 0.0005942285060882568, 0.0006199479103088379, 0.0006456673145294189, 0.00067138671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 6.0, 9.0, 12.0, 23.0, 20.0, 27.0, 35.0, 61.0, 86.0, 112.0, 179.0, 244.0, 317.0, 441.0, 635.0, 887.0, 1268.0, 2043.0, 3154.0, 4952.0, 7859.0, 13185.0, 22901.0, 40634.0, 74186.0, 135201.0, 213936.0, 214713.0, 135990.0, 75239.0, 41260.0, 23166.0, 13337.0, 8001.0, 4844.0, 3214.0, 2028.0, 1304.0, 920.0, 640.0, 439.0, 301.0, 198.0, 155.0, 110.0, 73.0, 51.0, 53.0, 33.0, 23.0, 23.0, 9.0, 12.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.51171875, -7.26947021484375, -7.0272216796875, -6.78497314453125, -6.542724609375, -6.30047607421875, -6.0582275390625, -5.81597900390625, -5.57373046875, -5.33148193359375, -5.0892333984375, -4.84698486328125, -4.604736328125, -4.36248779296875, -4.1202392578125, -3.87799072265625, -3.6357421875, -3.39349365234375, -3.1512451171875, -2.90899658203125, -2.666748046875, -2.42449951171875, -2.1822509765625, -1.94000244140625, -1.69775390625, -1.45550537109375, -1.2132568359375, -0.97100830078125, -0.728759765625, -0.48651123046875, -0.2442626953125, -0.00201416015625, 0.240234375, 0.48248291015625, 0.7247314453125, 0.96697998046875, 1.209228515625, 1.45147705078125, 1.6937255859375, 1.93597412109375, 2.17822265625, 2.42047119140625, 2.6627197265625, 2.90496826171875, 3.147216796875, 3.38946533203125, 3.6317138671875, 3.87396240234375, 4.1162109375, 4.35845947265625, 4.6007080078125, 4.84295654296875, 5.085205078125, 5.32745361328125, 5.5697021484375, 5.81195068359375, 6.05419921875, 6.29644775390625, 6.5386962890625, 6.78094482421875, 7.023193359375, 7.26544189453125, 7.5076904296875, 7.74993896484375, 7.9921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 13.0, 9.0, 14.0, 25.0, 29.0, 32.0, 40.0, 29.0, 25.0, 37.0, 56.0, 51.0, 55.0, 61.0, 56.0, 54.0, 59.0, 57.0, 36.0, 38.0, 32.0, 32.0, 13.0, 29.0, 14.0, 12.0, 14.0, 14.0, 13.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.466522216796875, -2.38812255859375, -2.309722900390625, -2.2313232421875, -2.152923583984375, -2.07452392578125, -1.996124267578125, -1.917724609375, -1.839324951171875, -1.76092529296875, -1.682525634765625, -1.6041259765625, -1.525726318359375, -1.44732666015625, -1.368927001953125, -1.29052734375, -1.212127685546875, -1.13372802734375, -1.055328369140625, -0.9769287109375, -0.898529052734375, -0.82012939453125, -0.741729736328125, -0.663330078125, -0.584930419921875, -0.50653076171875, -0.428131103515625, -0.3497314453125, -0.271331787109375, -0.19293212890625, -0.114532470703125, -0.0361328125, 0.042266845703125, 0.12066650390625, 0.199066162109375, 0.2774658203125, 0.355865478515625, 0.43426513671875, 0.512664794921875, 0.591064453125, 0.669464111328125, 0.74786376953125, 0.826263427734375, 0.9046630859375, 0.983062744140625, 1.06146240234375, 1.139862060546875, 1.21826171875, 1.296661376953125, 1.37506103515625, 1.453460693359375, 1.5318603515625, 1.610260009765625, 1.68865966796875, 1.767059326171875, 1.845458984375, 1.923858642578125, 2.00225830078125, 2.080657958984375, 2.1590576171875, 2.237457275390625, 2.31585693359375, 2.394256591796875, 2.47265625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 13.0, 11.0, 11.0, 14.0, 20.0, 20.0, 22.0, 33.0, 39.0, 43.0, 52.0, 62.0, 60.0, 71.0, 74.0, 71.0, 62.0, 46.0, 56.0, 39.0, 40.0, 30.0, 20.0, 19.0, 14.0, 16.0, 9.0, 6.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.11594581604004, -28.96799659729004, -27.820049285888672, -26.672100067138672, -25.524152755737305, -24.376203536987305, -23.228256225585938, -22.080307006835938, -20.932357788085938, -19.784408569335938, -18.63646125793457, -17.48851203918457, -16.340564727783203, -15.192615509033203, -14.04466724395752, -12.896718978881836, -11.748771667480469, -10.600823402404785, -9.452875137329102, -8.304925918579102, -7.156978130340576, -6.009029865264893, -4.861081123352051, -3.713132858276367, -2.5651845932006836, -1.4172362089157104, -0.2692878246307373, 0.8786606788635254, 2.026608943939209, 3.1745572090148926, 4.322505950927734, 5.470454216003418, 6.618400573730469, 7.766348838806152, 8.914297103881836, 10.062246322631836, 11.210193634033203, 12.358142852783203, 13.506091117858887, 14.65403938293457, 15.801987648010254, 16.949935913085938, 18.097885131835938, 19.245832443237305, 20.393781661987305, 21.541728973388672, 22.689678192138672, 23.837627410888672, 24.98557472229004, 26.13352394104004, 27.281471252441406, 28.429420471191406, 29.577367782592773, 30.725317001342773, 31.87326431274414, 33.02121353149414, 34.16916275024414, 35.31711196899414, 36.46506118774414, 37.613006591796875, 38.760955810546875, 39.908905029296875, 41.056854248046875, 42.204803466796875, 43.35274887084961]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 5.0, 3.0, 8.0, 9.0, 16.0, 4.0, 14.0, 17.0, 23.0, 20.0, 27.0, 34.0, 28.0, 32.0, 43.0, 36.0, 48.0, 34.0, 33.0, 40.0, 36.0, 41.0, 46.0, 36.0, 46.0, 45.0, 39.0, 38.0, 33.0, 21.0, 16.0, 19.0, 22.0, 22.0, 15.0, 7.0, 8.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.48418617248535, -26.535245895385742, -25.586307525634766, -24.637367248535156, -23.688426971435547, -22.739486694335938, -21.79054832458496, -20.84160804748535, -19.892669677734375, -18.943729400634766, -17.99479103088379, -17.04585075378418, -16.09691047668457, -15.147971153259277, -14.199031829833984, -13.250091552734375, -12.301151275634766, -11.352211952209473, -10.403271675109863, -9.45433235168457, -8.505392074584961, -7.556452751159668, -6.607513427734375, -5.658573627471924, -4.709633827209473, -3.7606940269470215, -2.8117544651031494, -1.8628149032592773, -0.9138751029968262, 0.035064697265625, 0.984004020690918, 1.9329438209533691, 2.8818817138671875, 3.8308215141296387, 4.77976131439209, 5.728700637817383, 6.677640438079834, 7.626580238342285, 8.575519561767578, 9.524459838867188, 10.47339916229248, 11.422338485717773, 12.371278762817383, 13.320218086242676, 14.269157409667969, 15.218097686767578, 16.167037963867188, 17.115976333618164, 18.064916610717773, 19.013856887817383, 19.96279525756836, 20.91173553466797, 21.860675811767578, 22.809616088867188, 23.758554458618164, 24.707494735717773, 25.65643310546875, 26.60537338256836, 27.554311752319336, 28.503252029418945, 29.452192306518555, 30.40113067626953, 31.35007095336914, 32.29901123046875, 33.24795150756836]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 12.0, 22.0, 43.0, 37.0, 48.0, 69.0, 118.0, 143.0, 234.0, 252.0, 473.0, 643.0, 999.0, 1507.0, 2341.0, 3582.0, 5815.0, 9469.0, 15864.0, 26251.0, 44416.0, 75638.0, 127650.0, 190309.0, 199100.0, 138370.0, 82855.0, 48474.0, 28547.0, 17055.0, 10408.0, 6307.0, 3933.0, 2609.0, 1576.0, 1102.0, 702.0, 487.0, 316.0, 227.0, 181.0, 121.0, 71.0, 48.0, 49.0, 26.0, 14.0, 11.0, 15.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.09375, -34.9326171875, -33.771484375, -32.6103515625, -31.44921875, -30.2880859375, -29.126953125, -27.9658203125, -26.8046875, -25.6435546875, -24.482421875, -23.3212890625, -22.16015625, -20.9990234375, -19.837890625, -18.6767578125, -17.515625, -16.3544921875, -15.193359375, -14.0322265625, -12.87109375, -11.7099609375, -10.548828125, -9.3876953125, -8.2265625, -7.0654296875, -5.904296875, -4.7431640625, -3.58203125, -2.4208984375, -1.259765625, -0.0986328125, 1.0625, 2.2236328125, 3.384765625, 4.5458984375, 5.70703125, 6.8681640625, 8.029296875, 9.1904296875, 10.3515625, 11.5126953125, 12.673828125, 13.8349609375, 14.99609375, 16.1572265625, 17.318359375, 18.4794921875, 19.640625, 20.8017578125, 21.962890625, 23.1240234375, 24.28515625, 25.4462890625, 26.607421875, 27.7685546875, 28.9296875, 30.0908203125, 31.251953125, 32.4130859375, 33.57421875, 34.7353515625, 35.896484375, 37.0576171875, 38.21875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 2.0, 3.0, 8.0, 14.0, 9.0, 13.0, 18.0, 19.0, 14.0, 25.0, 36.0, 36.0, 29.0, 33.0, 47.0, 51.0, 36.0, 38.0, 39.0, 42.0, 50.0, 48.0, 39.0, 58.0, 34.0, 33.0, 36.0, 27.0, 25.0, 24.0, 24.0, 11.0, 20.0, 15.0, 6.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.546875, -27.561279296875, -26.57568359375, -25.590087890625, -24.6044921875, -23.618896484375, -22.63330078125, -21.647705078125, -20.662109375, -19.676513671875, -18.69091796875, -17.705322265625, -16.7197265625, -15.734130859375, -14.74853515625, -13.762939453125, -12.77734375, -11.791748046875, -10.80615234375, -9.820556640625, -8.8349609375, -7.849365234375, -6.86376953125, -5.878173828125, -4.892578125, -3.906982421875, -2.92138671875, -1.935791015625, -0.9501953125, 0.035400390625, 1.02099609375, 2.006591796875, 2.9921875, 3.977783203125, 4.96337890625, 5.948974609375, 6.9345703125, 7.920166015625, 8.90576171875, 9.891357421875, 10.876953125, 11.862548828125, 12.84814453125, 13.833740234375, 14.8193359375, 15.804931640625, 16.79052734375, 17.776123046875, 18.76171875, 19.747314453125, 20.73291015625, 21.718505859375, 22.7041015625, 23.689697265625, 24.67529296875, 25.660888671875, 26.646484375, 27.632080078125, 28.61767578125, 29.603271484375, 30.5888671875, 31.574462890625, 32.56005859375, 33.545654296875, 34.53125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 17.0, 13.0, 38.0, 46.0, 60.0, 82.0, 133.0, 180.0, 300.0, 419.0, 588.0, 921.0, 1311.0, 1973.0, 2965.0, 4521.0, 6793.0, 10234.0, 15872.0, 24676.0, 39124.0, 61328.0, 96746.0, 146143.0, 183297.0, 156526.0, 105962.0, 67385.0, 43086.0, 27016.0, 17334.0, 11242.0, 7440.0, 4860.0, 3257.0, 2127.0, 1471.0, 946.0, 658.0, 472.0, 287.0, 235.0, 138.0, 107.0, 68.0, 53.0, 32.0, 25.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.65625, -32.59130859375, -31.5263671875, -30.46142578125, -29.396484375, -28.33154296875, -27.2666015625, -26.20166015625, -25.13671875, -24.07177734375, -23.0068359375, -21.94189453125, -20.876953125, -19.81201171875, -18.7470703125, -17.68212890625, -16.6171875, -15.55224609375, -14.4873046875, -13.42236328125, -12.357421875, -11.29248046875, -10.2275390625, -9.16259765625, -8.09765625, -7.03271484375, -5.9677734375, -4.90283203125, -3.837890625, -2.77294921875, -1.7080078125, -0.64306640625, 0.421875, 1.48681640625, 2.5517578125, 3.61669921875, 4.681640625, 5.74658203125, 6.8115234375, 7.87646484375, 8.94140625, 10.00634765625, 11.0712890625, 12.13623046875, 13.201171875, 14.26611328125, 15.3310546875, 16.39599609375, 17.4609375, 18.52587890625, 19.5908203125, 20.65576171875, 21.720703125, 22.78564453125, 23.8505859375, 24.91552734375, 25.98046875, 27.04541015625, 28.1103515625, 29.17529296875, 30.240234375, 31.30517578125, 32.3701171875, 33.43505859375, 34.5]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 13.0, 9.0, 11.0, 13.0, 16.0, 23.0, 17.0, 26.0, 24.0, 33.0, 41.0, 31.0, 24.0, 42.0, 44.0, 46.0, 40.0, 46.0, 39.0, 40.0, 32.0, 33.0, 30.0, 34.0, 38.0, 35.0, 27.0, 19.0, 27.0, 19.0, 26.0, 7.0, 16.0, 15.0, 9.0, 6.0, 14.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-20.03125, -19.42626953125, -18.8212890625, -18.21630859375, -17.611328125, -17.00634765625, -16.4013671875, -15.79638671875, -15.19140625, -14.58642578125, -13.9814453125, -13.37646484375, -12.771484375, -12.16650390625, -11.5615234375, -10.95654296875, -10.3515625, -9.74658203125, -9.1416015625, -8.53662109375, -7.931640625, -7.32666015625, -6.7216796875, -6.11669921875, -5.51171875, -4.90673828125, -4.3017578125, -3.69677734375, -3.091796875, -2.48681640625, -1.8818359375, -1.27685546875, -0.671875, -0.06689453125, 0.5380859375, 1.14306640625, 1.748046875, 2.35302734375, 2.9580078125, 3.56298828125, 4.16796875, 4.77294921875, 5.3779296875, 5.98291015625, 6.587890625, 7.19287109375, 7.7978515625, 8.40283203125, 9.0078125, 9.61279296875, 10.2177734375, 10.82275390625, 11.427734375, 12.03271484375, 12.6376953125, 13.24267578125, 13.84765625, 14.45263671875, 15.0576171875, 15.66259765625, 16.267578125, 16.87255859375, 17.4775390625, 18.08251953125, 18.6875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 14.0, 15.0, 18.0, 31.0, 59.0, 75.0, 85.0, 129.0, 196.0, 296.0, 445.0, 623.0, 910.0, 1276.0, 1935.0, 2861.0, 4666.0, 7178.0, 12050.0, 20247.0, 36016.0, 65074.0, 115439.0, 194141.0, 226680.0, 153817.0, 87139.0, 48445.0, 26973.0, 15623.0, 9274.0, 5688.0, 3673.0, 2359.0, 1588.0, 1090.0, 736.0, 517.0, 373.0, 230.0, 171.0, 118.0, 75.0, 61.0, 38.0, 30.0, 28.0, 20.0, 12.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.9140625, -13.482666015625, -13.05126953125, -12.619873046875, -12.1884765625, -11.757080078125, -11.32568359375, -10.894287109375, -10.462890625, -10.031494140625, -9.60009765625, -9.168701171875, -8.7373046875, -8.305908203125, -7.87451171875, -7.443115234375, -7.01171875, -6.580322265625, -6.14892578125, -5.717529296875, -5.2861328125, -4.854736328125, -4.42333984375, -3.991943359375, -3.560546875, -3.129150390625, -2.69775390625, -2.266357421875, -1.8349609375, -1.403564453125, -0.97216796875, -0.540771484375, -0.109375, 0.322021484375, 0.75341796875, 1.184814453125, 1.6162109375, 2.047607421875, 2.47900390625, 2.910400390625, 3.341796875, 3.773193359375, 4.20458984375, 4.635986328125, 5.0673828125, 5.498779296875, 5.93017578125, 6.361572265625, 6.79296875, 7.224365234375, 7.65576171875, 8.087158203125, 8.5185546875, 8.949951171875, 9.38134765625, 9.812744140625, 10.244140625, 10.675537109375, 11.10693359375, 11.538330078125, 11.9697265625, 12.401123046875, 12.83251953125, 13.263916015625, 13.6953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 6.0, 13.0, 18.0, 27.0, 27.0, 43.0, 61.0, 55.0, 78.0, 103.0, 104.0, 93.0, 91.0, 56.0, 52.0, 37.0, 31.0, 24.0, 20.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019588470458984375, -0.0019006580114364624, -0.0018424689769744873, -0.0017842799425125122, -0.0017260909080505371, -0.001667901873588562, -0.001609712839126587, -0.0015515238046646118, -0.0014933347702026367, -0.0014351457357406616, -0.0013769567012786865, -0.0013187676668167114, -0.0012605786323547363, -0.0012023895978927612, -0.0011442005634307861, -0.001086011528968811, -0.001027822494506836, -0.0009696334600448608, -0.0009114444255828857, -0.0008532553911209106, -0.0007950663566589355, -0.0007368773221969604, -0.0006786882877349854, -0.0006204992532730103, -0.0005623102188110352, -0.0005041211843490601, -0.00044593214988708496, -0.00038774311542510986, -0.00032955408096313477, -0.00027136504650115967, -0.00021317601203918457, -0.00015498697757720947, -9.679794311523438e-05, -3.860890865325928e-05, 1.958012580871582e-05, 7.776916027069092e-05, 0.00013595819473266602, 0.0001941472291946411, 0.0002523362636566162, 0.0003105252981185913, 0.0003687143325805664, 0.0004269033670425415, 0.0004850924015045166, 0.0005432814359664917, 0.0006014704704284668, 0.0006596595048904419, 0.000717848539352417, 0.0007760375738143921, 0.0008342266082763672, 0.0008924156427383423, 0.0009506046772003174, 0.0010087937116622925, 0.0010669827461242676, 0.0011251717805862427, 0.0011833608150482178, 0.0012415498495101929, 0.001299738883972168, 0.001357927918434143, 0.0014161169528961182, 0.0014743059873580933, 0.0015324950218200684, 0.0015906840562820435, 0.0016488730907440186, 0.0017070621252059937, 0.0017652511596679688]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 14.0, 9.0, 18.0, 21.0, 36.0, 50.0, 71.0, 74.0, 140.0, 181.0, 255.0, 381.0, 614.0, 916.0, 1443.0, 2330.0, 3794.0, 6541.0, 11643.0, 21174.0, 40724.0, 79475.0, 155702.0, 260167.0, 218421.0, 116056.0, 59127.0, 30324.0, 16422.0, 8824.0, 5213.0, 3032.0, 1810.0, 1263.0, 717.0, 491.0, 378.0, 223.0, 145.0, 103.0, 76.0, 57.0, 27.0, 31.0, 10.0, 7.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.03125, -15.492919921875, -14.95458984375, -14.416259765625, -13.8779296875, -13.339599609375, -12.80126953125, -12.262939453125, -11.724609375, -11.186279296875, -10.64794921875, -10.109619140625, -9.5712890625, -9.032958984375, -8.49462890625, -7.956298828125, -7.41796875, -6.879638671875, -6.34130859375, -5.802978515625, -5.2646484375, -4.726318359375, -4.18798828125, -3.649658203125, -3.111328125, -2.572998046875, -2.03466796875, -1.496337890625, -0.9580078125, -0.419677734375, 0.11865234375, 0.656982421875, 1.1953125, 1.733642578125, 2.27197265625, 2.810302734375, 3.3486328125, 3.886962890625, 4.42529296875, 4.963623046875, 5.501953125, 6.040283203125, 6.57861328125, 7.116943359375, 7.6552734375, 8.193603515625, 8.73193359375, 9.270263671875, 9.80859375, 10.346923828125, 10.88525390625, 11.423583984375, 11.9619140625, 12.500244140625, 13.03857421875, 13.576904296875, 14.115234375, 14.653564453125, 15.19189453125, 15.730224609375, 16.2685546875, 16.806884765625, 17.34521484375, 17.883544921875, 18.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 8.0, 4.0, 12.0, 20.0, 16.0, 28.0, 32.0, 32.0, 36.0, 48.0, 51.0, 45.0, 54.0, 64.0, 60.0, 53.0, 51.0, 69.0, 48.0, 32.0, 44.0, 35.0, 27.0, 16.0, 15.0, 17.0, 11.0, 9.0, 10.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.71875, -4.55792236328125, -4.3970947265625, -4.23626708984375, -4.075439453125, -3.91461181640625, -3.7537841796875, -3.59295654296875, -3.43212890625, -3.27130126953125, -3.1104736328125, -2.94964599609375, -2.788818359375, -2.62799072265625, -2.4671630859375, -2.30633544921875, -2.1455078125, -1.98468017578125, -1.8238525390625, -1.66302490234375, -1.502197265625, -1.34136962890625, -1.1805419921875, -1.01971435546875, -0.85888671875, -0.69805908203125, -0.5372314453125, -0.37640380859375, -0.215576171875, -0.05474853515625, 0.1060791015625, 0.26690673828125, 0.427734375, 0.58856201171875, 0.7493896484375, 0.91021728515625, 1.071044921875, 1.23187255859375, 1.3927001953125, 1.55352783203125, 1.71435546875, 1.87518310546875, 2.0360107421875, 2.19683837890625, 2.357666015625, 2.51849365234375, 2.6793212890625, 2.84014892578125, 3.0009765625, 3.16180419921875, 3.3226318359375, 3.48345947265625, 3.644287109375, 3.80511474609375, 3.9659423828125, 4.12677001953125, 4.28759765625, 4.44842529296875, 4.6092529296875, 4.77008056640625, 4.930908203125, 5.09173583984375, 5.2525634765625, 5.41339111328125, 5.57421875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 13.0, 12.0, 8.0, 15.0, 16.0, 20.0, 13.0, 17.0, 29.0, 38.0, 38.0, 47.0, 52.0, 56.0, 54.0, 70.0, 67.0, 62.0, 47.0, 52.0, 43.0, 34.0, 27.0, 35.0, 24.0, 13.0, 11.0, 19.0, 9.0, 10.0, 10.0, 6.0, 9.0, 4.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.63134765625, -29.641857147216797, -28.652366638183594, -27.66287612915039, -26.673383712768555, -25.68389320373535, -24.69440269470215, -23.704912185668945, -22.715421676635742, -21.72593116760254, -20.736440658569336, -19.7469482421875, -18.757457733154297, -17.767967224121094, -16.77847671508789, -15.788986206054688, -14.799494743347168, -13.810004234313965, -12.820512771606445, -11.831022262573242, -10.841531753540039, -9.852041244506836, -8.862549781799316, -7.873059272766113, -6.883568286895752, -5.894077301025391, -4.9045867919921875, -3.915095806121826, -2.925605058670044, -1.9361143112182617, -0.9466233253479004, 0.042867183685302734, 1.032358169555664, 2.0218489170074463, 3.0113396644592285, 4.00083065032959, 4.990321159362793, 5.979812145233154, 6.969303131103516, 7.958793640136719, 8.948284149169922, 9.937774658203125, 10.927266120910645, 11.916756629943848, 12.90624713897705, 13.89573860168457, 14.885229110717773, 15.874719619750977, 16.864212036132812, 17.853702545166016, 18.84319305419922, 19.832683563232422, 20.822175979614258, 21.81166648864746, 22.801156997680664, 23.790647506713867, 24.78013801574707, 25.769628524780273, 26.759119033813477, 27.748611450195312, 28.738101959228516, 29.72759246826172, 30.717082977294922, 31.706573486328125, 32.69606399536133]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 4.0, 4.0, 8.0, 10.0, 12.0, 8.0, 13.0, 13.0, 10.0, 22.0, 28.0, 22.0, 32.0, 31.0, 48.0, 33.0, 35.0, 34.0, 40.0, 39.0, 40.0, 33.0, 55.0, 57.0, 46.0, 39.0, 33.0, 36.0, 38.0, 36.0, 31.0, 18.0, 18.0, 14.0, 10.0, 12.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.73298263549805, -31.6606388092041, -30.588294982910156, -29.51595115661621, -28.443607330322266, -27.371261596679688, -26.298917770385742, -25.226573944091797, -24.15423011779785, -23.081886291503906, -22.00954246520996, -20.937198638916016, -19.864852905273438, -18.792510986328125, -17.720165252685547, -16.6478214263916, -15.575477600097656, -14.503133773803711, -13.430789947509766, -12.358445167541504, -11.286101341247559, -10.213757514953613, -9.141412734985352, -8.069068908691406, -6.996725082397461, -5.924381256103516, -4.852036952972412, -3.7796928882598877, -2.7073488235473633, -1.635004997253418, -0.5626606941223145, 0.5096836090087891, 1.5820236206054688, 2.654367685317993, 3.7267117500305176, 4.799056053161621, 5.871399879455566, 6.943743705749512, 8.016088485717773, 9.088432312011719, 10.160776138305664, 11.23311996459961, 12.305463790893555, 13.377808570861816, 14.450152397155762, 15.522496223449707, 16.59484100341797, 17.667184829711914, 18.73952865600586, 19.811872482299805, 20.88421630859375, 21.956560134887695, 23.02890396118164, 24.10124969482422, 25.173593521118164, 26.24593734741211, 27.318281173706055, 28.390625, 29.462968826293945, 30.53531265258789, 31.60765838623047, 32.68000030517578, 33.75234603881836, 34.82469177246094, 35.89703369140625]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 15.0, 24.0, 33.0, 46.0, 60.0, 101.0, 154.0, 212.0, 353.0, 590.0, 992.0, 1719.0, 3071.0, 5870.0, 11618.0, 24885.0, 58800.0, 166852.0, 589452.0, 1646101.0, 1161127.0, 337742.0, 104979.0, 41353.0, 18563.0, 8848.0, 4577.0, 2613.0, 1398.0, 823.0, 472.0, 294.0, 195.0, 99.0, 84.0, 56.0, 29.0, 26.0, 13.0, 16.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.40625, -55.70703125, -54.0078125, -52.30859375, -50.609375, -48.91015625, -47.2109375, -45.51171875, -43.8125, -42.11328125, -40.4140625, -38.71484375, -37.015625, -35.31640625, -33.6171875, -31.91796875, -30.21875, -28.51953125, -26.8203125, -25.12109375, -23.421875, -21.72265625, -20.0234375, -18.32421875, -16.625, -14.92578125, -13.2265625, -11.52734375, -9.828125, -8.12890625, -6.4296875, -4.73046875, -3.03125, -1.33203125, 0.3671875, 2.06640625, 3.765625, 5.46484375, 7.1640625, 8.86328125, 10.5625, 12.26171875, 13.9609375, 15.66015625, 17.359375, 19.05859375, 20.7578125, 22.45703125, 24.15625, 25.85546875, 27.5546875, 29.25390625, 30.953125, 32.65234375, 34.3515625, 36.05078125, 37.75, 39.44921875, 41.1484375, 42.84765625, 44.546875, 46.24609375, 47.9453125, 49.64453125, 51.34375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 6.0, 0.0, 11.0, 8.0, 7.0, 8.0, 19.0, 10.0, 9.0, 12.0, 18.0, 27.0, 23.0, 40.0, 27.0, 42.0, 39.0, 31.0, 27.0, 40.0, 37.0, 41.0, 51.0, 46.0, 45.0, 50.0, 46.0, 43.0, 30.0, 38.0, 28.0, 27.0, 19.0, 21.0, 10.0, 9.0, 13.0, 13.0, 7.0, 6.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.125, -32.139404296875, -31.15380859375, -30.168212890625, -29.1826171875, -28.197021484375, -27.21142578125, -26.225830078125, -25.240234375, -24.254638671875, -23.26904296875, -22.283447265625, -21.2978515625, -20.312255859375, -19.32666015625, -18.341064453125, -17.35546875, -16.369873046875, -15.38427734375, -14.398681640625, -13.4130859375, -12.427490234375, -11.44189453125, -10.456298828125, -9.470703125, -8.485107421875, -7.49951171875, -6.513916015625, -5.5283203125, -4.542724609375, -3.55712890625, -2.571533203125, -1.5859375, -0.600341796875, 0.38525390625, 1.370849609375, 2.3564453125, 3.342041015625, 4.32763671875, 5.313232421875, 6.298828125, 7.284423828125, 8.27001953125, 9.255615234375, 10.2412109375, 11.226806640625, 12.21240234375, 13.197998046875, 14.18359375, 15.169189453125, 16.15478515625, 17.140380859375, 18.1259765625, 19.111572265625, 20.09716796875, 21.082763671875, 22.068359375, 23.053955078125, 24.03955078125, 25.025146484375, 26.0107421875, 26.996337890625, 27.98193359375, 28.967529296875, 29.953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [8.0, 1.0, 7.0, 7.0, 9.0, 15.0, 17.0, 31.0, 34.0, 43.0, 67.0, 105.0, 134.0, 203.0, 271.0, 402.0, 590.0, 872.0, 1246.0, 1838.0, 2822.0, 4430.0, 6847.0, 10856.0, 18845.0, 32495.0, 59437.0, 113174.0, 227545.0, 495106.0, 1081006.0, 1118286.0, 516599.0, 237300.0, 117548.0, 61606.0, 33627.0, 19206.0, 11211.0, 7161.0, 4420.0, 2855.0, 1839.0, 1217.0, 931.0, 597.0, 426.0, 274.0, 226.0, 159.0, 103.0, 61.0, 52.0, 50.0, 24.0, 20.0, 10.0, 10.0, 10.0, 8.0, 3.0, 1.0, 0.0, 1.0], "bins": [-41.375, -40.04150390625, -38.7080078125, -37.37451171875, -36.041015625, -34.70751953125, -33.3740234375, -32.04052734375, -30.70703125, -29.37353515625, -28.0400390625, -26.70654296875, -25.373046875, -24.03955078125, -22.7060546875, -21.37255859375, -20.0390625, -18.70556640625, -17.3720703125, -16.03857421875, -14.705078125, -13.37158203125, -12.0380859375, -10.70458984375, -9.37109375, -8.03759765625, -6.7041015625, -5.37060546875, -4.037109375, -2.70361328125, -1.3701171875, -0.03662109375, 1.296875, 2.63037109375, 3.9638671875, 5.29736328125, 6.630859375, 7.96435546875, 9.2978515625, 10.63134765625, 11.96484375, 13.29833984375, 14.6318359375, 15.96533203125, 17.298828125, 18.63232421875, 19.9658203125, 21.29931640625, 22.6328125, 23.96630859375, 25.2998046875, 26.63330078125, 27.966796875, 29.30029296875, 30.6337890625, 31.96728515625, 33.30078125, 34.63427734375, 35.9677734375, 37.30126953125, 38.634765625, 39.96826171875, 41.3017578125, 42.63525390625, 43.96875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 6.0, 12.0, 9.0, 23.0, 18.0, 19.0, 35.0, 29.0, 54.0, 50.0, 78.0, 91.0, 90.0, 146.0, 166.0, 201.0, 275.0, 306.0, 310.0, 315.0, 304.0, 281.0, 245.0, 202.0, 162.0, 123.0, 109.0, 85.0, 72.0, 63.0, 39.0, 36.0, 16.0, 20.0, 13.0, 13.0, 6.0, 11.0, 8.0, 2.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.203125, -13.72119140625, -13.2392578125, -12.75732421875, -12.275390625, -11.79345703125, -11.3115234375, -10.82958984375, -10.34765625, -9.86572265625, -9.3837890625, -8.90185546875, -8.419921875, -7.93798828125, -7.4560546875, -6.97412109375, -6.4921875, -6.01025390625, -5.5283203125, -5.04638671875, -4.564453125, -4.08251953125, -3.6005859375, -3.11865234375, -2.63671875, -2.15478515625, -1.6728515625, -1.19091796875, -0.708984375, -0.22705078125, 0.2548828125, 0.73681640625, 1.21875, 1.70068359375, 2.1826171875, 2.66455078125, 3.146484375, 3.62841796875, 4.1103515625, 4.59228515625, 5.07421875, 5.55615234375, 6.0380859375, 6.52001953125, 7.001953125, 7.48388671875, 7.9658203125, 8.44775390625, 8.9296875, 9.41162109375, 9.8935546875, 10.37548828125, 10.857421875, 11.33935546875, 11.8212890625, 12.30322265625, 12.78515625, 13.26708984375, 13.7490234375, 14.23095703125, 14.712890625, 15.19482421875, 15.6767578125, 16.15869140625, 16.640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 12.0, 22.0, 26.0, 36.0, 45.0, 52.0, 57.0, 63.0, 70.0, 78.0, 78.0, 79.0, 59.0, 56.0, 54.0, 44.0, 27.0, 18.0, 21.0, 22.0, 16.0, 5.0, 12.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.362735748291016, -45.93781280517578, -44.51289367675781, -43.08797073364258, -41.663047790527344, -40.23812484741211, -38.81320571899414, -37.388282775878906, -35.96335983276367, -34.53843688964844, -33.11351776123047, -31.688594818115234, -30.263671875, -28.8387508392334, -27.413829803466797, -25.988906860351562, -24.56398582458496, -23.13906478881836, -21.714141845703125, -20.289220809936523, -18.86429786682129, -17.439376831054688, -16.014453887939453, -14.589532852172852, -13.164610862731934, -11.739688873291016, -10.314766883850098, -8.88984489440918, -7.46492338180542, -6.040001392364502, -4.615079879760742, -3.190157890319824, -1.7652359008789062, -0.34031403064727783, 1.0846078395843506, 2.5095295906066895, 3.9344515800476074, 5.359373569488525, 6.784295082092285, 8.209217071533203, 9.634139060974121, 11.059061050415039, 12.483983039855957, 13.908905029296875, 15.333826065063477, 16.75874900817871, 18.183670043945312, 19.608592987060547, 21.03351402282715, 22.45843505859375, 23.883358001708984, 25.308279037475586, 26.73320198059082, 28.158123016357422, 29.583045959472656, 31.007966995239258, 32.43288803100586, 33.857810974121094, 35.28273010253906, 36.7076530456543, 38.13257598876953, 39.557498931884766, 40.982418060302734, 42.40734100341797, 43.8322639465332]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 1.0, 3.0, 7.0, 15.0, 6.0, 10.0, 17.0, 14.0, 19.0, 25.0, 19.0, 32.0, 26.0, 16.0, 37.0, 33.0, 41.0, 47.0, 44.0, 51.0, 52.0, 38.0, 51.0, 43.0, 48.0, 51.0, 37.0, 35.0, 40.0, 24.0, 19.0, 25.0, 13.0, 9.0, 9.0, 10.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.490203857421875, -41.285099029541016, -40.079994201660156, -38.8748893737793, -37.66978454589844, -36.46467971801758, -35.25957489013672, -34.05447006225586, -32.849365234375, -31.64426040649414, -30.43915557861328, -29.234050750732422, -28.028945922851562, -26.823841094970703, -25.618736267089844, -24.413631439208984, -23.208526611328125, -22.003421783447266, -20.798316955566406, -19.593212127685547, -18.388107299804688, -17.183002471923828, -15.977897644042969, -14.77279281616211, -13.56768798828125, -12.36258316040039, -11.157478332519531, -9.952373504638672, -8.747268676757812, -7.542163848876953, -6.337059020996094, -5.131954193115234, -3.9268455505371094, -2.72174072265625, -1.5166358947753906, -0.31153106689453125, 0.8935737609863281, 2.0986785888671875, 3.303783416748047, 4.508888244628906, 5.713993072509766, 6.919097900390625, 8.124202728271484, 9.329307556152344, 10.534412384033203, 11.739517211914062, 12.944622039794922, 14.149726867675781, 15.35483169555664, 16.5599365234375, 17.76504135131836, 18.97014617919922, 20.175251007080078, 21.380355834960938, 22.585460662841797, 23.790565490722656, 24.995670318603516, 26.200775146484375, 27.405879974365234, 28.610984802246094, 29.816089630126953, 31.021194458007812, 32.22629928588867, 33.43140411376953, 34.63650894165039]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 20.0, 28.0, 42.0, 58.0, 74.0, 116.0, 193.0, 265.0, 448.0, 632.0, 1047.0, 1566.0, 2565.0, 4295.0, 7225.0, 12532.0, 22700.0, 42685.0, 86629.0, 182185.0, 297433.0, 193571.0, 91024.0, 44556.0, 23743.0, 13207.0, 7759.0, 4530.0, 2745.0, 1704.0, 1027.0, 675.0, 426.0, 298.0, 180.0, 125.0, 78.0, 38.0, 29.0, 34.0, 21.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-28.375, -27.553466796875, -26.73193359375, -25.910400390625, -25.0888671875, -24.267333984375, -23.44580078125, -22.624267578125, -21.802734375, -20.981201171875, -20.15966796875, -19.338134765625, -18.5166015625, -17.695068359375, -16.87353515625, -16.052001953125, -15.23046875, -14.408935546875, -13.58740234375, -12.765869140625, -11.9443359375, -11.122802734375, -10.30126953125, -9.479736328125, -8.658203125, -7.836669921875, -7.01513671875, -6.193603515625, -5.3720703125, -4.550537109375, -3.72900390625, -2.907470703125, -2.0859375, -1.264404296875, -0.44287109375, 0.378662109375, 1.2001953125, 2.021728515625, 2.84326171875, 3.664794921875, 4.486328125, 5.307861328125, 6.12939453125, 6.950927734375, 7.7724609375, 8.593994140625, 9.41552734375, 10.237060546875, 11.05859375, 11.880126953125, 12.70166015625, 13.523193359375, 14.3447265625, 15.166259765625, 15.98779296875, 16.809326171875, 17.630859375, 18.452392578125, 19.27392578125, 20.095458984375, 20.9169921875, 21.738525390625, 22.56005859375, 23.381591796875, 24.203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 11.0, 20.0, 12.0, 20.0, 15.0, 29.0, 21.0, 23.0, 28.0, 35.0, 44.0, 41.0, 49.0, 54.0, 51.0, 57.0, 50.0, 51.0, 49.0, 43.0, 42.0, 40.0, 40.0, 40.0, 21.0, 14.0, 17.0, 10.0, 13.0, 6.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.9375, -45.6298828125, -44.322265625, -43.0146484375, -41.70703125, -40.3994140625, -39.091796875, -37.7841796875, -36.4765625, -35.1689453125, -33.861328125, -32.5537109375, -31.24609375, -29.9384765625, -28.630859375, -27.3232421875, -26.015625, -24.7080078125, -23.400390625, -22.0927734375, -20.78515625, -19.4775390625, -18.169921875, -16.8623046875, -15.5546875, -14.2470703125, -12.939453125, -11.6318359375, -10.32421875, -9.0166015625, -7.708984375, -6.4013671875, -5.09375, -3.7861328125, -2.478515625, -1.1708984375, 0.13671875, 1.4443359375, 2.751953125, 4.0595703125, 5.3671875, 6.6748046875, 7.982421875, 9.2900390625, 10.59765625, 11.9052734375, 13.212890625, 14.5205078125, 15.828125, 17.1357421875, 18.443359375, 19.7509765625, 21.05859375, 22.3662109375, 23.673828125, 24.9814453125, 26.2890625, 27.5966796875, 28.904296875, 30.2119140625, 31.51953125, 32.8271484375, 34.134765625, 35.4423828125, 36.75]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 14.0, 15.0, 15.0, 24.0, 35.0, 47.0, 73.0, 117.0, 178.0, 289.0, 462.0, 669.0, 1086.0, 1746.0, 2724.0, 4756.0, 7998.0, 13618.0, 24344.0, 46730.0, 99934.0, 259997.0, 330142.0, 127810.0, 56989.0, 29092.0, 15981.0, 9347.0, 5484.0, 3316.0, 1995.0, 1311.0, 771.0, 468.0, 341.0, 235.0, 111.0, 100.0, 64.0, 41.0, 22.0, 19.0, 14.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.6875, -32.56982421875, -31.4521484375, -30.33447265625, -29.216796875, -28.09912109375, -26.9814453125, -25.86376953125, -24.74609375, -23.62841796875, -22.5107421875, -21.39306640625, -20.275390625, -19.15771484375, -18.0400390625, -16.92236328125, -15.8046875, -14.68701171875, -13.5693359375, -12.45166015625, -11.333984375, -10.21630859375, -9.0986328125, -7.98095703125, -6.86328125, -5.74560546875, -4.6279296875, -3.51025390625, -2.392578125, -1.27490234375, -0.1572265625, 0.96044921875, 2.078125, 3.19580078125, 4.3134765625, 5.43115234375, 6.548828125, 7.66650390625, 8.7841796875, 9.90185546875, 11.01953125, 12.13720703125, 13.2548828125, 14.37255859375, 15.490234375, 16.60791015625, 17.7255859375, 18.84326171875, 19.9609375, 21.07861328125, 22.1962890625, 23.31396484375, 24.431640625, 25.54931640625, 26.6669921875, 27.78466796875, 28.90234375, 30.02001953125, 31.1376953125, 32.25537109375, 33.373046875, 34.49072265625, 35.6083984375, 36.72607421875, 37.84375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 16.0, 23.0, 20.0, 34.0, 28.0, 32.0, 36.0, 32.0, 39.0, 48.0, 41.0, 48.0, 51.0, 42.0, 58.0, 46.0, 35.0, 38.0, 33.0, 31.0, 22.0, 30.0, 26.0, 28.0, 18.0, 16.0, 16.0, 12.0, 16.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.171875, -19.4619140625, -18.751953125, -18.0419921875, -17.33203125, -16.6220703125, -15.912109375, -15.2021484375, -14.4921875, -13.7822265625, -13.072265625, -12.3623046875, -11.65234375, -10.9423828125, -10.232421875, -9.5224609375, -8.8125, -8.1025390625, -7.392578125, -6.6826171875, -5.97265625, -5.2626953125, -4.552734375, -3.8427734375, -3.1328125, -2.4228515625, -1.712890625, -1.0029296875, -0.29296875, 0.4169921875, 1.126953125, 1.8369140625, 2.546875, 3.2568359375, 3.966796875, 4.6767578125, 5.38671875, 6.0966796875, 6.806640625, 7.5166015625, 8.2265625, 8.9365234375, 9.646484375, 10.3564453125, 11.06640625, 11.7763671875, 12.486328125, 13.1962890625, 13.90625, 14.6162109375, 15.326171875, 16.0361328125, 16.74609375, 17.4560546875, 18.166015625, 18.8759765625, 19.5859375, 20.2958984375, 21.005859375, 21.7158203125, 22.42578125, 23.1357421875, 23.845703125, 24.5556640625, 25.265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 12.0, 10.0, 16.0, 23.0, 40.0, 40.0, 76.0, 92.0, 131.0, 201.0, 278.0, 458.0, 586.0, 916.0, 1476.0, 2307.0, 3702.0, 6330.0, 11234.0, 20532.0, 40198.0, 82439.0, 173009.0, 296167.0, 206428.0, 98484.0, 47249.0, 24197.0, 13043.0, 7292.0, 4264.0, 2601.0, 1625.0, 1061.0, 642.0, 420.0, 303.0, 213.0, 136.0, 109.0, 50.0, 55.0, 31.0, 24.0, 13.0, 13.0, 9.0, 3.0, 2.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.5389404296875, -7.300537109375, -7.0621337890625, -6.82373046875, -6.5853271484375, -6.346923828125, -6.1085205078125, -5.8701171875, -5.6317138671875, -5.393310546875, -5.1549072265625, -4.91650390625, -4.6781005859375, -4.439697265625, -4.2012939453125, -3.962890625, -3.7244873046875, -3.486083984375, -3.2476806640625, -3.00927734375, -2.7708740234375, -2.532470703125, -2.2940673828125, -2.0556640625, -1.8172607421875, -1.578857421875, -1.3404541015625, -1.10205078125, -0.8636474609375, -0.625244140625, -0.3868408203125, -0.1484375, 0.0899658203125, 0.328369140625, 0.5667724609375, 0.80517578125, 1.0435791015625, 1.281982421875, 1.5203857421875, 1.7587890625, 1.9971923828125, 2.235595703125, 2.4739990234375, 2.71240234375, 2.9508056640625, 3.189208984375, 3.4276123046875, 3.666015625, 3.9044189453125, 4.142822265625, 4.3812255859375, 4.61962890625, 4.8580322265625, 5.096435546875, 5.3348388671875, 5.5732421875, 5.8116455078125, 6.050048828125, 6.2884521484375, 6.52685546875, 6.7652587890625, 7.003662109375, 7.2420654296875, 7.48046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 11.0, 12.0, 11.0, 14.0, 19.0, 28.0, 30.0, 42.0, 41.0, 73.0, 73.0, 82.0, 90.0, 82.0, 61.0, 57.0, 46.0, 46.0, 41.0, 32.0, 29.0, 21.0, 20.0, 14.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010938644409179688, -0.001065678894519806, -0.001037493348121643, -0.0010093078017234802, -0.0009811222553253174, -0.0009529367089271545, -0.0009247511625289917, -0.0008965656161308289, -0.000868380069732666, -0.0008401945233345032, -0.0008120089769363403, -0.0007838234305381775, -0.0007556378841400146, -0.0007274523377418518, -0.000699266791343689, -0.0006710812449455261, -0.0006428956985473633, -0.0006147101521492004, -0.0005865246057510376, -0.0005583390593528748, -0.0005301535129547119, -0.0005019679665565491, -0.00047378242015838623, -0.0004455968737602234, -0.00041741132736206055, -0.0003892257809638977, -0.00036104023456573486, -0.000332854688167572, -0.0003046691417694092, -0.00027648359537124634, -0.0002482980489730835, -0.00022011250257492065, -0.0001919269561767578, -0.00016374140977859497, -0.00013555586338043213, -0.00010737031698226929, -7.918477058410645e-05, -5.0999224185943604e-05, -2.2813677787780762e-05, 5.37186861038208e-06, 3.355741500854492e-05, 6.174296140670776e-05, 8.99285078048706e-05, 0.00011811405420303345, 0.0001462996006011963, 0.00017448514699935913, 0.00020267069339752197, 0.00023085623979568481, 0.00025904178619384766, 0.0002872273325920105, 0.00031541287899017334, 0.0003435984253883362, 0.000371783971786499, 0.00039996951818466187, 0.0004281550645828247, 0.00045634061098098755, 0.0004845261573791504, 0.0005127117037773132, 0.0005408972501754761, 0.0005690827965736389, 0.0005972683429718018, 0.0006254538893699646, 0.0006536394357681274, 0.0006818249821662903, 0.0007100105285644531]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 14.0, 14.0, 23.0, 19.0, 45.0, 72.0, 89.0, 134.0, 161.0, 257.0, 382.0, 655.0, 1031.0, 1725.0, 2881.0, 5142.0, 9570.0, 18481.0, 37291.0, 78460.0, 166162.0, 288396.0, 223825.0, 108538.0, 51595.0, 24784.0, 12699.0, 6661.0, 3698.0, 2171.0, 1291.0, 786.0, 525.0, 333.0, 206.0, 136.0, 96.0, 52.0, 34.0, 38.0, 19.0, 18.0, 6.0, 15.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-10.203125, -9.9005126953125, -9.597900390625, -9.2952880859375, -8.99267578125, -8.6900634765625, -8.387451171875, -8.0848388671875, -7.7822265625, -7.4796142578125, -7.177001953125, -6.8743896484375, -6.57177734375, -6.2691650390625, -5.966552734375, -5.6639404296875, -5.361328125, -5.0587158203125, -4.756103515625, -4.4534912109375, -4.15087890625, -3.8482666015625, -3.545654296875, -3.2430419921875, -2.9404296875, -2.6378173828125, -2.335205078125, -2.0325927734375, -1.72998046875, -1.4273681640625, -1.124755859375, -0.8221435546875, -0.51953125, -0.2169189453125, 0.085693359375, 0.3883056640625, 0.69091796875, 0.9935302734375, 1.296142578125, 1.5987548828125, 1.9013671875, 2.2039794921875, 2.506591796875, 2.8092041015625, 3.11181640625, 3.4144287109375, 3.717041015625, 4.0196533203125, 4.322265625, 4.6248779296875, 4.927490234375, 5.2301025390625, 5.53271484375, 5.8353271484375, 6.137939453125, 6.4405517578125, 6.7431640625, 7.0457763671875, 7.348388671875, 7.6510009765625, 7.95361328125, 8.2562255859375, 8.558837890625, 8.8614501953125, 9.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 12.0, 10.0, 10.0, 16.0, 14.0, 27.0, 26.0, 31.0, 42.0, 58.0, 62.0, 80.0, 61.0, 76.0, 76.0, 66.0, 69.0, 48.0, 35.0, 37.0, 21.0, 18.0, 18.0, 15.0, 10.0, 7.0, 5.0, 12.0, 4.0, 5.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.859100341796875, -2.77288818359375, -2.686676025390625, -2.6004638671875, -2.514251708984375, -2.42803955078125, -2.341827392578125, -2.255615234375, -2.169403076171875, -2.08319091796875, -1.996978759765625, -1.9107666015625, -1.824554443359375, -1.73834228515625, -1.652130126953125, -1.56591796875, -1.479705810546875, -1.39349365234375, -1.307281494140625, -1.2210693359375, -1.134857177734375, -1.04864501953125, -0.962432861328125, -0.876220703125, -0.790008544921875, -0.70379638671875, -0.617584228515625, -0.5313720703125, -0.445159912109375, -0.35894775390625, -0.272735595703125, -0.1865234375, -0.100311279296875, -0.01409912109375, 0.072113037109375, 0.1583251953125, 0.244537353515625, 0.33074951171875, 0.416961669921875, 0.503173828125, 0.589385986328125, 0.67559814453125, 0.761810302734375, 0.8480224609375, 0.934234619140625, 1.02044677734375, 1.106658935546875, 1.19287109375, 1.279083251953125, 1.36529541015625, 1.451507568359375, 1.5377197265625, 1.623931884765625, 1.71014404296875, 1.796356201171875, 1.882568359375, 1.968780517578125, 2.05499267578125, 2.141204833984375, 2.2274169921875, 2.313629150390625, 2.39984130859375, 2.486053466796875, 2.572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 17.0, 14.0, 25.0, 30.0, 45.0, 44.0, 64.0, 61.0, 60.0, 75.0, 83.0, 80.0, 67.0, 57.0, 61.0, 44.0, 27.0, 28.0, 20.0, 16.0, 16.0, 12.0, 6.0, 8.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.283668518066406, -45.869693756103516, -44.455718994140625, -43.04174041748047, -41.62776565551758, -40.21379089355469, -38.79981231689453, -37.38583755493164, -35.97186279296875, -34.55788803100586, -33.14391326904297, -31.729934692382812, -30.315959930419922, -28.90198516845703, -27.488008499145508, -26.074031829833984, -24.660057067871094, -23.246082305908203, -21.83210563659668, -20.418128967285156, -19.004154205322266, -17.590179443359375, -16.17620277404785, -14.762227058410645, -13.348251342773438, -11.93427562713623, -10.520299911499023, -9.106324195861816, -7.692348480224609, -6.278372764587402, -4.864397048950195, -3.4504213333129883, -2.0364456176757812, -0.6224699020385742, 0.7915058135986328, 2.20548152923584, 3.619457244873047, 5.033432960510254, 6.447408676147461, 7.861384391784668, 9.275360107421875, 10.689335823059082, 12.103311538696289, 13.517287254333496, 14.931262969970703, 16.345237731933594, 17.759214401245117, 19.17319107055664, 20.58716583251953, 22.001140594482422, 23.415117263793945, 24.82909393310547, 26.24306869506836, 27.65704345703125, 29.071020126342773, 30.484996795654297, 31.898971557617188, 33.31294631958008, 34.72692108154297, 36.140899658203125, 37.554874420166016, 38.968849182128906, 40.38282775878906, 41.79680252075195, 43.210777282714844]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 14.0, 8.0, 12.0, 13.0, 14.0, 14.0, 26.0, 19.0, 28.0, 31.0, 20.0, 28.0, 31.0, 43.0, 47.0, 42.0, 49.0, 50.0, 43.0, 48.0, 43.0, 48.0, 52.0, 34.0, 41.0, 42.0, 28.0, 23.0, 22.0, 16.0, 10.0, 10.0, 8.0, 14.0, 11.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.58190155029297, -41.38736343383789, -40.19282531738281, -38.998291015625, -37.80375289916992, -36.609214782714844, -35.41468048095703, -34.22014236450195, -33.025604248046875, -31.831066131591797, -30.63652992248535, -29.441993713378906, -28.247455596923828, -27.05291748046875, -25.858381271362305, -24.66384506225586, -23.46930694580078, -22.274768829345703, -21.080232620239258, -19.885696411132812, -18.691158294677734, -17.496620178222656, -16.30208396911621, -15.10754680633545, -13.913009643554688, -12.718472480773926, -11.523935317993164, -10.329398155212402, -9.13486099243164, -7.940323829650879, -6.745786666870117, -5.5512495040893555, -4.356708526611328, -3.1621713638305664, -1.9676342010498047, -0.773097038269043, 0.42144012451171875, 1.6159772872924805, 2.810514450073242, 4.005051612854004, 5.199588775634766, 6.394125938415527, 7.588663101196289, 8.78320026397705, 9.977737426757812, 11.172274589538574, 12.366811752319336, 13.561348915100098, 14.75588607788086, 15.950423240661621, 17.144960403442383, 18.339496612548828, 19.534034729003906, 20.728572845458984, 21.92310905456543, 23.117645263671875, 24.312183380126953, 25.50672149658203, 26.701257705688477, 27.895793914794922, 29.09033203125, 30.284870147705078, 31.479406356811523, 32.67394256591797, 33.86848068237305]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 7.0, 23.0, 37.0, 34.0, 59.0, 95.0, 154.0, 230.0, 341.0, 556.0, 829.0, 1411.0, 2186.0, 3465.0, 5566.0, 8891.0, 14905.0, 23717.0, 38754.0, 63073.0, 101748.0, 157298.0, 198170.0, 158873.0, 102970.0, 63138.0, 38982.0, 24053.0, 14761.0, 8999.0, 5566.0, 3528.0, 2278.0, 1406.0, 875.0, 580.0, 340.0, 237.0, 157.0, 80.0, 54.0, 48.0, 17.0, 22.0, 13.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-38.96875, -37.73193359375, -36.4951171875, -35.25830078125, -34.021484375, -32.78466796875, -31.5478515625, -30.31103515625, -29.07421875, -27.83740234375, -26.6005859375, -25.36376953125, -24.126953125, -22.89013671875, -21.6533203125, -20.41650390625, -19.1796875, -17.94287109375, -16.7060546875, -15.46923828125, -14.232421875, -12.99560546875, -11.7587890625, -10.52197265625, -9.28515625, -8.04833984375, -6.8115234375, -5.57470703125, -4.337890625, -3.10107421875, -1.8642578125, -0.62744140625, 0.609375, 1.84619140625, 3.0830078125, 4.31982421875, 5.556640625, 6.79345703125, 8.0302734375, 9.26708984375, 10.50390625, 11.74072265625, 12.9775390625, 14.21435546875, 15.451171875, 16.68798828125, 17.9248046875, 19.16162109375, 20.3984375, 21.63525390625, 22.8720703125, 24.10888671875, 25.345703125, 26.58251953125, 27.8193359375, 29.05615234375, 30.29296875, 31.52978515625, 32.7666015625, 34.00341796875, 35.240234375, 36.47705078125, 37.7138671875, 38.95068359375, 40.1875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 1.0, 7.0, 6.0, 9.0, 13.0, 14.0, 8.0, 15.0, 19.0, 26.0, 19.0, 25.0, 20.0, 32.0, 37.0, 30.0, 49.0, 55.0, 49.0, 52.0, 49.0, 49.0, 50.0, 60.0, 47.0, 34.0, 45.0, 39.0, 31.0, 27.0, 13.0, 13.0, 11.0, 11.0, 10.0, 7.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.21875, -42.01171875, -40.8046875, -39.59765625, -38.390625, -37.18359375, -35.9765625, -34.76953125, -33.5625, -32.35546875, -31.1484375, -29.94140625, -28.734375, -27.52734375, -26.3203125, -25.11328125, -23.90625, -22.69921875, -21.4921875, -20.28515625, -19.078125, -17.87109375, -16.6640625, -15.45703125, -14.25, -13.04296875, -11.8359375, -10.62890625, -9.421875, -8.21484375, -7.0078125, -5.80078125, -4.59375, -3.38671875, -2.1796875, -0.97265625, 0.234375, 1.44140625, 2.6484375, 3.85546875, 5.0625, 6.26953125, 7.4765625, 8.68359375, 9.890625, 11.09765625, 12.3046875, 13.51171875, 14.71875, 15.92578125, 17.1328125, 18.33984375, 19.546875, 20.75390625, 21.9609375, 23.16796875, 24.375, 25.58203125, 26.7890625, 27.99609375, 29.203125, 30.41015625, 31.6171875, 32.82421875, 34.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 10.0, 13.0, 25.0, 22.0, 31.0, 44.0, 88.0, 124.0, 192.0, 256.0, 409.0, 633.0, 920.0, 1411.0, 2037.0, 3102.0, 4774.0, 7116.0, 10917.0, 16508.0, 25070.0, 38595.0, 58686.0, 88533.0, 129064.0, 166779.0, 155948.0, 114212.0, 76289.0, 50302.0, 33135.0, 21554.0, 14195.0, 9385.0, 6187.0, 4055.0, 2674.0, 1727.0, 1195.0, 780.0, 499.0, 343.0, 237.0, 144.0, 111.0, 79.0, 48.0, 36.0, 25.0, 11.0, 11.0, 11.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-35.25, -34.02685546875, -32.8037109375, -31.58056640625, -30.357421875, -29.13427734375, -27.9111328125, -26.68798828125, -25.46484375, -24.24169921875, -23.0185546875, -21.79541015625, -20.572265625, -19.34912109375, -18.1259765625, -16.90283203125, -15.6796875, -14.45654296875, -13.2333984375, -12.01025390625, -10.787109375, -9.56396484375, -8.3408203125, -7.11767578125, -5.89453125, -4.67138671875, -3.4482421875, -2.22509765625, -1.001953125, 0.22119140625, 1.4443359375, 2.66748046875, 3.890625, 5.11376953125, 6.3369140625, 7.56005859375, 8.783203125, 10.00634765625, 11.2294921875, 12.45263671875, 13.67578125, 14.89892578125, 16.1220703125, 17.34521484375, 18.568359375, 19.79150390625, 21.0146484375, 22.23779296875, 23.4609375, 24.68408203125, 25.9072265625, 27.13037109375, 28.353515625, 29.57666015625, 30.7998046875, 32.02294921875, 33.24609375, 34.46923828125, 35.6923828125, 36.91552734375, 38.138671875, 39.36181640625, 40.5849609375, 41.80810546875, 43.03125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 14.0, 10.0, 8.0, 11.0, 8.0, 15.0, 22.0, 19.0, 11.0, 27.0, 24.0, 23.0, 29.0, 39.0, 31.0, 37.0, 24.0, 37.0, 26.0, 43.0, 42.0, 38.0, 32.0, 36.0, 34.0, 47.0, 30.0, 26.0, 37.0, 22.0, 28.0, 20.0, 20.0, 18.0, 23.0, 14.0, 16.0, 7.0, 12.0, 8.0, 9.0, 2.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.709228515625, -18.05908203125, -17.408935546875, -16.7587890625, -16.108642578125, -15.45849609375, -14.808349609375, -14.158203125, -13.508056640625, -12.85791015625, -12.207763671875, -11.5576171875, -10.907470703125, -10.25732421875, -9.607177734375, -8.95703125, -8.306884765625, -7.65673828125, -7.006591796875, -6.3564453125, -5.706298828125, -5.05615234375, -4.406005859375, -3.755859375, -3.105712890625, -2.45556640625, -1.805419921875, -1.1552734375, -0.505126953125, 0.14501953125, 0.795166015625, 1.4453125, 2.095458984375, 2.74560546875, 3.395751953125, 4.0458984375, 4.696044921875, 5.34619140625, 5.996337890625, 6.646484375, 7.296630859375, 7.94677734375, 8.596923828125, 9.2470703125, 9.897216796875, 10.54736328125, 11.197509765625, 11.84765625, 12.497802734375, 13.14794921875, 13.798095703125, 14.4482421875, 15.098388671875, 15.74853515625, 16.398681640625, 17.048828125, 17.698974609375, 18.34912109375, 18.999267578125, 19.6494140625, 20.299560546875, 20.94970703125, 21.599853515625, 22.25]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 14.0, 34.0, 35.0, 64.0, 65.0, 83.0, 159.0, 243.0, 344.0, 506.0, 822.0, 1317.0, 2163.0, 3585.0, 6398.0, 11480.0, 21717.0, 42286.0, 87756.0, 184611.0, 287426.0, 200708.0, 97234.0, 46716.0, 23570.0, 12483.0, 6785.0, 3790.0, 2283.0, 1388.0, 841.0, 535.0, 342.0, 255.0, 173.0, 99.0, 69.0, 52.0, 43.0, 21.0, 8.0, 9.0, 15.0, 4.0, 4.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -24.020263671875, -23.25927734375, -22.498291015625, -21.7373046875, -20.976318359375, -20.21533203125, -19.454345703125, -18.693359375, -17.932373046875, -17.17138671875, -16.410400390625, -15.6494140625, -14.888427734375, -14.12744140625, -13.366455078125, -12.60546875, -11.844482421875, -11.08349609375, -10.322509765625, -9.5615234375, -8.800537109375, -8.03955078125, -7.278564453125, -6.517578125, -5.756591796875, -4.99560546875, -4.234619140625, -3.4736328125, -2.712646484375, -1.95166015625, -1.190673828125, -0.4296875, 0.331298828125, 1.09228515625, 1.853271484375, 2.6142578125, 3.375244140625, 4.13623046875, 4.897216796875, 5.658203125, 6.419189453125, 7.18017578125, 7.941162109375, 8.7021484375, 9.463134765625, 10.22412109375, 10.985107421875, 11.74609375, 12.507080078125, 13.26806640625, 14.029052734375, 14.7900390625, 15.551025390625, 16.31201171875, 17.072998046875, 17.833984375, 18.594970703125, 19.35595703125, 20.116943359375, 20.8779296875, 21.638916015625, 22.39990234375, 23.160888671875, 23.921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 13.0, 8.0, 18.0, 23.0, 34.0, 33.0, 45.0, 54.0, 72.0, 81.0, 94.0, 117.0, 83.0, 72.0, 59.0, 52.0, 34.0, 22.0, 15.0, 16.0, 6.0, 10.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028076171875, -0.0027250945568084717, -0.0026425719261169434, -0.002560049295425415, -0.0024775266647338867, -0.0023950040340423584, -0.00231248140335083, -0.0022299587726593018, -0.0021474361419677734, -0.002064913511276245, -0.001982390880584717, -0.0018998682498931885, -0.0018173456192016602, -0.0017348229885101318, -0.0016523003578186035, -0.0015697777271270752, -0.0014872550964355469, -0.0014047324657440186, -0.0013222098350524902, -0.001239687204360962, -0.0011571645736694336, -0.0010746419429779053, -0.000992119312286377, -0.0009095966815948486, -0.0008270740509033203, -0.000744551420211792, -0.0006620287895202637, -0.0005795061588287354, -0.000496983528137207, -0.0004144608974456787, -0.0003319382667541504, -0.00024941563606262207, -0.00016689300537109375, -8.437037467956543e-05, -1.8477439880371094e-06, 8.067488670349121e-05, 0.00016319751739501953, 0.00024572014808654785, 0.00032824277877807617, 0.0004107654094696045, 0.0004932880401611328, 0.0005758106708526611, 0.0006583333015441895, 0.0007408559322357178, 0.0008233785629272461, 0.0009059011936187744, 0.0009884238243103027, 0.001070946455001831, 0.0011534690856933594, 0.0012359917163848877, 0.001318514347076416, 0.0014010369777679443, 0.0014835596084594727, 0.001566082239151001, 0.0016486048698425293, 0.0017311275005340576, 0.001813650131225586, 0.0018961727619171143, 0.0019786953926086426, 0.002061218023300171, 0.0021437406539916992, 0.0022262632846832275, 0.002308785915374756, 0.002391308546066284, 0.0024738311767578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 18.0, 26.0, 31.0, 41.0, 79.0, 73.0, 150.0, 200.0, 346.0, 512.0, 855.0, 1462.0, 2249.0, 3954.0, 6690.0, 11593.0, 21262.0, 39563.0, 74866.0, 141246.0, 237694.0, 224822.0, 130174.0, 68629.0, 36377.0, 19419.0, 10850.0, 6092.0, 3548.0, 2132.0, 1308.0, 795.0, 520.0, 339.0, 195.0, 137.0, 86.0, 56.0, 53.0, 28.0, 17.0, 17.0, 7.0, 8.0, 3.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.25, -20.56298828125, -19.8759765625, -19.18896484375, -18.501953125, -17.81494140625, -17.1279296875, -16.44091796875, -15.75390625, -15.06689453125, -14.3798828125, -13.69287109375, -13.005859375, -12.31884765625, -11.6318359375, -10.94482421875, -10.2578125, -9.57080078125, -8.8837890625, -8.19677734375, -7.509765625, -6.82275390625, -6.1357421875, -5.44873046875, -4.76171875, -4.07470703125, -3.3876953125, -2.70068359375, -2.013671875, -1.32666015625, -0.6396484375, 0.04736328125, 0.734375, 1.42138671875, 2.1083984375, 2.79541015625, 3.482421875, 4.16943359375, 4.8564453125, 5.54345703125, 6.23046875, 6.91748046875, 7.6044921875, 8.29150390625, 8.978515625, 9.66552734375, 10.3525390625, 11.03955078125, 11.7265625, 12.41357421875, 13.1005859375, 13.78759765625, 14.474609375, 15.16162109375, 15.8486328125, 16.53564453125, 17.22265625, 17.90966796875, 18.5966796875, 19.28369140625, 19.970703125, 20.65771484375, 21.3447265625, 22.03173828125, 22.71875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 4.0, 4.0, 8.0, 13.0, 14.0, 17.0, 17.0, 33.0, 34.0, 33.0, 40.0, 39.0, 48.0, 47.0, 50.0, 66.0, 52.0, 68.0, 64.0, 52.0, 47.0, 37.0, 32.0, 25.0, 31.0, 31.0, 11.0, 21.0, 12.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.46728515625, -7.2509765625, -7.03466796875, -6.818359375, -6.60205078125, -6.3857421875, -6.16943359375, -5.953125, -5.73681640625, -5.5205078125, -5.30419921875, -5.087890625, -4.87158203125, -4.6552734375, -4.43896484375, -4.22265625, -4.00634765625, -3.7900390625, -3.57373046875, -3.357421875, -3.14111328125, -2.9248046875, -2.70849609375, -2.4921875, -2.27587890625, -2.0595703125, -1.84326171875, -1.626953125, -1.41064453125, -1.1943359375, -0.97802734375, -0.76171875, -0.54541015625, -0.3291015625, -0.11279296875, 0.103515625, 0.31982421875, 0.5361328125, 0.75244140625, 0.96875, 1.18505859375, 1.4013671875, 1.61767578125, 1.833984375, 2.05029296875, 2.2666015625, 2.48291015625, 2.69921875, 2.91552734375, 3.1318359375, 3.34814453125, 3.564453125, 3.78076171875, 3.9970703125, 4.21337890625, 4.4296875, 4.64599609375, 4.8623046875, 5.07861328125, 5.294921875, 5.51123046875, 5.7275390625, 5.94384765625, 6.16015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 9.0, 15.0, 19.0, 15.0, 22.0, 25.0, 32.0, 50.0, 40.0, 56.0, 58.0, 68.0, 58.0, 57.0, 62.0, 64.0, 59.0, 37.0, 40.0, 47.0, 17.0, 21.0, 22.0, 20.0, 15.0, 12.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.43230438232422, -41.18538284301758, -39.93846130371094, -38.6915397644043, -37.444618225097656, -36.197696685791016, -34.950775146484375, -33.703853607177734, -32.456932067871094, -31.210010528564453, -29.963088989257812, -28.716167449951172, -27.46924591064453, -26.22232437133789, -24.97540283203125, -23.72848129272461, -22.481557846069336, -21.234636306762695, -19.987714767456055, -18.740793228149414, -17.493871688842773, -16.246950149536133, -15.000027656555176, -13.753106117248535, -12.506184577941895, -11.259263038635254, -10.012341499328613, -8.765419006347656, -7.518497943878174, -6.271576404571533, -5.024654388427734, -3.7777328491210938, -2.530811309814453, -1.283889651298523, -0.03696799278259277, 1.209953784942627, 2.4568753242492676, 3.703796863555908, 4.950718879699707, 6.197640419006348, 7.444561958312988, 8.691483497619629, 9.93840503692627, 11.185327529907227, 12.432249069213867, 13.679170608520508, 14.926092147827148, 16.17301368713379, 17.41993522644043, 18.66685676574707, 19.91377830505371, 21.16069984436035, 22.407621383666992, 23.654542922973633, 24.901466369628906, 26.148387908935547, 27.395309448242188, 28.642230987548828, 29.88915252685547, 31.13607406616211, 32.38299560546875, 33.62991714477539, 34.87683868408203, 36.12376022338867, 37.37068176269531]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 6.0, 10.0, 9.0, 13.0, 9.0, 13.0, 19.0, 25.0, 22.0, 30.0, 34.0, 34.0, 31.0, 47.0, 32.0, 52.0, 43.0, 44.0, 44.0, 39.0, 52.0, 42.0, 42.0, 47.0, 44.0, 38.0, 28.0, 26.0, 19.0, 23.0, 16.0, 14.0, 12.0, 14.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.439571380615234, -45.023658752441406, -43.607749938964844, -42.191837310791016, -40.77592468261719, -39.360015869140625, -37.9441032409668, -36.52819061279297, -35.112281799316406, -33.69636917114258, -32.280460357666016, -30.864547729492188, -29.448637008666992, -28.032726287841797, -26.61681365966797, -25.200902938842773, -23.784992218017578, -22.369081497192383, -20.953170776367188, -19.53725814819336, -18.121347427368164, -16.70543670654297, -15.289525032043457, -13.873613357543945, -12.45770263671875, -11.041791915893555, -9.625880241394043, -8.209968566894531, -6.794057846069336, -5.378146648406982, -3.962235450744629, -2.546323776245117, -1.1304092407226562, 0.28550195693969727, 1.7014131546020508, 3.1173243522644043, 4.533235549926758, 5.949146747589111, 7.365057945251465, 8.780969619750977, 10.196880340576172, 11.612791061401367, 13.028702735900879, 14.44461441040039, 15.860525131225586, 17.27643585205078, 18.69234848022461, 20.108259201049805, 21.524169921875, 22.940080642700195, 24.35599136352539, 25.77190399169922, 27.187814712524414, 28.60372543334961, 30.019638061523438, 31.435548782348633, 32.85145950317383, 34.267372131347656, 35.68328094482422, 37.09919357299805, 38.515106201171875, 39.93101501464844, 41.346927642822266, 42.762840270996094, 44.178749084472656]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 8.0, 14.0, 17.0, 17.0, 21.0, 32.0, 45.0, 56.0, 64.0, 85.0, 127.0, 163.0, 233.0, 304.0, 419.0, 671.0, 874.0, 1043125.0, 1167.0, 856.0, 648.0, 462.0, 319.0, 198.0, 166.0, 129.0, 78.0, 62.0, 51.0, 48.0, 27.0, 26.0, 20.0, 8.0, 11.0, 11.0, 7.0, 7.0, 6.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-885.319091796875, -860.0007934570312, -834.6824951171875, -809.3641967773438, -784.0458984375, -758.7276000976562, -733.4093017578125, -708.0910034179688, -682.772705078125, -657.4544067382812, -632.1361083984375, -606.8178100585938, -581.49951171875, -556.1812133789062, -530.8629150390625, -505.54461669921875, -480.2263488769531, -454.9080505371094, -429.5897521972656, -404.2714538574219, -378.9531555175781, -353.6348571777344, -328.31658935546875, -302.998291015625, -277.67999267578125, -252.3616943359375, -227.04339599609375, -201.72509765625, -176.40679931640625, -151.0885009765625, -125.77021789550781, -100.45191955566406, -75.13360595703125, -49.8153076171875, -24.497013092041016, 0.8212814331054688, 26.13957977294922, 51.45787811279297, 76.77616882324219, 102.09446716308594, 127.41276550292969, 152.73106384277344, 178.0493621826172, 203.36764526367188, 228.68594360351562, 254.00424194335938, 279.3225402832031, 304.6408386230469, 329.9591369628906, 355.2774353027344, 380.5957336425781, 405.9140319824219, 431.2323303222656, 456.5506286621094, 481.868896484375, 507.18719482421875, 532.5054931640625, 557.8237915039062, 583.14208984375, 608.4603881835938, 633.7786865234375, 659.0969848632812, 684.415283203125, 709.7335815429688, 735.0518798828125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 2.0, 10.0, 9.0, 14.0, 18.0, 23.0, 26.0, 23.0, 23.0, 39.0, 52.0, 62.0, 81.0, 110.0, 130.0, 168.0, 238.0, 413.0, 1584.0, 51458464.0, 7699.0, 902.0, 325.0, 202.0, 149.0, 115.0, 95.0, 74.0, 60.0, 47.0, 29.0, 26.0, 22.0, 22.0, 14.0, 16.0, 12.0, 14.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3355.04296875, -3238.647705078125, -3122.25244140625, -3005.857177734375, -2889.4619140625, -2773.066650390625, -2656.67138671875, -2540.276123046875, -2423.880859375, -2307.485595703125, -2191.09033203125, -2074.695068359375, -1958.2998046875, -1841.904541015625, -1725.50927734375, -1609.114013671875, -1492.71875, -1376.323486328125, -1259.92822265625, -1143.532958984375, -1027.1376953125, -910.742431640625, -794.34716796875, -677.951904296875, -561.556640625, -445.161376953125, -328.76611328125, -212.370849609375, -95.9755859375, 20.419677734375, 136.81494140625, 253.210205078125, 369.605712890625, 486.0009765625, 602.396240234375, 718.79150390625, 835.186767578125, 951.58203125, 1067.977294921875, 1184.37255859375, 1300.767822265625, 1417.1630859375, 1533.558349609375, 1649.95361328125, 1766.348876953125, 1882.744140625, 1999.139404296875, 2115.53466796875, 2231.929931640625, 2348.3251953125, 2464.720458984375, 2581.11572265625, 2697.510986328125, 2813.90625, 2930.301513671875, 3046.69677734375, 3163.092041015625, 3279.4873046875, 3395.882568359375, 3512.27783203125, 3628.673095703125, 3745.068359375, 3861.463623046875, 3977.85888671875, 4094.254150390625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 13.0, 13.0, 21.0, 54.0, 67.0, 111.0, 205.0, 375.0, 647.0, 1167.0, 2128.0, 3966.0, 8101.0, 16808.0, 35378.0, 79686.0, 192082.0, 522875.0, 1990817.0, 2437926.0, 612143.0, 218663.0, 90331.0, 40360.0, 18642.0, 9076.0, 4563.0, 2370.0, 1208.0, 698.0, 373.0, 208.0, 122.0, 84.0, 54.0, 36.0, 18.0, 21.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-162.375, -157.8740234375, -153.373046875, -148.8720703125, -144.37109375, -139.8701171875, -135.369140625, -130.8681640625, -126.3671875, -121.8662109375, -117.365234375, -112.8642578125, -108.36328125, -103.8623046875, -99.361328125, -94.8603515625, -90.359375, -85.8583984375, -81.357421875, -76.8564453125, -72.35546875, -67.8544921875, -63.353515625, -58.8525390625, -54.3515625, -49.8505859375, -45.349609375, -40.8486328125, -36.34765625, -31.8466796875, -27.345703125, -22.8447265625, -18.34375, -13.8427734375, -9.341796875, -4.8408203125, -0.33984375, 4.1611328125, 8.662109375, 13.1630859375, 17.6640625, 22.1650390625, 26.666015625, 31.1669921875, 35.66796875, 40.1689453125, 44.669921875, 49.1708984375, 53.671875, 58.1728515625, 62.673828125, 67.1748046875, 71.67578125, 76.1767578125, 80.677734375, 85.1787109375, 89.6796875, 94.1806640625, 98.681640625, 103.1826171875, 107.68359375, 112.1845703125, 116.685546875, 121.1865234375, 125.6875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 2.0, 6.0, 9.0, 15.0, 13.0, 13.0, 15.0, 18.0, 18.0, 18.0, 34.0, 40.0, 39.0, 50.0, 72.0, 97.0, 120.0, 162.0, 181.0, 212.0, 161.0, 155.0, 112.0, 93.0, 60.0, 43.0, 45.0, 33.0, 30.0, 31.0, 21.0, 14.0, 8.0, 14.0, 13.0, 8.0, 6.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.3486328125, -59.259765625, -57.1708984375, -55.08203125, -52.9931640625, -50.904296875, -48.8154296875, -46.7265625, -44.6376953125, -42.548828125, -40.4599609375, -38.37109375, -36.2822265625, -34.193359375, -32.1044921875, -30.015625, -27.9267578125, -25.837890625, -23.7490234375, -21.66015625, -19.5712890625, -17.482421875, -15.3935546875, -13.3046875, -11.2158203125, -9.126953125, -7.0380859375, -4.94921875, -2.8603515625, -0.771484375, 1.3173828125, 3.40625, 5.4951171875, 7.583984375, 9.6728515625, 11.76171875, 13.8505859375, 15.939453125, 18.0283203125, 20.1171875, 22.2060546875, 24.294921875, 26.3837890625, 28.47265625, 30.5615234375, 32.650390625, 34.7392578125, 36.828125, 38.9169921875, 41.005859375, 43.0947265625, 45.18359375, 47.2724609375, 49.361328125, 51.4501953125, 53.5390625, 55.6279296875, 57.716796875, 59.8056640625, 61.89453125, 63.9833984375, 66.072265625, 68.1611328125, 70.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 18.0, 27.0, 35.0, 36.0, 74.0, 110.0, 157.0, 238.0, 369.0, 557.0, 898.0, 1498.0, 2437.0, 3794.0, 6321.0, 10177.0, 16228.0, 26613.0, 43788.0, 72166.0, 120200.0, 200852.0, 347439.0, 711819.0, 2035070.0, 1444843.0, 536120.0, 285309.0, 168284.0, 100737.0, 60792.0, 36631.0, 22215.0, 13433.0, 8353.0, 4993.0, 3238.0, 2070.0, 1222.0, 783.0, 517.0, 321.0, 214.0, 144.0, 96.0, 43.0, 35.0, 40.0, 21.0, 25.0, 8.0, 13.0, 7.0, 0.0, 1.0, 2.0, 3.0], "bins": [-54.03125, -52.33349609375, -50.6357421875, -48.93798828125, -47.240234375, -45.54248046875, -43.8447265625, -42.14697265625, -40.44921875, -38.75146484375, -37.0537109375, -35.35595703125, -33.658203125, -31.96044921875, -30.2626953125, -28.56494140625, -26.8671875, -25.16943359375, -23.4716796875, -21.77392578125, -20.076171875, -18.37841796875, -16.6806640625, -14.98291015625, -13.28515625, -11.58740234375, -9.8896484375, -8.19189453125, -6.494140625, -4.79638671875, -3.0986328125, -1.40087890625, 0.296875, 1.99462890625, 3.6923828125, 5.39013671875, 7.087890625, 8.78564453125, 10.4833984375, 12.18115234375, 13.87890625, 15.57666015625, 17.2744140625, 18.97216796875, 20.669921875, 22.36767578125, 24.0654296875, 25.76318359375, 27.4609375, 29.15869140625, 30.8564453125, 32.55419921875, 34.251953125, 35.94970703125, 37.6474609375, 39.34521484375, 41.04296875, 42.74072265625, 44.4384765625, 46.13623046875, 47.833984375, 49.53173828125, 51.2294921875, 52.92724609375, 54.625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 6.0, 9.0, 11.0, 9.0, 15.0, 17.0, 35.0, 21.0, 32.0, 39.0, 41.0, 42.0, 55.0, 82.0, 120.0, 191.0, 265.0, 291.0, 219.0, 110.0, 75.0, 52.0, 55.0, 38.0, 29.0, 26.0, 23.0, 21.0, 17.0, 8.0, 8.0, 16.0, 6.0, 8.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.375, -77.4052734375, -74.435546875, -71.4658203125, -68.49609375, -65.5263671875, -62.556640625, -59.5869140625, -56.6171875, -53.6474609375, -50.677734375, -47.7080078125, -44.73828125, -41.7685546875, -38.798828125, -35.8291015625, -32.859375, -29.8896484375, -26.919921875, -23.9501953125, -20.98046875, -18.0107421875, -15.041015625, -12.0712890625, -9.1015625, -6.1318359375, -3.162109375, -0.1923828125, 2.77734375, 5.7470703125, 8.716796875, 11.6865234375, 14.65625, 17.6259765625, 20.595703125, 23.5654296875, 26.53515625, 29.5048828125, 32.474609375, 35.4443359375, 38.4140625, 41.3837890625, 44.353515625, 47.3232421875, 50.29296875, 53.2626953125, 56.232421875, 59.2021484375, 62.171875, 65.1416015625, 68.111328125, 71.0810546875, 74.05078125, 77.0205078125, 79.990234375, 82.9599609375, 85.9296875, 88.8994140625, 91.869140625, 94.8388671875, 97.80859375, 100.7783203125, 103.748046875, 106.7177734375, 109.6875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 10.0, 8.0, 25.0, 43.0, 56.0, 93.0, 102.0, 135.0, 228.0, 310.0, 446.0, 625.0, 887.0, 1264.0, 1819.0, 2545.0, 3713.0, 5343.0, 7789.0, 11437.0, 17611.0, 27081.0, 43863.0, 75192.0, 176320.0, 5419130.0, 271450.0, 85783.0, 48318.0, 29903.0, 19478.0, 12715.0, 8397.0, 5788.0, 4074.0, 2810.0, 1894.0, 1403.0, 997.0, 707.0, 525.0, 335.0, 256.0, 175.0, 111.0, 85.0, 61.0, 44.0, 17.0, 16.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.1669921875, -93.771484375, -90.3759765625, -86.98046875, -83.5849609375, -80.189453125, -76.7939453125, -73.3984375, -70.0029296875, -66.607421875, -63.2119140625, -59.81640625, -56.4208984375, -53.025390625, -49.6298828125, -46.234375, -42.8388671875, -39.443359375, -36.0478515625, -32.65234375, -29.2568359375, -25.861328125, -22.4658203125, -19.0703125, -15.6748046875, -12.279296875, -8.8837890625, -5.48828125, -2.0927734375, 1.302734375, 4.6982421875, 8.09375, 11.4892578125, 14.884765625, 18.2802734375, 21.67578125, 25.0712890625, 28.466796875, 31.8623046875, 35.2578125, 38.6533203125, 42.048828125, 45.4443359375, 48.83984375, 52.2353515625, 55.630859375, 59.0263671875, 62.421875, 65.8173828125, 69.212890625, 72.6083984375, 76.00390625, 79.3994140625, 82.794921875, 86.1904296875, 89.5859375, 92.9814453125, 96.376953125, 99.7724609375, 103.16796875, 106.5634765625, 109.958984375, 113.3544921875, 116.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 13.0, 12.0, 12.0, 10.0, 18.0, 15.0, 19.0, 25.0, 29.0, 19.0, 40.0, 29.0, 33.0, 43.0, 52.0, 77.0, 152.0, 281.0, 404.0, 205.0, 97.0, 71.0, 36.0, 40.0, 36.0, 23.0, 31.0, 33.0, 20.0, 21.0, 14.0, 15.0, 12.0, 11.0, 14.0, 13.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.685546875, -137.99609375, -133.306640625, -128.6171875, -123.927734375, -119.23828125, -114.548828125, -109.859375, -105.169921875, -100.48046875, -95.791015625, -91.1015625, -86.412109375, -81.72265625, -77.033203125, -72.34375, -67.654296875, -62.96484375, -58.275390625, -53.5859375, -48.896484375, -44.20703125, -39.517578125, -34.828125, -30.138671875, -25.44921875, -20.759765625, -16.0703125, -11.380859375, -6.69140625, -2.001953125, 2.6875, 7.376953125, 12.06640625, 16.755859375, 21.4453125, 26.134765625, 30.82421875, 35.513671875, 40.203125, 44.892578125, 49.58203125, 54.271484375, 58.9609375, 63.650390625, 68.33984375, 73.029296875, 77.71875, 82.408203125, 87.09765625, 91.787109375, 96.4765625, 101.166015625, 105.85546875, 110.544921875, 115.234375, 119.923828125, 124.61328125, 129.302734375, 133.9921875, 138.681640625, 143.37109375, 148.060546875, 152.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 7.0, 8.0, 14.0, 18.0, 23.0, 35.0, 48.0, 50.0, 63.0, 87.0, 159.0, 121.0, 61.0, 61.0, 47.0, 34.0, 30.0, 16.0, 17.0, 19.0, 14.0, 7.0, 10.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2396.674072265625, -2304.192626953125, -2211.711181640625, -2119.229736328125, -2026.748291015625, -1934.266845703125, -1841.7852783203125, -1749.3038330078125, -1656.8223876953125, -1564.3409423828125, -1471.8594970703125, -1379.3779296875, -1286.896484375, -1194.4150390625, -1101.93359375, -1009.4521484375, -916.970703125, -824.4892578125, -732.0078125, -639.5263061523438, -547.0448608398438, -454.56341552734375, -362.0819091796875, -269.6004638671875, -177.1190185546875, -84.63755798339844, 7.843902587890625, 100.32537841796875, 192.80682373046875, 285.28826904296875, 377.769775390625, 470.251220703125, 562.732666015625, 655.214111328125, 747.695556640625, 840.1770629882812, 932.6585083007812, 1025.139892578125, 1117.6214599609375, 1210.1029052734375, 1302.5843505859375, 1395.0657958984375, 1487.5472412109375, 1580.02880859375, 1672.51025390625, 1764.99169921875, 1857.47314453125, 1949.95458984375, 2042.43603515625, 2134.91748046875, 2227.39892578125, 2319.88037109375, 2412.36181640625, 2504.84326171875, 2597.32470703125, 2689.80615234375, 2782.28759765625, 2874.76904296875, 2967.25048828125, 3059.73193359375, 3152.21337890625, 3244.69482421875, 3337.17626953125, 3429.65771484375, 3522.139404296875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 6.0, 10.0, 10.0, 14.0, 19.0, 19.0, 17.0, 22.0, 18.0, 28.0, 23.0, 32.0, 47.0, 49.0, 81.0, 105.0, 76.0, 74.0, 44.0, 25.0, 27.0, 27.0, 23.0, 21.0, 25.0, 21.0, 16.0, 16.0, 16.0, 8.0, 9.0, 10.0, 11.0, 1.0, 2.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3043.0244140625, -2941.0390625, -2839.053955078125, -2737.068603515625, -2635.08349609375, -2533.09814453125, -2431.11279296875, -2329.127685546875, -2227.142333984375, -2125.156982421875, -2023.171875, -1921.1865234375, -1819.2012939453125, -1717.216064453125, -1615.2308349609375, -1513.24560546875, -1411.2603759765625, -1309.275146484375, -1207.2899169921875, -1105.3046875, -1003.3193359375, -901.3341064453125, -799.348876953125, -697.3635864257812, -595.3783569335938, -493.3930969238281, -391.4078369140625, -289.422607421875, -187.43734741210938, -85.45208740234375, 16.53314208984375, 118.5184326171875, 220.503662109375, 322.4889221191406, 424.47418212890625, 526.4594116210938, 628.4447021484375, 730.429931640625, 832.4151611328125, 934.4004516601562, 1036.3857421875, 1138.3709716796875, 1240.356201171875, 1342.341552734375, 1444.3267822265625, 1546.31201171875, 1648.2972412109375, 1750.282470703125, 1852.2677001953125, 1954.2529296875, 2056.23828125, 2158.223388671875, 2260.208740234375, 2362.19384765625, 2464.17919921875, 2566.16455078125, 2668.149658203125, 2770.135009765625, 2872.1201171875, 2974.10546875, 3076.090576171875, 3178.075927734375, 3280.06103515625, 3382.04638671875, 3484.03173828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 27.0, 43.0, 83.0, 126.0, 208.0, 381.0, 660.0, 1029.0, 1616.0, 2868.0, 5176.0, 10051.0, 23423.0, 75797.0, 653358.0, 3228009.0, 139557.0, 32000.0, 10747.0, 4408.0, 2112.0, 1106.0, 588.0, 339.0, 187.0, 106.0, 75.0, 52.0, 36.0, 24.0, 17.0, 16.0, 3.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.328125, -28.416259765625, -27.50439453125, -26.592529296875, -25.6806640625, -24.768798828125, -23.85693359375, -22.945068359375, -22.033203125, -21.121337890625, -20.20947265625, -19.297607421875, -18.3857421875, -17.473876953125, -16.56201171875, -15.650146484375, -14.73828125, -13.826416015625, -12.91455078125, -12.002685546875, -11.0908203125, -10.178955078125, -9.26708984375, -8.355224609375, -7.443359375, -6.531494140625, -5.61962890625, -4.707763671875, -3.7958984375, -2.884033203125, -1.97216796875, -1.060302734375, -0.1484375, 0.763427734375, 1.67529296875, 2.587158203125, 3.4990234375, 4.410888671875, 5.32275390625, 6.234619140625, 7.146484375, 8.058349609375, 8.97021484375, 9.882080078125, 10.7939453125, 11.705810546875, 12.61767578125, 13.529541015625, 14.44140625, 15.353271484375, 16.26513671875, 17.177001953125, 18.0888671875, 19.000732421875, 19.91259765625, 20.824462890625, 21.736328125, 22.648193359375, 23.56005859375, 24.471923828125, 25.3837890625, 26.295654296875, 27.20751953125, 28.119384765625, 29.03125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 8.0, 4.0, 17.0, 26.0, 38.0, 54.0, 87.0, 96.0, 165.0, 142.0, 89.0, 83.0, 53.0, 33.0, 33.0, 16.0, 8.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.65155029296875, -3.5101318359375, -3.36871337890625, -3.227294921875, -3.08587646484375, -2.9444580078125, -2.80303955078125, -2.66162109375, -2.52020263671875, -2.3787841796875, -2.23736572265625, -2.095947265625, -1.95452880859375, -1.8131103515625, -1.67169189453125, -1.5302734375, -1.38885498046875, -1.2474365234375, -1.10601806640625, -0.964599609375, -0.82318115234375, -0.6817626953125, -0.54034423828125, -0.39892578125, -0.25750732421875, -0.1160888671875, 0.02532958984375, 0.166748046875, 0.30816650390625, 0.4495849609375, 0.59100341796875, 0.732421875, 0.87384033203125, 1.0152587890625, 1.15667724609375, 1.298095703125, 1.43951416015625, 1.5809326171875, 1.72235107421875, 1.86376953125, 2.00518798828125, 2.1466064453125, 2.28802490234375, 2.429443359375, 2.57086181640625, 2.7122802734375, 2.85369873046875, 2.9951171875, 3.13653564453125, 3.2779541015625, 3.41937255859375, 3.560791015625, 3.70220947265625, 3.8436279296875, 3.98504638671875, 4.12646484375, 4.26788330078125, 4.4093017578125, 4.55072021484375, 4.692138671875, 4.83355712890625, 4.9749755859375, 5.11639404296875, 5.2578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 1.0, 5.0, 14.0, 12.0, 24.0, 21.0, 28.0, 51.0, 77.0, 90.0, 163.0, 209.0, 353.0, 582.0, 911.0, 1568.0, 2694.0, 4944.0, 9157.0, 17976.0, 38070.0, 86314.0, 228095.0, 856772.0, 2265271.0, 432912.0, 139687.0, 56128.0, 25477.0, 12288.0, 6340.0, 3415.0, 1812.0, 1095.0, 646.0, 373.0, 263.0, 153.0, 92.0, 65.0, 46.0, 30.0, 17.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5234375, -15.0269775390625, -14.530517578125, -14.0340576171875, -13.53759765625, -13.0411376953125, -12.544677734375, -12.0482177734375, -11.5517578125, -11.0552978515625, -10.558837890625, -10.0623779296875, -9.56591796875, -9.0694580078125, -8.572998046875, -8.0765380859375, -7.580078125, -7.0836181640625, -6.587158203125, -6.0906982421875, -5.59423828125, -5.0977783203125, -4.601318359375, -4.1048583984375, -3.6083984375, -3.1119384765625, -2.615478515625, -2.1190185546875, -1.62255859375, -1.1260986328125, -0.629638671875, -0.1331787109375, 0.36328125, 0.8597412109375, 1.356201171875, 1.8526611328125, 2.34912109375, 2.8455810546875, 3.342041015625, 3.8385009765625, 4.3349609375, 4.8314208984375, 5.327880859375, 5.8243408203125, 6.32080078125, 6.8172607421875, 7.313720703125, 7.8101806640625, 8.306640625, 8.8031005859375, 9.299560546875, 9.7960205078125, 10.29248046875, 10.7889404296875, 11.285400390625, 11.7818603515625, 12.2783203125, 12.7747802734375, 13.271240234375, 13.7677001953125, 14.26416015625, 14.7606201171875, 15.257080078125, 15.7535400390625, 16.25]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 6.0, 12.0, 16.0, 18.0, 25.0, 32.0, 42.0, 45.0, 62.0, 81.0, 99.0, 127.0, 152.0, 219.0, 298.0, 518.0, 844.0, 430.0, 254.0, 199.0, 141.0, 105.0, 70.0, 58.0, 51.0, 44.0, 26.0, 19.0, 13.0, 18.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.5306396484375, -7.322998046875, -7.1153564453125, -6.90771484375, -6.7000732421875, -6.492431640625, -6.2847900390625, -6.0771484375, -5.8695068359375, -5.661865234375, -5.4542236328125, -5.24658203125, -5.0389404296875, -4.831298828125, -4.6236572265625, -4.416015625, -4.2083740234375, -4.000732421875, -3.7930908203125, -3.58544921875, -3.3778076171875, -3.170166015625, -2.9625244140625, -2.7548828125, -2.5472412109375, -2.339599609375, -2.1319580078125, -1.92431640625, -1.7166748046875, -1.509033203125, -1.3013916015625, -1.09375, -0.8861083984375, -0.678466796875, -0.4708251953125, -0.26318359375, -0.0555419921875, 0.152099609375, 0.3597412109375, 0.5673828125, 0.7750244140625, 0.982666015625, 1.1903076171875, 1.39794921875, 1.6055908203125, 1.813232421875, 2.0208740234375, 2.228515625, 2.4361572265625, 2.643798828125, 2.8514404296875, 3.05908203125, 3.2667236328125, 3.474365234375, 3.6820068359375, 3.8896484375, 4.0972900390625, 4.304931640625, 4.5125732421875, 4.72021484375, 4.9278564453125, 5.135498046875, 5.3431396484375, 5.55078125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 13.0, 24.0, 28.0, 50.0, 67.0, 61.0, 93.0, 92.0, 99.0, 111.0, 81.0, 66.0, 45.0, 50.0, 22.0, 15.0, 10.0, 13.0, 4.0, 4.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.39988708496094, -46.92252731323242, -45.445167541503906, -43.96780776977539, -42.490447998046875, -41.01308822631836, -39.535728454589844, -38.05836868286133, -36.58100891113281, -35.1036491394043, -33.62628936767578, -32.148929595947266, -30.67156982421875, -29.194210052490234, -27.71685028076172, -26.239490509033203, -24.762128829956055, -23.28476905822754, -21.807409286499023, -20.330049514770508, -18.852689743041992, -17.375329971313477, -15.897969245910645, -14.420609474182129, -12.943249702453613, -11.465889930725098, -9.988530158996582, -8.51116943359375, -7.033810138702393, -5.556450366973877, -4.079090118408203, -2.6017303466796875, -1.1243705749511719, 0.3529893159866333, 1.8303492069244385, 3.307709217071533, 4.785068988800049, 6.2624287605285645, 7.739789009094238, 9.217148780822754, 10.69450855255127, 12.171868324279785, 13.6492280960083, 15.126588821411133, 16.60394859313965, 18.081308364868164, 19.55866813659668, 21.036027908325195, 22.51338768005371, 23.990747451782227, 25.468107223510742, 26.945466995239258, 28.422826766967773, 29.90018653869629, 31.377548217773438, 32.85490798950195, 34.33226776123047, 35.809627532958984, 37.2869873046875, 38.764347076416016, 40.24170684814453, 41.71906661987305, 43.19642639160156, 44.67378616333008, 46.151145935058594]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 10.0, 15.0, 13.0, 18.0, 18.0, 15.0, 22.0, 23.0, 23.0, 34.0, 31.0, 37.0, 31.0, 39.0, 45.0, 41.0, 33.0, 45.0, 35.0, 38.0, 39.0, 43.0, 42.0, 35.0, 27.0, 32.0, 26.0, 22.0, 23.0, 15.0, 16.0, 16.0, 15.0, 15.0, 10.0, 9.0, 2.0, 4.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.855472564697266, -27.86359405517578, -26.871715545654297, -25.879837036132812, -24.887958526611328, -23.896080017089844, -22.90420150756836, -21.912322998046875, -20.92044448852539, -19.928565979003906, -18.936687469482422, -17.944808959960938, -16.952930450439453, -15.961051940917969, -14.969173431396484, -13.977294921875, -12.985416412353516, -11.993537902832031, -11.001659393310547, -10.009780883789062, -9.017902374267578, -8.026023864746094, -7.034145355224609, -6.042266845703125, -5.050388336181641, -4.058509826660156, -3.066631317138672, -2.0747528076171875, -1.0828742980957031, -0.09099578857421875, 0.9008827209472656, 1.89276123046875, 2.8846397399902344, 3.8765182495117188, 4.868396759033203, 5.8602752685546875, 6.852153778076172, 7.844032287597656, 8.83591079711914, 9.827789306640625, 10.81966781616211, 11.811546325683594, 12.803424835205078, 13.795303344726562, 14.787181854248047, 15.779060363769531, 16.770938873291016, 17.7628173828125, 18.754695892333984, 19.74657440185547, 20.738452911376953, 21.730331420898438, 22.722209930419922, 23.714088439941406, 24.70596694946289, 25.697845458984375, 26.68972396850586, 27.681602478027344, 28.673480987548828, 29.665359497070312, 30.657238006591797, 31.64911651611328, 32.640995025634766, 33.63287353515625, 34.624752044677734]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 23.0, 26.0, 38.0, 72.0, 70.0, 120.0, 164.0, 244.0, 365.0, 534.0, 786.0, 1239.0, 2012.0, 3753.0, 7744.0, 19971.0, 69384.0, 464456.0, 380759.0, 61780.0, 18404.0, 7274.0, 3768.0, 2028.0, 1201.0, 794.0, 520.0, 308.0, 228.0, 141.0, 95.0, 72.0, 36.0, 23.0, 26.0, 7.0, 8.0, 14.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.6171875, -14.1124267578125, -13.607666015625, -13.1029052734375, -12.59814453125, -12.0933837890625, -11.588623046875, -11.0838623046875, -10.5791015625, -10.0743408203125, -9.569580078125, -9.0648193359375, -8.56005859375, -8.0552978515625, -7.550537109375, -7.0457763671875, -6.541015625, -6.0362548828125, -5.531494140625, -5.0267333984375, -4.52197265625, -4.0172119140625, -3.512451171875, -3.0076904296875, -2.5029296875, -1.9981689453125, -1.493408203125, -0.9886474609375, -0.48388671875, 0.0208740234375, 0.525634765625, 1.0303955078125, 1.53515625, 2.0399169921875, 2.544677734375, 3.0494384765625, 3.55419921875, 4.0589599609375, 4.563720703125, 5.0684814453125, 5.5732421875, 6.0780029296875, 6.582763671875, 7.0875244140625, 7.59228515625, 8.0970458984375, 8.601806640625, 9.1065673828125, 9.611328125, 10.1160888671875, 10.620849609375, 11.1256103515625, 11.63037109375, 12.1351318359375, 12.639892578125, 13.1446533203125, 13.6494140625, 14.1541748046875, 14.658935546875, 15.1636962890625, 15.66845703125, 16.1732177734375, 16.677978515625, 17.1827392578125, 17.6875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 5.0, 12.0, 23.0, 43.0, 72.0, 93.0, 117.0, 128.0, 131.0, 124.0, 66.0, 55.0, 37.0, 27.0, 17.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23828125, -4.073486328125, -3.90869140625, -3.743896484375, -3.5791015625, -3.414306640625, -3.24951171875, -3.084716796875, -2.919921875, -2.755126953125, -2.59033203125, -2.425537109375, -2.2607421875, -2.095947265625, -1.93115234375, -1.766357421875, -1.6015625, -1.436767578125, -1.27197265625, -1.107177734375, -0.9423828125, -0.777587890625, -0.61279296875, -0.447998046875, -0.283203125, -0.118408203125, 0.04638671875, 0.211181640625, 0.3759765625, 0.540771484375, 0.70556640625, 0.870361328125, 1.03515625, 1.199951171875, 1.36474609375, 1.529541015625, 1.6943359375, 1.859130859375, 2.02392578125, 2.188720703125, 2.353515625, 2.518310546875, 2.68310546875, 2.847900390625, 3.0126953125, 3.177490234375, 3.34228515625, 3.507080078125, 3.671875, 3.836669921875, 4.00146484375, 4.166259765625, 4.3310546875, 4.495849609375, 4.66064453125, 4.825439453125, 4.990234375, 5.155029296875, 5.31982421875, 5.484619140625, 5.6494140625, 5.814208984375, 5.97900390625, 6.143798828125, 6.30859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 8.0, 6.0, 7.0, 8.0, 24.0, 38.0, 69.0, 73.0, 131.0, 176.0, 299.0, 517.0, 799.0, 1344.0, 2374.0, 4005.0, 6966.0, 13019.0, 25641.0, 54330.0, 136180.0, 445886.0, 210882.0, 74490.0, 33743.0, 16673.0, 8854.0, 4968.0, 2784.0, 1644.0, 968.0, 606.0, 372.0, 225.0, 146.0, 98.0, 62.0, 47.0, 24.0, 21.0, 11.0, 8.0, 6.0, 10.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1796875, -12.7884521484375, -12.397216796875, -12.0059814453125, -11.61474609375, -11.2235107421875, -10.832275390625, -10.4410400390625, -10.0498046875, -9.6585693359375, -9.267333984375, -8.8760986328125, -8.48486328125, -8.0936279296875, -7.702392578125, -7.3111572265625, -6.919921875, -6.5286865234375, -6.137451171875, -5.7462158203125, -5.35498046875, -4.9637451171875, -4.572509765625, -4.1812744140625, -3.7900390625, -3.3988037109375, -3.007568359375, -2.6163330078125, -2.22509765625, -1.8338623046875, -1.442626953125, -1.0513916015625, -0.66015625, -0.2689208984375, 0.122314453125, 0.5135498046875, 0.90478515625, 1.2960205078125, 1.687255859375, 2.0784912109375, 2.4697265625, 2.8609619140625, 3.252197265625, 3.6434326171875, 4.03466796875, 4.4259033203125, 4.817138671875, 5.2083740234375, 5.599609375, 5.9908447265625, 6.382080078125, 6.7733154296875, 7.16455078125, 7.5557861328125, 7.947021484375, 8.3382568359375, 8.7294921875, 9.1207275390625, 9.511962890625, 9.9031982421875, 10.29443359375, 10.6856689453125, 11.076904296875, 11.4681396484375, 11.859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 8.0, 13.0, 12.0, 15.0, 14.0, 16.0, 19.0, 24.0, 19.0, 27.0, 32.0, 26.0, 46.0, 27.0, 44.0, 32.0, 42.0, 40.0, 46.0, 42.0, 48.0, 39.0, 34.0, 36.0, 36.0, 34.0, 41.0, 36.0, 20.0, 25.0, 17.0, 14.0, 13.0, 4.0, 10.0, 11.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3984375, -12.9661865234375, -12.533935546875, -12.1016845703125, -11.66943359375, -11.2371826171875, -10.804931640625, -10.3726806640625, -9.9404296875, -9.5081787109375, -9.075927734375, -8.6436767578125, -8.21142578125, -7.7791748046875, -7.346923828125, -6.9146728515625, -6.482421875, -6.0501708984375, -5.617919921875, -5.1856689453125, -4.75341796875, -4.3211669921875, -3.888916015625, -3.4566650390625, -3.0244140625, -2.5921630859375, -2.159912109375, -1.7276611328125, -1.29541015625, -0.8631591796875, -0.430908203125, 0.0013427734375, 0.43359375, 0.8658447265625, 1.298095703125, 1.7303466796875, 2.16259765625, 2.5948486328125, 3.027099609375, 3.4593505859375, 3.8916015625, 4.3238525390625, 4.756103515625, 5.1883544921875, 5.62060546875, 6.0528564453125, 6.485107421875, 6.9173583984375, 7.349609375, 7.7818603515625, 8.214111328125, 8.6463623046875, 9.07861328125, 9.5108642578125, 9.943115234375, 10.3753662109375, 10.8076171875, 11.2398681640625, 11.672119140625, 12.1043701171875, 12.53662109375, 12.9688720703125, 13.401123046875, 13.8333740234375, 14.265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 11.0, 6.0, 18.0, 12.0, 14.0, 34.0, 35.0, 49.0, 81.0, 98.0, 166.0, 302.0, 476.0, 910.0, 1868.0, 4352.0, 10999.0, 34189.0, 160408.0, 599087.0, 177771.0, 37176.0, 11586.0, 4599.0, 1991.0, 975.0, 516.0, 277.0, 182.0, 97.0, 49.0, 54.0, 27.0, 33.0, 20.0, 15.0, 19.0, 10.0, 10.0, 3.0, 6.0, 1.0, 3.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-11.28125, -10.9344482421875, -10.587646484375, -10.2408447265625, -9.89404296875, -9.5472412109375, -9.200439453125, -8.8536376953125, -8.5068359375, -8.1600341796875, -7.813232421875, -7.4664306640625, -7.11962890625, -6.7728271484375, -6.426025390625, -6.0792236328125, -5.732421875, -5.3856201171875, -5.038818359375, -4.6920166015625, -4.34521484375, -3.9984130859375, -3.651611328125, -3.3048095703125, -2.9580078125, -2.6112060546875, -2.264404296875, -1.9176025390625, -1.57080078125, -1.2239990234375, -0.877197265625, -0.5303955078125, -0.18359375, 0.1632080078125, 0.510009765625, 0.8568115234375, 1.20361328125, 1.5504150390625, 1.897216796875, 2.2440185546875, 2.5908203125, 2.9376220703125, 3.284423828125, 3.6312255859375, 3.97802734375, 4.3248291015625, 4.671630859375, 5.0184326171875, 5.365234375, 5.7120361328125, 6.058837890625, 6.4056396484375, 6.75244140625, 7.0992431640625, 7.446044921875, 7.7928466796875, 8.1396484375, 8.4864501953125, 8.833251953125, 9.1800537109375, 9.52685546875, 9.8736572265625, 10.220458984375, 10.5672607421875, 10.9140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 14.0, 25.0, 34.0, 37.0, 60.0, 102.0, 92.0, 95.0, 84.0, 81.0, 81.0, 58.0, 51.0, 25.0, 25.0, 14.0, 13.0, 14.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007904917001724243, -0.0007598698139190674, -0.0007292479276657104, -0.0006986260414123535, -0.0006680041551589966, -0.0006373822689056396, -0.0006067603826522827, -0.0005761384963989258, -0.0005455166101455688, -0.0005148947238922119, -0.000484272837638855, -0.00045365095138549805, -0.0004230290651321411, -0.0003924071788787842, -0.00036178529262542725, -0.0003311634063720703, -0.0003005415201187134, -0.00026991963386535645, -0.0002392977476119995, -0.00020867586135864258, -0.00017805397510528564, -0.0001474320888519287, -0.00011681020259857178, -8.618831634521484e-05, -5.556643009185791e-05, -2.4944543838500977e-05, 5.677342414855957e-06, 3.629922866821289e-05, 6.692111492156982e-05, 9.754300117492676e-05, 0.0001281648874282837, 0.00015878677368164062, 0.00018940865993499756, 0.0002200305461883545, 0.0002506524324417114, 0.00028127431869506836, 0.0003118962049484253, 0.0003425180912017822, 0.00037313997745513916, 0.0004037618637084961, 0.00043438374996185303, 0.00046500563621520996, 0.0004956275224685669, 0.0005262494087219238, 0.0005568712949752808, 0.0005874931812286377, 0.0006181150674819946, 0.0006487369537353516, 0.0006793588399887085, 0.0007099807262420654, 0.0007406026124954224, 0.0007712244987487793, 0.0008018463850021362, 0.0008324682712554932, 0.0008630901575088501, 0.000893712043762207, 0.000924333930015564, 0.0009549558162689209, 0.0009855777025222778, 0.0010161995887756348, 0.0010468214750289917, 0.0010774433612823486, 0.0011080652475357056, 0.0011386871337890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 5.0, 9.0, 12.0, 29.0, 40.0, 52.0, 83.0, 114.0, 207.0, 317.0, 475.0, 715.0, 1187.0, 2171.0, 4111.0, 8467.0, 18944.0, 47906.0, 145887.0, 435294.0, 253623.0, 76643.0, 27942.0, 11700.0, 5567.0, 2862.0, 1634.0, 940.0, 548.0, 372.0, 223.0, 128.0, 92.0, 80.0, 48.0, 44.0, 28.0, 9.0, 13.0, 6.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7713623046875, -6.527099609375, -6.2828369140625, -6.03857421875, -5.7943115234375, -5.550048828125, -5.3057861328125, -5.0615234375, -4.8172607421875, -4.572998046875, -4.3287353515625, -4.08447265625, -3.8402099609375, -3.595947265625, -3.3516845703125, -3.107421875, -2.8631591796875, -2.618896484375, -2.3746337890625, -2.13037109375, -1.8861083984375, -1.641845703125, -1.3975830078125, -1.1533203125, -0.9090576171875, -0.664794921875, -0.4205322265625, -0.17626953125, 0.0679931640625, 0.312255859375, 0.5565185546875, 0.80078125, 1.0450439453125, 1.289306640625, 1.5335693359375, 1.77783203125, 2.0220947265625, 2.266357421875, 2.5106201171875, 2.7548828125, 2.9991455078125, 3.243408203125, 3.4876708984375, 3.73193359375, 3.9761962890625, 4.220458984375, 4.4647216796875, 4.708984375, 4.9532470703125, 5.197509765625, 5.4417724609375, 5.68603515625, 5.9302978515625, 6.174560546875, 6.4188232421875, 6.6630859375, 6.9073486328125, 7.151611328125, 7.3958740234375, 7.64013671875, 7.8843994140625, 8.128662109375, 8.3729248046875, 8.6171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 13.0, 12.0, 23.0, 15.0, 21.0, 28.0, 30.0, 38.0, 47.0, 45.0, 51.0, 54.0, 62.0, 66.0, 72.0, 59.0, 69.0, 39.0, 49.0, 33.0, 30.0, 21.0, 20.0, 14.0, 14.0, 15.0, 8.0, 8.0, 7.0, 7.0, 2.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.43865966796875, -5.2640380859375, -5.08941650390625, -4.914794921875, -4.74017333984375, -4.5655517578125, -4.39093017578125, -4.21630859375, -4.04168701171875, -3.8670654296875, -3.69244384765625, -3.517822265625, -3.34320068359375, -3.1685791015625, -2.99395751953125, -2.8193359375, -2.64471435546875, -2.4700927734375, -2.29547119140625, -2.120849609375, -1.94622802734375, -1.7716064453125, -1.59698486328125, -1.42236328125, -1.24774169921875, -1.0731201171875, -0.89849853515625, -0.723876953125, -0.54925537109375, -0.3746337890625, -0.20001220703125, -0.025390625, 0.14923095703125, 0.3238525390625, 0.49847412109375, 0.673095703125, 0.84771728515625, 1.0223388671875, 1.19696044921875, 1.37158203125, 1.54620361328125, 1.7208251953125, 1.89544677734375, 2.070068359375, 2.24468994140625, 2.4193115234375, 2.59393310546875, 2.7685546875, 2.94317626953125, 3.1177978515625, 3.29241943359375, 3.467041015625, 3.64166259765625, 3.8162841796875, 3.99090576171875, 4.16552734375, 4.34014892578125, 4.5147705078125, 4.68939208984375, 4.864013671875, 5.03863525390625, 5.2132568359375, 5.38787841796875, 5.5625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 14.0, 33.0, 45.0, 99.0, 250.0, 296.0, 111.0, 68.0, 34.0, 16.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2933654785156, -251.33868408203125, -244.3839874267578, -237.42930603027344, -230.47462463378906, -223.51992797851562, -216.56524658203125, -209.61056518554688, -202.6558837890625, -195.70120239257812, -188.7465057373047, -181.7918243408203, -174.83714294433594, -167.8824462890625, -160.92776489257812, -153.97308349609375, -147.0183868408203, -140.06370544433594, -133.1090087890625, -126.15432739257812, -119.19964599609375, -112.24495697021484, -105.29026794433594, -98.33558654785156, -91.38089752197266, -84.42620849609375, -77.47152709960938, -70.51683807373047, -63.56215286254883, -56.60746765136719, -49.65277862548828, -42.69809341430664, -35.743408203125, -28.78872299194336, -21.834035873413086, -14.879348754882812, -7.924663543701172, -0.9699783325195312, 5.984710693359375, 12.939395904541016, 19.894081115722656, 26.848766326904297, 33.80345153808594, 40.758140563964844, 47.712825775146484, 54.667510986328125, 61.62220001220703, 68.57688903808594, 75.53157043457031, 82.48625946044922, 89.4409408569336, 96.3956298828125, 103.35031127929688, 110.30500030517578, 117.25968933105469, 124.21437072753906, 131.1690673828125, 138.12374877929688, 145.0784454345703, 152.0331268310547, 158.98780822753906, 165.9425048828125, 172.89718627929688, 179.85186767578125, 186.80654907226562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 11.0, 13.0, 7.0, 16.0, 23.0, 47.0, 88.0, 141.0, 179.0, 149.0, 118.0, 74.0, 36.0, 26.0, 12.0, 10.0, 7.0, 7.0, 1.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-230.62716674804688, -221.70372009277344, -212.78025817871094, -203.8568115234375, -194.933349609375, -186.00990295410156, -177.08645629882812, -168.16299438476562, -159.2395477294922, -150.31610107421875, -141.39263916015625, -132.4691925048828, -123.54573822021484, -114.62228393554688, -105.69883728027344, -96.77538299560547, -87.8519287109375, -78.92847442626953, -70.00502014160156, -61.081573486328125, -52.158119201660156, -43.23466491699219, -34.311214447021484, -25.38776397705078, -16.464309692382812, -7.540857315063477, 1.3825950622558594, 10.306047439575195, 19.22949981689453, 28.1529541015625, 37.0764045715332, 45.999855041503906, 54.92333984375, 63.84679412841797, 72.77024841308594, 81.69369506835938, 90.61714935302734, 99.54060363769531, 108.46405029296875, 117.38750457763672, 126.31095886230469, 135.23440551757812, 144.15786743164062, 153.08131408691406, 162.0047607421875, 170.92822265625, 179.85166931152344, 188.77511596679688, 197.69857788085938, 206.6220245361328, 215.5454864501953, 224.46893310546875, 233.39239501953125, 242.3158416748047, 251.23928833007812, 260.1627502441406, 269.086181640625, 278.0096435546875, 286.9330749511719, 295.8565368652344, 304.7799987792969, 313.70343017578125, 322.62689208984375, 331.55035400390625, 340.47381591796875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 6.0, 11.0, 18.0, 19.0, 49.0, 86.0, 174.0, 322.0, 701.0, 1379.0, 3540.0, 10439.0, 52685.0, 3781214.0, 307449.0, 26344.0, 6054.0, 2035.0, 799.0, 420.0, 209.0, 135.0, 68.0, 39.0, 26.0, 17.0, 9.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -62.140625, -59.90625, -57.671875, -55.4375, -53.203125, -50.96875, -48.734375, -46.5, -44.265625, -42.03125, -39.796875, -37.5625, -35.328125, -33.09375, -30.859375, -28.625, -26.390625, -24.15625, -21.921875, -19.6875, -17.453125, -15.21875, -12.984375, -10.75, -8.515625, -6.28125, -4.046875, -1.8125, 0.421875, 2.65625, 4.890625, 7.125, 9.359375, 11.59375, 13.828125, 16.0625, 18.296875, 20.53125, 22.765625, 25.0, 27.234375, 29.46875, 31.703125, 33.9375, 36.171875, 38.40625, 40.640625, 42.875, 45.109375, 47.34375, 49.578125, 51.8125, 54.046875, 56.28125, 58.515625, 60.75, 62.984375, 65.21875, 67.453125, 69.6875, 71.921875, 74.15625, 76.390625, 78.625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 12.0, 9.0, 7.0, 11.0, 17.0, 26.0, 37.0, 59.0, 65.0, 87.0, 94.0, 105.0, 120.0, 85.0, 66.0, 44.0, 44.0, 29.0, 20.0, 21.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0390625, -2.90386962890625, -2.7686767578125, -2.63348388671875, -2.498291015625, -2.36309814453125, -2.2279052734375, -2.09271240234375, -1.95751953125, -1.82232666015625, -1.6871337890625, -1.55194091796875, -1.416748046875, -1.28155517578125, -1.1463623046875, -1.01116943359375, -0.8759765625, -0.74078369140625, -0.6055908203125, -0.47039794921875, -0.335205078125, -0.20001220703125, -0.0648193359375, 0.07037353515625, 0.20556640625, 0.34075927734375, 0.4759521484375, 0.61114501953125, 0.746337890625, 0.88153076171875, 1.0167236328125, 1.15191650390625, 1.287109375, 1.42230224609375, 1.5574951171875, 1.69268798828125, 1.827880859375, 1.96307373046875, 2.0982666015625, 2.23345947265625, 2.36865234375, 2.50384521484375, 2.6390380859375, 2.77423095703125, 2.909423828125, 3.04461669921875, 3.1798095703125, 3.31500244140625, 3.4501953125, 3.58538818359375, 3.7205810546875, 3.85577392578125, 3.990966796875, 4.12615966796875, 4.2613525390625, 4.39654541015625, 4.53173828125, 4.66693115234375, 4.8021240234375, 4.93731689453125, 5.072509765625, 5.20770263671875, 5.3428955078125, 5.47808837890625, 5.61328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 16.0, 16.0, 25.0, 32.0, 50.0, 71.0, 93.0, 154.0, 246.0, 367.0, 639.0, 1029.0, 1862.0, 3334.0, 6262.0, 12954.0, 29057.0, 78145.0, 317399.0, 3295717.0, 315678.0, 76740.0, 28324.0, 12508.0, 6061.0, 3207.0, 1726.0, 942.0, 548.0, 376.0, 220.0, 134.0, 93.0, 80.0, 52.0, 33.0, 25.0, 18.0, 9.0, 11.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.0625, -31.075927734375, -30.08935546875, -29.102783203125, -28.1162109375, -27.129638671875, -26.14306640625, -25.156494140625, -24.169921875, -23.183349609375, -22.19677734375, -21.210205078125, -20.2236328125, -19.237060546875, -18.25048828125, -17.263916015625, -16.27734375, -15.290771484375, -14.30419921875, -13.317626953125, -12.3310546875, -11.344482421875, -10.35791015625, -9.371337890625, -8.384765625, -7.398193359375, -6.41162109375, -5.425048828125, -4.4384765625, -3.451904296875, -2.46533203125, -1.478759765625, -0.4921875, 0.494384765625, 1.48095703125, 2.467529296875, 3.4541015625, 4.440673828125, 5.42724609375, 6.413818359375, 7.400390625, 8.386962890625, 9.37353515625, 10.360107421875, 11.3466796875, 12.333251953125, 13.31982421875, 14.306396484375, 15.29296875, 16.279541015625, 17.26611328125, 18.252685546875, 19.2392578125, 20.225830078125, 21.21240234375, 22.198974609375, 23.185546875, 24.172119140625, 25.15869140625, 26.145263671875, 27.1318359375, 28.118408203125, 29.10498046875, 30.091552734375, 31.078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 5.0, 12.0, 16.0, 9.0, 18.0, 20.0, 23.0, 34.0, 50.0, 55.0, 83.0, 147.0, 254.0, 460.0, 2035.0, 326.0, 162.0, 101.0, 59.0, 65.0, 42.0, 18.0, 19.0, 9.0, 11.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.78717041015625, -4.5977783203125, -4.40838623046875, -4.218994140625, -4.02960205078125, -3.8402099609375, -3.65081787109375, -3.46142578125, -3.27203369140625, -3.0826416015625, -2.89324951171875, -2.703857421875, -2.51446533203125, -2.3250732421875, -2.13568115234375, -1.9462890625, -1.75689697265625, -1.5675048828125, -1.37811279296875, -1.188720703125, -0.99932861328125, -0.8099365234375, -0.62054443359375, -0.43115234375, -0.24176025390625, -0.0523681640625, 0.13702392578125, 0.326416015625, 0.51580810546875, 0.7052001953125, 0.89459228515625, 1.083984375, 1.27337646484375, 1.4627685546875, 1.65216064453125, 1.841552734375, 2.03094482421875, 2.2203369140625, 2.40972900390625, 2.59912109375, 2.78851318359375, 2.9779052734375, 3.16729736328125, 3.356689453125, 3.54608154296875, 3.7354736328125, 3.92486572265625, 4.1142578125, 4.30364990234375, 4.4930419921875, 4.68243408203125, 4.871826171875, 5.06121826171875, 5.2506103515625, 5.44000244140625, 5.62939453125, 5.81878662109375, 6.0081787109375, 6.19757080078125, 6.386962890625, 6.57635498046875, 6.7657470703125, 6.95513916015625, 7.14453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 11.0, 3.0, 8.0, 17.0, 10.0, 28.0, 63.0, 63.0, 130.0, 172.0, 161.0, 134.0, 64.0, 64.0, 25.0, 17.0, 11.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.96562194824219, -61.54591751098633, -60.1262092590332, -58.706504821777344, -57.28679656982422, -55.86709213256836, -54.4473876953125, -53.027679443359375, -51.607975006103516, -50.188270568847656, -48.76856231689453, -47.34885787963867, -45.92915344238281, -44.50944519042969, -43.08974075317383, -41.67003631591797, -40.250328063964844, -38.830623626708984, -37.41091537475586, -35.9912109375, -34.571502685546875, -33.151798248291016, -31.732093811035156, -30.312387466430664, -28.892681121826172, -27.47297477722168, -26.053268432617188, -24.633563995361328, -23.213857650756836, -21.794151306152344, -20.374446868896484, -18.954740524291992, -17.5350341796875, -16.115327835083008, -14.695622444152832, -13.275917053222656, -11.856210708618164, -10.436504364013672, -9.016798973083496, -7.59709358215332, -6.177387237548828, -4.757681369781494, -3.33797550201416, -1.9182696342468262, -0.4985637664794922, 0.9211421012878418, 2.340847969055176, 3.7605533599853516, 5.180259704589844, 6.599965572357178, 8.019671440124512, 9.439376831054688, 10.85908317565918, 12.278789520263672, 13.698494911193848, 15.118200302124023, 16.537906646728516, 17.957612991333008, 19.3773193359375, 20.79702377319336, 22.21673011779785, 23.636436462402344, 25.056140899658203, 26.475847244262695, 27.895553588867188]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 8.0, 15.0, 14.0, 20.0, 25.0, 31.0, 37.0, 42.0, 57.0, 51.0, 57.0, 70.0, 60.0, 55.0, 63.0, 52.0, 40.0, 61.0, 44.0, 40.0, 34.0, 16.0, 19.0, 14.0, 10.0, 14.0, 6.0, 3.0, 7.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.37102699279785, -28.486143112182617, -27.601259231567383, -26.71637535095215, -25.83148956298828, -24.946605682373047, -24.061721801757812, -23.176837921142578, -22.291954040527344, -21.40707015991211, -20.522186279296875, -19.63730239868164, -18.752418518066406, -17.867534637451172, -16.982648849487305, -16.09776496887207, -15.212881088256836, -14.327997207641602, -13.443113327026367, -12.558228492736816, -11.673344612121582, -10.788460731506348, -9.903575897216797, -9.018692016601562, -8.133808135986328, -7.248924255371094, -6.364039897918701, -5.479155540466309, -4.594271659851074, -3.70938777923584, -2.8245034217834473, -1.9396190643310547, -1.0547332763671875, -0.16984915733337402, 0.7150349617004395, 1.599919080734253, 2.4848031997680664, 3.369687080383301, 4.254571437835693, 5.139455795288086, 6.02433967590332, 6.909223556518555, 7.794107913970947, 8.67899227142334, 9.563876152038574, 10.448760032653809, 11.33364486694336, 12.218528747558594, 13.103412628173828, 13.988296508789062, 14.873180389404297, 15.758065223693848, 16.642948150634766, 17.52783203125, 18.412717819213867, 19.2976016998291, 20.182485580444336, 21.06736946105957, 21.952253341674805, 22.83713722229004, 23.722023010253906, 24.60690689086914, 25.491790771484375, 26.37667465209961, 27.261558532714844]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 6.0, 15.0, 31.0, 25.0, 60.0, 85.0, 136.0, 261.0, 494.0, 1091.0, 2517.0, 5991.0, 19358.0, 84212.0, 499382.0, 350720.0, 60493.0, 14823.0, 4825.0, 2057.0, 887.0, 463.0, 229.0, 113.0, 82.0, 56.0, 35.0, 30.0, 27.0, 10.0, 9.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.8232421875, -41.521484375, -40.2197265625, -38.91796875, -37.6162109375, -36.314453125, -35.0126953125, -33.7109375, -32.4091796875, -31.107421875, -29.8056640625, -28.50390625, -27.2021484375, -25.900390625, -24.5986328125, -23.296875, -21.9951171875, -20.693359375, -19.3916015625, -18.08984375, -16.7880859375, -15.486328125, -14.1845703125, -12.8828125, -11.5810546875, -10.279296875, -8.9775390625, -7.67578125, -6.3740234375, -5.072265625, -3.7705078125, -2.46875, -1.1669921875, 0.134765625, 1.4365234375, 2.73828125, 4.0400390625, 5.341796875, 6.6435546875, 7.9453125, 9.2470703125, 10.548828125, 11.8505859375, 13.15234375, 14.4541015625, 15.755859375, 17.0576171875, 18.359375, 19.6611328125, 20.962890625, 22.2646484375, 23.56640625, 24.8681640625, 26.169921875, 27.4716796875, 28.7734375, 30.0751953125, 31.376953125, 32.6787109375, 33.98046875, 35.2822265625, 36.583984375, 37.8857421875, 39.1875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 1.0, 2.0, 4.0, 10.0, 11.0, 19.0, 36.0, 45.0, 59.0, 79.0, 79.0, 75.0, 106.0, 102.0, 94.0, 61.0, 62.0, 51.0, 44.0, 10.0, 19.0, 7.0, 8.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.13232421875, -2.9873046875, -2.84228515625, -2.697265625, -2.55224609375, -2.4072265625, -2.26220703125, -2.1171875, -1.97216796875, -1.8271484375, -1.68212890625, -1.537109375, -1.39208984375, -1.2470703125, -1.10205078125, -0.95703125, -0.81201171875, -0.6669921875, -0.52197265625, -0.376953125, -0.23193359375, -0.0869140625, 0.05810546875, 0.203125, 0.34814453125, 0.4931640625, 0.63818359375, 0.783203125, 0.92822265625, 1.0732421875, 1.21826171875, 1.36328125, 1.50830078125, 1.6533203125, 1.79833984375, 1.943359375, 2.08837890625, 2.2333984375, 2.37841796875, 2.5234375, 2.66845703125, 2.8134765625, 2.95849609375, 3.103515625, 3.24853515625, 3.3935546875, 3.53857421875, 3.68359375, 3.82861328125, 3.9736328125, 4.11865234375, 4.263671875, 4.40869140625, 4.5537109375, 4.69873046875, 4.84375, 4.98876953125, 5.1337890625, 5.27880859375, 5.423828125, 5.56884765625, 5.7138671875, 5.85888671875, 6.00390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 18.0, 32.0, 34.0, 53.0, 79.0, 131.0, 216.0, 355.0, 672.0, 1226.0, 2699.0, 6851.0, 18988.0, 68136.0, 329450.0, 475961.0, 101930.0, 26267.0, 8582.0, 3413.0, 1533.0, 735.0, 437.0, 244.0, 158.0, 108.0, 54.0, 56.0, 32.0, 29.0, 14.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.783935546875, -21.97412109375, -21.164306640625, -20.3544921875, -19.544677734375, -18.73486328125, -17.925048828125, -17.115234375, -16.305419921875, -15.49560546875, -14.685791015625, -13.8759765625, -13.066162109375, -12.25634765625, -11.446533203125, -10.63671875, -9.826904296875, -9.01708984375, -8.207275390625, -7.3974609375, -6.587646484375, -5.77783203125, -4.968017578125, -4.158203125, -3.348388671875, -2.53857421875, -1.728759765625, -0.9189453125, -0.109130859375, 0.70068359375, 1.510498046875, 2.3203125, 3.130126953125, 3.93994140625, 4.749755859375, 5.5595703125, 6.369384765625, 7.17919921875, 7.989013671875, 8.798828125, 9.608642578125, 10.41845703125, 11.228271484375, 12.0380859375, 12.847900390625, 13.65771484375, 14.467529296875, 15.27734375, 16.087158203125, 16.89697265625, 17.706787109375, 18.5166015625, 19.326416015625, 20.13623046875, 20.946044921875, 21.755859375, 22.565673828125, 23.37548828125, 24.185302734375, 24.9951171875, 25.804931640625, 26.61474609375, 27.424560546875, 28.234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 9.0, 6.0, 17.0, 29.0, 21.0, 27.0, 40.0, 43.0, 55.0, 58.0, 50.0, 72.0, 68.0, 54.0, 56.0, 59.0, 55.0, 48.0, 45.0, 40.0, 30.0, 27.0, 17.0, 14.0, 8.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.3927001953125, -13.910400390625, -13.4281005859375, -12.94580078125, -12.4635009765625, -11.981201171875, -11.4989013671875, -11.0166015625, -10.5343017578125, -10.052001953125, -9.5697021484375, -9.08740234375, -8.6051025390625, -8.122802734375, -7.6405029296875, -7.158203125, -6.6759033203125, -6.193603515625, -5.7113037109375, -5.22900390625, -4.7467041015625, -4.264404296875, -3.7821044921875, -3.2998046875, -2.8175048828125, -2.335205078125, -1.8529052734375, -1.37060546875, -0.8883056640625, -0.406005859375, 0.0762939453125, 0.55859375, 1.0408935546875, 1.523193359375, 2.0054931640625, 2.48779296875, 2.9700927734375, 3.452392578125, 3.9346923828125, 4.4169921875, 4.8992919921875, 5.381591796875, 5.8638916015625, 6.34619140625, 6.8284912109375, 7.310791015625, 7.7930908203125, 8.275390625, 8.7576904296875, 9.239990234375, 9.7222900390625, 10.20458984375, 10.6868896484375, 11.169189453125, 11.6514892578125, 12.1337890625, 12.6160888671875, 13.098388671875, 13.5806884765625, 14.06298828125, 14.5452880859375, 15.027587890625, 15.5098876953125, 15.9921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 7.0, 6.0, 9.0, 14.0, 14.0, 16.0, 42.0, 60.0, 57.0, 106.0, 148.0, 228.0, 374.0, 628.0, 1068.0, 1938.0, 3723.0, 7858.0, 17829.0, 48304.0, 165256.0, 477794.0, 221199.0, 61177.0, 21799.0, 9187.0, 4436.0, 2205.0, 1213.0, 678.0, 364.0, 276.0, 183.0, 100.0, 68.0, 41.0, 45.0, 26.0, 17.0, 17.0, 12.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0], "bins": [-27.078125, -26.317626953125, -25.55712890625, -24.796630859375, -24.0361328125, -23.275634765625, -22.51513671875, -21.754638671875, -20.994140625, -20.233642578125, -19.47314453125, -18.712646484375, -17.9521484375, -17.191650390625, -16.43115234375, -15.670654296875, -14.91015625, -14.149658203125, -13.38916015625, -12.628662109375, -11.8681640625, -11.107666015625, -10.34716796875, -9.586669921875, -8.826171875, -8.065673828125, -7.30517578125, -6.544677734375, -5.7841796875, -5.023681640625, -4.26318359375, -3.502685546875, -2.7421875, -1.981689453125, -1.22119140625, -0.460693359375, 0.2998046875, 1.060302734375, 1.82080078125, 2.581298828125, 3.341796875, 4.102294921875, 4.86279296875, 5.623291015625, 6.3837890625, 7.144287109375, 7.90478515625, 8.665283203125, 9.42578125, 10.186279296875, 10.94677734375, 11.707275390625, 12.4677734375, 13.228271484375, 13.98876953125, 14.749267578125, 15.509765625, 16.270263671875, 17.03076171875, 17.791259765625, 18.5517578125, 19.312255859375, 20.07275390625, 20.833251953125, 21.59375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 11.0, 10.0, 16.0, 31.0, 36.0, 62.0, 99.0, 157.0, 171.0, 125.0, 87.0, 64.0, 52.0, 23.0, 12.0, 13.0, 9.0, 1.0, 4.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003108978271484375, -0.0030025839805603027, -0.0028961896896362305, -0.002789795398712158, -0.002683401107788086, -0.0025770068168640137, -0.0024706125259399414, -0.002364218235015869, -0.002257823944091797, -0.0021514296531677246, -0.0020450353622436523, -0.00193864107131958, -0.0018322467803955078, -0.0017258524894714355, -0.0016194581985473633, -0.001513063907623291, -0.0014066696166992188, -0.0013002753257751465, -0.0011938810348510742, -0.001087486743927002, -0.0009810924530029297, -0.0008746981620788574, -0.0007683038711547852, -0.0006619095802307129, -0.0005555152893066406, -0.00044912099838256836, -0.0003427267074584961, -0.00023633241653442383, -0.00012993812561035156, -2.3543834686279297e-05, 8.285045623779297e-05, 0.00018924474716186523, 0.0002956390380859375, 0.00040203332901000977, 0.000508427619934082, 0.0006148219108581543, 0.0007212162017822266, 0.0008276104927062988, 0.0009340047836303711, 0.0010403990745544434, 0.0011467933654785156, 0.0012531876564025879, 0.0013595819473266602, 0.0014659762382507324, 0.0015723705291748047, 0.001678764820098877, 0.0017851591110229492, 0.0018915534019470215, 0.0019979476928710938, 0.002104341983795166, 0.0022107362747192383, 0.0023171305656433105, 0.002423524856567383, 0.002529919147491455, 0.0026363134384155273, 0.0027427077293395996, 0.002849102020263672, 0.002955496311187744, 0.0030618906021118164, 0.0031682848930358887, 0.003274679183959961, 0.003381073474884033, 0.0034874677658081055, 0.0035938620567321777, 0.00370025634765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 8.0, 18.0, 6.0, 23.0, 23.0, 45.0, 77.0, 101.0, 157.0, 259.0, 393.0, 697.0, 1210.0, 2430.0, 4856.0, 11128.0, 29000.0, 96094.0, 403275.0, 365593.0, 86136.0, 26745.0, 10379.0, 4664.0, 2282.0, 1201.0, 671.0, 406.0, 225.0, 138.0, 92.0, 67.0, 47.0, 27.0, 20.0, 15.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.09375, -23.28955078125, -22.4853515625, -21.68115234375, -20.876953125, -20.07275390625, -19.2685546875, -18.46435546875, -17.66015625, -16.85595703125, -16.0517578125, -15.24755859375, -14.443359375, -13.63916015625, -12.8349609375, -12.03076171875, -11.2265625, -10.42236328125, -9.6181640625, -8.81396484375, -8.009765625, -7.20556640625, -6.4013671875, -5.59716796875, -4.79296875, -3.98876953125, -3.1845703125, -2.38037109375, -1.576171875, -0.77197265625, 0.0322265625, 0.83642578125, 1.640625, 2.44482421875, 3.2490234375, 4.05322265625, 4.857421875, 5.66162109375, 6.4658203125, 7.27001953125, 8.07421875, 8.87841796875, 9.6826171875, 10.48681640625, 11.291015625, 12.09521484375, 12.8994140625, 13.70361328125, 14.5078125, 15.31201171875, 16.1162109375, 16.92041015625, 17.724609375, 18.52880859375, 19.3330078125, 20.13720703125, 20.94140625, 21.74560546875, 22.5498046875, 23.35400390625, 24.158203125, 24.96240234375, 25.7666015625, 26.57080078125, 27.375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 10.0, 11.0, 19.0, 20.0, 25.0, 25.0, 29.0, 38.0, 46.0, 57.0, 53.0, 66.0, 79.0, 69.0, 72.0, 53.0, 53.0, 43.0, 40.0, 33.0, 34.0, 16.0, 13.0, 14.0, 7.0, 12.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9234619140625, -10.518798828125, -10.1141357421875, -9.70947265625, -9.3048095703125, -8.900146484375, -8.4954833984375, -8.0908203125, -7.6861572265625, -7.281494140625, -6.8768310546875, -6.47216796875, -6.0675048828125, -5.662841796875, -5.2581787109375, -4.853515625, -4.4488525390625, -4.044189453125, -3.6395263671875, -3.23486328125, -2.8302001953125, -2.425537109375, -2.0208740234375, -1.6162109375, -1.2115478515625, -0.806884765625, -0.4022216796875, 0.00244140625, 0.4071044921875, 0.811767578125, 1.2164306640625, 1.62109375, 2.0257568359375, 2.430419921875, 2.8350830078125, 3.23974609375, 3.6444091796875, 4.049072265625, 4.4537353515625, 4.8583984375, 5.2630615234375, 5.667724609375, 6.0723876953125, 6.47705078125, 6.8817138671875, 7.286376953125, 7.6910400390625, 8.095703125, 8.5003662109375, 8.905029296875, 9.3096923828125, 9.71435546875, 10.1190185546875, 10.523681640625, 10.9283447265625, 11.3330078125, 11.7376708984375, 12.142333984375, 12.5469970703125, 12.95166015625, 13.3563232421875, 13.760986328125, 14.1656494140625, 14.5703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 35.0, 145.0, 359.0, 307.0, 78.0, 30.0, 24.0, 9.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.84410095214844, -149.30491638183594, -137.7657470703125, -126.2265625, -114.6873779296875, -103.148193359375, -91.60901641845703, -80.06983947753906, -68.53065490722656, -56.99147415161133, -45.452293395996094, -33.91311264038086, -22.373931884765625, -10.83475112915039, 0.7044296264648438, 12.243606567382812, 23.782791137695312, 35.32197189331055, 46.86115264892578, 58.400333404541016, 69.93951416015625, 81.47869873046875, 93.01787567138672, 104.55705261230469, 116.09623718261719, 127.63542175292969, 139.17459106445312, 150.71377563476562, 162.25296020507812, 173.79214477539062, 185.33132934570312, 196.87049865722656, 208.40966796875, 219.9488525390625, 231.488037109375, 243.02720642089844, 254.56639099121094, 266.1055603027344, 277.6447448730469, 289.1839294433594, 300.7231140136719, 312.2622985839844, 323.8014831542969, 335.3406677246094, 346.87982177734375, 358.41900634765625, 369.95819091796875, 381.49737548828125, 393.03656005859375, 404.57574462890625, 416.11492919921875, 427.65411376953125, 439.19329833984375, 450.7324523925781, 462.2716369628906, 473.8108215332031, 485.3500061035156, 496.8891906738281, 508.4283752441406, 519.967529296875, 531.5067138671875, 543.0458984375, 554.5850830078125, 566.124267578125, 577.6634521484375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 11.0, 16.0, 15.0, 25.0, 23.0, 29.0, 36.0, 33.0, 47.0, 64.0, 65.0, 67.0, 50.0, 58.0, 70.0, 60.0, 57.0, 56.0, 39.0, 34.0, 31.0, 14.0, 10.0, 12.0, 10.0, 7.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.30193328857422, -82.23118591308594, -79.16043853759766, -76.08969116210938, -73.01893615722656, -69.94818878173828, -66.87744140625, -63.80669403076172, -60.73594284057617, -57.66519546508789, -54.594444274902344, -51.52369689941406, -48.45294952392578, -45.382198333740234, -42.31145095825195, -39.240699768066406, -36.169952392578125, -33.099205017089844, -30.028453826904297, -26.957706451416016, -23.8869571685791, -20.816207885742188, -17.745460510253906, -14.674711227416992, -11.603961944580078, -8.533212661743164, -5.462464332580566, -2.3917160034179688, 0.6790332794189453, 3.7497825622558594, 6.820529937744141, 9.891279220581055, 12.962020874023438, 16.03277015686035, 19.103519439697266, 22.174266815185547, 25.24501609802246, 28.315765380859375, 31.386512756347656, 34.45726013183594, 37.528011322021484, 40.598758697509766, 43.66950988769531, 46.740257263183594, 49.811004638671875, 52.88175582885742, 55.9525032043457, 59.02325439453125, 62.09400177001953, 65.16474914550781, 68.2354965209961, 71.30624389648438, 74.37699890136719, 77.44774627685547, 80.51849365234375, 83.58924102783203, 86.65998840332031, 89.7307357788086, 92.80148315429688, 95.87223815917969, 98.94298553466797, 102.01373291015625, 105.08448028564453, 108.15522766113281, 111.22598266601562]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 0.0, 2.0, 6.0, 4.0, 19.0, 19.0, 23.0, 40.0, 64.0, 102.0, 142.0, 240.0, 429.0, 738.0, 1305.0, 2672.0, 6185.0, 15721.0, 51130.0, 270382.0, 3471573.0, 290656.0, 54248.0, 16697.0, 6283.0, 2704.0, 1230.0, 617.0, 404.0, 228.0, 136.0, 84.0, 56.0, 38.0, 39.0, 16.0, 17.0, 6.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-67.875, -66.01611328125, -64.1572265625, -62.29833984375, -60.439453125, -58.58056640625, -56.7216796875, -54.86279296875, -53.00390625, -51.14501953125, -49.2861328125, -47.42724609375, -45.568359375, -43.70947265625, -41.8505859375, -39.99169921875, -38.1328125, -36.27392578125, -34.4150390625, -32.55615234375, -30.697265625, -28.83837890625, -26.9794921875, -25.12060546875, -23.26171875, -21.40283203125, -19.5439453125, -17.68505859375, -15.826171875, -13.96728515625, -12.1083984375, -10.24951171875, -8.390625, -6.53173828125, -4.6728515625, -2.81396484375, -0.955078125, 0.90380859375, 2.7626953125, 4.62158203125, 6.48046875, 8.33935546875, 10.1982421875, 12.05712890625, 13.916015625, 15.77490234375, 17.6337890625, 19.49267578125, 21.3515625, 23.21044921875, 25.0693359375, 26.92822265625, 28.787109375, 30.64599609375, 32.5048828125, 34.36376953125, 36.22265625, 38.08154296875, 39.9404296875, 41.79931640625, 43.658203125, 45.51708984375, 47.3759765625, 49.23486328125, 51.09375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 7.0, 13.0, 12.0, 25.0, 29.0, 40.0, 46.0, 56.0, 56.0, 80.0, 85.0, 91.0, 89.0, 78.0, 57.0, 49.0, 36.0, 42.0, 30.0, 24.0, 13.0, 6.0, 9.0, 6.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.97515869140625, -2.8526611328125, -2.73016357421875, -2.607666015625, -2.48516845703125, -2.3626708984375, -2.24017333984375, -2.11767578125, -1.99517822265625, -1.8726806640625, -1.75018310546875, -1.627685546875, -1.50518798828125, -1.3826904296875, -1.26019287109375, -1.1376953125, -1.01519775390625, -0.8927001953125, -0.77020263671875, -0.647705078125, -0.52520751953125, -0.4027099609375, -0.28021240234375, -0.15771484375, -0.03521728515625, 0.0872802734375, 0.20977783203125, 0.332275390625, 0.45477294921875, 0.5772705078125, 0.69976806640625, 0.822265625, 0.94476318359375, 1.0672607421875, 1.18975830078125, 1.312255859375, 1.43475341796875, 1.5572509765625, 1.67974853515625, 1.80224609375, 1.92474365234375, 2.0472412109375, 2.16973876953125, 2.292236328125, 2.41473388671875, 2.5372314453125, 2.65972900390625, 2.7822265625, 2.90472412109375, 3.0272216796875, 3.14971923828125, 3.272216796875, 3.39471435546875, 3.5172119140625, 3.63970947265625, 3.76220703125, 3.88470458984375, 4.0072021484375, 4.12969970703125, 4.252197265625, 4.37469482421875, 4.4971923828125, 4.61968994140625, 4.7421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 9.0, 11.0, 7.0, 15.0, 12.0, 25.0, 26.0, 43.0, 56.0, 85.0, 163.0, 265.0, 570.0, 1373.0, 3953.0, 14455.0, 82214.0, 1189914.0, 2766463.0, 109169.0, 17875.0, 4634.0, 1573.0, 612.0, 281.0, 153.0, 100.0, 56.0, 39.0, 28.0, 32.0, 16.0, 9.0, 9.0, 4.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.7470703125, -64.369140625, -61.9912109375, -59.61328125, -57.2353515625, -54.857421875, -52.4794921875, -50.1015625, -47.7236328125, -45.345703125, -42.9677734375, -40.58984375, -38.2119140625, -35.833984375, -33.4560546875, -31.078125, -28.7001953125, -26.322265625, -23.9443359375, -21.56640625, -19.1884765625, -16.810546875, -14.4326171875, -12.0546875, -9.6767578125, -7.298828125, -4.9208984375, -2.54296875, -0.1650390625, 2.212890625, 4.5908203125, 6.96875, 9.3466796875, 11.724609375, 14.1025390625, 16.48046875, 18.8583984375, 21.236328125, 23.6142578125, 25.9921875, 28.3701171875, 30.748046875, 33.1259765625, 35.50390625, 37.8818359375, 40.259765625, 42.6376953125, 45.015625, 47.3935546875, 49.771484375, 52.1494140625, 54.52734375, 56.9052734375, 59.283203125, 61.6611328125, 64.0390625, 66.4169921875, 68.794921875, 71.1728515625, 73.55078125, 75.9287109375, 78.306640625, 80.6845703125, 83.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 18.0, 13.0, 19.0, 18.0, 47.0, 51.0, 70.0, 88.0, 118.0, 173.0, 227.0, 354.0, 1095.0, 620.0, 298.0, 228.0, 168.0, 121.0, 72.0, 73.0, 39.0, 30.0, 17.0, 26.0, 13.0, 14.0, 8.0, 6.0, 7.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87890625, -6.6561279296875, -6.433349609375, -6.2105712890625, -5.98779296875, -5.7650146484375, -5.542236328125, -5.3194580078125, -5.0966796875, -4.8739013671875, -4.651123046875, -4.4283447265625, -4.20556640625, -3.9827880859375, -3.760009765625, -3.5372314453125, -3.314453125, -3.0916748046875, -2.868896484375, -2.6461181640625, -2.42333984375, -2.2005615234375, -1.977783203125, -1.7550048828125, -1.5322265625, -1.3094482421875, -1.086669921875, -0.8638916015625, -0.64111328125, -0.4183349609375, -0.195556640625, 0.0272216796875, 0.25, 0.4727783203125, 0.695556640625, 0.9183349609375, 1.14111328125, 1.3638916015625, 1.586669921875, 1.8094482421875, 2.0322265625, 2.2550048828125, 2.477783203125, 2.7005615234375, 2.92333984375, 3.1461181640625, 3.368896484375, 3.5916748046875, 3.814453125, 4.0372314453125, 4.260009765625, 4.4827880859375, 4.70556640625, 4.9283447265625, 5.151123046875, 5.3739013671875, 5.5966796875, 5.8194580078125, 6.042236328125, 6.2650146484375, 6.48779296875, 6.7105712890625, 6.933349609375, 7.1561279296875, 7.37890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 10.0, 57.0, 165.0, 435.0, 245.0, 59.0, 26.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.42633056640625, -113.62159729003906, -107.8168716430664, -102.01214599609375, -96.20741271972656, -90.40267944335938, -84.59795379638672, -78.79322814941406, -72.98849487304688, -67.18376159667969, -61.37903594970703, -55.57430648803711, -49.76957702636719, -43.964847564697266, -38.160118103027344, -32.35538864135742, -26.5506591796875, -20.745929718017578, -14.941200256347656, -9.136470794677734, -3.3317413330078125, 2.4729881286621094, 8.277717590332031, 14.082447052001953, 19.887176513671875, 25.691905975341797, 31.49663543701172, 37.30136489868164, 43.10609436035156, 48.910823822021484, 54.715553283691406, 60.52028274536133, 66.32501220703125, 72.12974548339844, 77.9344711303711, 83.73919677734375, 89.54393005371094, 95.34866333007812, 101.15338897705078, 106.95811462402344, 112.76284790039062, 118.56758117675781, 124.37230682373047, 130.17703247070312, 135.9817657470703, 141.7864990234375, 147.59121704101562, 153.3959503173828, 159.20068359375, 165.0054168701172, 170.81015014648438, 176.6148681640625, 182.4196014404297, 188.22433471679688, 194.029052734375, 199.8337860107422, 205.63851928710938, 211.44325256347656, 217.24798583984375, 223.05270385742188, 228.85743713378906, 234.66217041015625, 240.46688842773438, 246.27162170410156, 252.07635498046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 10.0, 8.0, 14.0, 20.0, 20.0, 30.0, 17.0, 32.0, 34.0, 30.0, 48.0, 32.0, 40.0, 39.0, 41.0, 44.0, 46.0, 46.0, 57.0, 38.0, 37.0, 44.0, 27.0, 29.0, 21.0, 25.0, 20.0, 26.0, 16.0, 12.0, 11.0, 11.0, 6.0, 8.0, 7.0, 7.0, 3.0, 1.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.201194763183594, -28.271142959594727, -27.341093063354492, -26.411041259765625, -25.48099136352539, -24.550939559936523, -23.620887756347656, -22.690837860107422, -21.760786056518555, -20.830734252929688, -19.900684356689453, -18.970632553100586, -18.04058265686035, -17.110530853271484, -16.18048095703125, -15.250429153442383, -14.320378303527832, -13.390327453613281, -12.46027660369873, -11.53022575378418, -10.600173950195312, -9.670123100280762, -8.740072250366211, -7.810020923614502, -6.879970073699951, -5.9499192237854, -5.019867897033691, -4.089817047119141, -3.1597659587860107, -2.229714870452881, -1.29966402053833, -0.3696126937866211, 0.5604381561279297, 1.4904892444610596, 2.4205403327941895, 3.3505911827087402, 4.280642509460449, 5.210693359375, 6.140744209289551, 7.07079553604126, 8.000846862792969, 8.93089771270752, 9.86094856262207, 10.791000366210938, 11.721051216125488, 12.651102066040039, 13.58115291595459, 14.51120376586914, 15.441254615783691, 16.371305465698242, 17.30135726928711, 18.231407165527344, 19.16145896911621, 20.091510772705078, 21.021560668945312, 21.95161247253418, 22.881662368774414, 23.81171417236328, 24.741764068603516, 25.671815872192383, 26.601865768432617, 27.531917572021484, 28.46196746826172, 29.392019271850586, 30.322071075439453]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 8.0, 7.0, 20.0, 26.0, 38.0, 45.0, 65.0, 66.0, 145.0, 177.0, 287.0, 426.0, 751.0, 1288.0, 2498.0, 5222.0, 11632.0, 29347.0, 78833.0, 214369.0, 380425.0, 200658.0, 73100.0, 27686.0, 10978.0, 4843.0, 2388.0, 1248.0, 673.0, 399.0, 288.0, 189.0, 113.0, 94.0, 68.0, 47.0, 33.0, 24.0, 16.0, 17.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.3125, -32.345947265625, -31.37939453125, -30.412841796875, -29.4462890625, -28.479736328125, -27.51318359375, -26.546630859375, -25.580078125, -24.613525390625, -23.64697265625, -22.680419921875, -21.7138671875, -20.747314453125, -19.78076171875, -18.814208984375, -17.84765625, -16.881103515625, -15.91455078125, -14.947998046875, -13.9814453125, -13.014892578125, -12.04833984375, -11.081787109375, -10.115234375, -9.148681640625, -8.18212890625, -7.215576171875, -6.2490234375, -5.282470703125, -4.31591796875, -3.349365234375, -2.3828125, -1.416259765625, -0.44970703125, 0.516845703125, 1.4833984375, 2.449951171875, 3.41650390625, 4.383056640625, 5.349609375, 6.316162109375, 7.28271484375, 8.249267578125, 9.2158203125, 10.182373046875, 11.14892578125, 12.115478515625, 13.08203125, 14.048583984375, 15.01513671875, 15.981689453125, 16.9482421875, 17.914794921875, 18.88134765625, 19.847900390625, 20.814453125, 21.781005859375, 22.74755859375, 23.714111328125, 24.6806640625, 25.647216796875, 26.61376953125, 27.580322265625, 28.546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 9.0, 16.0, 24.0, 28.0, 42.0, 47.0, 68.0, 69.0, 89.0, 85.0, 84.0, 76.0, 76.0, 62.0, 56.0, 33.0, 30.0, 27.0, 21.0, 13.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.0909423828125, -2.963134765625, -2.8353271484375, -2.70751953125, -2.5797119140625, -2.451904296875, -2.3240966796875, -2.1962890625, -2.0684814453125, -1.940673828125, -1.8128662109375, -1.68505859375, -1.5572509765625, -1.429443359375, -1.3016357421875, -1.173828125, -1.0460205078125, -0.918212890625, -0.7904052734375, -0.66259765625, -0.5347900390625, -0.406982421875, -0.2791748046875, -0.1513671875, -0.0235595703125, 0.104248046875, 0.2320556640625, 0.35986328125, 0.4876708984375, 0.615478515625, 0.7432861328125, 0.87109375, 0.9989013671875, 1.126708984375, 1.2545166015625, 1.38232421875, 1.5101318359375, 1.637939453125, 1.7657470703125, 1.8935546875, 2.0213623046875, 2.149169921875, 2.2769775390625, 2.40478515625, 2.5325927734375, 2.660400390625, 2.7882080078125, 2.916015625, 3.0438232421875, 3.171630859375, 3.2994384765625, 3.42724609375, 3.5550537109375, 3.682861328125, 3.8106689453125, 3.9384765625, 4.0662841796875, 4.194091796875, 4.3218994140625, 4.44970703125, 4.5775146484375, 4.705322265625, 4.8331298828125, 4.9609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 9.0, 12.0, 14.0, 13.0, 26.0, 27.0, 43.0, 49.0, 83.0, 110.0, 168.0, 337.0, 539.0, 1127.0, 2530.0, 6620.0, 20189.0, 69282.0, 261674.0, 460632.0, 160004.0, 43250.0, 13289.0, 4673.0, 1840.0, 813.0, 456.0, 251.0, 126.0, 115.0, 68.0, 48.0, 34.0, 33.0, 17.0, 15.0, 5.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.71875, -36.474609375, -35.23046875, -33.986328125, -32.7421875, -31.498046875, -30.25390625, -29.009765625, -27.765625, -26.521484375, -25.27734375, -24.033203125, -22.7890625, -21.544921875, -20.30078125, -19.056640625, -17.8125, -16.568359375, -15.32421875, -14.080078125, -12.8359375, -11.591796875, -10.34765625, -9.103515625, -7.859375, -6.615234375, -5.37109375, -4.126953125, -2.8828125, -1.638671875, -0.39453125, 0.849609375, 2.09375, 3.337890625, 4.58203125, 5.826171875, 7.0703125, 8.314453125, 9.55859375, 10.802734375, 12.046875, 13.291015625, 14.53515625, 15.779296875, 17.0234375, 18.267578125, 19.51171875, 20.755859375, 22.0, 23.244140625, 24.48828125, 25.732421875, 26.9765625, 28.220703125, 29.46484375, 30.708984375, 31.953125, 33.197265625, 34.44140625, 35.685546875, 36.9296875, 38.173828125, 39.41796875, 40.662109375, 41.90625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 2.0, 7.0, 14.0, 13.0, 19.0, 16.0, 23.0, 29.0, 31.0, 33.0, 35.0, 45.0, 43.0, 62.0, 46.0, 54.0, 54.0, 51.0, 47.0, 58.0, 44.0, 33.0, 29.0, 33.0, 29.0, 26.0, 28.0, 16.0, 16.0, 10.0, 15.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.212158203125, -15.64306640625, -15.073974609375, -14.5048828125, -13.935791015625, -13.36669921875, -12.797607421875, -12.228515625, -11.659423828125, -11.09033203125, -10.521240234375, -9.9521484375, -9.383056640625, -8.81396484375, -8.244873046875, -7.67578125, -7.106689453125, -6.53759765625, -5.968505859375, -5.3994140625, -4.830322265625, -4.26123046875, -3.692138671875, -3.123046875, -2.553955078125, -1.98486328125, -1.415771484375, -0.8466796875, -0.277587890625, 0.29150390625, 0.860595703125, 1.4296875, 1.998779296875, 2.56787109375, 3.136962890625, 3.7060546875, 4.275146484375, 4.84423828125, 5.413330078125, 5.982421875, 6.551513671875, 7.12060546875, 7.689697265625, 8.2587890625, 8.827880859375, 9.39697265625, 9.966064453125, 10.53515625, 11.104248046875, 11.67333984375, 12.242431640625, 12.8115234375, 13.380615234375, 13.94970703125, 14.518798828125, 15.087890625, 15.656982421875, 16.22607421875, 16.795166015625, 17.3642578125, 17.933349609375, 18.50244140625, 19.071533203125, 19.640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 22.0, 32.0, 43.0, 55.0, 107.0, 160.0, 317.0, 571.0, 1063.0, 2157.0, 4607.0, 10536.0, 27540.0, 83744.0, 298168.0, 417497.0, 134721.0, 40548.0, 14606.0, 6097.0, 2784.0, 1325.0, 712.0, 411.0, 220.0, 157.0, 102.0, 56.0, 37.0, 25.0, 23.0, 21.0, 17.0, 4.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-22.984375, -22.270263671875, -21.55615234375, -20.842041015625, -20.1279296875, -19.413818359375, -18.69970703125, -17.985595703125, -17.271484375, -16.557373046875, -15.84326171875, -15.129150390625, -14.4150390625, -13.700927734375, -12.98681640625, -12.272705078125, -11.55859375, -10.844482421875, -10.13037109375, -9.416259765625, -8.7021484375, -7.988037109375, -7.27392578125, -6.559814453125, -5.845703125, -5.131591796875, -4.41748046875, -3.703369140625, -2.9892578125, -2.275146484375, -1.56103515625, -0.846923828125, -0.1328125, 0.581298828125, 1.29541015625, 2.009521484375, 2.7236328125, 3.437744140625, 4.15185546875, 4.865966796875, 5.580078125, 6.294189453125, 7.00830078125, 7.722412109375, 8.4365234375, 9.150634765625, 9.86474609375, 10.578857421875, 11.29296875, 12.007080078125, 12.72119140625, 13.435302734375, 14.1494140625, 14.863525390625, 15.57763671875, 16.291748046875, 17.005859375, 17.719970703125, 18.43408203125, 19.148193359375, 19.8623046875, 20.576416015625, 21.29052734375, 22.004638671875, 22.71875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 11.0, 12.0, 12.0, 20.0, 37.0, 50.0, 56.0, 65.0, 103.0, 94.0, 122.0, 84.0, 84.0, 69.0, 33.0, 32.0, 36.0, 19.0, 13.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042266845703125, -0.0040991902351379395, -0.003971695899963379, -0.0038442015647888184, -0.003716707229614258, -0.0035892128944396973, -0.0034617185592651367, -0.003334224224090576, -0.0032067298889160156, -0.003079235553741455, -0.0029517412185668945, -0.002824246883392334, -0.0026967525482177734, -0.002569258213043213, -0.0024417638778686523, -0.002314269542694092, -0.0021867752075195312, -0.0020592808723449707, -0.0019317865371704102, -0.0018042922019958496, -0.001676797866821289, -0.0015493035316467285, -0.001421809196472168, -0.0012943148612976074, -0.0011668205261230469, -0.0010393261909484863, -0.0009118318557739258, -0.0007843375205993652, -0.0006568431854248047, -0.0005293488502502441, -0.0004018545150756836, -0.00027436017990112305, -0.0001468658447265625, -1.9371509552001953e-05, 0.0001081228256225586, 0.00023561716079711914, 0.0003631114959716797, 0.0004906058311462402, 0.0006181001663208008, 0.0007455945014953613, 0.0008730888366699219, 0.0010005831718444824, 0.001128077507019043, 0.0012555718421936035, 0.001383066177368164, 0.0015105605125427246, 0.0016380548477172852, 0.0017655491828918457, 0.0018930435180664062, 0.002020537853240967, 0.0021480321884155273, 0.002275526523590088, 0.0024030208587646484, 0.002530515193939209, 0.0026580095291137695, 0.00278550386428833, 0.0029129981994628906, 0.003040492534637451, 0.0031679868698120117, 0.0032954812049865723, 0.003422975540161133, 0.0035504698753356934, 0.003677964210510254, 0.0038054585456848145, 0.003932952880859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 14.0, 23.0, 41.0, 71.0, 115.0, 233.0, 484.0, 973.0, 2617.0, 8691.0, 39710.0, 344976.0, 570037.0, 62339.0, 12252.0, 3512.0, 1293.0, 539.0, 253.0, 117.0, 92.0, 46.0, 31.0, 16.0, 17.0, 11.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-51.96875, -50.56884765625, -49.1689453125, -47.76904296875, -46.369140625, -44.96923828125, -43.5693359375, -42.16943359375, -40.76953125, -39.36962890625, -37.9697265625, -36.56982421875, -35.169921875, -33.77001953125, -32.3701171875, -30.97021484375, -29.5703125, -28.17041015625, -26.7705078125, -25.37060546875, -23.970703125, -22.57080078125, -21.1708984375, -19.77099609375, -18.37109375, -16.97119140625, -15.5712890625, -14.17138671875, -12.771484375, -11.37158203125, -9.9716796875, -8.57177734375, -7.171875, -5.77197265625, -4.3720703125, -2.97216796875, -1.572265625, -0.17236328125, 1.2275390625, 2.62744140625, 4.02734375, 5.42724609375, 6.8271484375, 8.22705078125, 9.626953125, 11.02685546875, 12.4267578125, 13.82666015625, 15.2265625, 16.62646484375, 18.0263671875, 19.42626953125, 20.826171875, 22.22607421875, 23.6259765625, 25.02587890625, 26.42578125, 27.82568359375, 29.2255859375, 30.62548828125, 32.025390625, 33.42529296875, 34.8251953125, 36.22509765625, 37.625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 9.0, 13.0, 20.0, 16.0, 25.0, 51.0, 49.0, 73.0, 88.0, 118.0, 107.0, 103.0, 82.0, 63.0, 37.0, 26.0, 19.0, 21.0, 17.0, 9.0, 7.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.96875, -19.4305419921875, -18.892333984375, -18.3541259765625, -17.81591796875, -17.2777099609375, -16.739501953125, -16.2012939453125, -15.6630859375, -15.1248779296875, -14.586669921875, -14.0484619140625, -13.51025390625, -12.9720458984375, -12.433837890625, -11.8956298828125, -11.357421875, -10.8192138671875, -10.281005859375, -9.7427978515625, -9.20458984375, -8.6663818359375, -8.128173828125, -7.5899658203125, -7.0517578125, -6.5135498046875, -5.975341796875, -5.4371337890625, -4.89892578125, -4.3607177734375, -3.822509765625, -3.2843017578125, -2.74609375, -2.2078857421875, -1.669677734375, -1.1314697265625, -0.59326171875, -0.0550537109375, 0.483154296875, 1.0213623046875, 1.5595703125, 2.0977783203125, 2.635986328125, 3.1741943359375, 3.71240234375, 4.2506103515625, 4.788818359375, 5.3270263671875, 5.865234375, 6.4034423828125, 6.941650390625, 7.4798583984375, 8.01806640625, 8.5562744140625, 9.094482421875, 9.6326904296875, 10.1708984375, 10.7091064453125, 11.247314453125, 11.7855224609375, 12.32373046875, 12.8619384765625, 13.400146484375, 13.9383544921875, 14.4765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 12.0, 26.0, 62.0, 104.0, 183.0, 223.0, 169.0, 110.0, 54.0, 18.0, 12.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.73016357421875, -367.71539306640625, -356.70062255859375, -345.6858215332031, -334.6710510253906, -323.6562805175781, -312.6414794921875, -301.626708984375, -290.6119384765625, -279.59716796875, -268.5823974609375, -257.5675964355469, -246.55282592773438, -235.53805541992188, -224.5232696533203, -213.50848388671875, -202.49371337890625, -191.47894287109375, -180.4641571044922, -169.44937133789062, -158.43460083007812, -147.41983032226562, -136.40504455566406, -125.39026641845703, -114.37548828125, -103.36071014404297, -92.34593200683594, -81.3311538696289, -70.31637573242188, -59.301597595214844, -48.28681945800781, -37.27204132080078, -26.257232666015625, -15.242454528808594, -4.2276763916015625, 6.787101745605469, 17.8018798828125, 28.81665802001953, 39.83143615722656, 50.846214294433594, 61.860992431640625, 72.87577056884766, 83.89054870605469, 94.90532684326172, 105.92010498046875, 116.93488311767578, 127.94966125488281, 138.96444702148438, 149.97921752929688, 160.99398803710938, 172.00877380371094, 183.0235595703125, 194.038330078125, 205.0531005859375, 216.06788635253906, 227.08267211914062, 238.09744262695312, 249.11221313476562, 260.12701416015625, 271.14178466796875, 282.15655517578125, 293.17132568359375, 304.18609619140625, 315.2008972167969, 326.2156677246094]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 11.0, 12.0, 18.0, 19.0, 25.0, 18.0, 15.0, 31.0, 28.0, 49.0, 49.0, 43.0, 56.0, 26.0, 47.0, 54.0, 41.0, 50.0, 34.0, 45.0, 39.0, 38.0, 43.0, 29.0, 22.0, 26.0, 20.0, 11.0, 16.0, 10.0, 9.0, 8.0, 8.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-133.895263671875, -130.08030700683594, -126.2653579711914, -122.45040130615234, -118.63545227050781, -114.82049560546875, -111.00553894042969, -107.19058990478516, -103.37564086914062, -99.56068420410156, -95.74573516845703, -91.93077850341797, -88.11582946777344, -84.30087280273438, -80.48591613769531, -76.67096710205078, -72.85601043701172, -69.04105377197266, -65.22610473632812, -61.41114807128906, -57.59619903564453, -53.78124237060547, -49.96628952026367, -46.151336669921875, -42.33638381958008, -38.52143096923828, -34.706478118896484, -30.891523361206055, -27.076570510864258, -23.26161766052246, -19.44666290283203, -15.631710052490234, -11.816764831542969, -8.001811981201172, -4.186858177185059, -0.3719043731689453, 3.4430484771728516, 7.258001327514648, 11.072956085205078, 14.887908935546875, 18.702861785888672, 22.51781463623047, 26.332767486572266, 30.147722244262695, 33.962677001953125, 37.777626037597656, 41.59258270263672, 45.407535552978516, 49.22248840332031, 53.03744125366211, 56.852394104003906, 60.66735076904297, 64.4822998046875, 68.29725646972656, 72.11221313476562, 75.92716217041016, 79.74211120605469, 83.55706787109375, 87.37201690673828, 91.18697357177734, 95.00192260742188, 98.81687927246094, 102.6318359375, 106.44678497314453, 110.2617416381836]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 9.0, 15.0, 21.0, 20.0, 30.0, 46.0, 62.0, 78.0, 121.0, 172.0, 243.0, 390.0, 638.0, 1051.0, 1938.0, 3712.0, 8289.0, 21419.0, 68032.0, 337218.0, 3383230.0, 270800.0, 61660.0, 20071.0, 7884.0, 3433.0, 1649.0, 860.0, 440.0, 272.0, 165.0, 99.0, 60.0, 35.0, 36.0, 22.0, 22.0, 17.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.375, -53.71923828125, -52.0634765625, -50.40771484375, -48.751953125, -47.09619140625, -45.4404296875, -43.78466796875, -42.12890625, -40.47314453125, -38.8173828125, -37.16162109375, -35.505859375, -33.85009765625, -32.1943359375, -30.53857421875, -28.8828125, -27.22705078125, -25.5712890625, -23.91552734375, -22.259765625, -20.60400390625, -18.9482421875, -17.29248046875, -15.63671875, -13.98095703125, -12.3251953125, -10.66943359375, -9.013671875, -7.35791015625, -5.7021484375, -4.04638671875, -2.390625, -0.73486328125, 0.9208984375, 2.57666015625, 4.232421875, 5.88818359375, 7.5439453125, 9.19970703125, 10.85546875, 12.51123046875, 14.1669921875, 15.82275390625, 17.478515625, 19.13427734375, 20.7900390625, 22.44580078125, 24.1015625, 25.75732421875, 27.4130859375, 29.06884765625, 30.724609375, 32.38037109375, 34.0361328125, 35.69189453125, 37.34765625, 39.00341796875, 40.6591796875, 42.31494140625, 43.970703125, 45.62646484375, 47.2822265625, 48.93798828125, 50.59375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 16.0, 19.0, 27.0, 36.0, 43.0, 46.0, 60.0, 69.0, 78.0, 63.0, 73.0, 69.0, 77.0, 60.0, 42.0, 45.0, 32.0, 29.0, 29.0, 12.0, 16.0, 9.0, 12.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.77362060546875, -3.6292724609375, -3.48492431640625, -3.340576171875, -3.19622802734375, -3.0518798828125, -2.90753173828125, -2.76318359375, -2.61883544921875, -2.4744873046875, -2.33013916015625, -2.185791015625, -2.04144287109375, -1.8970947265625, -1.75274658203125, -1.6083984375, -1.46405029296875, -1.3197021484375, -1.17535400390625, -1.031005859375, -0.88665771484375, -0.7423095703125, -0.59796142578125, -0.45361328125, -0.30926513671875, -0.1649169921875, -0.02056884765625, 0.123779296875, 0.26812744140625, 0.4124755859375, 0.55682373046875, 0.701171875, 0.84552001953125, 0.9898681640625, 1.13421630859375, 1.278564453125, 1.42291259765625, 1.5672607421875, 1.71160888671875, 1.85595703125, 2.00030517578125, 2.1446533203125, 2.28900146484375, 2.433349609375, 2.57769775390625, 2.7220458984375, 2.86639404296875, 3.0107421875, 3.15509033203125, 3.2994384765625, 3.44378662109375, 3.588134765625, 3.73248291015625, 3.8768310546875, 4.02117919921875, 4.16552734375, 4.30987548828125, 4.4542236328125, 4.59857177734375, 4.742919921875, 4.88726806640625, 5.0316162109375, 5.17596435546875, 5.3203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 20.0, 15.0, 22.0, 53.0, 69.0, 130.0, 194.0, 337.0, 571.0, 1116.0, 2436.0, 5544.0, 14333.0, 43011.0, 168149.0, 2431916.0, 1315696.0, 148499.0, 39227.0, 13306.0, 5190.0, 2216.0, 1005.0, 516.0, 289.0, 153.0, 97.0, 40.0, 37.0, 21.0, 21.0, 14.0, 11.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.759765625, -45.98828125, -44.216796875, -42.4453125, -40.673828125, -38.90234375, -37.130859375, -35.359375, -33.587890625, -31.81640625, -30.044921875, -28.2734375, -26.501953125, -24.73046875, -22.958984375, -21.1875, -19.416015625, -17.64453125, -15.873046875, -14.1015625, -12.330078125, -10.55859375, -8.787109375, -7.015625, -5.244140625, -3.47265625, -1.701171875, 0.0703125, 1.841796875, 3.61328125, 5.384765625, 7.15625, 8.927734375, 10.69921875, 12.470703125, 14.2421875, 16.013671875, 17.78515625, 19.556640625, 21.328125, 23.099609375, 24.87109375, 26.642578125, 28.4140625, 30.185546875, 31.95703125, 33.728515625, 35.5, 37.271484375, 39.04296875, 40.814453125, 42.5859375, 44.357421875, 46.12890625, 47.900390625, 49.671875, 51.443359375, 53.21484375, 54.986328125, 56.7578125, 58.529296875, 60.30078125, 62.072265625, 63.84375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 17.0, 10.0, 23.0, 25.0, 39.0, 49.0, 53.0, 70.0, 133.0, 151.0, 267.0, 463.0, 1434.0, 448.0, 259.0, 169.0, 110.0, 80.0, 60.0, 44.0, 37.0, 28.0, 20.0, 14.0, 13.0, 16.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.75, -12.40087890625, -12.0517578125, -11.70263671875, -11.353515625, -11.00439453125, -10.6552734375, -10.30615234375, -9.95703125, -9.60791015625, -9.2587890625, -8.90966796875, -8.560546875, -8.21142578125, -7.8623046875, -7.51318359375, -7.1640625, -6.81494140625, -6.4658203125, -6.11669921875, -5.767578125, -5.41845703125, -5.0693359375, -4.72021484375, -4.37109375, -4.02197265625, -3.6728515625, -3.32373046875, -2.974609375, -2.62548828125, -2.2763671875, -1.92724609375, -1.578125, -1.22900390625, -0.8798828125, -0.53076171875, -0.181640625, 0.16748046875, 0.5166015625, 0.86572265625, 1.21484375, 1.56396484375, 1.9130859375, 2.26220703125, 2.611328125, 2.96044921875, 3.3095703125, 3.65869140625, 4.0078125, 4.35693359375, 4.7060546875, 5.05517578125, 5.404296875, 5.75341796875, 6.1025390625, 6.45166015625, 6.80078125, 7.14990234375, 7.4990234375, 7.84814453125, 8.197265625, 8.54638671875, 8.8955078125, 9.24462890625, 9.59375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 14.0, 10.0, 17.0, 23.0, 30.0, 46.0, 50.0, 69.0, 87.0, 106.0, 101.0, 90.0, 82.0, 63.0, 45.0, 35.0, 32.0, 20.0, 16.0, 12.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-57.18735885620117, -55.36600112915039, -53.54464340209961, -51.72328186035156, -49.90192413330078, -48.08056640625, -46.25920867919922, -44.43785095214844, -42.61648941040039, -40.79513168334961, -38.97377395629883, -37.15241241455078, -35.3310546875, -33.50969696044922, -31.688339233398438, -29.866979598999023, -28.045621871948242, -26.22426414489746, -24.402904510498047, -22.581546783447266, -20.76018714904785, -18.93882942199707, -17.117469787597656, -15.296112060546875, -13.474753379821777, -11.65339469909668, -9.832036018371582, -8.010677337646484, -6.189319133758545, -4.3679609298706055, -2.546602249145508, -0.7252435684204102, 1.0961151123046875, 2.917473793029785, 4.738832473754883, 6.560190677642822, 8.381549835205078, 10.20290756225586, 12.024266242980957, 13.845624923706055, 15.666983604431152, 17.48834228515625, 19.30970001220703, 21.131059646606445, 22.952417373657227, 24.77377700805664, 26.595134735107422, 28.416492462158203, 30.237852096557617, 32.05921173095703, 33.88056945800781, 35.701927185058594, 37.523284912109375, 39.344642639160156, 41.1660041809082, 42.987361907958984, 44.808719635009766, 46.63007736206055, 48.45143508911133, 50.272796630859375, 52.094154357910156, 53.91551208496094, 55.73686981201172, 57.5582275390625, 59.37958908081055]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 9.0, 8.0, 18.0, 11.0, 18.0, 25.0, 23.0, 31.0, 26.0, 30.0, 42.0, 32.0, 31.0, 50.0, 49.0, 42.0, 41.0, 57.0, 41.0, 50.0, 33.0, 38.0, 31.0, 29.0, 27.0, 29.0, 26.0, 26.0, 19.0, 16.0, 7.0, 12.0, 9.0, 6.0, 7.0, 11.0, 1.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-43.58074951171875, -42.231414794921875, -40.882076263427734, -39.53274154663086, -38.183406829833984, -36.83407211303711, -35.48473358154297, -34.135398864746094, -32.78606414794922, -31.43672752380371, -30.087392807006836, -28.738056182861328, -27.388721466064453, -26.039384841918945, -24.690048217773438, -23.340713500976562, -21.991376876831055, -20.642040252685547, -19.292705535888672, -17.943368911743164, -16.59403419494629, -15.244697570800781, -13.89536190032959, -12.546026229858398, -11.196690559387207, -9.847354888916016, -8.498019218444824, -7.148683071136475, -5.799347400665283, -4.450011730194092, -3.100675582885742, -1.7513399124145508, -0.4020042419433594, 0.9473315477371216, 2.2966673374176025, 3.646003246307373, 4.9953389167785645, 6.344674587249756, 7.6940107345581055, 9.043346405029297, 10.392682075500488, 11.74201774597168, 13.091353416442871, 14.440689086914062, 15.79002571105957, 17.139360427856445, 18.488697052001953, 19.838031768798828, 21.187368392944336, 22.536705017089844, 23.88603973388672, 25.235376358032227, 26.5847110748291, 27.93404769897461, 29.283382415771484, 30.632719039916992, 31.9820556640625, 33.331390380859375, 34.680728912353516, 36.03006362915039, 37.379398345947266, 38.72873306274414, 40.07807159423828, 41.427406311035156, 42.77674102783203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 7.0, 6.0, 8.0, 16.0, 18.0, 30.0, 41.0, 74.0, 77.0, 112.0, 186.0, 244.0, 361.0, 526.0, 871.0, 1405.0, 2308.0, 4192.0, 7831.0, 15966.0, 33910.0, 74963.0, 165963.0, 303664.0, 232084.0, 108473.0, 48541.0, 22378.0, 10713.0, 5633.0, 3095.0, 1709.0, 1052.0, 688.0, 434.0, 306.0, 206.0, 147.0, 91.0, 67.0, 48.0, 30.0, 17.0, 20.0, 10.0, 8.0, 3.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-25.3125, -24.48876953125, -23.6650390625, -22.84130859375, -22.017578125, -21.19384765625, -20.3701171875, -19.54638671875, -18.72265625, -17.89892578125, -17.0751953125, -16.25146484375, -15.427734375, -14.60400390625, -13.7802734375, -12.95654296875, -12.1328125, -11.30908203125, -10.4853515625, -9.66162109375, -8.837890625, -8.01416015625, -7.1904296875, -6.36669921875, -5.54296875, -4.71923828125, -3.8955078125, -3.07177734375, -2.248046875, -1.42431640625, -0.6005859375, 0.22314453125, 1.046875, 1.87060546875, 2.6943359375, 3.51806640625, 4.341796875, 5.16552734375, 5.9892578125, 6.81298828125, 7.63671875, 8.46044921875, 9.2841796875, 10.10791015625, 10.931640625, 11.75537109375, 12.5791015625, 13.40283203125, 14.2265625, 15.05029296875, 15.8740234375, 16.69775390625, 17.521484375, 18.34521484375, 19.1689453125, 19.99267578125, 20.81640625, 21.64013671875, 22.4638671875, 23.28759765625, 24.111328125, 24.93505859375, 25.7587890625, 26.58251953125, 27.40625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 11.0, 15.0, 19.0, 24.0, 29.0, 34.0, 45.0, 55.0, 48.0, 56.0, 69.0, 69.0, 53.0, 64.0, 59.0, 56.0, 51.0, 43.0, 37.0, 41.0, 25.0, 18.0, 6.0, 13.0, 6.0, 10.0, 4.0, 6.0, 1.0, 8.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.009521484375, -3.86669921875, -3.723876953125, -3.5810546875, -3.438232421875, -3.29541015625, -3.152587890625, -3.009765625, -2.866943359375, -2.72412109375, -2.581298828125, -2.4384765625, -2.295654296875, -2.15283203125, -2.010009765625, -1.8671875, -1.724365234375, -1.58154296875, -1.438720703125, -1.2958984375, -1.153076171875, -1.01025390625, -0.867431640625, -0.724609375, -0.581787109375, -0.43896484375, -0.296142578125, -0.1533203125, -0.010498046875, 0.13232421875, 0.275146484375, 0.41796875, 0.560791015625, 0.70361328125, 0.846435546875, 0.9892578125, 1.132080078125, 1.27490234375, 1.417724609375, 1.560546875, 1.703369140625, 1.84619140625, 1.989013671875, 2.1318359375, 2.274658203125, 2.41748046875, 2.560302734375, 2.703125, 2.845947265625, 2.98876953125, 3.131591796875, 3.2744140625, 3.417236328125, 3.56005859375, 3.702880859375, 3.845703125, 3.988525390625, 4.13134765625, 4.274169921875, 4.4169921875, 4.559814453125, 4.70263671875, 4.845458984375, 4.98828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 16.0, 24.0, 34.0, 50.0, 79.0, 107.0, 187.0, 325.0, 650.0, 1482.0, 3650.0, 10869.0, 38739.0, 164795.0, 548171.0, 210809.0, 48292.0, 12950.0, 4138.0, 1643.0, 704.0, 325.0, 193.0, 95.0, 66.0, 46.0, 37.0, 19.0, 14.0, 5.0, 5.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.53125, -46.8330078125, -45.134765625, -43.4365234375, -41.73828125, -40.0400390625, -38.341796875, -36.6435546875, -34.9453125, -33.2470703125, -31.548828125, -29.8505859375, -28.15234375, -26.4541015625, -24.755859375, -23.0576171875, -21.359375, -19.6611328125, -17.962890625, -16.2646484375, -14.56640625, -12.8681640625, -11.169921875, -9.4716796875, -7.7734375, -6.0751953125, -4.376953125, -2.6787109375, -0.98046875, 0.7177734375, 2.416015625, 4.1142578125, 5.8125, 7.5107421875, 9.208984375, 10.9072265625, 12.60546875, 14.3037109375, 16.001953125, 17.7001953125, 19.3984375, 21.0966796875, 22.794921875, 24.4931640625, 26.19140625, 27.8896484375, 29.587890625, 31.2861328125, 32.984375, 34.6826171875, 36.380859375, 38.0791015625, 39.77734375, 41.4755859375, 43.173828125, 44.8720703125, 46.5703125, 48.2685546875, 49.966796875, 51.6650390625, 53.36328125, 55.0615234375, 56.759765625, 58.4580078125, 60.15625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 11.0, 12.0, 5.0, 9.0, 13.0, 17.0, 22.0, 30.0, 35.0, 29.0, 32.0, 51.0, 50.0, 51.0, 44.0, 52.0, 52.0, 57.0, 37.0, 44.0, 37.0, 52.0, 39.0, 40.0, 33.0, 28.0, 25.0, 22.0, 15.0, 12.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.413330078125, -22.59228515625, -21.771240234375, -20.9501953125, -20.129150390625, -19.30810546875, -18.487060546875, -17.666015625, -16.844970703125, -16.02392578125, -15.202880859375, -14.3818359375, -13.560791015625, -12.73974609375, -11.918701171875, -11.09765625, -10.276611328125, -9.45556640625, -8.634521484375, -7.8134765625, -6.992431640625, -6.17138671875, -5.350341796875, -4.529296875, -3.708251953125, -2.88720703125, -2.066162109375, -1.2451171875, -0.424072265625, 0.39697265625, 1.218017578125, 2.0390625, 2.860107421875, 3.68115234375, 4.502197265625, 5.3232421875, 6.144287109375, 6.96533203125, 7.786376953125, 8.607421875, 9.428466796875, 10.24951171875, 11.070556640625, 11.8916015625, 12.712646484375, 13.53369140625, 14.354736328125, 15.17578125, 15.996826171875, 16.81787109375, 17.638916015625, 18.4599609375, 19.281005859375, 20.10205078125, 20.923095703125, 21.744140625, 22.565185546875, 23.38623046875, 24.207275390625, 25.0283203125, 25.849365234375, 26.67041015625, 27.491455078125, 28.3125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 1.0, 9.0, 8.0, 8.0, 20.0, 21.0, 30.0, 32.0, 70.0, 98.0, 139.0, 191.0, 375.0, 643.0, 1124.0, 2156.0, 4285.0, 9301.0, 21238.0, 54844.0, 153291.0, 385568.0, 262777.0, 91129.0, 34354.0, 13880.0, 6261.0, 3007.0, 1503.0, 876.0, 496.0, 277.0, 189.0, 123.0, 74.0, 42.0, 35.0, 27.0, 13.0, 15.0, 4.0, 11.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.63037109375, -16.9951171875, -16.35986328125, -15.724609375, -15.08935546875, -14.4541015625, -13.81884765625, -13.18359375, -12.54833984375, -11.9130859375, -11.27783203125, -10.642578125, -10.00732421875, -9.3720703125, -8.73681640625, -8.1015625, -7.46630859375, -6.8310546875, -6.19580078125, -5.560546875, -4.92529296875, -4.2900390625, -3.65478515625, -3.01953125, -2.38427734375, -1.7490234375, -1.11376953125, -0.478515625, 0.15673828125, 0.7919921875, 1.42724609375, 2.0625, 2.69775390625, 3.3330078125, 3.96826171875, 4.603515625, 5.23876953125, 5.8740234375, 6.50927734375, 7.14453125, 7.77978515625, 8.4150390625, 9.05029296875, 9.685546875, 10.32080078125, 10.9560546875, 11.59130859375, 12.2265625, 12.86181640625, 13.4970703125, 14.13232421875, 14.767578125, 15.40283203125, 16.0380859375, 16.67333984375, 17.30859375, 17.94384765625, 18.5791015625, 19.21435546875, 19.849609375, 20.48486328125, 21.1201171875, 21.75537109375, 22.390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 13.0, 12.0, 17.0, 20.0, 37.0, 54.0, 63.0, 94.0, 155.0, 144.0, 124.0, 77.0, 54.0, 43.0, 29.0, 15.0, 8.0, 13.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004970550537109375, -0.004788458347320557, -0.004606366157531738, -0.00442427396774292, -0.0042421817779541016, -0.004060089588165283, -0.003877997398376465, -0.0036959052085876465, -0.003513813018798828, -0.0033317208290100098, -0.0031496286392211914, -0.002967536449432373, -0.0027854442596435547, -0.0026033520698547363, -0.002421259880065918, -0.0022391676902770996, -0.0020570755004882812, -0.0018749833106994629, -0.0016928911209106445, -0.0015107989311218262, -0.0013287067413330078, -0.0011466145515441895, -0.0009645223617553711, -0.0007824301719665527, -0.0006003379821777344, -0.000418245792388916, -0.00023615360260009766, -5.40614128112793e-05, 0.00012803077697753906, 0.0003101229667663574, 0.0004922151565551758, 0.0006743073463439941, 0.0008563995361328125, 0.0010384917259216309, 0.0012205839157104492, 0.0014026761054992676, 0.001584768295288086, 0.0017668604850769043, 0.0019489526748657227, 0.002131044864654541, 0.0023131370544433594, 0.0024952292442321777, 0.002677321434020996, 0.0028594136238098145, 0.003041505813598633, 0.003223598003387451, 0.0034056901931762695, 0.003587782382965088, 0.0037698745727539062, 0.003951966762542725, 0.004134058952331543, 0.004316151142120361, 0.00449824333190918, 0.004680335521697998, 0.004862427711486816, 0.005044519901275635, 0.005226612091064453, 0.0054087042808532715, 0.00559079647064209, 0.005772888660430908, 0.0059549808502197266, 0.006137073040008545, 0.006319165229797363, 0.006501257419586182, 0.006683349609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 12.0, 19.0, 20.0, 40.0, 63.0, 109.0, 212.0, 430.0, 937.0, 2331.0, 7297.0, 28229.0, 161314.0, 673197.0, 138323.0, 25301.0, 6720.0, 2243.0, 872.0, 387.0, 193.0, 100.0, 76.0, 44.0, 23.0, 12.0, 10.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.96875, -35.57177734375, -34.1748046875, -32.77783203125, -31.380859375, -29.98388671875, -28.5869140625, -27.18994140625, -25.79296875, -24.39599609375, -22.9990234375, -21.60205078125, -20.205078125, -18.80810546875, -17.4111328125, -16.01416015625, -14.6171875, -13.22021484375, -11.8232421875, -10.42626953125, -9.029296875, -7.63232421875, -6.2353515625, -4.83837890625, -3.44140625, -2.04443359375, -0.6474609375, 0.74951171875, 2.146484375, 3.54345703125, 4.9404296875, 6.33740234375, 7.734375, 9.13134765625, 10.5283203125, 11.92529296875, 13.322265625, 14.71923828125, 16.1162109375, 17.51318359375, 18.91015625, 20.30712890625, 21.7041015625, 23.10107421875, 24.498046875, 25.89501953125, 27.2919921875, 28.68896484375, 30.0859375, 31.48291015625, 32.8798828125, 34.27685546875, 35.673828125, 37.07080078125, 38.4677734375, 39.86474609375, 41.26171875, 42.65869140625, 44.0556640625, 45.45263671875, 46.849609375, 48.24658203125, 49.6435546875, 51.04052734375, 52.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 3.0, 9.0, 9.0, 7.0, 8.0, 11.0, 12.0, 22.0, 18.0, 28.0, 31.0, 34.0, 42.0, 50.0, 65.0, 62.0, 79.0, 81.0, 64.0, 75.0, 51.0, 43.0, 35.0, 30.0, 23.0, 10.0, 12.0, 14.0, 11.0, 10.0, 11.0, 11.0, 6.0, 9.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.3878173828125, -13.892822265625, -13.3978271484375, -12.90283203125, -12.4078369140625, -11.912841796875, -11.4178466796875, -10.9228515625, -10.4278564453125, -9.932861328125, -9.4378662109375, -8.94287109375, -8.4478759765625, -7.952880859375, -7.4578857421875, -6.962890625, -6.4678955078125, -5.972900390625, -5.4779052734375, -4.98291015625, -4.4879150390625, -3.992919921875, -3.4979248046875, -3.0029296875, -2.5079345703125, -2.012939453125, -1.5179443359375, -1.02294921875, -0.5279541015625, -0.032958984375, 0.4620361328125, 0.95703125, 1.4520263671875, 1.947021484375, 2.4420166015625, 2.93701171875, 3.4320068359375, 3.927001953125, 4.4219970703125, 4.9169921875, 5.4119873046875, 5.906982421875, 6.4019775390625, 6.89697265625, 7.3919677734375, 7.886962890625, 8.3819580078125, 8.876953125, 9.3719482421875, 9.866943359375, 10.3619384765625, 10.85693359375, 11.3519287109375, 11.846923828125, 12.3419189453125, 12.8369140625, 13.3319091796875, 13.826904296875, 14.3218994140625, 14.81689453125, 15.3118896484375, 15.806884765625, 16.3018798828125, 16.796875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 12.0, 18.0, 18.0, 51.0, 68.0, 146.0, 157.0, 182.0, 125.0, 76.0, 62.0, 30.0, 22.0, 8.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-250.466064453125, -239.61849975585938, -228.77093505859375, -217.92335510253906, -207.07579040527344, -196.2282257080078, -185.38064575195312, -174.5330810546875, -163.68551635742188, -152.83795166015625, -141.99038696289062, -131.14280700683594, -120.29524230957031, -109.44767761230469, -98.60010528564453, -87.75253295898438, -76.90496826171875, -66.05740356445312, -55.20983123779297, -44.36226272583008, -33.51469421386719, -22.667125701904297, -11.819557189941406, -0.97198486328125, 9.875579833984375, 20.723148345947266, 31.570716857910156, 42.41828536987305, 53.26585388183594, 64.11341857910156, 74.96099090576172, 85.80856323242188, 96.65609741210938, 107.503662109375, 118.35123443603516, 129.1988067626953, 140.04637145996094, 150.89393615722656, 161.74151611328125, 172.58908081054688, 183.4366455078125, 194.28421020507812, 205.13177490234375, 215.97935485839844, 226.82691955566406, 237.6744842529297, 248.52206420898438, 259.36962890625, 270.2171936035156, 281.06475830078125, 291.9123229980469, 302.7598876953125, 313.60748291015625, 324.4550476074219, 335.3026123046875, 346.1501770019531, 356.99774169921875, 367.8453063964844, 378.69287109375, 389.5404357910156, 400.38800048828125, 411.235595703125, 422.0831604003906, 432.93072509765625, 443.7782897949219]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 10.0, 16.0, 16.0, 9.0, 24.0, 27.0, 29.0, 27.0, 30.0, 30.0, 33.0, 39.0, 35.0, 30.0, 42.0, 54.0, 33.0, 47.0, 40.0, 50.0, 46.0, 28.0, 26.0, 36.0, 34.0, 33.0, 27.0, 14.0, 16.0, 15.0, 10.0, 15.0, 8.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-160.94764709472656, -155.8898468017578, -150.83206176757812, -145.77426147460938, -140.7164764404297, -135.65867614746094, -130.60089111328125, -125.5430908203125, -120.48529815673828, -115.42750549316406, -110.36971282958984, -105.31192016601562, -100.25411987304688, -95.19633483886719, -90.13853454589844, -85.08074188232422, -80.02294921875, -74.96515655517578, -69.90736389160156, -64.84957122802734, -59.79177474975586, -54.73398208618164, -49.676185607910156, -44.61839294433594, -39.56060028076172, -34.5028076171875, -29.44501304626465, -24.387218475341797, -19.329425811767578, -14.27163314819336, -9.213838577270508, -4.156044006347656, 0.9017486572265625, 5.959542274475098, 11.017335891723633, 16.075130462646484, 21.132923126220703, 26.190715789794922, 31.248510360717773, 36.306304931640625, 41.364097595214844, 46.42189025878906, 51.47968292236328, 56.537479400634766, 61.595272064208984, 66.65306091308594, 71.71086120605469, 76.7686538696289, 81.82644653320312, 86.88423919677734, 91.94203186035156, 96.99982452392578, 102.0576171875, 107.11541748046875, 112.17321014404297, 117.23100280761719, 122.2887954711914, 127.34658813476562, 132.40438842773438, 137.46217346191406, 142.5199737548828, 147.5777587890625, 152.63555908203125, 157.693359375, 162.7511444091797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 7.0, 17.0, 26.0, 36.0, 34.0, 77.0, 112.0, 160.0, 244.0, 407.0, 715.0, 1535.0, 3271.0, 7469.0, 19346.0, 61789.0, 353539.0, 3523583.0, 158653.0, 38272.0, 13807.0, 5669.0, 2631.0, 1298.0, 710.0, 356.0, 201.0, 109.0, 55.0, 54.0, 27.0, 16.0, 8.0, 9.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.6875, -63.0419921875, -61.396484375, -59.7509765625, -58.10546875, -56.4599609375, -54.814453125, -53.1689453125, -51.5234375, -49.8779296875, -48.232421875, -46.5869140625, -44.94140625, -43.2958984375, -41.650390625, -40.0048828125, -38.359375, -36.7138671875, -35.068359375, -33.4228515625, -31.77734375, -30.1318359375, -28.486328125, -26.8408203125, -25.1953125, -23.5498046875, -21.904296875, -20.2587890625, -18.61328125, -16.9677734375, -15.322265625, -13.6767578125, -12.03125, -10.3857421875, -8.740234375, -7.0947265625, -5.44921875, -3.8037109375, -2.158203125, -0.5126953125, 1.1328125, 2.7783203125, 4.423828125, 6.0693359375, 7.71484375, 9.3603515625, 11.005859375, 12.6513671875, 14.296875, 15.9423828125, 17.587890625, 19.2333984375, 20.87890625, 22.5244140625, 24.169921875, 25.8154296875, 27.4609375, 29.1064453125, 30.751953125, 32.3974609375, 34.04296875, 35.6884765625, 37.333984375, 38.9794921875, 40.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 10.0, 16.0, 14.0, 21.0, 22.0, 32.0, 36.0, 39.0, 53.0, 46.0, 64.0, 54.0, 72.0, 61.0, 64.0, 60.0, 51.0, 43.0, 41.0, 41.0, 33.0, 26.0, 12.0, 25.0, 13.0, 11.0, 12.0, 3.0, 5.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12109375, -5.9432373046875, -5.765380859375, -5.5875244140625, -5.40966796875, -5.2318115234375, -5.053955078125, -4.8760986328125, -4.6982421875, -4.5203857421875, -4.342529296875, -4.1646728515625, -3.98681640625, -3.8089599609375, -3.631103515625, -3.4532470703125, -3.275390625, -3.0975341796875, -2.919677734375, -2.7418212890625, -2.56396484375, -2.3861083984375, -2.208251953125, -2.0303955078125, -1.8525390625, -1.6746826171875, -1.496826171875, -1.3189697265625, -1.14111328125, -0.9632568359375, -0.785400390625, -0.6075439453125, -0.4296875, -0.2518310546875, -0.073974609375, 0.1038818359375, 0.28173828125, 0.4595947265625, 0.637451171875, 0.8153076171875, 0.9931640625, 1.1710205078125, 1.348876953125, 1.5267333984375, 1.70458984375, 1.8824462890625, 2.060302734375, 2.2381591796875, 2.416015625, 2.5938720703125, 2.771728515625, 2.9495849609375, 3.12744140625, 3.3052978515625, 3.483154296875, 3.6610107421875, 3.8388671875, 4.0167236328125, 4.194580078125, 4.3724365234375, 4.55029296875, 4.7281494140625, 4.906005859375, 5.0838623046875, 5.26171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 13.0, 19.0, 33.0, 34.0, 57.0, 110.0, 158.0, 275.0, 473.0, 825.0, 1521.0, 2989.0, 6576.0, 16666.0, 52132.0, 256378.0, 3425931.0, 337176.0, 60423.0, 18441.0, 7202.0, 3157.0, 1575.0, 826.0, 487.0, 274.0, 183.0, 115.0, 84.0, 50.0, 31.0, 24.0, 14.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.59375, -61.8056640625, -60.017578125, -58.2294921875, -56.44140625, -54.6533203125, -52.865234375, -51.0771484375, -49.2890625, -47.5009765625, -45.712890625, -43.9248046875, -42.13671875, -40.3486328125, -38.560546875, -36.7724609375, -34.984375, -33.1962890625, -31.408203125, -29.6201171875, -27.83203125, -26.0439453125, -24.255859375, -22.4677734375, -20.6796875, -18.8916015625, -17.103515625, -15.3154296875, -13.52734375, -11.7392578125, -9.951171875, -8.1630859375, -6.375, -4.5869140625, -2.798828125, -1.0107421875, 0.77734375, 2.5654296875, 4.353515625, 6.1416015625, 7.9296875, 9.7177734375, 11.505859375, 13.2939453125, 15.08203125, 16.8701171875, 18.658203125, 20.4462890625, 22.234375, 24.0224609375, 25.810546875, 27.5986328125, 29.38671875, 31.1748046875, 32.962890625, 34.7509765625, 36.5390625, 38.3271484375, 40.115234375, 41.9033203125, 43.69140625, 45.4794921875, 47.267578125, 49.0556640625, 50.84375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 4.0, 18.0, 13.0, 19.0, 35.0, 36.0, 62.0, 65.0, 96.0, 156.0, 262.0, 537.0, 1779.0, 363.0, 180.0, 128.0, 64.0, 59.0, 40.0, 33.0, 29.0, 17.0, 14.0, 8.0, 2.0, 6.0, 3.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.8203125, -12.4102783203125, -12.000244140625, -11.5902099609375, -11.18017578125, -10.7701416015625, -10.360107421875, -9.9500732421875, -9.5400390625, -9.1300048828125, -8.719970703125, -8.3099365234375, -7.89990234375, -7.4898681640625, -7.079833984375, -6.6697998046875, -6.259765625, -5.8497314453125, -5.439697265625, -5.0296630859375, -4.61962890625, -4.2095947265625, -3.799560546875, -3.3895263671875, -2.9794921875, -2.5694580078125, -2.159423828125, -1.7493896484375, -1.33935546875, -0.9293212890625, -0.519287109375, -0.1092529296875, 0.30078125, 0.7108154296875, 1.120849609375, 1.5308837890625, 1.94091796875, 2.3509521484375, 2.760986328125, 3.1710205078125, 3.5810546875, 3.9910888671875, 4.401123046875, 4.8111572265625, 5.22119140625, 5.6312255859375, 6.041259765625, 6.4512939453125, 6.861328125, 7.2713623046875, 7.681396484375, 8.0914306640625, 8.50146484375, 8.9114990234375, 9.321533203125, 9.7315673828125, 10.1416015625, 10.5516357421875, 10.961669921875, 11.3717041015625, 11.78173828125, 12.1917724609375, 12.601806640625, 13.0118408203125, 13.421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 18.0, 17.0, 22.0, 41.0, 62.0, 74.0, 156.0, 152.0, 127.0, 106.0, 78.0, 56.0, 29.0, 18.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.20330047607422, -78.2730712890625, -75.34284973144531, -72.41262817382812, -69.4823989868164, -66.55216979980469, -63.6219482421875, -60.69172286987305, -57.761497497558594, -54.83127212524414, -51.90104675292969, -48.970821380615234, -46.04059600830078, -43.11037063598633, -40.180145263671875, -37.24991989135742, -34.31969451904297, -31.389469146728516, -28.459243774414062, -25.52901840209961, -22.598793029785156, -19.668567657470703, -16.73834228515625, -13.808116912841797, -10.877891540527344, -7.947666168212891, -5.0174407958984375, -2.0872154235839844, 0.8430099487304688, 3.773235321044922, 6.703460693359375, 9.633686065673828, 12.563919067382812, 15.494144439697266, 18.42436981201172, 21.354595184326172, 24.284820556640625, 27.215045928955078, 30.14527130126953, 33.075496673583984, 36.00572204589844, 38.93594741821289, 41.866172790527344, 44.7963981628418, 47.72662353515625, 50.6568489074707, 53.587074279785156, 56.51729965209961, 59.44752502441406, 62.377750396728516, 65.30797576904297, 68.23820495605469, 71.16842651367188, 74.09864807128906, 77.02887725830078, 79.9591064453125, 82.88932800292969, 85.81954956054688, 88.7497787475586, 91.68000793457031, 94.6102294921875, 97.54045104980469, 100.4706802368164, 103.40090942382812, 106.33113098144531]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 13.0, 8.0, 25.0, 24.0, 15.0, 36.0, 29.0, 40.0, 36.0, 46.0, 40.0, 39.0, 61.0, 41.0, 52.0, 44.0, 43.0, 38.0, 28.0, 41.0, 36.0, 35.0, 32.0, 29.0, 27.0, 17.0, 16.0, 13.0, 11.0, 7.0, 6.0, 12.0, 6.0, 10.0, 10.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.28271484375, -46.7509880065918, -45.21925735473633, -43.687530517578125, -42.15580368041992, -40.62407684326172, -39.09234619140625, -37.56061935424805, -36.028892517089844, -34.49716567993164, -32.96543502807617, -31.43370819091797, -29.901981353759766, -28.37025260925293, -26.838523864746094, -25.30679702758789, -23.775066375732422, -22.243337631225586, -20.711610794067383, -19.179882049560547, -17.648155212402344, -16.116426467895508, -14.584697723388672, -13.052969932556152, -11.521242141723633, -9.989514350891113, -8.457786560058594, -6.926057815551758, -5.394330024719238, -3.8626022338867188, -2.330873489379883, -0.7991456985473633, 0.7325820922851562, 2.264310121536255, 3.7960381507873535, 5.327766418457031, 6.859494209289551, 8.39122200012207, 9.922950744628906, 11.454678535461426, 12.986406326293945, 14.518134117126465, 16.049861907958984, 17.58159065246582, 19.113319396972656, 20.64504623413086, 22.176774978637695, 23.70850372314453, 25.240230560302734, 26.77195930480957, 28.303686141967773, 29.83541488647461, 31.367141723632812, 32.89887237548828, 34.430599212646484, 35.96232604980469, 37.494056701660156, 39.02578353881836, 40.55751419067383, 42.08924102783203, 43.620967864990234, 45.15269470214844, 46.684425354003906, 48.21615219116211, 49.74787902832031]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 11.0, 18.0, 14.0, 31.0, 26.0, 68.0, 72.0, 131.0, 186.0, 287.0, 396.0, 638.0, 1040.0, 1880.0, 3269.0, 5772.0, 11059.0, 22474.0, 46201.0, 98852.0, 211631.0, 311793.0, 173689.0, 81114.0, 38038.0, 18613.0, 9357.0, 4999.0, 2746.0, 1683.0, 955.0, 573.0, 302.0, 220.0, 123.0, 111.0, 62.0, 38.0, 17.0, 18.0, 10.0, 8.0, 8.0, 5.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-25.921875, -25.14501953125, -24.3681640625, -23.59130859375, -22.814453125, -22.03759765625, -21.2607421875, -20.48388671875, -19.70703125, -18.93017578125, -18.1533203125, -17.37646484375, -16.599609375, -15.82275390625, -15.0458984375, -14.26904296875, -13.4921875, -12.71533203125, -11.9384765625, -11.16162109375, -10.384765625, -9.60791015625, -8.8310546875, -8.05419921875, -7.27734375, -6.50048828125, -5.7236328125, -4.94677734375, -4.169921875, -3.39306640625, -2.6162109375, -1.83935546875, -1.0625, -0.28564453125, 0.4912109375, 1.26806640625, 2.044921875, 2.82177734375, 3.5986328125, 4.37548828125, 5.15234375, 5.92919921875, 6.7060546875, 7.48291015625, 8.259765625, 9.03662109375, 9.8134765625, 10.59033203125, 11.3671875, 12.14404296875, 12.9208984375, 13.69775390625, 14.474609375, 15.25146484375, 16.0283203125, 16.80517578125, 17.58203125, 18.35888671875, 19.1357421875, 19.91259765625, 20.689453125, 21.46630859375, 22.2431640625, 23.02001953125, 23.796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 12.0, 18.0, 30.0, 25.0, 29.0, 26.0, 43.0, 43.0, 45.0, 62.0, 67.0, 60.0, 65.0, 55.0, 42.0, 53.0, 48.0, 50.0, 46.0, 25.0, 29.0, 22.0, 18.0, 15.0, 10.0, 5.0, 5.0, 13.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.56817626953125, -5.3863525390625, -5.20452880859375, -5.022705078125, -4.84088134765625, -4.6590576171875, -4.47723388671875, -4.29541015625, -4.11358642578125, -3.9317626953125, -3.74993896484375, -3.568115234375, -3.38629150390625, -3.2044677734375, -3.02264404296875, -2.8408203125, -2.65899658203125, -2.4771728515625, -2.29534912109375, -2.113525390625, -1.93170166015625, -1.7498779296875, -1.56805419921875, -1.38623046875, -1.20440673828125, -1.0225830078125, -0.84075927734375, -0.658935546875, -0.47711181640625, -0.2952880859375, -0.11346435546875, 0.068359375, 0.25018310546875, 0.4320068359375, 0.61383056640625, 0.795654296875, 0.97747802734375, 1.1593017578125, 1.34112548828125, 1.52294921875, 1.70477294921875, 1.8865966796875, 2.06842041015625, 2.250244140625, 2.43206787109375, 2.6138916015625, 2.79571533203125, 2.9775390625, 3.15936279296875, 3.3411865234375, 3.52301025390625, 3.704833984375, 3.88665771484375, 4.0684814453125, 4.25030517578125, 4.43212890625, 4.61395263671875, 4.7957763671875, 4.97760009765625, 5.159423828125, 5.34124755859375, 5.5230712890625, 5.70489501953125, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 21.0, 20.0, 23.0, 34.0, 66.0, 116.0, 159.0, 280.0, 468.0, 914.0, 1515.0, 3059.0, 6371.0, 14825.0, 36784.0, 104342.0, 317935.0, 365965.0, 121827.0, 42519.0, 16689.0, 7309.0, 3364.0, 1673.0, 872.0, 524.0, 312.0, 176.0, 128.0, 92.0, 47.0, 31.0, 23.0, 15.0, 13.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.6875, -37.614990234375, -36.54248046875, -35.469970703125, -34.3974609375, -33.324951171875, -32.25244140625, -31.179931640625, -30.107421875, -29.034912109375, -27.96240234375, -26.889892578125, -25.8173828125, -24.744873046875, -23.67236328125, -22.599853515625, -21.52734375, -20.454833984375, -19.38232421875, -18.309814453125, -17.2373046875, -16.164794921875, -15.09228515625, -14.019775390625, -12.947265625, -11.874755859375, -10.80224609375, -9.729736328125, -8.6572265625, -7.584716796875, -6.51220703125, -5.439697265625, -4.3671875, -3.294677734375, -2.22216796875, -1.149658203125, -0.0771484375, 0.995361328125, 2.06787109375, 3.140380859375, 4.212890625, 5.285400390625, 6.35791015625, 7.430419921875, 8.5029296875, 9.575439453125, 10.64794921875, 11.720458984375, 12.79296875, 13.865478515625, 14.93798828125, 16.010498046875, 17.0830078125, 18.155517578125, 19.22802734375, 20.300537109375, 21.373046875, 22.445556640625, 23.51806640625, 24.590576171875, 25.6630859375, 26.735595703125, 27.80810546875, 28.880615234375, 29.953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 9.0, 5.0, 12.0, 2.0, 3.0, 16.0, 23.0, 21.0, 21.0, 31.0, 42.0, 45.0, 38.0, 65.0, 54.0, 65.0, 57.0, 40.0, 54.0, 51.0, 49.0, 52.0, 40.0, 26.0, 33.0, 22.0, 24.0, 18.0, 13.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.21875, -32.24267578125, -31.2666015625, -30.29052734375, -29.314453125, -28.33837890625, -27.3623046875, -26.38623046875, -25.41015625, -24.43408203125, -23.4580078125, -22.48193359375, -21.505859375, -20.52978515625, -19.5537109375, -18.57763671875, -17.6015625, -16.62548828125, -15.6494140625, -14.67333984375, -13.697265625, -12.72119140625, -11.7451171875, -10.76904296875, -9.79296875, -8.81689453125, -7.8408203125, -6.86474609375, -5.888671875, -4.91259765625, -3.9365234375, -2.96044921875, -1.984375, -1.00830078125, -0.0322265625, 0.94384765625, 1.919921875, 2.89599609375, 3.8720703125, 4.84814453125, 5.82421875, 6.80029296875, 7.7763671875, 8.75244140625, 9.728515625, 10.70458984375, 11.6806640625, 12.65673828125, 13.6328125, 14.60888671875, 15.5849609375, 16.56103515625, 17.537109375, 18.51318359375, 19.4892578125, 20.46533203125, 21.44140625, 22.41748046875, 23.3935546875, 24.36962890625, 25.345703125, 26.32177734375, 27.2978515625, 28.27392578125, 29.25]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 16.0, 13.0, 13.0, 22.0, 28.0, 46.0, 59.0, 90.0, 138.0, 198.0, 250.0, 486.0, 873.0, 1454.0, 2792.0, 5890.0, 14037.0, 39795.0, 139089.0, 444961.0, 282633.0, 74082.0, 23604.0, 9098.0, 4021.0, 2019.0, 1082.0, 623.0, 349.0, 230.0, 158.0, 98.0, 96.0, 55.0, 43.0, 32.0, 21.0, 18.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0], "bins": [-16.828125, -16.314453125, -15.80078125, -15.287109375, -14.7734375, -14.259765625, -13.74609375, -13.232421875, -12.71875, -12.205078125, -11.69140625, -11.177734375, -10.6640625, -10.150390625, -9.63671875, -9.123046875, -8.609375, -8.095703125, -7.58203125, -7.068359375, -6.5546875, -6.041015625, -5.52734375, -5.013671875, -4.5, -3.986328125, -3.47265625, -2.958984375, -2.4453125, -1.931640625, -1.41796875, -0.904296875, -0.390625, 0.123046875, 0.63671875, 1.150390625, 1.6640625, 2.177734375, 2.69140625, 3.205078125, 3.71875, 4.232421875, 4.74609375, 5.259765625, 5.7734375, 6.287109375, 6.80078125, 7.314453125, 7.828125, 8.341796875, 8.85546875, 9.369140625, 9.8828125, 10.396484375, 10.91015625, 11.423828125, 11.9375, 12.451171875, 12.96484375, 13.478515625, 13.9921875, 14.505859375, 15.01953125, 15.533203125, 16.046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 0.0, 5.0, 6.0, 7.0, 7.0, 6.0, 19.0, 13.0, 21.0, 33.0, 39.0, 67.0, 111.0, 111.0, 125.0, 104.0, 98.0, 66.0, 42.0, 34.0, 20.0, 18.0, 10.0, 9.0, 6.0, 4.0, 1.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030345916748046875, -0.002905339002609253, -0.0027760863304138184, -0.002646833658218384, -0.0025175809860229492, -0.0023883283138275146, -0.00225907564163208, -0.0021298229694366455, -0.002000570297241211, -0.0018713176250457764, -0.0017420649528503418, -0.0016128122806549072, -0.0014835596084594727, -0.001354306936264038, -0.0012250542640686035, -0.001095801591873169, -0.0009665489196777344, -0.0008372962474822998, -0.0007080435752868652, -0.0005787909030914307, -0.0004495382308959961, -0.0003202855587005615, -0.00019103288650512695, -6.178021430969238e-05, 6.747245788574219e-05, 0.00019672513008117676, 0.00032597780227661133, 0.0004552304744720459, 0.0005844831466674805, 0.000713735818862915, 0.0008429884910583496, 0.0009722411632537842, 0.0011014938354492188, 0.0012307465076446533, 0.0013599991798400879, 0.0014892518520355225, 0.001618504524230957, 0.0017477571964263916, 0.0018770098686218262, 0.0020062625408172607, 0.0021355152130126953, 0.00226476788520813, 0.0023940205574035645, 0.002523273229598999, 0.0026525259017944336, 0.002781778573989868, 0.0029110312461853027, 0.0030402839183807373, 0.003169536590576172, 0.0032987892627716064, 0.003428041934967041, 0.0035572946071624756, 0.00368654727935791, 0.0038157999515533447, 0.003945052623748779, 0.004074305295944214, 0.0042035579681396484, 0.004332810640335083, 0.004462063312530518, 0.004591315984725952, 0.004720568656921387, 0.004849821329116821, 0.004979074001312256, 0.00510832667350769, 0.005237579345703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 3.0, 11.0, 13.0, 15.0, 18.0, 32.0, 29.0, 41.0, 63.0, 97.0, 148.0, 219.0, 304.0, 566.0, 895.0, 1642.0, 3455.0, 8130.0, 24018.0, 96368.0, 453432.0, 353777.0, 72707.0, 19234.0, 6634.0, 2914.0, 1514.0, 822.0, 513.0, 280.0, 212.0, 115.0, 94.0, 62.0, 56.0, 39.0, 15.0, 12.0, 10.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.24951171875, -16.6083984375, -15.96728515625, -15.326171875, -14.68505859375, -14.0439453125, -13.40283203125, -12.76171875, -12.12060546875, -11.4794921875, -10.83837890625, -10.197265625, -9.55615234375, -8.9150390625, -8.27392578125, -7.6328125, -6.99169921875, -6.3505859375, -5.70947265625, -5.068359375, -4.42724609375, -3.7861328125, -3.14501953125, -2.50390625, -1.86279296875, -1.2216796875, -0.58056640625, 0.060546875, 0.70166015625, 1.3427734375, 1.98388671875, 2.625, 3.26611328125, 3.9072265625, 4.54833984375, 5.189453125, 5.83056640625, 6.4716796875, 7.11279296875, 7.75390625, 8.39501953125, 9.0361328125, 9.67724609375, 10.318359375, 10.95947265625, 11.6005859375, 12.24169921875, 12.8828125, 13.52392578125, 14.1650390625, 14.80615234375, 15.447265625, 16.08837890625, 16.7294921875, 17.37060546875, 18.01171875, 18.65283203125, 19.2939453125, 19.93505859375, 20.576171875, 21.21728515625, 21.8583984375, 22.49951171875, 23.140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 4.0, 15.0, 29.0, 36.0, 42.0, 63.0, 101.0, 119.0, 128.0, 113.0, 107.0, 85.0, 45.0, 29.0, 21.0, 17.0, 13.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.90087890625, -15.2548828125, -14.60888671875, -13.962890625, -13.31689453125, -12.6708984375, -12.02490234375, -11.37890625, -10.73291015625, -10.0869140625, -9.44091796875, -8.794921875, -8.14892578125, -7.5029296875, -6.85693359375, -6.2109375, -5.56494140625, -4.9189453125, -4.27294921875, -3.626953125, -2.98095703125, -2.3349609375, -1.68896484375, -1.04296875, -0.39697265625, 0.2490234375, 0.89501953125, 1.541015625, 2.18701171875, 2.8330078125, 3.47900390625, 4.125, 4.77099609375, 5.4169921875, 6.06298828125, 6.708984375, 7.35498046875, 8.0009765625, 8.64697265625, 9.29296875, 9.93896484375, 10.5849609375, 11.23095703125, 11.876953125, 12.52294921875, 13.1689453125, 13.81494140625, 14.4609375, 15.10693359375, 15.7529296875, 16.39892578125, 17.044921875, 17.69091796875, 18.3369140625, 18.98291015625, 19.62890625, 20.27490234375, 20.9208984375, 21.56689453125, 22.212890625, 22.85888671875, 23.5048828125, 24.15087890625, 24.796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 26.0, 49.0, 125.0, 311.0, 293.0, 134.0, 40.0, 21.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.3655700683594, -411.714111328125, -391.0626220703125, -370.4111328125, -349.7596740722656, -329.10821533203125, -308.45672607421875, -287.80523681640625, -267.1537780761719, -246.50230407714844, -225.850830078125, -205.19935607910156, -184.54788208007812, -163.8964080810547, -143.24493408203125, -122.59346008300781, -101.94198608398438, -81.29051208496094, -60.6390380859375, -39.98756408691406, -19.336090087890625, 1.3153839111328125, 21.96685791015625, 42.61833190917969, 63.269805908203125, 83.92127990722656, 104.57275390625, 125.22422790527344, 145.87570190429688, 166.5271759033203, 187.17864990234375, 207.8301239013672, 228.4815673828125, 249.13304138183594, 269.7845153808594, 290.43597412109375, 311.08746337890625, 331.73895263671875, 352.3904113769531, 373.0418701171875, 393.693359375, 414.3448486328125, 434.9963073730469, 455.64776611328125, 476.29925537109375, 496.95074462890625, 517.6021728515625, 538.253662109375, 558.9051513671875, 579.556640625, 600.2081298828125, 620.8595581054688, 641.5110473632812, 662.1625366210938, 682.81396484375, 703.4654541015625, 724.116943359375, 744.7684326171875, 765.419921875, 786.0713500976562, 806.7228393554688, 827.3743286132812, 848.0257568359375, 868.67724609375, 889.3287353515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 1.0, 7.0, 14.0, 8.0, 10.0, 18.0, 22.0, 38.0, 44.0, 43.0, 45.0, 51.0, 58.0, 72.0, 66.0, 69.0, 49.0, 64.0, 40.0, 54.0, 36.0, 40.0, 33.0, 18.0, 25.0, 19.0, 16.0, 12.0, 9.0, 4.0, 11.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.98704528808594, -127.05823516845703, -120.12942504882812, -113.20062255859375, -106.27181243896484, -99.34300231933594, -92.41419982910156, -85.48538970947266, -78.55657958984375, -71.62776947021484, -64.69895935058594, -57.77015686035156, -50.841346740722656, -43.91253662109375, -36.98373031616211, -30.05492401123047, -23.126113891601562, -16.19730567932129, -9.268497467041016, -2.339689254760742, 4.589118957519531, 11.517929077148438, 18.446735382080078, 25.37554168701172, 32.304351806640625, 39.23316192626953, 46.16196823120117, 53.09077453613281, 60.01958465576172, 66.94839477539062, 73.877197265625, 80.8060073852539, 87.73483276367188, 94.66364288330078, 101.59245300292969, 108.52125549316406, 115.45006561279297, 122.37887573242188, 129.30767822265625, 136.23648071289062, 143.16529846191406, 150.09410095214844, 157.02291870117188, 163.95172119140625, 170.88052368164062, 177.80934143066406, 184.73814392089844, 191.66696166992188, 198.59576416015625, 205.52456665039062, 212.45338439941406, 219.38218688964844, 226.31100463867188, 233.23980712890625, 240.16860961914062, 247.097412109375, 254.02622985839844, 260.9550476074219, 267.88385009765625, 274.8126525878906, 281.741455078125, 288.6702880859375, 295.5990905761719, 302.52789306640625, 309.4566955566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 13.0, 9.0, 8.0, 16.0, 30.0, 56.0, 39.0, 48.0, 99.0, 153.0, 229.0, 360.0, 586.0, 962.0, 1797.0, 3294.0, 6100.0, 12796.0, 29957.0, 94175.0, 2820837.0, 1077015.0, 89594.0, 29348.0, 12570.0, 6040.0, 3262.0, 1889.0, 1058.0, 637.0, 420.0, 289.0, 168.0, 128.0, 90.0, 56.0, 44.0, 24.0, 20.0, 18.0, 13.0, 7.0, 4.0, 9.0, 2.0, 4.0], "bins": [-46.53125, -45.337646484375, -44.14404296875, -42.950439453125, -41.7568359375, -40.563232421875, -39.36962890625, -38.176025390625, -36.982421875, -35.788818359375, -34.59521484375, -33.401611328125, -32.2080078125, -31.014404296875, -29.82080078125, -28.627197265625, -27.43359375, -26.239990234375, -25.04638671875, -23.852783203125, -22.6591796875, -21.465576171875, -20.27197265625, -19.078369140625, -17.884765625, -16.691162109375, -15.49755859375, -14.303955078125, -13.1103515625, -11.916748046875, -10.72314453125, -9.529541015625, -8.3359375, -7.142333984375, -5.94873046875, -4.755126953125, -3.5615234375, -2.367919921875, -1.17431640625, 0.019287109375, 1.212890625, 2.406494140625, 3.60009765625, 4.793701171875, 5.9873046875, 7.180908203125, 8.37451171875, 9.568115234375, 10.76171875, 11.955322265625, 13.14892578125, 14.342529296875, 15.5361328125, 16.729736328125, 17.92333984375, 19.116943359375, 20.310546875, 21.504150390625, 22.69775390625, 23.891357421875, 25.0849609375, 26.278564453125, 27.47216796875, 28.665771484375, 29.859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 11.0, 11.0, 25.0, 28.0, 30.0, 54.0, 46.0, 61.0, 62.0, 82.0, 82.0, 86.0, 69.0, 63.0, 65.0, 50.0, 50.0, 33.0, 25.0, 19.0, 11.0, 7.0, 10.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.678955078125, -6.41259765625, -6.146240234375, -5.8798828125, -5.613525390625, -5.34716796875, -5.080810546875, -4.814453125, -4.548095703125, -4.28173828125, -4.015380859375, -3.7490234375, -3.482666015625, -3.21630859375, -2.949951171875, -2.68359375, -2.417236328125, -2.15087890625, -1.884521484375, -1.6181640625, -1.351806640625, -1.08544921875, -0.819091796875, -0.552734375, -0.286376953125, -0.02001953125, 0.246337890625, 0.5126953125, 0.779052734375, 1.04541015625, 1.311767578125, 1.578125, 1.844482421875, 2.11083984375, 2.377197265625, 2.6435546875, 2.909912109375, 3.17626953125, 3.442626953125, 3.708984375, 3.975341796875, 4.24169921875, 4.508056640625, 4.7744140625, 5.040771484375, 5.30712890625, 5.573486328125, 5.83984375, 6.106201171875, 6.37255859375, 6.638916015625, 6.9052734375, 7.171630859375, 7.43798828125, 7.704345703125, 7.970703125, 8.237060546875, 8.50341796875, 8.769775390625, 9.0361328125, 9.302490234375, 9.56884765625, 9.835205078125, 10.1015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 4.0, 12.0, 13.0, 7.0, 15.0, 36.0, 46.0, 60.0, 102.0, 142.0, 217.0, 386.0, 625.0, 1217.0, 2132.0, 4372.0, 9660.0, 22993.0, 67920.0, 319793.0, 3439845.0, 233334.0, 55379.0, 19674.0, 8271.0, 3716.0, 1841.0, 1009.0, 509.0, 306.0, 202.0, 141.0, 90.0, 55.0, 47.0, 34.0, 25.0, 19.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.96875, -45.52001953125, -44.0712890625, -42.62255859375, -41.173828125, -39.72509765625, -38.2763671875, -36.82763671875, -35.37890625, -33.93017578125, -32.4814453125, -31.03271484375, -29.583984375, -28.13525390625, -26.6865234375, -25.23779296875, -23.7890625, -22.34033203125, -20.8916015625, -19.44287109375, -17.994140625, -16.54541015625, -15.0966796875, -13.64794921875, -12.19921875, -10.75048828125, -9.3017578125, -7.85302734375, -6.404296875, -4.95556640625, -3.5068359375, -2.05810546875, -0.609375, 0.83935546875, 2.2880859375, 3.73681640625, 5.185546875, 6.63427734375, 8.0830078125, 9.53173828125, 10.98046875, 12.42919921875, 13.8779296875, 15.32666015625, 16.775390625, 18.22412109375, 19.6728515625, 21.12158203125, 22.5703125, 24.01904296875, 25.4677734375, 26.91650390625, 28.365234375, 29.81396484375, 31.2626953125, 32.71142578125, 34.16015625, 35.60888671875, 37.0576171875, 38.50634765625, 39.955078125, 41.40380859375, 42.8525390625, 44.30126953125, 45.75]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 4.0, 3.0, 5.0, 10.0, 12.0, 13.0, 16.0, 21.0, 33.0, 49.0, 76.0, 98.0, 168.0, 343.0, 2202.0, 470.0, 194.0, 106.0, 71.0, 54.0, 35.0, 23.0, 20.0, 12.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4375, -14.94921875, -14.4609375, -13.97265625, -13.484375, -12.99609375, -12.5078125, -12.01953125, -11.53125, -11.04296875, -10.5546875, -10.06640625, -9.578125, -9.08984375, -8.6015625, -8.11328125, -7.625, -7.13671875, -6.6484375, -6.16015625, -5.671875, -5.18359375, -4.6953125, -4.20703125, -3.71875, -3.23046875, -2.7421875, -2.25390625, -1.765625, -1.27734375, -0.7890625, -0.30078125, 0.1875, 0.67578125, 1.1640625, 1.65234375, 2.140625, 2.62890625, 3.1171875, 3.60546875, 4.09375, 4.58203125, 5.0703125, 5.55859375, 6.046875, 6.53515625, 7.0234375, 7.51171875, 8.0, 8.48828125, 8.9765625, 9.46484375, 9.953125, 10.44140625, 10.9296875, 11.41796875, 11.90625, 12.39453125, 12.8828125, 13.37109375, 13.859375, 14.34765625, 14.8359375, 15.32421875, 15.8125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 17.0, 29.0, 52.0, 83.0, 105.0, 144.0, 154.0, 140.0, 94.0, 69.0, 45.0, 10.0, 20.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-96.26805114746094, -93.10364532470703, -89.9392318725586, -86.77482604980469, -83.61042022705078, -80.44601440429688, -77.28160095214844, -74.11719512939453, -70.95278930664062, -67.78838348388672, -64.62397003173828, -61.459564208984375, -58.29515838623047, -55.1307487487793, -51.966339111328125, -48.80193328857422, -45.63751983642578, -42.47311019897461, -39.3087043762207, -36.14429473876953, -32.979888916015625, -29.815479278564453, -26.65106964111328, -23.486661911010742, -20.322254180908203, -17.157846450805664, -13.993437767028809, -10.829029083251953, -7.664621353149414, -4.500213623046875, -1.3358039855957031, 1.828603744506836, 4.993019104003906, 8.157426834106445, 11.3218355178833, 14.486244201660156, 17.650651931762695, 20.815059661865234, 23.979469299316406, 27.143877029418945, 30.308284759521484, 33.472694396972656, 36.63710021972656, 39.801509857177734, 42.965919494628906, 46.13032531738281, 49.294734954833984, 52.459144592285156, 55.62355041503906, 58.787960052490234, 61.95236587524414, 65.11677551269531, 68.28118133544922, 71.44558715820312, 74.61000061035156, 77.77440643310547, 80.93881225585938, 84.10321807861328, 87.26763153076172, 90.43203735351562, 93.59644317626953, 96.76084899902344, 99.92526245117188, 103.08966827392578, 106.25408172607422]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 10.0, 6.0, 16.0, 10.0, 15.0, 19.0, 12.0, 28.0, 37.0, 30.0, 33.0, 44.0, 44.0, 52.0, 57.0, 63.0, 50.0, 65.0, 58.0, 43.0, 51.0, 50.0, 44.0, 32.0, 24.0, 35.0, 13.0, 20.0, 17.0, 9.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.17987060546875, -60.27134704589844, -58.36282730102539, -56.45430374145508, -54.545780181884766, -52.63726043701172, -50.728736877441406, -48.820213317871094, -46.91168975830078, -45.00316619873047, -43.09464645385742, -41.18612289428711, -39.2775993347168, -37.36907958984375, -35.46055603027344, -33.552032470703125, -31.643512725830078, -29.7349910736084, -27.826467514038086, -25.917945861816406, -24.009422302246094, -22.100900650024414, -20.192378997802734, -18.283855438232422, -16.375333786010742, -14.466811180114746, -12.55828857421875, -10.64976692199707, -8.741244316101074, -6.832721710205078, -4.924200057983398, -3.0156774520874023, -1.1071548461914062, 0.8013675212860107, 2.7098898887634277, 4.618412017822266, 6.526934623718262, 8.435457229614258, 10.343978881835938, 12.252501487731934, 14.16102409362793, 16.06954574584961, 17.978069305419922, 19.8865909576416, 21.79511260986328, 23.703636169433594, 25.612157821655273, 27.520679473876953, 29.429203033447266, 31.337724685668945, 33.246246337890625, 35.15476989746094, 37.06329345703125, 38.97181701660156, 40.88033676147461, 42.78886032104492, 44.69738006591797, 46.60590362548828, 48.51442337036133, 50.42294692993164, 52.33147048950195, 54.239990234375, 56.14851379394531, 58.057037353515625, 59.96556091308594]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 24.0, 34.0, 35.0, 56.0, 86.0, 119.0, 207.0, 282.0, 462.0, 762.0, 1261.0, 2208.0, 3913.0, 7131.0, 13323.0, 26350.0, 54431.0, 113010.0, 240900.0, 295633.0, 147638.0, 69736.0, 33691.0, 16960.0, 8930.0, 4622.0, 2736.0, 1549.0, 922.0, 510.0, 365.0, 202.0, 165.0, 97.0, 51.0, 40.0, 34.0, 16.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.265625, -23.433837890625, -22.60205078125, -21.770263671875, -20.9384765625, -20.106689453125, -19.27490234375, -18.443115234375, -17.611328125, -16.779541015625, -15.94775390625, -15.115966796875, -14.2841796875, -13.452392578125, -12.62060546875, -11.788818359375, -10.95703125, -10.125244140625, -9.29345703125, -8.461669921875, -7.6298828125, -6.798095703125, -5.96630859375, -5.134521484375, -4.302734375, -3.470947265625, -2.63916015625, -1.807373046875, -0.9755859375, -0.143798828125, 0.68798828125, 1.519775390625, 2.3515625, 3.183349609375, 4.01513671875, 4.846923828125, 5.6787109375, 6.510498046875, 7.34228515625, 8.174072265625, 9.005859375, 9.837646484375, 10.66943359375, 11.501220703125, 12.3330078125, 13.164794921875, 13.99658203125, 14.828369140625, 15.66015625, 16.491943359375, 17.32373046875, 18.155517578125, 18.9873046875, 19.819091796875, 20.65087890625, 21.482666015625, 22.314453125, 23.146240234375, 23.97802734375, 24.809814453125, 25.6416015625, 26.473388671875, 27.30517578125, 28.136962890625, 28.96875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 8.0, 6.0, 17.0, 18.0, 16.0, 22.0, 35.0, 36.0, 34.0, 33.0, 42.0, 43.0, 52.0, 51.0, 46.0, 52.0, 50.0, 47.0, 51.0, 52.0, 45.0, 39.0, 34.0, 28.0, 29.0, 18.0, 19.0, 16.0, 9.0, 9.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.48828125, -6.29949951171875, -6.1107177734375, -5.92193603515625, -5.733154296875, -5.54437255859375, -5.3555908203125, -5.16680908203125, -4.97802734375, -4.78924560546875, -4.6004638671875, -4.41168212890625, -4.222900390625, -4.03411865234375, -3.8453369140625, -3.65655517578125, -3.4677734375, -3.27899169921875, -3.0902099609375, -2.90142822265625, -2.712646484375, -2.52386474609375, -2.3350830078125, -2.14630126953125, -1.95751953125, -1.76873779296875, -1.5799560546875, -1.39117431640625, -1.202392578125, -1.01361083984375, -0.8248291015625, -0.63604736328125, -0.447265625, -0.25848388671875, -0.0697021484375, 0.11907958984375, 0.307861328125, 0.49664306640625, 0.6854248046875, 0.87420654296875, 1.06298828125, 1.25177001953125, 1.4405517578125, 1.62933349609375, 1.818115234375, 2.00689697265625, 2.1956787109375, 2.38446044921875, 2.5732421875, 2.76202392578125, 2.9508056640625, 3.13958740234375, 3.328369140625, 3.51715087890625, 3.7059326171875, 3.89471435546875, 4.08349609375, 4.27227783203125, 4.4610595703125, 4.64984130859375, 4.838623046875, 5.02740478515625, 5.2161865234375, 5.40496826171875, 5.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 7.0, 12.0, 25.0, 18.0, 42.0, 53.0, 80.0, 99.0, 151.0, 278.0, 413.0, 659.0, 1155.0, 2141.0, 4237.0, 9061.0, 21225.0, 52775.0, 148034.0, 384038.0, 266972.0, 93917.0, 34946.0, 14701.0, 6347.0, 3151.0, 1620.0, 910.0, 524.0, 325.0, 219.0, 126.0, 92.0, 64.0, 49.0, 18.0, 22.0, 17.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.09375, -30.145263671875, -29.19677734375, -28.248291015625, -27.2998046875, -26.351318359375, -25.40283203125, -24.454345703125, -23.505859375, -22.557373046875, -21.60888671875, -20.660400390625, -19.7119140625, -18.763427734375, -17.81494140625, -16.866455078125, -15.91796875, -14.969482421875, -14.02099609375, -13.072509765625, -12.1240234375, -11.175537109375, -10.22705078125, -9.278564453125, -8.330078125, -7.381591796875, -6.43310546875, -5.484619140625, -4.5361328125, -3.587646484375, -2.63916015625, -1.690673828125, -0.7421875, 0.206298828125, 1.15478515625, 2.103271484375, 3.0517578125, 4.000244140625, 4.94873046875, 5.897216796875, 6.845703125, 7.794189453125, 8.74267578125, 9.691162109375, 10.6396484375, 11.588134765625, 12.53662109375, 13.485107421875, 14.43359375, 15.382080078125, 16.33056640625, 17.279052734375, 18.2275390625, 19.176025390625, 20.12451171875, 21.072998046875, 22.021484375, 22.969970703125, 23.91845703125, 24.866943359375, 25.8154296875, 26.763916015625, 27.71240234375, 28.660888671875, 29.609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 3.0, 11.0, 10.0, 16.0, 8.0, 17.0, 31.0, 24.0, 25.0, 29.0, 26.0, 48.0, 38.0, 56.0, 51.0, 65.0, 49.0, 47.0, 64.0, 65.0, 38.0, 47.0, 36.0, 41.0, 33.0, 21.0, 23.0, 24.0, 20.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.386474609375, -31.39794921875, -30.409423828125, -29.4208984375, -28.432373046875, -27.44384765625, -26.455322265625, -25.466796875, -24.478271484375, -23.48974609375, -22.501220703125, -21.5126953125, -20.524169921875, -19.53564453125, -18.547119140625, -17.55859375, -16.570068359375, -15.58154296875, -14.593017578125, -13.6044921875, -12.615966796875, -11.62744140625, -10.638916015625, -9.650390625, -8.661865234375, -7.67333984375, -6.684814453125, -5.6962890625, -4.707763671875, -3.71923828125, -2.730712890625, -1.7421875, -0.753662109375, 0.23486328125, 1.223388671875, 2.2119140625, 3.200439453125, 4.18896484375, 5.177490234375, 6.166015625, 7.154541015625, 8.14306640625, 9.131591796875, 10.1201171875, 11.108642578125, 12.09716796875, 13.085693359375, 14.07421875, 15.062744140625, 16.05126953125, 17.039794921875, 18.0283203125, 19.016845703125, 20.00537109375, 20.993896484375, 21.982421875, 22.970947265625, 23.95947265625, 24.947998046875, 25.9365234375, 26.925048828125, 27.91357421875, 28.902099609375, 29.890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 26.0, 34.0, 52.0, 69.0, 104.0, 187.0, 354.0, 490.0, 888.0, 1655.0, 3198.0, 7489.0, 22159.0, 116825.0, 647692.0, 198656.0, 30890.0, 9331.0, 4007.0, 1897.0, 1025.0, 564.0, 336.0, 221.0, 136.0, 85.0, 55.0, 36.0, 22.0, 18.0, 8.0, 9.0, 8.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.203125, -26.39404296875, -25.5849609375, -24.77587890625, -23.966796875, -23.15771484375, -22.3486328125, -21.53955078125, -20.73046875, -19.92138671875, -19.1123046875, -18.30322265625, -17.494140625, -16.68505859375, -15.8759765625, -15.06689453125, -14.2578125, -13.44873046875, -12.6396484375, -11.83056640625, -11.021484375, -10.21240234375, -9.4033203125, -8.59423828125, -7.78515625, -6.97607421875, -6.1669921875, -5.35791015625, -4.548828125, -3.73974609375, -2.9306640625, -2.12158203125, -1.3125, -0.50341796875, 0.3056640625, 1.11474609375, 1.923828125, 2.73291015625, 3.5419921875, 4.35107421875, 5.16015625, 5.96923828125, 6.7783203125, 7.58740234375, 8.396484375, 9.20556640625, 10.0146484375, 10.82373046875, 11.6328125, 12.44189453125, 13.2509765625, 14.06005859375, 14.869140625, 15.67822265625, 16.4873046875, 17.29638671875, 18.10546875, 18.91455078125, 19.7236328125, 20.53271484375, 21.341796875, 22.15087890625, 22.9599609375, 23.76904296875, 24.578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 11.0, 21.0, 39.0, 60.0, 140.0, 235.0, 204.0, 90.0, 61.0, 40.0, 18.0, 7.0, 12.0, 9.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007381439208984375, -0.00712507963180542, -0.006868720054626465, -0.00661236047744751, -0.006356000900268555, -0.0060996413230896, -0.0058432817459106445, -0.0055869221687316895, -0.005330562591552734, -0.005074203014373779, -0.004817843437194824, -0.004561483860015869, -0.004305124282836914, -0.004048764705657959, -0.003792405128479004, -0.003536045551300049, -0.0032796859741210938, -0.0030233263969421387, -0.0027669668197631836, -0.0025106072425842285, -0.0022542476654052734, -0.0019978880882263184, -0.0017415285110473633, -0.0014851689338684082, -0.0012288093566894531, -0.000972449779510498, -0.000716090202331543, -0.0004597306251525879, -0.0002033710479736328, 5.2988529205322266e-05, 0.00030934810638427734, 0.0005657076835632324, 0.0008220672607421875, 0.0010784268379211426, 0.0013347864151000977, 0.0015911459922790527, 0.0018475055694580078, 0.002103865146636963, 0.002360224723815918, 0.002616584300994873, 0.002872943878173828, 0.003129303455352783, 0.0033856630325317383, 0.0036420226097106934, 0.0038983821868896484, 0.0041547417640686035, 0.004411101341247559, 0.004667460918426514, 0.004923820495605469, 0.005180180072784424, 0.005436539649963379, 0.005692899227142334, 0.005949258804321289, 0.006205618381500244, 0.006461977958679199, 0.006718337535858154, 0.006974697113037109, 0.0072310566902160645, 0.0074874162673950195, 0.007743775844573975, 0.00800013542175293, 0.008256494998931885, 0.00851285457611084, 0.008769214153289795, 0.00902557373046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 11.0, 11.0, 16.0, 24.0, 23.0, 42.0, 68.0, 105.0, 154.0, 208.0, 345.0, 525.0, 919.0, 1603.0, 3137.0, 6666.0, 17359.0, 74089.0, 564272.0, 312702.0, 43067.0, 12141.0, 5102.0, 2544.0, 1271.0, 805.0, 445.0, 286.0, 193.0, 127.0, 91.0, 50.0, 44.0, 34.0, 17.0, 15.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.046875, -25.228759765625, -24.41064453125, -23.592529296875, -22.7744140625, -21.956298828125, -21.13818359375, -20.320068359375, -19.501953125, -18.683837890625, -17.86572265625, -17.047607421875, -16.2294921875, -15.411376953125, -14.59326171875, -13.775146484375, -12.95703125, -12.138916015625, -11.32080078125, -10.502685546875, -9.6845703125, -8.866455078125, -8.04833984375, -7.230224609375, -6.412109375, -5.593994140625, -4.77587890625, -3.957763671875, -3.1396484375, -2.321533203125, -1.50341796875, -0.685302734375, 0.1328125, 0.950927734375, 1.76904296875, 2.587158203125, 3.4052734375, 4.223388671875, 5.04150390625, 5.859619140625, 6.677734375, 7.495849609375, 8.31396484375, 9.132080078125, 9.9501953125, 10.768310546875, 11.58642578125, 12.404541015625, 13.22265625, 14.040771484375, 14.85888671875, 15.677001953125, 16.4951171875, 17.313232421875, 18.13134765625, 18.949462890625, 19.767578125, 20.585693359375, 21.40380859375, 22.221923828125, 23.0400390625, 23.858154296875, 24.67626953125, 25.494384765625, 26.3125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 2.0, 6.0, 6.0, 6.0, 17.0, 11.0, 39.0, 60.0, 60.0, 100.0, 131.0, 147.0, 126.0, 99.0, 53.0, 50.0, 23.0, 19.0, 10.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.96875, -24.279296875, -23.58984375, -22.900390625, -22.2109375, -21.521484375, -20.83203125, -20.142578125, -19.453125, -18.763671875, -18.07421875, -17.384765625, -16.6953125, -16.005859375, -15.31640625, -14.626953125, -13.9375, -13.248046875, -12.55859375, -11.869140625, -11.1796875, -10.490234375, -9.80078125, -9.111328125, -8.421875, -7.732421875, -7.04296875, -6.353515625, -5.6640625, -4.974609375, -4.28515625, -3.595703125, -2.90625, -2.216796875, -1.52734375, -0.837890625, -0.1484375, 0.541015625, 1.23046875, 1.919921875, 2.609375, 3.298828125, 3.98828125, 4.677734375, 5.3671875, 6.056640625, 6.74609375, 7.435546875, 8.125, 8.814453125, 9.50390625, 10.193359375, 10.8828125, 11.572265625, 12.26171875, 12.951171875, 13.640625, 14.330078125, 15.01953125, 15.708984375, 16.3984375, 17.087890625, 17.77734375, 18.466796875, 19.15625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 15.0, 24.0, 86.0, 172.0, 295.0, 228.0, 110.0, 35.0, 22.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-733.7855224609375, -717.6943969726562, -701.603271484375, -685.5120849609375, -669.4209594726562, -653.329833984375, -637.2387084960938, -621.1475830078125, -605.056396484375, -588.9652709960938, -572.8741455078125, -556.782958984375, -540.6918334960938, -524.6007080078125, -508.50958251953125, -492.4184265136719, -476.3273010253906, -460.2361755371094, -444.14501953125, -428.05389404296875, -411.9627380371094, -395.8716125488281, -379.78045654296875, -363.6893310546875, -347.59820556640625, -331.507080078125, -315.4159240722656, -299.3247985839844, -283.233642578125, -267.14251708984375, -251.05137634277344, -234.96023559570312, -218.86907958984375, -202.77793884277344, -186.68679809570312, -170.59567260742188, -154.5045166015625, -138.41339111328125, -122.32225036621094, -106.23110961914062, -90.13996887207031, -74.048828125, -57.95769119262695, -41.866554260253906, -25.775413513183594, -9.684272766113281, 6.4068603515625, 22.498001098632812, 38.589141845703125, 54.68028259277344, 70.77142333984375, 86.86255645751953, 102.95369720458984, 119.04483795166016, 135.13597106933594, 151.22711181640625, 167.31825256347656, 183.40939331054688, 199.5005340576172, 215.5916748046875, 231.68280029296875, 247.77395629882812, 263.8650817871094, 279.95623779296875, 296.04736328125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 5.0, 16.0, 8.0, 18.0, 20.0, 28.0, 28.0, 19.0, 22.0, 29.0, 40.0, 46.0, 41.0, 43.0, 44.0, 34.0, 34.0, 37.0, 42.0, 45.0, 49.0, 35.0, 33.0, 27.0, 26.0, 30.0, 20.0, 24.0, 21.0, 15.0, 8.0, 15.0, 15.0, 11.0, 14.0, 7.0, 0.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-136.99783325195312, -132.920654296875, -128.84347534179688, -124.76631164550781, -120.68913269042969, -116.61195373535156, -112.53478240966797, -108.45761108398438, -104.38043212890625, -100.30325317382812, -96.22608184814453, -92.14891052246094, -88.07173156738281, -83.99455261230469, -79.9173812866211, -75.8402099609375, -71.76303100585938, -67.68585205078125, -63.608680725097656, -59.5315055847168, -55.45433044433594, -51.37715530395508, -47.29998016357422, -43.22280502319336, -39.1456298828125, -35.06845474243164, -30.99127960205078, -26.914104461669922, -22.836929321289062, -18.759754180908203, -14.682579040527344, -10.605403900146484, -6.528221130371094, -2.4510459899902344, 1.626129150390625, 5.703304290771484, 9.780479431152344, 13.857654571533203, 17.934829711914062, 22.012004852294922, 26.08917999267578, 30.16635513305664, 34.2435302734375, 38.32070541381836, 42.39788055419922, 46.47505569458008, 50.55223083496094, 54.6294059753418, 58.706581115722656, 62.783756256103516, 66.86093139648438, 70.9381103515625, 75.0152816772461, 79.09245300292969, 83.16963195800781, 87.24681091308594, 91.32398223876953, 95.40115356445312, 99.47833251953125, 103.55551147460938, 107.63268280029297, 111.70985412597656, 115.78703308105469, 119.86421203613281, 123.9413833618164]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 20.0, 33.0, 45.0, 53.0, 82.0, 211.0, 344.0, 609.0, 1177.0, 2760.0, 6638.0, 17387.0, 55073.0, 287098.0, 3556693.0, 197355.0, 44065.0, 14474.0, 5596.0, 2320.0, 1056.0, 513.0, 282.0, 149.0, 85.0, 40.0, 20.0, 24.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.53125, -52.01953125, -50.5078125, -48.99609375, -47.484375, -45.97265625, -44.4609375, -42.94921875, -41.4375, -39.92578125, -38.4140625, -36.90234375, -35.390625, -33.87890625, -32.3671875, -30.85546875, -29.34375, -27.83203125, -26.3203125, -24.80859375, -23.296875, -21.78515625, -20.2734375, -18.76171875, -17.25, -15.73828125, -14.2265625, -12.71484375, -11.203125, -9.69140625, -8.1796875, -6.66796875, -5.15625, -3.64453125, -2.1328125, -0.62109375, 0.890625, 2.40234375, 3.9140625, 5.42578125, 6.9375, 8.44921875, 9.9609375, 11.47265625, 12.984375, 14.49609375, 16.0078125, 17.51953125, 19.03125, 20.54296875, 22.0546875, 23.56640625, 25.078125, 26.58984375, 28.1015625, 29.61328125, 31.125, 32.63671875, 34.1484375, 35.66015625, 37.171875, 38.68359375, 40.1953125, 41.70703125, 43.21875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 9.0, 16.0, 17.0, 21.0, 25.0, 37.0, 34.0, 32.0, 53.0, 53.0, 51.0, 51.0, 70.0, 58.0, 57.0, 56.0, 55.0, 51.0, 45.0, 33.0, 36.0, 29.0, 15.0, 17.0, 13.0, 14.0, 4.0, 6.0, 3.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.45703125, -7.24420166015625, -7.0313720703125, -6.81854248046875, -6.605712890625, -6.39288330078125, -6.1800537109375, -5.96722412109375, -5.75439453125, -5.54156494140625, -5.3287353515625, -5.11590576171875, -4.903076171875, -4.69024658203125, -4.4774169921875, -4.26458740234375, -4.0517578125, -3.83892822265625, -3.6260986328125, -3.41326904296875, -3.200439453125, -2.98760986328125, -2.7747802734375, -2.56195068359375, -2.34912109375, -2.13629150390625, -1.9234619140625, -1.71063232421875, -1.497802734375, -1.28497314453125, -1.0721435546875, -0.85931396484375, -0.646484375, -0.43365478515625, -0.2208251953125, -0.00799560546875, 0.204833984375, 0.41766357421875, 0.6304931640625, 0.84332275390625, 1.05615234375, 1.26898193359375, 1.4818115234375, 1.69464111328125, 1.907470703125, 2.12030029296875, 2.3331298828125, 2.54595947265625, 2.7587890625, 2.97161865234375, 3.1844482421875, 3.39727783203125, 3.610107421875, 3.82293701171875, 4.0357666015625, 4.24859619140625, 4.46142578125, 4.67425537109375, 4.8870849609375, 5.09991455078125, 5.312744140625, 5.52557373046875, 5.7384033203125, 5.95123291015625, 6.1640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 4.0, 7.0, 10.0, 8.0, 28.0, 26.0, 56.0, 49.0, 101.0, 112.0, 169.0, 259.0, 426.0, 649.0, 1035.0, 1796.0, 3025.0, 5376.0, 10109.0, 20782.0, 47356.0, 128416.0, 526775.0, 2957008.0, 322767.0, 93674.0, 36664.0, 17035.0, 8596.0, 4657.0, 2700.0, 1647.0, 969.0, 640.0, 400.0, 311.0, 181.0, 124.0, 100.0, 66.0, 46.0, 39.0, 18.0, 20.0, 11.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-29.46875, -28.529052734375, -27.58935546875, -26.649658203125, -25.7099609375, -24.770263671875, -23.83056640625, -22.890869140625, -21.951171875, -21.011474609375, -20.07177734375, -19.132080078125, -18.1923828125, -17.252685546875, -16.31298828125, -15.373291015625, -14.43359375, -13.493896484375, -12.55419921875, -11.614501953125, -10.6748046875, -9.735107421875, -8.79541015625, -7.855712890625, -6.916015625, -5.976318359375, -5.03662109375, -4.096923828125, -3.1572265625, -2.217529296875, -1.27783203125, -0.338134765625, 0.6015625, 1.541259765625, 2.48095703125, 3.420654296875, 4.3603515625, 5.300048828125, 6.23974609375, 7.179443359375, 8.119140625, 9.058837890625, 9.99853515625, 10.938232421875, 11.8779296875, 12.817626953125, 13.75732421875, 14.697021484375, 15.63671875, 16.576416015625, 17.51611328125, 18.455810546875, 19.3955078125, 20.335205078125, 21.27490234375, 22.214599609375, 23.154296875, 24.093994140625, 25.03369140625, 25.973388671875, 26.9130859375, 27.852783203125, 28.79248046875, 29.732177734375, 30.671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 9.0, 21.0, 16.0, 19.0, 49.0, 47.0, 90.0, 86.0, 135.0, 200.0, 313.0, 1102.0, 999.0, 312.0, 178.0, 130.0, 77.0, 58.0, 32.0, 30.0, 31.0, 19.0, 15.0, 15.0, 13.0, 6.0, 6.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1484375, -12.6785888671875, -12.208740234375, -11.7388916015625, -11.26904296875, -10.7991943359375, -10.329345703125, -9.8594970703125, -9.3896484375, -8.9197998046875, -8.449951171875, -7.9801025390625, -7.51025390625, -7.0404052734375, -6.570556640625, -6.1007080078125, -5.630859375, -5.1610107421875, -4.691162109375, -4.2213134765625, -3.75146484375, -3.2816162109375, -2.811767578125, -2.3419189453125, -1.8720703125, -1.4022216796875, -0.932373046875, -0.4625244140625, 0.00732421875, 0.4771728515625, 0.947021484375, 1.4168701171875, 1.88671875, 2.3565673828125, 2.826416015625, 3.2962646484375, 3.76611328125, 4.2359619140625, 4.705810546875, 5.1756591796875, 5.6455078125, 6.1153564453125, 6.585205078125, 7.0550537109375, 7.52490234375, 7.9947509765625, 8.464599609375, 8.9344482421875, 9.404296875, 9.8741455078125, 10.343994140625, 10.8138427734375, 11.28369140625, 11.7535400390625, 12.223388671875, 12.6932373046875, 13.1630859375, 13.6329345703125, 14.102783203125, 14.5726318359375, 15.04248046875, 15.5123291015625, 15.982177734375, 16.4520263671875, 16.921875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 7.0, 7.0, 15.0, 24.0, 48.0, 62.0, 100.0, 146.0, 183.0, 138.0, 101.0, 67.0, 41.0, 29.0, 16.0, 12.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.6975555419922, -159.95765686035156, -155.2177734375, -150.47787475585938, -145.73797607421875, -140.99807739257812, -136.2581787109375, -131.51829528808594, -126.77839660644531, -122.03849792480469, -117.2986068725586, -112.5587158203125, -107.81881713867188, -103.07891845703125, -98.33902740478516, -93.59913635253906, -88.85923767089844, -84.11933898925781, -79.37944793701172, -74.63955688476562, -69.899658203125, -65.15975952148438, -60.41986846923828, -55.67997360229492, -50.94007873535156, -46.2001838684082, -41.460289001464844, -36.720394134521484, -31.980499267578125, -27.240604400634766, -22.500709533691406, -17.760814666748047, -13.020904541015625, -8.281009674072266, -3.5411148071289062, 1.1987800598144531, 5.9386749267578125, 10.678569793701172, 15.418464660644531, 20.15835952758789, 24.89825439453125, 29.63814926147461, 34.37804412841797, 39.11793899536133, 43.85783386230469, 48.59772872924805, 53.337623596191406, 58.077518463134766, 62.817413330078125, 67.55731201171875, 72.29720306396484, 77.03709411621094, 81.77699279785156, 86.51689147949219, 91.25678253173828, 95.99667358398438, 100.736572265625, 105.47647094726562, 110.21636199951172, 114.95625305175781, 119.69615173339844, 124.43605041503906, 129.17593383789062, 133.91583251953125, 138.65573120117188]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 6.0, 10.0, 14.0, 7.0, 12.0, 14.0, 11.0, 19.0, 22.0, 18.0, 20.0, 26.0, 31.0, 26.0, 33.0, 34.0, 39.0, 40.0, 43.0, 41.0, 40.0, 36.0, 46.0, 39.0, 38.0, 27.0, 34.0, 29.0, 31.0, 32.0, 24.0, 19.0, 25.0, 7.0, 15.0, 18.0, 9.0, 13.0, 9.0, 13.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-53.023902893066406, -51.3731689453125, -49.722434997558594, -48.07170104980469, -46.42096710205078, -44.770233154296875, -43.11949920654297, -41.46876525878906, -39.818031311035156, -38.16729736328125, -36.516563415527344, -34.86582946777344, -33.21509552001953, -31.564361572265625, -29.91362953186035, -28.262895584106445, -26.612163543701172, -24.961429595947266, -23.31069564819336, -21.659961700439453, -20.009227752685547, -18.35849380493164, -16.707761764526367, -15.057027816772461, -13.406293869018555, -11.755559921264648, -10.104825973510742, -8.454092979431152, -6.803359031677246, -5.15262508392334, -3.50189208984375, -1.8511581420898438, -0.2004241943359375, 1.4503095149993896, 3.101043224334717, 4.751776695251465, 6.402510643005371, 8.053244590759277, 9.703977584838867, 11.354711532592773, 13.00544548034668, 14.656179428100586, 16.306913375854492, 17.957645416259766, 19.608379364013672, 21.259113311767578, 22.909847259521484, 24.56058120727539, 26.211315155029297, 27.862049102783203, 29.51278305053711, 31.163516998291016, 32.81425094604492, 34.46498489379883, 36.11571502685547, 37.766448974609375, 39.41718292236328, 41.06791687011719, 42.718650817871094, 44.369384765625, 46.020118713378906, 47.67085266113281, 49.32158660888672, 50.972320556640625, 52.62305450439453]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 18.0, 16.0, 20.0, 45.0, 51.0, 100.0, 150.0, 239.0, 472.0, 875.0, 1992.0, 4451.0, 11528.0, 32583.0, 103283.0, 377490.0, 364283.0, 99754.0, 31566.0, 11278.0, 4400.0, 1939.0, 934.0, 451.0, 243.0, 134.0, 83.0, 62.0, 40.0, 22.0, 17.0, 14.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.56005859375, -48.0576171875, -46.55517578125, -45.052734375, -43.55029296875, -42.0478515625, -40.54541015625, -39.04296875, -37.54052734375, -36.0380859375, -34.53564453125, -33.033203125, -31.53076171875, -30.0283203125, -28.52587890625, -27.0234375, -25.52099609375, -24.0185546875, -22.51611328125, -21.013671875, -19.51123046875, -18.0087890625, -16.50634765625, -15.00390625, -13.50146484375, -11.9990234375, -10.49658203125, -8.994140625, -7.49169921875, -5.9892578125, -4.48681640625, -2.984375, -1.48193359375, 0.0205078125, 1.52294921875, 3.025390625, 4.52783203125, 6.0302734375, 7.53271484375, 9.03515625, 10.53759765625, 12.0400390625, 13.54248046875, 15.044921875, 16.54736328125, 18.0498046875, 19.55224609375, 21.0546875, 22.55712890625, 24.0595703125, 25.56201171875, 27.064453125, 28.56689453125, 30.0693359375, 31.57177734375, 33.07421875, 34.57666015625, 36.0791015625, 37.58154296875, 39.083984375, 40.58642578125, 42.0888671875, 43.59130859375, 45.09375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 10.0, 12.0, 15.0, 17.0, 12.0, 25.0, 24.0, 34.0, 42.0, 35.0, 42.0, 35.0, 50.0, 62.0, 49.0, 55.0, 62.0, 53.0, 52.0, 43.0, 45.0, 45.0, 30.0, 24.0, 25.0, 15.0, 16.0, 13.0, 11.0, 5.0, 9.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.02734375, -5.82806396484375, -5.6287841796875, -5.42950439453125, -5.230224609375, -5.03094482421875, -4.8316650390625, -4.63238525390625, -4.43310546875, -4.23382568359375, -4.0345458984375, -3.83526611328125, -3.635986328125, -3.43670654296875, -3.2374267578125, -3.03814697265625, -2.8388671875, -2.63958740234375, -2.4403076171875, -2.24102783203125, -2.041748046875, -1.84246826171875, -1.6431884765625, -1.44390869140625, -1.24462890625, -1.04534912109375, -0.8460693359375, -0.64678955078125, -0.447509765625, -0.24822998046875, -0.0489501953125, 0.15032958984375, 0.349609375, 0.54888916015625, 0.7481689453125, 0.94744873046875, 1.146728515625, 1.34600830078125, 1.5452880859375, 1.74456787109375, 1.94384765625, 2.14312744140625, 2.3424072265625, 2.54168701171875, 2.740966796875, 2.94024658203125, 3.1395263671875, 3.33880615234375, 3.5380859375, 3.73736572265625, 3.9366455078125, 4.13592529296875, 4.335205078125, 4.53448486328125, 4.7337646484375, 4.93304443359375, 5.13232421875, 5.33160400390625, 5.5308837890625, 5.73016357421875, 5.929443359375, 6.12872314453125, 6.3280029296875, 6.52728271484375, 6.7265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 11.0, 11.0, 18.0, 27.0, 39.0, 68.0, 86.0, 157.0, 246.0, 444.0, 778.0, 1293.0, 2520.0, 5012.0, 11777.0, 30295.0, 85781.0, 274777.0, 423919.0, 134443.0, 45696.0, 16878.0, 7022.0, 3297.0, 1684.0, 914.0, 537.0, 302.0, 175.0, 133.0, 65.0, 43.0, 30.0, 25.0, 13.0, 18.0, 6.0, 5.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.125, -30.98583984375, -29.8466796875, -28.70751953125, -27.568359375, -26.42919921875, -25.2900390625, -24.15087890625, -23.01171875, -21.87255859375, -20.7333984375, -19.59423828125, -18.455078125, -17.31591796875, -16.1767578125, -15.03759765625, -13.8984375, -12.75927734375, -11.6201171875, -10.48095703125, -9.341796875, -8.20263671875, -7.0634765625, -5.92431640625, -4.78515625, -3.64599609375, -2.5068359375, -1.36767578125, -0.228515625, 0.91064453125, 2.0498046875, 3.18896484375, 4.328125, 5.46728515625, 6.6064453125, 7.74560546875, 8.884765625, 10.02392578125, 11.1630859375, 12.30224609375, 13.44140625, 14.58056640625, 15.7197265625, 16.85888671875, 17.998046875, 19.13720703125, 20.2763671875, 21.41552734375, 22.5546875, 23.69384765625, 24.8330078125, 25.97216796875, 27.111328125, 28.25048828125, 29.3896484375, 30.52880859375, 31.66796875, 32.80712890625, 33.9462890625, 35.08544921875, 36.224609375, 37.36376953125, 38.5029296875, 39.64208984375, 40.78125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 5.0, 15.0, 12.0, 20.0, 23.0, 21.0, 27.0, 34.0, 39.0, 40.0, 48.0, 38.0, 64.0, 43.0, 64.0, 59.0, 58.0, 57.0, 35.0, 42.0, 35.0, 29.0, 30.0, 29.0, 25.0, 19.0, 23.0, 9.0, 11.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.15625, -28.10595703125, -27.0556640625, -26.00537109375, -24.955078125, -23.90478515625, -22.8544921875, -21.80419921875, -20.75390625, -19.70361328125, -18.6533203125, -17.60302734375, -16.552734375, -15.50244140625, -14.4521484375, -13.40185546875, -12.3515625, -11.30126953125, -10.2509765625, -9.20068359375, -8.150390625, -7.10009765625, -6.0498046875, -4.99951171875, -3.94921875, -2.89892578125, -1.8486328125, -0.79833984375, 0.251953125, 1.30224609375, 2.3525390625, 3.40283203125, 4.453125, 5.50341796875, 6.5537109375, 7.60400390625, 8.654296875, 9.70458984375, 10.7548828125, 11.80517578125, 12.85546875, 13.90576171875, 14.9560546875, 16.00634765625, 17.056640625, 18.10693359375, 19.1572265625, 20.20751953125, 21.2578125, 22.30810546875, 23.3583984375, 24.40869140625, 25.458984375, 26.50927734375, 27.5595703125, 28.60986328125, 29.66015625, 30.71044921875, 31.7607421875, 32.81103515625, 33.861328125, 34.91162109375, 35.9619140625, 37.01220703125, 38.0625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 15.0, 28.0, 45.0, 76.0, 95.0, 171.0, 326.0, 594.0, 1271.0, 2672.0, 6970.0, 26457.0, 216110.0, 685800.0, 84330.0, 14701.0, 4837.0, 1957.0, 948.0, 495.0, 262.0, 138.0, 86.0, 59.0, 44.0, 10.0, 12.0, 14.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.390625, -30.387939453125, -29.38525390625, -28.382568359375, -27.3798828125, -26.377197265625, -25.37451171875, -24.371826171875, -23.369140625, -22.366455078125, -21.36376953125, -20.361083984375, -19.3583984375, -18.355712890625, -17.35302734375, -16.350341796875, -15.34765625, -14.344970703125, -13.34228515625, -12.339599609375, -11.3369140625, -10.334228515625, -9.33154296875, -8.328857421875, -7.326171875, -6.323486328125, -5.32080078125, -4.318115234375, -3.3154296875, -2.312744140625, -1.31005859375, -0.307373046875, 0.6953125, 1.697998046875, 2.70068359375, 3.703369140625, 4.7060546875, 5.708740234375, 6.71142578125, 7.714111328125, 8.716796875, 9.719482421875, 10.72216796875, 11.724853515625, 12.7275390625, 13.730224609375, 14.73291015625, 15.735595703125, 16.73828125, 17.740966796875, 18.74365234375, 19.746337890625, 20.7490234375, 21.751708984375, 22.75439453125, 23.757080078125, 24.759765625, 25.762451171875, 26.76513671875, 27.767822265625, 28.7705078125, 29.773193359375, 30.77587890625, 31.778564453125, 32.78125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 20.0, 30.0, 73.0, 165.0, 293.0, 226.0, 82.0, 39.0, 14.0, 13.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01534271240234375, -0.014990806579589844, -0.014638900756835938, -0.014286994934082031, -0.013935089111328125, -0.013583183288574219, -0.013231277465820312, -0.012879371643066406, -0.0125274658203125, -0.012175559997558594, -0.011823654174804688, -0.011471748352050781, -0.011119842529296875, -0.010767936706542969, -0.010416030883789062, -0.010064125061035156, -0.00971221923828125, -0.009360313415527344, -0.009008407592773438, -0.008656501770019531, -0.008304595947265625, -0.007952690124511719, -0.0076007843017578125, -0.007248878479003906, -0.00689697265625, -0.006545066833496094, -0.0061931610107421875, -0.005841255187988281, -0.005489349365234375, -0.005137443542480469, -0.0047855377197265625, -0.004433631896972656, -0.00408172607421875, -0.0037298202514648438, -0.0033779144287109375, -0.0030260086059570312, -0.002674102783203125, -0.0023221969604492188, -0.0019702911376953125, -0.0016183853149414062, -0.0012664794921875, -0.0009145736694335938, -0.0005626678466796875, -0.00021076202392578125, 0.000141143798828125, 0.0004930496215820312, 0.0008449554443359375, 0.0011968612670898438, 0.00154876708984375, 0.0019006729125976562, 0.0022525787353515625, 0.0026044845581054688, 0.002956390380859375, 0.0033082962036132812, 0.0036602020263671875, 0.004012107849121094, 0.004364013671875, 0.004715919494628906, 0.0050678253173828125, 0.005419731140136719, 0.005771636962890625, 0.006123542785644531, 0.0064754486083984375, 0.006827354431152344, 0.00717926025390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 7.0, 10.0, 8.0, 18.0, 26.0, 29.0, 32.0, 66.0, 96.0, 219.0, 483.0, 1273.0, 4264.0, 18873.0, 207185.0, 753871.0, 49893.0, 8553.0, 2228.0, 759.0, 293.0, 133.0, 84.0, 47.0, 31.0, 16.0, 21.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0830078125, -37.791015625, -36.4990234375, -35.20703125, -33.9150390625, -32.623046875, -31.3310546875, -30.0390625, -28.7470703125, -27.455078125, -26.1630859375, -24.87109375, -23.5791015625, -22.287109375, -20.9951171875, -19.703125, -18.4111328125, -17.119140625, -15.8271484375, -14.53515625, -13.2431640625, -11.951171875, -10.6591796875, -9.3671875, -8.0751953125, -6.783203125, -5.4912109375, -4.19921875, -2.9072265625, -1.615234375, -0.3232421875, 0.96875, 2.2607421875, 3.552734375, 4.8447265625, 6.13671875, 7.4287109375, 8.720703125, 10.0126953125, 11.3046875, 12.5966796875, 13.888671875, 15.1806640625, 16.47265625, 17.7646484375, 19.056640625, 20.3486328125, 21.640625, 22.9326171875, 24.224609375, 25.5166015625, 26.80859375, 28.1005859375, 29.392578125, 30.6845703125, 31.9765625, 33.2685546875, 34.560546875, 35.8525390625, 37.14453125, 38.4365234375, 39.728515625, 41.0205078125, 42.3125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 12.0, 15.0, 28.0, 38.0, 84.0, 139.0, 147.0, 182.0, 128.0, 69.0, 59.0, 29.0, 14.0, 18.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.1529541015625, -12.376220703125, -11.5994873046875, -10.82275390625, -10.0460205078125, -9.269287109375, -8.4925537109375, -7.7158203125, -6.9390869140625, -6.162353515625, -5.3856201171875, -4.60888671875, -3.8321533203125, -3.055419921875, -2.2786865234375, -1.501953125, -0.7252197265625, 0.051513671875, 0.8282470703125, 1.60498046875, 2.3817138671875, 3.158447265625, 3.9351806640625, 4.7119140625, 5.4886474609375, 6.265380859375, 7.0421142578125, 7.81884765625, 8.5955810546875, 9.372314453125, 10.1490478515625, 10.92578125, 11.7025146484375, 12.479248046875, 13.2559814453125, 14.03271484375, 14.8094482421875, 15.586181640625, 16.3629150390625, 17.1396484375, 17.9163818359375, 18.693115234375, 19.4698486328125, 20.24658203125, 21.0233154296875, 21.800048828125, 22.5767822265625, 23.353515625, 24.1302490234375, 24.906982421875, 25.6837158203125, 26.46044921875, 27.2371826171875, 28.013916015625, 28.7906494140625, 29.5673828125, 30.3441162109375, 31.120849609375, 31.8975830078125, 32.67431640625, 33.4510498046875, 34.227783203125, 35.0045166015625, 35.78125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 10.0, 8.0, 16.0, 34.0, 43.0, 55.0, 71.0, 94.0, 113.0, 138.0, 103.0, 88.0, 76.0, 50.0, 24.0, 18.0, 18.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.0894775390625, -247.854736328125, -239.6199951171875, -231.38525390625, -223.15049743652344, -214.91575622558594, -206.68101501464844, -198.44627380371094, -190.21151733398438, -181.97677612304688, -173.74203491210938, -165.50729370117188, -157.2725372314453, -149.0377960205078, -140.8030548095703, -132.5683135986328, -124.33357238769531, -116.09883117675781, -107.86408233642578, -99.62934112548828, -91.39459228515625, -83.15985107421875, -74.92510986328125, -66.69036865234375, -58.45561981201172, -50.22087478637695, -41.98612976074219, -33.75138854980469, -25.516643524169922, -17.281898498535156, -9.047157287597656, -0.8124122619628906, 7.422332763671875, 15.657076835632324, 23.891820907592773, 32.126564025878906, 40.36130905151367, 48.59605407714844, 56.83079528808594, 65.06553649902344, 73.30028533935547, 81.53502655029297, 89.769775390625, 98.0045166015625, 106.2392578125, 114.47400665283203, 122.70874786376953, 130.94349670410156, 139.17823791503906, 147.41297912597656, 155.64772033691406, 163.88247680664062, 172.11721801757812, 180.35195922851562, 188.58670043945312, 196.82144165039062, 205.05618286132812, 213.29092407226562, 221.52566528320312, 229.76040649414062, 237.9951629638672, 246.2299041748047, 254.4646453857422, 262.69940185546875, 270.93414306640625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 5.0, 5.0, 13.0, 10.0, 10.0, 17.0, 12.0, 19.0, 22.0, 26.0, 30.0, 23.0, 23.0, 35.0, 26.0, 34.0, 38.0, 43.0, 48.0, 46.0, 39.0, 42.0, 40.0, 41.0, 30.0, 43.0, 29.0, 27.0, 45.0, 21.0, 21.0, 15.0, 20.0, 15.0, 15.0, 13.0, 18.0, 5.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.3483428955078, -152.33303833007812, -147.31773376464844, -142.3024139404297, -137.287109375, -132.2718048095703, -127.25650024414062, -122.24119567871094, -117.22588348388672, -112.21057891845703, -107.19526672363281, -102.17996215820312, -97.16465759277344, -92.14934539794922, -87.13404083251953, -82.11872863769531, -77.10342407226562, -72.08811950683594, -67.07280731201172, -62.05750274658203, -57.04219436645508, -52.026885986328125, -47.01158142089844, -41.996273040771484, -36.98096466064453, -31.965656280517578, -26.950349807739258, -21.935043334960938, -16.919734954833984, -11.904426574707031, -6.889120101928711, -1.8738136291503906, 3.1414947509765625, 8.1568021774292, 13.172109603881836, 18.187416076660156, 23.20272445678711, 28.218032836914062, 33.23333740234375, 38.2486457824707, 43.263954162597656, 48.27926254272461, 53.29457092285156, 58.30987548828125, 63.3251838684082, 68.34049224853516, 73.35579681396484, 78.37110900878906, 83.38641357421875, 88.40171813964844, 93.41703033447266, 98.43233489990234, 103.44764709472656, 108.46295166015625, 113.47825622558594, 118.49356079101562, 123.50887298583984, 128.52418518066406, 133.53948974609375, 138.55479431152344, 143.57009887695312, 148.58541870117188, 153.60072326660156, 158.61602783203125, 163.63133239746094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 8.0, 9.0, 7.0, 13.0, 11.0, 19.0, 31.0, 36.0, 50.0, 63.0, 90.0, 127.0, 200.0, 297.0, 451.0, 627.0, 1018.0, 1594.0, 2755.0, 4804.0, 9020.0, 18885.0, 47462.0, 182228.0, 3613362.0, 215585.0, 52137.0, 20819.0, 9798.0, 5069.0, 2837.0, 1707.0, 1064.0, 676.0, 420.0, 292.0, 216.0, 158.0, 97.0, 72.0, 42.0, 42.0, 27.0, 17.0, 6.0, 14.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.15625, -36.98388671875, -35.8115234375, -34.63916015625, -33.466796875, -32.29443359375, -31.1220703125, -29.94970703125, -28.77734375, -27.60498046875, -26.4326171875, -25.26025390625, -24.087890625, -22.91552734375, -21.7431640625, -20.57080078125, -19.3984375, -18.22607421875, -17.0537109375, -15.88134765625, -14.708984375, -13.53662109375, -12.3642578125, -11.19189453125, -10.01953125, -8.84716796875, -7.6748046875, -6.50244140625, -5.330078125, -4.15771484375, -2.9853515625, -1.81298828125, -0.640625, 0.53173828125, 1.7041015625, 2.87646484375, 4.048828125, 5.22119140625, 6.3935546875, 7.56591796875, 8.73828125, 9.91064453125, 11.0830078125, 12.25537109375, 13.427734375, 14.60009765625, 15.7724609375, 16.94482421875, 18.1171875, 19.28955078125, 20.4619140625, 21.63427734375, 22.806640625, 23.97900390625, 25.1513671875, 26.32373046875, 27.49609375, 28.66845703125, 29.8408203125, 31.01318359375, 32.185546875, 33.35791015625, 34.5302734375, 35.70263671875, 36.875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 7.0, 13.0, 11.0, 19.0, 26.0, 22.0, 33.0, 30.0, 41.0, 50.0, 63.0, 67.0, 46.0, 70.0, 62.0, 56.0, 57.0, 49.0, 40.0, 40.0, 44.0, 23.0, 20.0, 17.0, 22.0, 17.0, 6.0, 12.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.83197021484375, -7.5858154296875, -7.33966064453125, -7.093505859375, -6.84735107421875, -6.6011962890625, -6.35504150390625, -6.10888671875, -5.86273193359375, -5.6165771484375, -5.37042236328125, -5.124267578125, -4.87811279296875, -4.6319580078125, -4.38580322265625, -4.1396484375, -3.89349365234375, -3.6473388671875, -3.40118408203125, -3.155029296875, -2.90887451171875, -2.6627197265625, -2.41656494140625, -2.17041015625, -1.92425537109375, -1.6781005859375, -1.43194580078125, -1.185791015625, -0.93963623046875, -0.6934814453125, -0.44732666015625, -0.201171875, 0.04498291015625, 0.2911376953125, 0.53729248046875, 0.783447265625, 1.02960205078125, 1.2757568359375, 1.52191162109375, 1.76806640625, 2.01422119140625, 2.2603759765625, 2.50653076171875, 2.752685546875, 2.99884033203125, 3.2449951171875, 3.49114990234375, 3.7373046875, 3.98345947265625, 4.2296142578125, 4.47576904296875, 4.721923828125, 4.96807861328125, 5.2142333984375, 5.46038818359375, 5.70654296875, 5.95269775390625, 6.1988525390625, 6.44500732421875, 6.691162109375, 6.93731689453125, 7.1834716796875, 7.42962646484375, 7.67578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 13.0, 11.0, 16.0, 14.0, 14.0, 29.0, 41.0, 40.0, 59.0, 70.0, 128.0, 173.0, 301.0, 532.0, 1241.0, 3288.0, 10633.0, 49090.0, 1468107.0, 2592680.0, 50599.0, 11171.0, 3273.0, 1282.0, 554.0, 280.0, 169.0, 122.0, 73.0, 54.0, 48.0, 39.0, 26.0, 17.0, 16.0, 16.0, 10.0, 8.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.125, -80.4443359375, -77.763671875, -75.0830078125, -72.40234375, -69.7216796875, -67.041015625, -64.3603515625, -61.6796875, -58.9990234375, -56.318359375, -53.6376953125, -50.95703125, -48.2763671875, -45.595703125, -42.9150390625, -40.234375, -37.5537109375, -34.873046875, -32.1923828125, -29.51171875, -26.8310546875, -24.150390625, -21.4697265625, -18.7890625, -16.1083984375, -13.427734375, -10.7470703125, -8.06640625, -5.3857421875, -2.705078125, -0.0244140625, 2.65625, 5.3369140625, 8.017578125, 10.6982421875, 13.37890625, 16.0595703125, 18.740234375, 21.4208984375, 24.1015625, 26.7822265625, 29.462890625, 32.1435546875, 34.82421875, 37.5048828125, 40.185546875, 42.8662109375, 45.546875, 48.2275390625, 50.908203125, 53.5888671875, 56.26953125, 58.9501953125, 61.630859375, 64.3115234375, 66.9921875, 69.6728515625, 72.353515625, 75.0341796875, 77.71484375, 80.3955078125, 83.076171875, 85.7568359375, 88.4375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 9.0, 15.0, 22.0, 36.0, 48.0, 114.0, 301.0, 2643.0, 532.0, 168.0, 80.0, 34.0, 30.0, 19.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.84375, -46.74853515625, -45.6533203125, -44.55810546875, -43.462890625, -42.36767578125, -41.2724609375, -40.17724609375, -39.08203125, -37.98681640625, -36.8916015625, -35.79638671875, -34.701171875, -33.60595703125, -32.5107421875, -31.41552734375, -30.3203125, -29.22509765625, -28.1298828125, -27.03466796875, -25.939453125, -24.84423828125, -23.7490234375, -22.65380859375, -21.55859375, -20.46337890625, -19.3681640625, -18.27294921875, -17.177734375, -16.08251953125, -14.9873046875, -13.89208984375, -12.796875, -11.70166015625, -10.6064453125, -9.51123046875, -8.416015625, -7.32080078125, -6.2255859375, -5.13037109375, -4.03515625, -2.93994140625, -1.8447265625, -0.74951171875, 0.345703125, 1.44091796875, 2.5361328125, 3.63134765625, 4.7265625, 5.82177734375, 6.9169921875, 8.01220703125, 9.107421875, 10.20263671875, 11.2978515625, 12.39306640625, 13.48828125, 14.58349609375, 15.6787109375, 16.77392578125, 17.869140625, 18.96435546875, 20.0595703125, 21.15478515625, 22.25]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 12.0, 14.0, 10.0, 38.0, 45.0, 49.0, 88.0, 87.0, 132.0, 132.0, 101.0, 83.0, 56.0, 39.0, 29.0, 18.0, 12.0, 9.0, 11.0, 6.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-143.51214599609375, -140.02114868164062, -136.53013610839844, -133.03912353515625, -129.54812622070312, -126.05712127685547, -122.56611633300781, -119.07511138916016, -115.5841064453125, -112.09310150146484, -108.60209655761719, -105.11109161376953, -101.62008666992188, -98.12908172607422, -94.63807678222656, -91.1470718383789, -87.65606689453125, -84.1650619506836, -80.67405700683594, -77.18305206298828, -73.69204711914062, -70.20104217529297, -66.71003723144531, -63.219032287597656, -59.72802734375, -56.237022399902344, -52.74601745605469, -49.25501251220703, -45.764007568359375, -42.27300262451172, -38.78199768066406, -35.290992736816406, -31.79998779296875, -28.308982849121094, -24.817977905273438, -21.32697296142578, -17.835968017578125, -14.344963073730469, -10.853958129882812, -7.362953186035156, -3.8719482421875, -0.38094329833984375, 3.1100616455078125, 6.601066589355469, 10.092071533203125, 13.583076477050781, 17.074081420898438, 20.565086364746094, 24.05609130859375, 27.547096252441406, 31.038101196289062, 34.52910614013672, 38.020111083984375, 41.51111602783203, 45.00212097167969, 48.493125915527344, 51.984130859375, 55.475135803222656, 58.96614074707031, 62.45714569091797, 65.94815063476562, 69.43915557861328, 72.93016052246094, 76.4211654663086, 79.91217041015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 15.0, 15.0, 25.0, 15.0, 27.0, 41.0, 39.0, 51.0, 42.0, 58.0, 64.0, 70.0, 62.0, 68.0, 66.0, 66.0, 57.0, 49.0, 36.0, 35.0, 28.0, 17.0, 16.0, 13.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.21607971191406, -96.05860137939453, -92.901123046875, -89.74364471435547, -86.58616638183594, -83.4286880493164, -80.27120971679688, -77.11373138427734, -73.95625305175781, -70.79877471923828, -67.64129638671875, -64.48381805419922, -61.32633972167969, -58.168861389160156, -55.011383056640625, -51.853904724121094, -48.69643020629883, -45.5389518737793, -42.381473541259766, -39.223995208740234, -36.0665168762207, -32.90903854370117, -29.751562118530273, -26.594083786010742, -23.43660545349121, -20.27912712097168, -17.12164878845215, -13.964171409606934, -10.806693077087402, -7.649214744567871, -4.491737365722656, -1.334259033203125, 1.8232192993164062, 4.9806976318359375, 8.138175964355469, 11.295653343200684, 14.453131675720215, 17.610610961914062, 20.76808738708496, 23.925565719604492, 27.083044052124023, 30.240522384643555, 33.39799880981445, 36.555477142333984, 39.712955474853516, 42.87043380737305, 46.02791213989258, 49.18539047241211, 52.34286880493164, 55.50034713745117, 58.6578254699707, 61.815303802490234, 64.9727783203125, 68.13025665283203, 71.28773498535156, 74.4452133178711, 77.60269165039062, 80.76016998291016, 83.91764831542969, 87.07512664794922, 90.23260498046875, 93.39008331298828, 96.54756164550781, 99.70503997802734, 102.86251831054688]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 13.0, 11.0, 20.0, 47.0, 38.0, 95.0, 120.0, 194.0, 309.0, 632.0, 1120.0, 2051.0, 3879.0, 7826.0, 16601.0, 36770.0, 86855.0, 226346.0, 385835.0, 162083.0, 64195.0, 27732.0, 12814.0, 6045.0, 3060.0, 1581.0, 916.0, 533.0, 293.0, 183.0, 120.0, 78.0, 52.0, 27.0, 23.0, 17.0, 11.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.46826171875, -31.2802734375, -30.09228515625, -28.904296875, -27.71630859375, -26.5283203125, -25.34033203125, -24.15234375, -22.96435546875, -21.7763671875, -20.58837890625, -19.400390625, -18.21240234375, -17.0244140625, -15.83642578125, -14.6484375, -13.46044921875, -12.2724609375, -11.08447265625, -9.896484375, -8.70849609375, -7.5205078125, -6.33251953125, -5.14453125, -3.95654296875, -2.7685546875, -1.58056640625, -0.392578125, 0.79541015625, 1.9833984375, 3.17138671875, 4.359375, 5.54736328125, 6.7353515625, 7.92333984375, 9.111328125, 10.29931640625, 11.4873046875, 12.67529296875, 13.86328125, 15.05126953125, 16.2392578125, 17.42724609375, 18.615234375, 19.80322265625, 20.9912109375, 22.17919921875, 23.3671875, 24.55517578125, 25.7431640625, 26.93115234375, 28.119140625, 29.30712890625, 30.4951171875, 31.68310546875, 32.87109375, 34.05908203125, 35.2470703125, 36.43505859375, 37.623046875, 38.81103515625, 39.9990234375, 41.18701171875, 42.375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 4.0, 10.0, 12.0, 6.0, 13.0, 12.0, 19.0, 21.0, 18.0, 20.0, 31.0, 27.0, 36.0, 55.0, 45.0, 36.0, 42.0, 43.0, 55.0, 48.0, 46.0, 42.0, 49.0, 43.0, 21.0, 24.0, 32.0, 25.0, 24.0, 25.0, 20.0, 17.0, 13.0, 13.0, 13.0, 10.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3046875, -6.10009765625, -5.8955078125, -5.69091796875, -5.486328125, -5.28173828125, -5.0771484375, -4.87255859375, -4.66796875, -4.46337890625, -4.2587890625, -4.05419921875, -3.849609375, -3.64501953125, -3.4404296875, -3.23583984375, -3.03125, -2.82666015625, -2.6220703125, -2.41748046875, -2.212890625, -2.00830078125, -1.8037109375, -1.59912109375, -1.39453125, -1.18994140625, -0.9853515625, -0.78076171875, -0.576171875, -0.37158203125, -0.1669921875, 0.03759765625, 0.2421875, 0.44677734375, 0.6513671875, 0.85595703125, 1.060546875, 1.26513671875, 1.4697265625, 1.67431640625, 1.87890625, 2.08349609375, 2.2880859375, 2.49267578125, 2.697265625, 2.90185546875, 3.1064453125, 3.31103515625, 3.515625, 3.72021484375, 3.9248046875, 4.12939453125, 4.333984375, 4.53857421875, 4.7431640625, 4.94775390625, 5.15234375, 5.35693359375, 5.5615234375, 5.76611328125, 5.970703125, 6.17529296875, 6.3798828125, 6.58447265625, 6.7890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 11.0, 11.0, 18.0, 14.0, 36.0, 49.0, 81.0, 110.0, 161.0, 220.0, 394.0, 569.0, 976.0, 1602.0, 2919.0, 5879.0, 11430.0, 24759.0, 56053.0, 139399.0, 357677.0, 266490.0, 100040.0, 41257.0, 18713.0, 9083.0, 4582.0, 2376.0, 1395.0, 795.0, 483.0, 324.0, 215.0, 131.0, 87.0, 59.0, 45.0, 25.0, 22.0, 11.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.609375, -25.74609375, -24.8828125, -24.01953125, -23.15625, -22.29296875, -21.4296875, -20.56640625, -19.703125, -18.83984375, -17.9765625, -17.11328125, -16.25, -15.38671875, -14.5234375, -13.66015625, -12.796875, -11.93359375, -11.0703125, -10.20703125, -9.34375, -8.48046875, -7.6171875, -6.75390625, -5.890625, -5.02734375, -4.1640625, -3.30078125, -2.4375, -1.57421875, -0.7109375, 0.15234375, 1.015625, 1.87890625, 2.7421875, 3.60546875, 4.46875, 5.33203125, 6.1953125, 7.05859375, 7.921875, 8.78515625, 9.6484375, 10.51171875, 11.375, 12.23828125, 13.1015625, 13.96484375, 14.828125, 15.69140625, 16.5546875, 17.41796875, 18.28125, 19.14453125, 20.0078125, 20.87109375, 21.734375, 22.59765625, 23.4609375, 24.32421875, 25.1875, 26.05078125, 26.9140625, 27.77734375, 28.640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 3.0, 3.0, 11.0, 14.0, 19.0, 15.0, 18.0, 22.0, 28.0, 30.0, 35.0, 46.0, 41.0, 53.0, 39.0, 42.0, 51.0, 49.0, 61.0, 35.0, 40.0, 43.0, 36.0, 36.0, 37.0, 24.0, 30.0, 13.0, 24.0, 16.0, 11.0, 16.0, 9.0, 13.0, 7.0, 8.0, 6.0, 3.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.81982421875, -24.8583984375, -23.89697265625, -22.935546875, -21.97412109375, -21.0126953125, -20.05126953125, -19.08984375, -18.12841796875, -17.1669921875, -16.20556640625, -15.244140625, -14.28271484375, -13.3212890625, -12.35986328125, -11.3984375, -10.43701171875, -9.4755859375, -8.51416015625, -7.552734375, -6.59130859375, -5.6298828125, -4.66845703125, -3.70703125, -2.74560546875, -1.7841796875, -0.82275390625, 0.138671875, 1.10009765625, 2.0615234375, 3.02294921875, 3.984375, 4.94580078125, 5.9072265625, 6.86865234375, 7.830078125, 8.79150390625, 9.7529296875, 10.71435546875, 11.67578125, 12.63720703125, 13.5986328125, 14.56005859375, 15.521484375, 16.48291015625, 17.4443359375, 18.40576171875, 19.3671875, 20.32861328125, 21.2900390625, 22.25146484375, 23.212890625, 24.17431640625, 25.1357421875, 26.09716796875, 27.05859375, 28.02001953125, 28.9814453125, 29.94287109375, 30.904296875, 31.86572265625, 32.8271484375, 33.78857421875, 34.75]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 10.0, 22.0, 19.0, 31.0, 54.0, 100.0, 145.0, 242.0, 357.0, 595.0, 1008.0, 1992.0, 4135.0, 11513.0, 45642.0, 296493.0, 556064.0, 97893.0, 19912.0, 6309.0, 2714.0, 1291.0, 774.0, 473.0, 306.0, 178.0, 99.0, 56.0, 41.0, 25.0, 14.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.0, -27.267333984375, -26.53466796875, -25.802001953125, -25.0693359375, -24.336669921875, -23.60400390625, -22.871337890625, -22.138671875, -21.406005859375, -20.67333984375, -19.940673828125, -19.2080078125, -18.475341796875, -17.74267578125, -17.010009765625, -16.27734375, -15.544677734375, -14.81201171875, -14.079345703125, -13.3466796875, -12.614013671875, -11.88134765625, -11.148681640625, -10.416015625, -9.683349609375, -8.95068359375, -8.218017578125, -7.4853515625, -6.752685546875, -6.02001953125, -5.287353515625, -4.5546875, -3.822021484375, -3.08935546875, -2.356689453125, -1.6240234375, -0.891357421875, -0.15869140625, 0.573974609375, 1.306640625, 2.039306640625, 2.77197265625, 3.504638671875, 4.2373046875, 4.969970703125, 5.70263671875, 6.435302734375, 7.16796875, 7.900634765625, 8.63330078125, 9.365966796875, 10.0986328125, 10.831298828125, 11.56396484375, 12.296630859375, 13.029296875, 13.761962890625, 14.49462890625, 15.227294921875, 15.9599609375, 16.692626953125, 17.42529296875, 18.157958984375, 18.890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 28.0, 54.0, 120.0, 286.0, 256.0, 122.0, 43.0, 16.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0139617919921875, -0.01358342170715332, -0.01320505142211914, -0.012826681137084961, -0.012448310852050781, -0.012069940567016602, -0.011691570281982422, -0.011313199996948242, -0.010934829711914062, -0.010556459426879883, -0.010178089141845703, -0.009799718856811523, -0.009421348571777344, -0.009042978286743164, -0.008664608001708984, -0.008286237716674805, -0.007907867431640625, -0.007529497146606445, -0.007151126861572266, -0.006772756576538086, -0.006394386291503906, -0.0060160160064697266, -0.005637645721435547, -0.005259275436401367, -0.0048809051513671875, -0.004502534866333008, -0.004124164581298828, -0.0037457942962646484, -0.0033674240112304688, -0.002989053726196289, -0.0026106834411621094, -0.0022323131561279297, -0.00185394287109375, -0.0014755725860595703, -0.0010972023010253906, -0.0007188320159912109, -0.00034046173095703125, 3.790855407714844e-05, 0.0004162788391113281, 0.0007946491241455078, 0.0011730194091796875, 0.0015513896942138672, 0.0019297599792480469, 0.0023081302642822266, 0.0026865005493164062, 0.003064870834350586, 0.0034432411193847656, 0.0038216114044189453, 0.004199981689453125, 0.004578351974487305, 0.004956722259521484, 0.005335092544555664, 0.005713462829589844, 0.0060918331146240234, 0.006470203399658203, 0.006848573684692383, 0.0072269439697265625, 0.007605314254760742, 0.007983684539794922, 0.008362054824829102, 0.008740425109863281, 0.009118795394897461, 0.00949716567993164, 0.00987553596496582, 0.01025390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 10.0, 17.0, 24.0, 21.0, 42.0, 49.0, 68.0, 107.0, 162.0, 242.0, 459.0, 813.0, 1766.0, 4330.0, 16814.0, 130442.0, 738636.0, 129846.0, 16230.0, 4549.0, 1814.0, 903.0, 446.0, 240.0, 160.0, 117.0, 58.0, 49.0, 46.0, 26.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.53125, -28.56298828125, -27.5947265625, -26.62646484375, -25.658203125, -24.68994140625, -23.7216796875, -22.75341796875, -21.78515625, -20.81689453125, -19.8486328125, -18.88037109375, -17.912109375, -16.94384765625, -15.9755859375, -15.00732421875, -14.0390625, -13.07080078125, -12.1025390625, -11.13427734375, -10.166015625, -9.19775390625, -8.2294921875, -7.26123046875, -6.29296875, -5.32470703125, -4.3564453125, -3.38818359375, -2.419921875, -1.45166015625, -0.4833984375, 0.48486328125, 1.453125, 2.42138671875, 3.3896484375, 4.35791015625, 5.326171875, 6.29443359375, 7.2626953125, 8.23095703125, 9.19921875, 10.16748046875, 11.1357421875, 12.10400390625, 13.072265625, 14.04052734375, 15.0087890625, 15.97705078125, 16.9453125, 17.91357421875, 18.8818359375, 19.85009765625, 20.818359375, 21.78662109375, 22.7548828125, 23.72314453125, 24.69140625, 25.65966796875, 26.6279296875, 27.59619140625, 28.564453125, 29.53271484375, 30.5009765625, 31.46923828125, 32.4375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 17.0, 51.0, 68.0, 112.0, 185.0, 184.0, 132.0, 95.0, 60.0, 38.0, 8.0, 11.0, 4.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.59375, -28.77490234375, -27.9560546875, -27.13720703125, -26.318359375, -25.49951171875, -24.6806640625, -23.86181640625, -23.04296875, -22.22412109375, -21.4052734375, -20.58642578125, -19.767578125, -18.94873046875, -18.1298828125, -17.31103515625, -16.4921875, -15.67333984375, -14.8544921875, -14.03564453125, -13.216796875, -12.39794921875, -11.5791015625, -10.76025390625, -9.94140625, -9.12255859375, -8.3037109375, -7.48486328125, -6.666015625, -5.84716796875, -5.0283203125, -4.20947265625, -3.390625, -2.57177734375, -1.7529296875, -0.93408203125, -0.115234375, 0.70361328125, 1.5224609375, 2.34130859375, 3.16015625, 3.97900390625, 4.7978515625, 5.61669921875, 6.435546875, 7.25439453125, 8.0732421875, 8.89208984375, 9.7109375, 10.52978515625, 11.3486328125, 12.16748046875, 12.986328125, 13.80517578125, 14.6240234375, 15.44287109375, 16.26171875, 17.08056640625, 17.8994140625, 18.71826171875, 19.537109375, 20.35595703125, 21.1748046875, 21.99365234375, 22.8125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 19.0, 66.0, 165.0, 291.0, 257.0, 131.0, 56.0, 12.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-947.981201171875, -928.575439453125, -909.1696166992188, -889.7638549804688, -870.3580322265625, -850.9522705078125, -831.5465087890625, -812.1406860351562, -792.7349243164062, -773.3291625976562, -753.92333984375, -734.517578125, -715.1117553710938, -695.7059936523438, -676.3001708984375, -656.8944091796875, -637.4886474609375, -618.0828857421875, -598.6770629882812, -579.2713012695312, -559.865478515625, -540.459716796875, -521.053955078125, -501.64813232421875, -482.2423095703125, -462.8365173339844, -443.43072509765625, -424.02496337890625, -404.6191711425781, -385.21337890625, -365.8075866699219, -346.40179443359375, -326.9960021972656, -307.5902099609375, -288.1844177246094, -268.77862548828125, -249.37286376953125, -229.96707153320312, -210.561279296875, -191.15550231933594, -171.7497100830078, -152.3439178466797, -132.93814086914062, -113.5323486328125, -94.1265640258789, -74.72077941894531, -55.31498718261719, -35.909210205078125, -16.50341796875, 2.9023685455322266, 22.308155059814453, 41.71394348144531, 61.119728088378906, 80.5255126953125, 99.93130493164062, 119.33708190917969, 138.7428741455078, 158.14866638183594, 177.554443359375, 196.96023559570312, 216.36602783203125, 235.7718048095703, 255.17759704589844, 274.5833740234375, 293.9891662597656]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 13.0, 7.0, 8.0, 7.0, 13.0, 11.0, 20.0, 24.0, 29.0, 24.0, 39.0, 35.0, 39.0, 35.0, 47.0, 47.0, 49.0, 30.0, 40.0, 37.0, 56.0, 37.0, 34.0, 45.0, 35.0, 36.0, 29.0, 36.0, 16.0, 12.0, 20.0, 17.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-176.2188262939453, -171.19631958007812, -166.17381286621094, -161.15130615234375, -156.12879943847656, -151.10629272460938, -146.0837860107422, -141.061279296875, -136.0387725830078, -131.01626586914062, -125.99375915527344, -120.97125244140625, -115.94874572753906, -110.92623901367188, -105.90373229980469, -100.8812255859375, -95.85871124267578, -90.8362045288086, -85.8136978149414, -80.79119110107422, -75.76868438720703, -70.74617767333984, -65.72366333007812, -60.7011604309082, -55.678653717041016, -50.65614700317383, -45.63364028930664, -40.61112976074219, -35.588623046875, -30.566118240356445, -25.543609619140625, -20.521102905273438, -15.49859619140625, -10.476089477539062, -5.453581809997559, -0.4310741424560547, 4.591432571411133, 9.61393928527832, 14.63644790649414, 19.658954620361328, 24.681461334228516, 29.703968048095703, 34.72647476196289, 39.748985290527344, 44.77149200439453, 49.79399871826172, 54.816505432128906, 59.839012145996094, 64.86151885986328, 69.88402557373047, 74.90653228759766, 79.92903900146484, 84.95154571533203, 89.97405242919922, 94.99656677246094, 100.01907348632812, 105.04158020019531, 110.0640869140625, 115.08659362792969, 120.10910034179688, 125.13160705566406, 130.15411376953125, 135.17662048339844, 140.19912719726562, 145.2216339111328]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 4.0, 15.0, 18.0, 28.0, 28.0, 46.0, 59.0, 81.0, 106.0, 170.0, 214.0, 322.0, 530.0, 711.0, 1206.0, 1961.0, 3306.0, 5875.0, 12223.0, 31335.0, 117355.0, 3529191.0, 389619.0, 60109.0, 19977.0, 8690.0, 4462.0, 2496.0, 1453.0, 957.0, 543.0, 381.0, 260.0, 173.0, 123.0, 67.0, 67.0, 39.0, 26.0, 17.0, 11.0, 6.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-45.15625, -43.73486328125, -42.3134765625, -40.89208984375, -39.470703125, -38.04931640625, -36.6279296875, -35.20654296875, -33.78515625, -32.36376953125, -30.9423828125, -29.52099609375, -28.099609375, -26.67822265625, -25.2568359375, -23.83544921875, -22.4140625, -20.99267578125, -19.5712890625, -18.14990234375, -16.728515625, -15.30712890625, -13.8857421875, -12.46435546875, -11.04296875, -9.62158203125, -8.2001953125, -6.77880859375, -5.357421875, -3.93603515625, -2.5146484375, -1.09326171875, 0.328125, 1.74951171875, 3.1708984375, 4.59228515625, 6.013671875, 7.43505859375, 8.8564453125, 10.27783203125, 11.69921875, 13.12060546875, 14.5419921875, 15.96337890625, 17.384765625, 18.80615234375, 20.2275390625, 21.64892578125, 23.0703125, 24.49169921875, 25.9130859375, 27.33447265625, 28.755859375, 30.17724609375, 31.5986328125, 33.02001953125, 34.44140625, 35.86279296875, 37.2841796875, 38.70556640625, 40.126953125, 41.54833984375, 42.9697265625, 44.39111328125, 45.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 12.0, 25.0, 20.0, 29.0, 25.0, 23.0, 39.0, 36.0, 42.0, 66.0, 46.0, 40.0, 59.0, 41.0, 48.0, 45.0, 44.0, 44.0, 32.0, 32.0, 39.0, 35.0, 24.0, 29.0, 20.0, 13.0, 16.0, 10.0, 11.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.94921875, -7.73040771484375, -7.5115966796875, -7.29278564453125, -7.073974609375, -6.85516357421875, -6.6363525390625, -6.41754150390625, -6.19873046875, -5.97991943359375, -5.7611083984375, -5.54229736328125, -5.323486328125, -5.10467529296875, -4.8858642578125, -4.66705322265625, -4.4482421875, -4.22943115234375, -4.0106201171875, -3.79180908203125, -3.572998046875, -3.35418701171875, -3.1353759765625, -2.91656494140625, -2.69775390625, -2.47894287109375, -2.2601318359375, -2.04132080078125, -1.822509765625, -1.60369873046875, -1.3848876953125, -1.16607666015625, -0.947265625, -0.72845458984375, -0.5096435546875, -0.29083251953125, -0.072021484375, 0.14678955078125, 0.3656005859375, 0.58441162109375, 0.80322265625, 1.02203369140625, 1.2408447265625, 1.45965576171875, 1.678466796875, 1.89727783203125, 2.1160888671875, 2.33489990234375, 2.5537109375, 2.77252197265625, 2.9913330078125, 3.21014404296875, 3.428955078125, 3.64776611328125, 3.8665771484375, 4.08538818359375, 4.30419921875, 4.52301025390625, 4.7418212890625, 4.96063232421875, 5.179443359375, 5.39825439453125, 5.6170654296875, 5.83587646484375, 6.0546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 20.0, 17.0, 21.0, 30.0, 33.0, 37.0, 42.0, 45.0, 67.0, 69.0, 108.0, 148.0, 224.0, 339.0, 544.0, 1037.0, 2258.0, 5027.0, 15493.0, 74735.0, 2946855.0, 1061756.0, 62012.0, 13734.0, 4771.0, 2027.0, 1060.0, 559.0, 305.0, 231.0, 164.0, 104.0, 87.0, 55.0, 50.0, 41.0, 27.0, 25.0, 30.0, 17.0, 12.0, 11.0, 10.0, 7.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-71.875, -69.7578125, -67.640625, -65.5234375, -63.40625, -61.2890625, -59.171875, -57.0546875, -54.9375, -52.8203125, -50.703125, -48.5859375, -46.46875, -44.3515625, -42.234375, -40.1171875, -38.0, -35.8828125, -33.765625, -31.6484375, -29.53125, -27.4140625, -25.296875, -23.1796875, -21.0625, -18.9453125, -16.828125, -14.7109375, -12.59375, -10.4765625, -8.359375, -6.2421875, -4.125, -2.0078125, 0.109375, 2.2265625, 4.34375, 6.4609375, 8.578125, 10.6953125, 12.8125, 14.9296875, 17.046875, 19.1640625, 21.28125, 23.3984375, 25.515625, 27.6328125, 29.75, 31.8671875, 33.984375, 36.1015625, 38.21875, 40.3359375, 42.453125, 44.5703125, 46.6875, 48.8046875, 50.921875, 53.0390625, 55.15625, 57.2734375, 59.390625, 61.5078125, 63.625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 14.0, 5.0, 19.0, 62.0, 100.0, 195.0, 649.0, 2325.0, 380.0, 150.0, 63.0, 39.0, 23.0, 19.0, 9.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.184814453125, -42.02587890625, -40.866943359375, -39.7080078125, -38.549072265625, -37.39013671875, -36.231201171875, -35.072265625, -33.913330078125, -32.75439453125, -31.595458984375, -30.4365234375, -29.277587890625, -28.11865234375, -26.959716796875, -25.80078125, -24.641845703125, -23.48291015625, -22.323974609375, -21.1650390625, -20.006103515625, -18.84716796875, -17.688232421875, -16.529296875, -15.370361328125, -14.21142578125, -13.052490234375, -11.8935546875, -10.734619140625, -9.57568359375, -8.416748046875, -7.2578125, -6.098876953125, -4.93994140625, -3.781005859375, -2.6220703125, -1.463134765625, -0.30419921875, 0.854736328125, 2.013671875, 3.172607421875, 4.33154296875, 5.490478515625, 6.6494140625, 7.808349609375, 8.96728515625, 10.126220703125, 11.28515625, 12.444091796875, 13.60302734375, 14.761962890625, 15.9208984375, 17.079833984375, 18.23876953125, 19.397705078125, 20.556640625, 21.715576171875, 22.87451171875, 24.033447265625, 25.1923828125, 26.351318359375, 27.51025390625, 28.669189453125, 29.828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 14.0, 34.0, 70.0, 136.0, 209.0, 219.0, 156.0, 77.0, 37.0, 23.0, 15.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.14600372314453, -97.03350067138672, -88.9209976196289, -80.8084945678711, -72.69599151611328, -64.58348846435547, -56.470985412597656, -48.358482360839844, -40.24597930908203, -32.13347625732422, -24.020973205566406, -15.908470153808594, -7.795967102050781, 0.31653594970703125, 8.429039001464844, 16.541542053222656, 24.65404510498047, 32.76654815673828, 40.879051208496094, 48.991554260253906, 57.10405731201172, 65.21656036376953, 73.32906341552734, 81.44156646728516, 89.55406951904297, 97.66657257080078, 105.7790756225586, 113.8915786743164, 122.00408172607422, 130.1165771484375, 138.22909545898438, 146.34158325195312, 154.4541015625, 162.5666046142578, 170.67910766601562, 178.79161071777344, 186.90411376953125, 195.01661682128906, 203.12911987304688, 211.2416229248047, 219.3541259765625, 227.4666290283203, 235.57913208007812, 243.69163513183594, 251.80413818359375, 259.9166259765625, 268.0291442871094, 276.14166259765625, 284.254150390625, 292.36663818359375, 300.4791564941406, 308.5916748046875, 316.70416259765625, 324.816650390625, 332.9291687011719, 341.04168701171875, 349.1541748046875, 357.26666259765625, 365.3791809082031, 373.49169921875, 381.60418701171875, 389.7166748046875, 397.8291931152344, 405.94171142578125, 414.05419921875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 3.0, 10.0, 7.0, 9.0, 11.0, 13.0, 18.0, 23.0, 29.0, 17.0, 30.0, 21.0, 33.0, 31.0, 32.0, 31.0, 42.0, 44.0, 38.0, 51.0, 40.0, 45.0, 33.0, 40.0, 40.0, 25.0, 25.0, 34.0, 24.0, 23.0, 21.0, 16.0, 18.0, 14.0, 15.0, 25.0, 10.0, 14.0, 5.0, 13.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-72.34542083740234, -70.24555206298828, -68.14569091796875, -66.04582214355469, -63.94595718383789, -61.846092224121094, -59.74622344970703, -57.646358489990234, -55.54649353027344, -53.44662857055664, -51.346763610839844, -49.24689483642578, -47.147029876708984, -45.04716491699219, -42.947296142578125, -40.84743118286133, -38.74756622314453, -36.647701263427734, -34.54783630371094, -32.447967529296875, -30.348102569580078, -28.24823760986328, -26.14837074279785, -24.048503875732422, -21.948638916015625, -19.848773956298828, -17.7489070892334, -15.649041175842285, -13.549175262451172, -11.449309349060059, -9.349443435668945, -7.249577522277832, -5.149715423583984, -3.049849510192871, -0.9499835968017578, 1.1498823165893555, 3.2497482299804688, 5.349614143371582, 7.449480056762695, 9.549345970153809, 11.649211883544922, 13.749077796936035, 15.848943710327148, 17.948810577392578, 20.048675537109375, 22.148540496826172, 24.2484073638916, 26.34827423095703, 28.448139190673828, 30.548004150390625, 32.64787292480469, 34.747737884521484, 36.84760284423828, 38.94746780395508, 41.047332763671875, 43.14720153808594, 45.247066497802734, 47.34693145751953, 49.446800231933594, 51.54666519165039, 53.64653015136719, 55.746395111083984, 57.84626007080078, 59.946128845214844, 62.04599380493164]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 13.0, 13.0, 14.0, 38.0, 39.0, 57.0, 92.0, 141.0, 185.0, 389.0, 544.0, 919.0, 1722.0, 3140.0, 6254.0, 13382.0, 32580.0, 91712.0, 397513.0, 358154.0, 85201.0, 30840.0, 12652.0, 5942.0, 2985.0, 1615.0, 900.0, 539.0, 348.0, 222.0, 131.0, 73.0, 65.0, 36.0, 28.0, 23.0, 15.0, 14.0, 7.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.78125, -40.43212890625, -39.0830078125, -37.73388671875, -36.384765625, -35.03564453125, -33.6865234375, -32.33740234375, -30.98828125, -29.63916015625, -28.2900390625, -26.94091796875, -25.591796875, -24.24267578125, -22.8935546875, -21.54443359375, -20.1953125, -18.84619140625, -17.4970703125, -16.14794921875, -14.798828125, -13.44970703125, -12.1005859375, -10.75146484375, -9.40234375, -8.05322265625, -6.7041015625, -5.35498046875, -4.005859375, -2.65673828125, -1.3076171875, 0.04150390625, 1.390625, 2.73974609375, 4.0888671875, 5.43798828125, 6.787109375, 8.13623046875, 9.4853515625, 10.83447265625, 12.18359375, 13.53271484375, 14.8818359375, 16.23095703125, 17.580078125, 18.92919921875, 20.2783203125, 21.62744140625, 22.9765625, 24.32568359375, 25.6748046875, 27.02392578125, 28.373046875, 29.72216796875, 31.0712890625, 32.42041015625, 33.76953125, 35.11865234375, 36.4677734375, 37.81689453125, 39.166015625, 40.51513671875, 41.8642578125, 43.21337890625, 44.5625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 8.0, 10.0, 5.0, 13.0, 13.0, 26.0, 22.0, 28.0, 39.0, 36.0, 38.0, 44.0, 49.0, 40.0, 57.0, 46.0, 45.0, 47.0, 42.0, 41.0, 48.0, 40.0, 38.0, 28.0, 24.0, 32.0, 18.0, 28.0, 9.0, 16.0, 11.0, 13.0, 6.0, 11.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.5390625, -7.31964111328125, -7.1002197265625, -6.88079833984375, -6.661376953125, -6.44195556640625, -6.2225341796875, -6.00311279296875, -5.78369140625, -5.56427001953125, -5.3448486328125, -5.12542724609375, -4.906005859375, -4.68658447265625, -4.4671630859375, -4.24774169921875, -4.0283203125, -3.80889892578125, -3.5894775390625, -3.37005615234375, -3.150634765625, -2.93121337890625, -2.7117919921875, -2.49237060546875, -2.27294921875, -2.05352783203125, -1.8341064453125, -1.61468505859375, -1.395263671875, -1.17584228515625, -0.9564208984375, -0.73699951171875, -0.517578125, -0.29815673828125, -0.0787353515625, 0.14068603515625, 0.360107421875, 0.57952880859375, 0.7989501953125, 1.01837158203125, 1.23779296875, 1.45721435546875, 1.6766357421875, 1.89605712890625, 2.115478515625, 2.33489990234375, 2.5543212890625, 2.77374267578125, 2.9931640625, 3.21258544921875, 3.4320068359375, 3.65142822265625, 3.870849609375, 4.09027099609375, 4.3096923828125, 4.52911376953125, 4.74853515625, 4.96795654296875, 5.1873779296875, 5.40679931640625, 5.626220703125, 5.84564208984375, 6.0650634765625, 6.28448486328125, 6.50390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 6.0, 6.0, 15.0, 8.0, 27.0, 25.0, 47.0, 53.0, 80.0, 131.0, 220.0, 326.0, 483.0, 768.0, 1352.0, 2267.0, 4538.0, 10369.0, 30607.0, 123809.0, 600582.0, 201603.0, 44520.0, 13989.0, 5652.0, 2858.0, 1597.0, 952.0, 608.0, 328.0, 214.0, 142.0, 98.0, 75.0, 49.0, 29.0, 24.0, 25.0, 11.0, 8.0, 8.0, 7.0, 9.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-42.46875, -41.16796875, -39.8671875, -38.56640625, -37.265625, -35.96484375, -34.6640625, -33.36328125, -32.0625, -30.76171875, -29.4609375, -28.16015625, -26.859375, -25.55859375, -24.2578125, -22.95703125, -21.65625, -20.35546875, -19.0546875, -17.75390625, -16.453125, -15.15234375, -13.8515625, -12.55078125, -11.25, -9.94921875, -8.6484375, -7.34765625, -6.046875, -4.74609375, -3.4453125, -2.14453125, -0.84375, 0.45703125, 1.7578125, 3.05859375, 4.359375, 5.66015625, 6.9609375, 8.26171875, 9.5625, 10.86328125, 12.1640625, 13.46484375, 14.765625, 16.06640625, 17.3671875, 18.66796875, 19.96875, 21.26953125, 22.5703125, 23.87109375, 25.171875, 26.47265625, 27.7734375, 29.07421875, 30.375, 31.67578125, 32.9765625, 34.27734375, 35.578125, 36.87890625, 38.1796875, 39.48046875, 40.78125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 12.0, 12.0, 9.0, 22.0, 17.0, 28.0, 29.0, 52.0, 48.0, 45.0, 31.0, 72.0, 51.0, 69.0, 62.0, 60.0, 58.0, 42.0, 44.0, 52.0, 34.0, 36.0, 26.0, 19.0, 12.0, 10.0, 10.0, 8.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.515625, -30.291259765625, -29.06689453125, -27.842529296875, -26.6181640625, -25.393798828125, -24.16943359375, -22.945068359375, -21.720703125, -20.496337890625, -19.27197265625, -18.047607421875, -16.8232421875, -15.598876953125, -14.37451171875, -13.150146484375, -11.92578125, -10.701416015625, -9.47705078125, -8.252685546875, -7.0283203125, -5.803955078125, -4.57958984375, -3.355224609375, -2.130859375, -0.906494140625, 0.31787109375, 1.542236328125, 2.7666015625, 3.990966796875, 5.21533203125, 6.439697265625, 7.6640625, 8.888427734375, 10.11279296875, 11.337158203125, 12.5615234375, 13.785888671875, 15.01025390625, 16.234619140625, 17.458984375, 18.683349609375, 19.90771484375, 21.132080078125, 22.3564453125, 23.580810546875, 24.80517578125, 26.029541015625, 27.25390625, 28.478271484375, 29.70263671875, 30.927001953125, 32.1513671875, 33.375732421875, 34.60009765625, 35.824462890625, 37.048828125, 38.273193359375, 39.49755859375, 40.721923828125, 41.9462890625, 43.170654296875, 44.39501953125, 45.619384765625, 46.84375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 14.0, 13.0, 19.0, 23.0, 47.0, 48.0, 101.0, 114.0, 182.0, 330.0, 524.0, 978.0, 1976.0, 4405.0, 11937.0, 41592.0, 286570.0, 591956.0, 77240.0, 18320.0, 6445.0, 2655.0, 1274.0, 715.0, 393.0, 239.0, 126.0, 82.0, 63.0, 42.0, 38.0, 20.0, 18.0, 14.0, 5.0, 5.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.796875, -21.074951171875, -20.35302734375, -19.631103515625, -18.9091796875, -18.187255859375, -17.46533203125, -16.743408203125, -16.021484375, -15.299560546875, -14.57763671875, -13.855712890625, -13.1337890625, -12.411865234375, -11.68994140625, -10.968017578125, -10.24609375, -9.524169921875, -8.80224609375, -8.080322265625, -7.3583984375, -6.636474609375, -5.91455078125, -5.192626953125, -4.470703125, -3.748779296875, -3.02685546875, -2.304931640625, -1.5830078125, -0.861083984375, -0.13916015625, 0.582763671875, 1.3046875, 2.026611328125, 2.74853515625, 3.470458984375, 4.1923828125, 4.914306640625, 5.63623046875, 6.358154296875, 7.080078125, 7.802001953125, 8.52392578125, 9.245849609375, 9.9677734375, 10.689697265625, 11.41162109375, 12.133544921875, 12.85546875, 13.577392578125, 14.29931640625, 15.021240234375, 15.7431640625, 16.465087890625, 17.18701171875, 17.908935546875, 18.630859375, 19.352783203125, 20.07470703125, 20.796630859375, 21.5185546875, 22.240478515625, 22.96240234375, 23.684326171875, 24.40625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 18.0, 19.0, 64.0, 180.0, 400.0, 180.0, 60.0, 26.0, 17.0, 7.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.018890380859375, -0.01849287748336792, -0.01809537410736084, -0.01769787073135376, -0.01730036735534668, -0.0169028639793396, -0.01650536060333252, -0.01610785722732544, -0.01571035385131836, -0.01531285047531128, -0.0149153470993042, -0.01451784372329712, -0.014120340347290039, -0.013722836971282959, -0.013325333595275879, -0.012927830219268799, -0.012530326843261719, -0.012132823467254639, -0.011735320091247559, -0.011337816715240479, -0.010940313339233398, -0.010542809963226318, -0.010145306587219238, -0.009747803211212158, -0.009350299835205078, -0.008952796459197998, -0.008555293083190918, -0.008157789707183838, -0.007760286331176758, -0.007362782955169678, -0.006965279579162598, -0.006567776203155518, -0.0061702728271484375, -0.005772769451141357, -0.005375266075134277, -0.004977762699127197, -0.004580259323120117, -0.004182755947113037, -0.003785252571105957, -0.003387749195098877, -0.002990245819091797, -0.002592742443084717, -0.0021952390670776367, -0.0017977356910705566, -0.0014002323150634766, -0.0010027289390563965, -0.0006052255630493164, -0.00020772218704223633, 0.00018978118896484375, 0.0005872845649719238, 0.000984787940979004, 0.001382291316986084, 0.001779794692993164, 0.002177298069000244, 0.0025748014450073242, 0.0029723048210144043, 0.0033698081970214844, 0.0037673115730285645, 0.0041648149490356445, 0.004562318325042725, 0.004959821701049805, 0.005357325077056885, 0.005754828453063965, 0.006152331829071045, 0.006549835205078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 11.0, 20.0, 30.0, 32.0, 63.0, 72.0, 134.0, 242.0, 374.0, 670.0, 1150.0, 2310.0, 5140.0, 13539.0, 44681.0, 276872.0, 581807.0, 85428.0, 21361.0, 7818.0, 3175.0, 1603.0, 806.0, 471.0, 266.0, 146.0, 110.0, 76.0, 32.0, 24.0, 26.0, 19.0, 11.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.5615234375, -17.966796875, -17.3720703125, -16.77734375, -16.1826171875, -15.587890625, -14.9931640625, -14.3984375, -13.8037109375, -13.208984375, -12.6142578125, -12.01953125, -11.4248046875, -10.830078125, -10.2353515625, -9.640625, -9.0458984375, -8.451171875, -7.8564453125, -7.26171875, -6.6669921875, -6.072265625, -5.4775390625, -4.8828125, -4.2880859375, -3.693359375, -3.0986328125, -2.50390625, -1.9091796875, -1.314453125, -0.7197265625, -0.125, 0.4697265625, 1.064453125, 1.6591796875, 2.25390625, 2.8486328125, 3.443359375, 4.0380859375, 4.6328125, 5.2275390625, 5.822265625, 6.4169921875, 7.01171875, 7.6064453125, 8.201171875, 8.7958984375, 9.390625, 9.9853515625, 10.580078125, 11.1748046875, 11.76953125, 12.3642578125, 12.958984375, 13.5537109375, 14.1484375, 14.7431640625, 15.337890625, 15.9326171875, 16.52734375, 17.1220703125, 17.716796875, 18.3115234375, 18.90625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 19.0, 35.0, 55.0, 62.0, 92.0, 119.0, 108.0, 106.0, 87.0, 79.0, 53.0, 29.0, 19.0, 14.0, 12.0, 13.0, 6.0, 4.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-18.21875, -17.7586669921875, -17.298583984375, -16.8385009765625, -16.37841796875, -15.9183349609375, -15.458251953125, -14.9981689453125, -14.5380859375, -14.0780029296875, -13.617919921875, -13.1578369140625, -12.69775390625, -12.2376708984375, -11.777587890625, -11.3175048828125, -10.857421875, -10.3973388671875, -9.937255859375, -9.4771728515625, -9.01708984375, -8.5570068359375, -8.096923828125, -7.6368408203125, -7.1767578125, -6.7166748046875, -6.256591796875, -5.7965087890625, -5.33642578125, -4.8763427734375, -4.416259765625, -3.9561767578125, -3.49609375, -3.0360107421875, -2.575927734375, -2.1158447265625, -1.65576171875, -1.1956787109375, -0.735595703125, -0.2755126953125, 0.1845703125, 0.6446533203125, 1.104736328125, 1.5648193359375, 2.02490234375, 2.4849853515625, 2.945068359375, 3.4051513671875, 3.865234375, 4.3253173828125, 4.785400390625, 5.2454833984375, 5.70556640625, 6.1656494140625, 6.625732421875, 7.0858154296875, 7.5458984375, 8.0059814453125, 8.466064453125, 8.9261474609375, 9.38623046875, 9.8463134765625, 10.306396484375, 10.7664794921875, 11.2265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 3.0, 16.0, 25.0, 46.0, 65.0, 113.0, 128.0, 141.0, 135.0, 114.0, 72.0, 66.0, 23.0, 25.0, 13.0, 10.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.1841735839844, -294.5325622558594, -284.8809814453125, -275.2293701171875, -265.5777587890625, -255.92616271972656, -246.27456665039062, -236.62295532226562, -226.9713592529297, -217.31976318359375, -207.66815185546875, -198.0165557861328, -188.36495971679688, -178.71334838867188, -169.06175231933594, -159.41015625, -149.758544921875, -140.10694885253906, -130.45533752441406, -120.80374145507812, -111.15213775634766, -101.50053405761719, -91.84893798828125, -82.19733428955078, -72.54573059082031, -62.894126892089844, -53.24252700805664, -43.59092712402344, -33.93932342529297, -24.2877197265625, -14.636119842529297, -4.984519958496094, 4.667083740234375, 14.318685531616211, 23.970287322998047, 33.62188720703125, 43.27349090576172, 52.92509460449219, 62.57669448852539, 72.2282943725586, 81.87989807128906, 91.53150177001953, 101.18310546875, 110.83470153808594, 120.4863052368164, 130.13790893554688, 139.7895050048828, 149.44110107421875, 159.09271240234375, 168.7443084716797, 178.3959197998047, 188.04751586914062, 197.69912719726562, 207.35072326660156, 217.0023193359375, 226.6539306640625, 236.30552673339844, 245.95712280273438, 255.60873413085938, 265.2603454589844, 274.91192626953125, 284.56353759765625, 294.21514892578125, 303.8667297363281, 313.5183410644531]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 5.0, 4.0, 10.0, 8.0, 5.0, 13.0, 17.0, 19.0, 18.0, 35.0, 16.0, 22.0, 35.0, 33.0, 49.0, 43.0, 34.0, 42.0, 41.0, 51.0, 40.0, 41.0, 41.0, 40.0, 42.0, 42.0, 34.0, 26.0, 34.0, 26.0, 22.0, 15.0, 17.0, 12.0, 9.0, 9.0, 12.0, 8.0, 9.0, 8.0, 3.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-171.1358642578125, -166.36476135253906, -161.59365844726562, -156.8225555419922, -152.05145263671875, -147.28036499023438, -142.50926208496094, -137.7381591796875, -132.96705627441406, -128.19595336914062, -123.42485046386719, -118.65375518798828, -113.88265228271484, -109.1115493774414, -104.3404541015625, -99.56935119628906, -94.79824829101562, -90.02714538574219, -85.25604248046875, -80.48494720458984, -75.7138442993164, -70.94274139404297, -66.17164611816406, -61.400543212890625, -56.62944030761719, -51.85833740234375, -47.08723831176758, -42.316139221191406, -37.54503631591797, -32.77393341064453, -28.00283432006836, -23.231735229492188, -18.460617065429688, -13.689516067504883, -8.918415069580078, -4.147314071655273, 0.6237869262695312, 5.394887924194336, 10.16598892211914, 14.937088012695312, 19.70819091796875, 24.479291915893555, 29.25039291381836, 34.02149200439453, 38.79259490966797, 43.563697814941406, 48.33479690551758, 53.10589599609375, 57.87699890136719, 62.648101806640625, 67.41920471191406, 72.19029998779297, 76.9614028930664, 81.73250579833984, 86.50360107421875, 91.27470397949219, 96.04580688476562, 100.81690979003906, 105.5880126953125, 110.3591079711914, 115.13021087646484, 119.90131378173828, 124.67240905761719, 129.44351196289062, 134.21461486816406]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 2.0, 6.0, 6.0, 17.0, 15.0, 34.0, 36.0, 52.0, 81.0, 103.0, 154.0, 253.0, 404.0, 669.0, 1215.0, 2237.0, 4708.0, 10735.0, 32251.0, 236190.0, 3794677.0, 77477.0, 18548.0, 7120.0, 3282.0, 1661.0, 873.0, 549.0, 342.0, 218.0, 125.0, 86.0, 39.0, 38.0, 26.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.25, -74.2041015625, -72.158203125, -70.1123046875, -68.06640625, -66.0205078125, -63.974609375, -61.9287109375, -59.8828125, -57.8369140625, -55.791015625, -53.7451171875, -51.69921875, -49.6533203125, -47.607421875, -45.5615234375, -43.515625, -41.4697265625, -39.423828125, -37.3779296875, -35.33203125, -33.2861328125, -31.240234375, -29.1943359375, -27.1484375, -25.1025390625, -23.056640625, -21.0107421875, -18.96484375, -16.9189453125, -14.873046875, -12.8271484375, -10.78125, -8.7353515625, -6.689453125, -4.6435546875, -2.59765625, -0.5517578125, 1.494140625, 3.5400390625, 5.5859375, 7.6318359375, 9.677734375, 11.7236328125, 13.76953125, 15.8154296875, 17.861328125, 19.9072265625, 21.953125, 23.9990234375, 26.044921875, 28.0908203125, 30.13671875, 32.1826171875, 34.228515625, 36.2744140625, 38.3203125, 40.3662109375, 42.412109375, 44.4580078125, 46.50390625, 48.5498046875, 50.595703125, 52.6416015625, 54.6875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 14.0, 15.0, 8.0, 17.0, 15.0, 20.0, 34.0, 39.0, 42.0, 46.0, 44.0, 57.0, 58.0, 36.0, 51.0, 45.0, 42.0, 52.0, 44.0, 55.0, 46.0, 33.0, 37.0, 29.0, 23.0, 14.0, 24.0, 11.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.0523681640625, -7.792236328125, -7.5321044921875, -7.27197265625, -7.0118408203125, -6.751708984375, -6.4915771484375, -6.2314453125, -5.9713134765625, -5.711181640625, -5.4510498046875, -5.19091796875, -4.9307861328125, -4.670654296875, -4.4105224609375, -4.150390625, -3.8902587890625, -3.630126953125, -3.3699951171875, -3.10986328125, -2.8497314453125, -2.589599609375, -2.3294677734375, -2.0693359375, -1.8092041015625, -1.549072265625, -1.2889404296875, -1.02880859375, -0.7686767578125, -0.508544921875, -0.2484130859375, 0.01171875, 0.2718505859375, 0.531982421875, 0.7921142578125, 1.05224609375, 1.3123779296875, 1.572509765625, 1.8326416015625, 2.0927734375, 2.3529052734375, 2.613037109375, 2.8731689453125, 3.13330078125, 3.3934326171875, 3.653564453125, 3.9136962890625, 4.173828125, 4.4339599609375, 4.694091796875, 4.9542236328125, 5.21435546875, 5.4744873046875, 5.734619140625, 5.9947509765625, 6.2548828125, 6.5150146484375, 6.775146484375, 7.0352783203125, 7.29541015625, 7.5555419921875, 7.815673828125, 8.0758056640625, 8.3359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 9.0, 11.0, 16.0, 18.0, 22.0, 21.0, 45.0, 53.0, 76.0, 140.0, 200.0, 342.0, 569.0, 1052.0, 2346.0, 6104.0, 20481.0, 143394.0, 3863223.0, 125591.0, 19523.0, 6054.0, 2356.0, 1124.0, 582.0, 323.0, 181.0, 146.0, 78.0, 52.0, 33.0, 22.0, 18.0, 14.0, 15.0, 7.0, 5.0, 5.0, 7.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-91.8125, -89.1494140625, -86.486328125, -83.8232421875, -81.16015625, -78.4970703125, -75.833984375, -73.1708984375, -70.5078125, -67.8447265625, -65.181640625, -62.5185546875, -59.85546875, -57.1923828125, -54.529296875, -51.8662109375, -49.203125, -46.5400390625, -43.876953125, -41.2138671875, -38.55078125, -35.8876953125, -33.224609375, -30.5615234375, -27.8984375, -25.2353515625, -22.572265625, -19.9091796875, -17.24609375, -14.5830078125, -11.919921875, -9.2568359375, -6.59375, -3.9306640625, -1.267578125, 1.3955078125, 4.05859375, 6.7216796875, 9.384765625, 12.0478515625, 14.7109375, 17.3740234375, 20.037109375, 22.7001953125, 25.36328125, 28.0263671875, 30.689453125, 33.3525390625, 36.015625, 38.6787109375, 41.341796875, 44.0048828125, 46.66796875, 49.3310546875, 51.994140625, 54.6572265625, 57.3203125, 59.9833984375, 62.646484375, 65.3095703125, 67.97265625, 70.6357421875, 73.298828125, 75.9619140625, 78.625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 17.0, 30.0, 33.0, 92.0, 223.0, 988.0, 2253.0, 228.0, 84.0, 33.0, 25.0, 14.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.994140625, -47.80078125, -46.607421875, -45.4140625, -44.220703125, -43.02734375, -41.833984375, -40.640625, -39.447265625, -38.25390625, -37.060546875, -35.8671875, -34.673828125, -33.48046875, -32.287109375, -31.09375, -29.900390625, -28.70703125, -27.513671875, -26.3203125, -25.126953125, -23.93359375, -22.740234375, -21.546875, -20.353515625, -19.16015625, -17.966796875, -16.7734375, -15.580078125, -14.38671875, -13.193359375, -12.0, -10.806640625, -9.61328125, -8.419921875, -7.2265625, -6.033203125, -4.83984375, -3.646484375, -2.453125, -1.259765625, -0.06640625, 1.126953125, 2.3203125, 3.513671875, 4.70703125, 5.900390625, 7.09375, 8.287109375, 9.48046875, 10.673828125, 11.8671875, 13.060546875, 14.25390625, 15.447265625, 16.640625, 17.833984375, 19.02734375, 20.220703125, 21.4140625, 22.607421875, 23.80078125, 24.994140625, 26.1875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 17.0, 36.0, 105.0, 272.0, 328.0, 171.0, 46.0, 15.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-497.5877380371094, -486.80401611328125, -476.0202941894531, -465.236572265625, -454.4528503417969, -443.66912841796875, -432.88543701171875, -422.1017150878906, -411.3179931640625, -400.5342712402344, -389.75054931640625, -378.9668273925781, -368.18310546875, -357.3994140625, -346.61566162109375, -335.83197021484375, -325.0482177734375, -314.2644958496094, -303.48077392578125, -292.6970520019531, -281.913330078125, -271.129638671875, -260.34588623046875, -249.56219482421875, -238.77847290039062, -227.9947509765625, -217.21102905273438, -206.42730712890625, -195.6436004638672, -184.85987854003906, -174.07615661621094, -163.29244995117188, -152.5087432861328, -141.7250213623047, -130.94129943847656, -120.15758514404297, -109.37387084960938, -98.59014892578125, -87.80642700195312, -77.02271270751953, -66.2389907836914, -55.45527267456055, -44.67155456542969, -33.88783264160156, -23.104114532470703, -12.320396423339844, -1.5366744995117188, 9.247039794921875, 20.03076171875, 30.81447982788086, 41.59819793701172, 52.381919860839844, 63.1656379699707, 73.94935607910156, 84.73307800292969, 95.51679229736328, 106.3005142211914, 117.08423614501953, 127.86795043945312, 138.65167236328125, 149.43539428710938, 160.2191162109375, 171.00283813476562, 181.7865447998047, 192.5702667236328]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 13.0, 21.0, 9.0, 19.0, 22.0, 30.0, 34.0, 40.0, 40.0, 40.0, 49.0, 54.0, 50.0, 54.0, 49.0, 46.0, 46.0, 42.0, 47.0, 43.0, 39.0, 31.0, 23.0, 26.0, 24.0, 20.0, 9.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.95223999023438, -70.51971435546875, -68.0871810913086, -65.65465545654297, -63.22212600708008, -60.78959655761719, -58.35707092285156, -55.92454147338867, -53.49201202392578, -51.05948257446289, -48.626953125, -46.194427490234375, -43.761898040771484, -41.329368591308594, -38.89684295654297, -36.46431350708008, -34.03178405761719, -31.599254608154297, -29.16672706604004, -26.73419952392578, -24.30167007446289, -21.869140625, -19.436613082885742, -17.004085540771484, -14.571556091308594, -12.13902759552002, -9.706499099731445, -7.273970603942871, -4.841442108154297, -2.4089136123657227, 0.023614883422851562, 2.4561424255371094, 4.888671875, 7.321200370788574, 9.753728866577148, 12.186257362365723, 14.618785858154297, 17.051315307617188, 19.483842849731445, 21.916370391845703, 24.348899841308594, 26.781429290771484, 29.213956832885742, 31.646484375, 34.07901382446289, 36.51154327392578, 38.944068908691406, 41.3765983581543, 43.80912780761719, 46.24165725708008, 48.67418670654297, 51.106712341308594, 53.539241790771484, 55.971771240234375, 58.404296875, 60.83682632446289, 63.26935577392578, 65.7018814086914, 68.13441467285156, 70.56694030761719, 72.99946594238281, 75.43199920654297, 77.8645248413086, 80.29705810546875, 82.72958374023438]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 0.0, 1.0, 10.0, 12.0, 19.0, 15.0, 22.0, 49.0, 55.0, 91.0, 116.0, 187.0, 273.0, 346.0, 558.0, 885.0, 1421.0, 2339.0, 3864.0, 6781.0, 13252.0, 26668.0, 57851.0, 145256.0, 408541.0, 224001.0, 81783.0, 35703.0, 17219.0, 8670.0, 4855.0, 2850.0, 1689.0, 1037.0, 685.0, 437.0, 310.0, 192.0, 131.0, 108.0, 79.0, 46.0, 42.0, 36.0, 29.0, 13.0, 6.0, 10.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-27.3125, -26.501953125, -25.69140625, -24.880859375, -24.0703125, -23.259765625, -22.44921875, -21.638671875, -20.828125, -20.017578125, -19.20703125, -18.396484375, -17.5859375, -16.775390625, -15.96484375, -15.154296875, -14.34375, -13.533203125, -12.72265625, -11.912109375, -11.1015625, -10.291015625, -9.48046875, -8.669921875, -7.859375, -7.048828125, -6.23828125, -5.427734375, -4.6171875, -3.806640625, -2.99609375, -2.185546875, -1.375, -0.564453125, 0.24609375, 1.056640625, 1.8671875, 2.677734375, 3.48828125, 4.298828125, 5.109375, 5.919921875, 6.73046875, 7.541015625, 8.3515625, 9.162109375, 9.97265625, 10.783203125, 11.59375, 12.404296875, 13.21484375, 14.025390625, 14.8359375, 15.646484375, 16.45703125, 17.267578125, 18.078125, 18.888671875, 19.69921875, 20.509765625, 21.3203125, 22.130859375, 22.94140625, 23.751953125, 24.5625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 8.0, 6.0, 9.0, 6.0, 12.0, 12.0, 18.0, 24.0, 14.0, 25.0, 34.0, 25.0, 39.0, 33.0, 39.0, 31.0, 25.0, 36.0, 47.0, 37.0, 43.0, 46.0, 42.0, 43.0, 40.0, 29.0, 33.0, 30.0, 30.0, 23.0, 25.0, 24.0, 19.0, 12.0, 8.0, 14.0, 9.0, 5.0, 9.0, 6.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-7.71875, -7.4967041015625, -7.274658203125, -7.0526123046875, -6.83056640625, -6.6085205078125, -6.386474609375, -6.1644287109375, -5.9423828125, -5.7203369140625, -5.498291015625, -5.2762451171875, -5.05419921875, -4.8321533203125, -4.610107421875, -4.3880615234375, -4.166015625, -3.9439697265625, -3.721923828125, -3.4998779296875, -3.27783203125, -3.0557861328125, -2.833740234375, -2.6116943359375, -2.3896484375, -2.1676025390625, -1.945556640625, -1.7235107421875, -1.50146484375, -1.2794189453125, -1.057373046875, -0.8353271484375, -0.61328125, -0.3912353515625, -0.169189453125, 0.0528564453125, 0.27490234375, 0.4969482421875, 0.718994140625, 0.9410400390625, 1.1630859375, 1.3851318359375, 1.607177734375, 1.8292236328125, 2.05126953125, 2.2733154296875, 2.495361328125, 2.7174072265625, 2.939453125, 3.1614990234375, 3.383544921875, 3.6055908203125, 3.82763671875, 4.0496826171875, 4.271728515625, 4.4937744140625, 4.7158203125, 4.9378662109375, 5.159912109375, 5.3819580078125, 5.60400390625, 5.8260498046875, 6.048095703125, 6.2701416015625, 6.4921875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 17.0, 19.0, 27.0, 35.0, 53.0, 76.0, 126.0, 191.0, 293.0, 533.0, 895.0, 1561.0, 2923.0, 6259.0, 15001.0, 41950.0, 175214.0, 624114.0, 122420.0, 33123.0, 12354.0, 5306.0, 2652.0, 1330.0, 740.0, 480.0, 289.0, 167.0, 128.0, 69.0, 54.0, 34.0, 21.0, 15.0, 18.0, 12.0, 13.0, 4.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-43.71875, -42.40966796875, -41.1005859375, -39.79150390625, -38.482421875, -37.17333984375, -35.8642578125, -34.55517578125, -33.24609375, -31.93701171875, -30.6279296875, -29.31884765625, -28.009765625, -26.70068359375, -25.3916015625, -24.08251953125, -22.7734375, -21.46435546875, -20.1552734375, -18.84619140625, -17.537109375, -16.22802734375, -14.9189453125, -13.60986328125, -12.30078125, -10.99169921875, -9.6826171875, -8.37353515625, -7.064453125, -5.75537109375, -4.4462890625, -3.13720703125, -1.828125, -0.51904296875, 0.7900390625, 2.09912109375, 3.408203125, 4.71728515625, 6.0263671875, 7.33544921875, 8.64453125, 9.95361328125, 11.2626953125, 12.57177734375, 13.880859375, 15.18994140625, 16.4990234375, 17.80810546875, 19.1171875, 20.42626953125, 21.7353515625, 23.04443359375, 24.353515625, 25.66259765625, 26.9716796875, 28.28076171875, 29.58984375, 30.89892578125, 32.2080078125, 33.51708984375, 34.826171875, 36.13525390625, 37.4443359375, 38.75341796875, 40.0625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 4.0, 9.0, 10.0, 19.0, 19.0, 31.0, 32.0, 40.0, 55.0, 53.0, 55.0, 59.0, 67.0, 74.0, 63.0, 64.0, 61.0, 42.0, 47.0, 33.0, 26.0, 29.0, 22.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.46875, -48.88427734375, -47.2998046875, -45.71533203125, -44.130859375, -42.54638671875, -40.9619140625, -39.37744140625, -37.79296875, -36.20849609375, -34.6240234375, -33.03955078125, -31.455078125, -29.87060546875, -28.2861328125, -26.70166015625, -25.1171875, -23.53271484375, -21.9482421875, -20.36376953125, -18.779296875, -17.19482421875, -15.6103515625, -14.02587890625, -12.44140625, -10.85693359375, -9.2724609375, -7.68798828125, -6.103515625, -4.51904296875, -2.9345703125, -1.35009765625, 0.234375, 1.81884765625, 3.4033203125, 4.98779296875, 6.572265625, 8.15673828125, 9.7412109375, 11.32568359375, 12.91015625, 14.49462890625, 16.0791015625, 17.66357421875, 19.248046875, 20.83251953125, 22.4169921875, 24.00146484375, 25.5859375, 27.17041015625, 28.7548828125, 30.33935546875, 31.923828125, 33.50830078125, 35.0927734375, 36.67724609375, 38.26171875, 39.84619140625, 41.4306640625, 43.01513671875, 44.599609375, 46.18408203125, 47.7685546875, 49.35302734375, 50.9375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 17.0, 21.0, 33.0, 35.0, 37.0, 65.0, 82.0, 155.0, 231.0, 393.0, 631.0, 1192.0, 2055.0, 4010.0, 8994.0, 24223.0, 95114.0, 565868.0, 269306.0, 48105.0, 14957.0, 6213.0, 2909.0, 1560.0, 849.0, 531.0, 295.0, 202.0, 147.0, 88.0, 51.0, 47.0, 30.0, 18.0, 9.0, 13.0, 12.0, 6.0, 10.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.171875, -18.604248046875, -18.03662109375, -17.468994140625, -16.9013671875, -16.333740234375, -15.76611328125, -15.198486328125, -14.630859375, -14.063232421875, -13.49560546875, -12.927978515625, -12.3603515625, -11.792724609375, -11.22509765625, -10.657470703125, -10.08984375, -9.522216796875, -8.95458984375, -8.386962890625, -7.8193359375, -7.251708984375, -6.68408203125, -6.116455078125, -5.548828125, -4.981201171875, -4.41357421875, -3.845947265625, -3.2783203125, -2.710693359375, -2.14306640625, -1.575439453125, -1.0078125, -0.440185546875, 0.12744140625, 0.695068359375, 1.2626953125, 1.830322265625, 2.39794921875, 2.965576171875, 3.533203125, 4.100830078125, 4.66845703125, 5.236083984375, 5.8037109375, 6.371337890625, 6.93896484375, 7.506591796875, 8.07421875, 8.641845703125, 9.20947265625, 9.777099609375, 10.3447265625, 10.912353515625, 11.47998046875, 12.047607421875, 12.615234375, 13.182861328125, 13.75048828125, 14.318115234375, 14.8857421875, 15.453369140625, 16.02099609375, 16.588623046875, 17.15625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 13.0, 14.0, 15.0, 40.0, 81.0, 342.0, 316.0, 81.0, 27.0, 25.0, 16.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013065934181213379, -0.012681245803833008, -0.012296557426452637, -0.011911869049072266, -0.011527180671691895, -0.011142492294311523, -0.010757803916931152, -0.010373115539550781, -0.00998842716217041, -0.009603738784790039, -0.009219050407409668, -0.008834362030029297, -0.008449673652648926, -0.008064985275268555, -0.007680296897888184, -0.0072956085205078125, -0.006910920143127441, -0.00652623176574707, -0.006141543388366699, -0.005756855010986328, -0.005372166633605957, -0.004987478256225586, -0.004602789878845215, -0.004218101501464844, -0.0038334131240844727, -0.0034487247467041016, -0.0030640363693237305, -0.0026793479919433594, -0.0022946596145629883, -0.0019099712371826172, -0.001525282859802246, -0.001140594482421875, -0.0007559061050415039, -0.0003712177276611328, 1.3470649719238281e-05, 0.0003981590270996094, 0.0007828474044799805, 0.0011675357818603516, 0.0015522241592407227, 0.0019369125366210938, 0.002321600914001465, 0.002706289291381836, 0.003090977668762207, 0.003475666046142578, 0.0038603544235229492, 0.00424504280090332, 0.004629731178283691, 0.0050144195556640625, 0.005399107933044434, 0.005783796310424805, 0.006168484687805176, 0.006553173065185547, 0.006937861442565918, 0.007322549819946289, 0.00770723819732666, 0.008091926574707031, 0.008476614952087402, 0.008861303329467773, 0.009245991706848145, 0.009630680084228516, 0.010015368461608887, 0.010400056838989258, 0.010784745216369629, 0.01116943359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 20.0, 35.0, 53.0, 54.0, 109.0, 163.0, 319.0, 557.0, 1103.0, 2364.0, 6106.0, 19826.0, 98932.0, 732409.0, 148827.0, 24762.0, 7344.0, 2849.0, 1210.0, 640.0, 338.0, 205.0, 107.0, 58.0, 43.0, 31.0, 16.0, 10.0, 15.0, 9.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.28125, -26.53564453125, -25.7900390625, -25.04443359375, -24.298828125, -23.55322265625, -22.8076171875, -22.06201171875, -21.31640625, -20.57080078125, -19.8251953125, -19.07958984375, -18.333984375, -17.58837890625, -16.8427734375, -16.09716796875, -15.3515625, -14.60595703125, -13.8603515625, -13.11474609375, -12.369140625, -11.62353515625, -10.8779296875, -10.13232421875, -9.38671875, -8.64111328125, -7.8955078125, -7.14990234375, -6.404296875, -5.65869140625, -4.9130859375, -4.16748046875, -3.421875, -2.67626953125, -1.9306640625, -1.18505859375, -0.439453125, 0.30615234375, 1.0517578125, 1.79736328125, 2.54296875, 3.28857421875, 4.0341796875, 4.77978515625, 5.525390625, 6.27099609375, 7.0166015625, 7.76220703125, 8.5078125, 9.25341796875, 9.9990234375, 10.74462890625, 11.490234375, 12.23583984375, 12.9814453125, 13.72705078125, 14.47265625, 15.21826171875, 15.9638671875, 16.70947265625, 17.455078125, 18.20068359375, 18.9462890625, 19.69189453125, 20.4375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 6.0, 11.0, 9.0, 11.0, 13.0, 37.0, 52.0, 69.0, 82.0, 133.0, 130.0, 119.0, 94.0, 63.0, 44.0, 32.0, 20.0, 13.0, 12.0, 5.0, 10.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.796875, -18.202392578125, -17.60791015625, -17.013427734375, -16.4189453125, -15.824462890625, -15.22998046875, -14.635498046875, -14.041015625, -13.446533203125, -12.85205078125, -12.257568359375, -11.6630859375, -11.068603515625, -10.47412109375, -9.879638671875, -9.28515625, -8.690673828125, -8.09619140625, -7.501708984375, -6.9072265625, -6.312744140625, -5.71826171875, -5.123779296875, -4.529296875, -3.934814453125, -3.34033203125, -2.745849609375, -2.1513671875, -1.556884765625, -0.96240234375, -0.367919921875, 0.2265625, 0.821044921875, 1.41552734375, 2.010009765625, 2.6044921875, 3.198974609375, 3.79345703125, 4.387939453125, 4.982421875, 5.576904296875, 6.17138671875, 6.765869140625, 7.3603515625, 7.954833984375, 8.54931640625, 9.143798828125, 9.73828125, 10.332763671875, 10.92724609375, 11.521728515625, 12.1162109375, 12.710693359375, 13.30517578125, 13.899658203125, 14.494140625, 15.088623046875, 15.68310546875, 16.277587890625, 16.8720703125, 17.466552734375, 18.06103515625, 18.655517578125, 19.25]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 23.0, 67.0, 177.0, 331.0, 236.0, 110.0, 47.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.3223876953125, -163.19183349609375, -142.061279296875, -120.93071746826172, -99.80016326904297, -78.66960906982422, -57.53904724121094, -36.40849304199219, -15.277938842773438, 5.852617263793945, 26.983173370361328, 48.113731384277344, 69.2442855834961, 90.37483978271484, 111.50540161132812, 132.63595581054688, 153.76651000976562, 174.89706420898438, 196.02761840820312, 217.15817260742188, 238.28872680664062, 259.4192810058594, 280.54986572265625, 301.680419921875, 322.81097412109375, 343.9415283203125, 365.07208251953125, 386.20263671875, 407.33319091796875, 428.4637451171875, 449.59429931640625, 470.724853515625, 491.85540771484375, 512.9859619140625, 534.1165161132812, 555.2470703125, 576.3776245117188, 597.5081787109375, 618.6387329101562, 639.769287109375, 660.8998413085938, 682.0303955078125, 703.1609497070312, 724.29150390625, 745.4220581054688, 766.5526123046875, 787.6831665039062, 808.813720703125, 829.9443359375, 851.0748901367188, 872.2054443359375, 893.3359985351562, 914.466552734375, 935.5971069335938, 956.7276611328125, 977.8582153320312, 998.98876953125, 1020.1193237304688, 1041.2498779296875, 1062.3804931640625, 1083.510986328125, 1104.6416015625, 1125.7720947265625, 1146.9027099609375, 1168.033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 8.0, 6.0, 7.0, 7.0, 10.0, 18.0, 13.0, 14.0, 19.0, 21.0, 25.0, 24.0, 24.0, 25.0, 34.0, 39.0, 38.0, 29.0, 38.0, 37.0, 42.0, 36.0, 48.0, 44.0, 36.0, 34.0, 38.0, 38.0, 31.0, 28.0, 19.0, 21.0, 20.0, 22.0, 16.0, 13.0, 15.0, 5.0, 10.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-159.8803253173828, -154.90208435058594, -149.92385864257812, -144.94561767578125, -139.96737670898438, -134.9891357421875, -130.01089477539062, -125.03266906738281, -120.05442810058594, -115.07618713378906, -110.09795379638672, -105.11972045898438, -100.1414794921875, -95.16323852539062, -90.18500518798828, -85.20677185058594, -80.22853088378906, -75.25028991699219, -70.27205657958984, -65.2938232421875, -60.315582275390625, -55.337345123291016, -50.359107971191406, -45.3808708190918, -40.40263366699219, -35.42439651489258, -30.44615936279297, -25.46792221069336, -20.48968505859375, -15.51144790649414, -10.533210754394531, -5.554973602294922, -0.57672119140625, 4.401515960693359, 9.379753112792969, 14.357990264892578, 19.336227416992188, 24.314464569091797, 29.292701721191406, 34.270938873291016, 39.249176025390625, 44.227413177490234, 49.205650329589844, 54.18388748168945, 59.16212463378906, 64.14036560058594, 69.11859893798828, 74.09683227539062, 79.0750732421875, 84.05331420898438, 89.03154754638672, 94.00978088378906, 98.98802185058594, 103.96626281738281, 108.94449615478516, 113.9227294921875, 118.90097045898438, 123.87921142578125, 128.85745239257812, 133.83567810058594, 138.8139190673828, 143.7921600341797, 148.7703857421875, 153.74862670898438, 158.72686767578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 4.0, 12.0, 16.0, 27.0, 27.0, 34.0, 65.0, 74.0, 101.0, 114.0, 178.0, 248.0, 347.0, 444.0, 705.0, 1101.0, 1795.0, 3163.0, 5883.0, 12140.0, 30468.0, 109577.0, 3737310.0, 213040.0, 43991.0, 16193.0, 7428.0, 3729.0, 2175.0, 1313.0, 772.0, 504.0, 341.0, 258.0, 185.0, 122.0, 89.0, 71.0, 52.0, 33.0, 37.0, 13.0, 17.0, 8.0, 11.0, 9.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0], "bins": [-66.375, -64.3427734375, -62.310546875, -60.2783203125, -58.24609375, -56.2138671875, -54.181640625, -52.1494140625, -50.1171875, -48.0849609375, -46.052734375, -44.0205078125, -41.98828125, -39.9560546875, -37.923828125, -35.8916015625, -33.859375, -31.8271484375, -29.794921875, -27.7626953125, -25.73046875, -23.6982421875, -21.666015625, -19.6337890625, -17.6015625, -15.5693359375, -13.537109375, -11.5048828125, -9.47265625, -7.4404296875, -5.408203125, -3.3759765625, -1.34375, 0.6884765625, 2.720703125, 4.7529296875, 6.78515625, 8.8173828125, 10.849609375, 12.8818359375, 14.9140625, 16.9462890625, 18.978515625, 21.0107421875, 23.04296875, 25.0751953125, 27.107421875, 29.1396484375, 31.171875, 33.2041015625, 35.236328125, 37.2685546875, 39.30078125, 41.3330078125, 43.365234375, 45.3974609375, 47.4296875, 49.4619140625, 51.494140625, 53.5263671875, 55.55859375, 57.5908203125, 59.623046875, 61.6552734375, 63.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 7.0, 5.0, 6.0, 7.0, 8.0, 10.0, 15.0, 8.0, 19.0, 23.0, 14.0, 28.0, 28.0, 32.0, 28.0, 32.0, 38.0, 29.0, 34.0, 39.0, 42.0, 39.0, 41.0, 38.0, 46.0, 39.0, 53.0, 36.0, 32.0, 32.0, 29.0, 23.0, 19.0, 16.0, 19.0, 17.0, 9.0, 15.0, 8.0, 9.0, 10.0, 1.0, 5.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.39453125, -7.16351318359375, -6.9324951171875, -6.70147705078125, -6.470458984375, -6.23944091796875, -6.0084228515625, -5.77740478515625, -5.54638671875, -5.31536865234375, -5.0843505859375, -4.85333251953125, -4.622314453125, -4.39129638671875, -4.1602783203125, -3.92926025390625, -3.6982421875, -3.46722412109375, -3.2362060546875, -3.00518798828125, -2.774169921875, -2.54315185546875, -2.3121337890625, -2.08111572265625, -1.85009765625, -1.61907958984375, -1.3880615234375, -1.15704345703125, -0.926025390625, -0.69500732421875, -0.4639892578125, -0.23297119140625, -0.001953125, 0.22906494140625, 0.4600830078125, 0.69110107421875, 0.922119140625, 1.15313720703125, 1.3841552734375, 1.61517333984375, 1.84619140625, 2.07720947265625, 2.3082275390625, 2.53924560546875, 2.770263671875, 3.00128173828125, 3.2322998046875, 3.46331787109375, 3.6943359375, 3.92535400390625, 4.1563720703125, 4.38739013671875, 4.618408203125, 4.84942626953125, 5.0804443359375, 5.31146240234375, 5.54248046875, 5.77349853515625, 6.0045166015625, 6.23553466796875, 6.466552734375, 6.69757080078125, 6.9285888671875, 7.15960693359375, 7.390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 12.0, 11.0, 9.0, 17.0, 22.0, 22.0, 32.0, 52.0, 51.0, 68.0, 76.0, 120.0, 124.0, 186.0, 193.0, 262.0, 342.0, 426.0, 610.0, 895.0, 1483.0, 3126.0, 7892.0, 27869.0, 238192.0, 3801709.0, 82641.0, 16205.0, 5064.0, 2206.0, 1211.0, 705.0, 529.0, 404.0, 281.0, 258.0, 211.0, 172.0, 114.0, 108.0, 82.0, 75.0, 49.0, 38.0, 39.0, 19.0, 24.0, 14.0, 12.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-105.0, -101.6455078125, -98.291015625, -94.9365234375, -91.58203125, -88.2275390625, -84.873046875, -81.5185546875, -78.1640625, -74.8095703125, -71.455078125, -68.1005859375, -64.74609375, -61.3916015625, -58.037109375, -54.6826171875, -51.328125, -47.9736328125, -44.619140625, -41.2646484375, -37.91015625, -34.5556640625, -31.201171875, -27.8466796875, -24.4921875, -21.1376953125, -17.783203125, -14.4287109375, -11.07421875, -7.7197265625, -4.365234375, -1.0107421875, 2.34375, 5.6982421875, 9.052734375, 12.4072265625, 15.76171875, 19.1162109375, 22.470703125, 25.8251953125, 29.1796875, 32.5341796875, 35.888671875, 39.2431640625, 42.59765625, 45.9521484375, 49.306640625, 52.6611328125, 56.015625, 59.3701171875, 62.724609375, 66.0791015625, 69.43359375, 72.7880859375, 76.142578125, 79.4970703125, 82.8515625, 86.2060546875, 89.560546875, 92.9150390625, 96.26953125, 99.6240234375, 102.978515625, 106.3330078125, 109.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 9.0, 15.0, 26.0, 49.0, 139.0, 553.0, 2870.0, 263.0, 68.0, 32.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.90625, -59.986328125, -58.06640625, -56.146484375, -54.2265625, -52.306640625, -50.38671875, -48.466796875, -46.546875, -44.626953125, -42.70703125, -40.787109375, -38.8671875, -36.947265625, -35.02734375, -33.107421875, -31.1875, -29.267578125, -27.34765625, -25.427734375, -23.5078125, -21.587890625, -19.66796875, -17.748046875, -15.828125, -13.908203125, -11.98828125, -10.068359375, -8.1484375, -6.228515625, -4.30859375, -2.388671875, -0.46875, 1.451171875, 3.37109375, 5.291015625, 7.2109375, 9.130859375, 11.05078125, 12.970703125, 14.890625, 16.810546875, 18.73046875, 20.650390625, 22.5703125, 24.490234375, 26.41015625, 28.330078125, 30.25, 32.169921875, 34.08984375, 36.009765625, 37.9296875, 39.849609375, 41.76953125, 43.689453125, 45.609375, 47.529296875, 49.44921875, 51.369140625, 53.2890625, 55.208984375, 57.12890625, 59.048828125, 60.96875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 34.0, 33.0, 53.0, 68.0, 108.0, 120.0, 160.0, 122.0, 75.0, 53.0, 40.0, 22.0, 15.0, 21.0, 6.0, 8.0, 9.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.16546630859375, -134.84486389160156, -128.52427673339844, -122.20367431640625, -115.8830795288086, -109.56248474121094, -103.24188232421875, -96.9212875366211, -90.60069274902344, -84.28009796142578, -77.95950317382812, -71.63890075683594, -65.31830596923828, -58.997711181640625, -52.6771125793457, -46.35651397705078, -40.035919189453125, -33.71532440185547, -27.394725799560547, -21.074129104614258, -14.753532409667969, -8.43293571472168, -2.1123390197753906, 4.208259582519531, 10.528854370117188, 16.849451065063477, 23.170047760009766, 29.490644454956055, 35.811241149902344, 42.1318359375, 48.45243453979492, 54.773033142089844, 61.0936279296875, 67.41422271728516, 73.73481750488281, 80.055419921875, 86.37601470947266, 92.69660949707031, 99.0172119140625, 105.33780670166016, 111.65840148925781, 117.97899627685547, 124.29959106445312, 130.6201934814453, 136.9407958984375, 143.26138305664062, 149.5819854736328, 155.902587890625, 162.22317504882812, 168.5437774658203, 174.86436462402344, 181.18496704101562, 187.50555419921875, 193.82615661621094, 200.14675903320312, 206.46734619140625, 212.78794860839844, 219.10855102539062, 225.42913818359375, 231.74974060058594, 238.07034301757812, 244.39093017578125, 250.71153259277344, 257.0321350097656, 263.35272216796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 5.0, 18.0, 13.0, 13.0, 19.0, 24.0, 19.0, 27.0, 21.0, 36.0, 30.0, 21.0, 37.0, 36.0, 41.0, 37.0, 34.0, 43.0, 49.0, 41.0, 33.0, 44.0, 43.0, 34.0, 35.0, 42.0, 14.0, 20.0, 28.0, 25.0, 22.0, 14.0, 7.0, 9.0, 10.0, 6.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-112.75352478027344, -109.40979766845703, -106.06607055664062, -102.72233581542969, -99.37860870361328, -96.03488159179688, -92.69115447998047, -89.34742736816406, -86.00369262695312, -82.65996551513672, -79.31623840332031, -75.97250366210938, -72.62877655029297, -69.28504943847656, -65.94132232666016, -62.597591400146484, -59.25386428833008, -55.91013717651367, -52.56640625, -49.222679138183594, -45.87894821166992, -42.535221099853516, -39.191490173339844, -35.84776306152344, -32.50403594970703, -29.160306930541992, -25.816577911376953, -22.472850799560547, -19.129119873046875, -15.785392761230469, -12.44166374206543, -9.09793472290039, -5.754203796386719, -2.410475015640259, 0.9332537651062012, 4.276982307434082, 7.620711326599121, 10.964439392089844, 14.308168411254883, 17.651897430419922, 20.99562644958496, 24.33935546875, 27.68308448791504, 31.026813507080078, 34.370540618896484, 37.714271545410156, 41.05799865722656, 44.40172576904297, 47.74545669555664, 51.08918380737305, 54.43291473388672, 57.776641845703125, 61.1203727722168, 64.46409606933594, 67.80783081054688, 71.15155792236328, 74.49528503417969, 77.8390121459961, 81.1827392578125, 84.52647399902344, 87.87020111083984, 91.21392822265625, 94.55765533447266, 97.90138244628906, 101.2451171875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 21.0, 26.0, 33.0, 42.0, 53.0, 68.0, 125.0, 172.0, 234.0, 355.0, 505.0, 739.0, 1173.0, 1824.0, 3011.0, 5414.0, 10012.0, 20681.0, 47120.0, 127742.0, 426942.0, 256452.0, 79960.0, 32147.0, 15191.0, 7546.0, 4119.0, 2426.0, 1442.0, 937.0, 609.0, 428.0, 262.0, 192.0, 134.0, 104.0, 80.0, 63.0, 35.0, 26.0, 14.0, 18.0, 9.0, 11.0, 9.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-44.8125, -43.40234375, -41.9921875, -40.58203125, -39.171875, -37.76171875, -36.3515625, -34.94140625, -33.53125, -32.12109375, -30.7109375, -29.30078125, -27.890625, -26.48046875, -25.0703125, -23.66015625, -22.25, -20.83984375, -19.4296875, -18.01953125, -16.609375, -15.19921875, -13.7890625, -12.37890625, -10.96875, -9.55859375, -8.1484375, -6.73828125, -5.328125, -3.91796875, -2.5078125, -1.09765625, 0.3125, 1.72265625, 3.1328125, 4.54296875, 5.953125, 7.36328125, 8.7734375, 10.18359375, 11.59375, 13.00390625, 14.4140625, 15.82421875, 17.234375, 18.64453125, 20.0546875, 21.46484375, 22.875, 24.28515625, 25.6953125, 27.10546875, 28.515625, 29.92578125, 31.3359375, 32.74609375, 34.15625, 35.56640625, 36.9765625, 38.38671875, 39.796875, 41.20703125, 42.6171875, 44.02734375, 45.4375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 8.0, 6.0, 13.0, 17.0, 15.0, 18.0, 25.0, 31.0, 23.0, 29.0, 29.0, 43.0, 35.0, 44.0, 43.0, 46.0, 44.0, 49.0, 48.0, 41.0, 51.0, 35.0, 28.0, 33.0, 39.0, 26.0, 29.0, 19.0, 16.0, 24.0, 13.0, 12.0, 12.0, 9.0, 6.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-11.2734375, -10.94287109375, -10.6123046875, -10.28173828125, -9.951171875, -9.62060546875, -9.2900390625, -8.95947265625, -8.62890625, -8.29833984375, -7.9677734375, -7.63720703125, -7.306640625, -6.97607421875, -6.6455078125, -6.31494140625, -5.984375, -5.65380859375, -5.3232421875, -4.99267578125, -4.662109375, -4.33154296875, -4.0009765625, -3.67041015625, -3.33984375, -3.00927734375, -2.6787109375, -2.34814453125, -2.017578125, -1.68701171875, -1.3564453125, -1.02587890625, -0.6953125, -0.36474609375, -0.0341796875, 0.29638671875, 0.626953125, 0.95751953125, 1.2880859375, 1.61865234375, 1.94921875, 2.27978515625, 2.6103515625, 2.94091796875, 3.271484375, 3.60205078125, 3.9326171875, 4.26318359375, 4.59375, 4.92431640625, 5.2548828125, 5.58544921875, 5.916015625, 6.24658203125, 6.5771484375, 6.90771484375, 7.23828125, 7.56884765625, 7.8994140625, 8.22998046875, 8.560546875, 8.89111328125, 9.2216796875, 9.55224609375, 9.8828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 7.0, 15.0, 21.0, 28.0, 47.0, 79.0, 131.0, 243.0, 387.0, 662.0, 1286.0, 2535.0, 5259.0, 13111.0, 42051.0, 224656.0, 618690.0, 98678.0, 24367.0, 8476.0, 3707.0, 1805.0, 987.0, 531.0, 293.0, 170.0, 121.0, 76.0, 49.0, 22.0, 17.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5, -64.56005859375, -62.6201171875, -60.68017578125, -58.740234375, -56.80029296875, -54.8603515625, -52.92041015625, -50.98046875, -49.04052734375, -47.1005859375, -45.16064453125, -43.220703125, -41.28076171875, -39.3408203125, -37.40087890625, -35.4609375, -33.52099609375, -31.5810546875, -29.64111328125, -27.701171875, -25.76123046875, -23.8212890625, -21.88134765625, -19.94140625, -18.00146484375, -16.0615234375, -14.12158203125, -12.181640625, -10.24169921875, -8.3017578125, -6.36181640625, -4.421875, -2.48193359375, -0.5419921875, 1.39794921875, 3.337890625, 5.27783203125, 7.2177734375, 9.15771484375, 11.09765625, 13.03759765625, 14.9775390625, 16.91748046875, 18.857421875, 20.79736328125, 22.7373046875, 24.67724609375, 26.6171875, 28.55712890625, 30.4970703125, 32.43701171875, 34.376953125, 36.31689453125, 38.2568359375, 40.19677734375, 42.13671875, 44.07666015625, 46.0166015625, 47.95654296875, 49.896484375, 51.83642578125, 53.7763671875, 55.71630859375, 57.65625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 6.0, 11.0, 12.0, 9.0, 19.0, 19.0, 21.0, 27.0, 30.0, 32.0, 42.0, 42.0, 56.0, 53.0, 45.0, 68.0, 59.0, 42.0, 46.0, 47.0, 44.0, 39.0, 39.0, 27.0, 24.0, 24.0, 20.0, 18.0, 13.0, 13.0, 7.0, 7.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.09375, -50.39453125, -48.6953125, -46.99609375, -45.296875, -43.59765625, -41.8984375, -40.19921875, -38.5, -36.80078125, -35.1015625, -33.40234375, -31.703125, -30.00390625, -28.3046875, -26.60546875, -24.90625, -23.20703125, -21.5078125, -19.80859375, -18.109375, -16.41015625, -14.7109375, -13.01171875, -11.3125, -9.61328125, -7.9140625, -6.21484375, -4.515625, -2.81640625, -1.1171875, 0.58203125, 2.28125, 3.98046875, 5.6796875, 7.37890625, 9.078125, 10.77734375, 12.4765625, 14.17578125, 15.875, 17.57421875, 19.2734375, 20.97265625, 22.671875, 24.37109375, 26.0703125, 27.76953125, 29.46875, 31.16796875, 32.8671875, 34.56640625, 36.265625, 37.96484375, 39.6640625, 41.36328125, 43.0625, 44.76171875, 46.4609375, 48.16015625, 49.859375, 51.55859375, 53.2578125, 54.95703125, 56.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 7.0, 9.0, 22.0, 23.0, 38.0, 37.0, 85.0, 135.0, 221.0, 368.0, 607.0, 1275.0, 2579.0, 5967.0, 16613.0, 65817.0, 520756.0, 360916.0, 49515.0, 13646.0, 5040.0, 2290.0, 1118.0, 594.0, 346.0, 203.0, 101.0, 71.0, 49.0, 37.0, 26.0, 10.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.53125, -24.7783203125, -24.025390625, -23.2724609375, -22.51953125, -21.7666015625, -21.013671875, -20.2607421875, -19.5078125, -18.7548828125, -18.001953125, -17.2490234375, -16.49609375, -15.7431640625, -14.990234375, -14.2373046875, -13.484375, -12.7314453125, -11.978515625, -11.2255859375, -10.47265625, -9.7197265625, -8.966796875, -8.2138671875, -7.4609375, -6.7080078125, -5.955078125, -5.2021484375, -4.44921875, -3.6962890625, -2.943359375, -2.1904296875, -1.4375, -0.6845703125, 0.068359375, 0.8212890625, 1.57421875, 2.3271484375, 3.080078125, 3.8330078125, 4.5859375, 5.3388671875, 6.091796875, 6.8447265625, 7.59765625, 8.3505859375, 9.103515625, 9.8564453125, 10.609375, 11.3623046875, 12.115234375, 12.8681640625, 13.62109375, 14.3740234375, 15.126953125, 15.8798828125, 16.6328125, 17.3857421875, 18.138671875, 18.8916015625, 19.64453125, 20.3974609375, 21.150390625, 21.9033203125, 22.65625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 18.0, 19.0, 40.0, 91.0, 280.0, 274.0, 121.0, 57.0, 33.0, 16.0, 16.0, 4.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00972747802734375, -0.009354829788208008, -0.008982181549072266, -0.008609533309936523, -0.008236885070800781, -0.007864236831665039, -0.007491588592529297, -0.007118940353393555, -0.0067462921142578125, -0.00637364387512207, -0.006000995635986328, -0.005628347396850586, -0.005255699157714844, -0.0048830509185791016, -0.004510402679443359, -0.004137754440307617, -0.003765106201171875, -0.003392457962036133, -0.0030198097229003906, -0.0026471614837646484, -0.0022745132446289062, -0.001901865005493164, -0.0015292167663574219, -0.0011565685272216797, -0.0007839202880859375, -0.0004112720489501953, -3.8623809814453125e-05, 0.00033402442932128906, 0.0007066726684570312, 0.0010793209075927734, 0.0014519691467285156, 0.0018246173858642578, 0.002197265625, 0.002569913864135742, 0.0029425621032714844, 0.0033152103424072266, 0.0036878585815429688, 0.004060506820678711, 0.004433155059814453, 0.004805803298950195, 0.0051784515380859375, 0.00555109977722168, 0.005923748016357422, 0.006296396255493164, 0.006669044494628906, 0.0070416927337646484, 0.007414340972900391, 0.007786989212036133, 0.008159637451171875, 0.008532285690307617, 0.00890493392944336, 0.009277582168579102, 0.009650230407714844, 0.010022878646850586, 0.010395526885986328, 0.01076817512512207, 0.011140823364257812, 0.011513471603393555, 0.011886119842529297, 0.012258768081665039, 0.012631416320800781, 0.013004064559936523, 0.013376712799072266, 0.013749361038208008, 0.01412200927734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 6.0, 7.0, 11.0, 14.0, 28.0, 34.0, 52.0, 82.0, 136.0, 173.0, 303.0, 423.0, 689.0, 1074.0, 2022.0, 3475.0, 6974.0, 16102.0, 47111.0, 206575.0, 550518.0, 148252.0, 37211.0, 13483.0, 6035.0, 3118.0, 1740.0, 1033.0, 654.0, 397.0, 241.0, 165.0, 127.0, 89.0, 49.0, 37.0, 31.0, 14.0, 13.0, 8.0, 6.0, 8.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.9375, -18.35302734375, -17.7685546875, -17.18408203125, -16.599609375, -16.01513671875, -15.4306640625, -14.84619140625, -14.26171875, -13.67724609375, -13.0927734375, -12.50830078125, -11.923828125, -11.33935546875, -10.7548828125, -10.17041015625, -9.5859375, -9.00146484375, -8.4169921875, -7.83251953125, -7.248046875, -6.66357421875, -6.0791015625, -5.49462890625, -4.91015625, -4.32568359375, -3.7412109375, -3.15673828125, -2.572265625, -1.98779296875, -1.4033203125, -0.81884765625, -0.234375, 0.35009765625, 0.9345703125, 1.51904296875, 2.103515625, 2.68798828125, 3.2724609375, 3.85693359375, 4.44140625, 5.02587890625, 5.6103515625, 6.19482421875, 6.779296875, 7.36376953125, 7.9482421875, 8.53271484375, 9.1171875, 9.70166015625, 10.2861328125, 10.87060546875, 11.455078125, 12.03955078125, 12.6240234375, 13.20849609375, 13.79296875, 14.37744140625, 14.9619140625, 15.54638671875, 16.130859375, 16.71533203125, 17.2998046875, 17.88427734375, 18.46875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 7.0, 11.0, 17.0, 12.0, 24.0, 28.0, 32.0, 41.0, 75.0, 60.0, 83.0, 110.0, 92.0, 91.0, 66.0, 55.0, 33.0, 27.0, 21.0, 16.0, 13.0, 15.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.890625, -16.352783203125, -15.81494140625, -15.277099609375, -14.7392578125, -14.201416015625, -13.66357421875, -13.125732421875, -12.587890625, -12.050048828125, -11.51220703125, -10.974365234375, -10.4365234375, -9.898681640625, -9.36083984375, -8.822998046875, -8.28515625, -7.747314453125, -7.20947265625, -6.671630859375, -6.1337890625, -5.595947265625, -5.05810546875, -4.520263671875, -3.982421875, -3.444580078125, -2.90673828125, -2.368896484375, -1.8310546875, -1.293212890625, -0.75537109375, -0.217529296875, 0.3203125, 0.858154296875, 1.39599609375, 1.933837890625, 2.4716796875, 3.009521484375, 3.54736328125, 4.085205078125, 4.623046875, 5.160888671875, 5.69873046875, 6.236572265625, 6.7744140625, 7.312255859375, 7.85009765625, 8.387939453125, 8.92578125, 9.463623046875, 10.00146484375, 10.539306640625, 11.0771484375, 11.614990234375, 12.15283203125, 12.690673828125, 13.228515625, 13.766357421875, 14.30419921875, 14.842041015625, 15.3798828125, 15.917724609375, 16.45556640625, 16.993408203125, 17.53125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 19.0, 18.0, 32.0, 62.0, 82.0, 160.0, 174.0, 143.0, 119.0, 72.0, 47.0, 33.0, 22.0, 6.0, 3.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.1904907226562, -577.7869262695312, -562.38330078125, -546.979736328125, -531.5761108398438, -516.1725463867188, -500.7689514160156, -485.3653564453125, -469.9617614746094, -454.55816650390625, -439.1545715332031, -423.7509765625, -408.347412109375, -392.9438171386719, -377.54022216796875, -362.1366271972656, -346.7330322265625, -331.3294372558594, -315.92584228515625, -300.52227783203125, -285.1186828613281, -269.715087890625, -254.31149291992188, -238.90789794921875, -223.50433349609375, -208.10073852539062, -192.69715881347656, -177.29356384277344, -161.8899688720703, -146.48638916015625, -131.08279418945312, -115.67919921875, -100.27560424804688, -84.87201690673828, -69.46842193603516, -54.06483459472656, -38.6612434387207, -23.257652282714844, -7.85406494140625, 7.549530029296875, 22.95311737060547, 38.35670852661133, 53.76029968261719, 69.16388702392578, 84.56747436523438, 99.9710693359375, 115.3746566772461, 130.77825927734375, 146.1818389892578, 161.58543395996094, 176.989013671875, 192.39260864257812, 207.79620361328125, 223.19979858398438, 238.60337829589844, 254.00697326660156, 269.4105529785156, 284.81414794921875, 300.2177429199219, 315.621337890625, 331.02490234375, 346.4284973144531, 361.83209228515625, 377.2356872558594, 392.6392822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 9.0, 8.0, 11.0, 17.0, 17.0, 19.0, 17.0, 38.0, 20.0, 20.0, 27.0, 35.0, 43.0, 48.0, 51.0, 44.0, 38.0, 42.0, 41.0, 51.0, 48.0, 47.0, 44.0, 33.0, 43.0, 28.0, 20.0, 19.0, 21.0, 10.0, 19.0, 9.0, 12.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-284.66607666015625, -276.7821350097656, -268.898193359375, -261.0142517089844, -253.1302947998047, -245.24635314941406, -237.36241149902344, -229.4784698486328, -221.59451293945312, -213.7105712890625, -205.82662963867188, -197.94268798828125, -190.05873107910156, -182.17478942871094, -174.2908477783203, -166.4069061279297, -158.52296447753906, -150.63902282714844, -142.7550811767578, -134.87112426757812, -126.9871826171875, -119.10324096679688, -111.21929931640625, -103.33535766601562, -95.45140838623047, -87.56746673583984, -79.68351745605469, -71.79957580566406, -63.91563034057617, -56.03168487548828, -48.147743225097656, -40.263797760009766, -32.379852294921875, -24.495906829833984, -16.611963272094727, -8.728019714355469, -0.8440742492675781, 7.0398712158203125, 14.923812866210938, 22.807758331298828, 30.69170379638672, 38.57564926147461, 46.4595947265625, 54.343536376953125, 62.227481842041016, 70.1114273071289, 77.99536895751953, 85.87931823730469, 93.76325988769531, 101.64720153808594, 109.5311508178711, 117.41509246826172, 125.29904174804688, 133.1829833984375, 141.06692504882812, 148.95086669921875, 156.83480834960938, 164.71875, 172.60269165039062, 180.48663330078125, 188.37059020996094, 196.25453186035156, 204.1384735107422, 212.0224151611328, 219.9063720703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 9.0, 6.0, 7.0, 6.0, 7.0, 9.0, 8.0, 15.0, 23.0, 22.0, 35.0, 45.0, 52.0, 85.0, 110.0, 134.0, 202.0, 229.0, 343.0, 510.0, 735.0, 1082.0, 1665.0, 2543.0, 4464.0, 8500.0, 18487.0, 48152.0, 238041.0, 3690454.0, 115384.0, 33001.0, 13288.0, 6541.0, 3623.0, 2087.0, 1295.0, 946.0, 593.0, 393.0, 315.0, 226.0, 171.0, 101.0, 80.0, 69.0, 47.0, 46.0, 29.0, 19.0, 19.0, 13.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 5.0, 2.0, 1.0], "bins": [-66.375, -64.3212890625, -62.267578125, -60.2138671875, -58.16015625, -56.1064453125, -54.052734375, -51.9990234375, -49.9453125, -47.8916015625, -45.837890625, -43.7841796875, -41.73046875, -39.6767578125, -37.623046875, -35.5693359375, -33.515625, -31.4619140625, -29.408203125, -27.3544921875, -25.30078125, -23.2470703125, -21.193359375, -19.1396484375, -17.0859375, -15.0322265625, -12.978515625, -10.9248046875, -8.87109375, -6.8173828125, -4.763671875, -2.7099609375, -0.65625, 1.3974609375, 3.451171875, 5.5048828125, 7.55859375, 9.6123046875, 11.666015625, 13.7197265625, 15.7734375, 17.8271484375, 19.880859375, 21.9345703125, 23.98828125, 26.0419921875, 28.095703125, 30.1494140625, 32.203125, 34.2568359375, 36.310546875, 38.3642578125, 40.41796875, 42.4716796875, 44.525390625, 46.5791015625, 48.6328125, 50.6865234375, 52.740234375, 54.7939453125, 56.84765625, 58.9013671875, 60.955078125, 63.0087890625, 65.0625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 3.0, 8.0, 10.0, 14.0, 16.0, 15.0, 17.0, 23.0, 34.0, 40.0, 28.0, 27.0, 38.0, 44.0, 40.0, 50.0, 40.0, 48.0, 42.0, 49.0, 44.0, 41.0, 36.0, 40.0, 32.0, 25.0, 32.0, 26.0, 15.0, 25.0, 20.0, 14.0, 10.0, 8.0, 8.0, 13.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.5899658203125, -9.258056640625, -8.9261474609375, -8.59423828125, -8.2623291015625, -7.930419921875, -7.5985107421875, -7.2666015625, -6.9346923828125, -6.602783203125, -6.2708740234375, -5.93896484375, -5.6070556640625, -5.275146484375, -4.9432373046875, -4.611328125, -4.2794189453125, -3.947509765625, -3.6156005859375, -3.28369140625, -2.9517822265625, -2.619873046875, -2.2879638671875, -1.9560546875, -1.6241455078125, -1.292236328125, -0.9603271484375, -0.62841796875, -0.2965087890625, 0.035400390625, 0.3673095703125, 0.69921875, 1.0311279296875, 1.363037109375, 1.6949462890625, 2.02685546875, 2.3587646484375, 2.690673828125, 3.0225830078125, 3.3544921875, 3.6864013671875, 4.018310546875, 4.3502197265625, 4.68212890625, 5.0140380859375, 5.345947265625, 5.6778564453125, 6.009765625, 6.3416748046875, 6.673583984375, 7.0054931640625, 7.33740234375, 7.6693115234375, 8.001220703125, 8.3331298828125, 8.6650390625, 8.9969482421875, 9.328857421875, 9.6607666015625, 9.99267578125, 10.3245849609375, 10.656494140625, 10.9884033203125, 11.3203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 8.0, 15.0, 14.0, 25.0, 21.0, 27.0, 34.0, 36.0, 59.0, 70.0, 99.0, 127.0, 214.0, 348.0, 589.0, 1016.0, 2219.0, 6018.0, 26854.0, 1659761.0, 2458543.0, 27167.0, 6051.0, 2233.0, 1064.0, 569.0, 329.0, 180.0, 142.0, 105.0, 77.0, 59.0, 41.0, 34.0, 26.0, 20.0, 21.0, 11.0, 7.0, 9.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-200.375, -194.650390625, -188.92578125, -183.201171875, -177.4765625, -171.751953125, -166.02734375, -160.302734375, -154.578125, -148.853515625, -143.12890625, -137.404296875, -131.6796875, -125.955078125, -120.23046875, -114.505859375, -108.78125, -103.056640625, -97.33203125, -91.607421875, -85.8828125, -80.158203125, -74.43359375, -68.708984375, -62.984375, -57.259765625, -51.53515625, -45.810546875, -40.0859375, -34.361328125, -28.63671875, -22.912109375, -17.1875, -11.462890625, -5.73828125, -0.013671875, 5.7109375, 11.435546875, 17.16015625, 22.884765625, 28.609375, 34.333984375, 40.05859375, 45.783203125, 51.5078125, 57.232421875, 62.95703125, 68.681640625, 74.40625, 80.130859375, 85.85546875, 91.580078125, 97.3046875, 103.029296875, 108.75390625, 114.478515625, 120.203125, 125.927734375, 131.65234375, 137.376953125, 143.1015625, 148.826171875, 154.55078125, 160.275390625, 166.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 16.0, 36.0, 108.0, 500.0, 3073.0, 213.0, 65.0, 22.0, 11.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.375, -126.8740234375, -123.373046875, -119.8720703125, -116.37109375, -112.8701171875, -109.369140625, -105.8681640625, -102.3671875, -98.8662109375, -95.365234375, -91.8642578125, -88.36328125, -84.8623046875, -81.361328125, -77.8603515625, -74.359375, -70.8583984375, -67.357421875, -63.8564453125, -60.35546875, -56.8544921875, -53.353515625, -49.8525390625, -46.3515625, -42.8505859375, -39.349609375, -35.8486328125, -32.34765625, -28.8466796875, -25.345703125, -21.8447265625, -18.34375, -14.8427734375, -11.341796875, -7.8408203125, -4.33984375, -0.8388671875, 2.662109375, 6.1630859375, 9.6640625, 13.1650390625, 16.666015625, 20.1669921875, 23.66796875, 27.1689453125, 30.669921875, 34.1708984375, 37.671875, 41.1728515625, 44.673828125, 48.1748046875, 51.67578125, 55.1767578125, 58.677734375, 62.1787109375, 65.6796875, 69.1806640625, 72.681640625, 76.1826171875, 79.68359375, 83.1845703125, 86.685546875, 90.1865234375, 93.6875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 29.0, 55.0, 49.0, 116.0, 150.0, 180.0, 135.0, 83.0, 64.0, 28.0, 27.0, 18.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-574.7474365234375, -563.2962646484375, -551.8450927734375, -540.3939819335938, -528.9428100585938, -517.4916381835938, -506.04046630859375, -494.58929443359375, -483.1381530761719, -471.6869812011719, -460.23583984375, -448.78466796875, -437.33349609375, -425.8823547363281, -414.4311828613281, -402.98004150390625, -391.52886962890625, -380.07769775390625, -368.6265563964844, -357.1753845214844, -345.7242431640625, -334.2730712890625, -322.8218994140625, -311.3707275390625, -299.9195861816406, -288.4684143066406, -277.01727294921875, -265.56610107421875, -254.1149444580078, -242.66378784179688, -231.21261596679688, -219.76145935058594, -208.310302734375, -196.85914611816406, -185.40798950195312, -173.95681762695312, -162.5056610107422, -151.05450439453125, -139.60333251953125, -128.1521759033203, -116.70101928710938, -105.24986267089844, -93.79869842529297, -82.3475341796875, -70.89637756347656, -59.44521713256836, -47.994056701660156, -36.54289245605469, -25.09173583984375, -13.640575408935547, -2.1894149780273438, 9.26174545288086, 20.712905883789062, 32.164066314697266, 43.61522674560547, 55.06639099121094, 66.51754760742188, 77.96870422363281, 89.41986846923828, 100.87103271484375, 112.32218933105469, 123.77334594726562, 135.22451782226562, 146.67567443847656, 158.1268310546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0, 7.0, 10.0, 5.0, 7.0, 10.0, 10.0, 16.0, 10.0, 16.0, 17.0, 22.0, 26.0, 25.0, 25.0, 31.0, 38.0, 27.0, 30.0, 43.0, 52.0, 34.0, 41.0, 40.0, 52.0, 39.0, 37.0, 43.0, 53.0, 24.0, 24.0, 33.0, 28.0, 15.0, 18.0, 17.0, 13.0, 9.0, 13.0, 5.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-137.32858276367188, -132.5045166015625, -127.68045806884766, -122.85639190673828, -118.03233337402344, -113.20826721191406, -108.38420104980469, -103.56013488769531, -98.73607635498047, -93.9120101928711, -89.08795166015625, -84.26388549804688, -79.4398193359375, -74.61576080322266, -69.79169464111328, -64.96763610839844, -60.14356994628906, -55.31950759887695, -50.495445251464844, -45.67137908935547, -40.84731674194336, -36.02325439453125, -31.199190139770508, -26.375125885009766, -21.551063537597656, -16.727001190185547, -11.902936935424805, -7.078873634338379, -2.254810333251953, 2.5692520141601562, 7.393316268920898, 12.21738052368164, 17.04144287109375, 21.86550521850586, 26.6895694732666, 31.513633728027344, 36.33769607543945, 41.16175842285156, 45.98582458496094, 50.80988693237305, 55.633949279785156, 60.458011627197266, 65.28207397460938, 70.10614013671875, 74.93020629882812, 79.75426483154297, 84.57833099365234, 89.40238952636719, 94.22645568847656, 99.05052185058594, 103.87458038330078, 108.69864654541016, 113.522705078125, 118.34677124023438, 123.17083740234375, 127.99490356445312, 132.8189697265625, 137.64303588867188, 142.46710205078125, 147.29115295410156, 152.11521911621094, 156.9392852783203, 161.7633514404297, 166.58741760253906, 171.41146850585938]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 15.0, 13.0, 20.0, 20.0, 30.0, 47.0, 57.0, 77.0, 109.0, 143.0, 200.0, 260.0, 384.0, 548.0, 902.0, 1465.0, 2783.0, 5954.0, 14397.0, 44557.0, 181452.0, 533318.0, 187892.0, 45758.0, 14840.0, 6142.0, 2835.0, 1556.0, 848.0, 526.0, 372.0, 281.0, 185.0, 135.0, 93.0, 79.0, 63.0, 43.0, 27.0, 27.0, 18.0, 13.0, 14.0, 9.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -62.5673828125, -60.447265625, -58.3271484375, -56.20703125, -54.0869140625, -51.966796875, -49.8466796875, -47.7265625, -45.6064453125, -43.486328125, -41.3662109375, -39.24609375, -37.1259765625, -35.005859375, -32.8857421875, -30.765625, -28.6455078125, -26.525390625, -24.4052734375, -22.28515625, -20.1650390625, -18.044921875, -15.9248046875, -13.8046875, -11.6845703125, -9.564453125, -7.4443359375, -5.32421875, -3.2041015625, -1.083984375, 1.0361328125, 3.15625, 5.2763671875, 7.396484375, 9.5166015625, 11.63671875, 13.7568359375, 15.876953125, 17.9970703125, 20.1171875, 22.2373046875, 24.357421875, 26.4775390625, 28.59765625, 30.7177734375, 32.837890625, 34.9580078125, 37.078125, 39.1982421875, 41.318359375, 43.4384765625, 45.55859375, 47.6787109375, 49.798828125, 51.9189453125, 54.0390625, 56.1591796875, 58.279296875, 60.3994140625, 62.51953125, 64.6396484375, 66.759765625, 68.8798828125, 71.0]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 11.0, 18.0, 18.0, 25.0, 26.0, 25.0, 31.0, 37.0, 33.0, 36.0, 49.0, 46.0, 43.0, 59.0, 46.0, 40.0, 48.0, 46.0, 41.0, 29.0, 28.0, 36.0, 19.0, 27.0, 24.0, 19.0, 26.0, 10.0, 14.0, 7.0, 8.0, 11.0, 4.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.734375, -13.307373046875, -12.88037109375, -12.453369140625, -12.0263671875, -11.599365234375, -11.17236328125, -10.745361328125, -10.318359375, -9.891357421875, -9.46435546875, -9.037353515625, -8.6103515625, -8.183349609375, -7.75634765625, -7.329345703125, -6.90234375, -6.475341796875, -6.04833984375, -5.621337890625, -5.1943359375, -4.767333984375, -4.34033203125, -3.913330078125, -3.486328125, -3.059326171875, -2.63232421875, -2.205322265625, -1.7783203125, -1.351318359375, -0.92431640625, -0.497314453125, -0.0703125, 0.356689453125, 0.78369140625, 1.210693359375, 1.6376953125, 2.064697265625, 2.49169921875, 2.918701171875, 3.345703125, 3.772705078125, 4.19970703125, 4.626708984375, 5.0537109375, 5.480712890625, 5.90771484375, 6.334716796875, 6.76171875, 7.188720703125, 7.61572265625, 8.042724609375, 8.4697265625, 8.896728515625, 9.32373046875, 9.750732421875, 10.177734375, 10.604736328125, 11.03173828125, 11.458740234375, 11.8857421875, 12.312744140625, 12.73974609375, 13.166748046875, 13.59375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 12.0, 8.0, 15.0, 13.0, 28.0, 30.0, 30.0, 52.0, 74.0, 82.0, 120.0, 188.0, 248.0, 320.0, 471.0, 752.0, 1245.0, 2312.0, 4969.0, 17254.0, 133697.0, 756982.0, 104769.0, 14629.0, 4547.0, 2116.0, 1174.0, 732.0, 487.0, 333.0, 229.0, 148.0, 109.0, 101.0, 71.0, 53.0, 42.0, 22.0, 22.0, 12.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-117.75, -114.33203125, -110.9140625, -107.49609375, -104.078125, -100.66015625, -97.2421875, -93.82421875, -90.40625, -86.98828125, -83.5703125, -80.15234375, -76.734375, -73.31640625, -69.8984375, -66.48046875, -63.0625, -59.64453125, -56.2265625, -52.80859375, -49.390625, -45.97265625, -42.5546875, -39.13671875, -35.71875, -32.30078125, -28.8828125, -25.46484375, -22.046875, -18.62890625, -15.2109375, -11.79296875, -8.375, -4.95703125, -1.5390625, 1.87890625, 5.296875, 8.71484375, 12.1328125, 15.55078125, 18.96875, 22.38671875, 25.8046875, 29.22265625, 32.640625, 36.05859375, 39.4765625, 42.89453125, 46.3125, 49.73046875, 53.1484375, 56.56640625, 59.984375, 63.40234375, 66.8203125, 70.23828125, 73.65625, 77.07421875, 80.4921875, 83.91015625, 87.328125, 90.74609375, 94.1640625, 97.58203125, 101.0]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 11.0, 7.0, 11.0, 18.0, 20.0, 32.0, 51.0, 61.0, 52.0, 79.0, 83.0, 89.0, 87.0, 80.0, 54.0, 62.0, 56.0, 39.0, 30.0, 27.0, 21.0, 7.0, 9.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.1875, -105.3994140625, -101.611328125, -97.8232421875, -94.03515625, -90.2470703125, -86.458984375, -82.6708984375, -78.8828125, -75.0947265625, -71.306640625, -67.5185546875, -63.73046875, -59.9423828125, -56.154296875, -52.3662109375, -48.578125, -44.7900390625, -41.001953125, -37.2138671875, -33.42578125, -29.6376953125, -25.849609375, -22.0615234375, -18.2734375, -14.4853515625, -10.697265625, -6.9091796875, -3.12109375, 0.6669921875, 4.455078125, 8.2431640625, 12.03125, 15.8193359375, 19.607421875, 23.3955078125, 27.18359375, 30.9716796875, 34.759765625, 38.5478515625, 42.3359375, 46.1240234375, 49.912109375, 53.7001953125, 57.48828125, 61.2763671875, 65.064453125, 68.8525390625, 72.640625, 76.4287109375, 80.216796875, 84.0048828125, 87.79296875, 91.5810546875, 95.369140625, 99.1572265625, 102.9453125, 106.7333984375, 110.521484375, 114.3095703125, 118.09765625, 121.8857421875, 125.673828125, 129.4619140625, 133.25]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 2.0, 6.0, 18.0, 20.0, 28.0, 50.0, 64.0, 98.0, 111.0, 168.0, 224.0, 300.0, 457.0, 697.0, 1009.0, 1563.0, 2407.0, 4398.0, 13033.0, 260732.0, 729620.0, 20205.0, 5289.0, 2718.0, 1759.0, 1078.0, 746.0, 512.0, 365.0, 266.0, 170.0, 119.0, 82.0, 55.0, 49.0, 30.0, 29.0, 18.0, 18.0, 9.0, 10.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.75, -81.05859375, -78.3671875, -75.67578125, -72.984375, -70.29296875, -67.6015625, -64.91015625, -62.21875, -59.52734375, -56.8359375, -54.14453125, -51.453125, -48.76171875, -46.0703125, -43.37890625, -40.6875, -37.99609375, -35.3046875, -32.61328125, -29.921875, -27.23046875, -24.5390625, -21.84765625, -19.15625, -16.46484375, -13.7734375, -11.08203125, -8.390625, -5.69921875, -3.0078125, -0.31640625, 2.375, 5.06640625, 7.7578125, 10.44921875, 13.140625, 15.83203125, 18.5234375, 21.21484375, 23.90625, 26.59765625, 29.2890625, 31.98046875, 34.671875, 37.36328125, 40.0546875, 42.74609375, 45.4375, 48.12890625, 50.8203125, 53.51171875, 56.203125, 58.89453125, 61.5859375, 64.27734375, 66.96875, 69.66015625, 72.3515625, 75.04296875, 77.734375, 80.42578125, 83.1171875, 85.80859375, 88.5]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 17.0, 76.0, 309.0, 448.0, 100.0, 21.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0355224609375, -0.03444957733154297, -0.03337669372558594, -0.032303810119628906, -0.031230926513671875, -0.030158042907714844, -0.029085159301757812, -0.02801227569580078, -0.02693939208984375, -0.02586650848388672, -0.024793624877929688, -0.023720741271972656, -0.022647857666015625, -0.021574974060058594, -0.020502090454101562, -0.01942920684814453, -0.0183563232421875, -0.01728343963623047, -0.016210556030273438, -0.015137672424316406, -0.014064788818359375, -0.012991905212402344, -0.011919021606445312, -0.010846138000488281, -0.00977325439453125, -0.008700370788574219, -0.0076274871826171875, -0.006554603576660156, -0.005481719970703125, -0.004408836364746094, -0.0033359527587890625, -0.0022630691528320312, -0.001190185546875, -0.00011730194091796875, 0.0009555816650390625, 0.0020284652709960938, 0.003101348876953125, 0.004174232482910156, 0.0052471160888671875, 0.006319999694824219, 0.00739288330078125, 0.008465766906738281, 0.009538650512695312, 0.010611534118652344, 0.011684417724609375, 0.012757301330566406, 0.013830184936523438, 0.014903068542480469, 0.0159759521484375, 0.01704883575439453, 0.018121719360351562, 0.019194602966308594, 0.020267486572265625, 0.021340370178222656, 0.022413253784179688, 0.02348613739013672, 0.02455902099609375, 0.02563190460205078, 0.026704788208007812, 0.027777671813964844, 0.028850555419921875, 0.029923439025878906, 0.030996322631835938, 0.03206920623779297, 0.03314208984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 23.0, 18.0, 23.0, 32.0, 63.0, 79.0, 137.0, 261.0, 443.0, 792.0, 1540.0, 2902.0, 6596.0, 39430.0, 929007.0, 53086.0, 7391.0, 3085.0, 1625.0, 861.0, 419.0, 283.0, 165.0, 88.0, 55.0, 45.0, 19.0, 14.0, 16.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-99.1875, -95.9404296875, -92.693359375, -89.4462890625, -86.19921875, -82.9521484375, -79.705078125, -76.4580078125, -73.2109375, -69.9638671875, -66.716796875, -63.4697265625, -60.22265625, -56.9755859375, -53.728515625, -50.4814453125, -47.234375, -43.9873046875, -40.740234375, -37.4931640625, -34.24609375, -30.9990234375, -27.751953125, -24.5048828125, -21.2578125, -18.0107421875, -14.763671875, -11.5166015625, -8.26953125, -5.0224609375, -1.775390625, 1.4716796875, 4.71875, 7.9658203125, 11.212890625, 14.4599609375, 17.70703125, 20.9541015625, 24.201171875, 27.4482421875, 30.6953125, 33.9423828125, 37.189453125, 40.4365234375, 43.68359375, 46.9306640625, 50.177734375, 53.4248046875, 56.671875, 59.9189453125, 63.166015625, 66.4130859375, 69.66015625, 72.9072265625, 76.154296875, 79.4013671875, 82.6484375, 85.8955078125, 89.142578125, 92.3896484375, 95.63671875, 98.8837890625, 102.130859375, 105.3779296875, 108.625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 6.0, 6.0, 5.0, 19.0, 35.0, 60.0, 133.0, 267.0, 243.0, 98.0, 47.0, 27.0, 15.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.6875, -65.072265625, -62.45703125, -59.841796875, -57.2265625, -54.611328125, -51.99609375, -49.380859375, -46.765625, -44.150390625, -41.53515625, -38.919921875, -36.3046875, -33.689453125, -31.07421875, -28.458984375, -25.84375, -23.228515625, -20.61328125, -17.998046875, -15.3828125, -12.767578125, -10.15234375, -7.537109375, -4.921875, -2.306640625, 0.30859375, 2.923828125, 5.5390625, 8.154296875, 10.76953125, 13.384765625, 16.0, 18.615234375, 21.23046875, 23.845703125, 26.4609375, 29.076171875, 31.69140625, 34.306640625, 36.921875, 39.537109375, 42.15234375, 44.767578125, 47.3828125, 49.998046875, 52.61328125, 55.228515625, 57.84375, 60.458984375, 63.07421875, 65.689453125, 68.3046875, 70.919921875, 73.53515625, 76.150390625, 78.765625, 81.380859375, 83.99609375, 86.611328125, 89.2265625, 91.841796875, 94.45703125, 97.072265625, 99.6875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 5.0, 13.0, 9.0, 17.0, 18.0, 23.0, 30.0, 44.0, 65.0, 76.0, 80.0, 98.0, 89.0, 90.0, 88.0, 64.0, 48.0, 28.0, 19.0, 20.0, 17.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-592.8483276367188, -576.5643310546875, -560.2803955078125, -543.9963989257812, -527.7124633789062, -511.428466796875, -495.1445007324219, -478.86053466796875, -462.5765380859375, -446.2925720214844, -430.00860595703125, -413.724609375, -397.4406433105469, -381.15667724609375, -364.8727111816406, -348.5887451171875, -332.3047790527344, -316.02081298828125, -299.7368469238281, -283.452880859375, -267.16888427734375, -250.88491821289062, -234.6009521484375, -218.31698608398438, -202.0330047607422, -185.74903869628906, -169.46505737304688, -153.18109130859375, -136.89712524414062, -120.61314392089844, -104.32917785644531, -88.04520416259766, -71.76119995117188, -55.47722625732422, -39.19325637817383, -22.909286499023438, -6.625312805175781, 9.658660888671875, 25.942626953125, 42.226600646972656, 58.51057434082031, 74.79454803466797, 91.07852172851562, 107.36248779296875, 123.6464614868164, 139.93043518066406, 156.2144012451172, 172.49838256835938, 188.7823486328125, 205.06631469726562, 221.3502960205078, 237.63426208496094, 253.91824340820312, 270.20220947265625, 286.4861755371094, 302.7701416015625, 319.05413818359375, 335.3381042480469, 351.6220703125, 367.90606689453125, 384.1900329589844, 400.4739990234375, 416.7579650878906, 433.04193115234375, 449.3258972167969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 8.0, 5.0, 4.0, 7.0, 5.0, 13.0, 8.0, 8.0, 11.0, 15.0, 17.0, 25.0, 23.0, 27.0, 27.0, 29.0, 23.0, 35.0, 48.0, 27.0, 42.0, 48.0, 50.0, 37.0, 48.0, 32.0, 54.0, 38.0, 28.0, 30.0, 29.0, 17.0, 29.0, 24.0, 23.0, 9.0, 16.0, 15.0, 18.0, 11.0, 10.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-379.4832763671875, -368.2763671875, -357.0694274902344, -345.8625183105469, -334.6556091308594, -323.44866943359375, -312.24176025390625, -301.03485107421875, -289.82794189453125, -278.62103271484375, -267.4140930175781, -256.2071838378906, -245.00027465820312, -233.79335021972656, -222.58642578125, -211.3795166015625, -200.17257690429688, -188.9656524658203, -177.7587432861328, -166.55181884765625, -155.34490966796875, -144.1379852294922, -132.93106079101562, -121.7241439819336, -110.51722717285156, -99.31031036376953, -88.1033935546875, -76.89646911621094, -65.6895523071289, -54.482635498046875, -43.27571105957031, -32.06879425048828, -20.86187744140625, -9.654958724975586, 1.5519599914550781, 12.758880615234375, 23.965797424316406, 35.17271423339844, 46.379638671875, 57.58655548095703, 68.79347229003906, 80.0003890991211, 91.20730590820312, 102.41423034667969, 113.62114715576172, 124.82806396484375, 136.0349884033203, 147.24191284179688, 158.44882202148438, 169.65574645996094, 180.86265563964844, 192.069580078125, 203.2764892578125, 214.48341369628906, 225.69033813476562, 236.89724731445312, 248.1041717529297, 259.31109619140625, 270.51800537109375, 281.72491455078125, 292.9318542480469, 304.1387634277344, 315.345703125, 326.5526123046875, 337.759521484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 9.0, 11.0, 11.0, 12.0, 19.0, 38.0, 46.0, 59.0, 76.0, 165.0, 201.0, 338.0, 578.0, 979.0, 1901.0, 4742.0, 22472.0, 4143452.0, 11966.0, 3424.0, 1537.0, 823.0, 519.0, 281.0, 185.0, 123.0, 87.0, 58.0, 41.0, 22.0, 19.0, 15.0, 10.0, 7.0, 13.0, 3.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-204.5, -198.71484375, -192.9296875, -187.14453125, -181.359375, -175.57421875, -169.7890625, -164.00390625, -158.21875, -152.43359375, -146.6484375, -140.86328125, -135.078125, -129.29296875, -123.5078125, -117.72265625, -111.9375, -106.15234375, -100.3671875, -94.58203125, -88.796875, -83.01171875, -77.2265625, -71.44140625, -65.65625, -59.87109375, -54.0859375, -48.30078125, -42.515625, -36.73046875, -30.9453125, -25.16015625, -19.375, -13.58984375, -7.8046875, -2.01953125, 3.765625, 9.55078125, 15.3359375, 21.12109375, 26.90625, 32.69140625, 38.4765625, 44.26171875, 50.046875, 55.83203125, 61.6171875, 67.40234375, 73.1875, 78.97265625, 84.7578125, 90.54296875, 96.328125, 102.11328125, 107.8984375, 113.68359375, 119.46875, 125.25390625, 131.0390625, 136.82421875, 142.609375, 148.39453125, 154.1796875, 159.96484375, 165.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 3.0, 13.0, 16.0, 16.0, 21.0, 22.0, 30.0, 33.0, 34.0, 36.0, 39.0, 52.0, 51.0, 30.0, 53.0, 54.0, 47.0, 60.0, 43.0, 45.0, 37.0, 34.0, 27.0, 28.0, 24.0, 28.0, 25.0, 15.0, 15.0, 7.0, 14.0, 6.0, 11.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.421875, -16.885498046875, -16.34912109375, -15.812744140625, -15.2763671875, -14.739990234375, -14.20361328125, -13.667236328125, -13.130859375, -12.594482421875, -12.05810546875, -11.521728515625, -10.9853515625, -10.448974609375, -9.91259765625, -9.376220703125, -8.83984375, -8.303466796875, -7.76708984375, -7.230712890625, -6.6943359375, -6.157958984375, -5.62158203125, -5.085205078125, -4.548828125, -4.012451171875, -3.47607421875, -2.939697265625, -2.4033203125, -1.866943359375, -1.33056640625, -0.794189453125, -0.2578125, 0.278564453125, 0.81494140625, 1.351318359375, 1.8876953125, 2.424072265625, 2.96044921875, 3.496826171875, 4.033203125, 4.569580078125, 5.10595703125, 5.642333984375, 6.1787109375, 6.715087890625, 7.25146484375, 7.787841796875, 8.32421875, 8.860595703125, 9.39697265625, 9.933349609375, 10.4697265625, 11.006103515625, 11.54248046875, 12.078857421875, 12.615234375, 13.151611328125, 13.68798828125, 14.224365234375, 14.7607421875, 15.297119140625, 15.83349609375, 16.369873046875, 16.90625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 26.0, 28.0, 33.0, 60.0, 70.0, 102.0, 125.0, 171.0, 242.0, 310.0, 458.0, 800.0, 1671.0, 4978.0, 73170.0, 4100556.0, 6623.0, 2044.0, 863.0, 516.0, 348.0, 251.0, 224.0, 140.0, 112.0, 96.0, 60.0, 60.0, 34.0, 27.0, 24.0, 13.0, 10.0, 4.0, 2.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-217.0, -207.9921875, -198.984375, -189.9765625, -180.96875, -171.9609375, -162.953125, -153.9453125, -144.9375, -135.9296875, -126.921875, -117.9140625, -108.90625, -99.8984375, -90.890625, -81.8828125, -72.875, -63.8671875, -54.859375, -45.8515625, -36.84375, -27.8359375, -18.828125, -9.8203125, -0.8125, 8.1953125, 17.203125, 26.2109375, 35.21875, 44.2265625, 53.234375, 62.2421875, 71.25, 80.2578125, 89.265625, 98.2734375, 107.28125, 116.2890625, 125.296875, 134.3046875, 143.3125, 152.3203125, 161.328125, 170.3359375, 179.34375, 188.3515625, 197.359375, 206.3671875, 215.375, 224.3828125, 233.390625, 242.3984375, 251.40625, 260.4140625, 269.421875, 278.4296875, 287.4375, 296.4453125, 305.453125, 314.4609375, 323.46875, 332.4765625, 341.484375, 350.4921875, 359.5]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 14.0, 46.0, 3904.0, 67.0, 17.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.1875, -35.67626953125, -34.1650390625, -32.65380859375, -31.142578125, -29.63134765625, -28.1201171875, -26.60888671875, -25.09765625, -23.58642578125, -22.0751953125, -20.56396484375, -19.052734375, -17.54150390625, -16.0302734375, -14.51904296875, -13.0078125, -11.49658203125, -9.9853515625, -8.47412109375, -6.962890625, -5.45166015625, -3.9404296875, -2.42919921875, -0.91796875, 0.59326171875, 2.1044921875, 3.61572265625, 5.126953125, 6.63818359375, 8.1494140625, 9.66064453125, 11.171875, 12.68310546875, 14.1943359375, 15.70556640625, 17.216796875, 18.72802734375, 20.2392578125, 21.75048828125, 23.26171875, 24.77294921875, 26.2841796875, 27.79541015625, 29.306640625, 30.81787109375, 32.3291015625, 33.84033203125, 35.3515625, 36.86279296875, 38.3740234375, 39.88525390625, 41.396484375, 42.90771484375, 44.4189453125, 45.93017578125, 47.44140625, 48.95263671875, 50.4638671875, 51.97509765625, 53.486328125, 54.99755859375, 56.5087890625, 58.02001953125, 59.53125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 13.0, 19.0, 42.0, 78.0, 149.0, 204.0, 179.0, 118.0, 65.0, 46.0, 24.0, 29.0, 10.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.42698669433594, -235.44906616210938, -228.4711456298828, -221.49322509765625, -214.51528930664062, -207.53738403320312, -200.5594482421875, -193.58152770996094, -186.60360717773438, -179.6256866455078, -172.64776611328125, -165.6698455810547, -158.69192504882812, -151.7139892578125, -144.73606872558594, -137.75814819335938, -130.7802276611328, -123.80230712890625, -116.82438659667969, -109.8464584350586, -102.86853790283203, -95.89061737060547, -88.91268920898438, -81.93476867675781, -74.95684814453125, -67.97892761230469, -61.00100326538086, -54.02307891845703, -47.04515838623047, -40.067237854003906, -33.08931350708008, -26.11138916015625, -19.13348388671875, -12.155561447143555, -5.177639007568359, 1.800283432006836, 8.778205871582031, 15.756126403808594, 22.734050750732422, 29.71197509765625, 36.68989562988281, 43.667816162109375, 50.6457405090332, 57.62366485595703, 64.6015853881836, 71.57950592041016, 78.55743408203125, 85.53535461425781, 92.51327514648438, 99.49119567871094, 106.4691162109375, 113.4470443725586, 120.42496490478516, 127.40288543701172, 134.3808135986328, 141.35873413085938, 148.33665466308594, 155.3145751953125, 162.29249572753906, 169.27041625976562, 176.24835205078125, 183.22625732421875, 190.20419311523438, 197.18211364746094, 204.1600341796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 6.0, 9.0, 5.0, 12.0, 8.0, 8.0, 18.0, 16.0, 18.0, 21.0, 17.0, 22.0, 22.0, 28.0, 41.0, 37.0, 36.0, 33.0, 42.0, 31.0, 33.0, 36.0, 36.0, 25.0, 36.0, 28.0, 31.0, 29.0, 26.0, 27.0, 24.0, 28.0, 24.0, 22.0, 19.0, 15.0, 16.0, 27.0, 14.0, 13.0, 16.0, 5.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-63.00270080566406, -60.92894744873047, -58.855194091796875, -56.78144073486328, -54.70768737792969, -52.633934020996094, -50.5601806640625, -48.486427307128906, -46.41267395019531, -44.33892059326172, -42.265167236328125, -40.19141387939453, -38.11766052246094, -36.043907165527344, -33.97015380859375, -31.896400451660156, -29.822647094726562, -27.74889373779297, -25.675140380859375, -23.60138702392578, -21.527633666992188, -19.453880310058594, -17.380126953125, -15.306373596191406, -13.232620239257812, -11.158866882324219, -9.085113525390625, -7.011360168457031, -4.9376068115234375, -2.8638534545898438, -0.79010009765625, 1.2836532592773438, 3.3574066162109375, 5.431159973144531, 7.504913330078125, 9.578666687011719, 11.652420043945312, 13.726173400878906, 15.7999267578125, 17.873680114746094, 19.947433471679688, 22.02118682861328, 24.094940185546875, 26.16869354248047, 28.242446899414062, 30.316200256347656, 32.38995361328125, 34.463706970214844, 36.53746032714844, 38.61121368408203, 40.684967041015625, 42.75872039794922, 44.83247375488281, 46.906227111816406, 48.97998046875, 51.053733825683594, 53.12748718261719, 55.20124053955078, 57.274993896484375, 59.34874725341797, 61.42250061035156, 63.496253967285156, 65.57000732421875, 67.64376068115234, 69.71751403808594]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 15.0, 29.0, 21.0, 29.0, 41.0, 65.0, 89.0, 108.0, 142.0, 201.0, 338.0, 427.0, 677.0, 954.0, 1601.0, 2399.0, 3761.0, 6436.0, 11525.0, 21453.0, 42702.0, 92380.0, 226267.0, 339518.0, 157975.0, 67463.0, 31586.0, 16665.0, 9002.0, 5279.0, 3232.0, 2043.0, 1310.0, 870.0, 574.0, 369.0, 318.0, 200.0, 135.0, 89.0, 66.0, 52.0, 29.0, 26.0, 16.0, 25.0, 14.0, 6.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-48.4375, -46.89013671875, -45.3427734375, -43.79541015625, -42.248046875, -40.70068359375, -39.1533203125, -37.60595703125, -36.05859375, -34.51123046875, -32.9638671875, -31.41650390625, -29.869140625, -28.32177734375, -26.7744140625, -25.22705078125, -23.6796875, -22.13232421875, -20.5849609375, -19.03759765625, -17.490234375, -15.94287109375, -14.3955078125, -12.84814453125, -11.30078125, -9.75341796875, -8.2060546875, -6.65869140625, -5.111328125, -3.56396484375, -2.0166015625, -0.46923828125, 1.078125, 2.62548828125, 4.1728515625, 5.72021484375, 7.267578125, 8.81494140625, 10.3623046875, 11.90966796875, 13.45703125, 15.00439453125, 16.5517578125, 18.09912109375, 19.646484375, 21.19384765625, 22.7412109375, 24.28857421875, 25.8359375, 27.38330078125, 28.9306640625, 30.47802734375, 32.025390625, 33.57275390625, 35.1201171875, 36.66748046875, 38.21484375, 39.76220703125, 41.3095703125, 42.85693359375, 44.404296875, 45.95166015625, 47.4990234375, 49.04638671875, 50.59375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 13.0, 9.0, 7.0, 12.0, 22.0, 12.0, 21.0, 33.0, 34.0, 43.0, 44.0, 59.0, 53.0, 52.0, 50.0, 53.0, 53.0, 57.0, 35.0, 44.0, 34.0, 33.0, 32.0, 28.0, 19.0, 18.0, 18.0, 20.0, 25.0, 12.0, 4.0, 8.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.125, -20.435302734375, -19.74560546875, -19.055908203125, -18.3662109375, -17.676513671875, -16.98681640625, -16.297119140625, -15.607421875, -14.917724609375, -14.22802734375, -13.538330078125, -12.8486328125, -12.158935546875, -11.46923828125, -10.779541015625, -10.08984375, -9.400146484375, -8.71044921875, -8.020751953125, -7.3310546875, -6.641357421875, -5.95166015625, -5.261962890625, -4.572265625, -3.882568359375, -3.19287109375, -2.503173828125, -1.8134765625, -1.123779296875, -0.43408203125, 0.255615234375, 0.9453125, 1.635009765625, 2.32470703125, 3.014404296875, 3.7041015625, 4.393798828125, 5.08349609375, 5.773193359375, 6.462890625, 7.152587890625, 7.84228515625, 8.531982421875, 9.2216796875, 9.911376953125, 10.60107421875, 11.290771484375, 11.98046875, 12.670166015625, 13.35986328125, 14.049560546875, 14.7392578125, 15.428955078125, 16.11865234375, 16.808349609375, 17.498046875, 18.187744140625, 18.87744140625, 19.567138671875, 20.2568359375, 20.946533203125, 21.63623046875, 22.325927734375, 23.015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 10.0, 21.0, 10.0, 23.0, 32.0, 65.0, 83.0, 172.0, 321.0, 479.0, 1048.0, 2382.0, 5725.0, 15785.0, 57909.0, 360688.0, 500628.0, 72490.0, 18831.0, 6627.0, 2598.0, 1261.0, 584.0, 296.0, 181.0, 122.0, 53.0, 43.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.3125, -90.8291015625, -87.345703125, -83.8623046875, -80.37890625, -76.8955078125, -73.412109375, -69.9287109375, -66.4453125, -62.9619140625, -59.478515625, -55.9951171875, -52.51171875, -49.0283203125, -45.544921875, -42.0615234375, -38.578125, -35.0947265625, -31.611328125, -28.1279296875, -24.64453125, -21.1611328125, -17.677734375, -14.1943359375, -10.7109375, -7.2275390625, -3.744140625, -0.2607421875, 3.22265625, 6.7060546875, 10.189453125, 13.6728515625, 17.15625, 20.6396484375, 24.123046875, 27.6064453125, 31.08984375, 34.5732421875, 38.056640625, 41.5400390625, 45.0234375, 48.5068359375, 51.990234375, 55.4736328125, 58.95703125, 62.4404296875, 65.923828125, 69.4072265625, 72.890625, 76.3740234375, 79.857421875, 83.3408203125, 86.82421875, 90.3076171875, 93.791015625, 97.2744140625, 100.7578125, 104.2412109375, 107.724609375, 111.2080078125, 114.69140625, 118.1748046875, 121.658203125, 125.1416015625, 128.625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 19.0, 17.0, 25.0, 30.0, 21.0, 40.0, 47.0, 41.0, 37.0, 59.0, 60.0, 49.0, 45.0, 60.0, 69.0, 56.0, 53.0, 35.0, 39.0, 29.0, 41.0, 21.0, 15.0, 14.0, 9.0, 16.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.375, -110.953125, -106.53125, -102.109375, -97.6875, -93.265625, -88.84375, -84.421875, -80.0, -75.578125, -71.15625, -66.734375, -62.3125, -57.890625, -53.46875, -49.046875, -44.625, -40.203125, -35.78125, -31.359375, -26.9375, -22.515625, -18.09375, -13.671875, -9.25, -4.828125, -0.40625, 4.015625, 8.4375, 12.859375, 17.28125, 21.703125, 26.125, 30.546875, 34.96875, 39.390625, 43.8125, 48.234375, 52.65625, 57.078125, 61.5, 65.921875, 70.34375, 74.765625, 79.1875, 83.609375, 88.03125, 92.453125, 96.875, 101.296875, 105.71875, 110.140625, 114.5625, 118.984375, 123.40625, 127.828125, 132.25, 136.671875, 141.09375, 145.515625, 149.9375, 154.359375, 158.78125, 163.203125, 167.625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 21.0, 32.0, 36.0, 60.0, 88.0, 135.0, 205.0, 317.0, 487.0, 760.0, 1308.0, 2339.0, 4898.0, 12149.0, 43821.0, 447540.0, 466531.0, 44751.0, 12244.0, 4868.0, 2347.0, 1378.0, 775.0, 442.0, 321.0, 173.0, 155.0, 108.0, 66.0, 42.0, 44.0, 19.0, 16.0, 13.0, 7.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.59375, -52.8330078125, -51.072265625, -49.3115234375, -47.55078125, -45.7900390625, -44.029296875, -42.2685546875, -40.5078125, -38.7470703125, -36.986328125, -35.2255859375, -33.46484375, -31.7041015625, -29.943359375, -28.1826171875, -26.421875, -24.6611328125, -22.900390625, -21.1396484375, -19.37890625, -17.6181640625, -15.857421875, -14.0966796875, -12.3359375, -10.5751953125, -8.814453125, -7.0537109375, -5.29296875, -3.5322265625, -1.771484375, -0.0107421875, 1.75, 3.5107421875, 5.271484375, 7.0322265625, 8.79296875, 10.5537109375, 12.314453125, 14.0751953125, 15.8359375, 17.5966796875, 19.357421875, 21.1181640625, 22.87890625, 24.6396484375, 26.400390625, 28.1611328125, 29.921875, 31.6826171875, 33.443359375, 35.2041015625, 36.96484375, 38.7255859375, 40.486328125, 42.2470703125, 44.0078125, 45.7685546875, 47.529296875, 49.2900390625, 51.05078125, 52.8115234375, 54.572265625, 56.3330078125, 58.09375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 15.0, 19.0, 19.0, 23.0, 34.0, 58.0, 78.0, 99.0, 131.0, 120.0, 108.0, 76.0, 51.0, 40.0, 25.0, 13.0, 26.0, 13.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01082611083984375, -0.01050722599029541, -0.01018834114074707, -0.00986945629119873, -0.00955057144165039, -0.00923168659210205, -0.008912801742553711, -0.008593916893005371, -0.008275032043457031, -0.007956147193908691, -0.0076372623443603516, -0.007318377494812012, -0.006999492645263672, -0.006680607795715332, -0.006361722946166992, -0.006042838096618652, -0.0057239532470703125, -0.005405068397521973, -0.005086183547973633, -0.004767298698425293, -0.004448413848876953, -0.004129528999328613, -0.0038106441497802734, -0.0034917593002319336, -0.0031728744506835938, -0.002853989601135254, -0.002535104751586914, -0.0022162199020385742, -0.0018973350524902344, -0.0015784502029418945, -0.0012595653533935547, -0.0009406805038452148, -0.000621795654296875, -0.00030291080474853516, 1.5974044799804688e-05, 0.00033485889434814453, 0.0006537437438964844, 0.0009726285934448242, 0.001291513442993164, 0.001610398292541504, 0.0019292831420898438, 0.0022481679916381836, 0.0025670528411865234, 0.0028859376907348633, 0.003204822540283203, 0.003523707389831543, 0.003842592239379883, 0.004161477088928223, 0.0044803619384765625, 0.004799246788024902, 0.005118131637573242, 0.005437016487121582, 0.005755901336669922, 0.006074786186218262, 0.0063936710357666016, 0.006712555885314941, 0.007031440734863281, 0.007350325584411621, 0.007669210433959961, 0.0079880952835083, 0.00830698013305664, 0.00862586498260498, 0.00894474983215332, 0.00926363468170166, 0.00958251953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 14.0, 15.0, 17.0, 38.0, 64.0, 101.0, 148.0, 348.0, 757.0, 1928.0, 7195.0, 44423.0, 837202.0, 137676.0, 13348.0, 3145.0, 1113.0, 454.0, 242.0, 100.0, 83.0, 42.0, 28.0, 21.0, 10.0, 9.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.8125, -102.7626953125, -99.712890625, -96.6630859375, -93.61328125, -90.5634765625, -87.513671875, -84.4638671875, -81.4140625, -78.3642578125, -75.314453125, -72.2646484375, -69.21484375, -66.1650390625, -63.115234375, -60.0654296875, -57.015625, -53.9658203125, -50.916015625, -47.8662109375, -44.81640625, -41.7666015625, -38.716796875, -35.6669921875, -32.6171875, -29.5673828125, -26.517578125, -23.4677734375, -20.41796875, -17.3681640625, -14.318359375, -11.2685546875, -8.21875, -5.1689453125, -2.119140625, 0.9306640625, 3.98046875, 7.0302734375, 10.080078125, 13.1298828125, 16.1796875, 19.2294921875, 22.279296875, 25.3291015625, 28.37890625, 31.4287109375, 34.478515625, 37.5283203125, 40.578125, 43.6279296875, 46.677734375, 49.7275390625, 52.77734375, 55.8271484375, 58.876953125, 61.9267578125, 64.9765625, 68.0263671875, 71.076171875, 74.1259765625, 77.17578125, 80.2255859375, 83.275390625, 86.3251953125, 89.375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 11.0, 12.0, 16.0, 31.0, 51.0, 88.0, 141.0, 196.0, 171.0, 109.0, 57.0, 28.0, 23.0, 17.0, 9.0, 12.0, 9.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-113.9375, -111.3330078125, -108.728515625, -106.1240234375, -103.51953125, -100.9150390625, -98.310546875, -95.7060546875, -93.1015625, -90.4970703125, -87.892578125, -85.2880859375, -82.68359375, -80.0791015625, -77.474609375, -74.8701171875, -72.265625, -69.6611328125, -67.056640625, -64.4521484375, -61.84765625, -59.2431640625, -56.638671875, -54.0341796875, -51.4296875, -48.8251953125, -46.220703125, -43.6162109375, -41.01171875, -38.4072265625, -35.802734375, -33.1982421875, -30.59375, -27.9892578125, -25.384765625, -22.7802734375, -20.17578125, -17.5712890625, -14.966796875, -12.3623046875, -9.7578125, -7.1533203125, -4.548828125, -1.9443359375, 0.66015625, 3.2646484375, 5.869140625, 8.4736328125, 11.078125, 13.6826171875, 16.287109375, 18.8916015625, 21.49609375, 24.1005859375, 26.705078125, 29.3095703125, 31.9140625, 34.5185546875, 37.123046875, 39.7275390625, 42.33203125, 44.9365234375, 47.541015625, 50.1455078125, 52.75]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 16.0, 21.0, 27.0, 49.0, 58.0, 83.0, 134.0, 152.0, 152.0, 110.0, 73.0, 56.0, 34.0, 13.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-520.7315063476562, -487.66729736328125, -454.60308837890625, -421.53887939453125, -388.47467041015625, -355.41046142578125, -322.3462829589844, -289.2820739746094, -256.2178649902344, -223.15365600585938, -190.08944702148438, -157.02525329589844, -123.96104431152344, -90.89683532714844, -57.8326416015625, -24.7684326171875, 8.2957763671875, 41.359981536865234, 74.42418670654297, 107.48838806152344, 140.55259704589844, 173.61680603027344, 206.68099975585938, 239.74520874023438, 272.8094177246094, 305.8736267089844, 338.9378356933594, 372.00201416015625, 405.06622314453125, 438.13043212890625, 471.19464111328125, 504.25885009765625, 537.322998046875, 570.38720703125, 603.451416015625, 636.515625, 669.579833984375, 702.64404296875, 735.708251953125, 768.7724609375, 801.836669921875, 834.90087890625, 867.965087890625, 901.029296875, 934.093505859375, 967.15771484375, 1000.221923828125, 1033.2861328125, 1066.350341796875, 1099.41455078125, 1132.478759765625, 1165.54296875, 1198.607177734375, 1231.67138671875, 1264.735595703125, 1297.7998046875, 1330.8638916015625, 1363.9281005859375, 1396.9923095703125, 1430.0565185546875, 1463.1207275390625, 1496.1849365234375, 1529.2491455078125, 1562.3133544921875, 1595.3775634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 1.0, 7.0, 6.0, 11.0, 12.0, 13.0, 13.0, 16.0, 22.0, 20.0, 18.0, 22.0, 22.0, 25.0, 33.0, 42.0, 33.0, 39.0, 33.0, 38.0, 56.0, 40.0, 45.0, 40.0, 33.0, 31.0, 32.0, 41.0, 27.0, 32.0, 20.0, 18.0, 21.0, 25.0, 22.0, 12.0, 11.0, 14.0, 7.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-495.1510009765625, -478.4688720703125, -461.7867431640625, -445.1046142578125, -428.4224853515625, -411.7403564453125, -395.0581970214844, -378.3760681152344, -361.6939392089844, -345.0118103027344, -328.3296813964844, -311.6475524902344, -294.96539306640625, -278.28326416015625, -261.60113525390625, -244.91900634765625, -228.23687744140625, -211.55474853515625, -194.87261962890625, -178.1904754638672, -161.5083465576172, -144.8262176513672, -128.14407348632812, -111.46194458007812, -94.77981567382812, -78.09768676757812, -61.415550231933594, -44.73341751098633, -28.051284790039062, -11.369155883789062, 5.312980651855469, 21.9951171875, 38.67718505859375, 55.359317779541016, 72.04145050048828, 88.72358703613281, 105.40571594238281, 122.08784484863281, 138.76998901367188, 155.45211791992188, 172.13424682617188, 188.81637573242188, 205.49850463867188, 222.18064880371094, 238.86277770996094, 255.54490661621094, 272.22705078125, 288.9091796875, 305.59130859375, 322.2734375, 338.95556640625, 355.6376953125, 372.31982421875, 389.001953125, 405.6841125488281, 422.3662414550781, 439.0483703613281, 455.7304992675781, 472.4126281738281, 489.0947570800781, 505.77691650390625, 522.4590454101562, 539.1411743164062, 555.8233032226562, 572.5054321289062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 10.0, 16.0, 13.0, 32.0, 30.0, 74.0, 95.0, 128.0, 173.0, 250.0, 429.0, 611.0, 999.0, 1661.0, 3899.0, 27188.0, 4144708.0, 7958.0, 2359.0, 1242.0, 792.0, 535.0, 332.0, 260.0, 145.0, 95.0, 81.0, 55.0, 32.0, 23.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-259.5, -252.71484375, -245.9296875, -239.14453125, -232.359375, -225.57421875, -218.7890625, -212.00390625, -205.21875, -198.43359375, -191.6484375, -184.86328125, -178.078125, -171.29296875, -164.5078125, -157.72265625, -150.9375, -144.15234375, -137.3671875, -130.58203125, -123.796875, -117.01171875, -110.2265625, -103.44140625, -96.65625, -89.87109375, -83.0859375, -76.30078125, -69.515625, -62.73046875, -55.9453125, -49.16015625, -42.375, -35.58984375, -28.8046875, -22.01953125, -15.234375, -8.44921875, -1.6640625, 5.12109375, 11.90625, 18.69140625, 25.4765625, 32.26171875, 39.046875, 45.83203125, 52.6171875, 59.40234375, 66.1875, 72.97265625, 79.7578125, 86.54296875, 93.328125, 100.11328125, 106.8984375, 113.68359375, 120.46875, 127.25390625, 134.0390625, 140.82421875, 147.609375, 154.39453125, 161.1796875, 167.96484375, 174.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 15.0, 20.0, 25.0, 15.0, 26.0, 33.0, 39.0, 47.0, 44.0, 42.0, 54.0, 55.0, 56.0, 53.0, 57.0, 44.0, 43.0, 55.0, 42.0, 41.0, 31.0, 28.0, 28.0, 14.0, 16.0, 14.0, 13.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.772216796875, -19.99755859375, -19.222900390625, -18.4482421875, -17.673583984375, -16.89892578125, -16.124267578125, -15.349609375, -14.574951171875, -13.80029296875, -13.025634765625, -12.2509765625, -11.476318359375, -10.70166015625, -9.927001953125, -9.15234375, -8.377685546875, -7.60302734375, -6.828369140625, -6.0537109375, -5.279052734375, -4.50439453125, -3.729736328125, -2.955078125, -2.180419921875, -1.40576171875, -0.631103515625, 0.1435546875, 0.918212890625, 1.69287109375, 2.467529296875, 3.2421875, 4.016845703125, 4.79150390625, 5.566162109375, 6.3408203125, 7.115478515625, 7.89013671875, 8.664794921875, 9.439453125, 10.214111328125, 10.98876953125, 11.763427734375, 12.5380859375, 13.312744140625, 14.08740234375, 14.862060546875, 15.63671875, 16.411376953125, 17.18603515625, 17.960693359375, 18.7353515625, 19.510009765625, 20.28466796875, 21.059326171875, 21.833984375, 22.608642578125, 23.38330078125, 24.157958984375, 24.9326171875, 25.707275390625, 26.48193359375, 27.256591796875, 28.03125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 8.0, 9.0, 9.0, 15.0, 18.0, 22.0, 36.0, 45.0, 41.0, 85.0, 102.0, 172.0, 281.0, 551.0, 1349.0, 3994.0, 22458.0, 4147232.0, 12589.0, 2977.0, 1049.0, 433.0, 262.0, 151.0, 99.0, 68.0, 56.0, 49.0, 31.0, 21.0, 21.0, 10.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.0, -300.01171875, -291.0234375, -282.03515625, -273.046875, -264.05859375, -255.0703125, -246.08203125, -237.09375, -228.10546875, -219.1171875, -210.12890625, -201.140625, -192.15234375, -183.1640625, -174.17578125, -165.1875, -156.19921875, -147.2109375, -138.22265625, -129.234375, -120.24609375, -111.2578125, -102.26953125, -93.28125, -84.29296875, -75.3046875, -66.31640625, -57.328125, -48.33984375, -39.3515625, -30.36328125, -21.375, -12.38671875, -3.3984375, 5.58984375, 14.578125, 23.56640625, 32.5546875, 41.54296875, 50.53125, 59.51953125, 68.5078125, 77.49609375, 86.484375, 95.47265625, 104.4609375, 113.44921875, 122.4375, 131.42578125, 140.4140625, 149.40234375, 158.390625, 167.37890625, 176.3671875, 185.35546875, 194.34375, 203.33203125, 212.3203125, 221.30859375, 230.296875, 239.28515625, 248.2734375, 257.26171875, 266.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 45.0, 3845.0, 123.0, 15.0, 12.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -73.22314453125, -71.3837890625, -69.54443359375, -67.705078125, -65.86572265625, -64.0263671875, -62.18701171875, -60.34765625, -58.50830078125, -56.6689453125, -54.82958984375, -52.990234375, -51.15087890625, -49.3115234375, -47.47216796875, -45.6328125, -43.79345703125, -41.9541015625, -40.11474609375, -38.275390625, -36.43603515625, -34.5966796875, -32.75732421875, -30.91796875, -29.07861328125, -27.2392578125, -25.39990234375, -23.560546875, -21.72119140625, -19.8818359375, -18.04248046875, -16.203125, -14.36376953125, -12.5244140625, -10.68505859375, -8.845703125, -7.00634765625, -5.1669921875, -3.32763671875, -1.48828125, 0.35107421875, 2.1904296875, 4.02978515625, 5.869140625, 7.70849609375, 9.5478515625, 11.38720703125, 13.2265625, 15.06591796875, 16.9052734375, 18.74462890625, 20.583984375, 22.42333984375, 24.2626953125, 26.10205078125, 27.94140625, 29.78076171875, 31.6201171875, 33.45947265625, 35.298828125, 37.13818359375, 38.9775390625, 40.81689453125, 42.65625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 5.0, 6.0, 13.0, 14.0, 22.0, 23.0, 17.0, 42.0, 44.0, 59.0, 69.0, 78.0, 95.0, 96.0, 77.0, 72.0, 73.0, 48.0, 43.0, 22.0, 19.0, 10.0, 15.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-117.26155090332031, -114.4413070678711, -111.62106323242188, -108.80081939697266, -105.98057556152344, -103.16033172607422, -100.340087890625, -97.51983642578125, -94.69960021972656, -91.87935638427734, -89.05911254882812, -86.2388687133789, -83.41862487792969, -80.59838104248047, -77.77813720703125, -74.9578857421875, -72.13764190673828, -69.31739807128906, -66.49715423583984, -63.676910400390625, -60.856666564941406, -58.03642272949219, -55.2161750793457, -52.395931243896484, -49.575687408447266, -46.75544357299805, -43.93519973754883, -41.114952087402344, -38.294708251953125, -35.474464416503906, -32.65422058105469, -29.83397674560547, -27.013736724853516, -24.193492889404297, -21.373249053955078, -18.553003311157227, -15.732759475708008, -12.912515640258789, -10.092269897460938, -7.272026062011719, -4.4517822265625, -1.631537914276123, 1.188706398010254, 4.008951187133789, 6.829195022583008, 9.649438858032227, 12.469684600830078, 15.289928436279297, 18.110172271728516, 20.930416107177734, 23.750659942626953, 26.570905685424805, 29.391149520874023, 32.211395263671875, 35.031639099121094, 37.85188293457031, 40.67212677001953, 43.49237060546875, 46.31261444091797, 49.13285827636719, 51.953102111816406, 54.773345947265625, 57.59359359741211, 60.41383743286133, 63.23408126831055]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 22.0, 14.0, 23.0, 31.0, 29.0, 37.0, 32.0, 39.0, 31.0, 44.0, 47.0, 56.0, 49.0, 53.0, 50.0, 45.0, 46.0, 38.0, 35.0, 46.0, 31.0, 30.0, 22.0, 8.0, 14.0, 16.0, 21.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-85.15863037109375, -82.89708709716797, -80.63554382324219, -78.3740005493164, -76.11245727539062, -73.85091400146484, -71.58937072753906, -69.32783508300781, -67.0662841796875, -64.80474090576172, -62.54319763183594, -60.281654357910156, -58.020111083984375, -55.758567810058594, -53.49702835083008, -51.2354850769043, -48.97394561767578, -46.71240234375, -44.45085906982422, -42.18931579589844, -39.927772521972656, -37.666229248046875, -35.40468978881836, -33.14314651489258, -30.881603240966797, -28.620059967041016, -26.358516693115234, -24.096975326538086, -21.835432052612305, -19.573888778686523, -17.312347412109375, -15.050804138183594, -12.789268493652344, -10.527725219726562, -8.266182899475098, -6.004640102386475, -3.7430973052978516, -1.4815540313720703, 0.7799882888793945, 3.0415306091308594, 5.303073883056641, 7.564616680145264, 9.826159477233887, 12.087701797485352, 14.349245071411133, 16.610788345336914, 18.872329711914062, 21.133872985839844, 23.395416259765625, 25.656959533691406, 27.918502807617188, 30.180044174194336, 32.44158935546875, 34.70313262939453, 36.96467208862305, 39.22621536254883, 41.48775863647461, 43.74930191040039, 46.01084518432617, 48.27238845825195, 50.53392791748047, 52.79547119140625, 55.05701446533203, 57.31855773925781, 59.580101013183594]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 11.0, 13.0, 11.0, 15.0, 42.0, 47.0, 72.0, 87.0, 138.0, 188.0, 281.0, 457.0, 721.0, 1123.0, 1815.0, 2907.0, 5179.0, 9397.0, 18051.0, 37886.0, 87937.0, 229442.0, 362427.0, 163511.0, 65109.0, 29188.0, 14100.0, 7503.0, 4252.0, 2509.0, 1451.0, 906.0, 597.0, 391.0, 263.0, 175.0, 112.0, 74.0, 48.0, 27.0, 22.0, 23.0, 13.0, 10.0, 14.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.34375, -53.7314453125, -52.119140625, -50.5068359375, -48.89453125, -47.2822265625, -45.669921875, -44.0576171875, -42.4453125, -40.8330078125, -39.220703125, -37.6083984375, -35.99609375, -34.3837890625, -32.771484375, -31.1591796875, -29.546875, -27.9345703125, -26.322265625, -24.7099609375, -23.09765625, -21.4853515625, -19.873046875, -18.2607421875, -16.6484375, -15.0361328125, -13.423828125, -11.8115234375, -10.19921875, -8.5869140625, -6.974609375, -5.3623046875, -3.75, -2.1376953125, -0.525390625, 1.0869140625, 2.69921875, 4.3115234375, 5.923828125, 7.5361328125, 9.1484375, 10.7607421875, 12.373046875, 13.9853515625, 15.59765625, 17.2099609375, 18.822265625, 20.4345703125, 22.046875, 23.6591796875, 25.271484375, 26.8837890625, 28.49609375, 30.1083984375, 31.720703125, 33.3330078125, 34.9453125, 36.5576171875, 38.169921875, 39.7822265625, 41.39453125, 43.0068359375, 44.619140625, 46.2314453125, 47.84375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 1.0, 8.0, 6.0, 12.0, 14.0, 9.0, 10.0, 17.0, 19.0, 26.0, 29.0, 45.0, 42.0, 52.0, 38.0, 44.0, 45.0, 57.0, 54.0, 64.0, 46.0, 39.0, 31.0, 52.0, 36.0, 32.0, 39.0, 35.0, 21.0, 14.0, 13.0, 12.0, 13.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.25, -25.45751953125, -24.6650390625, -23.87255859375, -23.080078125, -22.28759765625, -21.4951171875, -20.70263671875, -19.91015625, -19.11767578125, -18.3251953125, -17.53271484375, -16.740234375, -15.94775390625, -15.1552734375, -14.36279296875, -13.5703125, -12.77783203125, -11.9853515625, -11.19287109375, -10.400390625, -9.60791015625, -8.8154296875, -8.02294921875, -7.23046875, -6.43798828125, -5.6455078125, -4.85302734375, -4.060546875, -3.26806640625, -2.4755859375, -1.68310546875, -0.890625, -0.09814453125, 0.6943359375, 1.48681640625, 2.279296875, 3.07177734375, 3.8642578125, 4.65673828125, 5.44921875, 6.24169921875, 7.0341796875, 7.82666015625, 8.619140625, 9.41162109375, 10.2041015625, 10.99658203125, 11.7890625, 12.58154296875, 13.3740234375, 14.16650390625, 14.958984375, 15.75146484375, 16.5439453125, 17.33642578125, 18.12890625, 18.92138671875, 19.7138671875, 20.50634765625, 21.298828125, 22.09130859375, 22.8837890625, 23.67626953125, 24.46875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 16.0, 14.0, 24.0, 44.0, 43.0, 75.0, 107.0, 172.0, 338.0, 609.0, 1128.0, 2532.0, 6139.0, 17477.0, 65167.0, 406382.0, 447755.0, 70184.0, 18651.0, 6380.0, 2559.0, 1233.0, 581.0, 316.0, 204.0, 119.0, 92.0, 42.0, 31.0, 28.0, 21.0, 15.0, 8.0, 3.0, 10.0, 4.0, 4.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.75, -95.84765625, -92.9453125, -90.04296875, -87.140625, -84.23828125, -81.3359375, -78.43359375, -75.53125, -72.62890625, -69.7265625, -66.82421875, -63.921875, -61.01953125, -58.1171875, -55.21484375, -52.3125, -49.41015625, -46.5078125, -43.60546875, -40.703125, -37.80078125, -34.8984375, -31.99609375, -29.09375, -26.19140625, -23.2890625, -20.38671875, -17.484375, -14.58203125, -11.6796875, -8.77734375, -5.875, -2.97265625, -0.0703125, 2.83203125, 5.734375, 8.63671875, 11.5390625, 14.44140625, 17.34375, 20.24609375, 23.1484375, 26.05078125, 28.953125, 31.85546875, 34.7578125, 37.66015625, 40.5625, 43.46484375, 46.3671875, 49.26953125, 52.171875, 55.07421875, 57.9765625, 60.87890625, 63.78125, 66.68359375, 69.5859375, 72.48828125, 75.390625, 78.29296875, 81.1953125, 84.09765625, 87.0]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 7.0, 12.0, 8.0, 11.0, 13.0, 11.0, 19.0, 22.0, 28.0, 29.0, 19.0, 30.0, 29.0, 40.0, 33.0, 41.0, 47.0, 51.0, 47.0, 44.0, 44.0, 38.0, 41.0, 40.0, 45.0, 32.0, 32.0, 35.0, 25.0, 27.0, 15.0, 10.0, 18.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.0, -90.6435546875, -87.287109375, -83.9306640625, -80.57421875, -77.2177734375, -73.861328125, -70.5048828125, -67.1484375, -63.7919921875, -60.435546875, -57.0791015625, -53.72265625, -50.3662109375, -47.009765625, -43.6533203125, -40.296875, -36.9404296875, -33.583984375, -30.2275390625, -26.87109375, -23.5146484375, -20.158203125, -16.8017578125, -13.4453125, -10.0888671875, -6.732421875, -3.3759765625, -0.01953125, 3.3369140625, 6.693359375, 10.0498046875, 13.40625, 16.7626953125, 20.119140625, 23.4755859375, 26.83203125, 30.1884765625, 33.544921875, 36.9013671875, 40.2578125, 43.6142578125, 46.970703125, 50.3271484375, 53.68359375, 57.0400390625, 60.396484375, 63.7529296875, 67.109375, 70.4658203125, 73.822265625, 77.1787109375, 80.53515625, 83.8916015625, 87.248046875, 90.6044921875, 93.9609375, 97.3173828125, 100.673828125, 104.0302734375, 107.38671875, 110.7431640625, 114.099609375, 117.4560546875, 120.8125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 13.0, 17.0, 32.0, 33.0, 60.0, 104.0, 189.0, 337.0, 693.0, 1532.0, 4421.0, 23280.0, 697940.0, 298463.0, 15371.0, 3467.0, 1261.0, 574.0, 317.0, 164.0, 90.0, 45.0, 50.0, 24.0, 27.0, 13.0, 8.0, 8.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.125, -70.40625, -67.6875, -64.96875, -62.25, -59.53125, -56.8125, -54.09375, -51.375, -48.65625, -45.9375, -43.21875, -40.5, -37.78125, -35.0625, -32.34375, -29.625, -26.90625, -24.1875, -21.46875, -18.75, -16.03125, -13.3125, -10.59375, -7.875, -5.15625, -2.4375, 0.28125, 3.0, 5.71875, 8.4375, 11.15625, 13.875, 16.59375, 19.3125, 22.03125, 24.75, 27.46875, 30.1875, 32.90625, 35.625, 38.34375, 41.0625, 43.78125, 46.5, 49.21875, 51.9375, 54.65625, 57.375, 60.09375, 62.8125, 65.53125, 68.25, 70.96875, 73.6875, 76.40625, 79.125, 81.84375, 84.5625, 87.28125, 90.0, 92.71875, 95.4375, 98.15625, 100.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 7.0, 6.0, 16.0, 22.0, 25.0, 61.0, 104.0, 192.0, 216.0, 159.0, 71.0, 37.0, 22.0, 14.0, 10.0, 9.0, 13.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155792236328125, -0.014987468719482422, -0.014395713806152344, -0.013803958892822266, -0.013212203979492188, -0.01262044906616211, -0.012028694152832031, -0.011436939239501953, -0.010845184326171875, -0.010253429412841797, -0.009661674499511719, -0.00906991958618164, -0.008478164672851562, -0.007886409759521484, -0.007294654846191406, -0.006702899932861328, -0.00611114501953125, -0.005519390106201172, -0.004927635192871094, -0.004335880279541016, -0.0037441253662109375, -0.0031523704528808594, -0.0025606155395507812, -0.001968860626220703, -0.001377105712890625, -0.0007853507995605469, -0.00019359588623046875, 0.0003981590270996094, 0.0009899139404296875, 0.0015816688537597656, 0.0021734237670898438, 0.002765178680419922, 0.00335693359375, 0.003948688507080078, 0.004540443420410156, 0.005132198333740234, 0.0057239532470703125, 0.006315708160400391, 0.006907463073730469, 0.007499217987060547, 0.008090972900390625, 0.008682727813720703, 0.009274482727050781, 0.00986623764038086, 0.010457992553710938, 0.011049747467041016, 0.011641502380371094, 0.012233257293701172, 0.01282501220703125, 0.013416767120361328, 0.014008522033691406, 0.014600276947021484, 0.015192031860351562, 0.01578378677368164, 0.01637554168701172, 0.016967296600341797, 0.017559051513671875, 0.018150806427001953, 0.01874256134033203, 0.01933431625366211, 0.019926071166992188, 0.020517826080322266, 0.021109580993652344, 0.021701335906982422, 0.0222930908203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 17.0, 20.0, 42.0, 63.0, 92.0, 145.0, 195.0, 384.0, 813.0, 1713.0, 4588.0, 17902.0, 167810.0, 773531.0, 64947.0, 10360.0, 3176.0, 1266.0, 612.0, 300.0, 202.0, 109.0, 78.0, 48.0, 34.0, 20.0, 14.0, 13.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-72.4375, -70.38671875, -68.3359375, -66.28515625, -64.234375, -62.18359375, -60.1328125, -58.08203125, -56.03125, -53.98046875, -51.9296875, -49.87890625, -47.828125, -45.77734375, -43.7265625, -41.67578125, -39.625, -37.57421875, -35.5234375, -33.47265625, -31.421875, -29.37109375, -27.3203125, -25.26953125, -23.21875, -21.16796875, -19.1171875, -17.06640625, -15.015625, -12.96484375, -10.9140625, -8.86328125, -6.8125, -4.76171875, -2.7109375, -0.66015625, 1.390625, 3.44140625, 5.4921875, 7.54296875, 9.59375, 11.64453125, 13.6953125, 15.74609375, 17.796875, 19.84765625, 21.8984375, 23.94921875, 26.0, 28.05078125, 30.1015625, 32.15234375, 34.203125, 36.25390625, 38.3046875, 40.35546875, 42.40625, 44.45703125, 46.5078125, 48.55859375, 50.609375, 52.66015625, 54.7109375, 56.76171875, 58.8125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 13.0, 31.0, 41.0, 54.0, 88.0, 120.0, 135.0, 143.0, 111.0, 87.0, 44.0, 31.0, 27.0, 15.0, 8.0, 10.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.75, -62.94580078125, -61.1416015625, -59.33740234375, -57.533203125, -55.72900390625, -53.9248046875, -52.12060546875, -50.31640625, -48.51220703125, -46.7080078125, -44.90380859375, -43.099609375, -41.29541015625, -39.4912109375, -37.68701171875, -35.8828125, -34.07861328125, -32.2744140625, -30.47021484375, -28.666015625, -26.86181640625, -25.0576171875, -23.25341796875, -21.44921875, -19.64501953125, -17.8408203125, -16.03662109375, -14.232421875, -12.42822265625, -10.6240234375, -8.81982421875, -7.015625, -5.21142578125, -3.4072265625, -1.60302734375, 0.201171875, 2.00537109375, 3.8095703125, 5.61376953125, 7.41796875, 9.22216796875, 11.0263671875, 12.83056640625, 14.634765625, 16.43896484375, 18.2431640625, 20.04736328125, 21.8515625, 23.65576171875, 25.4599609375, 27.26416015625, 29.068359375, 30.87255859375, 32.6767578125, 34.48095703125, 36.28515625, 38.08935546875, 39.8935546875, 41.69775390625, 43.501953125, 45.30615234375, 47.1103515625, 48.91455078125, 50.71875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 15.0, 18.0, 36.0, 44.0, 43.0, 51.0, 98.0, 95.0, 101.0, 91.0, 92.0, 78.0, 63.0, 46.0, 34.0, 21.0, 13.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-396.11224365234375, -376.8864440917969, -357.66064453125, -338.4348449707031, -319.20904541015625, -299.9832763671875, -280.7574768066406, -261.53167724609375, -242.30587768554688, -223.080078125, -203.85427856445312, -184.6284942626953, -165.40269470214844, -146.17689514160156, -126.95110321044922, -107.72531127929688, -88.49951171875, -69.27371215820312, -50.04792022705078, -30.822124481201172, -11.596328735351562, 7.6294708251953125, 26.855262756347656, 46.0810546875, 65.30685424804688, 84.53265380859375, 103.7584457397461, 122.98423767089844, 142.2100372314453, 161.4358367919922, 180.66162109375, 199.88742065429688, 219.1131591796875, 238.33895874023438, 257.56475830078125, 276.7905578613281, 296.016357421875, 315.24212646484375, 334.4679260253906, 353.6937255859375, 372.9195251464844, 392.14532470703125, 411.3711242675781, 430.596923828125, 449.82269287109375, 469.04852294921875, 488.2742919921875, 507.5000915527344, 526.7258911132812, 545.95166015625, 565.177490234375, 584.4032592773438, 603.6290893554688, 622.8548583984375, 642.0806884765625, 661.3064575195312, 680.5322265625, 699.7579956054688, 718.9838256835938, 738.2095947265625, 757.4354248046875, 776.6611938476562, 795.8870239257812, 815.11279296875, 834.338623046875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 8.0, 2.0, 9.0, 8.0, 10.0, 16.0, 12.0, 13.0, 29.0, 23.0, 20.0, 30.0, 29.0, 42.0, 54.0, 62.0, 55.0, 62.0, 63.0, 51.0, 41.0, 45.0, 37.0, 39.0, 32.0, 29.0, 33.0, 32.0, 18.0, 20.0, 21.0, 6.0, 10.0, 10.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-692.869384765625, -673.8358764648438, -654.8023681640625, -635.7688598632812, -616.7353515625, -597.7017822265625, -578.6682739257812, -559.634765625, -540.6012573242188, -521.5677490234375, -502.53424072265625, -483.5007019042969, -464.4671936035156, -445.4336853027344, -426.400146484375, -407.36663818359375, -388.3331298828125, -369.29962158203125, -350.26611328125, -331.2325744628906, -312.1990661621094, -293.1655578613281, -274.13201904296875, -255.0985107421875, -236.06500244140625, -217.031494140625, -197.9979705810547, -178.96444702148438, -159.93093872070312, -140.89743041992188, -121.86390686035156, -102.83038330078125, -83.79693603515625, -64.76342010498047, -45.72990417480469, -26.696388244628906, -7.662872314453125, 11.370643615722656, 30.404159545898438, 49.43768310546875, 68.47119140625, 87.50470733642578, 106.53822326660156, 125.57173919677734, 144.60525512695312, 163.63876342773438, 182.6722869873047, 201.705810546875, 220.73931884765625, 239.7728271484375, 258.80633544921875, 277.8398742675781, 296.8733825683594, 315.9068908691406, 334.9404296875, 353.97393798828125, 373.0074462890625, 392.04095458984375, 411.074462890625, 430.1080017089844, 449.1415100097656, 468.1750183105469, 487.20855712890625, 506.2420654296875, 525.2755737304688]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 10.0, 5.0, 13.0, 15.0, 15.0, 35.0, 26.0, 41.0, 51.0, 76.0, 92.0, 143.0, 216.0, 303.0, 408.0, 613.0, 886.0, 1517.0, 3404.0, 4144988.0, 34143.0, 3026.0, 1384.0, 912.0, 586.0, 386.0, 272.0, 223.0, 139.0, 96.0, 64.0, 49.0, 46.0, 36.0, 21.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.875, -201.564453125, -195.25390625, -188.943359375, -182.6328125, -176.322265625, -170.01171875, -163.701171875, -157.390625, -151.080078125, -144.76953125, -138.458984375, -132.1484375, -125.837890625, -119.52734375, -113.216796875, -106.90625, -100.595703125, -94.28515625, -87.974609375, -81.6640625, -75.353515625, -69.04296875, -62.732421875, -56.421875, -50.111328125, -43.80078125, -37.490234375, -31.1796875, -24.869140625, -18.55859375, -12.248046875, -5.9375, 0.373046875, 6.68359375, 12.994140625, 19.3046875, 25.615234375, 31.92578125, 38.236328125, 44.546875, 50.857421875, 57.16796875, 63.478515625, 69.7890625, 76.099609375, 82.41015625, 88.720703125, 95.03125, 101.341796875, 107.65234375, 113.962890625, 120.2734375, 126.583984375, 132.89453125, 139.205078125, 145.515625, 151.826171875, 158.13671875, 164.447265625, 170.7578125, 177.068359375, 183.37890625, 189.689453125, 196.0]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 7.0, 3.0, 8.0, 10.0, 6.0, 7.0, 12.0, 15.0, 16.0, 15.0, 19.0, 27.0, 26.0, 37.0, 55.0, 47.0, 43.0, 52.0, 49.0, 57.0, 58.0, 48.0, 59.0, 43.0, 44.0, 39.0, 29.0, 32.0, 26.0, 21.0, 21.0, 14.0, 12.0, 12.0, 8.0, 9.0, 2.0, 8.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.140625, -24.371337890625, -23.60205078125, -22.832763671875, -22.0634765625, -21.294189453125, -20.52490234375, -19.755615234375, -18.986328125, -18.217041015625, -17.44775390625, -16.678466796875, -15.9091796875, -15.139892578125, -14.37060546875, -13.601318359375, -12.83203125, -12.062744140625, -11.29345703125, -10.524169921875, -9.7548828125, -8.985595703125, -8.21630859375, -7.447021484375, -6.677734375, -5.908447265625, -5.13916015625, -4.369873046875, -3.6005859375, -2.831298828125, -2.06201171875, -1.292724609375, -0.5234375, 0.245849609375, 1.01513671875, 1.784423828125, 2.5537109375, 3.322998046875, 4.09228515625, 4.861572265625, 5.630859375, 6.400146484375, 7.16943359375, 7.938720703125, 8.7080078125, 9.477294921875, 10.24658203125, 11.015869140625, 11.78515625, 12.554443359375, 13.32373046875, 14.093017578125, 14.8623046875, 15.631591796875, 16.40087890625, 17.170166015625, 17.939453125, 18.708740234375, 19.47802734375, 20.247314453125, 21.0166015625, 21.785888671875, 22.55517578125, 23.324462890625, 24.09375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 12.0, 22.0, 30.0, 34.0, 48.0, 69.0, 103.0, 154.0, 294.0, 551.0, 1736.0, 4138771.0, 49561.0, 1542.0, 545.0, 271.0, 161.0, 104.0, 76.0, 37.0, 33.0, 28.0, 19.0, 15.0, 7.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-543.0, -522.859375, -502.71875, -482.578125, -462.4375, -442.296875, -422.15625, -402.015625, -381.875, -361.734375, -341.59375, -321.453125, -301.3125, -281.171875, -261.03125, -240.890625, -220.75, -200.609375, -180.46875, -160.328125, -140.1875, -120.046875, -99.90625, -79.765625, -59.625, -39.484375, -19.34375, 0.796875, 20.9375, 41.078125, 61.21875, 81.359375, 101.5, 121.640625, 141.78125, 161.921875, 182.0625, 202.203125, 222.34375, 242.484375, 262.625, 282.765625, 302.90625, 323.046875, 343.1875, 363.328125, 383.46875, 403.609375, 423.75, 443.890625, 464.03125, 484.171875, 504.3125, 524.453125, 544.59375, 564.734375, 584.875, 605.015625, 625.15625, 645.296875, 665.4375, 685.578125, 705.71875, 725.859375, 746.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 9.0, 3915.0, 140.0, 11.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.125, -143.701171875, -140.27734375, -136.853515625, -133.4296875, -130.005859375, -126.58203125, -123.158203125, -119.734375, -116.310546875, -112.88671875, -109.462890625, -106.0390625, -102.615234375, -99.19140625, -95.767578125, -92.34375, -88.919921875, -85.49609375, -82.072265625, -78.6484375, -75.224609375, -71.80078125, -68.376953125, -64.953125, -61.529296875, -58.10546875, -54.681640625, -51.2578125, -47.833984375, -44.41015625, -40.986328125, -37.5625, -34.138671875, -30.71484375, -27.291015625, -23.8671875, -20.443359375, -17.01953125, -13.595703125, -10.171875, -6.748046875, -3.32421875, 0.099609375, 3.5234375, 6.947265625, 10.37109375, 13.794921875, 17.21875, 20.642578125, 24.06640625, 27.490234375, 30.9140625, 34.337890625, 37.76171875, 41.185546875, 44.609375, 48.033203125, 51.45703125, 54.880859375, 58.3046875, 61.728515625, 65.15234375, 68.576171875, 72.0]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 6.0, 17.0, 19.0, 32.0, 48.0, 43.0, 86.0, 114.0, 133.0, 130.0, 99.0, 66.0, 48.0, 42.0, 22.0, 22.0, 10.0, 11.0, 8.0, 6.0, 10.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.56886291503906, -217.20550537109375, -211.84214782714844, -206.47879028320312, -201.1154327392578, -195.7520751953125, -190.38870239257812, -185.0253448486328, -179.6619873046875, -174.2986297607422, -168.93527221679688, -163.57191467285156, -158.20855712890625, -152.84518432617188, -147.48184204101562, -142.11846923828125, -136.755126953125, -131.3917694091797, -126.02841186523438, -120.66505432128906, -115.30168914794922, -109.9383316040039, -104.5749740600586, -99.21160888671875, -93.84825134277344, -88.48489379882812, -83.12153625488281, -77.7581787109375, -72.39481353759766, -67.03145599365234, -61.66809844970703, -56.30473709106445, -50.941368103027344, -45.57801055908203, -40.21464920043945, -34.85129165649414, -29.487932205200195, -24.12457275390625, -18.761215209960938, -13.39785385131836, -8.034496307373047, -2.6711373329162598, 2.6922216415405273, 8.055580139160156, 13.418939590454102, 18.782299041748047, 24.14565658569336, 29.509017944335938, 34.87237548828125, 40.23573303222656, 45.59909439086914, 50.96245193481445, 56.32581329345703, 61.689170837402344, 67.05252838134766, 72.4158935546875, 77.77925109863281, 83.14260864257812, 88.50596618652344, 93.86932373046875, 99.2326889038086, 104.5960464477539, 109.95940399169922, 115.32276916503906, 120.68611907958984]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 8.0, 9.0, 13.0, 16.0, 18.0, 23.0, 26.0, 19.0, 41.0, 37.0, 38.0, 31.0, 42.0, 24.0, 45.0, 46.0, 45.0, 31.0, 43.0, 42.0, 41.0, 35.0, 42.0, 42.0, 35.0, 35.0, 21.0, 15.0, 25.0, 19.0, 14.0, 13.0, 6.0, 16.0, 9.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.53889465332031, -94.59437561035156, -91.64986419677734, -88.70535278320312, -85.76083374023438, -82.81631469726562, -79.8718032836914, -76.92729187011719, -73.98277282714844, -71.03825378417969, -68.09374237060547, -65.14923095703125, -62.2047119140625, -59.260196685791016, -56.31568145751953, -53.37116622924805, -50.42665100097656, -47.48213577270508, -44.537620544433594, -41.59310531616211, -38.648590087890625, -35.70407485961914, -32.759559631347656, -29.815044403076172, -26.870529174804688, -23.926013946533203, -20.98149871826172, -18.036983489990234, -15.09246826171875, -12.147953033447266, -9.203437805175781, -6.258922576904297, -3.3144149780273438, -0.3698997497558594, 2.574615478515625, 5.519130706787109, 8.463645935058594, 11.408161163330078, 14.352676391601562, 17.297191619873047, 20.24170684814453, 23.186222076416016, 26.1307373046875, 29.075252532958984, 32.01976776123047, 34.96428298950195, 37.90879821777344, 40.85331344604492, 43.797828674316406, 46.74234390258789, 49.686859130859375, 52.63137435913086, 55.575889587402344, 58.52040481567383, 61.46492004394531, 64.40943908691406, 67.35395050048828, 70.2984619140625, 73.24298095703125, 76.1875, 79.13201141357422, 82.07652282714844, 85.02104187011719, 87.96556091308594, 90.91007232666016]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 8.0, 13.0, 12.0, 29.0, 36.0, 40.0, 83.0, 120.0, 168.0, 260.0, 455.0, 656.0, 1120.0, 1944.0, 3521.0, 7036.0, 14993.0, 36168.0, 104460.0, 436203.0, 308132.0, 78669.0, 28624.0, 12394.0, 5929.0, 3082.0, 1730.0, 1012.0, 581.0, 370.0, 228.0, 148.0, 119.0, 75.0, 41.0, 25.0, 16.0, 12.0, 13.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6875, -67.2744140625, -64.861328125, -62.4482421875, -60.03515625, -57.6220703125, -55.208984375, -52.7958984375, -50.3828125, -47.9697265625, -45.556640625, -43.1435546875, -40.73046875, -38.3173828125, -35.904296875, -33.4912109375, -31.078125, -28.6650390625, -26.251953125, -23.8388671875, -21.42578125, -19.0126953125, -16.599609375, -14.1865234375, -11.7734375, -9.3603515625, -6.947265625, -4.5341796875, -2.12109375, 0.2919921875, 2.705078125, 5.1181640625, 7.53125, 9.9443359375, 12.357421875, 14.7705078125, 17.18359375, 19.5966796875, 22.009765625, 24.4228515625, 26.8359375, 29.2490234375, 31.662109375, 34.0751953125, 36.48828125, 38.9013671875, 41.314453125, 43.7275390625, 46.140625, 48.5537109375, 50.966796875, 53.3798828125, 55.79296875, 58.2060546875, 60.619140625, 63.0322265625, 65.4453125, 67.8583984375, 70.271484375, 72.6845703125, 75.09765625, 77.5107421875, 79.923828125, 82.3369140625, 84.75]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 5.0, 15.0, 13.0, 22.0, 18.0, 28.0, 22.0, 26.0, 32.0, 47.0, 47.0, 39.0, 46.0, 59.0, 49.0, 60.0, 67.0, 54.0, 39.0, 52.0, 24.0, 32.0, 38.0, 21.0, 26.0, 10.0, 21.0, 16.0, 15.0, 5.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68994140625, -28.6923828125, -27.69482421875, -26.697265625, -25.69970703125, -24.7021484375, -23.70458984375, -22.70703125, -21.70947265625, -20.7119140625, -19.71435546875, -18.716796875, -17.71923828125, -16.7216796875, -15.72412109375, -14.7265625, -13.72900390625, -12.7314453125, -11.73388671875, -10.736328125, -9.73876953125, -8.7412109375, -7.74365234375, -6.74609375, -5.74853515625, -4.7509765625, -3.75341796875, -2.755859375, -1.75830078125, -0.7607421875, 0.23681640625, 1.234375, 2.23193359375, 3.2294921875, 4.22705078125, 5.224609375, 6.22216796875, 7.2197265625, 8.21728515625, 9.21484375, 10.21240234375, 11.2099609375, 12.20751953125, 13.205078125, 14.20263671875, 15.2001953125, 16.19775390625, 17.1953125, 18.19287109375, 19.1904296875, 20.18798828125, 21.185546875, 22.18310546875, 23.1806640625, 24.17822265625, 25.17578125, 26.17333984375, 27.1708984375, 28.16845703125, 29.166015625, 30.16357421875, 31.1611328125, 32.15869140625, 33.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 8.0, 13.0, 12.0, 17.0, 25.0, 29.0, 37.0, 62.0, 89.0, 155.0, 264.0, 549.0, 926.0, 1937.0, 4807.0, 15551.0, 73487.0, 655937.0, 245219.0, 34374.0, 8898.0, 3110.0, 1382.0, 672.0, 351.0, 225.0, 134.0, 89.0, 60.0, 35.0, 24.0, 21.0, 19.0, 11.0, 3.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.875, -112.4443359375, -109.013671875, -105.5830078125, -102.15234375, -98.7216796875, -95.291015625, -91.8603515625, -88.4296875, -84.9990234375, -81.568359375, -78.1376953125, -74.70703125, -71.2763671875, -67.845703125, -64.4150390625, -60.984375, -57.5537109375, -54.123046875, -50.6923828125, -47.26171875, -43.8310546875, -40.400390625, -36.9697265625, -33.5390625, -30.1083984375, -26.677734375, -23.2470703125, -19.81640625, -16.3857421875, -12.955078125, -9.5244140625, -6.09375, -2.6630859375, 0.767578125, 4.1982421875, 7.62890625, 11.0595703125, 14.490234375, 17.9208984375, 21.3515625, 24.7822265625, 28.212890625, 31.6435546875, 35.07421875, 38.5048828125, 41.935546875, 45.3662109375, 48.796875, 52.2275390625, 55.658203125, 59.0888671875, 62.51953125, 65.9501953125, 69.380859375, 72.8115234375, 76.2421875, 79.6728515625, 83.103515625, 86.5341796875, 89.96484375, 93.3955078125, 96.826171875, 100.2568359375, 103.6875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 7.0, 1.0, 12.0, 15.0, 16.0, 12.0, 20.0, 28.0, 29.0, 35.0, 28.0, 32.0, 37.0, 36.0, 36.0, 45.0, 42.0, 46.0, 43.0, 39.0, 46.0, 41.0, 42.0, 35.0, 32.0, 45.0, 27.0, 25.0, 16.0, 20.0, 18.0, 12.0, 14.0, 14.0, 10.0, 6.0, 6.0, 1.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.5625, -110.857421875, -107.15234375, -103.447265625, -99.7421875, -96.037109375, -92.33203125, -88.626953125, -84.921875, -81.216796875, -77.51171875, -73.806640625, -70.1015625, -66.396484375, -62.69140625, -58.986328125, -55.28125, -51.576171875, -47.87109375, -44.166015625, -40.4609375, -36.755859375, -33.05078125, -29.345703125, -25.640625, -21.935546875, -18.23046875, -14.525390625, -10.8203125, -7.115234375, -3.41015625, 0.294921875, 4.0, 7.705078125, 11.41015625, 15.115234375, 18.8203125, 22.525390625, 26.23046875, 29.935546875, 33.640625, 37.345703125, 41.05078125, 44.755859375, 48.4609375, 52.166015625, 55.87109375, 59.576171875, 63.28125, 66.986328125, 70.69140625, 74.396484375, 78.1015625, 81.806640625, 85.51171875, 89.216796875, 92.921875, 96.626953125, 100.33203125, 104.037109375, 107.7421875, 111.447265625, 115.15234375, 118.857421875, 122.5625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 12.0, 13.0, 26.0, 17.0, 29.0, 59.0, 93.0, 225.0, 418.0, 1028.0, 2686.0, 9029.0, 46864.0, 627948.0, 318052.0, 31470.0, 6813.0, 2169.0, 768.0, 346.0, 183.0, 96.0, 62.0, 39.0, 27.0, 21.0, 12.0, 11.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.96875, -61.1640625, -59.359375, -57.5546875, -55.75, -53.9453125, -52.140625, -50.3359375, -48.53125, -46.7265625, -44.921875, -43.1171875, -41.3125, -39.5078125, -37.703125, -35.8984375, -34.09375, -32.2890625, -30.484375, -28.6796875, -26.875, -25.0703125, -23.265625, -21.4609375, -19.65625, -17.8515625, -16.046875, -14.2421875, -12.4375, -10.6328125, -8.828125, -7.0234375, -5.21875, -3.4140625, -1.609375, 0.1953125, 2.0, 3.8046875, 5.609375, 7.4140625, 9.21875, 11.0234375, 12.828125, 14.6328125, 16.4375, 18.2421875, 20.046875, 21.8515625, 23.65625, 25.4609375, 27.265625, 29.0703125, 30.875, 32.6796875, 34.484375, 36.2890625, 38.09375, 39.8984375, 41.703125, 43.5078125, 45.3125, 47.1171875, 48.921875, 50.7265625, 52.53125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 21.0, 21.0, 52.0, 102.0, 161.0, 224.0, 168.0, 101.0, 43.0, 28.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008453369140625, -0.007940053939819336, -0.007426738739013672, -0.006913423538208008, -0.006400108337402344, -0.00588679313659668, -0.005373477935791016, -0.0048601627349853516, -0.0043468475341796875, -0.0038335323333740234, -0.0033202171325683594, -0.0028069019317626953, -0.0022935867309570312, -0.0017802715301513672, -0.0012669563293457031, -0.0007536411285400391, -0.000240325927734375, 0.00027298927307128906, 0.0007863044738769531, 0.0012996196746826172, 0.0018129348754882812, 0.0023262500762939453, 0.0028395652770996094, 0.0033528804779052734, 0.0038661956787109375, 0.0043795108795166016, 0.004892826080322266, 0.00540614128112793, 0.005919456481933594, 0.006432771682739258, 0.006946086883544922, 0.007459402084350586, 0.00797271728515625, 0.008486032485961914, 0.008999347686767578, 0.009512662887573242, 0.010025978088378906, 0.01053929328918457, 0.011052608489990234, 0.011565923690795898, 0.012079238891601562, 0.012592554092407227, 0.01310586929321289, 0.013619184494018555, 0.014132499694824219, 0.014645814895629883, 0.015159130096435547, 0.01567244529724121, 0.016185760498046875, 0.01669907569885254, 0.017212390899658203, 0.017725706100463867, 0.01823902130126953, 0.018752336502075195, 0.01926565170288086, 0.019778966903686523, 0.020292282104492188, 0.02080559730529785, 0.021318912506103516, 0.02183222770690918, 0.022345542907714844, 0.022858858108520508, 0.023372173309326172, 0.023885488510131836, 0.0243988037109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 7.0, 11.0, 7.0, 16.0, 23.0, 30.0, 41.0, 57.0, 85.0, 171.0, 277.0, 595.0, 1451.0, 4780.0, 22783.0, 224477.0, 723785.0, 56615.0, 9112.0, 2385.0, 853.0, 413.0, 210.0, 116.0, 65.0, 56.0, 31.0, 34.0, 20.0, 14.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.5625, -72.318359375, -70.07421875, -67.830078125, -65.5859375, -63.341796875, -61.09765625, -58.853515625, -56.609375, -54.365234375, -52.12109375, -49.876953125, -47.6328125, -45.388671875, -43.14453125, -40.900390625, -38.65625, -36.412109375, -34.16796875, -31.923828125, -29.6796875, -27.435546875, -25.19140625, -22.947265625, -20.703125, -18.458984375, -16.21484375, -13.970703125, -11.7265625, -9.482421875, -7.23828125, -4.994140625, -2.75, -0.505859375, 1.73828125, 3.982421875, 6.2265625, 8.470703125, 10.71484375, 12.958984375, 15.203125, 17.447265625, 19.69140625, 21.935546875, 24.1796875, 26.423828125, 28.66796875, 30.912109375, 33.15625, 35.400390625, 37.64453125, 39.888671875, 42.1328125, 44.376953125, 46.62109375, 48.865234375, 51.109375, 53.353515625, 55.59765625, 57.841796875, 60.0859375, 62.330078125, 64.57421875, 66.818359375, 69.0625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 8.0, 12.0, 28.0, 31.0, 49.0, 58.0, 76.0, 124.0, 175.0, 138.0, 82.0, 69.0, 36.0, 34.0, 21.0, 17.0, 12.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84375, -50.58740234375, -48.3310546875, -46.07470703125, -43.818359375, -41.56201171875, -39.3056640625, -37.04931640625, -34.79296875, -32.53662109375, -30.2802734375, -28.02392578125, -25.767578125, -23.51123046875, -21.2548828125, -18.99853515625, -16.7421875, -14.48583984375, -12.2294921875, -9.97314453125, -7.716796875, -5.46044921875, -3.2041015625, -0.94775390625, 1.30859375, 3.56494140625, 5.8212890625, 8.07763671875, 10.333984375, 12.59033203125, 14.8466796875, 17.10302734375, 19.359375, 21.61572265625, 23.8720703125, 26.12841796875, 28.384765625, 30.64111328125, 32.8974609375, 35.15380859375, 37.41015625, 39.66650390625, 41.9228515625, 44.17919921875, 46.435546875, 48.69189453125, 50.9482421875, 53.20458984375, 55.4609375, 57.71728515625, 59.9736328125, 62.22998046875, 64.486328125, 66.74267578125, 68.9990234375, 71.25537109375, 73.51171875, 75.76806640625, 78.0244140625, 80.28076171875, 82.537109375, 84.79345703125, 87.0498046875, 89.30615234375, 91.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 17.0, 18.0, 64.0, 118.0, 210.0, 243.0, 153.0, 82.0, 43.0, 20.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-997.660888671875, -950.6033935546875, -903.5459594726562, -856.488525390625, -809.4310302734375, -762.37353515625, -715.3161010742188, -668.2586669921875, -621.201171875, -574.1436767578125, -527.0862426757812, -480.0287780761719, -432.9713134765625, -385.9138488769531, -338.85638427734375, -291.7989196777344, -244.741455078125, -197.68399047851562, -150.62652587890625, -103.56906127929688, -56.5115966796875, -9.454132080078125, 37.60333251953125, 84.66079711914062, 131.71826171875, 178.77572631835938, 225.83319091796875, 272.8906555175781, 319.9481201171875, 367.0055847167969, 414.06304931640625, 461.1205139160156, 508.177978515625, 555.2354736328125, 602.2929077148438, 649.350341796875, 696.4078369140625, 743.46533203125, 790.5227661132812, 837.5802001953125, 884.6376953125, 931.6951904296875, 978.7526245117188, 1025.81005859375, 1072.8675537109375, 1119.925048828125, 1166.982421875, 1214.0399169921875, 1261.097412109375, 1308.1549072265625, 1355.21240234375, 1402.269775390625, 1449.3272705078125, 1496.384765625, 1543.442138671875, 1590.4996337890625, 1637.55712890625, 1684.6146240234375, 1731.672119140625, 1778.7294921875, 1825.7869873046875, 1872.844482421875, 1919.90185546875, 1966.9593505859375, 2014.016845703125]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 5.0, 11.0, 17.0, 16.0, 16.0, 22.0, 29.0, 46.0, 38.0, 35.0, 51.0, 54.0, 55.0, 74.0, 53.0, 57.0, 51.0, 51.0, 51.0, 35.0, 41.0, 30.0, 28.0, 19.0, 14.0, 17.0, 14.0, 15.0, 12.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-650.7698364257812, -627.1006469726562, -603.4314575195312, -579.76220703125, -556.093017578125, -532.423828125, -508.754638671875, -485.08544921875, -461.416259765625, -437.7470703125, -414.0778503417969, -390.4086608886719, -366.7394714355469, -343.07025146484375, -319.40106201171875, -295.73187255859375, -272.0626525878906, -248.39344787597656, -224.72425842285156, -201.0550537109375, -177.3858642578125, -153.71665954589844, -130.04745483398438, -106.37826538085938, -82.70906066894531, -59.03986358642578, -35.370662689208984, -11.701461791992188, 11.967735290527344, 35.636932373046875, 59.30613708496094, 82.97532653808594, 106.64453125, 130.31373596191406, 153.98292541503906, 177.65213012695312, 201.32131958007812, 224.9905242919922, 248.65972900390625, 272.32891845703125, 295.99810791015625, 319.66729736328125, 343.3365173339844, 367.0057067871094, 390.6748962402344, 414.3441162109375, 438.0133056640625, 461.6824951171875, 485.3517150878906, 509.0209045410156, 532.6901245117188, 556.3593139648438, 580.0285034179688, 603.6976928710938, 627.366943359375, 651.0361328125, 674.705322265625, 698.37451171875, 722.043701171875, 745.712890625, 769.3821411132812, 793.0513305664062, 816.7205200195312, 840.3897094726562, 864.0588989257812]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 7.0, 1.0, 9.0, 9.0, 18.0, 14.0, 21.0, 30.0, 48.0, 62.0, 99.0, 123.0, 166.0, 310.0, 427.0, 631.0, 984.0, 1486.0, 2689.0, 5530.0, 23555.0, 4129707.0, 17038.0, 4707.0, 2421.0, 1419.0, 900.0, 601.0, 392.0, 276.0, 176.0, 131.0, 93.0, 50.0, 47.0, 37.0, 22.0, 18.0, 12.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -151.71875, -146.5625, -141.40625, -136.25, -131.09375, -125.9375, -120.78125, -115.625, -110.46875, -105.3125, -100.15625, -95.0, -89.84375, -84.6875, -79.53125, -74.375, -69.21875, -64.0625, -58.90625, -53.75, -48.59375, -43.4375, -38.28125, -33.125, -27.96875, -22.8125, -17.65625, -12.5, -7.34375, -2.1875, 2.96875, 8.125, 13.28125, 18.4375, 23.59375, 28.75, 33.90625, 39.0625, 44.21875, 49.375, 54.53125, 59.6875, 64.84375, 70.0, 75.15625, 80.3125, 85.46875, 90.625, 95.78125, 100.9375, 106.09375, 111.25, 116.40625, 121.5625, 126.71875, 131.875, 137.03125, 142.1875, 147.34375, 152.5, 157.65625, 162.8125, 167.96875, 173.125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 14.0, 28.0, 28.0, 23.0, 38.0, 56.0, 65.0, 60.0, 73.0, 69.0, 82.0, 84.0, 63.0, 65.0, 59.0, 33.0, 38.0, 21.0, 13.0, 12.0, 16.0, 14.0, 8.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.84375, -49.47705078125, -48.1103515625, -46.74365234375, -45.376953125, -44.01025390625, -42.6435546875, -41.27685546875, -39.91015625, -38.54345703125, -37.1767578125, -35.81005859375, -34.443359375, -33.07666015625, -31.7099609375, -30.34326171875, -28.9765625, -27.60986328125, -26.2431640625, -24.87646484375, -23.509765625, -22.14306640625, -20.7763671875, -19.40966796875, -18.04296875, -16.67626953125, -15.3095703125, -13.94287109375, -12.576171875, -11.20947265625, -9.8427734375, -8.47607421875, -7.109375, -5.74267578125, -4.3759765625, -3.00927734375, -1.642578125, -0.27587890625, 1.0908203125, 2.45751953125, 3.82421875, 5.19091796875, 6.5576171875, 7.92431640625, 9.291015625, 10.65771484375, 12.0244140625, 13.39111328125, 14.7578125, 16.12451171875, 17.4912109375, 18.85791015625, 20.224609375, 21.59130859375, 22.9580078125, 24.32470703125, 25.69140625, 27.05810546875, 28.4248046875, 29.79150390625, 31.158203125, 32.52490234375, 33.8916015625, 35.25830078125, 36.625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 19.0, 13.0, 25.0, 39.0, 49.0, 62.0, 136.0, 160.0, 237.0, 348.0, 527.0, 973.0, 1594.0, 3073.0, 7426.0, 42505.0, 4103301.0, 21736.0, 5681.0, 2643.0, 1387.0, 791.0, 500.0, 303.0, 239.0, 153.0, 105.0, 84.0, 48.0, 29.0, 32.0, 21.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-204.75, -198.79296875, -192.8359375, -186.87890625, -180.921875, -174.96484375, -169.0078125, -163.05078125, -157.09375, -151.13671875, -145.1796875, -139.22265625, -133.265625, -127.30859375, -121.3515625, -115.39453125, -109.4375, -103.48046875, -97.5234375, -91.56640625, -85.609375, -79.65234375, -73.6953125, -67.73828125, -61.78125, -55.82421875, -49.8671875, -43.91015625, -37.953125, -31.99609375, -26.0390625, -20.08203125, -14.125, -8.16796875, -2.2109375, 3.74609375, 9.703125, 15.66015625, 21.6171875, 27.57421875, 33.53125, 39.48828125, 45.4453125, 51.40234375, 57.359375, 63.31640625, 69.2734375, 75.23046875, 81.1875, 87.14453125, 93.1015625, 99.05859375, 105.015625, 110.97265625, 116.9296875, 122.88671875, 128.84375, 134.80078125, 140.7578125, 146.71484375, 152.671875, 158.62890625, 164.5859375, 170.54296875, 176.5]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 8.0, 9.0, 17.0, 16.0, 45.0, 167.0, 3643.0, 101.0, 24.0, 15.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.9375, -59.7529296875, -57.568359375, -55.3837890625, -53.19921875, -51.0146484375, -48.830078125, -46.6455078125, -44.4609375, -42.2763671875, -40.091796875, -37.9072265625, -35.72265625, -33.5380859375, -31.353515625, -29.1689453125, -26.984375, -24.7998046875, -22.615234375, -20.4306640625, -18.24609375, -16.0615234375, -13.876953125, -11.6923828125, -9.5078125, -7.3232421875, -5.138671875, -2.9541015625, -0.76953125, 1.4150390625, 3.599609375, 5.7841796875, 7.96875, 10.1533203125, 12.337890625, 14.5224609375, 16.70703125, 18.8916015625, 21.076171875, 23.2607421875, 25.4453125, 27.6298828125, 29.814453125, 31.9990234375, 34.18359375, 36.3681640625, 38.552734375, 40.7373046875, 42.921875, 45.1064453125, 47.291015625, 49.4755859375, 51.66015625, 53.8447265625, 56.029296875, 58.2138671875, 60.3984375, 62.5830078125, 64.767578125, 66.9521484375, 69.13671875, 71.3212890625, 73.505859375, 75.6904296875, 77.875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 20.0, 39.0, 63.0, 92.0, 139.0, 163.0, 148.0, 98.0, 77.0, 39.0, 22.0, 17.0, 11.0, 9.0, 4.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.9148712158203, -219.68553161621094, -211.45620727539062, -203.22686767578125, -194.99752807617188, -186.7681884765625, -178.5388641357422, -170.3095245361328, -162.0802001953125, -153.85086059570312, -145.6215362548828, -137.39219665527344, -129.16285705566406, -120.93352508544922, -112.70419311523438, -104.474853515625, -96.24551391601562, -88.01618194580078, -79.7868423461914, -71.55751037597656, -63.32817459106445, -55.098838806152344, -46.8695068359375, -38.64017105102539, -30.41083526611328, -22.181499481201172, -13.952165603637695, -5.722831726074219, 2.5065040588378906, 10.73583984375, 18.965171813964844, 27.194507598876953, 35.423858642578125, 43.653194427490234, 51.882530212402344, 60.11186218261719, 68.34120178222656, 76.5705337524414, 84.79986572265625, 93.02920532226562, 101.25853729248047, 109.48786926269531, 117.71720886230469, 125.94654083251953, 134.17587280273438, 142.40521240234375, 150.63455200195312, 158.86387634277344, 167.0932159423828, 175.3225555419922, 183.5518798828125, 191.78121948242188, 200.01055908203125, 208.23989868164062, 216.46922302246094, 224.6985626220703, 232.92788696289062, 241.1572265625, 249.3865509033203, 257.61590576171875, 265.84521484375, 274.0745544433594, 282.30389404296875, 290.5332336425781, 298.7625732421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 9.0, 8.0, 7.0, 7.0, 14.0, 10.0, 15.0, 15.0, 23.0, 27.0, 29.0, 23.0, 35.0, 28.0, 44.0, 40.0, 42.0, 35.0, 41.0, 50.0, 45.0, 42.0, 34.0, 43.0, 32.0, 38.0, 20.0, 26.0, 39.0, 23.0, 27.0, 24.0, 15.0, 12.0, 12.0, 9.0, 17.0, 8.0, 6.0, 7.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-113.14628601074219, -109.76753997802734, -106.3887939453125, -103.01004791259766, -99.63130187988281, -96.25255584716797, -92.87380981445312, -89.49507141113281, -86.11631774902344, -82.7375717163086, -79.35882568359375, -75.9800796508789, -72.60133361816406, -69.22258758544922, -65.84384155273438, -62.4650993347168, -59.08635711669922, -55.707611083984375, -52.32886505126953, -48.95011901855469, -45.571372985839844, -42.192626953125, -38.81388473510742, -35.43513870239258, -32.056392669677734, -28.67764663696289, -25.298900604248047, -21.920156478881836, -18.541410446166992, -15.162664413452148, -11.783920288085938, -8.405174255371094, -5.02642822265625, -1.6476826667785645, 1.731062889099121, 5.109807968139648, 8.488554000854492, 11.867300033569336, 15.246044158935547, 18.62479019165039, 22.003536224365234, 25.382282257080078, 28.761028289794922, 32.1397705078125, 35.518516540527344, 38.89726257324219, 42.27600860595703, 45.654754638671875, 49.03350067138672, 52.41224670410156, 55.790992736816406, 59.16973876953125, 62.548484802246094, 65.92723083496094, 69.30596923828125, 72.68472290039062, 76.06346130371094, 79.44220733642578, 82.82095336914062, 86.19969940185547, 89.57844543457031, 92.95719146728516, 96.3359375, 99.71467590332031, 103.09342956542969]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 4.0, 1.0, 8.0, 8.0, 10.0, 7.0, 21.0, 26.0, 46.0, 68.0, 114.0, 132.0, 246.0, 402.0, 577.0, 1010.0, 1768.0, 3204.0, 6171.0, 13491.0, 31657.0, 85384.0, 290007.0, 418524.0, 119461.0, 42063.0, 17301.0, 7821.0, 3927.0, 2047.0, 1157.0, 688.0, 405.0, 266.0, 191.0, 102.0, 67.0, 51.0, 33.0, 29.0, 21.0, 9.0, 12.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.0, -84.20703125, -81.4140625, -78.62109375, -75.828125, -73.03515625, -70.2421875, -67.44921875, -64.65625, -61.86328125, -59.0703125, -56.27734375, -53.484375, -50.69140625, -47.8984375, -45.10546875, -42.3125, -39.51953125, -36.7265625, -33.93359375, -31.140625, -28.34765625, -25.5546875, -22.76171875, -19.96875, -17.17578125, -14.3828125, -11.58984375, -8.796875, -6.00390625, -3.2109375, -0.41796875, 2.375, 5.16796875, 7.9609375, 10.75390625, 13.546875, 16.33984375, 19.1328125, 21.92578125, 24.71875, 27.51171875, 30.3046875, 33.09765625, 35.890625, 38.68359375, 41.4765625, 44.26953125, 47.0625, 49.85546875, 52.6484375, 55.44140625, 58.234375, 61.02734375, 63.8203125, 66.61328125, 69.40625, 72.19921875, 74.9921875, 77.78515625, 80.578125, 83.37109375, 86.1640625, 88.95703125, 91.75]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 5.0, 7.0, 11.0, 19.0, 17.0, 21.0, 27.0, 38.0, 28.0, 46.0, 68.0, 70.0, 77.0, 70.0, 69.0, 67.0, 73.0, 64.0, 37.0, 42.0, 25.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.96875, -43.560546875, -42.15234375, -40.744140625, -39.3359375, -37.927734375, -36.51953125, -35.111328125, -33.703125, -32.294921875, -30.88671875, -29.478515625, -28.0703125, -26.662109375, -25.25390625, -23.845703125, -22.4375, -21.029296875, -19.62109375, -18.212890625, -16.8046875, -15.396484375, -13.98828125, -12.580078125, -11.171875, -9.763671875, -8.35546875, -6.947265625, -5.5390625, -4.130859375, -2.72265625, -1.314453125, 0.09375, 1.501953125, 2.91015625, 4.318359375, 5.7265625, 7.134765625, 8.54296875, 9.951171875, 11.359375, 12.767578125, 14.17578125, 15.583984375, 16.9921875, 18.400390625, 19.80859375, 21.216796875, 22.625, 24.033203125, 25.44140625, 26.849609375, 28.2578125, 29.666015625, 31.07421875, 32.482421875, 33.890625, 35.298828125, 36.70703125, 38.115234375, 39.5234375, 40.931640625, 42.33984375, 43.748046875, 45.15625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 13.0, 10.0, 20.0, 18.0, 37.0, 45.0, 58.0, 104.0, 107.0, 167.0, 274.0, 381.0, 663.0, 1053.0, 1913.0, 3780.0, 8094.0, 21816.0, 72238.0, 386025.0, 432949.0, 78114.0, 23096.0, 8738.0, 3879.0, 1925.0, 1072.0, 600.0, 428.0, 285.0, 195.0, 115.0, 98.0, 60.0, 41.0, 30.0, 26.0, 18.0, 17.0, 5.0, 6.0, 7.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0], "bins": [-102.6875, -99.755859375, -96.82421875, -93.892578125, -90.9609375, -88.029296875, -85.09765625, -82.166015625, -79.234375, -76.302734375, -73.37109375, -70.439453125, -67.5078125, -64.576171875, -61.64453125, -58.712890625, -55.78125, -52.849609375, -49.91796875, -46.986328125, -44.0546875, -41.123046875, -38.19140625, -35.259765625, -32.328125, -29.396484375, -26.46484375, -23.533203125, -20.6015625, -17.669921875, -14.73828125, -11.806640625, -8.875, -5.943359375, -3.01171875, -0.080078125, 2.8515625, 5.783203125, 8.71484375, 11.646484375, 14.578125, 17.509765625, 20.44140625, 23.373046875, 26.3046875, 29.236328125, 32.16796875, 35.099609375, 38.03125, 40.962890625, 43.89453125, 46.826171875, 49.7578125, 52.689453125, 55.62109375, 58.552734375, 61.484375, 64.416015625, 67.34765625, 70.279296875, 73.2109375, 76.142578125, 79.07421875, 82.005859375, 84.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 8.0, 12.0, 15.0, 17.0, 19.0, 22.0, 37.0, 41.0, 47.0, 38.0, 53.0, 50.0, 52.0, 57.0, 77.0, 66.0, 47.0, 46.0, 41.0, 50.0, 39.0, 27.0, 32.0, 23.0, 20.0, 15.0, 10.0, 8.0, 7.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.125, -187.783203125, -182.44140625, -177.099609375, -171.7578125, -166.416015625, -161.07421875, -155.732421875, -150.390625, -145.048828125, -139.70703125, -134.365234375, -129.0234375, -123.681640625, -118.33984375, -112.998046875, -107.65625, -102.314453125, -96.97265625, -91.630859375, -86.2890625, -80.947265625, -75.60546875, -70.263671875, -64.921875, -59.580078125, -54.23828125, -48.896484375, -43.5546875, -38.212890625, -32.87109375, -27.529296875, -22.1875, -16.845703125, -11.50390625, -6.162109375, -0.8203125, 4.521484375, 9.86328125, 15.205078125, 20.546875, 25.888671875, 31.23046875, 36.572265625, 41.9140625, 47.255859375, 52.59765625, 57.939453125, 63.28125, 68.623046875, 73.96484375, 79.306640625, 84.6484375, 89.990234375, 95.33203125, 100.673828125, 106.015625, 111.357421875, 116.69921875, 122.041015625, 127.3828125, 132.724609375, 138.06640625, 143.408203125, 148.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 4.0, 7.0, 12.0, 19.0, 31.0, 49.0, 72.0, 157.0, 356.0, 1101.0, 4598.0, 47778.0, 954694.0, 34049.0, 3931.0, 984.0, 352.0, 158.0, 68.0, 38.0, 30.0, 18.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.5, -101.65625, -97.8125, -93.96875, -90.125, -86.28125, -82.4375, -78.59375, -74.75, -70.90625, -67.0625, -63.21875, -59.375, -55.53125, -51.6875, -47.84375, -44.0, -40.15625, -36.3125, -32.46875, -28.625, -24.78125, -20.9375, -17.09375, -13.25, -9.40625, -5.5625, -1.71875, 2.125, 5.96875, 9.8125, 13.65625, 17.5, 21.34375, 25.1875, 29.03125, 32.875, 36.71875, 40.5625, 44.40625, 48.25, 52.09375, 55.9375, 59.78125, 63.625, 67.46875, 71.3125, 75.15625, 79.0, 82.84375, 86.6875, 90.53125, 94.375, 98.21875, 102.0625, 105.90625, 109.75, 113.59375, 117.4375, 121.28125, 125.125, 128.96875, 132.8125, 136.65625, 140.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 25.0, 22.0, 23.0, 39.0, 53.0, 84.0, 144.0, 212.0, 159.0, 80.0, 46.0, 20.0, 19.0, 15.0, 12.0, 5.0, 9.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0136566162109375, -0.013141870498657227, -0.012627124786376953, -0.01211237907409668, -0.011597633361816406, -0.011082887649536133, -0.01056814193725586, -0.010053396224975586, -0.009538650512695312, -0.009023904800415039, -0.008509159088134766, -0.007994413375854492, -0.007479667663574219, -0.006964921951293945, -0.006450176239013672, -0.0059354305267333984, -0.005420684814453125, -0.0049059391021728516, -0.004391193389892578, -0.0038764476776123047, -0.0033617019653320312, -0.002846956253051758, -0.0023322105407714844, -0.001817464828491211, -0.0013027191162109375, -0.0007879734039306641, -0.0002732276916503906, 0.0002415180206298828, 0.0007562637329101562, 0.0012710094451904297, 0.0017857551574707031, 0.0023005008697509766, 0.00281524658203125, 0.0033299922943115234, 0.003844738006591797, 0.00435948371887207, 0.004874229431152344, 0.005388975143432617, 0.005903720855712891, 0.006418466567993164, 0.0069332122802734375, 0.007447957992553711, 0.007962703704833984, 0.008477449417114258, 0.008992195129394531, 0.009506940841674805, 0.010021686553955078, 0.010536432266235352, 0.011051177978515625, 0.011565923690795898, 0.012080669403076172, 0.012595415115356445, 0.013110160827636719, 0.013624906539916992, 0.014139652252197266, 0.014654397964477539, 0.015169143676757812, 0.015683889389038086, 0.01619863510131836, 0.016713380813598633, 0.017228126525878906, 0.01774287223815918, 0.018257617950439453, 0.018772363662719727, 0.019287109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 8.0, 5.0, 4.0, 5.0, 17.0, 23.0, 25.0, 42.0, 60.0, 93.0, 161.0, 293.0, 466.0, 1076.0, 2846.0, 12254.0, 205873.0, 795902.0, 22184.0, 4280.0, 1433.0, 650.0, 323.0, 179.0, 103.0, 83.0, 43.0, 28.0, 25.0, 22.0, 14.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-104.0625, -100.611328125, -97.16015625, -93.708984375, -90.2578125, -86.806640625, -83.35546875, -79.904296875, -76.453125, -73.001953125, -69.55078125, -66.099609375, -62.6484375, -59.197265625, -55.74609375, -52.294921875, -48.84375, -45.392578125, -41.94140625, -38.490234375, -35.0390625, -31.587890625, -28.13671875, -24.685546875, -21.234375, -17.783203125, -14.33203125, -10.880859375, -7.4296875, -3.978515625, -0.52734375, 2.923828125, 6.375, 9.826171875, 13.27734375, 16.728515625, 20.1796875, 23.630859375, 27.08203125, 30.533203125, 33.984375, 37.435546875, 40.88671875, 44.337890625, 47.7890625, 51.240234375, 54.69140625, 58.142578125, 61.59375, 65.044921875, 68.49609375, 71.947265625, 75.3984375, 78.849609375, 82.30078125, 85.751953125, 89.203125, 92.654296875, 96.10546875, 99.556640625, 103.0078125, 106.458984375, 109.91015625, 113.361328125, 116.8125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 11.0, 11.0, 17.0, 24.0, 50.0, 90.0, 220.0, 257.0, 151.0, 67.0, 34.0, 19.0, 20.0, 13.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.375, -86.943359375, -83.51171875, -80.080078125, -76.6484375, -73.216796875, -69.78515625, -66.353515625, -62.921875, -59.490234375, -56.05859375, -52.626953125, -49.1953125, -45.763671875, -42.33203125, -38.900390625, -35.46875, -32.037109375, -28.60546875, -25.173828125, -21.7421875, -18.310546875, -14.87890625, -11.447265625, -8.015625, -4.583984375, -1.15234375, 2.279296875, 5.7109375, 9.142578125, 12.57421875, 16.005859375, 19.4375, 22.869140625, 26.30078125, 29.732421875, 33.1640625, 36.595703125, 40.02734375, 43.458984375, 46.890625, 50.322265625, 53.75390625, 57.185546875, 60.6171875, 64.048828125, 67.48046875, 70.912109375, 74.34375, 77.775390625, 81.20703125, 84.638671875, 88.0703125, 91.501953125, 94.93359375, 98.365234375, 101.796875, 105.228515625, 108.66015625, 112.091796875, 115.5234375, 118.955078125, 122.38671875, 125.818359375, 129.25]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 30.0, 157.0, 447.0, 263.0, 67.0, 22.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1050.192626953125, -941.7163696289062, -833.2401123046875, -724.7638549804688, -616.28759765625, -507.81134033203125, -399.3350830078125, -290.85882568359375, -182.382568359375, -73.90631103515625, 34.5699462890625, 143.04620361328125, 251.5224609375, 359.99871826171875, 468.4749755859375, 576.9512329101562, 685.427490234375, 793.9037475585938, 902.3800048828125, 1010.8562622070312, 1119.33251953125, 1227.808837890625, 1336.2850341796875, 1444.76123046875, 1553.237548828125, 1661.7138671875, 1770.1900634765625, 1878.666259765625, 1987.142578125, 2095.618896484375, 2204.09521484375, 2312.5712890625, 2421.04736328125, 2529.523681640625, 2638.0, 2746.47607421875, 2854.952392578125, 2963.4287109375, 3071.90478515625, 3180.381103515625, 3288.857421875, 3397.333740234375, 3505.81005859375, 3614.2861328125, 3722.762451171875, 3831.23876953125, 3939.71484375, 4048.191162109375, 4156.66748046875, 4265.1435546875, 4373.6201171875, 4482.09619140625, 4590.572265625, 4699.048828125, 4807.52490234375, 4916.00146484375, 5024.4775390625, 5132.95361328125, 5241.43017578125, 5349.90625, 5458.3828125, 5566.85888671875, 5675.3349609375, 5783.8115234375, 5892.28759765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 3.0, 8.0, 8.0, 14.0, 9.0, 11.0, 13.0, 22.0, 26.0, 24.0, 36.0, 27.0, 32.0, 37.0, 39.0, 40.0, 54.0, 43.0, 53.0, 55.0, 37.0, 55.0, 40.0, 46.0, 37.0, 42.0, 30.0, 30.0, 17.0, 26.0, 17.0, 16.0, 10.0, 12.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-621.1695556640625, -600.2647705078125, -579.3599853515625, -558.4552001953125, -537.5504150390625, -516.6456298828125, -495.7408447265625, -474.8360595703125, -453.9312744140625, -433.0264892578125, -412.1217041015625, -391.2169189453125, -370.3121337890625, -349.4073486328125, -328.5025634765625, -307.5977783203125, -286.6929626464844, -265.7881774902344, -244.88339233398438, -223.97860717773438, -203.07382202148438, -182.16903686523438, -161.2642364501953, -140.3594512939453, -119.45466613769531, -98.54988098144531, -77.64509582519531, -56.74030303955078, -35.83551788330078, -14.930732727050781, 5.97406005859375, 26.87884521484375, 47.78363037109375, 68.68841552734375, 89.59320068359375, 110.49799346923828, 131.40277099609375, 152.30755615234375, 173.2123565673828, 194.1171417236328, 215.0219268798828, 235.9267120361328, 256.8315124511719, 277.7362976074219, 298.6410827636719, 319.5458679199219, 340.4506530761719, 361.3554382324219, 382.2602233886719, 403.1650085449219, 424.0697937011719, 444.9745788574219, 465.8793640136719, 486.7841491699219, 507.68896484375, 528.59375, 549.49853515625, 570.4033203125, 591.30810546875, 612.212890625, 633.11767578125, 654.0224609375, 674.92724609375, 695.83203125, 716.73681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 15.0, 13.0, 20.0, 27.0, 46.0, 64.0, 72.0, 125.0, 127.0, 188.0, 252.0, 357.0, 524.0, 766.0, 1063.0, 1690.0, 2684.0, 4578.0, 8676.0, 19378.0, 65604.0, 903120.0, 2988755.0, 141421.0, 28522.0, 11413.0, 5606.0, 3251.0, 1884.0, 1180.0, 837.0, 533.0, 412.0, 267.0, 195.0, 158.0, 105.0, 96.0, 60.0, 57.0, 45.0, 25.0, 15.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.9375, -68.5068359375, -66.076171875, -63.6455078125, -61.21484375, -58.7841796875, -56.353515625, -53.9228515625, -51.4921875, -49.0615234375, -46.630859375, -44.2001953125, -41.76953125, -39.3388671875, -36.908203125, -34.4775390625, -32.046875, -29.6162109375, -27.185546875, -24.7548828125, -22.32421875, -19.8935546875, -17.462890625, -15.0322265625, -12.6015625, -10.1708984375, -7.740234375, -5.3095703125, -2.87890625, -0.4482421875, 1.982421875, 4.4130859375, 6.84375, 9.2744140625, 11.705078125, 14.1357421875, 16.56640625, 18.9970703125, 21.427734375, 23.8583984375, 26.2890625, 28.7197265625, 31.150390625, 33.5810546875, 36.01171875, 38.4423828125, 40.873046875, 43.3037109375, 45.734375, 48.1650390625, 50.595703125, 53.0263671875, 55.45703125, 57.8876953125, 60.318359375, 62.7490234375, 65.1796875, 67.6103515625, 70.041015625, 72.4716796875, 74.90234375, 77.3330078125, 79.763671875, 82.1943359375, 84.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 7.0, 14.0, 28.0, 17.0, 25.0, 40.0, 39.0, 45.0, 61.0, 68.0, 77.0, 75.0, 76.0, 78.0, 68.0, 63.0, 44.0, 36.0, 32.0, 25.0, 12.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -33.60693359375, -32.1826171875, -30.75830078125, -29.333984375, -27.90966796875, -26.4853515625, -25.06103515625, -23.63671875, -22.21240234375, -20.7880859375, -19.36376953125, -17.939453125, -16.51513671875, -15.0908203125, -13.66650390625, -12.2421875, -10.81787109375, -9.3935546875, -7.96923828125, -6.544921875, -5.12060546875, -3.6962890625, -2.27197265625, -0.84765625, 0.57666015625, 2.0009765625, 3.42529296875, 4.849609375, 6.27392578125, 7.6982421875, 9.12255859375, 10.546875, 11.97119140625, 13.3955078125, 14.81982421875, 16.244140625, 17.66845703125, 19.0927734375, 20.51708984375, 21.94140625, 23.36572265625, 24.7900390625, 26.21435546875, 27.638671875, 29.06298828125, 30.4873046875, 31.91162109375, 33.3359375, 34.76025390625, 36.1845703125, 37.60888671875, 39.033203125, 40.45751953125, 41.8818359375, 43.30615234375, 44.73046875, 46.15478515625, 47.5791015625, 49.00341796875, 50.427734375, 51.85205078125, 53.2763671875, 54.70068359375, 56.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 11.0, 6.0, 8.0, 13.0, 20.0, 16.0, 41.0, 73.0, 88.0, 162.0, 246.0, 428.0, 781.0, 1588.0, 3545.0, 8788.0, 25957.0, 110839.0, 3336524.0, 621263.0, 56466.0, 16364.0, 5971.0, 2408.0, 1174.0, 613.0, 348.0, 210.0, 111.0, 79.0, 38.0, 37.0, 16.0, 16.0, 9.0, 7.0, 3.0, 4.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.875, -98.337890625, -94.80078125, -91.263671875, -87.7265625, -84.189453125, -80.65234375, -77.115234375, -73.578125, -70.041015625, -66.50390625, -62.966796875, -59.4296875, -55.892578125, -52.35546875, -48.818359375, -45.28125, -41.744140625, -38.20703125, -34.669921875, -31.1328125, -27.595703125, -24.05859375, -20.521484375, -16.984375, -13.447265625, -9.91015625, -6.373046875, -2.8359375, 0.701171875, 4.23828125, 7.775390625, 11.3125, 14.849609375, 18.38671875, 21.923828125, 25.4609375, 28.998046875, 32.53515625, 36.072265625, 39.609375, 43.146484375, 46.68359375, 50.220703125, 53.7578125, 57.294921875, 60.83203125, 64.369140625, 67.90625, 71.443359375, 74.98046875, 78.517578125, 82.0546875, 85.591796875, 89.12890625, 92.666015625, 96.203125, 99.740234375, 103.27734375, 106.814453125, 110.3515625, 113.888671875, 117.42578125, 120.962890625, 124.5]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 12.0, 13.0, 11.0, 24.0, 24.0, 36.0, 37.0, 63.0, 102.0, 205.0, 526.0, 1404.0, 898.0, 321.0, 132.0, 76.0, 41.0, 30.0, 17.0, 23.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -136.6904296875, -132.755859375, -128.8212890625, -124.88671875, -120.9521484375, -117.017578125, -113.0830078125, -109.1484375, -105.2138671875, -101.279296875, -97.3447265625, -93.41015625, -89.4755859375, -85.541015625, -81.6064453125, -77.671875, -73.7373046875, -69.802734375, -65.8681640625, -61.93359375, -57.9990234375, -54.064453125, -50.1298828125, -46.1953125, -42.2607421875, -38.326171875, -34.3916015625, -30.45703125, -26.5224609375, -22.587890625, -18.6533203125, -14.71875, -10.7841796875, -6.849609375, -2.9150390625, 1.01953125, 4.9541015625, 8.888671875, 12.8232421875, 16.7578125, 20.6923828125, 24.626953125, 28.5615234375, 32.49609375, 36.4306640625, 40.365234375, 44.2998046875, 48.234375, 52.1689453125, 56.103515625, 60.0380859375, 63.97265625, 67.9072265625, 71.841796875, 75.7763671875, 79.7109375, 83.6455078125, 87.580078125, 91.5146484375, 95.44921875, 99.3837890625, 103.318359375, 107.2529296875, 111.1875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 20.0, 25.0, 51.0, 106.0, 196.0, 292.0, 181.0, 62.0, 26.0, 14.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1828.8466796875, -1782.648193359375, -1736.44970703125, -1690.251220703125, -1644.052734375, -1597.854248046875, -1551.65576171875, -1505.457275390625, -1459.2587890625, -1413.060302734375, -1366.86181640625, -1320.663330078125, -1274.46484375, -1228.266357421875, -1182.06787109375, -1135.869384765625, -1089.6710205078125, -1043.4725341796875, -997.2740478515625, -951.0755615234375, -904.8770751953125, -858.6785888671875, -812.4801635742188, -766.2816772460938, -720.0831909179688, -673.8847045898438, -627.6862182617188, -581.48779296875, -535.289306640625, -489.0907897949219, -442.892333984375, -396.69384765625, -350.495361328125, -304.296875, -258.098388671875, -211.89993286132812, -165.70144653320312, -119.50296020507812, -73.30450439453125, -27.10601806640625, 19.09246826171875, 65.29094696044922, 111.48942565917969, 157.68789672851562, 203.88638305664062, 250.08486938476562, 296.2833251953125, 342.4818115234375, 388.6802978515625, 434.8787841796875, 481.0772705078125, 527.2757568359375, 573.4742431640625, 619.6727294921875, 665.8711547851562, 712.0696411132812, 758.2681274414062, 804.4666137695312, 850.6651000976562, 896.863525390625, 943.06201171875, 989.260498046875, 1035.458984375, 1081.657470703125, 1127.85595703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 7.0, 6.0, 17.0, 23.0, 20.0, 16.0, 19.0, 25.0, 28.0, 32.0, 31.0, 31.0, 40.0, 42.0, 42.0, 39.0, 37.0, 46.0, 50.0, 33.0, 42.0, 44.0, 44.0, 43.0, 25.0, 29.0, 35.0, 22.0, 23.0, 10.0, 13.0, 9.0, 13.0, 8.0, 11.0, 10.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-447.6067810058594, -433.94354248046875, -420.28033447265625, -406.61712646484375, -392.9538879394531, -379.2906494140625, -365.62744140625, -351.9642333984375, -338.3009948730469, -324.63775634765625, -310.97454833984375, -297.31134033203125, -283.6481018066406, -269.98486328125, -256.3216552734375, -242.65843200683594, -228.99520874023438, -215.3319854736328, -201.66876220703125, -188.0055389404297, -174.34231567382812, -160.67909240722656, -147.015869140625, -133.35264587402344, -119.68942260742188, -106.02619934082031, -92.36297607421875, -78.69975280761719, -65.03652954101562, -51.37330627441406, -37.7100830078125, -24.046859741210938, -10.38360595703125, 3.2796173095703125, 16.942840576171875, 30.606063842773438, 44.269287109375, 57.93251037597656, 71.59573364257812, 85.25895690917969, 98.92218017578125, 112.58540344238281, 126.24862670898438, 139.91184997558594, 153.5750732421875, 167.23829650878906, 180.90151977539062, 194.5647430419922, 208.22796630859375, 221.8911895751953, 235.55441284179688, 249.21763610839844, 262.880859375, 276.5440673828125, 290.2073059082031, 303.87054443359375, 317.53375244140625, 331.19696044921875, 344.8601989746094, 358.5234375, 372.1866455078125, 385.849853515625, 399.5130920410156, 413.17633056640625, 426.83953857421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 10.0, 10.0, 17.0, 14.0, 30.0, 47.0, 67.0, 89.0, 143.0, 223.0, 329.0, 457.0, 697.0, 978.0, 1595.0, 2476.0, 4149.0, 6958.0, 12624.0, 24743.0, 53562.0, 140373.0, 394937.0, 243737.0, 83951.0, 35681.0, 17201.0, 9233.0, 5166.0, 3165.0, 2007.0, 1241.0, 863.0, 518.0, 368.0, 261.0, 187.0, 129.0, 102.0, 62.0, 40.0, 33.0, 22.0, 19.0, 13.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-71.875, -69.7451171875, -67.615234375, -65.4853515625, -63.35546875, -61.2255859375, -59.095703125, -56.9658203125, -54.8359375, -52.7060546875, -50.576171875, -48.4462890625, -46.31640625, -44.1865234375, -42.056640625, -39.9267578125, -37.796875, -35.6669921875, -33.537109375, -31.4072265625, -29.27734375, -27.1474609375, -25.017578125, -22.8876953125, -20.7578125, -18.6279296875, -16.498046875, -14.3681640625, -12.23828125, -10.1083984375, -7.978515625, -5.8486328125, -3.71875, -1.5888671875, 0.541015625, 2.6708984375, 4.80078125, 6.9306640625, 9.060546875, 11.1904296875, 13.3203125, 15.4501953125, 17.580078125, 19.7099609375, 21.83984375, 23.9697265625, 26.099609375, 28.2294921875, 30.359375, 32.4892578125, 34.619140625, 36.7490234375, 38.87890625, 41.0087890625, 43.138671875, 45.2685546875, 47.3984375, 49.5283203125, 51.658203125, 53.7880859375, 55.91796875, 58.0478515625, 60.177734375, 62.3076171875, 64.4375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 15.0, 19.0, 22.0, 23.0, 28.0, 32.0, 46.0, 49.0, 45.0, 60.0, 69.0, 58.0, 64.0, 72.0, 49.0, 54.0, 50.0, 37.0, 33.0, 35.0, 20.0, 21.0, 19.0, 19.0, 11.0, 6.0, 1.0, 4.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.630859375, -30.35546875, -29.080078125, -27.8046875, -26.529296875, -25.25390625, -23.978515625, -22.703125, -21.427734375, -20.15234375, -18.876953125, -17.6015625, -16.326171875, -15.05078125, -13.775390625, -12.5, -11.224609375, -9.94921875, -8.673828125, -7.3984375, -6.123046875, -4.84765625, -3.572265625, -2.296875, -1.021484375, 0.25390625, 1.529296875, 2.8046875, 4.080078125, 5.35546875, 6.630859375, 7.90625, 9.181640625, 10.45703125, 11.732421875, 13.0078125, 14.283203125, 15.55859375, 16.833984375, 18.109375, 19.384765625, 20.66015625, 21.935546875, 23.2109375, 24.486328125, 25.76171875, 27.037109375, 28.3125, 29.587890625, 30.86328125, 32.138671875, 33.4140625, 34.689453125, 35.96484375, 37.240234375, 38.515625, 39.791015625, 41.06640625, 42.341796875, 43.6171875, 44.892578125, 46.16796875, 47.443359375, 48.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 11.0, 18.0, 18.0, 29.0, 35.0, 51.0, 67.0, 108.0, 202.0, 293.0, 433.0, 809.0, 1624.0, 3957.0, 12396.0, 60986.0, 732676.0, 197690.0, 25240.0, 6758.0, 2447.0, 1122.0, 594.0, 314.0, 219.0, 121.0, 97.0, 67.0, 46.0, 28.0, 25.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-161.625, -156.689453125, -151.75390625, -146.818359375, -141.8828125, -136.947265625, -132.01171875, -127.076171875, -122.140625, -117.205078125, -112.26953125, -107.333984375, -102.3984375, -97.462890625, -92.52734375, -87.591796875, -82.65625, -77.720703125, -72.78515625, -67.849609375, -62.9140625, -57.978515625, -53.04296875, -48.107421875, -43.171875, -38.236328125, -33.30078125, -28.365234375, -23.4296875, -18.494140625, -13.55859375, -8.623046875, -3.6875, 1.248046875, 6.18359375, 11.119140625, 16.0546875, 20.990234375, 25.92578125, 30.861328125, 35.796875, 40.732421875, 45.66796875, 50.603515625, 55.5390625, 60.474609375, 65.41015625, 70.345703125, 75.28125, 80.216796875, 85.15234375, 90.087890625, 95.0234375, 99.958984375, 104.89453125, 109.830078125, 114.765625, 119.701171875, 124.63671875, 129.572265625, 134.5078125, 139.443359375, 144.37890625, 149.314453125, 154.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 9.0, 6.0, 9.0, 13.0, 16.0, 23.0, 26.0, 32.0, 31.0, 34.0, 45.0, 42.0, 35.0, 34.0, 55.0, 50.0, 49.0, 42.0, 54.0, 52.0, 47.0, 42.0, 32.0, 35.0, 36.0, 21.0, 21.0, 19.0, 9.0, 9.0, 8.0, 9.0, 8.0, 4.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-184.875, -180.048828125, -175.22265625, -170.396484375, -165.5703125, -160.744140625, -155.91796875, -151.091796875, -146.265625, -141.439453125, -136.61328125, -131.787109375, -126.9609375, -122.134765625, -117.30859375, -112.482421875, -107.65625, -102.830078125, -98.00390625, -93.177734375, -88.3515625, -83.525390625, -78.69921875, -73.873046875, -69.046875, -64.220703125, -59.39453125, -54.568359375, -49.7421875, -44.916015625, -40.08984375, -35.263671875, -30.4375, -25.611328125, -20.78515625, -15.958984375, -11.1328125, -6.306640625, -1.48046875, 3.345703125, 8.171875, 12.998046875, 17.82421875, 22.650390625, 27.4765625, 32.302734375, 37.12890625, 41.955078125, 46.78125, 51.607421875, 56.43359375, 61.259765625, 66.0859375, 70.912109375, 75.73828125, 80.564453125, 85.390625, 90.216796875, 95.04296875, 99.869140625, 104.6953125, 109.521484375, 114.34765625, 119.173828125, 124.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 7.0, 11.0, 17.0, 13.0, 32.0, 41.0, 65.0, 119.0, 186.0, 320.0, 610.0, 1194.0, 2696.0, 6509.0, 21063.0, 134098.0, 761233.0, 93140.0, 16884.0, 5457.0, 2407.0, 1097.0, 512.0, 289.0, 207.0, 124.0, 71.0, 43.0, 33.0, 17.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -42.7568359375, -41.138671875, -39.5205078125, -37.90234375, -36.2841796875, -34.666015625, -33.0478515625, -31.4296875, -29.8115234375, -28.193359375, -26.5751953125, -24.95703125, -23.3388671875, -21.720703125, -20.1025390625, -18.484375, -16.8662109375, -15.248046875, -13.6298828125, -12.01171875, -10.3935546875, -8.775390625, -7.1572265625, -5.5390625, -3.9208984375, -2.302734375, -0.6845703125, 0.93359375, 2.5517578125, 4.169921875, 5.7880859375, 7.40625, 9.0244140625, 10.642578125, 12.2607421875, 13.87890625, 15.4970703125, 17.115234375, 18.7333984375, 20.3515625, 21.9697265625, 23.587890625, 25.2060546875, 26.82421875, 28.4423828125, 30.060546875, 31.6787109375, 33.296875, 34.9150390625, 36.533203125, 38.1513671875, 39.76953125, 41.3876953125, 43.005859375, 44.6240234375, 46.2421875, 47.8603515625, 49.478515625, 51.0966796875, 52.71484375, 54.3330078125, 55.951171875, 57.5693359375, 59.1875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 16.0, 18.0, 34.0, 37.0, 61.0, 100.0, 120.0, 187.0, 144.0, 89.0, 51.0, 45.0, 16.0, 11.0, 10.0, 11.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018157958984375, -0.017614126205444336, -0.017070293426513672, -0.016526460647583008, -0.015982627868652344, -0.01543879508972168, -0.014894962310791016, -0.014351129531860352, -0.013807296752929688, -0.013263463973999023, -0.01271963119506836, -0.012175798416137695, -0.011631965637207031, -0.011088132858276367, -0.010544300079345703, -0.010000467300415039, -0.009456634521484375, -0.008912801742553711, -0.008368968963623047, -0.007825136184692383, -0.007281303405761719, -0.006737470626831055, -0.006193637847900391, -0.0056498050689697266, -0.0051059722900390625, -0.0045621395111083984, -0.004018306732177734, -0.0034744739532470703, -0.0029306411743164062, -0.002386808395385742, -0.0018429756164550781, -0.001299142837524414, -0.00075531005859375, -0.00021147727966308594, 0.0003323554992675781, 0.0008761882781982422, 0.0014200210571289062, 0.0019638538360595703, 0.0025076866149902344, 0.0030515193939208984, 0.0035953521728515625, 0.0041391849517822266, 0.004683017730712891, 0.005226850509643555, 0.005770683288574219, 0.006314516067504883, 0.006858348846435547, 0.007402181625366211, 0.007946014404296875, 0.008489847183227539, 0.009033679962158203, 0.009577512741088867, 0.010121345520019531, 0.010665178298950195, 0.01120901107788086, 0.011752843856811523, 0.012296676635742188, 0.012840509414672852, 0.013384342193603516, 0.01392817497253418, 0.014472007751464844, 0.015015840530395508, 0.015559673309326172, 0.016103506088256836, 0.0166473388671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 10.0, 12.0, 14.0, 20.0, 29.0, 42.0, 56.0, 81.0, 126.0, 201.0, 353.0, 647.0, 1119.0, 2386.0, 6094.0, 19918.0, 113039.0, 726313.0, 143128.0, 22680.0, 6694.0, 2646.0, 1288.0, 631.0, 363.0, 221.0, 137.0, 95.0, 59.0, 38.0, 29.0, 22.0, 11.0, 18.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0, -43.57373046875, -42.1474609375, -40.72119140625, -39.294921875, -37.86865234375, -36.4423828125, -35.01611328125, -33.58984375, -32.16357421875, -30.7373046875, -29.31103515625, -27.884765625, -26.45849609375, -25.0322265625, -23.60595703125, -22.1796875, -20.75341796875, -19.3271484375, -17.90087890625, -16.474609375, -15.04833984375, -13.6220703125, -12.19580078125, -10.76953125, -9.34326171875, -7.9169921875, -6.49072265625, -5.064453125, -3.63818359375, -2.2119140625, -0.78564453125, 0.640625, 2.06689453125, 3.4931640625, 4.91943359375, 6.345703125, 7.77197265625, 9.1982421875, 10.62451171875, 12.05078125, 13.47705078125, 14.9033203125, 16.32958984375, 17.755859375, 19.18212890625, 20.6083984375, 22.03466796875, 23.4609375, 24.88720703125, 26.3134765625, 27.73974609375, 29.166015625, 30.59228515625, 32.0185546875, 33.44482421875, 34.87109375, 36.29736328125, 37.7236328125, 39.14990234375, 40.576171875, 42.00244140625, 43.4287109375, 44.85498046875, 46.28125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 6.0, 12.0, 16.0, 12.0, 15.0, 23.0, 47.0, 50.0, 60.0, 75.0, 82.0, 77.0, 91.0, 74.0, 80.0, 56.0, 55.0, 41.0, 25.0, 15.0, 13.0, 10.0, 10.0, 12.0, 4.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-48.1875, -46.85107421875, -45.5146484375, -44.17822265625, -42.841796875, -41.50537109375, -40.1689453125, -38.83251953125, -37.49609375, -36.15966796875, -34.8232421875, -33.48681640625, -32.150390625, -30.81396484375, -29.4775390625, -28.14111328125, -26.8046875, -25.46826171875, -24.1318359375, -22.79541015625, -21.458984375, -20.12255859375, -18.7861328125, -17.44970703125, -16.11328125, -14.77685546875, -13.4404296875, -12.10400390625, -10.767578125, -9.43115234375, -8.0947265625, -6.75830078125, -5.421875, -4.08544921875, -2.7490234375, -1.41259765625, -0.076171875, 1.26025390625, 2.5966796875, 3.93310546875, 5.26953125, 6.60595703125, 7.9423828125, 9.27880859375, 10.615234375, 11.95166015625, 13.2880859375, 14.62451171875, 15.9609375, 17.29736328125, 18.6337890625, 19.97021484375, 21.306640625, 22.64306640625, 23.9794921875, 25.31591796875, 26.65234375, 27.98876953125, 29.3251953125, 30.66162109375, 31.998046875, 33.33447265625, 34.6708984375, 36.00732421875, 37.34375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 12.0, 8.0, 9.0, 28.0, 52.0, 59.0, 93.0, 138.0, 155.0, 150.0, 87.0, 72.0, 51.0, 28.0, 20.0, 16.0, 7.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-859.085205078125, -830.8626708984375, -802.6400756835938, -774.4175415039062, -746.1949462890625, -717.972412109375, -689.7498779296875, -661.52734375, -633.3047485351562, -605.0822143554688, -576.859619140625, -548.6370849609375, -520.41455078125, -492.19195556640625, -463.96942138671875, -435.7468566894531, -407.5242919921875, -379.3017272949219, -351.07916259765625, -322.85662841796875, -294.6340637207031, -266.4114990234375, -238.18894958496094, -209.96640014648438, -181.74383544921875, -153.52127075195312, -125.29872131347656, -97.07616424560547, -68.85360717773438, -40.63104248046875, -12.408493041992188, 15.814056396484375, 44.03662109375, 72.2591781616211, 100.48173522949219, 128.70428466796875, 156.92684936523438, 185.1494140625, 213.37196350097656, 241.59451293945312, 269.81707763671875, 298.0396423339844, 326.26220703125, 354.4847412109375, 382.7073059082031, 410.92987060546875, 439.15240478515625, 467.3749694824219, 495.5975341796875, 523.820068359375, 552.0426635742188, 580.2651977539062, 608.48779296875, 636.7103271484375, 664.932861328125, 693.1553955078125, 721.3779907226562, 749.6005249023438, 777.8231201171875, 806.045654296875, 834.2681884765625, 862.4907836914062, 890.7133178710938, 918.9359130859375, 947.158447265625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 12.0, 14.0, 13.0, 21.0, 24.0, 23.0, 20.0, 23.0, 29.0, 29.0, 41.0, 47.0, 66.0, 55.0, 65.0, 48.0, 56.0, 49.0, 35.0, 35.0, 31.0, 31.0, 35.0, 32.0, 29.0, 19.0, 14.0, 18.0, 9.0, 8.0, 10.0, 14.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.265380859375, -602.0185546875, -582.7717895507812, -563.5249633789062, -544.2781372070312, -525.0313110351562, -505.7845458984375, -486.5377197265625, -467.2908935546875, -448.0440979003906, -428.7972717285156, -409.55047607421875, -390.30364990234375, -371.0568542480469, -351.81005859375, -332.563232421875, -313.3164367675781, -294.06964111328125, -274.82281494140625, -255.57601928710938, -236.32919311523438, -217.0823974609375, -197.83558654785156, -178.58877563476562, -159.3419647216797, -140.09515380859375, -120.84834289550781, -101.6015396118164, -82.35472869873047, -63.10791778564453, -43.861114501953125, -24.614303588867188, -5.36749267578125, 13.879316329956055, 33.12612533569336, 52.37293243408203, 71.61974334716797, 90.8665542602539, 110.11335754394531, 129.36016845703125, 148.6069793701172, 167.85379028320312, 187.10060119628906, 206.347412109375, 225.59420776367188, 244.84103393554688, 264.08782958984375, 283.33465576171875, 302.5814514160156, 321.8282470703125, 341.0750732421875, 360.3218688964844, 379.5686950683594, 398.81549072265625, 418.06231689453125, 437.3091125488281, 456.555908203125, 475.8027038574219, 495.0495300292969, 514.2963256835938, 533.5431518554688, 552.7899780273438, 572.0367431640625, 591.2835693359375, 610.5303955078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 16.0, 12.0, 16.0, 27.0, 31.0, 35.0, 61.0, 127.0, 247.0, 494.0, 1273.0, 3488.0, 13045.0, 183165.0, 3873333.0, 102921.0, 10835.0, 3048.0, 1105.0, 462.0, 213.0, 104.0, 59.0, 21.0, 37.0, 18.0, 11.0, 9.0, 11.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-122.125, -118.2392578125, -114.353515625, -110.4677734375, -106.58203125, -102.6962890625, -98.810546875, -94.9248046875, -91.0390625, -87.1533203125, -83.267578125, -79.3818359375, -75.49609375, -71.6103515625, -67.724609375, -63.8388671875, -59.953125, -56.0673828125, -52.181640625, -48.2958984375, -44.41015625, -40.5244140625, -36.638671875, -32.7529296875, -28.8671875, -24.9814453125, -21.095703125, -17.2099609375, -13.32421875, -9.4384765625, -5.552734375, -1.6669921875, 2.21875, 6.1044921875, 9.990234375, 13.8759765625, 17.76171875, 21.6474609375, 25.533203125, 29.4189453125, 33.3046875, 37.1904296875, 41.076171875, 44.9619140625, 48.84765625, 52.7333984375, 56.619140625, 60.5048828125, 64.390625, 68.2763671875, 72.162109375, 76.0478515625, 79.93359375, 83.8193359375, 87.705078125, 91.5908203125, 95.4765625, 99.3623046875, 103.248046875, 107.1337890625, 111.01953125, 114.9052734375, 118.791015625, 122.6767578125, 126.5625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 6.0, 13.0, 8.0, 9.0, 9.0, 19.0, 15.0, 21.0, 16.0, 29.0, 40.0, 37.0, 40.0, 55.0, 47.0, 44.0, 73.0, 69.0, 63.0, 42.0, 56.0, 55.0, 45.0, 27.0, 25.0, 24.0, 12.0, 18.0, 20.0, 15.0, 10.0, 10.0, 4.0, 12.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-38.15625, -36.99853515625, -35.8408203125, -34.68310546875, -33.525390625, -32.36767578125, -31.2099609375, -30.05224609375, -28.89453125, -27.73681640625, -26.5791015625, -25.42138671875, -24.263671875, -23.10595703125, -21.9482421875, -20.79052734375, -19.6328125, -18.47509765625, -17.3173828125, -16.15966796875, -15.001953125, -13.84423828125, -12.6865234375, -11.52880859375, -10.37109375, -9.21337890625, -8.0556640625, -6.89794921875, -5.740234375, -4.58251953125, -3.4248046875, -2.26708984375, -1.109375, 0.04833984375, 1.2060546875, 2.36376953125, 3.521484375, 4.67919921875, 5.8369140625, 6.99462890625, 8.15234375, 9.31005859375, 10.4677734375, 11.62548828125, 12.783203125, 13.94091796875, 15.0986328125, 16.25634765625, 17.4140625, 18.57177734375, 19.7294921875, 20.88720703125, 22.044921875, 23.20263671875, 24.3603515625, 25.51806640625, 26.67578125, 27.83349609375, 28.9912109375, 30.14892578125, 31.306640625, 32.46435546875, 33.6220703125, 34.77978515625, 35.9375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 6.0, 15.0, 27.0, 30.0, 49.0, 86.0, 122.0, 233.0, 298.0, 488.0, 780.0, 1290.0, 2312.0, 4807.0, 11148.0, 31970.0, 148658.0, 2966738.0, 910060.0, 77751.0, 21124.0, 7936.0, 3680.0, 1825.0, 1062.0, 615.0, 399.0, 237.0, 162.0, 118.0, 64.0, 54.0, 38.0, 30.0, 13.0, 11.0, 9.0, 2.0, 8.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.75, -80.1494140625, -77.548828125, -74.9482421875, -72.34765625, -69.7470703125, -67.146484375, -64.5458984375, -61.9453125, -59.3447265625, -56.744140625, -54.1435546875, -51.54296875, -48.9423828125, -46.341796875, -43.7412109375, -41.140625, -38.5400390625, -35.939453125, -33.3388671875, -30.73828125, -28.1376953125, -25.537109375, -22.9365234375, -20.3359375, -17.7353515625, -15.134765625, -12.5341796875, -9.93359375, -7.3330078125, -4.732421875, -2.1318359375, 0.46875, 3.0693359375, 5.669921875, 8.2705078125, 10.87109375, 13.4716796875, 16.072265625, 18.6728515625, 21.2734375, 23.8740234375, 26.474609375, 29.0751953125, 31.67578125, 34.2763671875, 36.876953125, 39.4775390625, 42.078125, 44.6787109375, 47.279296875, 49.8798828125, 52.48046875, 55.0810546875, 57.681640625, 60.2822265625, 62.8828125, 65.4833984375, 68.083984375, 70.6845703125, 73.28515625, 75.8857421875, 78.486328125, 81.0869140625, 83.6875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 4.0, 11.0, 21.0, 22.0, 23.0, 59.0, 82.0, 155.0, 335.0, 823.0, 1243.0, 640.0, 276.0, 137.0, 81.0, 44.0, 24.0, 26.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.6875, -102.2119140625, -98.736328125, -95.2607421875, -91.78515625, -88.3095703125, -84.833984375, -81.3583984375, -77.8828125, -74.4072265625, -70.931640625, -67.4560546875, -63.98046875, -60.5048828125, -57.029296875, -53.5537109375, -50.078125, -46.6025390625, -43.126953125, -39.6513671875, -36.17578125, -32.7001953125, -29.224609375, -25.7490234375, -22.2734375, -18.7978515625, -15.322265625, -11.8466796875, -8.37109375, -4.8955078125, -1.419921875, 2.0556640625, 5.53125, 9.0068359375, 12.482421875, 15.9580078125, 19.43359375, 22.9091796875, 26.384765625, 29.8603515625, 33.3359375, 36.8115234375, 40.287109375, 43.7626953125, 47.23828125, 50.7138671875, 54.189453125, 57.6650390625, 61.140625, 64.6162109375, 68.091796875, 71.5673828125, 75.04296875, 78.5185546875, 81.994140625, 85.4697265625, 88.9453125, 92.4208984375, 95.896484375, 99.3720703125, 102.84765625, 106.3232421875, 109.798828125, 113.2744140625, 116.75]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 19.0, 10.0, 50.0, 68.0, 102.0, 115.0, 147.0, 147.0, 109.0, 66.0, 49.0, 31.0, 20.0, 9.0, 10.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-392.81005859375, -373.8019104003906, -354.7937316894531, -335.78558349609375, -316.77740478515625, -297.7692565917969, -278.7611083984375, -259.7529296875, -240.74478149414062, -221.7366180419922, -202.72845458984375, -183.72030639648438, -164.71214294433594, -145.7039794921875, -126.6958236694336, -107.68766784667969, -88.67950439453125, -69.67134094238281, -50.663185119628906, -31.655025482177734, -12.646865844726562, 6.361297607421875, 25.36945343017578, 44.37760925292969, 63.385772705078125, 82.39393615722656, 101.40209197998047, 120.41024780273438, 139.4184112548828, 158.42657470703125, 177.43472290039062, 196.44288635253906, 215.45111083984375, 234.4592742919922, 253.46743774414062, 272.4755859375, 291.4837646484375, 310.4919128417969, 329.50006103515625, 348.50823974609375, 367.5163879394531, 386.5245361328125, 405.53271484375, 424.5408630371094, 443.54901123046875, 462.55718994140625, 481.5653381347656, 500.573486328125, 519.5816650390625, 538.58984375, 557.5979614257812, 576.6061401367188, 595.6143188476562, 614.6224365234375, 633.630615234375, 652.6387939453125, 671.64697265625, 690.6551513671875, 709.6632690429688, 728.6714477539062, 747.6796264648438, 766.687744140625, 785.6959228515625, 804.7041015625, 823.7122192382812]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 11.0, 17.0, 17.0, 22.0, 29.0, 13.0, 31.0, 30.0, 30.0, 38.0, 44.0, 41.0, 46.0, 36.0, 51.0, 42.0, 44.0, 49.0, 33.0, 52.0, 36.0, 39.0, 32.0, 25.0, 20.0, 26.0, 21.0, 20.0, 14.0, 13.0, 12.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-320.2158508300781, -309.3950500488281, -298.57427978515625, -287.75347900390625, -276.93267822265625, -266.11187744140625, -255.2910919189453, -244.47030639648438, -233.64950561523438, -222.82870483398438, -212.00791931152344, -201.1871337890625, -190.3663330078125, -179.5455322265625, -168.72474670410156, -157.90396118164062, -147.08316040039062, -136.26235961914062, -125.44157409667969, -114.62078094482422, -103.79998779296875, -92.97919464111328, -82.15840148925781, -71.33760833740234, -60.516815185546875, -49.696022033691406, -38.87522888183594, -28.05443572998047, -17.233642578125, -6.412849426269531, 4.4079437255859375, 15.228736877441406, 26.049560546875, 36.87035369873047, 47.69114685058594, 58.511940002441406, 69.33273315429688, 80.15352630615234, 90.97431945800781, 101.79511260986328, 112.61590576171875, 123.43669891357422, 134.2574920654297, 145.07827758789062, 155.89907836914062, 166.71987915039062, 177.54066467285156, 188.3614501953125, 199.1822509765625, 210.0030517578125, 220.82383728027344, 231.64462280273438, 242.46542358398438, 253.28622436523438, 264.10699462890625, 274.92779541015625, 285.74859619140625, 296.56939697265625, 307.39019775390625, 318.2109680175781, 329.0317687988281, 339.8525695800781, 350.67333984375, 361.494140625, 372.31494140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 18.0, 9.0, 16.0, 18.0, 37.0, 39.0, 69.0, 111.0, 158.0, 223.0, 382.0, 528.0, 934.0, 1588.0, 2943.0, 5377.0, 11101.0, 25030.0, 63904.0, 186270.0, 446536.0, 189974.0, 64009.0, 25402.0, 11251.0, 5460.0, 2900.0, 1689.0, 941.0, 571.0, 337.0, 238.0, 121.0, 102.0, 68.0, 53.0, 24.0, 35.0, 15.0, 17.0, 10.0, 4.0, 9.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-70.1875, -68.0283203125, -65.869140625, -63.7099609375, -61.55078125, -59.3916015625, -57.232421875, -55.0732421875, -52.9140625, -50.7548828125, -48.595703125, -46.4365234375, -44.27734375, -42.1181640625, -39.958984375, -37.7998046875, -35.640625, -33.4814453125, -31.322265625, -29.1630859375, -27.00390625, -24.8447265625, -22.685546875, -20.5263671875, -18.3671875, -16.2080078125, -14.048828125, -11.8896484375, -9.73046875, -7.5712890625, -5.412109375, -3.2529296875, -1.09375, 1.0654296875, 3.224609375, 5.3837890625, 7.54296875, 9.7021484375, 11.861328125, 14.0205078125, 16.1796875, 18.3388671875, 20.498046875, 22.6572265625, 24.81640625, 26.9755859375, 29.134765625, 31.2939453125, 33.453125, 35.6123046875, 37.771484375, 39.9306640625, 42.08984375, 44.2490234375, 46.408203125, 48.5673828125, 50.7265625, 52.8857421875, 55.044921875, 57.2041015625, 59.36328125, 61.5224609375, 63.681640625, 65.8408203125, 68.0]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 9.0, 14.0, 16.0, 12.0, 12.0, 19.0, 16.0, 25.0, 29.0, 24.0, 34.0, 34.0, 37.0, 37.0, 37.0, 52.0, 39.0, 50.0, 57.0, 39.0, 52.0, 47.0, 48.0, 40.0, 24.0, 34.0, 21.0, 25.0, 12.0, 25.0, 9.0, 13.0, 15.0, 9.0, 4.0, 4.0, 6.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.542236328125, -29.47509765625, -28.407958984375, -27.3408203125, -26.273681640625, -25.20654296875, -24.139404296875, -23.072265625, -22.005126953125, -20.93798828125, -19.870849609375, -18.8037109375, -17.736572265625, -16.66943359375, -15.602294921875, -14.53515625, -13.468017578125, -12.40087890625, -11.333740234375, -10.2666015625, -9.199462890625, -8.13232421875, -7.065185546875, -5.998046875, -4.930908203125, -3.86376953125, -2.796630859375, -1.7294921875, -0.662353515625, 0.40478515625, 1.471923828125, 2.5390625, 3.606201171875, 4.67333984375, 5.740478515625, 6.8076171875, 7.874755859375, 8.94189453125, 10.009033203125, 11.076171875, 12.143310546875, 13.21044921875, 14.277587890625, 15.3447265625, 16.411865234375, 17.47900390625, 18.546142578125, 19.61328125, 20.680419921875, 21.74755859375, 22.814697265625, 23.8818359375, 24.948974609375, 26.01611328125, 27.083251953125, 28.150390625, 29.217529296875, 30.28466796875, 31.351806640625, 32.4189453125, 33.486083984375, 34.55322265625, 35.620361328125, 36.6875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 16.0, 17.0, 21.0, 30.0, 54.0, 79.0, 112.0, 196.0, 361.0, 715.0, 1601.0, 4388.0, 16287.0, 90939.0, 754227.0, 147165.0, 22667.0, 5823.0, 2027.0, 840.0, 400.0, 208.0, 137.0, 76.0, 44.0, 29.0, 26.0, 7.0, 17.0, 13.0, 3.0, 9.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.25, -134.3828125, -129.515625, -124.6484375, -119.78125, -114.9140625, -110.046875, -105.1796875, -100.3125, -95.4453125, -90.578125, -85.7109375, -80.84375, -75.9765625, -71.109375, -66.2421875, -61.375, -56.5078125, -51.640625, -46.7734375, -41.90625, -37.0390625, -32.171875, -27.3046875, -22.4375, -17.5703125, -12.703125, -7.8359375, -2.96875, 1.8984375, 6.765625, 11.6328125, 16.5, 21.3671875, 26.234375, 31.1015625, 35.96875, 40.8359375, 45.703125, 50.5703125, 55.4375, 60.3046875, 65.171875, 70.0390625, 74.90625, 79.7734375, 84.640625, 89.5078125, 94.375, 99.2421875, 104.109375, 108.9765625, 113.84375, 118.7109375, 123.578125, 128.4453125, 133.3125, 138.1796875, 143.046875, 147.9140625, 152.78125, 157.6484375, 162.515625, 167.3828125, 172.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 9.0, 11.0, 14.0, 15.0, 25.0, 20.0, 34.0, 30.0, 52.0, 48.0, 43.0, 38.0, 43.0, 48.0, 52.0, 57.0, 63.0, 50.0, 42.0, 44.0, 45.0, 33.0, 28.0, 24.0, 23.0, 18.0, 12.0, 12.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.25, -158.201171875, -153.15234375, -148.103515625, -143.0546875, -138.005859375, -132.95703125, -127.908203125, -122.859375, -117.810546875, -112.76171875, -107.712890625, -102.6640625, -97.615234375, -92.56640625, -87.517578125, -82.46875, -77.419921875, -72.37109375, -67.322265625, -62.2734375, -57.224609375, -52.17578125, -47.126953125, -42.078125, -37.029296875, -31.98046875, -26.931640625, -21.8828125, -16.833984375, -11.78515625, -6.736328125, -1.6875, 3.361328125, 8.41015625, 13.458984375, 18.5078125, 23.556640625, 28.60546875, 33.654296875, 38.703125, 43.751953125, 48.80078125, 53.849609375, 58.8984375, 63.947265625, 68.99609375, 74.044921875, 79.09375, 84.142578125, 89.19140625, 94.240234375, 99.2890625, 104.337890625, 109.38671875, 114.435546875, 119.484375, 124.533203125, 129.58203125, 134.630859375, 139.6796875, 144.728515625, 149.77734375, 154.826171875, 159.875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 11.0, 16.0, 24.0, 28.0, 58.0, 75.0, 122.0, 223.0, 394.0, 691.0, 1554.0, 3915.0, 12000.0, 61114.0, 719539.0, 211415.0, 25690.0, 6857.0, 2371.0, 1126.0, 533.0, 334.0, 172.0, 110.0, 57.0, 32.0, 20.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-79.875, -77.5771484375, -75.279296875, -72.9814453125, -70.68359375, -68.3857421875, -66.087890625, -63.7900390625, -61.4921875, -59.1943359375, -56.896484375, -54.5986328125, -52.30078125, -50.0029296875, -47.705078125, -45.4072265625, -43.109375, -40.8115234375, -38.513671875, -36.2158203125, -33.91796875, -31.6201171875, -29.322265625, -27.0244140625, -24.7265625, -22.4287109375, -20.130859375, -17.8330078125, -15.53515625, -13.2373046875, -10.939453125, -8.6416015625, -6.34375, -4.0458984375, -1.748046875, 0.5498046875, 2.84765625, 5.1455078125, 7.443359375, 9.7412109375, 12.0390625, 14.3369140625, 16.634765625, 18.9326171875, 21.23046875, 23.5283203125, 25.826171875, 28.1240234375, 30.421875, 32.7197265625, 35.017578125, 37.3154296875, 39.61328125, 41.9111328125, 44.208984375, 46.5068359375, 48.8046875, 51.1025390625, 53.400390625, 55.6982421875, 57.99609375, 60.2939453125, 62.591796875, 64.8896484375, 67.1875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 13.0, 24.0, 50.0, 91.0, 247.0, 291.0, 128.0, 50.0, 31.0, 17.0, 15.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.054443359375, -0.053238868713378906, -0.05203437805175781, -0.05082988739013672, -0.049625396728515625, -0.04842090606689453, -0.04721641540527344, -0.046011924743652344, -0.04480743408203125, -0.043602943420410156, -0.04239845275878906, -0.04119396209716797, -0.039989471435546875, -0.03878498077392578, -0.03758049011230469, -0.036375999450683594, -0.0351715087890625, -0.033967018127441406, -0.03276252746582031, -0.03155803680419922, -0.030353546142578125, -0.02914905548095703, -0.027944564819335938, -0.026740074157714844, -0.02553558349609375, -0.024331092834472656, -0.023126602172851562, -0.02192211151123047, -0.020717620849609375, -0.01951313018798828, -0.018308639526367188, -0.017104148864746094, -0.015899658203125, -0.014695167541503906, -0.013490676879882812, -0.012286186218261719, -0.011081695556640625, -0.009877204895019531, -0.008672714233398438, -0.007468223571777344, -0.00626373291015625, -0.005059242248535156, -0.0038547515869140625, -0.0026502609252929688, -0.001445770263671875, -0.00024127960205078125, 0.0009632110595703125, 0.0021677017211914062, 0.0033721923828125, 0.004576683044433594, 0.0057811737060546875, 0.006985664367675781, 0.008190155029296875, 0.009394645690917969, 0.010599136352539062, 0.011803627014160156, 0.01300811767578125, 0.014212608337402344, 0.015417098999023438, 0.01662158966064453, 0.017826080322265625, 0.01903057098388672, 0.020235061645507812, 0.021439552307128906, 0.02264404296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 15.0, 24.0, 22.0, 41.0, 78.0, 107.0, 172.0, 365.0, 668.0, 1350.0, 3169.0, 8856.0, 35408.0, 241637.0, 650614.0, 80703.0, 16169.0, 5056.0, 2012.0, 971.0, 439.0, 253.0, 154.0, 74.0, 54.0, 28.0, 18.0, 20.0, 18.0, 11.0, 4.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.25, -50.52197265625, -48.7939453125, -47.06591796875, -45.337890625, -43.60986328125, -41.8818359375, -40.15380859375, -38.42578125, -36.69775390625, -34.9697265625, -33.24169921875, -31.513671875, -29.78564453125, -28.0576171875, -26.32958984375, -24.6015625, -22.87353515625, -21.1455078125, -19.41748046875, -17.689453125, -15.96142578125, -14.2333984375, -12.50537109375, -10.77734375, -9.04931640625, -7.3212890625, -5.59326171875, -3.865234375, -2.13720703125, -0.4091796875, 1.31884765625, 3.046875, 4.77490234375, 6.5029296875, 8.23095703125, 9.958984375, 11.68701171875, 13.4150390625, 15.14306640625, 16.87109375, 18.59912109375, 20.3271484375, 22.05517578125, 23.783203125, 25.51123046875, 27.2392578125, 28.96728515625, 30.6953125, 32.42333984375, 34.1513671875, 35.87939453125, 37.607421875, 39.33544921875, 41.0634765625, 42.79150390625, 44.51953125, 46.24755859375, 47.9755859375, 49.70361328125, 51.431640625, 53.15966796875, 54.8876953125, 56.61572265625, 58.34375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 11.0, 17.0, 13.0, 32.0, 48.0, 43.0, 79.0, 65.0, 98.0, 108.0, 92.0, 91.0, 67.0, 66.0, 36.0, 25.0, 17.0, 15.0, 20.0, 9.0, 3.0, 9.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-62.0625, -60.15234375, -58.2421875, -56.33203125, -54.421875, -52.51171875, -50.6015625, -48.69140625, -46.78125, -44.87109375, -42.9609375, -41.05078125, -39.140625, -37.23046875, -35.3203125, -33.41015625, -31.5, -29.58984375, -27.6796875, -25.76953125, -23.859375, -21.94921875, -20.0390625, -18.12890625, -16.21875, -14.30859375, -12.3984375, -10.48828125, -8.578125, -6.66796875, -4.7578125, -2.84765625, -0.9375, 0.97265625, 2.8828125, 4.79296875, 6.703125, 8.61328125, 10.5234375, 12.43359375, 14.34375, 16.25390625, 18.1640625, 20.07421875, 21.984375, 23.89453125, 25.8046875, 27.71484375, 29.625, 31.53515625, 33.4453125, 35.35546875, 37.265625, 39.17578125, 41.0859375, 42.99609375, 44.90625, 46.81640625, 48.7265625, 50.63671875, 52.546875, 54.45703125, 56.3671875, 58.27734375, 60.1875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 21.0, 64.0, 191.0, 314.0, 216.0, 108.0, 40.0, 19.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1606.042724609375, -1551.7738037109375, -1497.5048828125, -1443.2359619140625, -1388.967041015625, -1334.6981201171875, -1280.42919921875, -1226.1602783203125, -1171.891357421875, -1117.6224365234375, -1063.353515625, -1009.0845947265625, -954.815673828125, -900.5467529296875, -846.27783203125, -792.0089111328125, -737.739990234375, -683.4710693359375, -629.2021484375, -574.9332275390625, -520.664306640625, -466.3953857421875, -412.12646484375, -357.8575439453125, -303.588623046875, -249.3197021484375, -195.05078125, -140.7818603515625, -86.512939453125, -32.2440185546875, 22.02490234375, 76.2938232421875, 130.5628662109375, 184.831787109375, 239.1007080078125, 293.36962890625, 347.6385498046875, 401.907470703125, 456.1763916015625, 510.4453125, 564.7142333984375, 618.983154296875, 673.2520751953125, 727.52099609375, 781.7899169921875, 836.058837890625, 890.3277587890625, 944.5966796875, 998.8656005859375, 1053.134521484375, 1107.4034423828125, 1161.67236328125, 1215.9412841796875, 1270.210205078125, 1324.4791259765625, 1378.748046875, 1433.0169677734375, 1487.285888671875, 1541.5548095703125, 1595.82373046875, 1650.0926513671875, 1704.361572265625, 1758.6304931640625, 1812.8994140625, 1867.1683349609375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 11.0, 7.0, 6.0, 15.0, 10.0, 17.0, 13.0, 20.0, 22.0, 31.0, 20.0, 29.0, 38.0, 27.0, 42.0, 42.0, 37.0, 41.0, 59.0, 52.0, 49.0, 32.0, 39.0, 39.0, 38.0, 34.0, 29.0, 21.0, 31.0, 20.0, 16.0, 18.0, 15.0, 12.0, 20.0, 8.0, 8.0, 11.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-614.193115234375, -596.7333374023438, -579.2735595703125, -561.8137817382812, -544.35400390625, -526.8941650390625, -509.43438720703125, -491.974609375, -474.51483154296875, -457.0550537109375, -439.59527587890625, -422.1354675292969, -404.6756896972656, -387.2159118652344, -369.756103515625, -352.29632568359375, -334.8365478515625, -317.37677001953125, -299.9169921875, -282.4571838378906, -264.9974060058594, -247.53762817382812, -230.0778350830078, -212.6180419921875, -195.15826416015625, -177.698486328125, -160.2386932373047, -142.77890014648438, -125.31912231445312, -107.85933685302734, -90.39955139160156, -72.93976593017578, -55.47998046875, -38.02019500732422, -20.560409545898438, -3.1006240844726562, 14.359161376953125, 31.818946838378906, 49.27873229980469, 66.73851776123047, 84.19830322265625, 101.65808868408203, 119.11787414550781, 136.57766723632812, 154.03744506835938, 171.49722290039062, 188.95701599121094, 206.41680908203125, 223.8765869140625, 241.33636474609375, 258.796142578125, 276.2559509277344, 293.7157287597656, 311.1755065917969, 328.63531494140625, 346.0950927734375, 363.55487060546875, 381.0146484375, 398.47442626953125, 415.9342346191406, 433.3940124511719, 450.8537902832031, 468.3135986328125, 485.77337646484375, 503.233154296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 7.0, 9.0, 6.0, 7.0, 19.0, 21.0, 25.0, 44.0, 60.0, 80.0, 107.0, 156.0, 262.0, 406.0, 633.0, 1064.0, 1674.0, 3061.0, 5722.0, 11498.0, 26539.0, 83376.0, 341821.0, 1637369.0, 1615702.0, 337040.0, 79085.0, 25243.0, 10819.0, 5333.0, 2781.0, 1573.0, 938.0, 618.0, 404.0, 215.0, 151.0, 105.0, 82.0, 65.0, 47.0, 36.0, 18.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 1.0], "bins": [-42.125, -40.80810546875, -39.4912109375, -38.17431640625, -36.857421875, -35.54052734375, -34.2236328125, -32.90673828125, -31.58984375, -30.27294921875, -28.9560546875, -27.63916015625, -26.322265625, -25.00537109375, -23.6884765625, -22.37158203125, -21.0546875, -19.73779296875, -18.4208984375, -17.10400390625, -15.787109375, -14.47021484375, -13.1533203125, -11.83642578125, -10.51953125, -9.20263671875, -7.8857421875, -6.56884765625, -5.251953125, -3.93505859375, -2.6181640625, -1.30126953125, 0.015625, 1.33251953125, 2.6494140625, 3.96630859375, 5.283203125, 6.60009765625, 7.9169921875, 9.23388671875, 10.55078125, 11.86767578125, 13.1845703125, 14.50146484375, 15.818359375, 17.13525390625, 18.4521484375, 19.76904296875, 21.0859375, 22.40283203125, 23.7197265625, 25.03662109375, 26.353515625, 27.67041015625, 28.9873046875, 30.30419921875, 31.62109375, 32.93798828125, 34.2548828125, 35.57177734375, 36.888671875, 38.20556640625, 39.5224609375, 40.83935546875, 42.15625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 3.0, 6.0, 6.0, 12.0, 18.0, 20.0, 15.0, 26.0, 18.0, 39.0, 22.0, 31.0, 38.0, 32.0, 64.0, 44.0, 45.0, 59.0, 60.0, 44.0, 49.0, 48.0, 50.0, 36.0, 38.0, 25.0, 20.0, 23.0, 13.0, 15.0, 16.0, 17.0, 8.0, 10.0, 7.0, 4.0, 3.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.859375, -26.784912109375, -25.71044921875, -24.635986328125, -23.5615234375, -22.487060546875, -21.41259765625, -20.338134765625, -19.263671875, -18.189208984375, -17.11474609375, -16.040283203125, -14.9658203125, -13.891357421875, -12.81689453125, -11.742431640625, -10.66796875, -9.593505859375, -8.51904296875, -7.444580078125, -6.3701171875, -5.295654296875, -4.22119140625, -3.146728515625, -2.072265625, -0.997802734375, 0.07666015625, 1.151123046875, 2.2255859375, 3.300048828125, 4.37451171875, 5.448974609375, 6.5234375, 7.597900390625, 8.67236328125, 9.746826171875, 10.8212890625, 11.895751953125, 12.97021484375, 14.044677734375, 15.119140625, 16.193603515625, 17.26806640625, 18.342529296875, 19.4169921875, 20.491455078125, 21.56591796875, 22.640380859375, 23.71484375, 24.789306640625, 25.86376953125, 26.938232421875, 28.0126953125, 29.087158203125, 30.16162109375, 31.236083984375, 32.310546875, 33.385009765625, 34.45947265625, 35.533935546875, 36.6083984375, 37.682861328125, 38.75732421875, 39.831787109375, 40.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 9.0, 18.0, 31.0, 29.0, 72.0, 75.0, 119.0, 190.0, 308.0, 521.0, 940.0, 1683.0, 3561.0, 8626.0, 26466.0, 109246.0, 1789763.0, 2092117.0, 118253.0, 26661.0, 8451.0, 3434.0, 1606.0, 804.0, 471.0, 279.0, 157.0, 124.0, 85.0, 39.0, 46.0, 19.0, 15.0, 10.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-102.9375, -99.72265625, -96.5078125, -93.29296875, -90.078125, -86.86328125, -83.6484375, -80.43359375, -77.21875, -74.00390625, -70.7890625, -67.57421875, -64.359375, -61.14453125, -57.9296875, -54.71484375, -51.5, -48.28515625, -45.0703125, -41.85546875, -38.640625, -35.42578125, -32.2109375, -28.99609375, -25.78125, -22.56640625, -19.3515625, -16.13671875, -12.921875, -9.70703125, -6.4921875, -3.27734375, -0.0625, 3.15234375, 6.3671875, 9.58203125, 12.796875, 16.01171875, 19.2265625, 22.44140625, 25.65625, 28.87109375, 32.0859375, 35.30078125, 38.515625, 41.73046875, 44.9453125, 48.16015625, 51.375, 54.58984375, 57.8046875, 61.01953125, 64.234375, 67.44921875, 70.6640625, 73.87890625, 77.09375, 80.30859375, 83.5234375, 86.73828125, 89.953125, 93.16796875, 96.3828125, 99.59765625, 102.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 11.0, 9.0, 21.0, 28.0, 31.0, 53.0, 72.0, 75.0, 164.0, 383.0, 800.0, 1065.0, 599.0, 291.0, 159.0, 89.0, 74.0, 38.0, 25.0, 19.0, 16.0, 6.0, 8.0, 11.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-142.5, -138.08984375, -133.6796875, -129.26953125, -124.859375, -120.44921875, -116.0390625, -111.62890625, -107.21875, -102.80859375, -98.3984375, -93.98828125, -89.578125, -85.16796875, -80.7578125, -76.34765625, -71.9375, -67.52734375, -63.1171875, -58.70703125, -54.296875, -49.88671875, -45.4765625, -41.06640625, -36.65625, -32.24609375, -27.8359375, -23.42578125, -19.015625, -14.60546875, -10.1953125, -5.78515625, -1.375, 3.03515625, 7.4453125, 11.85546875, 16.265625, 20.67578125, 25.0859375, 29.49609375, 33.90625, 38.31640625, 42.7265625, 47.13671875, 51.546875, 55.95703125, 60.3671875, 64.77734375, 69.1875, 73.59765625, 78.0078125, 82.41796875, 86.828125, 91.23828125, 95.6484375, 100.05859375, 104.46875, 108.87890625, 113.2890625, 117.69921875, 122.109375, 126.51953125, 130.9296875, 135.33984375, 139.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 14.0, 14.0, 30.0, 91.0, 173.0, 246.0, 216.0, 128.0, 40.0, 26.0, 10.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2329.535888671875, -2277.539794921875, -2225.54345703125, -2173.54736328125, -2121.55126953125, -2069.554931640625, -2017.558837890625, -1965.5626220703125, -1913.56640625, -1861.5701904296875, -1809.5740966796875, -1757.577880859375, -1705.5816650390625, -1653.58544921875, -1601.58935546875, -1549.5931396484375, -1497.5970458984375, -1445.600830078125, -1393.604736328125, -1341.6085205078125, -1289.6123046875, -1237.6162109375, -1185.6199951171875, -1133.623779296875, -1081.627685546875, -1029.6314697265625, -977.6353149414062, -925.63916015625, -873.6429443359375, -821.6467895507812, -769.650634765625, -717.6544189453125, -665.6580810546875, -613.6619262695312, -561.6657104492188, -509.6695556640625, -457.6733703613281, -405.67718505859375, -353.6810302734375, -301.6848449707031, -249.68865966796875, -197.69247436523438, -145.69630432128906, -93.70013427734375, -41.703948974609375, 10.292236328125, 62.28839111328125, 114.28457641601562, 166.28076171875, 218.27694702148438, 270.27313232421875, 322.269287109375, 374.2654724121094, 426.26165771484375, 478.2578125, 530.2540283203125, 582.2501831054688, 634.246337890625, 686.2425537109375, 738.2387084960938, 790.23486328125, 842.2310791015625, 894.2272338867188, 946.223388671875, 998.2196044921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 9.0, 7.0, 6.0, 15.0, 20.0, 30.0, 23.0, 26.0, 31.0, 33.0, 34.0, 44.0, 41.0, 62.0, 55.0, 64.0, 39.0, 57.0, 31.0, 52.0, 34.0, 33.0, 41.0, 29.0, 32.0, 23.0, 22.0, 22.0, 17.0, 14.0, 5.0, 12.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-600.299560546875, -582.5486450195312, -564.7977294921875, -547.0468139648438, -529.2958984375, -511.54498291015625, -493.7940673828125, -476.04315185546875, -458.292236328125, -440.54132080078125, -422.7904052734375, -405.03948974609375, -387.28857421875, -369.53765869140625, -351.7867431640625, -334.03582763671875, -316.2848815917969, -298.5339660644531, -280.7830505371094, -263.0321350097656, -245.28121948242188, -227.53030395507812, -209.7793731689453, -192.02845764160156, -174.2775421142578, -156.52662658691406, -138.7757110595703, -121.02478790283203, -103.27387237548828, -85.52295684814453, -67.77203369140625, -50.0211181640625, -32.27020263671875, -14.519285202026367, 3.2316322326660156, 20.98255157470703, 38.73346710205078, 56.48438262939453, 74.23530578613281, 91.98622131347656, 109.73713684082031, 127.48805236816406, 145.2389678955078, 162.98989868164062, 180.74081420898438, 198.49172973632812, 216.24264526367188, 233.99356079101562, 251.74447631835938, 269.4953918457031, 287.2463073730469, 304.9972229003906, 322.7481384277344, 340.4990539550781, 358.25, 376.00091552734375, 393.7518310546875, 411.50274658203125, 429.253662109375, 447.00457763671875, 464.7554931640625, 482.50640869140625, 500.25732421875, 518.0082397460938, 535.7591552734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 12.0, 17.0, 14.0, 30.0, 49.0, 60.0, 92.0, 118.0, 166.0, 324.0, 546.0, 795.0, 1369.0, 2291.0, 3907.0, 6995.0, 12940.0, 25408.0, 50653.0, 106499.0, 238442.0, 313772.0, 145050.0, 67864.0, 33471.0, 16497.0, 9029.0, 5049.0, 2811.0, 1649.0, 953.0, 635.0, 332.0, 257.0, 139.0, 104.0, 54.0, 47.0, 36.0, 34.0, 12.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.875, -54.083984375, -52.29296875, -50.501953125, -48.7109375, -46.919921875, -45.12890625, -43.337890625, -41.546875, -39.755859375, -37.96484375, -36.173828125, -34.3828125, -32.591796875, -30.80078125, -29.009765625, -27.21875, -25.427734375, -23.63671875, -21.845703125, -20.0546875, -18.263671875, -16.47265625, -14.681640625, -12.890625, -11.099609375, -9.30859375, -7.517578125, -5.7265625, -3.935546875, -2.14453125, -0.353515625, 1.4375, 3.228515625, 5.01953125, 6.810546875, 8.6015625, 10.392578125, 12.18359375, 13.974609375, 15.765625, 17.556640625, 19.34765625, 21.138671875, 22.9296875, 24.720703125, 26.51171875, 28.302734375, 30.09375, 31.884765625, 33.67578125, 35.466796875, 37.2578125, 39.048828125, 40.83984375, 42.630859375, 44.421875, 46.212890625, 48.00390625, 49.794921875, 51.5859375, 53.376953125, 55.16796875, 56.958984375, 58.75]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 13.0, 11.0, 13.0, 15.0, 20.0, 28.0, 24.0, 34.0, 41.0, 42.0, 49.0, 57.0, 52.0, 54.0, 50.0, 50.0, 57.0, 44.0, 57.0, 39.0, 27.0, 35.0, 35.0, 28.0, 13.0, 24.0, 17.0, 11.0, 12.0, 11.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.5625, -47.31103515625, -46.0595703125, -44.80810546875, -43.556640625, -42.30517578125, -41.0537109375, -39.80224609375, -38.55078125, -37.29931640625, -36.0478515625, -34.79638671875, -33.544921875, -32.29345703125, -31.0419921875, -29.79052734375, -28.5390625, -27.28759765625, -26.0361328125, -24.78466796875, -23.533203125, -22.28173828125, -21.0302734375, -19.77880859375, -18.52734375, -17.27587890625, -16.0244140625, -14.77294921875, -13.521484375, -12.27001953125, -11.0185546875, -9.76708984375, -8.515625, -7.26416015625, -6.0126953125, -4.76123046875, -3.509765625, -2.25830078125, -1.0068359375, 0.24462890625, 1.49609375, 2.74755859375, 3.9990234375, 5.25048828125, 6.501953125, 7.75341796875, 9.0048828125, 10.25634765625, 11.5078125, 12.75927734375, 14.0107421875, 15.26220703125, 16.513671875, 17.76513671875, 19.0166015625, 20.26806640625, 21.51953125, 22.77099609375, 24.0224609375, 25.27392578125, 26.525390625, 27.77685546875, 29.0283203125, 30.27978515625, 31.53125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 13.0, 11.0, 13.0, 22.0, 52.0, 38.0, 64.0, 100.0, 165.0, 239.0, 413.0, 740.0, 1487.0, 3644.0, 12819.0, 96721.0, 809573.0, 102051.0, 13321.0, 3666.0, 1458.0, 720.0, 419.0, 281.0, 158.0, 108.0, 70.0, 57.0, 37.0, 18.0, 18.0, 20.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-254.75, -248.134765625, -241.51953125, -234.904296875, -228.2890625, -221.673828125, -215.05859375, -208.443359375, -201.828125, -195.212890625, -188.59765625, -181.982421875, -175.3671875, -168.751953125, -162.13671875, -155.521484375, -148.90625, -142.291015625, -135.67578125, -129.060546875, -122.4453125, -115.830078125, -109.21484375, -102.599609375, -95.984375, -89.369140625, -82.75390625, -76.138671875, -69.5234375, -62.908203125, -56.29296875, -49.677734375, -43.0625, -36.447265625, -29.83203125, -23.216796875, -16.6015625, -9.986328125, -3.37109375, 3.244140625, 9.859375, 16.474609375, 23.08984375, 29.705078125, 36.3203125, 42.935546875, 49.55078125, 56.166015625, 62.78125, 69.396484375, 76.01171875, 82.626953125, 89.2421875, 95.857421875, 102.47265625, 109.087890625, 115.703125, 122.318359375, 128.93359375, 135.548828125, 142.1640625, 148.779296875, 155.39453125, 162.009765625, 168.625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 4.0, 14.0, 16.0, 22.0, 24.0, 19.0, 24.0, 45.0, 40.0, 47.0, 46.0, 58.0, 65.0, 66.0, 56.0, 52.0, 61.0, 32.0, 42.0, 42.0, 32.0, 38.0, 27.0, 27.0, 21.0, 15.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-266.25, -259.634765625, -253.01953125, -246.404296875, -239.7890625, -233.173828125, -226.55859375, -219.943359375, -213.328125, -206.712890625, -200.09765625, -193.482421875, -186.8671875, -180.251953125, -173.63671875, -167.021484375, -160.40625, -153.791015625, -147.17578125, -140.560546875, -133.9453125, -127.330078125, -120.71484375, -114.099609375, -107.484375, -100.869140625, -94.25390625, -87.638671875, -81.0234375, -74.408203125, -67.79296875, -61.177734375, -54.5625, -47.947265625, -41.33203125, -34.716796875, -28.1015625, -21.486328125, -14.87109375, -8.255859375, -1.640625, 4.974609375, 11.58984375, 18.205078125, 24.8203125, 31.435546875, 38.05078125, 44.666015625, 51.28125, 57.896484375, 64.51171875, 71.126953125, 77.7421875, 84.357421875, 90.97265625, 97.587890625, 104.203125, 110.818359375, 117.43359375, 124.048828125, 130.6640625, 137.279296875, 143.89453125, 150.509765625, 157.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 12.0, 11.0, 22.0, 29.0, 34.0, 62.0, 103.0, 184.0, 314.0, 617.0, 1452.0, 3601.0, 10910.0, 43443.0, 256964.0, 628947.0, 75842.0, 17024.0, 5188.0, 1950.0, 816.0, 424.0, 218.0, 123.0, 87.0, 45.0, 49.0, 24.0, 11.0, 10.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -33.82177734375, -32.3623046875, -30.90283203125, -29.443359375, -27.98388671875, -26.5244140625, -25.06494140625, -23.60546875, -22.14599609375, -20.6865234375, -19.22705078125, -17.767578125, -16.30810546875, -14.8486328125, -13.38916015625, -11.9296875, -10.47021484375, -9.0107421875, -7.55126953125, -6.091796875, -4.63232421875, -3.1728515625, -1.71337890625, -0.25390625, 1.20556640625, 2.6650390625, 4.12451171875, 5.583984375, 7.04345703125, 8.5029296875, 9.96240234375, 11.421875, 12.88134765625, 14.3408203125, 15.80029296875, 17.259765625, 18.71923828125, 20.1787109375, 21.63818359375, 23.09765625, 24.55712890625, 26.0166015625, 27.47607421875, 28.935546875, 30.39501953125, 31.8544921875, 33.31396484375, 34.7734375, 36.23291015625, 37.6923828125, 39.15185546875, 40.611328125, 42.07080078125, 43.5302734375, 44.98974609375, 46.44921875, 47.90869140625, 49.3681640625, 50.82763671875, 52.287109375, 53.74658203125, 55.2060546875, 56.66552734375, 58.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 25.0, 24.0, 28.0, 33.0, 40.0, 57.0, 84.0, 91.0, 121.0, 98.0, 88.0, 57.0, 51.0, 32.0, 34.0, 18.0, 16.0, 15.0, 10.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017974853515625, -0.017531633377075195, -0.01708841323852539, -0.016645193099975586, -0.01620197296142578, -0.015758752822875977, -0.015315532684326172, -0.014872312545776367, -0.014429092407226562, -0.013985872268676758, -0.013542652130126953, -0.013099431991577148, -0.012656211853027344, -0.012212991714477539, -0.011769771575927734, -0.01132655143737793, -0.010883331298828125, -0.01044011116027832, -0.009996891021728516, -0.009553670883178711, -0.009110450744628906, -0.008667230606079102, -0.008224010467529297, -0.007780790328979492, -0.0073375701904296875, -0.006894350051879883, -0.006451129913330078, -0.0060079097747802734, -0.005564689636230469, -0.005121469497680664, -0.004678249359130859, -0.004235029220581055, -0.00379180908203125, -0.0033485889434814453, -0.0029053688049316406, -0.002462148666381836, -0.0020189285278320312, -0.0015757083892822266, -0.0011324882507324219, -0.0006892681121826172, -0.0002460479736328125, 0.0001971721649169922, 0.0006403923034667969, 0.0010836124420166016, 0.0015268325805664062, 0.001970052719116211, 0.0024132728576660156, 0.0028564929962158203, 0.003299713134765625, 0.0037429332733154297, 0.004186153411865234, 0.004629373550415039, 0.005072593688964844, 0.0055158138275146484, 0.005959033966064453, 0.006402254104614258, 0.0068454742431640625, 0.007288694381713867, 0.007731914520263672, 0.008175134658813477, 0.008618354797363281, 0.009061574935913086, 0.00950479507446289, 0.009948015213012695, 0.0103912353515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 10.0, 24.0, 27.0, 69.0, 77.0, 131.0, 208.0, 472.0, 994.0, 2513.0, 8960.0, 59805.0, 787034.0, 164473.0, 17237.0, 3867.0, 1355.0, 590.0, 291.0, 147.0, 82.0, 58.0, 34.0, 22.0, 17.0, 9.0, 10.0, 10.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.0625, -74.96240234375, -72.8623046875, -70.76220703125, -68.662109375, -66.56201171875, -64.4619140625, -62.36181640625, -60.26171875, -58.16162109375, -56.0615234375, -53.96142578125, -51.861328125, -49.76123046875, -47.6611328125, -45.56103515625, -43.4609375, -41.36083984375, -39.2607421875, -37.16064453125, -35.060546875, -32.96044921875, -30.8603515625, -28.76025390625, -26.66015625, -24.56005859375, -22.4599609375, -20.35986328125, -18.259765625, -16.15966796875, -14.0595703125, -11.95947265625, -9.859375, -7.75927734375, -5.6591796875, -3.55908203125, -1.458984375, 0.64111328125, 2.7412109375, 4.84130859375, 6.94140625, 9.04150390625, 11.1416015625, 13.24169921875, 15.341796875, 17.44189453125, 19.5419921875, 21.64208984375, 23.7421875, 25.84228515625, 27.9423828125, 30.04248046875, 32.142578125, 34.24267578125, 36.3427734375, 38.44287109375, 40.54296875, 42.64306640625, 44.7431640625, 46.84326171875, 48.943359375, 51.04345703125, 53.1435546875, 55.24365234375, 57.34375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 13.0, 9.0, 10.0, 16.0, 14.0, 21.0, 21.0, 29.0, 26.0, 39.0, 48.0, 43.0, 37.0, 54.0, 74.0, 76.0, 59.0, 58.0, 54.0, 36.0, 34.0, 30.0, 28.0, 19.0, 25.0, 19.0, 22.0, 5.0, 8.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.5625, -38.36669921875, -37.1708984375, -35.97509765625, -34.779296875, -33.58349609375, -32.3876953125, -31.19189453125, -29.99609375, -28.80029296875, -27.6044921875, -26.40869140625, -25.212890625, -24.01708984375, -22.8212890625, -21.62548828125, -20.4296875, -19.23388671875, -18.0380859375, -16.84228515625, -15.646484375, -14.45068359375, -13.2548828125, -12.05908203125, -10.86328125, -9.66748046875, -8.4716796875, -7.27587890625, -6.080078125, -4.88427734375, -3.6884765625, -2.49267578125, -1.296875, -0.10107421875, 1.0947265625, 2.29052734375, 3.486328125, 4.68212890625, 5.8779296875, 7.07373046875, 8.26953125, 9.46533203125, 10.6611328125, 11.85693359375, 13.052734375, 14.24853515625, 15.4443359375, 16.64013671875, 17.8359375, 19.03173828125, 20.2275390625, 21.42333984375, 22.619140625, 23.81494140625, 25.0107421875, 26.20654296875, 27.40234375, 28.59814453125, 29.7939453125, 30.98974609375, 32.185546875, 33.38134765625, 34.5771484375, 35.77294921875, 36.96875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 13.0, 39.0, 50.0, 150.0, 268.0, 217.0, 139.0, 64.0, 26.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-973.2877197265625, -928.6898803710938, -884.092041015625, -839.4942626953125, -794.8963623046875, -750.298583984375, -705.7007446289062, -661.1029052734375, -616.5050659179688, -571.9072265625, -527.3093872070312, -482.7115783691406, -438.1137390136719, -393.5158996582031, -348.9180908203125, -304.32025146484375, -259.722412109375, -215.12457275390625, -170.52674865722656, -125.92892456054688, -81.33108520507812, -36.733245849609375, 7.86456298828125, 52.46240234375, 97.06024169921875, 141.6580810546875, 186.2559051513672, 230.85372924804688, 275.4515686035156, 320.0494079589844, 364.647216796875, 409.24505615234375, 453.843017578125, 498.44085693359375, 543.0386962890625, 587.636474609375, 632.234375, 676.8321533203125, 721.4299926757812, 766.02783203125, 810.6256713867188, 855.2235107421875, 899.8213500976562, 944.419189453125, 989.0169677734375, 1033.6148681640625, 1078.212646484375, 1122.810546875, 1167.4083251953125, 1212.006103515625, 1256.60400390625, 1301.2017822265625, 1345.7996826171875, 1390.3974609375, 1434.995361328125, 1479.5931396484375, 1524.19091796875, 1568.7886962890625, 1613.3865966796875, 1657.984375, 1702.582275390625, 1747.1800537109375, 1791.77783203125, 1836.375732421875, 1880.9736328125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 7.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 11.0, 19.0, 14.0, 21.0, 25.0, 28.0, 32.0, 27.0, 26.0, 36.0, 35.0, 48.0, 67.0, 62.0, 69.0, 50.0, 43.0, 51.0, 36.0, 30.0, 26.0, 29.0, 18.0, 21.0, 23.0, 17.0, 15.0, 8.0, 20.0, 11.0, 6.0, 3.0, 3.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-561.072265625, -540.8294067382812, -520.5864868164062, -500.3436279296875, -480.1007385253906, -459.85784912109375, -439.614990234375, -419.3721008300781, -399.12921142578125, -378.8863220214844, -358.6434326171875, -338.40057373046875, -318.1576843261719, -297.914794921875, -277.67193603515625, -257.4290466308594, -237.1861572265625, -216.94326782226562, -196.7003936767578, -176.45751953125, -156.21463012695312, -135.97174072265625, -115.72886657714844, -95.48599243164062, -75.24310302734375, -55.000221252441406, -34.75733947753906, -14.514457702636719, 5.728424072265625, 25.97130584716797, 46.21418762207031, 66.45706176757812, 86.69989013671875, 106.9427719116211, 127.18565368652344, 147.42852783203125, 167.67141723632812, 187.914306640625, 208.1571807861328, 228.40005493164062, 248.6429443359375, 268.8858337402344, 289.12872314453125, 309.37158203125, 329.6144714355469, 349.85736083984375, 370.1002197265625, 390.3431091308594, 410.58599853515625, 430.8288879394531, 451.07177734375, 471.31463623046875, 491.5575256347656, 511.8004150390625, 532.0432739257812, 552.2861328125, 572.529052734375, 592.7719116210938, 613.0148315429688, 633.2576904296875, 653.5006103515625, 673.7434692382812, 693.986328125, 714.229248046875, 734.4721069335938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 21.0, 38.0, 53.0, 117.0, 191.0, 393.0, 774.0, 1571.0, 3257.0, 7061.0, 17521.0, 59584.0, 312803.0, 1805955.0, 1642431.0, 263033.0, 51539.0, 15667.0, 6471.0, 2728.0, 1406.0, 691.0, 403.0, 231.0, 124.0, 82.0, 41.0, 26.0, 20.0, 9.0, 11.0, 6.0, 6.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.15771484375, -29.5966796875, -28.03564453125, -26.474609375, -24.91357421875, -23.3525390625, -21.79150390625, -20.23046875, -18.66943359375, -17.1083984375, -15.54736328125, -13.986328125, -12.42529296875, -10.8642578125, -9.30322265625, -7.7421875, -6.18115234375, -4.6201171875, -3.05908203125, -1.498046875, 0.06298828125, 1.6240234375, 3.18505859375, 4.74609375, 6.30712890625, 7.8681640625, 9.42919921875, 10.990234375, 12.55126953125, 14.1123046875, 15.67333984375, 17.234375, 18.79541015625, 20.3564453125, 21.91748046875, 23.478515625, 25.03955078125, 26.6005859375, 28.16162109375, 29.72265625, 31.28369140625, 32.8447265625, 34.40576171875, 35.966796875, 37.52783203125, 39.0888671875, 40.64990234375, 42.2109375, 43.77197265625, 45.3330078125, 46.89404296875, 48.455078125, 50.01611328125, 51.5771484375, 53.13818359375, 54.69921875, 56.26025390625, 57.8212890625, 59.38232421875, 60.943359375, 62.50439453125, 64.0654296875, 65.62646484375, 67.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 5.0, 6.0, 17.0, 11.0, 22.0, 39.0, 46.0, 52.0, 62.0, 64.0, 73.0, 87.0, 85.0, 81.0, 65.0, 73.0, 51.0, 49.0, 33.0, 31.0, 9.0, 18.0, 15.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -41.71484375, -39.7421875, -37.76953125, -35.796875, -33.82421875, -31.8515625, -29.87890625, -27.90625, -25.93359375, -23.9609375, -21.98828125, -20.015625, -18.04296875, -16.0703125, -14.09765625, -12.125, -10.15234375, -8.1796875, -6.20703125, -4.234375, -2.26171875, -0.2890625, 1.68359375, 3.65625, 5.62890625, 7.6015625, 9.57421875, 11.546875, 13.51953125, 15.4921875, 17.46484375, 19.4375, 21.41015625, 23.3828125, 25.35546875, 27.328125, 29.30078125, 31.2734375, 33.24609375, 35.21875, 37.19140625, 39.1640625, 41.13671875, 43.109375, 45.08203125, 47.0546875, 49.02734375, 51.0, 52.97265625, 54.9453125, 56.91796875, 58.890625, 60.86328125, 62.8359375, 64.80859375, 66.78125, 68.75390625, 70.7265625, 72.69921875, 74.671875, 76.64453125, 78.6171875, 80.58984375, 82.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 7.0, 14.0, 19.0, 26.0, 42.0, 75.0, 114.0, 251.0, 429.0, 1048.0, 2956.0, 10096.0, 46659.0, 449647.0, 3437692.0, 203525.0, 29860.0, 7354.0, 2427.0, 1007.0, 428.0, 241.0, 142.0, 85.0, 50.0, 32.0, 20.0, 9.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.4375, -106.9169921875, -103.396484375, -99.8759765625, -96.35546875, -92.8349609375, -89.314453125, -85.7939453125, -82.2734375, -78.7529296875, -75.232421875, -71.7119140625, -68.19140625, -64.6708984375, -61.150390625, -57.6298828125, -54.109375, -50.5888671875, -47.068359375, -43.5478515625, -40.02734375, -36.5068359375, -32.986328125, -29.4658203125, -25.9453125, -22.4248046875, -18.904296875, -15.3837890625, -11.86328125, -8.3427734375, -4.822265625, -1.3017578125, 2.21875, 5.7392578125, 9.259765625, 12.7802734375, 16.30078125, 19.8212890625, 23.341796875, 26.8623046875, 30.3828125, 33.9033203125, 37.423828125, 40.9443359375, 44.46484375, 47.9853515625, 51.505859375, 55.0263671875, 58.546875, 62.0673828125, 65.587890625, 69.1083984375, 72.62890625, 76.1494140625, 79.669921875, 83.1904296875, 86.7109375, 90.2314453125, 93.751953125, 97.2724609375, 100.79296875, 104.3134765625, 107.833984375, 111.3544921875, 114.875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 5.0, 9.0, 19.0, 21.0, 25.0, 28.0, 47.0, 51.0, 59.0, 100.0, 156.0, 253.0, 423.0, 632.0, 684.0, 568.0, 335.0, 198.0, 121.0, 72.0, 53.0, 38.0, 34.0, 25.0, 28.0, 12.0, 12.0, 12.0, 7.0, 7.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-85.125, -82.220703125, -79.31640625, -76.412109375, -73.5078125, -70.603515625, -67.69921875, -64.794921875, -61.890625, -58.986328125, -56.08203125, -53.177734375, -50.2734375, -47.369140625, -44.46484375, -41.560546875, -38.65625, -35.751953125, -32.84765625, -29.943359375, -27.0390625, -24.134765625, -21.23046875, -18.326171875, -15.421875, -12.517578125, -9.61328125, -6.708984375, -3.8046875, -0.900390625, 2.00390625, 4.908203125, 7.8125, 10.716796875, 13.62109375, 16.525390625, 19.4296875, 22.333984375, 25.23828125, 28.142578125, 31.046875, 33.951171875, 36.85546875, 39.759765625, 42.6640625, 45.568359375, 48.47265625, 51.376953125, 54.28125, 57.185546875, 60.08984375, 62.994140625, 65.8984375, 68.802734375, 71.70703125, 74.611328125, 77.515625, 80.419921875, 83.32421875, 86.228515625, 89.1328125, 92.037109375, 94.94140625, 97.845703125, 100.75]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 19.0, 21.0, 72.0, 162.0, 287.0, 236.0, 117.0, 51.0, 17.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1917.255126953125, -1866.497802734375, -1815.7403564453125, -1764.9830322265625, -1714.2257080078125, -1663.46826171875, -1612.7109375, -1561.95361328125, -1511.1961669921875, -1460.4388427734375, -1409.681396484375, -1358.924072265625, -1308.166748046875, -1257.4093017578125, -1206.6519775390625, -1155.89453125, -1105.13720703125, -1054.3798828125, -1003.6224975585938, -952.8651123046875, -902.1077270507812, -851.350341796875, -800.593017578125, -749.8356323242188, -699.078369140625, -648.3209838867188, -597.5636596679688, -546.8062744140625, -496.04888916015625, -445.2915344238281, -394.5341796875, -343.77679443359375, -293.0194091796875, -242.2620391845703, -191.50466918945312, -140.747314453125, -89.98994445800781, -39.232574462890625, 11.5247802734375, 62.28216552734375, 113.03952026367188, 163.79689025878906, 214.55426025390625, 265.3116149902344, 316.0689697265625, 366.82635498046875, 417.5837097167969, 468.3410949707031, 519.0984497070312, 569.8558349609375, 620.6131591796875, 671.3705444335938, 722.1279296875, 772.88525390625, 823.6426391601562, 874.4000244140625, 925.1573486328125, 975.9147338867188, 1026.672119140625, 1077.429443359375, 1128.186767578125, 1178.9442138671875, 1229.7015380859375, 1280.458984375, 1331.21630859375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 7.0, 10.0, 12.0, 14.0, 16.0, 24.0, 29.0, 31.0, 24.0, 36.0, 42.0, 49.0, 58.0, 46.0, 63.0, 52.0, 41.0, 51.0, 52.0, 39.0, 33.0, 29.0, 30.0, 29.0, 34.0, 18.0, 26.0, 19.0, 23.0, 7.0, 3.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-502.78564453125, -487.50390625, -472.22216796875, -456.9404296875, -441.6586608886719, -426.3769226074219, -411.0951843261719, -395.8134460449219, -380.53167724609375, -365.24993896484375, -349.96820068359375, -334.68646240234375, -319.4046936035156, -304.1229553222656, -288.8412170410156, -273.5594787597656, -258.2777404785156, -242.99600219726562, -227.71424865722656, -212.43251037597656, -197.1507568359375, -181.8690185546875, -166.5872802734375, -151.3055419921875, -136.02378845214844, -120.7420425415039, -105.46029663085938, -90.17855834960938, -74.89681243896484, -59.61506652832031, -44.33332824707031, -29.05158233642578, -13.76983642578125, 1.5119075775146484, 16.793651580810547, 32.07539367675781, 47.357139587402344, 62.638885498046875, 77.92062377929688, 93.2023696899414, 108.48411560058594, 123.76586151123047, 139.047607421875, 154.329345703125, 169.611083984375, 184.89283752441406, 200.17457580566406, 215.45632934570312, 230.73806762695312, 246.01980590820312, 261.3015441894531, 276.58331298828125, 291.86505126953125, 307.14678955078125, 322.42852783203125, 337.71026611328125, 352.99200439453125, 368.27374267578125, 383.55548095703125, 398.83721923828125, 414.1189880371094, 429.4007263183594, 444.6824645996094, 459.9642028808594, 475.2459716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 1.0, 11.0, 10.0, 21.0, 45.0, 65.0, 110.0, 201.0, 360.0, 700.0, 1504.0, 3167.0, 7517.0, 20044.0, 58044.0, 204418.0, 502920.0, 169535.0, 50151.0, 17278.0, 6808.0, 2922.0, 1303.0, 670.0, 337.0, 162.0, 104.0, 53.0, 24.0, 38.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5, -83.748046875, -80.99609375, -78.244140625, -75.4921875, -72.740234375, -69.98828125, -67.236328125, -64.484375, -61.732421875, -58.98046875, -56.228515625, -53.4765625, -50.724609375, -47.97265625, -45.220703125, -42.46875, -39.716796875, -36.96484375, -34.212890625, -31.4609375, -28.708984375, -25.95703125, -23.205078125, -20.453125, -17.701171875, -14.94921875, -12.197265625, -9.4453125, -6.693359375, -3.94140625, -1.189453125, 1.5625, 4.314453125, 7.06640625, 9.818359375, 12.5703125, 15.322265625, 18.07421875, 20.826171875, 23.578125, 26.330078125, 29.08203125, 31.833984375, 34.5859375, 37.337890625, 40.08984375, 42.841796875, 45.59375, 48.345703125, 51.09765625, 53.849609375, 56.6015625, 59.353515625, 62.10546875, 64.857421875, 67.609375, 70.361328125, 73.11328125, 75.865234375, 78.6171875, 81.369140625, 84.12109375, 86.873046875, 89.625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 12.0, 13.0, 23.0, 28.0, 25.0, 63.0, 64.0, 68.0, 78.0, 84.0, 93.0, 67.0, 76.0, 80.0, 61.0, 33.0, 34.0, 39.0, 19.0, 19.0, 8.0, 7.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.875, -50.72265625, -48.5703125, -46.41796875, -44.265625, -42.11328125, -39.9609375, -37.80859375, -35.65625, -33.50390625, -31.3515625, -29.19921875, -27.046875, -24.89453125, -22.7421875, -20.58984375, -18.4375, -16.28515625, -14.1328125, -11.98046875, -9.828125, -7.67578125, -5.5234375, -3.37109375, -1.21875, 0.93359375, 3.0859375, 5.23828125, 7.390625, 9.54296875, 11.6953125, 13.84765625, 16.0, 18.15234375, 20.3046875, 22.45703125, 24.609375, 26.76171875, 28.9140625, 31.06640625, 33.21875, 35.37109375, 37.5234375, 39.67578125, 41.828125, 43.98046875, 46.1328125, 48.28515625, 50.4375, 52.58984375, 54.7421875, 56.89453125, 59.046875, 61.19921875, 63.3515625, 65.50390625, 67.65625, 69.80859375, 71.9609375, 74.11328125, 76.265625, 78.41796875, 80.5703125, 82.72265625, 84.875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 11.0, 17.0, 22.0, 52.0, 53.0, 83.0, 165.0, 271.0, 515.0, 915.0, 2230.0, 7789.0, 47481.0, 743147.0, 217415.0, 20791.0, 4375.0, 1484.0, 744.0, 380.0, 225.0, 114.0, 79.0, 66.0, 30.0, 24.0, 19.0, 10.0, 7.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.875, -150.548828125, -144.22265625, -137.896484375, -131.5703125, -125.244140625, -118.91796875, -112.591796875, -106.265625, -99.939453125, -93.61328125, -87.287109375, -80.9609375, -74.634765625, -68.30859375, -61.982421875, -55.65625, -49.330078125, -43.00390625, -36.677734375, -30.3515625, -24.025390625, -17.69921875, -11.373046875, -5.046875, 1.279296875, 7.60546875, 13.931640625, 20.2578125, 26.583984375, 32.91015625, 39.236328125, 45.5625, 51.888671875, 58.21484375, 64.541015625, 70.8671875, 77.193359375, 83.51953125, 89.845703125, 96.171875, 102.498046875, 108.82421875, 115.150390625, 121.4765625, 127.802734375, 134.12890625, 140.455078125, 146.78125, 153.107421875, 159.43359375, 165.759765625, 172.0859375, 178.412109375, 184.73828125, 191.064453125, 197.390625, 203.716796875, 210.04296875, 216.369140625, 222.6953125, 229.021484375, 235.34765625, 241.673828125, 248.0]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 22.0, 35.0, 50.0, 64.0, 68.0, 99.0, 93.0, 101.0, 95.0, 86.0, 66.0, 53.0, 46.0, 22.0, 23.0, 19.0, 14.0, 7.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.75, -260.83984375, -250.9296875, -241.01953125, -231.109375, -221.19921875, -211.2890625, -201.37890625, -191.46875, -181.55859375, -171.6484375, -161.73828125, -151.828125, -141.91796875, -132.0078125, -122.09765625, -112.1875, -102.27734375, -92.3671875, -82.45703125, -72.546875, -62.63671875, -52.7265625, -42.81640625, -32.90625, -22.99609375, -13.0859375, -3.17578125, 6.734375, 16.64453125, 26.5546875, 36.46484375, 46.375, 56.28515625, 66.1953125, 76.10546875, 86.015625, 95.92578125, 105.8359375, 115.74609375, 125.65625, 135.56640625, 145.4765625, 155.38671875, 165.296875, 175.20703125, 185.1171875, 195.02734375, 204.9375, 214.84765625, 224.7578125, 234.66796875, 244.578125, 254.48828125, 264.3984375, 274.30859375, 284.21875, 294.12890625, 304.0390625, 313.94921875, 323.859375, 333.76953125, 343.6796875, 353.58984375, 363.5]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 10.0, 12.0, 17.0, 35.0, 49.0, 67.0, 81.0, 144.0, 263.0, 405.0, 666.0, 1376.0, 2832.0, 6746.0, 18861.0, 71853.0, 575286.0, 293068.0, 51585.0, 14607.0, 5568.0, 2364.0, 1095.0, 582.0, 364.0, 223.0, 115.0, 76.0, 46.0, 45.0, 22.0, 25.0, 20.0, 14.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.5625, -41.1845703125, -39.806640625, -38.4287109375, -37.05078125, -35.6728515625, -34.294921875, -32.9169921875, -31.5390625, -30.1611328125, -28.783203125, -27.4052734375, -26.02734375, -24.6494140625, -23.271484375, -21.8935546875, -20.515625, -19.1376953125, -17.759765625, -16.3818359375, -15.00390625, -13.6259765625, -12.248046875, -10.8701171875, -9.4921875, -8.1142578125, -6.736328125, -5.3583984375, -3.98046875, -2.6025390625, -1.224609375, 0.1533203125, 1.53125, 2.9091796875, 4.287109375, 5.6650390625, 7.04296875, 8.4208984375, 9.798828125, 11.1767578125, 12.5546875, 13.9326171875, 15.310546875, 16.6884765625, 18.06640625, 19.4443359375, 20.822265625, 22.2001953125, 23.578125, 24.9560546875, 26.333984375, 27.7119140625, 29.08984375, 30.4677734375, 31.845703125, 33.2236328125, 34.6015625, 35.9794921875, 37.357421875, 38.7353515625, 40.11328125, 41.4912109375, 42.869140625, 44.2470703125, 45.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 1.0, 7.0, 9.0, 11.0, 9.0, 13.0, 22.0, 20.0, 36.0, 55.0, 87.0, 135.0, 127.0, 138.0, 99.0, 66.0, 39.0, 36.0, 20.0, 10.0, 13.0, 6.0, 5.0, 8.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0214691162109375, -0.02088308334350586, -0.02029705047607422, -0.019711017608642578, -0.019124984741210938, -0.018538951873779297, -0.017952919006347656, -0.017366886138916016, -0.016780853271484375, -0.016194820404052734, -0.015608787536621094, -0.015022754669189453, -0.014436721801757812, -0.013850688934326172, -0.013264656066894531, -0.01267862319946289, -0.01209259033203125, -0.01150655746459961, -0.010920524597167969, -0.010334491729736328, -0.009748458862304688, -0.009162425994873047, -0.008576393127441406, -0.007990360260009766, -0.007404327392578125, -0.006818294525146484, -0.006232261657714844, -0.005646228790283203, -0.0050601959228515625, -0.004474163055419922, -0.0038881301879882812, -0.0033020973205566406, -0.002716064453125, -0.0021300315856933594, -0.0015439987182617188, -0.0009579658508300781, -0.0003719329833984375, 0.00021409988403320312, 0.0008001327514648438, 0.0013861656188964844, 0.001972198486328125, 0.0025582313537597656, 0.0031442642211914062, 0.003730297088623047, 0.0043163299560546875, 0.004902362823486328, 0.005488395690917969, 0.006074428558349609, 0.00666046142578125, 0.007246494293212891, 0.007832527160644531, 0.008418560028076172, 0.009004592895507812, 0.009590625762939453, 0.010176658630371094, 0.010762691497802734, 0.011348724365234375, 0.011934757232666016, 0.012520790100097656, 0.013106822967529297, 0.013692855834960938, 0.014278888702392578, 0.014864921569824219, 0.01545095443725586, 0.0160369873046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 16.0, 12.0, 26.0, 38.0, 49.0, 80.0, 101.0, 147.0, 211.0, 361.0, 651.0, 1292.0, 2624.0, 6720.0, 20560.0, 86577.0, 606980.0, 253168.0, 46984.0, 12940.0, 4531.0, 1974.0, 1009.0, 535.0, 301.0, 176.0, 147.0, 103.0, 65.0, 43.0, 35.0, 32.0, 15.0, 8.0, 14.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.71875, -34.43408203125, -33.1494140625, -31.86474609375, -30.580078125, -29.29541015625, -28.0107421875, -26.72607421875, -25.44140625, -24.15673828125, -22.8720703125, -21.58740234375, -20.302734375, -19.01806640625, -17.7333984375, -16.44873046875, -15.1640625, -13.87939453125, -12.5947265625, -11.31005859375, -10.025390625, -8.74072265625, -7.4560546875, -6.17138671875, -4.88671875, -3.60205078125, -2.3173828125, -1.03271484375, 0.251953125, 1.53662109375, 2.8212890625, 4.10595703125, 5.390625, 6.67529296875, 7.9599609375, 9.24462890625, 10.529296875, 11.81396484375, 13.0986328125, 14.38330078125, 15.66796875, 16.95263671875, 18.2373046875, 19.52197265625, 20.806640625, 22.09130859375, 23.3759765625, 24.66064453125, 25.9453125, 27.22998046875, 28.5146484375, 29.79931640625, 31.083984375, 32.36865234375, 33.6533203125, 34.93798828125, 36.22265625, 37.50732421875, 38.7919921875, 40.07666015625, 41.361328125, 42.64599609375, 43.9306640625, 45.21533203125, 46.5]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 5.0, 12.0, 15.0, 15.0, 25.0, 31.0, 33.0, 29.0, 35.0, 42.0, 55.0, 54.0, 59.0, 65.0, 77.0, 60.0, 62.0, 40.0, 33.0, 45.0, 29.0, 23.0, 13.0, 20.0, 21.0, 14.0, 12.0, 11.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.40625, -27.4072265625, -26.408203125, -25.4091796875, -24.41015625, -23.4111328125, -22.412109375, -21.4130859375, -20.4140625, -19.4150390625, -18.416015625, -17.4169921875, -16.41796875, -15.4189453125, -14.419921875, -13.4208984375, -12.421875, -11.4228515625, -10.423828125, -9.4248046875, -8.42578125, -7.4267578125, -6.427734375, -5.4287109375, -4.4296875, -3.4306640625, -2.431640625, -1.4326171875, -0.43359375, 0.5654296875, 1.564453125, 2.5634765625, 3.5625, 4.5615234375, 5.560546875, 6.5595703125, 7.55859375, 8.5576171875, 9.556640625, 10.5556640625, 11.5546875, 12.5537109375, 13.552734375, 14.5517578125, 15.55078125, 16.5498046875, 17.548828125, 18.5478515625, 19.546875, 20.5458984375, 21.544921875, 22.5439453125, 23.54296875, 24.5419921875, 25.541015625, 26.5400390625, 27.5390625, 28.5380859375, 29.537109375, 30.5361328125, 31.53515625, 32.5341796875, 33.533203125, 34.5322265625, 35.53125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 11.0, 18.0, 39.0, 75.0, 119.0, 186.0, 248.0, 123.0, 64.0, 39.0, 23.0, 19.0, 10.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1224.50927734375, -1190.79345703125, -1157.07763671875, -1123.3616943359375, -1089.6458740234375, -1055.9300537109375, -1022.2142333984375, -988.4984130859375, -954.7825317382812, -921.0667114257812, -887.350830078125, -853.635009765625, -819.919189453125, -786.2033081054688, -752.4874877929688, -718.7716064453125, -685.0557861328125, -651.3399658203125, -617.6240844726562, -583.9082641601562, -550.1923828125, -516.4765625, -482.7607421875, -449.0448913574219, -415.32904052734375, -381.6131896972656, -347.8973388671875, -314.1815185546875, -280.4656677246094, -246.74981689453125, -213.0339813232422, -179.31814575195312, -145.60223388671875, -111.88639068603516, -78.17054748535156, -44.45470428466797, -10.738861083984375, 22.97698974609375, 56.69282531738281, 90.40866088867188, 124.12451171875, 157.84036254882812, 191.5561981201172, 225.27203369140625, 258.9878845214844, 292.7037353515625, 326.4195556640625, 360.1354064941406, 393.85125732421875, 427.5671081542969, 461.282958984375, 494.998779296875, 528.714599609375, 562.4304809570312, 596.1463012695312, 629.8621826171875, 663.5780029296875, 697.2938232421875, 731.0097045898438, 764.7255249023438, 798.44140625, 832.1572265625, 865.873046875, 899.5888671875, 933.3047485351562]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 8.0, 8.0, 22.0, 16.0, 15.0, 13.0, 19.0, 22.0, 17.0, 29.0, 27.0, 38.0, 37.0, 36.0, 42.0, 69.0, 82.0, 74.0, 56.0, 50.0, 52.0, 32.0, 26.0, 35.0, 33.0, 22.0, 20.0, 18.0, 11.0, 19.0, 6.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-621.338134765625, -599.2092895507812, -577.0805053710938, -554.95166015625, -532.8228149414062, -510.6940002441406, -488.565185546875, -466.43634033203125, -444.3075256347656, -422.1787109375, -400.04986572265625, -377.9210510253906, -355.792236328125, -333.66339111328125, -311.5345764160156, -289.40576171875, -267.27691650390625, -245.14808654785156, -223.01925659179688, -200.89044189453125, -178.76161193847656, -156.63278198242188, -134.50396728515625, -112.37513732910156, -90.24630737304688, -68.11747741699219, -45.98865509033203, -23.859832763671875, -1.7310028076171875, 20.3978271484375, 42.526641845703125, 64.65547180175781, 86.78436279296875, 108.91319274902344, 131.04202270507812, 153.17083740234375, 175.29966735839844, 197.42849731445312, 219.55731201171875, 241.68614196777344, 263.8149719238281, 285.94378662109375, 308.0726318359375, 330.2014465332031, 352.33026123046875, 374.4591064453125, 396.5879211425781, 418.71673583984375, 440.8455810546875, 462.9743957519531, 485.1032409667969, 507.2320556640625, 529.3609008789062, 551.48974609375, 573.6185302734375, 595.7473754882812, 617.876220703125, 640.0050659179688, 662.1338500976562, 684.2626953125, 706.3915405273438, 728.5203857421875, 750.649169921875, 772.7780151367188, 794.9067993164062]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 10.0, 10.0, 10.0, 21.0, 30.0, 35.0, 57.0, 99.0, 146.0, 226.0, 394.0, 706.0, 1249.0, 2478.0, 5664.0, 15421.0, 67333.0, 658834.0, 2894341.0, 470632.0, 53549.0, 13219.0, 4880.0, 2151.0, 1158.0, 591.0, 387.0, 193.0, 152.0, 95.0, 67.0, 40.0, 31.0, 21.0, 12.0, 8.0, 10.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.4375, -63.287109375, -61.13671875, -58.986328125, -56.8359375, -54.685546875, -52.53515625, -50.384765625, -48.234375, -46.083984375, -43.93359375, -41.783203125, -39.6328125, -37.482421875, -35.33203125, -33.181640625, -31.03125, -28.880859375, -26.73046875, -24.580078125, -22.4296875, -20.279296875, -18.12890625, -15.978515625, -13.828125, -11.677734375, -9.52734375, -7.376953125, -5.2265625, -3.076171875, -0.92578125, 1.224609375, 3.375, 5.525390625, 7.67578125, 9.826171875, 11.9765625, 14.126953125, 16.27734375, 18.427734375, 20.578125, 22.728515625, 24.87890625, 27.029296875, 29.1796875, 31.330078125, 33.48046875, 35.630859375, 37.78125, 39.931640625, 42.08203125, 44.232421875, 46.3828125, 48.533203125, 50.68359375, 52.833984375, 54.984375, 57.134765625, 59.28515625, 61.435546875, 63.5859375, 65.736328125, 67.88671875, 70.037109375, 72.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 14.0, 11.0, 11.0, 16.0, 22.0, 31.0, 45.0, 51.0, 44.0, 49.0, 59.0, 67.0, 60.0, 63.0, 75.0, 58.0, 55.0, 37.0, 45.0, 49.0, 25.0, 25.0, 20.0, 15.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-53.875, -52.3740234375, -50.873046875, -49.3720703125, -47.87109375, -46.3701171875, -44.869140625, -43.3681640625, -41.8671875, -40.3662109375, -38.865234375, -37.3642578125, -35.86328125, -34.3623046875, -32.861328125, -31.3603515625, -29.859375, -28.3583984375, -26.857421875, -25.3564453125, -23.85546875, -22.3544921875, -20.853515625, -19.3525390625, -17.8515625, -16.3505859375, -14.849609375, -13.3486328125, -11.84765625, -10.3466796875, -8.845703125, -7.3447265625, -5.84375, -4.3427734375, -2.841796875, -1.3408203125, 0.16015625, 1.6611328125, 3.162109375, 4.6630859375, 6.1640625, 7.6650390625, 9.166015625, 10.6669921875, 12.16796875, 13.6689453125, 15.169921875, 16.6708984375, 18.171875, 19.6728515625, 21.173828125, 22.6748046875, 24.17578125, 25.6767578125, 27.177734375, 28.6787109375, 30.1796875, 31.6806640625, 33.181640625, 34.6826171875, 36.18359375, 37.6845703125, 39.185546875, 40.6865234375, 42.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 10.0, 16.0, 25.0, 32.0, 47.0, 73.0, 106.0, 153.0, 236.0, 440.0, 1419.0, 21920.0, 4090630.0, 75264.0, 2581.0, 611.0, 238.0, 156.0, 120.0, 63.0, 51.0, 41.0, 20.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-364.75, -353.57421875, -342.3984375, -331.22265625, -320.046875, -308.87109375, -297.6953125, -286.51953125, -275.34375, -264.16796875, -252.9921875, -241.81640625, -230.640625, -219.46484375, -208.2890625, -197.11328125, -185.9375, -174.76171875, -163.5859375, -152.41015625, -141.234375, -130.05859375, -118.8828125, -107.70703125, -96.53125, -85.35546875, -74.1796875, -63.00390625, -51.828125, -40.65234375, -29.4765625, -18.30078125, -7.125, 4.05078125, 15.2265625, 26.40234375, 37.578125, 48.75390625, 59.9296875, 71.10546875, 82.28125, 93.45703125, 104.6328125, 115.80859375, 126.984375, 138.16015625, 149.3359375, 160.51171875, 171.6875, 182.86328125, 194.0390625, 205.21484375, 216.390625, 227.56640625, 238.7421875, 249.91796875, 261.09375, 272.26953125, 283.4453125, 294.62109375, 305.796875, 316.97265625, 328.1484375, 339.32421875, 350.5]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 11.0, 11.0, 28.0, 48.0, 118.0, 335.0, 1260.0, 1639.0, 409.0, 128.0, 43.0, 24.0, 16.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.0, -282.71484375, -274.4296875, -266.14453125, -257.859375, -249.57421875, -241.2890625, -233.00390625, -224.71875, -216.43359375, -208.1484375, -199.86328125, -191.578125, -183.29296875, -175.0078125, -166.72265625, -158.4375, -150.15234375, -141.8671875, -133.58203125, -125.296875, -117.01171875, -108.7265625, -100.44140625, -92.15625, -83.87109375, -75.5859375, -67.30078125, -59.015625, -50.73046875, -42.4453125, -34.16015625, -25.875, -17.58984375, -9.3046875, -1.01953125, 7.265625, 15.55078125, 23.8359375, 32.12109375, 40.40625, 48.69140625, 56.9765625, 65.26171875, 73.546875, 81.83203125, 90.1171875, 98.40234375, 106.6875, 114.97265625, 123.2578125, 131.54296875, 139.828125, 148.11328125, 156.3984375, 164.68359375, 172.96875, 181.25390625, 189.5390625, 197.82421875, 206.109375, 214.39453125, 222.6796875, 230.96484375, 239.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 30.0, 58.0, 85.0, 193.0, 276.0, 188.0, 72.0, 34.0, 17.0, 13.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1509.131591796875, -1458.294921875, -1407.4583740234375, -1356.6217041015625, -1305.78515625, -1254.948486328125, -1204.11181640625, -1153.2752685546875, -1102.4385986328125, -1051.6019287109375, -1000.765380859375, -949.9287109375, -899.0921020507812, -848.2554931640625, -797.4188842773438, -746.582275390625, -695.7456665039062, -644.9090576171875, -594.0724487304688, -543.23583984375, -492.399169921875, -441.56256103515625, -390.7259521484375, -339.8893127441406, -289.0527038574219, -238.21607971191406, -187.37945556640625, -136.5428466796875, -85.70622253417969, -34.869598388671875, 15.967010498046875, 66.80364990234375, 117.6402587890625, 168.4768829345703, 219.31350708007812, 270.1501159667969, 320.98675537109375, 371.8233642578125, 422.65997314453125, 473.4966125488281, 524.333251953125, 575.1698608398438, 626.0064697265625, 676.8431396484375, 727.6797485351562, 778.516357421875, 829.3529663085938, 880.1895751953125, 931.0261840820312, 981.86279296875, 1032.699462890625, 1083.5360107421875, 1134.3726806640625, 1185.209228515625, 1236.0458984375, 1286.882568359375, 1337.7191162109375, 1388.5557861328125, 1439.392333984375, 1490.22900390625, 1541.0655517578125, 1591.9022216796875, 1642.73876953125, 1693.575439453125, 1744.412109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 11.0, 9.0, 8.0, 20.0, 27.0, 27.0, 25.0, 36.0, 45.0, 41.0, 49.0, 52.0, 56.0, 55.0, 53.0, 60.0, 56.0, 60.0, 54.0, 44.0, 35.0, 36.0, 33.0, 22.0, 21.0, 16.0, 16.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.2180786132812, -570.8192138671875, -552.4203491210938, -534.0214233398438, -515.62255859375, -497.22369384765625, -478.8248291015625, -460.42596435546875, -442.0270690917969, -423.6282043457031, -405.22930908203125, -386.8304443359375, -368.43157958984375, -350.0326843261719, -331.6338195800781, -313.23492431640625, -294.8360595703125, -276.43719482421875, -258.0382995605469, -239.63943481445312, -221.2405548095703, -202.8416748046875, -184.44281005859375, -166.04393005371094, -147.64505004882812, -129.2461700439453, -110.84729766845703, -92.44842529296875, -74.04954528808594, -55.650665283203125, -37.251792907714844, -18.852920532226562, -0.4541015625, 17.944774627685547, 36.343650817871094, 54.74252700805664, 73.14140319824219, 91.540283203125, 109.93915557861328, 128.33802795410156, 146.73690795898438, 165.1357879638672, 183.53466796875, 201.93353271484375, 220.33241271972656, 238.73129272460938, 257.1301574707031, 275.529052734375, 293.92791748046875, 312.3267822265625, 330.7256774902344, 349.1245422363281, 367.5234375, 385.92230224609375, 404.3211669921875, 422.72003173828125, 441.1189270019531, 459.5177917480469, 477.91668701171875, 496.3155517578125, 514.7144165039062, 533.11328125, 551.51220703125, 569.9110717773438, 588.3099365234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 11.0, 14.0, 28.0, 35.0, 65.0, 75.0, 104.0, 173.0, 264.0, 381.0, 675.0, 1009.0, 1639.0, 2715.0, 4614.0, 8333.0, 15642.0, 30873.0, 64199.0, 143086.0, 292468.0, 254336.0, 117494.0, 53493.0, 25908.0, 13289.0, 7105.0, 4119.0, 2413.0, 1435.0, 900.0, 555.0, 354.0, 256.0, 177.0, 119.0, 55.0, 44.0, 26.0, 20.0, 13.0, 9.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-44.46875, -43.1162109375, -41.763671875, -40.4111328125, -39.05859375, -37.7060546875, -36.353515625, -35.0009765625, -33.6484375, -32.2958984375, -30.943359375, -29.5908203125, -28.23828125, -26.8857421875, -25.533203125, -24.1806640625, -22.828125, -21.4755859375, -20.123046875, -18.7705078125, -17.41796875, -16.0654296875, -14.712890625, -13.3603515625, -12.0078125, -10.6552734375, -9.302734375, -7.9501953125, -6.59765625, -5.2451171875, -3.892578125, -2.5400390625, -1.1875, 0.1650390625, 1.517578125, 2.8701171875, 4.22265625, 5.5751953125, 6.927734375, 8.2802734375, 9.6328125, 10.9853515625, 12.337890625, 13.6904296875, 15.04296875, 16.3955078125, 17.748046875, 19.1005859375, 20.453125, 21.8056640625, 23.158203125, 24.5107421875, 25.86328125, 27.2158203125, 28.568359375, 29.9208984375, 31.2734375, 32.6259765625, 33.978515625, 35.3310546875, 36.68359375, 38.0361328125, 39.388671875, 40.7412109375, 42.09375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 8.0, 8.0, 12.0, 10.0, 13.0, 19.0, 23.0, 37.0, 35.0, 50.0, 48.0, 57.0, 55.0, 51.0, 62.0, 53.0, 59.0, 56.0, 61.0, 50.0, 36.0, 36.0, 30.0, 26.0, 22.0, 26.0, 6.0, 18.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.15625, -53.5771484375, -51.998046875, -50.4189453125, -48.83984375, -47.2607421875, -45.681640625, -44.1025390625, -42.5234375, -40.9443359375, -39.365234375, -37.7861328125, -36.20703125, -34.6279296875, -33.048828125, -31.4697265625, -29.890625, -28.3115234375, -26.732421875, -25.1533203125, -23.57421875, -21.9951171875, -20.416015625, -18.8369140625, -17.2578125, -15.6787109375, -14.099609375, -12.5205078125, -10.94140625, -9.3623046875, -7.783203125, -6.2041015625, -4.625, -3.0458984375, -1.466796875, 0.1123046875, 1.69140625, 3.2705078125, 4.849609375, 6.4287109375, 8.0078125, 9.5869140625, 11.166015625, 12.7451171875, 14.32421875, 15.9033203125, 17.482421875, 19.0615234375, 20.640625, 22.2197265625, 23.798828125, 25.3779296875, 26.95703125, 28.5361328125, 30.115234375, 31.6943359375, 33.2734375, 34.8525390625, 36.431640625, 38.0107421875, 39.58984375, 41.1689453125, 42.748046875, 44.3271484375, 45.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 19.0, 22.0, 21.0, 46.0, 83.0, 199.0, 442.0, 1152.0, 3208.0, 11024.0, 54963.0, 610550.0, 314279.0, 39696.0, 8518.0, 2588.0, 927.0, 388.0, 181.0, 85.0, 46.0, 35.0, 25.0, 12.0, 3.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.0, -116.814453125, -112.62890625, -108.443359375, -104.2578125, -100.072265625, -95.88671875, -91.701171875, -87.515625, -83.330078125, -79.14453125, -74.958984375, -70.7734375, -66.587890625, -62.40234375, -58.216796875, -54.03125, -49.845703125, -45.66015625, -41.474609375, -37.2890625, -33.103515625, -28.91796875, -24.732421875, -20.546875, -16.361328125, -12.17578125, -7.990234375, -3.8046875, 0.380859375, 4.56640625, 8.751953125, 12.9375, 17.123046875, 21.30859375, 25.494140625, 29.6796875, 33.865234375, 38.05078125, 42.236328125, 46.421875, 50.607421875, 54.79296875, 58.978515625, 63.1640625, 67.349609375, 71.53515625, 75.720703125, 79.90625, 84.091796875, 88.27734375, 92.462890625, 96.6484375, 100.833984375, 105.01953125, 109.205078125, 113.390625, 117.576171875, 121.76171875, 125.947265625, 130.1328125, 134.318359375, 138.50390625, 142.689453125, 146.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 9.0, 8.0, 13.0, 28.0, 28.0, 38.0, 32.0, 46.0, 45.0, 51.0, 64.0, 58.0, 52.0, 62.0, 78.0, 46.0, 48.0, 44.0, 43.0, 28.0, 32.0, 36.0, 13.0, 22.0, 6.0, 12.0, 5.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-200.125, -194.01171875, -187.8984375, -181.78515625, -175.671875, -169.55859375, -163.4453125, -157.33203125, -151.21875, -145.10546875, -138.9921875, -132.87890625, -126.765625, -120.65234375, -114.5390625, -108.42578125, -102.3125, -96.19921875, -90.0859375, -83.97265625, -77.859375, -71.74609375, -65.6328125, -59.51953125, -53.40625, -47.29296875, -41.1796875, -35.06640625, -28.953125, -22.83984375, -16.7265625, -10.61328125, -4.5, 1.61328125, 7.7265625, 13.83984375, 19.953125, 26.06640625, 32.1796875, 38.29296875, 44.40625, 50.51953125, 56.6328125, 62.74609375, 68.859375, 74.97265625, 81.0859375, 87.19921875, 93.3125, 99.42578125, 105.5390625, 111.65234375, 117.765625, 123.87890625, 129.9921875, 136.10546875, 142.21875, 148.33203125, 154.4453125, 160.55859375, 166.671875, 172.78515625, 178.8984375, 185.01171875, 191.125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 12.0, 21.0, 21.0, 41.0, 54.0, 109.0, 205.0, 425.0, 997.0, 2590.0, 8855.0, 35096.0, 166522.0, 641214.0, 148259.0, 31623.0, 8108.0, 2548.0, 961.0, 383.0, 212.0, 103.0, 58.0, 37.0, 24.0, 17.0, 15.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.1875, -30.226806640625, -29.26611328125, -28.305419921875, -27.3447265625, -26.384033203125, -25.42333984375, -24.462646484375, -23.501953125, -22.541259765625, -21.58056640625, -20.619873046875, -19.6591796875, -18.698486328125, -17.73779296875, -16.777099609375, -15.81640625, -14.855712890625, -13.89501953125, -12.934326171875, -11.9736328125, -11.012939453125, -10.05224609375, -9.091552734375, -8.130859375, -7.170166015625, -6.20947265625, -5.248779296875, -4.2880859375, -3.327392578125, -2.36669921875, -1.406005859375, -0.4453125, 0.515380859375, 1.47607421875, 2.436767578125, 3.3974609375, 4.358154296875, 5.31884765625, 6.279541015625, 7.240234375, 8.200927734375, 9.16162109375, 10.122314453125, 11.0830078125, 12.043701171875, 13.00439453125, 13.965087890625, 14.92578125, 15.886474609375, 16.84716796875, 17.807861328125, 18.7685546875, 19.729248046875, 20.68994140625, 21.650634765625, 22.611328125, 23.572021484375, 24.53271484375, 25.493408203125, 26.4541015625, 27.414794921875, 28.37548828125, 29.336181640625, 30.296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 10.0, 13.0, 13.0, 19.0, 25.0, 33.0, 36.0, 53.0, 61.0, 74.0, 72.0, 81.0, 94.0, 71.0, 76.0, 44.0, 54.0, 28.0, 27.0, 26.0, 15.0, 9.0, 9.0, 8.0, 7.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01110076904296875, -0.010815560817718506, -0.010530352592468262, -0.010245144367218018, -0.009959936141967773, -0.00967472791671753, -0.009389519691467285, -0.009104311466217041, -0.008819103240966797, -0.008533895015716553, -0.008248686790466309, -0.007963478565216064, -0.00767827033996582, -0.007393062114715576, -0.007107853889465332, -0.006822645664215088, -0.006537437438964844, -0.0062522292137146, -0.0059670209884643555, -0.005681812763214111, -0.005396604537963867, -0.005111396312713623, -0.004826188087463379, -0.004540979862213135, -0.004255771636962891, -0.0039705634117126465, -0.0036853551864624023, -0.003400146961212158, -0.003114938735961914, -0.00282973051071167, -0.0025445222854614258, -0.0022593140602111816, -0.0019741058349609375, -0.0016888976097106934, -0.0014036893844604492, -0.001118481159210205, -0.0008332729339599609, -0.0005480647087097168, -0.00026285648345947266, 2.2351741790771484e-05, 0.0003075599670410156, 0.0005927681922912598, 0.0008779764175415039, 0.001163184642791748, 0.0014483928680419922, 0.0017336010932922363, 0.0020188093185424805, 0.0023040175437927246, 0.0025892257690429688, 0.002874433994293213, 0.003159642219543457, 0.003444850444793701, 0.0037300586700439453, 0.0040152668952941895, 0.004300475120544434, 0.004585683345794678, 0.004870891571044922, 0.005156099796295166, 0.00544130802154541, 0.005726516246795654, 0.0060117244720458984, 0.006296932697296143, 0.006582140922546387, 0.006867349147796631, 0.007152557373046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 9.0, 25.0, 38.0, 82.0, 141.0, 243.0, 581.0, 1483.0, 4299.0, 16100.0, 77608.0, 567917.0, 306886.0, 55340.0, 12047.0, 3483.0, 1236.0, 516.0, 239.0, 118.0, 57.0, 32.0, 23.0, 14.0, 6.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.125, -27.0390625, -25.953125, -24.8671875, -23.78125, -22.6953125, -21.609375, -20.5234375, -19.4375, -18.3515625, -17.265625, -16.1796875, -15.09375, -14.0078125, -12.921875, -11.8359375, -10.75, -9.6640625, -8.578125, -7.4921875, -6.40625, -5.3203125, -4.234375, -3.1484375, -2.0625, -0.9765625, 0.109375, 1.1953125, 2.28125, 3.3671875, 4.453125, 5.5390625, 6.625, 7.7109375, 8.796875, 9.8828125, 10.96875, 12.0546875, 13.140625, 14.2265625, 15.3125, 16.3984375, 17.484375, 18.5703125, 19.65625, 20.7421875, 21.828125, 22.9140625, 24.0, 25.0859375, 26.171875, 27.2578125, 28.34375, 29.4296875, 30.515625, 31.6015625, 32.6875, 33.7734375, 34.859375, 35.9453125, 37.03125, 38.1171875, 39.203125, 40.2890625, 41.375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 13.0, 13.0, 18.0, 28.0, 35.0, 42.0, 61.0, 65.0, 80.0, 70.0, 73.0, 96.0, 53.0, 76.0, 48.0, 50.0, 34.0, 39.0, 20.0, 23.0, 13.0, 7.0, 9.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-42.21875, -41.120361328125, -40.02197265625, -38.923583984375, -37.8251953125, -36.726806640625, -35.62841796875, -34.530029296875, -33.431640625, -32.333251953125, -31.23486328125, -30.136474609375, -29.0380859375, -27.939697265625, -26.84130859375, -25.742919921875, -24.64453125, -23.546142578125, -22.44775390625, -21.349365234375, -20.2509765625, -19.152587890625, -18.05419921875, -16.955810546875, -15.857421875, -14.759033203125, -13.66064453125, -12.562255859375, -11.4638671875, -10.365478515625, -9.26708984375, -8.168701171875, -7.0703125, -5.971923828125, -4.87353515625, -3.775146484375, -2.6767578125, -1.578369140625, -0.47998046875, 0.618408203125, 1.716796875, 2.815185546875, 3.91357421875, 5.011962890625, 6.1103515625, 7.208740234375, 8.30712890625, 9.405517578125, 10.50390625, 11.602294921875, 12.70068359375, 13.799072265625, 14.8974609375, 15.995849609375, 17.09423828125, 18.192626953125, 19.291015625, 20.389404296875, 21.48779296875, 22.586181640625, 23.6845703125, 24.782958984375, 25.88134765625, 26.979736328125, 28.078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 25.0, 56.0, 139.0, 359.0, 263.0, 79.0, 40.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1960.0020751953125, -1916.3197021484375, -1872.637451171875, -1828.955078125, -1785.272705078125, -1741.5904541015625, -1697.9080810546875, -1654.225830078125, -1610.54345703125, -1566.861083984375, -1523.1788330078125, -1479.4964599609375, -1435.8140869140625, -1392.1318359375, -1348.449462890625, -1304.76708984375, -1261.084716796875, -1217.40234375, -1173.7200927734375, -1130.0377197265625, -1086.3553466796875, -1042.673095703125, -998.99072265625, -955.3084106445312, -911.6260986328125, -867.9437866210938, -824.2614135742188, -780.5791015625, -736.8967895507812, -693.2144775390625, -649.5321044921875, -605.8497924804688, -562.16748046875, -518.4851684570312, -474.8028259277344, -431.1204833984375, -387.43817138671875, -343.7558288574219, -300.073486328125, -256.39117431640625, -212.70883178710938, -169.02650451660156, -125.34416961669922, -81.66183471679688, -37.97950744628906, 5.70281982421875, 49.385162353515625, 93.06747436523438, 136.74981689453125, 180.43214416503906, 224.11447143554688, 267.79681396484375, 311.4791259765625, 355.1614685058594, 398.84381103515625, 442.526123046875, 486.2084655761719, 529.8908081054688, 573.5731201171875, 617.2554931640625, 660.9378051757812, 704.6201171875, 748.302490234375, 791.9847412109375, 835.6671142578125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 4.0, 9.0, 4.0, 5.0, 13.0, 9.0, 16.0, 17.0, 12.0, 22.0, 24.0, 25.0, 25.0, 30.0, 37.0, 45.0, 50.0, 79.0, 71.0, 82.0, 48.0, 40.0, 38.0, 35.0, 24.0, 34.0, 17.0, 28.0, 22.0, 20.0, 17.0, 13.0, 8.0, 16.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-676.45458984375, -656.978515625, -637.5025024414062, -618.0264282226562, -598.5504150390625, -579.0743408203125, -559.5983276367188, -540.1222534179688, -520.646240234375, -501.1701965332031, -481.69415283203125, -462.2181091308594, -442.7420654296875, -423.2659912109375, -403.7899475097656, -384.31390380859375, -364.83782958984375, -345.3617858886719, -325.8857421875, -306.4096984863281, -286.93365478515625, -267.45758056640625, -247.98153686523438, -228.5054931640625, -209.02944946289062, -189.55340576171875, -170.07736206054688, -150.60130310058594, -131.12525939941406, -111.64921569824219, -92.17316436767578, -72.69711303710938, -53.2210693359375, -33.74502182006836, -14.268974304199219, 5.207073211669922, 24.683120727539062, 44.15916442871094, 63.635215759277344, 83.11126708984375, 102.58731079101562, 122.0633544921875, 141.53939819335938, 161.0154571533203, 180.4915008544922, 199.96754455566406, 219.443603515625, 238.91964721679688, 258.39569091796875, 277.8717346191406, 297.3477783203125, 316.8238220214844, 336.29986572265625, 355.77593994140625, 375.2519836425781, 394.72802734375, 414.2040710449219, 433.68011474609375, 453.1561584472656, 472.6322021484375, 492.1082763671875, 511.58428955078125, 531.0603637695312, 550.536376953125, 570.012451171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 4.0, 8.0, 8.0, 16.0, 17.0, 18.0, 25.0, 35.0, 40.0, 75.0, 140.0, 292.0, 961.0, 3287.0, 16414.0, 305575.0, 3542003.0, 303306.0, 16907.0, 3377.0, 988.0, 350.0, 147.0, 59.0, 47.0, 32.0, 28.0, 21.0, 14.0, 9.0, 18.0, 13.0, 6.0, 3.0, 8.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.5625, -105.1162109375, -101.669921875, -98.2236328125, -94.77734375, -91.3310546875, -87.884765625, -84.4384765625, -80.9921875, -77.5458984375, -74.099609375, -70.6533203125, -67.20703125, -63.7607421875, -60.314453125, -56.8681640625, -53.421875, -49.9755859375, -46.529296875, -43.0830078125, -39.63671875, -36.1904296875, -32.744140625, -29.2978515625, -25.8515625, -22.4052734375, -18.958984375, -15.5126953125, -12.06640625, -8.6201171875, -5.173828125, -1.7275390625, 1.71875, 5.1650390625, 8.611328125, 12.0576171875, 15.50390625, 18.9501953125, 22.396484375, 25.8427734375, 29.2890625, 32.7353515625, 36.181640625, 39.6279296875, 43.07421875, 46.5205078125, 49.966796875, 53.4130859375, 56.859375, 60.3056640625, 63.751953125, 67.1982421875, 70.64453125, 74.0908203125, 77.537109375, 80.9833984375, 84.4296875, 87.8759765625, 91.322265625, 94.7685546875, 98.21484375, 101.6611328125, 105.107421875, 108.5537109375, 112.0]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 0.0, 4.0, 7.0, 6.0, 4.0, 9.0, 10.0, 11.0, 6.0, 16.0, 12.0, 15.0, 19.0, 24.0, 29.0, 39.0, 44.0, 42.0, 46.0, 52.0, 49.0, 33.0, 40.0, 53.0, 51.0, 41.0, 32.0, 47.0, 34.0, 39.0, 32.0, 25.0, 19.0, 24.0, 10.0, 14.0, 16.0, 13.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.51806640625, -38.2548828125, -36.99169921875, -35.728515625, -34.46533203125, -33.2021484375, -31.93896484375, -30.67578125, -29.41259765625, -28.1494140625, -26.88623046875, -25.623046875, -24.35986328125, -23.0966796875, -21.83349609375, -20.5703125, -19.30712890625, -18.0439453125, -16.78076171875, -15.517578125, -14.25439453125, -12.9912109375, -11.72802734375, -10.46484375, -9.20166015625, -7.9384765625, -6.67529296875, -5.412109375, -4.14892578125, -2.8857421875, -1.62255859375, -0.359375, 0.90380859375, 2.1669921875, 3.43017578125, 4.693359375, 5.95654296875, 7.2197265625, 8.48291015625, 9.74609375, 11.00927734375, 12.2724609375, 13.53564453125, 14.798828125, 16.06201171875, 17.3251953125, 18.58837890625, 19.8515625, 21.11474609375, 22.3779296875, 23.64111328125, 24.904296875, 26.16748046875, 27.4306640625, 28.69384765625, 29.95703125, 31.22021484375, 32.4833984375, 33.74658203125, 35.009765625, 36.27294921875, 37.5361328125, 38.79931640625, 40.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 12.0, 16.0, 68.0, 110.0, 256.0, 855.0, 13677.0, 4151282.0, 26451.0, 1022.0, 281.0, 128.0, 55.0, 37.0, 19.0, 14.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-430.25, -416.17578125, -402.1015625, -388.02734375, -373.953125, -359.87890625, -345.8046875, -331.73046875, -317.65625, -303.58203125, -289.5078125, -275.43359375, -261.359375, -247.28515625, -233.2109375, -219.13671875, -205.0625, -190.98828125, -176.9140625, -162.83984375, -148.765625, -134.69140625, -120.6171875, -106.54296875, -92.46875, -78.39453125, -64.3203125, -50.24609375, -36.171875, -22.09765625, -8.0234375, 6.05078125, 20.125, 34.19921875, 48.2734375, 62.34765625, 76.421875, 90.49609375, 104.5703125, 118.64453125, 132.71875, 146.79296875, 160.8671875, 174.94140625, 189.015625, 203.08984375, 217.1640625, 231.23828125, 245.3125, 259.38671875, 273.4609375, 287.53515625, 301.609375, 315.68359375, 329.7578125, 343.83203125, 357.90625, 371.98046875, 386.0546875, 400.12890625, 414.203125, 428.27734375, 442.3515625, 456.42578125, 470.5]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 12.0, 29.0, 47.0, 99.0, 396.0, 1714.0, 1348.0, 284.0, 81.0, 35.0, 13.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.25, -254.7265625, -246.203125, -237.6796875, -229.15625, -220.6328125, -212.109375, -203.5859375, -195.0625, -186.5390625, -178.015625, -169.4921875, -160.96875, -152.4453125, -143.921875, -135.3984375, -126.875, -118.3515625, -109.828125, -101.3046875, -92.78125, -84.2578125, -75.734375, -67.2109375, -58.6875, -50.1640625, -41.640625, -33.1171875, -24.59375, -16.0703125, -7.546875, 0.9765625, 9.5, 18.0234375, 26.546875, 35.0703125, 43.59375, 52.1171875, 60.640625, 69.1640625, 77.6875, 86.2109375, 94.734375, 103.2578125, 111.78125, 120.3046875, 128.828125, 137.3515625, 145.875, 154.3984375, 162.921875, 171.4453125, 179.96875, 188.4921875, 197.015625, 205.5390625, 214.0625, 222.5859375, 231.109375, 239.6328125, 248.15625, 256.6796875, 265.203125, 273.7265625, 282.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 17.0, 19.0, 15.0, 41.0, 43.0, 80.0, 132.0, 179.0, 143.0, 113.0, 99.0, 37.0, 29.0, 14.0, 12.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-973.7903442382812, -947.4930419921875, -921.1957397460938, -894.8983764648438, -868.60107421875, -842.3037719726562, -816.0064697265625, -789.7091064453125, -763.4118041992188, -737.114501953125, -710.8171997070312, -684.5198364257812, -658.2225341796875, -631.9252319335938, -605.6279296875, -579.33056640625, -553.0333251953125, -526.7360229492188, -500.4386901855469, -474.1413879394531, -447.84405517578125, -421.5467529296875, -395.24945068359375, -368.9521179199219, -342.65478515625, -316.35748291015625, -290.0601501464844, -263.7628479003906, -237.46551513671875, -211.168212890625, -184.8708953857422, -158.57357788085938, -132.2762451171875, -105.97892761230469, -79.68161010742188, -53.384300231933594, -27.08698272705078, -0.7896728515625, 25.507644653320312, 51.804962158203125, 78.10227966308594, 104.39959716796875, 130.69691467285156, 156.99423217773438, 183.29153442382812, 209.58885192871094, 235.88616943359375, 262.1834716796875, 288.4808044433594, 314.7781066894531, 341.075439453125, 367.37274169921875, 393.6700744628906, 419.9673767089844, 446.26470947265625, 472.56201171875, 498.85931396484375, 525.1566162109375, 551.4539184570312, 577.7512817382812, 604.048583984375, 630.3458862304688, 656.6431884765625, 682.9405517578125, 709.2378540039062]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 9.0, 9.0, 14.0, 17.0, 11.0, 27.0, 30.0, 29.0, 26.0, 33.0, 33.0, 28.0, 34.0, 32.0, 49.0, 47.0, 42.0, 41.0, 44.0, 31.0, 42.0, 32.0, 35.0, 34.0, 16.0, 29.0, 24.0, 17.0, 17.0, 20.0, 17.0, 22.0, 9.0, 16.0, 9.0, 3.0, 12.0, 7.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-434.8672180175781, -421.15618896484375, -407.44512939453125, -393.73406982421875, -380.0230407714844, -366.31201171875, -352.6009521484375, -338.889892578125, -325.1788635253906, -311.46783447265625, -297.75677490234375, -284.04571533203125, -270.3346862792969, -256.6236572265625, -242.91259765625, -229.20155334472656, -215.49050903320312, -201.7794647216797, -188.06842041015625, -174.3573760986328, -160.64633178710938, -146.93528747558594, -133.2242431640625, -119.51319885253906, -105.80215454101562, -92.09111022949219, -78.38006591796875, -64.66902160644531, -50.957977294921875, -37.24693298339844, -23.535888671875, -9.824844360351562, 3.88623046875, 17.597274780273438, 31.308319091796875, 45.01936340332031, 58.73040771484375, 72.44145202636719, 86.15249633789062, 99.86354064941406, 113.5745849609375, 127.28562927246094, 140.99667358398438, 154.7077178955078, 168.41876220703125, 182.1298065185547, 195.84085083007812, 209.55189514160156, 223.262939453125, 236.97398376464844, 250.68502807617188, 264.39605712890625, 278.10711669921875, 291.81817626953125, 305.5292053222656, 319.240234375, 332.9512939453125, 346.662353515625, 360.3733825683594, 374.08441162109375, 387.79547119140625, 401.50653076171875, 415.2175598144531, 428.9285888671875, 442.6396484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 12.0, 18.0, 39.0, 44.0, 75.0, 81.0, 129.0, 229.0, 304.0, 489.0, 780.0, 1186.0, 2012.0, 3341.0, 5522.0, 9790.0, 17678.0, 32318.0, 63723.0, 126578.0, 251100.0, 258932.0, 132386.0, 65143.0, 33902.0, 18071.0, 10081.0, 5697.0, 3385.0, 1981.0, 1295.0, 723.0, 512.0, 324.0, 213.0, 149.0, 78.0, 67.0, 49.0, 29.0, 23.0, 17.0, 15.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.71875, -39.48583984375, -38.2529296875, -37.02001953125, -35.787109375, -34.55419921875, -33.3212890625, -32.08837890625, -30.85546875, -29.62255859375, -28.3896484375, -27.15673828125, -25.923828125, -24.69091796875, -23.4580078125, -22.22509765625, -20.9921875, -19.75927734375, -18.5263671875, -17.29345703125, -16.060546875, -14.82763671875, -13.5947265625, -12.36181640625, -11.12890625, -9.89599609375, -8.6630859375, -7.43017578125, -6.197265625, -4.96435546875, -3.7314453125, -2.49853515625, -1.265625, -0.03271484375, 1.2001953125, 2.43310546875, 3.666015625, 4.89892578125, 6.1318359375, 7.36474609375, 8.59765625, 9.83056640625, 11.0634765625, 12.29638671875, 13.529296875, 14.76220703125, 15.9951171875, 17.22802734375, 18.4609375, 19.69384765625, 20.9267578125, 22.15966796875, 23.392578125, 24.62548828125, 25.8583984375, 27.09130859375, 28.32421875, 29.55712890625, 30.7900390625, 32.02294921875, 33.255859375, 34.48876953125, 35.7216796875, 36.95458984375, 38.1875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 3.0, 8.0, 3.0, 9.0, 10.0, 13.0, 9.0, 18.0, 19.0, 24.0, 33.0, 46.0, 39.0, 43.0, 43.0, 59.0, 70.0, 60.0, 34.0, 46.0, 47.0, 48.0, 44.0, 42.0, 44.0, 23.0, 35.0, 22.0, 20.0, 23.0, 15.0, 12.0, 11.0, 5.0, 4.0, 7.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.34375, -51.77734375, -50.2109375, -48.64453125, -47.078125, -45.51171875, -43.9453125, -42.37890625, -40.8125, -39.24609375, -37.6796875, -36.11328125, -34.546875, -32.98046875, -31.4140625, -29.84765625, -28.28125, -26.71484375, -25.1484375, -23.58203125, -22.015625, -20.44921875, -18.8828125, -17.31640625, -15.75, -14.18359375, -12.6171875, -11.05078125, -9.484375, -7.91796875, -6.3515625, -4.78515625, -3.21875, -1.65234375, -0.0859375, 1.48046875, 3.046875, 4.61328125, 6.1796875, 7.74609375, 9.3125, 10.87890625, 12.4453125, 14.01171875, 15.578125, 17.14453125, 18.7109375, 20.27734375, 21.84375, 23.41015625, 24.9765625, 26.54296875, 28.109375, 29.67578125, 31.2421875, 32.80859375, 34.375, 35.94140625, 37.5078125, 39.07421875, 40.640625, 42.20703125, 43.7734375, 45.33984375, 46.90625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 5.0, 12.0, 6.0, 13.0, 23.0, 39.0, 36.0, 80.0, 89.0, 161.0, 250.0, 583.0, 1471.0, 5413.0, 27802.0, 334125.0, 635496.0, 33660.0, 6214.0, 1670.0, 606.0, 305.0, 148.0, 92.0, 62.0, 53.0, 34.0, 31.0, 13.0, 13.0, 12.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-135.375, -129.970703125, -124.56640625, -119.162109375, -113.7578125, -108.353515625, -102.94921875, -97.544921875, -92.140625, -86.736328125, -81.33203125, -75.927734375, -70.5234375, -65.119140625, -59.71484375, -54.310546875, -48.90625, -43.501953125, -38.09765625, -32.693359375, -27.2890625, -21.884765625, -16.48046875, -11.076171875, -5.671875, -0.267578125, 5.13671875, 10.541015625, 15.9453125, 21.349609375, 26.75390625, 32.158203125, 37.5625, 42.966796875, 48.37109375, 53.775390625, 59.1796875, 64.583984375, 69.98828125, 75.392578125, 80.796875, 86.201171875, 91.60546875, 97.009765625, 102.4140625, 107.818359375, 113.22265625, 118.626953125, 124.03125, 129.435546875, 134.83984375, 140.244140625, 145.6484375, 151.052734375, 156.45703125, 161.861328125, 167.265625, 172.669921875, 178.07421875, 183.478515625, 188.8828125, 194.287109375, 199.69140625, 205.095703125, 210.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 15.0, 13.0, 13.0, 13.0, 24.0, 26.0, 24.0, 50.0, 50.0, 66.0, 67.0, 88.0, 77.0, 89.0, 91.0, 62.0, 44.0, 45.0, 28.0, 28.0, 21.0, 10.0, 9.0, 13.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.625, -192.599609375, -183.57421875, -174.548828125, -165.5234375, -156.498046875, -147.47265625, -138.447265625, -129.421875, -120.396484375, -111.37109375, -102.345703125, -93.3203125, -84.294921875, -75.26953125, -66.244140625, -57.21875, -48.193359375, -39.16796875, -30.142578125, -21.1171875, -12.091796875, -3.06640625, 5.958984375, 14.984375, 24.009765625, 33.03515625, 42.060546875, 51.0859375, 60.111328125, 69.13671875, 78.162109375, 87.1875, 96.212890625, 105.23828125, 114.263671875, 123.2890625, 132.314453125, 141.33984375, 150.365234375, 159.390625, 168.416015625, 177.44140625, 186.466796875, 195.4921875, 204.517578125, 213.54296875, 222.568359375, 231.59375, 240.619140625, 249.64453125, 258.669921875, 267.6953125, 276.720703125, 285.74609375, 294.771484375, 303.796875, 312.822265625, 321.84765625, 330.873046875, 339.8984375, 348.923828125, 357.94921875, 366.974609375, 376.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 11.0, 13.0, 14.0, 20.0, 32.0, 39.0, 62.0, 121.0, 214.0, 341.0, 627.0, 1413.0, 3518.0, 10588.0, 41838.0, 304161.0, 612761.0, 52904.0, 12517.0, 4137.0, 1586.0, 690.0, 382.0, 196.0, 108.0, 74.0, 58.0, 29.0, 15.0, 23.0, 13.0, 14.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.8125, -31.6435546875, -30.474609375, -29.3056640625, -28.13671875, -26.9677734375, -25.798828125, -24.6298828125, -23.4609375, -22.2919921875, -21.123046875, -19.9541015625, -18.78515625, -17.6162109375, -16.447265625, -15.2783203125, -14.109375, -12.9404296875, -11.771484375, -10.6025390625, -9.43359375, -8.2646484375, -7.095703125, -5.9267578125, -4.7578125, -3.5888671875, -2.419921875, -1.2509765625, -0.08203125, 1.0869140625, 2.255859375, 3.4248046875, 4.59375, 5.7626953125, 6.931640625, 8.1005859375, 9.26953125, 10.4384765625, 11.607421875, 12.7763671875, 13.9453125, 15.1142578125, 16.283203125, 17.4521484375, 18.62109375, 19.7900390625, 20.958984375, 22.1279296875, 23.296875, 24.4658203125, 25.634765625, 26.8037109375, 27.97265625, 29.1416015625, 30.310546875, 31.4794921875, 32.6484375, 33.8173828125, 34.986328125, 36.1552734375, 37.32421875, 38.4931640625, 39.662109375, 40.8310546875, 42.0]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 15.0, 24.0, 26.0, 15.0, 44.0, 47.0, 74.0, 105.0, 135.0, 132.0, 97.0, 71.0, 60.0, 32.0, 19.0, 27.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.01139974594116211, -0.011004447937011719, -0.010609149932861328, -0.010213851928710938, -0.009818553924560547, -0.009423255920410156, -0.009027957916259766, -0.008632659912109375, -0.008237361907958984, -0.007842063903808594, -0.007446765899658203, -0.0070514678955078125, -0.006656169891357422, -0.006260871887207031, -0.005865573883056641, -0.00547027587890625, -0.005074977874755859, -0.004679679870605469, -0.004284381866455078, -0.0038890838623046875, -0.003493785858154297, -0.0030984878540039062, -0.0027031898498535156, -0.002307891845703125, -0.0019125938415527344, -0.0015172958374023438, -0.0011219978332519531, -0.0007266998291015625, -0.0003314018249511719, 6.389617919921875e-05, 0.0004591941833496094, 0.0008544921875, 0.0012497901916503906, 0.0016450881958007812, 0.002040386199951172, 0.0024356842041015625, 0.002830982208251953, 0.0032262802124023438, 0.0036215782165527344, 0.004016876220703125, 0.004412174224853516, 0.004807472229003906, 0.005202770233154297, 0.0055980682373046875, 0.005993366241455078, 0.006388664245605469, 0.006783962249755859, 0.00717926025390625, 0.007574558258056641, 0.007969856262207031, 0.008365154266357422, 0.008760452270507812, 0.009155750274658203, 0.009551048278808594, 0.009946346282958984, 0.010341644287109375, 0.010736942291259766, 0.011132240295410156, 0.011527538299560547, 0.011922836303710938, 0.012318134307861328, 0.012713432312011719, 0.01310873031616211, 0.0135040283203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 1.0, 2.0, 12.0, 6.0, 15.0, 26.0, 28.0, 28.0, 63.0, 93.0, 166.0, 300.0, 635.0, 1521.0, 4640.0, 18892.0, 126188.0, 789077.0, 85903.0, 14515.0, 3888.0, 1334.0, 538.0, 265.0, 164.0, 93.0, 54.0, 29.0, 24.0, 25.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.34375, -46.89697265625, -45.4501953125, -44.00341796875, -42.556640625, -41.10986328125, -39.6630859375, -38.21630859375, -36.76953125, -35.32275390625, -33.8759765625, -32.42919921875, -30.982421875, -29.53564453125, -28.0888671875, -26.64208984375, -25.1953125, -23.74853515625, -22.3017578125, -20.85498046875, -19.408203125, -17.96142578125, -16.5146484375, -15.06787109375, -13.62109375, -12.17431640625, -10.7275390625, -9.28076171875, -7.833984375, -6.38720703125, -4.9404296875, -3.49365234375, -2.046875, -0.60009765625, 0.8466796875, 2.29345703125, 3.740234375, 5.18701171875, 6.6337890625, 8.08056640625, 9.52734375, 10.97412109375, 12.4208984375, 13.86767578125, 15.314453125, 16.76123046875, 18.2080078125, 19.65478515625, 21.1015625, 22.54833984375, 23.9951171875, 25.44189453125, 26.888671875, 28.33544921875, 29.7822265625, 31.22900390625, 32.67578125, 34.12255859375, 35.5693359375, 37.01611328125, 38.462890625, 39.90966796875, 41.3564453125, 42.80322265625, 44.25]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 7.0, 14.0, 17.0, 40.0, 59.0, 81.0, 122.0, 143.0, 127.0, 110.0, 81.0, 48.0, 26.0, 32.0, 13.0, 17.0, 11.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.09375, -61.37841796875, -59.6630859375, -57.94775390625, -56.232421875, -54.51708984375, -52.8017578125, -51.08642578125, -49.37109375, -47.65576171875, -45.9404296875, -44.22509765625, -42.509765625, -40.79443359375, -39.0791015625, -37.36376953125, -35.6484375, -33.93310546875, -32.2177734375, -30.50244140625, -28.787109375, -27.07177734375, -25.3564453125, -23.64111328125, -21.92578125, -20.21044921875, -18.4951171875, -16.77978515625, -15.064453125, -13.34912109375, -11.6337890625, -9.91845703125, -8.203125, -6.48779296875, -4.7724609375, -3.05712890625, -1.341796875, 0.37353515625, 2.0888671875, 3.80419921875, 5.51953125, 7.23486328125, 8.9501953125, 10.66552734375, 12.380859375, 14.09619140625, 15.8115234375, 17.52685546875, 19.2421875, 20.95751953125, 22.6728515625, 24.38818359375, 26.103515625, 27.81884765625, 29.5341796875, 31.24951171875, 32.96484375, 34.68017578125, 36.3955078125, 38.11083984375, 39.826171875, 41.54150390625, 43.2568359375, 44.97216796875, 46.6875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 16.0, 34.0, 122.0, 327.0, 355.0, 95.0, 28.0, 15.0, 8.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2877.7158203125, -2820.189453125, -2762.663330078125, -2705.136962890625, -2647.61083984375, -2590.08447265625, -2532.55810546875, -2475.031982421875, -2417.505615234375, -2359.979248046875, -2302.453125, -2244.9267578125, -2187.400634765625, -2129.874267578125, -2072.34814453125, -2014.82177734375, -1957.295654296875, -1899.7694091796875, -1842.2431640625, -1784.716796875, -1727.1905517578125, -1669.664306640625, -1612.1380615234375, -1554.61181640625, -1497.08544921875, -1439.5592041015625, -1382.032958984375, -1324.506591796875, -1266.9803466796875, -1209.4541015625, -1151.9278564453125, -1094.401611328125, -1036.87548828125, -979.3492431640625, -921.8229370117188, -864.2966918945312, -806.7704467773438, -749.244140625, -691.7178955078125, -634.191650390625, -576.665283203125, -519.1390380859375, -461.6127624511719, -404.08648681640625, -346.56024169921875, -289.0339660644531, -231.5076904296875, -173.9814453125, -116.4552001953125, -58.92893600463867, -1.4026718139648438, 56.12359619140625, 113.64985656738281, 171.17611694335938, 228.702392578125, 286.2286376953125, 343.7549133300781, 401.28118896484375, 458.80743408203125, 516.333740234375, 573.8599853515625, 631.38623046875, 688.9124755859375, 746.438720703125, 803.9650268554688]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 7.0, 10.0, 4.0, 5.0, 8.0, 10.0, 13.0, 10.0, 17.0, 28.0, 25.0, 24.0, 35.0, 44.0, 39.0, 57.0, 65.0, 84.0, 89.0, 61.0, 45.0, 28.0, 29.0, 28.0, 23.0, 22.0, 26.0, 21.0, 23.0, 6.0, 14.0, 18.0, 10.0, 10.0, 4.0, 10.0, 7.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-648.345947265625, -626.691162109375, -605.036376953125, -583.3815307617188, -561.7267456054688, -540.0719604492188, -518.4171752929688, -496.7623596191406, -475.1075439453125, -453.4527587890625, -431.7979431152344, -410.1431579589844, -388.48834228515625, -366.83355712890625, -345.17877197265625, -323.5239562988281, -301.8691711425781, -280.2143859863281, -258.5595703125, -236.90478515625, -215.24996948242188, -193.59518432617188, -171.9403839111328, -150.28558349609375, -128.6307830810547, -106.97598266601562, -85.32118225097656, -63.66638946533203, -42.01158905029297, -20.356788635253906, 1.298004150390625, 22.952804565429688, 44.60760498046875, 66.26240539550781, 87.91720581054688, 109.5719985961914, 131.226806640625, 152.881591796875, 174.53639221191406, 196.19119262695312, 217.8459930419922, 239.50079345703125, 261.15557861328125, 282.8103942871094, 304.4651794433594, 326.1199951171875, 347.7747802734375, 369.4295654296875, 391.0843811035156, 412.7391662597656, 434.39398193359375, 456.04876708984375, 477.7035827636719, 499.3583679199219, 521.01318359375, 542.66796875, 564.32275390625, 585.9775390625, 607.63232421875, 629.2871704101562, 650.9419555664062, 672.5967407226562, 694.2515258789062, 715.9063720703125, 737.5611572265625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 10.0, 8.0, 25.0, 28.0, 51.0, 66.0, 85.0, 132.0, 210.0, 365.0, 555.0, 950.0, 1709.0, 3113.0, 6487.0, 17084.0, 59253.0, 238813.0, 1040822.0, 2042804.0, 584813.0, 135691.0, 36909.0, 12663.0, 5464.0, 2679.0, 1407.0, 781.0, 483.0, 262.0, 193.0, 129.0, 78.0, 51.0, 29.0, 24.0, 17.0, 6.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.34375, -40.94677734375, -39.5498046875, -38.15283203125, -36.755859375, -35.35888671875, -33.9619140625, -32.56494140625, -31.16796875, -29.77099609375, -28.3740234375, -26.97705078125, -25.580078125, -24.18310546875, -22.7861328125, -21.38916015625, -19.9921875, -18.59521484375, -17.1982421875, -15.80126953125, -14.404296875, -13.00732421875, -11.6103515625, -10.21337890625, -8.81640625, -7.41943359375, -6.0224609375, -4.62548828125, -3.228515625, -1.83154296875, -0.4345703125, 0.96240234375, 2.359375, 3.75634765625, 5.1533203125, 6.55029296875, 7.947265625, 9.34423828125, 10.7412109375, 12.13818359375, 13.53515625, 14.93212890625, 16.3291015625, 17.72607421875, 19.123046875, 20.52001953125, 21.9169921875, 23.31396484375, 24.7109375, 26.10791015625, 27.5048828125, 28.90185546875, 30.298828125, 31.69580078125, 33.0927734375, 34.48974609375, 35.88671875, 37.28369140625, 38.6806640625, 40.07763671875, 41.474609375, 42.87158203125, 44.2685546875, 45.66552734375, 47.0625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 12.0, 17.0, 23.0, 23.0, 24.0, 29.0, 35.0, 33.0, 49.0, 69.0, 51.0, 57.0, 62.0, 46.0, 60.0, 54.0, 45.0, 39.0, 52.0, 32.0, 34.0, 26.0, 26.0, 15.0, 14.0, 10.0, 11.0, 5.0, 4.0, 5.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0], "bins": [-73.375, -71.57470703125, -69.7744140625, -67.97412109375, -66.173828125, -64.37353515625, -62.5732421875, -60.77294921875, -58.97265625, -57.17236328125, -55.3720703125, -53.57177734375, -51.771484375, -49.97119140625, -48.1708984375, -46.37060546875, -44.5703125, -42.77001953125, -40.9697265625, -39.16943359375, -37.369140625, -35.56884765625, -33.7685546875, -31.96826171875, -30.16796875, -28.36767578125, -26.5673828125, -24.76708984375, -22.966796875, -21.16650390625, -19.3662109375, -17.56591796875, -15.765625, -13.96533203125, -12.1650390625, -10.36474609375, -8.564453125, -6.76416015625, -4.9638671875, -3.16357421875, -1.36328125, 0.43701171875, 2.2373046875, 4.03759765625, 5.837890625, 7.63818359375, 9.4384765625, 11.23876953125, 13.0390625, 14.83935546875, 16.6396484375, 18.43994140625, 20.240234375, 22.04052734375, 23.8408203125, 25.64111328125, 27.44140625, 29.24169921875, 31.0419921875, 32.84228515625, 34.642578125, 36.44287109375, 38.2431640625, 40.04345703125, 41.84375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 9.0, 10.0, 13.0, 32.0, 41.0, 76.0, 114.0, 282.0, 916.0, 3407.0, 21011.0, 777702.0, 3343801.0, 39599.0, 5129.0, 1233.0, 413.0, 225.0, 98.0, 52.0, 38.0, 19.0, 15.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-183.75, -178.3671875, -172.984375, -167.6015625, -162.21875, -156.8359375, -151.453125, -146.0703125, -140.6875, -135.3046875, -129.921875, -124.5390625, -119.15625, -113.7734375, -108.390625, -103.0078125, -97.625, -92.2421875, -86.859375, -81.4765625, -76.09375, -70.7109375, -65.328125, -59.9453125, -54.5625, -49.1796875, -43.796875, -38.4140625, -33.03125, -27.6484375, -22.265625, -16.8828125, -11.5, -6.1171875, -0.734375, 4.6484375, 10.03125, 15.4140625, 20.796875, 26.1796875, 31.5625, 36.9453125, 42.328125, 47.7109375, 53.09375, 58.4765625, 63.859375, 69.2421875, 74.625, 80.0078125, 85.390625, 90.7734375, 96.15625, 101.5390625, 106.921875, 112.3046875, 117.6875, 123.0703125, 128.453125, 133.8359375, 139.21875, 144.6015625, 149.984375, 155.3671875, 160.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 6.0, 6.0, 10.0, 19.0, 13.0, 22.0, 20.0, 33.0, 62.0, 102.0, 176.0, 298.0, 557.0, 804.0, 730.0, 533.0, 287.0, 148.0, 69.0, 55.0, 37.0, 24.0, 14.0, 9.0, 13.0, 5.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.3125, -101.9169921875, -98.521484375, -95.1259765625, -91.73046875, -88.3349609375, -84.939453125, -81.5439453125, -78.1484375, -74.7529296875, -71.357421875, -67.9619140625, -64.56640625, -61.1708984375, -57.775390625, -54.3798828125, -50.984375, -47.5888671875, -44.193359375, -40.7978515625, -37.40234375, -34.0068359375, -30.611328125, -27.2158203125, -23.8203125, -20.4248046875, -17.029296875, -13.6337890625, -10.23828125, -6.8427734375, -3.447265625, -0.0517578125, 3.34375, 6.7392578125, 10.134765625, 13.5302734375, 16.92578125, 20.3212890625, 23.716796875, 27.1123046875, 30.5078125, 33.9033203125, 37.298828125, 40.6943359375, 44.08984375, 47.4853515625, 50.880859375, 54.2763671875, 57.671875, 61.0673828125, 64.462890625, 67.8583984375, 71.25390625, 74.6494140625, 78.044921875, 81.4404296875, 84.8359375, 88.2314453125, 91.626953125, 95.0224609375, 98.41796875, 101.8134765625, 105.208984375, 108.6044921875, 112.0]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 19.0, 30.0, 55.0, 109.0, 190.0, 241.0, 157.0, 100.0, 45.0, 19.0, 7.0, 2.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-859.0454711914062, -828.9410400390625, -798.8365478515625, -768.7321166992188, -738.627685546875, -708.523193359375, -678.4187622070312, -648.3143310546875, -618.2098388671875, -588.1054077148438, -558.0009155273438, -527.896484375, -497.79205322265625, -467.6875915527344, -437.5831298828125, -407.47869873046875, -377.374267578125, -347.2698059082031, -317.1653747558594, -287.0609130859375, -256.95648193359375, -226.85202026367188, -196.74755859375, -166.6431121826172, -136.53866577148438, -106.43421936035156, -76.32976531982422, -46.225311279296875, -16.120864868164062, 13.98358154296875, 44.088043212890625, 74.19248962402344, 104.2969970703125, 134.4014434814453, 164.50588989257812, 194.6103515625, 224.7147979736328, 254.81924438476562, 284.9237060546875, 315.02813720703125, 345.1325988769531, 375.237060546875, 405.34149169921875, 435.4459533691406, 465.5504150390625, 495.65484619140625, 525.75927734375, 555.86376953125, 585.9682006835938, 616.0726318359375, 646.1771240234375, 676.2815551757812, 706.385986328125, 736.490478515625, 766.5949096679688, 796.6993408203125, 826.8038330078125, 856.9082641601562, 887.0127563476562, 917.1171875, 947.2216186523438, 977.3260498046875, 1007.4305419921875, 1037.5350341796875, 1067.639404296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 5.0, 8.0, 15.0, 24.0, 16.0, 18.0, 31.0, 33.0, 50.0, 37.0, 42.0, 48.0, 53.0, 48.0, 49.0, 53.0, 50.0, 48.0, 43.0, 65.0, 35.0, 44.0, 38.0, 28.0, 23.0, 17.0, 19.0, 15.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-440.7887268066406, -425.0470886230469, -409.3054504394531, -393.5638122558594, -377.8221740722656, -362.0805358886719, -346.3388671875, -330.59722900390625, -314.8555908203125, -299.11395263671875, -283.372314453125, -267.63067626953125, -251.8890380859375, -236.14739990234375, -220.40574645996094, -204.6641082763672, -188.9224853515625, -173.18084716796875, -157.439208984375, -141.69757080078125, -125.95592498779297, -110.21428680419922, -94.47264099121094, -78.73100280761719, -62.98936462402344, -47.24772644042969, -31.506084442138672, -15.764442443847656, -0.02280426025390625, 15.718833923339844, 31.460479736328125, 47.202117919921875, 62.94378662109375, 78.6854248046875, 94.42706298828125, 110.16870880126953, 125.91034698486328, 141.6519775390625, 157.3936309814453, 173.13526916503906, 188.8769073486328, 204.61854553222656, 220.3601837158203, 236.10183715820312, 251.84347534179688, 267.5851135253906, 283.3267517089844, 299.0683898925781, 314.8100280761719, 330.5516662597656, 346.2933044433594, 362.0349426269531, 377.7765808105469, 393.5182189941406, 409.2598876953125, 425.00152587890625, 440.7431640625, 456.48480224609375, 472.2264404296875, 487.96807861328125, 503.709716796875, 519.4513549804688, 535.1929931640625, 550.9346313476562, 566.67626953125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 27.0, 36.0, 58.0, 78.0, 138.0, 187.0, 306.0, 449.0, 800.0, 1376.0, 2526.0, 4567.0, 9098.0, 18610.0, 42402.0, 103074.0, 271164.0, 348178.0, 140545.0, 56135.0, 24609.0, 11449.0, 5588.0, 3022.0, 1602.0, 954.0, 560.0, 349.0, 240.0, 142.0, 86.0, 66.0, 50.0, 22.0, 19.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.75, -56.978515625, -55.20703125, -53.435546875, -51.6640625, -49.892578125, -48.12109375, -46.349609375, -44.578125, -42.806640625, -41.03515625, -39.263671875, -37.4921875, -35.720703125, -33.94921875, -32.177734375, -30.40625, -28.634765625, -26.86328125, -25.091796875, -23.3203125, -21.548828125, -19.77734375, -18.005859375, -16.234375, -14.462890625, -12.69140625, -10.919921875, -9.1484375, -7.376953125, -5.60546875, -3.833984375, -2.0625, -0.291015625, 1.48046875, 3.251953125, 5.0234375, 6.794921875, 8.56640625, 10.337890625, 12.109375, 13.880859375, 15.65234375, 17.423828125, 19.1953125, 20.966796875, 22.73828125, 24.509765625, 26.28125, 28.052734375, 29.82421875, 31.595703125, 33.3671875, 35.138671875, 36.91015625, 38.681640625, 40.453125, 42.224609375, 43.99609375, 45.767578125, 47.5390625, 49.310546875, 51.08203125, 52.853515625, 54.625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 11.0, 10.0, 10.0, 18.0, 19.0, 19.0, 18.0, 21.0, 32.0, 24.0, 37.0, 37.0, 55.0, 55.0, 57.0, 45.0, 55.0, 58.0, 48.0, 44.0, 45.0, 49.0, 38.0, 24.0, 28.0, 29.0, 23.0, 17.0, 11.0, 16.0, 10.0, 12.0, 7.0, 4.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0], "bins": [-68.6875, -66.98583984375, -65.2841796875, -63.58251953125, -61.880859375, -60.17919921875, -58.4775390625, -56.77587890625, -55.07421875, -53.37255859375, -51.6708984375, -49.96923828125, -48.267578125, -46.56591796875, -44.8642578125, -43.16259765625, -41.4609375, -39.75927734375, -38.0576171875, -36.35595703125, -34.654296875, -32.95263671875, -31.2509765625, -29.54931640625, -27.84765625, -26.14599609375, -24.4443359375, -22.74267578125, -21.041015625, -19.33935546875, -17.6376953125, -15.93603515625, -14.234375, -12.53271484375, -10.8310546875, -9.12939453125, -7.427734375, -5.72607421875, -4.0244140625, -2.32275390625, -0.62109375, 1.08056640625, 2.7822265625, 4.48388671875, 6.185546875, 7.88720703125, 9.5888671875, 11.29052734375, 12.9921875, 14.69384765625, 16.3955078125, 18.09716796875, 19.798828125, 21.50048828125, 23.2021484375, 24.90380859375, 26.60546875, 28.30712890625, 30.0087890625, 31.71044921875, 33.412109375, 35.11376953125, 36.8154296875, 38.51708984375, 40.21875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 12.0, 22.0, 23.0, 32.0, 47.0, 85.0, 132.0, 194.0, 368.0, 804.0, 2162.0, 9157.0, 91163.0, 880387.0, 53946.0, 6795.0, 1668.0, 646.0, 349.0, 179.0, 118.0, 60.0, 42.0, 41.0, 19.0, 26.0, 14.0, 13.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.625, -163.435546875, -157.24609375, -151.056640625, -144.8671875, -138.677734375, -132.48828125, -126.298828125, -120.109375, -113.919921875, -107.73046875, -101.541015625, -95.3515625, -89.162109375, -82.97265625, -76.783203125, -70.59375, -64.404296875, -58.21484375, -52.025390625, -45.8359375, -39.646484375, -33.45703125, -27.267578125, -21.078125, -14.888671875, -8.69921875, -2.509765625, 3.6796875, 9.869140625, 16.05859375, 22.248046875, 28.4375, 34.626953125, 40.81640625, 47.005859375, 53.1953125, 59.384765625, 65.57421875, 71.763671875, 77.953125, 84.142578125, 90.33203125, 96.521484375, 102.7109375, 108.900390625, 115.08984375, 121.279296875, 127.46875, 133.658203125, 139.84765625, 146.037109375, 152.2265625, 158.416015625, 164.60546875, 170.794921875, 176.984375, 183.173828125, 189.36328125, 195.552734375, 201.7421875, 207.931640625, 214.12109375, 220.310546875, 226.5]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 11.0, 23.0, 19.0, 29.0, 23.0, 27.0, 35.0, 41.0, 34.0, 64.0, 52.0, 71.0, 83.0, 64.0, 76.0, 53.0, 45.0, 47.0, 37.0, 32.0, 31.0, 16.0, 20.0, 11.0, 8.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-241.5, -234.46875, -227.4375, -220.40625, -213.375, -206.34375, -199.3125, -192.28125, -185.25, -178.21875, -171.1875, -164.15625, -157.125, -150.09375, -143.0625, -136.03125, -129.0, -121.96875, -114.9375, -107.90625, -100.875, -93.84375, -86.8125, -79.78125, -72.75, -65.71875, -58.6875, -51.65625, -44.625, -37.59375, -30.5625, -23.53125, -16.5, -9.46875, -2.4375, 4.59375, 11.625, 18.65625, 25.6875, 32.71875, 39.75, 46.78125, 53.8125, 60.84375, 67.875, 74.90625, 81.9375, 88.96875, 96.0, 103.03125, 110.0625, 117.09375, 124.125, 131.15625, 138.1875, 145.21875, 152.25, 159.28125, 166.3125, 173.34375, 180.375, 187.40625, 194.4375, 201.46875, 208.5]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 5.0, 9.0, 15.0, 21.0, 27.0, 50.0, 57.0, 88.0, 113.0, 174.0, 279.0, 461.0, 828.0, 1501.0, 3027.0, 7033.0, 18222.0, 58683.0, 254086.0, 589384.0, 75960.0, 22405.0, 8397.0, 3659.0, 1674.0, 939.0, 527.0, 335.0, 172.0, 127.0, 86.0, 53.0, 39.0, 24.0, 16.0, 21.0, 15.0, 12.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.921875, -20.226806640625, -19.53173828125, -18.836669921875, -18.1416015625, -17.446533203125, -16.75146484375, -16.056396484375, -15.361328125, -14.666259765625, -13.97119140625, -13.276123046875, -12.5810546875, -11.885986328125, -11.19091796875, -10.495849609375, -9.80078125, -9.105712890625, -8.41064453125, -7.715576171875, -7.0205078125, -6.325439453125, -5.63037109375, -4.935302734375, -4.240234375, -3.545166015625, -2.85009765625, -2.155029296875, -1.4599609375, -0.764892578125, -0.06982421875, 0.625244140625, 1.3203125, 2.015380859375, 2.71044921875, 3.405517578125, 4.1005859375, 4.795654296875, 5.49072265625, 6.185791015625, 6.880859375, 7.575927734375, 8.27099609375, 8.966064453125, 9.6611328125, 10.356201171875, 11.05126953125, 11.746337890625, 12.44140625, 13.136474609375, 13.83154296875, 14.526611328125, 15.2216796875, 15.916748046875, 16.61181640625, 17.306884765625, 18.001953125, 18.697021484375, 19.39208984375, 20.087158203125, 20.7822265625, 21.477294921875, 22.17236328125, 22.867431640625, 23.5625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 19.0, 25.0, 37.0, 67.0, 78.0, 144.0, 195.0, 155.0, 77.0, 60.0, 45.0, 33.0, 14.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0211944580078125, -0.020669221878051758, -0.020143985748291016, -0.019618749618530273, -0.01909351348876953, -0.01856827735900879, -0.018043041229248047, -0.017517805099487305, -0.016992568969726562, -0.01646733283996582, -0.015942096710205078, -0.015416860580444336, -0.014891624450683594, -0.014366388320922852, -0.01384115219116211, -0.013315916061401367, -0.012790679931640625, -0.012265443801879883, -0.01174020767211914, -0.011214971542358398, -0.010689735412597656, -0.010164499282836914, -0.009639263153076172, -0.00911402702331543, -0.008588790893554688, -0.008063554763793945, -0.007538318634033203, -0.007013082504272461, -0.006487846374511719, -0.0059626102447509766, -0.005437374114990234, -0.004912137985229492, -0.00438690185546875, -0.003861665725708008, -0.0033364295959472656, -0.0028111934661865234, -0.0022859573364257812, -0.001760721206665039, -0.0012354850769042969, -0.0007102489471435547, -0.0001850128173828125, 0.0003402233123779297, 0.0008654594421386719, 0.001390695571899414, 0.0019159317016601562, 0.0024411678314208984, 0.0029664039611816406, 0.003491640090942383, 0.004016876220703125, 0.004542112350463867, 0.005067348480224609, 0.0055925846099853516, 0.006117820739746094, 0.006643056869506836, 0.007168292999267578, 0.00769352912902832, 0.008218765258789062, 0.008744001388549805, 0.009269237518310547, 0.009794473648071289, 0.010319709777832031, 0.010844945907592773, 0.011370182037353516, 0.011895418167114258, 0.012420654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 9.0, 13.0, 19.0, 18.0, 31.0, 37.0, 37.0, 56.0, 101.0, 168.0, 303.0, 627.0, 1320.0, 3608.0, 12718.0, 62919.0, 677294.0, 239679.0, 36555.0, 8240.0, 2547.0, 1050.0, 503.0, 241.0, 154.0, 104.0, 46.0, 35.0, 28.0, 14.0, 16.0, 11.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.8125, -29.8134765625, -28.814453125, -27.8154296875, -26.81640625, -25.8173828125, -24.818359375, -23.8193359375, -22.8203125, -21.8212890625, -20.822265625, -19.8232421875, -18.82421875, -17.8251953125, -16.826171875, -15.8271484375, -14.828125, -13.8291015625, -12.830078125, -11.8310546875, -10.83203125, -9.8330078125, -8.833984375, -7.8349609375, -6.8359375, -5.8369140625, -4.837890625, -3.8388671875, -2.83984375, -1.8408203125, -0.841796875, 0.1572265625, 1.15625, 2.1552734375, 3.154296875, 4.1533203125, 5.15234375, 6.1513671875, 7.150390625, 8.1494140625, 9.1484375, 10.1474609375, 11.146484375, 12.1455078125, 13.14453125, 14.1435546875, 15.142578125, 16.1416015625, 17.140625, 18.1396484375, 19.138671875, 20.1376953125, 21.13671875, 22.1357421875, 23.134765625, 24.1337890625, 25.1328125, 26.1318359375, 27.130859375, 28.1298828125, 29.12890625, 30.1279296875, 31.126953125, 32.1259765625, 33.125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 2.0, 7.0, 3.0, 1.0, 10.0, 10.0, 14.0, 13.0, 12.0, 17.0, 26.0, 27.0, 41.0, 37.0, 48.0, 69.0, 61.0, 86.0, 68.0, 71.0, 66.0, 33.0, 59.0, 31.0, 26.0, 20.0, 20.0, 17.0, 7.0, 18.0, 11.0, 11.0, 6.0, 9.0, 7.0, 9.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-25.78125, -25.071533203125, -24.36181640625, -23.652099609375, -22.9423828125, -22.232666015625, -21.52294921875, -20.813232421875, -20.103515625, -19.393798828125, -18.68408203125, -17.974365234375, -17.2646484375, -16.554931640625, -15.84521484375, -15.135498046875, -14.42578125, -13.716064453125, -13.00634765625, -12.296630859375, -11.5869140625, -10.877197265625, -10.16748046875, -9.457763671875, -8.748046875, -8.038330078125, -7.32861328125, -6.618896484375, -5.9091796875, -5.199462890625, -4.48974609375, -3.780029296875, -3.0703125, -2.360595703125, -1.65087890625, -0.941162109375, -0.2314453125, 0.478271484375, 1.18798828125, 1.897705078125, 2.607421875, 3.317138671875, 4.02685546875, 4.736572265625, 5.4462890625, 6.156005859375, 6.86572265625, 7.575439453125, 8.28515625, 8.994873046875, 9.70458984375, 10.414306640625, 11.1240234375, 11.833740234375, 12.54345703125, 13.253173828125, 13.962890625, 14.672607421875, 15.38232421875, 16.092041015625, 16.8017578125, 17.511474609375, 18.22119140625, 18.930908203125, 19.640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 12.0, 9.0, 42.0, 77.0, 236.0, 414.0, 117.0, 49.0, 21.0, 14.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1807.1153564453125, -1763.2694091796875, -1719.423583984375, -1675.57763671875, -1631.7318115234375, -1587.8858642578125, -1544.0400390625, -1500.194091796875, -1456.34814453125, -1412.502197265625, -1368.6563720703125, -1324.8104248046875, -1280.964599609375, -1237.11865234375, -1193.272705078125, -1149.4268798828125, -1105.5810546875, -1061.735107421875, -1017.8892822265625, -974.0433349609375, -930.1974487304688, -886.3515625, -842.5056762695312, -798.6597900390625, -754.8138427734375, -710.9679565429688, -667.1220703125, -623.276123046875, -579.4302368164062, -535.5843505859375, -491.73846435546875, -447.8925476074219, -404.046630859375, -360.20074462890625, -316.3548278808594, -272.5089416503906, -228.6630401611328, -184.817138671875, -140.97125244140625, -97.12533569335938, -53.279449462890625, -9.433551788330078, 34.41234588623047, 78.25823974609375, 122.10414123535156, 165.95004272460938, 209.79592895507812, 253.641845703125, 297.48773193359375, 341.3336181640625, 385.1795349121094, 429.0254211425781, 472.871337890625, 516.7172241210938, 560.5631103515625, 604.4090576171875, 648.2548828125, 692.1007690429688, 735.9466552734375, 779.7926025390625, 823.6384887695312, 867.484375, 911.3302612304688, 955.1761474609375, 999.0220947265625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 6.0, 11.0, 15.0, 15.0, 17.0, 9.0, 24.0, 24.0, 26.0, 36.0, 30.0, 49.0, 53.0, 115.0, 125.0, 82.0, 37.0, 44.0, 36.0, 26.0, 21.0, 22.0, 17.0, 21.0, 22.0, 22.0, 17.0, 10.0, 6.0, 9.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-632.9547119140625, -612.6290283203125, -592.3033447265625, -571.9777221679688, -551.6520385742188, -531.3263549804688, -511.00067138671875, -490.67498779296875, -470.3493347167969, -450.0236511230469, -429.697998046875, -409.372314453125, -389.046630859375, -368.7209777832031, -348.3952941894531, -328.06964111328125, -307.74395751953125, -287.41827392578125, -267.0926208496094, -246.76693725585938, -226.44126892089844, -206.1156005859375, -185.7899169921875, -165.46424865722656, -145.13858032226562, -124.81291198730469, -104.48723602294922, -84.16156005859375, -63.83589172363281, -43.510223388671875, -23.184547424316406, -2.8588714599609375, 17.46685791015625, 37.79253005981445, 58.118202209472656, 78.44387817382812, 98.76954650878906, 119.09521484375, 139.4208984375, 159.74656677246094, 180.07223510742188, 200.3979034423828, 220.72357177734375, 241.04925537109375, 261.37493896484375, 281.7005920410156, 302.0262756347656, 322.3519287109375, 342.6776123046875, 363.0032958984375, 383.3289489746094, 403.6546325683594, 423.98028564453125, 444.30596923828125, 464.63165283203125, 484.95733642578125, 505.2829895019531, 525.608642578125, 545.934326171875, 566.260009765625, 586.585693359375, 606.911376953125, 627.2369995117188, 647.5626831054688, 667.8883666992188]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 10.0, 9.0, 7.0, 16.0, 16.0, 25.0, 28.0, 36.0, 55.0, 56.0, 84.0, 117.0, 209.0, 348.0, 828.0, 2119.0, 6248.0, 26011.0, 224688.0, 2481273.0, 1324648.0, 104568.0, 15733.0, 4217.0, 1441.0, 622.0, 275.0, 174.0, 115.0, 74.0, 55.0, 41.0, 37.0, 27.0, 18.0, 10.0, 15.0, 9.0, 4.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-111.375, -107.876953125, -104.37890625, -100.880859375, -97.3828125, -93.884765625, -90.38671875, -86.888671875, -83.390625, -79.892578125, -76.39453125, -72.896484375, -69.3984375, -65.900390625, -62.40234375, -58.904296875, -55.40625, -51.908203125, -48.41015625, -44.912109375, -41.4140625, -37.916015625, -34.41796875, -30.919921875, -27.421875, -23.923828125, -20.42578125, -16.927734375, -13.4296875, -9.931640625, -6.43359375, -2.935546875, 0.5625, 4.060546875, 7.55859375, 11.056640625, 14.5546875, 18.052734375, 21.55078125, 25.048828125, 28.546875, 32.044921875, 35.54296875, 39.041015625, 42.5390625, 46.037109375, 49.53515625, 53.033203125, 56.53125, 60.029296875, 63.52734375, 67.025390625, 70.5234375, 74.021484375, 77.51953125, 81.017578125, 84.515625, 88.013671875, 91.51171875, 95.009765625, 98.5078125, 102.005859375, 105.50390625, 109.001953125, 112.5]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 17.0, 10.0, 11.0, 15.0, 15.0, 22.0, 25.0, 27.0, 34.0, 32.0, 39.0, 42.0, 50.0, 54.0, 50.0, 59.0, 40.0, 49.0, 54.0, 43.0, 44.0, 39.0, 34.0, 32.0, 25.0, 28.0, 28.0, 16.0, 11.0, 11.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-59.875, -58.33349609375, -56.7919921875, -55.25048828125, -53.708984375, -52.16748046875, -50.6259765625, -49.08447265625, -47.54296875, -46.00146484375, -44.4599609375, -42.91845703125, -41.376953125, -39.83544921875, -38.2939453125, -36.75244140625, -35.2109375, -33.66943359375, -32.1279296875, -30.58642578125, -29.044921875, -27.50341796875, -25.9619140625, -24.42041015625, -22.87890625, -21.33740234375, -19.7958984375, -18.25439453125, -16.712890625, -15.17138671875, -13.6298828125, -12.08837890625, -10.546875, -9.00537109375, -7.4638671875, -5.92236328125, -4.380859375, -2.83935546875, -1.2978515625, 0.24365234375, 1.78515625, 3.32666015625, 4.8681640625, 6.40966796875, 7.951171875, 9.49267578125, 11.0341796875, 12.57568359375, 14.1171875, 15.65869140625, 17.2001953125, 18.74169921875, 20.283203125, 21.82470703125, 23.3662109375, 24.90771484375, 26.44921875, 27.99072265625, 29.5322265625, 31.07373046875, 32.615234375, 34.15673828125, 35.6982421875, 37.23974609375, 38.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 10.0, 24.0, 69.0, 150.0, 387.0, 1692.0, 37562.0, 4146052.0, 6997.0, 890.0, 274.0, 97.0, 35.0, 18.0, 10.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-565.5, -544.015625, -522.53125, -501.046875, -479.5625, -458.078125, -436.59375, -415.109375, -393.625, -372.140625, -350.65625, -329.171875, -307.6875, -286.203125, -264.71875, -243.234375, -221.75, -200.265625, -178.78125, -157.296875, -135.8125, -114.328125, -92.84375, -71.359375, -49.875, -28.390625, -6.90625, 14.578125, 36.0625, 57.546875, 79.03125, 100.515625, 122.0, 143.484375, 164.96875, 186.453125, 207.9375, 229.421875, 250.90625, 272.390625, 293.875, 315.359375, 336.84375, 358.328125, 379.8125, 401.296875, 422.78125, 444.265625, 465.75, 487.234375, 508.71875, 530.203125, 551.6875, 573.171875, 594.65625, 616.140625, 637.625, 659.109375, 680.59375, 702.078125, 723.5625, 745.046875, 766.53125, 788.015625, 809.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 14.0, 21.0, 65.0, 149.0, 355.0, 1118.0, 1555.0, 514.0, 156.0, 74.0, 37.0, 13.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-464.75, -452.5625, -440.375, -428.1875, -416.0, -403.8125, -391.625, -379.4375, -367.25, -355.0625, -342.875, -330.6875, -318.5, -306.3125, -294.125, -281.9375, -269.75, -257.5625, -245.375, -233.1875, -221.0, -208.8125, -196.625, -184.4375, -172.25, -160.0625, -147.875, -135.6875, -123.5, -111.3125, -99.125, -86.9375, -74.75, -62.5625, -50.375, -38.1875, -26.0, -13.8125, -1.625, 10.5625, 22.75, 34.9375, 47.125, 59.3125, 71.5, 83.6875, 95.875, 108.0625, 120.25, 132.4375, 144.625, 156.8125, 169.0, 181.1875, 193.375, 205.5625, 217.75, 229.9375, 242.125, 254.3125, 266.5, 278.6875, 290.875, 303.0625, 315.25]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 19.0, 16.0, 35.0, 52.0, 103.0, 142.0, 201.0, 148.0, 109.0, 68.0, 35.0, 20.0, 9.0, 7.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1939.178466796875, -1887.5079345703125, -1835.8372802734375, -1784.166748046875, -1732.49609375, -1680.8255615234375, -1629.155029296875, -1577.484375, -1525.813720703125, -1474.1431884765625, -1422.4725341796875, -1370.802001953125, -1319.13134765625, -1267.4608154296875, -1215.790283203125, -1164.11962890625, -1112.4490966796875, -1060.778564453125, -1009.10791015625, -957.4373779296875, -905.7667236328125, -854.09619140625, -802.4255981445312, -750.7550048828125, -699.0844116210938, -647.413818359375, -595.7432250976562, -544.0726318359375, -492.4020690917969, -440.7314758300781, -389.0609130859375, -337.39031982421875, -285.7197265625, -234.04913330078125, -182.37855529785156, -130.70797729492188, -79.03738403320312, -27.366790771484375, 24.30377197265625, 75.974365234375, 127.64495849609375, 179.3155517578125, 230.9861297607422, 282.6567077636719, 334.3273010253906, 385.9978942871094, 437.66845703125, 489.33905029296875, 541.0096435546875, 592.6802368164062, 644.350830078125, 696.0213623046875, 747.6920166015625, 799.362548828125, 851.0331420898438, 902.7037353515625, 954.3743286132812, 1006.044921875, 1057.7154541015625, 1109.3861083984375, 1161.056640625, 1212.727294921875, 1264.3978271484375, 1316.068359375, 1367.739013671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 8.0, 13.0, 10.0, 22.0, 22.0, 24.0, 28.0, 22.0, 30.0, 33.0, 33.0, 33.0, 34.0, 41.0, 40.0, 47.0, 53.0, 66.0, 48.0, 43.0, 38.0, 37.0, 34.0, 42.0, 28.0, 34.0, 15.0, 19.0, 13.0, 13.0, 16.0, 13.0, 9.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-781.1297607421875, -758.0313110351562, -734.9329223632812, -711.83447265625, -688.736083984375, -665.6376342773438, -642.5391845703125, -619.4407958984375, -596.3423461914062, -573.243896484375, -550.1455078125, -527.0470581054688, -503.9486389160156, -480.8502197265625, -457.7518005371094, -434.65338134765625, -411.5549621582031, -388.45654296875, -365.3581237792969, -342.25970458984375, -319.1612548828125, -296.0628356933594, -272.96441650390625, -249.86598205566406, -226.76756286621094, -203.6691436767578, -180.57070922851562, -157.4722900390625, -134.37387084960938, -111.27543640136719, -88.17701721191406, -65.07858276367188, -41.98016357421875, -18.881738662719727, 4.216686248779297, 27.315109252929688, 50.413536071777344, 73.511962890625, 96.61038208007812, 119.70881652832031, 142.80723571777344, 165.90565490722656, 189.00408935546875, 212.10250854492188, 235.200927734375, 258.29937744140625, 281.39776611328125, 304.4962158203125, 327.5946350097656, 350.69305419921875, 373.7914733886719, 396.889892578125, 419.98834228515625, 443.0867614746094, 466.1851806640625, 489.28363037109375, 512.3820190429688, 535.48046875, 558.578857421875, 581.6773071289062, 604.7756958007812, 627.8741455078125, 650.9725341796875, 674.0709838867188, 697.16943359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 31.0, 27.0, 48.0, 62.0, 106.0, 124.0, 222.0, 322.0, 622.0, 1028.0, 1813.0, 3528.0, 7278.0, 15554.0, 37922.0, 107503.0, 451320.0, 288742.0, 78191.0, 29003.0, 12470.0, 5844.0, 2893.0, 1543.0, 880.0, 523.0, 268.0, 203.0, 141.0, 81.0, 54.0, 39.0, 32.0, 23.0, 16.0, 8.0, 13.0, 6.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.6875, -81.2158203125, -78.744140625, -76.2724609375, -73.80078125, -71.3291015625, -68.857421875, -66.3857421875, -63.9140625, -61.4423828125, -58.970703125, -56.4990234375, -54.02734375, -51.5556640625, -49.083984375, -46.6123046875, -44.140625, -41.6689453125, -39.197265625, -36.7255859375, -34.25390625, -31.7822265625, -29.310546875, -26.8388671875, -24.3671875, -21.8955078125, -19.423828125, -16.9521484375, -14.48046875, -12.0087890625, -9.537109375, -7.0654296875, -4.59375, -2.1220703125, 0.349609375, 2.8212890625, 5.29296875, 7.7646484375, 10.236328125, 12.7080078125, 15.1796875, 17.6513671875, 20.123046875, 22.5947265625, 25.06640625, 27.5380859375, 30.009765625, 32.4814453125, 34.953125, 37.4248046875, 39.896484375, 42.3681640625, 44.83984375, 47.3115234375, 49.783203125, 52.2548828125, 54.7265625, 57.1982421875, 59.669921875, 62.1416015625, 64.61328125, 67.0849609375, 69.556640625, 72.0283203125, 74.5]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 8.0, 3.0, 6.0, 14.0, 21.0, 14.0, 13.0, 27.0, 21.0, 28.0, 31.0, 38.0, 45.0, 53.0, 41.0, 54.0, 46.0, 62.0, 53.0, 46.0, 38.0, 42.0, 43.0, 32.0, 33.0, 17.0, 23.0, 25.0, 20.0, 18.0, 12.0, 9.0, 13.0, 9.0, 3.0, 4.0, 2.0, 9.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-66.5, -64.57373046875, -62.6474609375, -60.72119140625, -58.794921875, -56.86865234375, -54.9423828125, -53.01611328125, -51.08984375, -49.16357421875, -47.2373046875, -45.31103515625, -43.384765625, -41.45849609375, -39.5322265625, -37.60595703125, -35.6796875, -33.75341796875, -31.8271484375, -29.90087890625, -27.974609375, -26.04833984375, -24.1220703125, -22.19580078125, -20.26953125, -18.34326171875, -16.4169921875, -14.49072265625, -12.564453125, -10.63818359375, -8.7119140625, -6.78564453125, -4.859375, -2.93310546875, -1.0068359375, 0.91943359375, 2.845703125, 4.77197265625, 6.6982421875, 8.62451171875, 10.55078125, 12.47705078125, 14.4033203125, 16.32958984375, 18.255859375, 20.18212890625, 22.1083984375, 24.03466796875, 25.9609375, 27.88720703125, 29.8134765625, 31.73974609375, 33.666015625, 35.59228515625, 37.5185546875, 39.44482421875, 41.37109375, 43.29736328125, 45.2236328125, 47.14990234375, 49.076171875, 51.00244140625, 52.9287109375, 54.85498046875, 56.78125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 12.0, 10.0, 13.0, 21.0, 39.0, 48.0, 88.0, 142.0, 308.0, 646.0, 1701.0, 7088.0, 68428.0, 932271.0, 30940.0, 4485.0, 1218.0, 533.0, 256.0, 114.0, 62.0, 42.0, 29.0, 12.0, 18.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.75, -178.125, -170.5, -162.875, -155.25, -147.625, -140.0, -132.375, -124.75, -117.125, -109.5, -101.875, -94.25, -86.625, -79.0, -71.375, -63.75, -56.125, -48.5, -40.875, -33.25, -25.625, -18.0, -10.375, -2.75, 4.875, 12.5, 20.125, 27.75, 35.375, 43.0, 50.625, 58.25, 65.875, 73.5, 81.125, 88.75, 96.375, 104.0, 111.625, 119.25, 126.875, 134.5, 142.125, 149.75, 157.375, 165.0, 172.625, 180.25, 187.875, 195.5, 203.125, 210.75, 218.375, 226.0, 233.625, 241.25, 248.875, 256.5, 264.125, 271.75, 279.375, 287.0, 294.625, 302.25]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 3.0, 4.0, 7.0, 10.0, 17.0, 14.0, 17.0, 20.0, 25.0, 33.0, 36.0, 39.0, 51.0, 80.0, 92.0, 101.0, 91.0, 59.0, 46.0, 45.0, 33.0, 33.0, 24.0, 25.0, 16.0, 18.0, 12.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-417.25, -405.46875, -393.6875, -381.90625, -370.125, -358.34375, -346.5625, -334.78125, -323.0, -311.21875, -299.4375, -287.65625, -275.875, -264.09375, -252.3125, -240.53125, -228.75, -216.96875, -205.1875, -193.40625, -181.625, -169.84375, -158.0625, -146.28125, -134.5, -122.71875, -110.9375, -99.15625, -87.375, -75.59375, -63.8125, -52.03125, -40.25, -28.46875, -16.6875, -4.90625, 6.875, 18.65625, 30.4375, 42.21875, 54.0, 65.78125, 77.5625, 89.34375, 101.125, 112.90625, 124.6875, 136.46875, 148.25, 160.03125, 171.8125, 183.59375, 195.375, 207.15625, 218.9375, 230.71875, 242.5, 254.28125, 266.0625, 277.84375, 289.625, 301.40625, 313.1875, 324.96875, 336.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 19.0, 16.0, 32.0, 78.0, 92.0, 158.0, 370.0, 902.0, 2263.0, 7338.0, 33057.0, 809606.0, 166564.0, 20274.0, 5012.0, 1574.0, 617.0, 265.0, 127.0, 67.0, 54.0, 20.0, 15.0, 7.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-52.5625, -51.3359375, -50.109375, -48.8828125, -47.65625, -46.4296875, -45.203125, -43.9765625, -42.75, -41.5234375, -40.296875, -39.0703125, -37.84375, -36.6171875, -35.390625, -34.1640625, -32.9375, -31.7109375, -30.484375, -29.2578125, -28.03125, -26.8046875, -25.578125, -24.3515625, -23.125, -21.8984375, -20.671875, -19.4453125, -18.21875, -16.9921875, -15.765625, -14.5390625, -13.3125, -12.0859375, -10.859375, -9.6328125, -8.40625, -7.1796875, -5.953125, -4.7265625, -3.5, -2.2734375, -1.046875, 0.1796875, 1.40625, 2.6328125, 3.859375, 5.0859375, 6.3125, 7.5390625, 8.765625, 9.9921875, 11.21875, 12.4453125, 13.671875, 14.8984375, 16.125, 17.3515625, 18.578125, 19.8046875, 21.03125, 22.2578125, 23.484375, 24.7109375, 25.9375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 10.0, 8.0, 8.0, 7.0, 11.0, 19.0, 26.0, 34.0, 36.0, 53.0, 82.0, 98.0, 121.0, 116.0, 95.0, 74.0, 38.0, 23.0, 21.0, 24.0, 14.0, 9.0, 14.0, 4.0, 7.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01104736328125, -0.010699152946472168, -0.010350942611694336, -0.010002732276916504, -0.009654521942138672, -0.00930631160736084, -0.008958101272583008, -0.008609890937805176, -0.008261680603027344, -0.007913470268249512, -0.00756525993347168, -0.007217049598693848, -0.006868839263916016, -0.006520628929138184, -0.0061724185943603516, -0.0058242082595825195, -0.0054759979248046875, -0.0051277875900268555, -0.0047795772552490234, -0.004431366920471191, -0.004083156585693359, -0.0037349462509155273, -0.0033867359161376953, -0.0030385255813598633, -0.0026903152465820312, -0.0023421049118041992, -0.001993894577026367, -0.0016456842422485352, -0.0012974739074707031, -0.0009492635726928711, -0.0006010532379150391, -0.00025284290313720703, 9.5367431640625e-05, 0.00044357776641845703, 0.0007917881011962891, 0.001139998435974121, 0.0014882087707519531, 0.0018364191055297852, 0.002184629440307617, 0.0025328397750854492, 0.0028810501098632812, 0.0032292604446411133, 0.0035774707794189453, 0.003925681114196777, 0.004273891448974609, 0.004622101783752441, 0.0049703121185302734, 0.0053185224533081055, 0.0056667327880859375, 0.0060149431228637695, 0.0063631534576416016, 0.006711363792419434, 0.007059574127197266, 0.007407784461975098, 0.00775599479675293, 0.008104205131530762, 0.008452415466308594, 0.008800625801086426, 0.009148836135864258, 0.00949704647064209, 0.009845256805419922, 0.010193467140197754, 0.010541677474975586, 0.010889887809753418, 0.01123809814453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 15.0, 20.0, 36.0, 46.0, 58.0, 87.0, 152.0, 253.0, 553.0, 939.0, 2434.0, 7566.0, 33010.0, 778010.0, 195343.0, 21129.0, 5362.0, 1823.0, 790.0, 405.0, 201.0, 99.0, 61.0, 51.0, 23.0, 20.0, 7.0, 5.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.01953125, -31.9140625, -30.80859375, -29.703125, -28.59765625, -27.4921875, -26.38671875, -25.28125, -24.17578125, -23.0703125, -21.96484375, -20.859375, -19.75390625, -18.6484375, -17.54296875, -16.4375, -15.33203125, -14.2265625, -13.12109375, -12.015625, -10.91015625, -9.8046875, -8.69921875, -7.59375, -6.48828125, -5.3828125, -4.27734375, -3.171875, -2.06640625, -0.9609375, 0.14453125, 1.25, 2.35546875, 3.4609375, 4.56640625, 5.671875, 6.77734375, 7.8828125, 8.98828125, 10.09375, 11.19921875, 12.3046875, 13.41015625, 14.515625, 15.62109375, 16.7265625, 17.83203125, 18.9375, 20.04296875, 21.1484375, 22.25390625, 23.359375, 24.46484375, 25.5703125, 26.67578125, 27.78125, 28.88671875, 29.9921875, 31.09765625, 32.203125, 33.30859375, 34.4140625, 35.51953125, 36.625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 6.0, 5.0, 12.0, 7.0, 6.0, 11.0, 15.0, 11.0, 18.0, 21.0, 41.0, 55.0, 52.0, 87.0, 89.0, 103.0, 106.0, 80.0, 66.0, 42.0, 36.0, 27.0, 18.0, 17.0, 17.0, 12.0, 4.0, 6.0, 6.0, 4.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.65625, -41.46826171875, -40.2802734375, -39.09228515625, -37.904296875, -36.71630859375, -35.5283203125, -34.34033203125, -33.15234375, -31.96435546875, -30.7763671875, -29.58837890625, -28.400390625, -27.21240234375, -26.0244140625, -24.83642578125, -23.6484375, -22.46044921875, -21.2724609375, -20.08447265625, -18.896484375, -17.70849609375, -16.5205078125, -15.33251953125, -14.14453125, -12.95654296875, -11.7685546875, -10.58056640625, -9.392578125, -8.20458984375, -7.0166015625, -5.82861328125, -4.640625, -3.45263671875, -2.2646484375, -1.07666015625, 0.111328125, 1.29931640625, 2.4873046875, 3.67529296875, 4.86328125, 6.05126953125, 7.2392578125, 8.42724609375, 9.615234375, 10.80322265625, 11.9912109375, 13.17919921875, 14.3671875, 15.55517578125, 16.7431640625, 17.93115234375, 19.119140625, 20.30712890625, 21.4951171875, 22.68310546875, 23.87109375, 25.05908203125, 26.2470703125, 27.43505859375, 28.623046875, 29.81103515625, 30.9990234375, 32.18701171875, 33.375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 17.0, 28.0, 57.0, 99.0, 455.0, 192.0, 59.0, 44.0, 15.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2002.5418701171875, -1953.463134765625, -1904.3843994140625, -1855.3056640625, -1806.2269287109375, -1757.148193359375, -1708.0694580078125, -1658.99072265625, -1609.9119873046875, -1560.833251953125, -1511.7545166015625, -1462.67578125, -1413.5970458984375, -1364.518310546875, -1315.4395751953125, -1266.36083984375, -1217.2821044921875, -1168.203369140625, -1119.1246337890625, -1070.0458984375, -1020.9671630859375, -971.888427734375, -922.8096923828125, -873.73095703125, -824.6522216796875, -775.573486328125, -726.4947509765625, -677.416015625, -628.3372802734375, -579.258544921875, -530.1798095703125, -481.10107421875, -432.0224609375, -382.9437255859375, -333.864990234375, -284.7862548828125, -235.70751953125, -186.6287841796875, -137.550048828125, -88.4713134765625, -39.392578125, 9.6861572265625, 58.764892578125, 107.8436279296875, 156.92236328125, 206.0010986328125, 255.079833984375, 304.1585693359375, 353.2373046875, 402.3160400390625, 451.394775390625, 500.4735107421875, 549.55224609375, 598.6309814453125, 647.709716796875, 696.7884521484375, 745.8671875, 794.9459228515625, 844.024658203125, 893.1033935546875, 942.18212890625, 991.2608642578125, 1040.339599609375, 1089.4183349609375, 1138.4970703125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 13.0, 4.0, 8.0, 10.0, 12.0, 16.0, 17.0, 20.0, 13.0, 24.0, 27.0, 27.0, 34.0, 62.0, 179.0, 214.0, 79.0, 38.0, 32.0, 30.0, 19.0, 20.0, 18.0, 16.0, 5.0, 8.0, 11.0, 5.0, 8.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-811.7107543945312, -781.8485107421875, -751.9862060546875, -722.1239624023438, -692.26171875, -662.3994750976562, -632.5372314453125, -602.6749267578125, -572.8126831054688, -542.950439453125, -513.088134765625, -483.22589111328125, -453.3636474609375, -423.50140380859375, -393.6391296386719, -363.77685546875, -333.91461181640625, -304.0523681640625, -274.1900939941406, -244.3278350830078, -214.465576171875, -184.6033172607422, -154.74105834960938, -124.87879943847656, -95.01654052734375, -65.15428161621094, -35.292022705078125, -5.4297637939453125, 24.4324951171875, 54.29475402832031, 84.15701293945312, 114.01927185058594, 143.881591796875, 173.7438507080078, 203.60610961914062, 233.46836853027344, 263.33062744140625, 293.19287109375, 323.0551452636719, 352.91741943359375, 382.7796630859375, 412.64190673828125, 442.5041809082031, 472.366455078125, 502.22869873046875, 532.0909423828125, 561.9532470703125, 591.8154907226562, 621.677734375, 651.5399780273438, 681.4022216796875, 711.2645263671875, 741.1267700195312, 770.989013671875, 800.851318359375, 830.7135620117188, 860.5758056640625, 890.4380493164062, 920.30029296875, 950.16259765625, 980.0248413085938, 1009.8870849609375, 1039.7493896484375, 1069.611572265625, 1099.473876953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 5.0, 3.0, 7.0, 10.0, 10.0, 12.0, 13.0, 17.0, 19.0, 22.0, 25.0, 36.0, 45.0, 55.0, 124.0, 196.0, 76.0, 62.0, 37.0, 29.0, 37.0, 26.0, 20.0, 26.0, 16.0, 15.0, 10.0, 11.0, 6.0, 2.0, 7.0, 2.0, 4.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.5625, -46.3974609375, -44.232421875, -42.0673828125, -39.90234375, -37.7373046875, -35.572265625, -33.4072265625, -31.2421875, -29.0771484375, -26.912109375, -24.7470703125, -22.58203125, -20.4169921875, -18.251953125, -16.0869140625, -13.921875, -11.7568359375, -9.591796875, -7.4267578125, -5.26171875, -3.0966796875, -0.931640625, 1.2333984375, 3.3984375, 5.5634765625, 7.728515625, 9.8935546875, 12.05859375, 14.2236328125, 16.388671875, 18.5537109375, 20.71875, 22.8837890625, 25.048828125, 27.2138671875, 29.37890625, 31.5439453125, 33.708984375, 35.8740234375, 38.0390625, 40.2041015625, 42.369140625, 44.5341796875, 46.69921875, 48.8642578125, 51.029296875, 53.1943359375, 55.359375, 57.5244140625, 59.689453125, 61.8544921875, 64.01953125, 66.1845703125, 68.349609375, 70.5146484375, 72.6796875, 74.8447265625, 77.009765625, 79.1748046875, 81.33984375, 83.5048828125, 85.669921875, 87.8349609375, 90.0]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 4.0, 10.0, 11.0, 6.0, 13.0, 15.0, 21.0, 24.0, 24.0, 60.0, 106.0, 167.0, 336.0, 721.0, 2171.0, 9514.0, 8327996.0, 40952.0, 4274.0, 1166.0, 470.0, 171.0, 114.0, 63.0, 54.0, 25.0, 16.0, 10.0, 14.0, 6.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-537.6149291992188, -522.1497192382812, -506.6845397949219, -491.2193603515625, -475.754150390625, -460.2889709472656, -444.8237609863281, -429.35858154296875, -413.89337158203125, -398.4281921386719, -382.9629821777344, -367.497802734375, -352.0325927734375, -336.5674133300781, -321.1022033691406, -305.63702392578125, -290.17181396484375, -274.7066345214844, -259.2414245605469, -243.77622985839844, -228.31103515625, -212.84585571289062, -197.38064575195312, -181.91546630859375, -166.45028686523438, -150.98509216308594, -135.5198974609375, -120.05470275878906, -104.58950805664062, -89.12432098388672, -73.65912628173828, -58.193931579589844, -42.728729248046875, -27.263534545898438, -11.798341751098633, 3.666851043701172, 19.13204574584961, 34.59723663330078, 50.06243133544922, 65.52762603759766, 80.9928207397461, 96.45801544189453, 111.92321014404297, 127.38839721679688, 142.8535919189453, 158.31878662109375, 173.7839813232422, 189.24917602539062, 204.71437072753906, 220.1795654296875, 235.64476013183594, 251.10995483398438, 266.57513427734375, 282.04034423828125, 297.5055236816406, 312.9707336425781, 328.4359130859375, 343.9010925292969, 359.3663024902344, 374.83148193359375, 390.29669189453125, 405.7618713378906, 421.2270812988281, 436.6922607421875, 452.157470703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 4.0, 7.0, 3.0, 5.0, 5.0, 7.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.5076904296875, -359.2933044433594, -345.07891845703125, -330.8645324707031, -316.650146484375, -302.4357604980469, -288.22137451171875, -274.0069885253906, -259.7926025390625, -245.57821655273438, -231.36383056640625, -217.14944458007812, -202.93505859375, -188.72067260742188, -174.50628662109375, -160.29190063476562, -146.07752990722656, -131.86314392089844, -117.64875793457031, -103.43437194824219, -89.21998596191406, -75.00560760498047, -60.791221618652344, -46.57683563232422, -32.362449645996094, -18.14806365966797, -3.9336795806884766, 10.280704498291016, 24.49509048461914, 38.70947265625, 52.923858642578125, 67.13824462890625, 81.35263061523438, 95.5670166015625, 109.78140258789062, 123.99578857421875, 138.21017456054688, 152.424560546875, 166.63894653320312, 180.85333251953125, 195.06771850585938, 209.2821044921875, 223.49649047851562, 237.71087646484375, 251.92526245117188, 266.1396484375, 280.3540344238281, 294.56842041015625, 308.78277587890625, 322.9971618652344, 337.2115478515625, 351.4259338378906, 365.64031982421875, 379.8547058105469, 394.069091796875, 408.2834777832031, 422.49786376953125, 436.7122497558594, 450.9266357421875, 465.1410217285156, 479.35540771484375, 493.5697937011719, 507.7841796875, 521.99853515625, 536.2129516601562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 10.0, 9.0, 16.0, 16.0, 30.0, 31.0, 40.0, 51.0, 60.0, 56.0, 62.0, 80.0, 77.0, 71.0, 64.0, 55.0, 40.0, 38.0, 41.0, 28.0, 24.0, 26.0, 13.0, 20.0, 6.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.3623046875, -35.849609375, -34.3369140625, -32.82421875, -31.3115234375, -29.798828125, -28.2861328125, -26.7734375, -25.2607421875, -23.748046875, -22.2353515625, -20.72265625, -19.2099609375, -17.697265625, -16.1845703125, -14.671875, -13.1591796875, -11.646484375, -10.1337890625, -8.62109375, -7.1083984375, -5.595703125, -4.0830078125, -2.5703125, -1.0576171875, 0.455078125, 1.9677734375, 3.48046875, 4.9931640625, 6.505859375, 8.0185546875, 9.53125, 11.0439453125, 12.556640625, 14.0693359375, 15.58203125, 17.0947265625, 18.607421875, 20.1201171875, 21.6328125, 23.1455078125, 24.658203125, 26.1708984375, 27.68359375, 29.1962890625, 30.708984375, 32.2216796875, 33.734375, 35.2470703125, 36.759765625, 38.2724609375, 39.78515625, 41.2978515625, 42.810546875, 44.3232421875, 45.8359375, 47.3486328125, 48.861328125, 50.3740234375, 51.88671875, 53.3994140625, 54.912109375, 56.4248046875, 57.9375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 5.0, 4.0, 8.0, 19.0, 16.0, 23.0, 41.0, 72.0, 102.0, 153.0, 257.0, 493.0, 731.0, 1441.0, 2833.0, 6169.0, 14143.0, 35592.0, 97478.0, 189860.0, 106797.0, 39414.0, 15538.0, 6551.0, 3153.0, 1453.0, 776.0, 477.0, 249.0, 163.0, 92.0, 53.0, 32.0, 25.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-409.25, -398.3515625, -387.453125, -376.5546875, -365.65625, -354.7578125, -343.859375, -332.9609375, -322.0625, -311.1640625, -300.265625, -289.3671875, -278.46875, -267.5703125, -256.671875, -245.7734375, -234.875, -223.9765625, -213.078125, -202.1796875, -191.28125, -180.3828125, -169.484375, -158.5859375, -147.6875, -136.7890625, -125.890625, -114.9921875, -104.09375, -93.1953125, -82.296875, -71.3984375, -60.5, -49.6015625, -38.703125, -27.8046875, -16.90625, -6.0078125, 4.890625, 15.7890625, 26.6875, 37.5859375, 48.484375, 59.3828125, 70.28125, 81.1796875, 92.078125, 102.9765625, 113.875, 124.7734375, 135.671875, 146.5703125, 157.46875, 168.3671875, 179.265625, 190.1640625, 201.0625, 211.9609375, 222.859375, 233.7578125, 244.65625, 255.5546875, 266.453125, 277.3515625, 288.25]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 29.0, 23.0, 29.0, 36.0, 31.0, 51.0, 45.0, 54.0, 62.0, 53.0, 68.0, 51.0, 59.0, 64.0, 53.0, 40.0, 35.0, 28.0, 23.0, 13.0, 17.0, 18.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.19921875, -54.1484375, -52.09765625, -50.046875, -47.99609375, -45.9453125, -43.89453125, -41.84375, -39.79296875, -37.7421875, -35.69140625, -33.640625, -31.58984375, -29.5390625, -27.48828125, -25.4375, -23.38671875, -21.3359375, -19.28515625, -17.234375, -15.18359375, -13.1328125, -11.08203125, -9.03125, -6.98046875, -4.9296875, -2.87890625, -0.828125, 1.22265625, 3.2734375, 5.32421875, 7.375, 9.42578125, 11.4765625, 13.52734375, 15.578125, 17.62890625, 19.6796875, 21.73046875, 23.78125, 25.83203125, 27.8828125, 29.93359375, 31.984375, 34.03515625, 36.0859375, 38.13671875, 40.1875, 42.23828125, 44.2890625, 46.33984375, 48.390625, 50.44140625, 52.4921875, 54.54296875, 56.59375, 58.64453125, 60.6953125, 62.74609375, 64.796875, 66.84765625, 68.8984375, 70.94921875, 73.0]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 14.0, 22.0, 34.0, 64.0, 56.0, 68.0, 47.0, 50.0, 31.0, 14.0, 17.0, 11.0, 8.0, 9.0, 6.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-356.912353515625, -344.955322265625, -332.998291015625, -321.041259765625, -309.0841979980469, -297.1271667480469, -285.1701354980469, -273.2131042480469, -261.2560729980469, -249.29904174804688, -237.3419952392578, -225.3849639892578, -213.4279327392578, -201.47088623046875, -189.51385498046875, -177.55682373046875, -165.5997772216797, -153.6427459716797, -141.68569946289062, -129.72866821289062, -117.77163696289062, -105.8145980834961, -93.85755920410156, -81.90052795410156, -69.94348907470703, -57.986454010009766, -46.0294189453125, -34.07238006591797, -22.115345001220703, -10.158309936523438, 1.7987289428710938, 13.755760192871094, 25.712799072265625, 37.66983413696289, 49.626869201660156, 61.58390808105469, 73.54093933105469, 85.49797821044922, 97.45501708984375, 109.41204833984375, 121.36908721923828, 133.3261260986328, 145.2831573486328, 157.24020385742188, 169.19723510742188, 181.15426635742188, 193.11129760742188, 205.06832885742188, 217.02537536621094, 228.98240661621094, 240.939453125, 252.896484375, 264.853515625, 276.810546875, 288.767578125, 300.724609375, 312.6816711425781, 324.6387023925781, 336.5957336425781, 348.55279541015625, 360.50982666015625, 372.46685791015625, 384.42388916015625, 396.38092041015625, 408.33795166015625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 6.0, 6.0, 3.0, 5.0, 2.0, 9.0, 12.0, 21.0, 67.0, 87.0, 89.0, 53.0, 39.0, 17.0, 11.0, 10.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-300.09393310546875, -287.365966796875, -274.63800048828125, -261.9100646972656, -249.18209838867188, -236.45413208007812, -223.72616577148438, -210.9982147216797, -198.270263671875, -185.54229736328125, -172.81434631347656, -160.0863800048828, -147.35842895507812, -134.63046264648438, -121.90250396728516, -109.17454528808594, -96.44657897949219, -83.71862030029297, -70.99066162109375, -58.262699127197266, -45.53474044799805, -32.80678176879883, -20.078819274902344, -7.350860595703125, 5.377098083496094, 18.105056762695312, 30.833017349243164, 43.560977935791016, 56.288936614990234, 69.01689147949219, 81.74485778808594, 94.47281646728516, 107.20077514648438, 119.9287338256836, 132.6566925048828, 145.38465881347656, 158.11260986328125, 170.840576171875, 183.56854248046875, 196.29649353027344, 209.02444458007812, 221.75241088867188, 234.48036193847656, 247.2083282470703, 259.936279296875, 272.66424560546875, 285.3922119140625, 298.12017822265625, 310.84814453125, 323.57611083984375, 336.3040771484375, 349.0320129394531, 361.7599792480469, 374.4879455566406, 387.2159118652344, 399.94384765625, 412.67181396484375, 425.3997802734375, 438.12774658203125, 450.8556823730469, 463.5836486816406, 476.3116149902344, 489.0395812988281, 501.76751708984375, 514.4954833984375]}, "eval/loss": 0.6945949792861938, "eval/wer": 0.09533915113050377, "eval/runtime": 683.1919, "eval/samples_per_second": 3.867, "eval/steps_per_second": 0.484, "train/train_runtime": 134751.1179, "train/train_samples_per_second": 5.295, "train/train_steps_per_second": 0.165, "train/total_flos": 0.0, "train/train_loss": 1.8353804810692644} \ No newline at end of file