diff --git "a/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" --- "a/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" +++ "b/wandb/run-20220302_132803-2mcgzjjb/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4894, "train/learning_rate": 3.4682080924855494e-08, "train/epoch": 5.0, "train/global_step": 4460, "_runtime": 28486, "_timestamp": 1646256169, "_step": 4462, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 99.0, 21.0, 7.0, 6.0, 3.0, 3.0, 8.0, 1.0, 30037.0, 216.0, 45.0, 17.0, 10.0, 9.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.90625, -37.05322265625, -36.2001953125, -35.34716796875, -34.494140625, -33.64111328125, -32.7880859375, -31.93505859375, -31.08203125, -30.22900390625, -29.3759765625, -28.52294921875, -27.669921875, -26.81689453125, -25.9638671875, -25.11083984375, -24.2578125, -23.40478515625, -22.5517578125, -21.69873046875, -20.845703125, -19.99267578125, -19.1396484375, -18.28662109375, -17.43359375, -16.58056640625, -15.7275390625, -14.87451171875, -14.021484375, -13.16845703125, -12.3154296875, -11.46240234375, -10.609375, -9.75634765625, -8.9033203125, -8.05029296875, -7.197265625, -6.34423828125, -5.4912109375, -4.63818359375, -3.78515625, -2.93212890625, -2.0791015625, -1.22607421875, -0.373046875, 0.47998046875, 1.3330078125, 2.18603515625, 3.0390625, 3.89208984375, 4.7451171875, 5.59814453125, 6.451171875, 7.30419921875, 8.1572265625, 9.01025390625, 9.86328125, 10.71630859375, 11.5693359375, 12.42236328125, 13.275390625, 14.12841796875, 14.9814453125, 15.83447265625, 16.6875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 7.0, 4.0, 4.0, 6.0, 12.0, 9.0, 14.0, 21.0, 15.0, 24.0, 20.0, 27.0, 33.0, 33.0, 27.0, 43.0, 30.0, 41.0, 36.0, 46.0, 47.0, 38.0, 46.0, 42.0, 43.0, 36.0, 41.0, 30.0, 37.0, 29.0, 19.0, 30.0, 25.0, 12.0, 11.0, 6.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.805110931396484, -9.561691284179688, -9.318270683288574, -9.074851036071777, -8.83143138885498, -8.588010787963867, -8.34459114074707, -8.101171493530273, -7.857751369476318, -7.614331245422363, -7.370911598205566, -7.127491474151611, -6.884071350097656, -6.640651702880859, -6.397231578826904, -6.153811454772949, -5.910391807556152, -5.666971683502197, -5.4235520362854, -5.180131912231445, -4.936712265014648, -4.693292140960693, -4.449872016906738, -4.206452369689941, -3.9630322456359863, -3.7196123600006104, -3.4761924743652344, -3.2327723503112793, -2.9893524646759033, -2.7459325790405273, -2.5025124549865723, -2.2590925693511963, -2.0156731605529785, -1.7722532749176025, -1.528833270072937, -1.2854132652282715, -1.0419933795928955, -0.7985734939575195, -0.555153489112854, -0.3117334842681885, -0.0683135986328125, 0.17510634660720825, 0.418526291847229, 0.6619462370872498, 0.9053661823272705, 1.1487860679626465, 1.392206072807312, 1.6356260776519775, 1.8790459632873535, 2.1224658489227295, 2.3658857345581055, 2.6093058586120605, 2.8527257442474365, 3.0961456298828125, 3.3395657539367676, 3.5829856395721436, 3.8264055252075195, 4.069825649261475, 4.3132452964782715, 4.556665420532227, 4.800085067749023, 5.0435051918029785, 5.286925315856934, 5.5303449630737305, 5.7737650871276855]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 8.0, 18.0, 13.0, 11.0, 20.0, 17.0, 17.0, 32.0, 21.0, 36.0, 31.0, 45.0, 40.0, 37.0, 50.0, 38.0, 42.0, 51.0, 40.0, 46.0, 35.0, 37.0, 23.0, 35.0, 31.0, 34.0, 24.0, 28.0, 20.0, 19.0, 16.0, 18.0, 13.0, 5.0, 4.0, 3.0, 5.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.515730857849121, -7.263637065887451, -7.011543273925781, -6.759449481964111, -6.507355690002441, -6.255261421203613, -6.003167629241943, -5.751073837280273, -5.4989800453186035, -5.246886253356934, -4.994792461395264, -4.742698669433594, -4.490604400634766, -4.238511085510254, -3.986416816711426, -3.734323024749756, -3.482229232788086, -3.230135440826416, -2.978041648864746, -2.725947618484497, -2.473853826522827, -2.2217600345611572, -1.9696661233901978, -1.7175722122192383, -1.4654784202575684, -1.2133846282958984, -0.961290717124939, -0.7091968655586243, -0.45710301399230957, -0.20500922203063965, 0.047084689140319824, 0.2991786003112793, 0.5512733459472656, 0.8033671975135803, 1.055461049079895, 1.3075549602508545, 1.5596487522125244, 1.8117425441741943, 2.0638365745544434, 2.3159303665161133, 2.568024158477783, 2.820117950439453, 3.072211742401123, 3.324305772781372, 3.576399564743042, 3.828493356704712, 4.080587387084961, 4.332681179046631, 4.584774971008301, 4.836868762969971, 5.088962554931641, 5.3410563468933105, 5.5931501388549805, 5.845244407653809, 6.0973381996154785, 6.349431991577148, 6.601525783538818, 6.853619575500488, 7.105713367462158, 7.357807159423828, 7.609901428222656, 7.861994743347168, 8.114089012145996, 8.366182327270508, 8.618276596069336]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 16.0, 19.0, 35.0, 68.0, 95.0, 158.0, 251.0, 411.0, 623.0, 1083.0, 1743.0, 2828.0, 4714.0, 7535.0, 11752.0, 18425.0, 27274.0, 40217.0, 57174.0, 77683.0, 101516.0, 139276.0, 158053.0, 112234.0, 85687.0, 64222.0, 45651.0, 31301.0, 21287.0, 13941.0, 8838.0, 5490.0, 3435.0, 2130.0, 1269.0, 783.0, 509.0, 310.0, 202.0, 112.0, 59.0, 50.0, 27.0, 22.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.625, -23.904541015625, -23.18408203125, -22.463623046875, -21.7431640625, -21.022705078125, -20.30224609375, -19.581787109375, -18.861328125, -18.140869140625, -17.42041015625, -16.699951171875, -15.9794921875, -15.259033203125, -14.53857421875, -13.818115234375, -13.09765625, -12.377197265625, -11.65673828125, -10.936279296875, -10.2158203125, -9.495361328125, -8.77490234375, -8.054443359375, -7.333984375, -6.613525390625, -5.89306640625, -5.172607421875, -4.4521484375, -3.731689453125, -3.01123046875, -2.290771484375, -1.5703125, -0.849853515625, -0.12939453125, 0.591064453125, 1.3115234375, 2.031982421875, 2.75244140625, 3.472900390625, 4.193359375, 4.913818359375, 5.63427734375, 6.354736328125, 7.0751953125, 7.795654296875, 8.51611328125, 9.236572265625, 9.95703125, 10.677490234375, 11.39794921875, 12.118408203125, 12.8388671875, 13.559326171875, 14.27978515625, 15.000244140625, 15.720703125, 16.441162109375, 17.16162109375, 17.882080078125, 18.6025390625, 19.322998046875, 20.04345703125, 20.763916015625, 21.484375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 25.0, 18.0, 13.0, 26.0, 38.0, 43.0, 42.0, 41.0, 53.0, 61.0, 65.0, 69.0, 62.0, 61.0, 49.0, 32.0, 31.0, 23.0, 24.0, 27.0, 26.0, 12.0, 18.0, 14.0, 15.0, 9.0, 3.0, 5.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.316650390625, -8.98486328125, -8.653076171875, -8.3212890625, -7.989501953125, -7.65771484375, -7.325927734375, -6.994140625, -6.662353515625, -6.33056640625, -5.998779296875, -5.6669921875, -5.335205078125, -5.00341796875, -4.671630859375, -4.33984375, -4.008056640625, -3.67626953125, -3.344482421875, -3.0126953125, -2.680908203125, -2.34912109375, -2.017333984375, -1.685546875, -1.353759765625, -1.02197265625, -0.690185546875, -0.3583984375, -0.026611328125, 0.30517578125, 0.636962890625, 0.96875, 1.300537109375, 1.63232421875, 1.964111328125, 2.2958984375, 2.627685546875, 2.95947265625, 3.291259765625, 3.623046875, 3.954833984375, 4.28662109375, 4.618408203125, 4.9501953125, 5.281982421875, 5.61376953125, 5.945556640625, 6.27734375, 6.609130859375, 6.94091796875, 7.272705078125, 7.6044921875, 7.936279296875, 8.26806640625, 8.599853515625, 8.931640625, 9.263427734375, 9.59521484375, 9.927001953125, 10.2587890625, 10.590576171875, 10.92236328125, 11.254150390625, 11.5859375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 9.0, 13.0, 10.0, 16.0, 16.0, 22.0, 28.0, 28.0, 36.0, 31.0, 39.0, 64.0, 54.0, 49.0, 53.0, 59.0, 43.0, 55.0, 50.0, 34.0, 46.0, 38.0, 37.0, 26.0, 29.0, 19.0, 15.0, 15.0, 8.0, 12.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.451366424560547, -6.244081974029541, -6.036797523498535, -5.829513072967529, -5.622228622436523, -5.414944171905518, -5.207659721374512, -5.000375747680664, -4.7930908203125, -4.585806369781494, -4.378521919250488, -4.171237468719482, -3.9639530181884766, -3.7566685676574707, -3.549384355545044, -3.342099905014038, -3.1348156929016113, -2.9275312423706055, -2.7202467918395996, -2.5129623413085938, -2.305677890777588, -2.098393440246582, -1.8911092281341553, -1.6838247776031494, -1.4765403270721436, -1.2692558765411377, -1.0619714260101318, -0.8546870946884155, -0.6474026441574097, -0.4401181936264038, -0.2328338623046875, -0.02554941177368164, 0.18173551559448242, 0.3890199363231659, 0.5963043570518494, 0.8035887479782104, 1.0108731985092163, 1.2181576490402222, 1.4254419803619385, 1.6327264308929443, 1.8400108814239502, 2.047295331954956, 2.254579782485962, 2.4618639945983887, 2.6691484451293945, 2.8764328956604004, 3.0837173461914062, 3.291001796722412, 3.498286247253418, 3.705570697784424, 3.9128551483154297, 4.1201395988464355, 4.327424049377441, 4.534708499908447, 4.741992950439453, 4.949276924133301, 5.156561851501465, 5.363846302032471, 5.571130752563477, 5.778415203094482, 5.985699653625488, 6.192984104156494, 6.4002685546875, 6.607552528381348, 6.8148369789123535]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 8.0, 6.0, 13.0, 11.0, 16.0, 23.0, 15.0, 31.0, 28.0, 38.0, 33.0, 35.0, 45.0, 45.0, 48.0, 45.0, 57.0, 41.0, 48.0, 38.0, 36.0, 39.0, 43.0, 33.0, 45.0, 30.0, 29.0, 25.0, 24.0, 7.0, 14.0, 11.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.627979278564453, -5.424100875854492, -5.220222473144531, -5.01634407043457, -4.812465667724609, -4.608587265014648, -4.404709339141846, -4.200830936431885, -3.996952533721924, -3.793074131011963, -3.589195728302002, -3.38531756401062, -3.181439161300659, -2.9775607585906982, -2.7736825942993164, -2.5698041915893555, -2.3659257888793945, -2.1620473861694336, -1.9581691026687622, -1.7542908191680908, -1.5504124164581299, -1.346534013748169, -1.1426557302474976, -0.9387774467468262, -0.7348990440368652, -0.5310207009315491, -0.3271423578262329, -0.12326401472091675, 0.08061432838439941, 0.28449273109436035, 0.48837101459503174, 0.6922492980957031, 0.8961272239685059, 1.1000056266784668, 1.3038839101791382, 1.5077621936798096, 1.7116405963897705, 1.9155189990997314, 2.1193971633911133, 2.323275566101074, 2.527153968811035, 2.731032371520996, 2.934910774230957, 3.138788938522339, 3.3426673412323, 3.5465457439422607, 3.7504239082336426, 3.9543023109436035, 4.1581807136535645, 4.362059116363525, 4.565937519073486, 4.769815921783447, 4.97369384765625, 5.177572250366211, 5.381450653076172, 5.585329055786133, 5.789207458496094, 5.993085861206055, 6.196964263916016, 6.400842666625977, 6.6047210693359375, 6.808599472045898, 7.012477397918701, 7.216355800628662, 7.420234203338623]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 25.0, 34.0, 39.0, 78.0, 102.0, 146.0, 199.0, 330.0, 532.0, 806.0, 1317.0, 2168.0, 3330.0, 5413.0, 8947.0, 14418.0, 23731.0, 38487.0, 62220.0, 101652.0, 165023.0, 262525.0, 398320.0, 545724.0, 634460.0, 601583.0, 471734.0, 321557.0, 203793.0, 126650.0, 76489.0, 47312.0, 29068.0, 17646.0, 10741.0, 6525.0, 4180.0, 2508.0, 1584.0, 995.0, 677.0, 394.0, 235.0, 176.0, 132.0, 77.0, 54.0, 30.0, 27.0, 20.0, 15.0, 5.0, 10.0, 6.0, 4.0], "bins": [-4.8046875, -4.6622314453125, -4.519775390625, -4.3773193359375, -4.23486328125, -4.0924072265625, -3.949951171875, -3.8074951171875, -3.6650390625, -3.5225830078125, -3.380126953125, -3.2376708984375, -3.09521484375, -2.9527587890625, -2.810302734375, -2.6678466796875, -2.525390625, -2.3829345703125, -2.240478515625, -2.0980224609375, -1.95556640625, -1.8131103515625, -1.670654296875, -1.5281982421875, -1.3857421875, -1.2432861328125, -1.100830078125, -0.9583740234375, -0.81591796875, -0.6734619140625, -0.531005859375, -0.3885498046875, -0.24609375, -0.1036376953125, 0.038818359375, 0.1812744140625, 0.32373046875, 0.4661865234375, 0.608642578125, 0.7510986328125, 0.8935546875, 1.0360107421875, 1.178466796875, 1.3209228515625, 1.46337890625, 1.6058349609375, 1.748291015625, 1.8907470703125, 2.033203125, 2.1756591796875, 2.318115234375, 2.4605712890625, 2.60302734375, 2.7454833984375, 2.887939453125, 3.0303955078125, 3.1728515625, 3.3153076171875, 3.457763671875, 3.6002197265625, 3.74267578125, 3.8851318359375, 4.027587890625, 4.1700439453125, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 12.0, 6.0, 15.0, 18.0, 21.0, 19.0, 25.0, 31.0, 39.0, 35.0, 38.0, 35.0, 46.0, 44.0, 52.0, 25.0, 31.0, 38.0, 43.0, 38.0, 44.0, 43.0, 41.0, 33.0, 37.0, 25.0, 21.0, 21.0, 18.0, 13.0, 10.0, 11.0, 10.0, 13.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1845703125, -4.037109375, -3.8896484375, -3.7421875, -3.5947265625, -3.447265625, -3.2998046875, -3.15234375, -3.0048828125, -2.857421875, -2.7099609375, -2.5625, -2.4150390625, -2.267578125, -2.1201171875, -1.97265625, -1.8251953125, -1.677734375, -1.5302734375, -1.3828125, -1.2353515625, -1.087890625, -0.9404296875, -0.79296875, -0.6455078125, -0.498046875, -0.3505859375, -0.203125, -0.0556640625, 0.091796875, 0.2392578125, 0.38671875, 0.5341796875, 0.681640625, 0.8291015625, 0.9765625, 1.1240234375, 1.271484375, 1.4189453125, 1.56640625, 1.7138671875, 1.861328125, 2.0087890625, 2.15625, 2.3037109375, 2.451171875, 2.5986328125, 2.74609375, 2.8935546875, 3.041015625, 3.1884765625, 3.3359375, 3.4833984375, 3.630859375, 3.7783203125, 3.92578125, 4.0732421875, 4.220703125, 4.3681640625, 4.515625, 4.6630859375, 4.810546875, 4.9580078125, 5.10546875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 20.0, 32.0, 45.0, 50.0, 106.0, 162.0, 265.0, 438.0, 731.0, 1176.0, 2094.0, 3319.0, 5919.0, 9896.0, 16776.0, 27900.0, 46589.0, 76213.0, 122406.0, 190160.0, 285649.0, 405693.0, 530305.0, 598291.0, 555293.0, 436782.0, 312968.0, 211478.0, 136680.0, 85377.0, 52662.0, 31946.0, 19276.0, 11207.0, 6706.0, 3895.0, 2339.0, 1372.0, 789.0, 465.0, 278.0, 195.0, 109.0, 84.0, 53.0, 27.0, 21.0, 7.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 16.0, 29.0, 33.0, 46.0, 58.0, 83.0, 104.0, 103.0, 140.0, 167.0, 208.0, 213.0, 236.0, 257.0, 287.0, 284.0, 267.0, 258.0, 214.0, 203.0, 145.0, 125.0, 120.0, 99.0, 70.0, 65.0, 62.0, 31.0, 38.0, 22.0, 16.0, 9.0, 9.0, 12.0, 7.0, 3.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.33740234375, -2.2646484375, -2.19189453125, -2.119140625, -2.04638671875, -1.9736328125, -1.90087890625, -1.828125, -1.75537109375, -1.6826171875, -1.60986328125, -1.537109375, -1.46435546875, -1.3916015625, -1.31884765625, -1.24609375, -1.17333984375, -1.1005859375, -1.02783203125, -0.955078125, -0.88232421875, -0.8095703125, -0.73681640625, -0.6640625, -0.59130859375, -0.5185546875, -0.44580078125, -0.373046875, -0.30029296875, -0.2275390625, -0.15478515625, -0.08203125, -0.00927734375, 0.0634765625, 0.13623046875, 0.208984375, 0.28173828125, 0.3544921875, 0.42724609375, 0.5, 0.57275390625, 0.6455078125, 0.71826171875, 0.791015625, 0.86376953125, 0.9365234375, 1.00927734375, 1.08203125, 1.15478515625, 1.2275390625, 1.30029296875, 1.373046875, 1.44580078125, 1.5185546875, 1.59130859375, 1.6640625, 1.73681640625, 1.8095703125, 1.88232421875, 1.955078125, 2.02783203125, 2.1005859375, 2.17333984375, 2.24609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 19.0, 25.0, 28.0, 32.0, 28.0, 33.0, 56.0, 61.0, 54.0, 71.0, 48.0, 50.0, 69.0, 50.0, 52.0, 48.0, 36.0, 38.0, 30.0, 34.0, 21.0, 20.0, 11.0, 8.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.364202499389648, -7.164638042449951, -6.965073585510254, -6.765509605407715, -6.565945148468018, -6.36638069152832, -6.166816234588623, -5.967251777648926, -5.767687797546387, -5.5681233406066895, -5.368558883666992, -5.168994903564453, -4.969430446624756, -4.769865989685059, -4.570301532745361, -4.370737075805664, -4.171173095703125, -3.9716086387634277, -3.7720444202423096, -3.5724799633026123, -3.372915744781494, -3.173351287841797, -2.9737868309020996, -2.7742226123809814, -2.574657917022705, -2.375093460083008, -2.1755292415618896, -1.9759647846221924, -1.7764005661010742, -1.576836109161377, -1.3772717714309692, -1.1777074337005615, -0.9781432151794434, -0.7785788774490356, -0.5790145397186279, -0.37945014238357544, -0.17988580465316772, 0.01967853307723999, 0.21924293041229248, 0.4188072681427002, 0.6183716058731079, 0.8179359436035156, 1.0175002813339233, 1.217064619064331, 1.4166290760040283, 1.6161932945251465, 1.8157577514648438, 2.015322208404541, 2.214886426925659, 2.4144508838653564, 2.6140151023864746, 2.813579559326172, 3.01314377784729, 3.2127082347869873, 3.4122724533081055, 3.6118369102478027, 3.8114013671875, 4.010965824127197, 4.2105302810668945, 4.410094261169434, 4.609658718109131, 4.809223175048828, 5.008787631988525, 5.208352088928223, 5.407916069030762]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 14.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 16.0, 23.0, 15.0, 26.0, 24.0, 27.0, 23.0, 36.0, 32.0, 34.0, 31.0, 48.0, 30.0, 41.0, 31.0, 48.0, 45.0, 41.0, 33.0, 29.0, 28.0, 31.0, 29.0, 27.0, 22.0, 23.0, 19.0, 16.0, 18.0, 12.0, 8.0, 7.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.708048343658447, -4.56910514831543, -4.430161952972412, -4.2912187576293945, -4.152275562286377, -4.013332366943359, -3.8743889331817627, -3.735445737838745, -3.5965025424957275, -3.45755934715271, -3.3186161518096924, -3.179672956466675, -3.040729522705078, -2.9017863273620605, -2.762843132019043, -2.6238999366760254, -2.484956741333008, -2.3460135459899902, -2.2070703506469727, -2.068127155303955, -1.929183840751648, -1.7902406454086304, -1.6512973308563232, -1.5123541355133057, -1.373410940170288, -1.2344677448272705, -1.095524549484253, -0.9565812349319458, -0.8176380395889282, -0.6786948442459106, -0.5397515892982483, -0.40080833435058594, -0.26186561584472656, -0.1229223906993866, 0.01602083444595337, 0.15496405959129333, 0.2939072847366333, 0.4328504800796509, 0.5717937350273132, 0.7107369899749756, 0.8496801853179932, 0.9886233806610107, 1.1275665760040283, 1.2665098905563354, 1.405453085899353, 1.5443962812423706, 1.6833395957946777, 1.8222827911376953, 1.961225986480713, 2.1001691818237305, 2.239112377166748, 2.3780555725097656, 2.516998767852783, 2.655941963195801, 2.7948853969573975, 2.933828592300415, 3.0727717876434326, 3.21171498298645, 3.3506581783294678, 3.4896013736724854, 3.628544807434082, 3.7674880027770996, 3.906431198120117, 4.045374393463135, 4.184317588806152]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 25.0, 30.0, 41.0, 64.0, 81.0, 140.0, 250.0, 371.0, 638.0, 930.0, 1547.0, 2532.0, 4204.0, 7248.0, 13091.0, 24033.0, 47192.0, 95628.0, 187896.0, 268893.0, 191403.0, 97959.0, 48615.0, 24462.0, 13171.0, 7180.0, 4278.0, 2462.0, 1504.0, 987.0, 614.0, 401.0, 234.0, 155.0, 107.0, 67.0, 39.0, 20.0, 15.0, 16.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.04083251953125, -3.8824462890625, -3.72406005859375, -3.565673828125, -3.40728759765625, -3.2489013671875, -3.09051513671875, -2.93212890625, -2.77374267578125, -2.6153564453125, -2.45697021484375, -2.298583984375, -2.14019775390625, -1.9818115234375, -1.82342529296875, -1.6650390625, -1.50665283203125, -1.3482666015625, -1.18988037109375, -1.031494140625, -0.87310791015625, -0.7147216796875, -0.55633544921875, -0.39794921875, -0.23956298828125, -0.0811767578125, 0.07720947265625, 0.235595703125, 0.39398193359375, 0.5523681640625, 0.71075439453125, 0.869140625, 1.02752685546875, 1.1859130859375, 1.34429931640625, 1.502685546875, 1.66107177734375, 1.8194580078125, 1.97784423828125, 2.13623046875, 2.29461669921875, 2.4530029296875, 2.61138916015625, 2.769775390625, 2.92816162109375, 3.0865478515625, 3.24493408203125, 3.4033203125, 3.56170654296875, 3.7200927734375, 3.87847900390625, 4.036865234375, 4.19525146484375, 4.3536376953125, 4.51202392578125, 4.67041015625, 4.82879638671875, 4.9871826171875, 5.14556884765625, 5.303955078125, 5.46234130859375, 5.6207275390625, 5.77911376953125, 5.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 10.0, 14.0, 17.0, 22.0, 12.0, 25.0, 26.0, 31.0, 27.0, 43.0, 30.0, 44.0, 36.0, 49.0, 38.0, 58.0, 35.0, 29.0, 46.0, 37.0, 36.0, 33.0, 39.0, 27.0, 33.0, 37.0, 23.0, 17.0, 18.0, 9.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.41796875, -5.26171875, -5.10546875, -4.94921875, -4.79296875, -4.63671875, -4.48046875, -4.32421875, -4.16796875, -4.01171875, -3.85546875, -3.69921875, -3.54296875, -3.38671875, -3.23046875, -3.07421875, -2.91796875, -2.76171875, -2.60546875, -2.44921875, -2.29296875, -2.13671875, -1.98046875, -1.82421875, -1.66796875, -1.51171875, -1.35546875, -1.19921875, -1.04296875, -0.88671875, -0.73046875, -0.57421875, -0.41796875, -0.26171875, -0.10546875, 0.05078125, 0.20703125, 0.36328125, 0.51953125, 0.67578125, 0.83203125, 0.98828125, 1.14453125, 1.30078125, 1.45703125, 1.61328125, 1.76953125, 1.92578125, 2.08203125, 2.23828125, 2.39453125, 2.55078125, 2.70703125, 2.86328125, 3.01953125, 3.17578125, 3.33203125, 3.48828125, 3.64453125, 3.80078125, 3.95703125, 4.11328125, 4.26953125, 4.42578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 12.0, 20.0, 34.0, 40.0, 49.0, 64.0, 75.0, 158.0, 207.0, 267.0, 443.0, 608.0, 944.0, 1514.0, 2507.0, 4383.0, 8156.0, 16576.0, 38212.0, 103439.0, 298008.0, 351266.0, 132584.0, 47082.0, 19555.0, 9520.0, 4990.0, 2832.0, 1735.0, 1065.0, 654.0, 459.0, 319.0, 210.0, 148.0, 85.0, 68.0, 63.0, 39.0, 34.0, 28.0, 11.0, 12.0, 15.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.38671875, -4.2457275390625, -4.104736328125, -3.9637451171875, -3.82275390625, -3.6817626953125, -3.540771484375, -3.3997802734375, -3.2587890625, -3.1177978515625, -2.976806640625, -2.8358154296875, -2.69482421875, -2.5538330078125, -2.412841796875, -2.2718505859375, -2.130859375, -1.9898681640625, -1.848876953125, -1.7078857421875, -1.56689453125, -1.4259033203125, -1.284912109375, -1.1439208984375, -1.0029296875, -0.8619384765625, -0.720947265625, -0.5799560546875, -0.43896484375, -0.2979736328125, -0.156982421875, -0.0159912109375, 0.125, 0.2659912109375, 0.406982421875, 0.5479736328125, 0.68896484375, 0.8299560546875, 0.970947265625, 1.1119384765625, 1.2529296875, 1.3939208984375, 1.534912109375, 1.6759033203125, 1.81689453125, 1.9578857421875, 2.098876953125, 2.2398681640625, 2.380859375, 2.5218505859375, 2.662841796875, 2.8038330078125, 2.94482421875, 3.0858154296875, 3.226806640625, 3.3677978515625, 3.5087890625, 3.6497802734375, 3.790771484375, 3.9317626953125, 4.07275390625, 4.2137451171875, 4.354736328125, 4.4957275390625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 8.0, 17.0, 14.0, 16.0, 16.0, 18.0, 18.0, 20.0, 22.0, 29.0, 37.0, 31.0, 32.0, 31.0, 32.0, 36.0, 29.0, 30.0, 43.0, 44.0, 43.0, 36.0, 48.0, 33.0, 38.0, 32.0, 27.0, 22.0, 30.0, 29.0, 27.0, 11.0, 19.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.741546630859375, -2.64324951171875, -2.544952392578125, -2.4466552734375, -2.348358154296875, -2.25006103515625, -2.151763916015625, -2.053466796875, -1.955169677734375, -1.85687255859375, -1.758575439453125, -1.6602783203125, -1.561981201171875, -1.46368408203125, -1.365386962890625, -1.26708984375, -1.168792724609375, -1.07049560546875, -0.972198486328125, -0.8739013671875, -0.775604248046875, -0.67730712890625, -0.579010009765625, -0.480712890625, -0.382415771484375, -0.28411865234375, -0.185821533203125, -0.0875244140625, 0.010772705078125, 0.10906982421875, 0.207366943359375, 0.3056640625, 0.403961181640625, 0.50225830078125, 0.600555419921875, 0.6988525390625, 0.797149658203125, 0.89544677734375, 0.993743896484375, 1.092041015625, 1.190338134765625, 1.28863525390625, 1.386932373046875, 1.4852294921875, 1.583526611328125, 1.68182373046875, 1.780120849609375, 1.87841796875, 1.976715087890625, 2.07501220703125, 2.173309326171875, 2.2716064453125, 2.369903564453125, 2.46820068359375, 2.566497802734375, 2.664794921875, 2.763092041015625, 2.86138916015625, 2.959686279296875, 3.0579833984375, 3.156280517578125, 3.25457763671875, 3.352874755859375, 3.451171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 16.0, 18.0, 19.0, 33.0, 49.0, 84.0, 126.0, 213.0, 301.0, 480.0, 878.0, 1626.0, 4419.0, 28056.0, 978213.0, 25996.0, 4214.0, 1618.0, 831.0, 512.0, 292.0, 189.0, 113.0, 77.0, 58.0, 26.0, 20.0, 16.0, 11.0, 12.0, 9.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.064453125, -18.31640625, -17.568359375, -16.8203125, -16.072265625, -15.32421875, -14.576171875, -13.828125, -13.080078125, -12.33203125, -11.583984375, -10.8359375, -10.087890625, -9.33984375, -8.591796875, -7.84375, -7.095703125, -6.34765625, -5.599609375, -4.8515625, -4.103515625, -3.35546875, -2.607421875, -1.859375, -1.111328125, -0.36328125, 0.384765625, 1.1328125, 1.880859375, 2.62890625, 3.376953125, 4.125, 4.873046875, 5.62109375, 6.369140625, 7.1171875, 7.865234375, 8.61328125, 9.361328125, 10.109375, 10.857421875, 11.60546875, 12.353515625, 13.1015625, 13.849609375, 14.59765625, 15.345703125, 16.09375, 16.841796875, 17.58984375, 18.337890625, 19.0859375, 19.833984375, 20.58203125, 21.330078125, 22.078125, 22.826171875, 23.57421875, 24.322265625, 25.0703125, 25.818359375, 26.56640625, 27.314453125, 28.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 11.0, 33.0, 58.0, 221.0, 408.0, 136.0, 47.0, 23.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007940083742141724, -0.0007669031620025635, -0.0007397979497909546, -0.0007126927375793457, -0.0006855875253677368, -0.0006584823131561279, -0.000631377100944519, -0.0006042718887329102, -0.0005771666765213013, -0.0005500614643096924, -0.0005229562520980835, -0.0004958510398864746, -0.0004687458276748657, -0.00044164061546325684, -0.00041453540325164795, -0.00038743019104003906, -0.0003603249788284302, -0.0003332197666168213, -0.0003061145544052124, -0.0002790093421936035, -0.00025190412998199463, -0.00022479891777038574, -0.00019769370555877686, -0.00017058849334716797, -0.00014348328113555908, -0.0001163780689239502, -8.927285671234131e-05, -6.216764450073242e-05, -3.5062432289123535e-05, -7.957220077514648e-06, 1.9147992134094238e-05, 4.6253204345703125e-05, 7.335841655731201e-05, 0.0001004636287689209, 0.00012756884098052979, 0.00015467405319213867, 0.00018177926540374756, 0.00020888447761535645, 0.00023598968982696533, 0.0002630949020385742, 0.0002902001142501831, 0.000317305326461792, 0.0003444105386734009, 0.00037151575088500977, 0.00039862096309661865, 0.00042572617530822754, 0.0004528313875198364, 0.0004799365997314453, 0.0005070418119430542, 0.0005341470241546631, 0.000561252236366272, 0.0005883574485778809, 0.0006154626607894897, 0.0006425678730010986, 0.0006696730852127075, 0.0006967782974243164, 0.0007238835096359253, 0.0007509887218475342, 0.0007780939340591431, 0.000805199146270752, 0.0008323043584823608, 0.0008594095706939697, 0.0008865147829055786, 0.0009136199951171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 19.0, 8.0, 26.0, 32.0, 40.0, 56.0, 74.0, 115.0, 164.0, 220.0, 303.0, 411.0, 588.0, 824.0, 1158.0, 1546.0, 2312.0, 3710.0, 6001.0, 11396.0, 26493.0, 90347.0, 429666.0, 351747.0, 71797.0, 22815.0, 10104.0, 5605.0, 3465.0, 2207.0, 1549.0, 1081.0, 689.0, 552.0, 407.0, 291.0, 200.0, 156.0, 105.0, 70.0, 58.0, 38.0, 36.0, 31.0, 17.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.42608642578125, -5.2506103515625, -5.07513427734375, -4.899658203125, -4.72418212890625, -4.5487060546875, -4.37322998046875, -4.19775390625, -4.02227783203125, -3.8468017578125, -3.67132568359375, -3.495849609375, -3.32037353515625, -3.1448974609375, -2.96942138671875, -2.7939453125, -2.61846923828125, -2.4429931640625, -2.26751708984375, -2.092041015625, -1.91656494140625, -1.7410888671875, -1.56561279296875, -1.39013671875, -1.21466064453125, -1.0391845703125, -0.86370849609375, -0.688232421875, -0.51275634765625, -0.3372802734375, -0.16180419921875, 0.013671875, 0.18914794921875, 0.3646240234375, 0.54010009765625, 0.715576171875, 0.89105224609375, 1.0665283203125, 1.24200439453125, 1.41748046875, 1.59295654296875, 1.7684326171875, 1.94390869140625, 2.119384765625, 2.29486083984375, 2.4703369140625, 2.64581298828125, 2.8212890625, 2.99676513671875, 3.1722412109375, 3.34771728515625, 3.523193359375, 3.69866943359375, 3.8741455078125, 4.04962158203125, 4.22509765625, 4.40057373046875, 4.5760498046875, 4.75152587890625, 4.927001953125, 5.10247802734375, 5.2779541015625, 5.45343017578125, 5.62890625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 8.0, 12.0, 28.0, 48.0, 99.0, 160.0, 208.0, 178.0, 102.0, 58.0, 23.0, 13.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.50732421875, -2.4345703125, -2.36181640625, -2.2890625, -2.21630859375, -2.1435546875, -2.07080078125, -1.998046875, -1.92529296875, -1.8525390625, -1.77978515625, -1.70703125, -1.63427734375, -1.5615234375, -1.48876953125, -1.416015625, -1.34326171875, -1.2705078125, -1.19775390625, -1.125, -1.05224609375, -0.9794921875, -0.90673828125, -0.833984375, -0.76123046875, -0.6884765625, -0.61572265625, -0.54296875, -0.47021484375, -0.3974609375, -0.32470703125, -0.251953125, -0.17919921875, -0.1064453125, -0.03369140625, 0.0390625, 0.11181640625, 0.1845703125, 0.25732421875, 0.330078125, 0.40283203125, 0.4755859375, 0.54833984375, 0.62109375, 0.69384765625, 0.7666015625, 0.83935546875, 0.912109375, 0.98486328125, 1.0576171875, 1.13037109375, 1.203125, 1.27587890625, 1.3486328125, 1.42138671875, 1.494140625, 1.56689453125, 1.6396484375, 1.71240234375, 1.78515625, 1.85791015625, 1.9306640625, 2.00341796875, 2.076171875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 4.0, 8.0, 17.0, 8.0, 6.0, 14.0, 25.0, 20.0, 32.0, 26.0, 36.0, 29.0, 47.0, 41.0, 44.0, 64.0, 49.0, 57.0, 54.0, 40.0, 51.0, 39.0, 37.0, 42.0, 44.0, 24.0, 24.0, 22.0, 22.0, 19.0, 7.0, 7.0, 8.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.619289875030518, -5.4501519203186035, -5.281014442443848, -5.111876487731934, -4.942739009857178, -4.773601055145264, -4.604463577270508, -4.435325622558594, -4.266188144683838, -4.097050189971924, -3.927912712097168, -3.758774995803833, -3.589637279510498, -3.420499563217163, -3.251361846923828, -3.082223892211914, -2.913086175918579, -2.743948459625244, -2.574810743331909, -2.405673027038574, -2.2365353107452393, -2.0673975944519043, -1.8982597589492798, -1.7291220426559448, -1.5599843263626099, -1.390846610069275, -1.22170889377594, -1.0525710582733154, -0.8834334015846252, -0.7142956852912903, -0.5451579093933105, -0.3760201930999756, -0.20688247680664062, -0.03774474561214447, 0.13139298558235168, 0.30053073167800903, 0.469668447971344, 0.638806164264679, 0.8079439401626587, 0.9770816564559937, 1.1462193727493286, 1.3153570890426636, 1.4844948053359985, 1.653632640838623, 1.822770357131958, 1.991908073425293, 2.161045789718628, 2.330183506011963, 2.499321222305298, 2.668458938598633, 2.8375966548919678, 3.0067343711853027, 3.1758720874786377, 3.3450098037719727, 3.5141477584838867, 3.6832852363586426, 3.8524231910705566, 4.021561145782471, 4.190698623657227, 4.359836578369141, 4.5289740562438965, 4.6981120109558105, 4.867249488830566, 5.0363874435424805, 5.205524921417236]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 5.0, 6.0, 8.0, 10.0, 17.0, 19.0, 15.0, 7.0, 26.0, 21.0, 23.0, 30.0, 32.0, 29.0, 27.0, 35.0, 26.0, 38.0, 37.0, 37.0, 48.0, 30.0, 41.0, 42.0, 36.0, 28.0, 28.0, 30.0, 34.0, 23.0, 33.0, 23.0, 17.0, 21.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-4.382673263549805, -4.250843048095703, -4.119012355804443, -3.987182140350342, -3.8553519248962402, -3.7235214710235596, -3.591691017150879, -3.4598608016967773, -3.328030586242676, -3.196200132369995, -3.0643699169158936, -2.932539463043213, -2.8007092475891113, -2.6688787937164307, -2.53704833984375, -2.4052181243896484, -2.2733876705169678, -2.141557216644287, -2.0097270011901855, -1.8778965473175049, -1.7460663318634033, -1.6142358779907227, -1.4824055433273315, -1.3505752086639404, -1.2187448740005493, -1.0869145393371582, -0.9550842046737671, -0.8232538104057312, -0.6914234757423401, -0.559593141078949, -0.4277627468109131, -0.295932412147522, -0.16410207748413086, -0.03227172791957855, 0.09955862164497375, 0.23138898611068726, 0.36321932077407837, 0.4950496554374695, 0.6268800497055054, 0.7587103843688965, 0.8905407190322876, 1.0223710536956787, 1.1542013883590698, 1.286031723022461, 1.4178621768951416, 1.5496923923492432, 1.6815228462219238, 1.813353180885315, 1.945183515548706, 2.0770139694213867, 2.2088441848754883, 2.340674638748169, 2.4725048542022705, 2.604335308074951, 2.7361655235290527, 2.8679959774017334, 2.999826431274414, 3.1316568851470947, 3.2634871006011963, 3.395317554473877, 3.5271477699279785, 3.658978223800659, 3.79080867767334, 3.9226388931274414, 4.054469108581543]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 30.0, 44.0, 53.0, 101.0, 161.0, 264.0, 402.0, 631.0, 978.0, 1594.0, 2510.0, 4238.0, 6575.0, 10311.0, 16142.0, 24500.0, 36111.0, 51080.0, 68924.0, 86676.0, 101723.0, 111442.0, 111356.0, 101975.0, 86930.0, 68407.0, 51169.0, 36173.0, 24162.0, 16151.0, 10241.0, 6521.0, 4033.0, 2610.0, 1686.0, 981.0, 636.0, 372.0, 237.0, 167.0, 98.0, 45.0, 31.0, 21.0, 11.0, 5.0, 16.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.58984375, -4.45074462890625, -4.3116455078125, -4.17254638671875, -4.033447265625, -3.89434814453125, -3.7552490234375, -3.61614990234375, -3.47705078125, -3.33795166015625, -3.1988525390625, -3.05975341796875, -2.920654296875, -2.78155517578125, -2.6424560546875, -2.50335693359375, -2.3642578125, -2.22515869140625, -2.0860595703125, -1.94696044921875, -1.807861328125, -1.66876220703125, -1.5296630859375, -1.39056396484375, -1.25146484375, -1.11236572265625, -0.9732666015625, -0.83416748046875, -0.695068359375, -0.55596923828125, -0.4168701171875, -0.27777099609375, -0.138671875, 0.00042724609375, 0.1395263671875, 0.27862548828125, 0.417724609375, 0.55682373046875, 0.6959228515625, 0.83502197265625, 0.97412109375, 1.11322021484375, 1.2523193359375, 1.39141845703125, 1.530517578125, 1.66961669921875, 1.8087158203125, 1.94781494140625, 2.0869140625, 2.22601318359375, 2.3651123046875, 2.50421142578125, 2.643310546875, 2.78240966796875, 2.9215087890625, 3.06060791015625, 3.19970703125, 3.33880615234375, 3.4779052734375, 3.61700439453125, 3.756103515625, 3.89520263671875, 4.0343017578125, 4.17340087890625, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 7.0, 8.0, 10.0, 13.0, 23.0, 24.0, 21.0, 17.0, 25.0, 37.0, 38.0, 30.0, 31.0, 40.0, 53.0, 34.0, 33.0, 50.0, 48.0, 36.0, 37.0, 42.0, 33.0, 24.0, 28.0, 41.0, 28.0, 23.0, 27.0, 18.0, 16.0, 14.0, 15.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-5.015625, -4.8765869140625, -4.737548828125, -4.5985107421875, -4.45947265625, -4.3204345703125, -4.181396484375, -4.0423583984375, -3.9033203125, -3.7642822265625, -3.625244140625, -3.4862060546875, -3.34716796875, -3.2081298828125, -3.069091796875, -2.9300537109375, -2.791015625, -2.6519775390625, -2.512939453125, -2.3739013671875, -2.23486328125, -2.0958251953125, -1.956787109375, -1.8177490234375, -1.6787109375, -1.5396728515625, -1.400634765625, -1.2615966796875, -1.12255859375, -0.9835205078125, -0.844482421875, -0.7054443359375, -0.56640625, -0.4273681640625, -0.288330078125, -0.1492919921875, -0.01025390625, 0.1287841796875, 0.267822265625, 0.4068603515625, 0.5458984375, 0.6849365234375, 0.823974609375, 0.9630126953125, 1.10205078125, 1.2410888671875, 1.380126953125, 1.5191650390625, 1.658203125, 1.7972412109375, 1.936279296875, 2.0753173828125, 2.21435546875, 2.3533935546875, 2.492431640625, 2.6314697265625, 2.7705078125, 2.9095458984375, 3.048583984375, 3.1876220703125, 3.32666015625, 3.4656982421875, 3.604736328125, 3.7437744140625, 3.8828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 19.0, 17.0, 33.0, 43.0, 66.0, 146.0, 238.0, 322.0, 505.0, 746.0, 1313.0, 2147.0, 3458.0, 5567.0, 9152.0, 14708.0, 23169.0, 35971.0, 53307.0, 75009.0, 98540.0, 117690.0, 126550.0, 121282.0, 104971.0, 81787.0, 59596.0, 40778.0, 26961.0, 16761.0, 10474.0, 6610.0, 3907.0, 2542.0, 1585.0, 915.0, 560.0, 393.0, 262.0, 171.0, 94.0, 61.0, 43.0, 29.0, 20.0, 8.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2734375, -5.1119384765625, -4.950439453125, -4.7889404296875, -4.62744140625, -4.4659423828125, -4.304443359375, -4.1429443359375, -3.9814453125, -3.8199462890625, -3.658447265625, -3.4969482421875, -3.33544921875, -3.1739501953125, -3.012451171875, -2.8509521484375, -2.689453125, -2.5279541015625, -2.366455078125, -2.2049560546875, -2.04345703125, -1.8819580078125, -1.720458984375, -1.5589599609375, -1.3974609375, -1.2359619140625, -1.074462890625, -0.9129638671875, -0.75146484375, -0.5899658203125, -0.428466796875, -0.2669677734375, -0.10546875, 0.0560302734375, 0.217529296875, 0.3790283203125, 0.54052734375, 0.7020263671875, 0.863525390625, 1.0250244140625, 1.1865234375, 1.3480224609375, 1.509521484375, 1.6710205078125, 1.83251953125, 1.9940185546875, 2.155517578125, 2.3170166015625, 2.478515625, 2.6400146484375, 2.801513671875, 2.9630126953125, 3.12451171875, 3.2860107421875, 3.447509765625, 3.6090087890625, 3.7705078125, 3.9320068359375, 4.093505859375, 4.2550048828125, 4.41650390625, 4.5780029296875, 4.739501953125, 4.9010009765625, 5.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 13.0, 16.0, 12.0, 19.0, 19.0, 21.0, 22.0, 30.0, 35.0, 35.0, 38.0, 37.0, 47.0, 55.0, 51.0, 44.0, 39.0, 49.0, 47.0, 39.0, 39.0, 38.0, 30.0, 23.0, 25.0, 24.0, 20.0, 14.0, 13.0, 12.0, 10.0, 8.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.063262939453125, -2.96441650390625, -2.865570068359375, -2.7667236328125, -2.667877197265625, -2.56903076171875, -2.470184326171875, -2.371337890625, -2.272491455078125, -2.17364501953125, -2.074798583984375, -1.9759521484375, -1.877105712890625, -1.77825927734375, -1.679412841796875, -1.58056640625, -1.481719970703125, -1.38287353515625, -1.284027099609375, -1.1851806640625, -1.086334228515625, -0.98748779296875, -0.888641357421875, -0.789794921875, -0.690948486328125, -0.59210205078125, -0.493255615234375, -0.3944091796875, -0.295562744140625, -0.19671630859375, -0.097869873046875, 0.0009765625, 0.099822998046875, 0.19866943359375, 0.297515869140625, 0.3963623046875, 0.495208740234375, 0.59405517578125, 0.692901611328125, 0.791748046875, 0.890594482421875, 0.98944091796875, 1.088287353515625, 1.1871337890625, 1.285980224609375, 1.38482666015625, 1.483673095703125, 1.58251953125, 1.681365966796875, 1.78021240234375, 1.879058837890625, 1.9779052734375, 2.076751708984375, 2.17559814453125, 2.274444580078125, 2.373291015625, 2.472137451171875, 2.57098388671875, 2.669830322265625, 2.7686767578125, 2.867523193359375, 2.96636962890625, 3.065216064453125, 3.1640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 11.0, 13.0, 23.0, 22.0, 34.0, 41.0, 64.0, 92.0, 120.0, 168.0, 234.0, 373.0, 542.0, 821.0, 1304.0, 2198.0, 3693.0, 6567.0, 12338.0, 23544.0, 45969.0, 85466.0, 141070.0, 190806.0, 192863.0, 145926.0, 90202.0, 48539.0, 25288.0, 13051.0, 6923.0, 3818.0, 2247.0, 1377.0, 877.0, 594.0, 401.0, 252.0, 178.0, 139.0, 94.0, 83.0, 53.0, 32.0, 31.0, 10.0, 22.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.11846923828125, -2.0455322265625, -1.97259521484375, -1.899658203125, -1.82672119140625, -1.7537841796875, -1.68084716796875, -1.60791015625, -1.53497314453125, -1.4620361328125, -1.38909912109375, -1.316162109375, -1.24322509765625, -1.1702880859375, -1.09735107421875, -1.0244140625, -0.95147705078125, -0.8785400390625, -0.80560302734375, -0.732666015625, -0.65972900390625, -0.5867919921875, -0.51385498046875, -0.44091796875, -0.36798095703125, -0.2950439453125, -0.22210693359375, -0.149169921875, -0.07623291015625, -0.0032958984375, 0.06964111328125, 0.142578125, 0.21551513671875, 0.2884521484375, 0.36138916015625, 0.434326171875, 0.50726318359375, 0.5802001953125, 0.65313720703125, 0.72607421875, 0.79901123046875, 0.8719482421875, 0.94488525390625, 1.017822265625, 1.09075927734375, 1.1636962890625, 1.23663330078125, 1.3095703125, 1.38250732421875, 1.4554443359375, 1.52838134765625, 1.601318359375, 1.67425537109375, 1.7471923828125, 1.82012939453125, 1.89306640625, 1.96600341796875, 2.0389404296875, 2.11187744140625, 2.184814453125, 2.25775146484375, 2.3306884765625, 2.40362548828125, 2.4765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 2.0, 4.0, 10.0, 16.0, 20.0, 28.0, 22.0, 42.0, 34.0, 45.0, 58.0, 55.0, 72.0, 65.0, 87.0, 68.0, 60.0, 62.0, 50.0, 44.0, 41.0, 28.0, 24.0, 13.0, 13.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021754205226898193, -0.0002097785472869873, -0.00020201504230499268, -0.00019425153732299805, -0.00018648803234100342, -0.0001787245273590088, -0.00017096102237701416, -0.00016319751739501953, -0.0001554340124130249, -0.00014767050743103027, -0.00013990700244903564, -0.00013214349746704102, -0.0001243799924850464, -0.00011661648750305176, -0.00010885298252105713, -0.0001010894775390625, -9.332597255706787e-05, -8.556246757507324e-05, -7.779896259307861e-05, -7.003545761108398e-05, -6.227195262908936e-05, -5.4508447647094727e-05, -4.67449426651001e-05, -3.898143768310547e-05, -3.121793270111084e-05, -2.345442771911621e-05, -1.5690922737121582e-05, -7.927417755126953e-06, -1.6391277313232422e-07, 7.599592208862305e-06, 1.5363097190856934e-05, 2.3126602172851562e-05, 3.089010715484619e-05, 3.865361213684082e-05, 4.641711711883545e-05, 5.418062210083008e-05, 6.194412708282471e-05, 6.970763206481934e-05, 7.747113704681396e-05, 8.52346420288086e-05, 9.299814701080322e-05, 0.00010076165199279785, 0.00010852515697479248, 0.00011628866195678711, 0.00012405216693878174, 0.00013181567192077637, 0.000139579176902771, 0.00014734268188476562, 0.00015510618686676025, 0.00016286969184875488, 0.0001706331968307495, 0.00017839670181274414, 0.00018616020679473877, 0.0001939237117767334, 0.00020168721675872803, 0.00020945072174072266, 0.00021721422672271729, 0.00022497773170471191, 0.00023274123668670654, 0.00024050474166870117, 0.0002482682466506958, 0.00025603175163269043, 0.00026379525661468506, 0.0002715587615966797]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 1.0, 9.0, 12.0, 16.0, 12.0, 14.0, 26.0, 32.0, 42.0, 61.0, 84.0, 114.0, 116.0, 190.0, 275.0, 495.0, 821.0, 1465.0, 2728.0, 5407.0, 10136.0, 19336.0, 37308.0, 67574.0, 111863.0, 157183.0, 181363.0, 165040.0, 120948.0, 75988.0, 42284.0, 22590.0, 11659.0, 5953.0, 3126.0, 1674.0, 908.0, 575.0, 367.0, 217.0, 143.0, 98.0, 80.0, 58.0, 35.0, 38.0, 23.0, 20.0, 8.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-2.029296875, -1.9670562744140625, -1.904815673828125, -1.8425750732421875, -1.78033447265625, -1.7180938720703125, -1.655853271484375, -1.5936126708984375, -1.5313720703125, -1.4691314697265625, -1.406890869140625, -1.3446502685546875, -1.28240966796875, -1.2201690673828125, -1.157928466796875, -1.0956878662109375, -1.033447265625, -0.9712066650390625, -0.908966064453125, -0.8467254638671875, -0.78448486328125, -0.7222442626953125, -0.660003662109375, -0.5977630615234375, -0.5355224609375, -0.4732818603515625, -0.411041259765625, -0.3488006591796875, -0.28656005859375, -0.2243194580078125, -0.162078857421875, -0.0998382568359375, -0.03759765625, 0.0246429443359375, 0.086883544921875, 0.1491241455078125, 0.21136474609375, 0.2736053466796875, 0.335845947265625, 0.3980865478515625, 0.4603271484375, 0.5225677490234375, 0.584808349609375, 0.6470489501953125, 0.70928955078125, 0.7715301513671875, 0.833770751953125, 0.8960113525390625, 0.958251953125, 1.0204925537109375, 1.082733154296875, 1.1449737548828125, 1.20721435546875, 1.2694549560546875, 1.331695556640625, 1.3939361572265625, 1.4561767578125, 1.5184173583984375, 1.580657958984375, 1.6428985595703125, 1.70513916015625, 1.7673797607421875, 1.829620361328125, 1.8918609619140625, 1.9541015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 17.0, 14.0, 35.0, 36.0, 44.0, 38.0, 39.0, 42.0, 61.0, 64.0, 62.0, 63.0, 60.0, 55.0, 50.0, 50.0, 43.0, 44.0, 24.0, 30.0, 26.0, 13.0, 12.0, 11.0, 6.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6356277465820312, -0.6130523681640625, -0.5904769897460938, -0.567901611328125, -0.5453262329101562, -0.5227508544921875, -0.5001754760742188, -0.47760009765625, -0.45502471923828125, -0.4324493408203125, -0.40987396240234375, -0.387298583984375, -0.36472320556640625, -0.3421478271484375, -0.31957244873046875, -0.2969970703125, -0.27442169189453125, -0.2518463134765625, -0.22927093505859375, -0.206695556640625, -0.18412017822265625, -0.1615447998046875, -0.13896942138671875, -0.11639404296875, -0.09381866455078125, -0.0712432861328125, -0.04866790771484375, -0.026092529296875, -0.00351715087890625, 0.0190582275390625, 0.04163360595703125, 0.064208984375, 0.08678436279296875, 0.1093597412109375, 0.13193511962890625, 0.154510498046875, 0.17708587646484375, 0.1996612548828125, 0.22223663330078125, 0.24481201171875, 0.26738739013671875, 0.2899627685546875, 0.31253814697265625, 0.335113525390625, 0.35768890380859375, 0.3802642822265625, 0.40283966064453125, 0.4254150390625, 0.44799041748046875, 0.4705657958984375, 0.49314117431640625, 0.515716552734375, 0.5382919311523438, 0.5608673095703125, 0.5834426879882812, 0.60601806640625, 0.6285934448242188, 0.6511688232421875, 0.6737442016601562, 0.696319580078125, 0.7188949584960938, 0.7414703369140625, 0.7640457153320312, 0.78662109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 5.0, 11.0, 14.0, 12.0, 13.0, 13.0, 16.0, 21.0, 19.0, 35.0, 28.0, 33.0, 35.0, 43.0, 45.0, 64.0, 53.0, 45.0, 55.0, 44.0, 47.0, 35.0, 29.0, 39.0, 39.0, 34.0, 28.0, 27.0, 25.0, 21.0, 8.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.122591495513916, -4.962081432342529, -4.801571369171143, -4.641060829162598, -4.480550765991211, -4.320040702819824, -4.1595306396484375, -3.9990203380584717, -3.838510036468506, -3.677999973297119, -3.5174896717071533, -3.3569796085357666, -3.196469306945801, -3.035959243774414, -2.8754491806030273, -2.7149388790130615, -2.554428815841675, -2.393918752670288, -2.2334084510803223, -2.0728983879089355, -1.9123880863189697, -1.751878023147583, -1.5913678407669067, -1.4308576583862305, -1.2703474760055542, -1.109837293624878, -0.9493271112442017, -0.7888169884681702, -0.6283068060874939, -0.4677966237068176, -0.30728650093078613, -0.14677631855010986, 0.013733863830566406, 0.17424403131008148, 0.33475419878959656, 0.49526435136795044, 0.6557745337486267, 0.816284716129303, 0.9767948389053345, 1.1373050212860107, 1.297815203666687, 1.4583253860473633, 1.6188355684280396, 1.7793457508087158, 1.9398558139801025, 2.1003661155700684, 2.260876178741455, 2.421386241912842, 2.5818965435028076, 2.7424066066741943, 2.90291690826416, 3.063426971435547, 3.2239372730255127, 3.3844473361968994, 3.5449576377868652, 3.705467700958252, 3.8659777641296387, 4.026487827301025, 4.186997890472412, 4.347508430480957, 4.508018493652344, 4.6685285568237305, 4.829038619995117, 4.989548683166504, 5.150059223175049]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 10.0, 12.0, 15.0, 22.0, 14.0, 30.0, 24.0, 31.0, 29.0, 30.0, 36.0, 53.0, 35.0, 39.0, 42.0, 50.0, 44.0, 47.0, 34.0, 34.0, 36.0, 44.0, 29.0, 31.0, 34.0, 22.0, 21.0, 16.0, 20.0, 11.0, 13.0, 10.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021089553833008, -4.866550922393799, -4.71201229095459, -4.557473182678223, -4.402934551239014, -4.248395919799805, -4.093857288360596, -3.9393186569213867, -3.7847800254821777, -3.6302413940429688, -3.4757025241851807, -3.3211638927459717, -3.1666252613067627, -3.0120863914489746, -2.8575477600097656, -2.7030091285705566, -2.5484702587127686, -2.3939316272735596, -2.2393927574157715, -2.0848541259765625, -1.9303154945373535, -1.775776743888855, -1.6212379932403564, -1.4666993618011475, -1.312160611152649, -1.1576218605041504, -1.0030832290649414, -0.8485444784164429, -0.6940057873725891, -0.5394670963287354, -0.3849283456802368, -0.23038971424102783, -0.0758509635925293, 0.07868774235248566, 0.2332264482975006, 0.38776516914367676, 0.5423038601875305, 0.6968425512313843, 0.8513813018798828, 1.0059199333190918, 1.1604586839675903, 1.3149974346160889, 1.4695360660552979, 1.6240748167037964, 1.778613567352295, 1.933152198791504, 2.087690830230713, 2.242229461669922, 2.39676833152771, 2.551306962966919, 2.705845832824707, 2.860384464263916, 3.014923095703125, 3.169461727142334, 3.324000597000122, 3.478539228439331, 3.633078098297119, 3.787616729736328, 3.942155599594116, 4.096693992614746, 4.251233100891113, 4.405771732330322, 4.560310363769531, 4.71484899520874, 4.869387626647949]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 7.0, 23.0, 20.0, 57.0, 79.0, 129.0, 240.0, 389.0, 644.0, 1086.0, 1690.0, 2903.0, 4884.0, 7936.0, 13549.0, 22353.0, 37250.0, 61627.0, 101512.0, 163475.0, 256915.0, 380127.0, 509729.0, 596424.0, 583854.0, 486224.0, 353835.0, 234928.0, 147725.0, 90589.0, 54667.0, 32431.0, 19222.0, 11378.0, 6745.0, 3961.0, 2298.0, 1391.0, 827.0, 479.0, 264.0, 172.0, 107.0, 53.0, 35.0, 21.0, 15.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.25, -4.128204345703125, -4.00640869140625, -3.884613037109375, -3.7628173828125, -3.641021728515625, -3.51922607421875, -3.397430419921875, -3.275634765625, -3.153839111328125, -3.03204345703125, -2.910247802734375, -2.7884521484375, -2.666656494140625, -2.54486083984375, -2.423065185546875, -2.30126953125, -2.179473876953125, -2.05767822265625, -1.935882568359375, -1.8140869140625, -1.692291259765625, -1.57049560546875, -1.448699951171875, -1.326904296875, -1.205108642578125, -1.08331298828125, -0.961517333984375, -0.8397216796875, -0.717926025390625, -0.59613037109375, -0.474334716796875, -0.3525390625, -0.230743408203125, -0.10894775390625, 0.012847900390625, 0.1346435546875, 0.256439208984375, 0.37823486328125, 0.500030517578125, 0.621826171875, 0.743621826171875, 0.86541748046875, 0.987213134765625, 1.1090087890625, 1.230804443359375, 1.35260009765625, 1.474395751953125, 1.59619140625, 1.717987060546875, 1.83978271484375, 1.961578369140625, 2.0833740234375, 2.205169677734375, 2.32696533203125, 2.448760986328125, 2.570556640625, 2.692352294921875, 2.81414794921875, 2.935943603515625, 3.0577392578125, 3.179534912109375, 3.30133056640625, 3.423126220703125, 3.544921875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 6.0, 11.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 26.0, 28.0, 38.0, 37.0, 27.0, 44.0, 35.0, 50.0, 34.0, 43.0, 57.0, 42.0, 41.0, 30.0, 50.0, 40.0, 39.0, 34.0, 32.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 8.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.479644775390625, -3.35577392578125, -3.231903076171875, -3.1080322265625, -2.984161376953125, -2.86029052734375, -2.736419677734375, -2.612548828125, -2.488677978515625, -2.36480712890625, -2.240936279296875, -2.1170654296875, -1.993194580078125, -1.86932373046875, -1.745452880859375, -1.62158203125, -1.497711181640625, -1.37384033203125, -1.249969482421875, -1.1260986328125, -1.002227783203125, -0.87835693359375, -0.754486083984375, -0.630615234375, -0.506744384765625, -0.38287353515625, -0.259002685546875, -0.1351318359375, -0.011260986328125, 0.11260986328125, 0.236480712890625, 0.3603515625, 0.484222412109375, 0.60809326171875, 0.731964111328125, 0.8558349609375, 0.979705810546875, 1.10357666015625, 1.227447509765625, 1.351318359375, 1.475189208984375, 1.59906005859375, 1.722930908203125, 1.8468017578125, 1.970672607421875, 2.09454345703125, 2.218414306640625, 2.34228515625, 2.466156005859375, 2.59002685546875, 2.713897705078125, 2.8377685546875, 2.961639404296875, 3.08551025390625, 3.209381103515625, 3.333251953125, 3.457122802734375, 3.58099365234375, 3.704864501953125, 3.8287353515625, 3.952606201171875, 4.07647705078125, 4.200347900390625, 4.32421875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 16.0, 15.0, 31.0, 70.0, 82.0, 164.0, 277.0, 460.0, 914.0, 1554.0, 2873.0, 5252.0, 9363.0, 17180.0, 29773.0, 51312.0, 86806.0, 142476.0, 221547.0, 327103.0, 444346.0, 539694.0, 570593.0, 520358.0, 416514.0, 299272.0, 199450.0, 126904.0, 76408.0, 44967.0, 25758.0, 14409.0, 8047.0, 4601.0, 2482.0, 1438.0, 781.0, 448.0, 216.0, 147.0, 78.0, 38.0, 24.0, 20.0, 7.0, 8.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.359375, -4.23614501953125, -4.1129150390625, -3.98968505859375, -3.866455078125, -3.74322509765625, -3.6199951171875, -3.49676513671875, -3.37353515625, -3.25030517578125, -3.1270751953125, -3.00384521484375, -2.880615234375, -2.75738525390625, -2.6341552734375, -2.51092529296875, -2.3876953125, -2.26446533203125, -2.1412353515625, -2.01800537109375, -1.894775390625, -1.77154541015625, -1.6483154296875, -1.52508544921875, -1.40185546875, -1.27862548828125, -1.1553955078125, -1.03216552734375, -0.908935546875, -0.78570556640625, -0.6624755859375, -0.53924560546875, -0.416015625, -0.29278564453125, -0.1695556640625, -0.04632568359375, 0.076904296875, 0.20013427734375, 0.3233642578125, 0.44659423828125, 0.56982421875, 0.69305419921875, 0.8162841796875, 0.93951416015625, 1.062744140625, 1.18597412109375, 1.3092041015625, 1.43243408203125, 1.5556640625, 1.67889404296875, 1.8021240234375, 1.92535400390625, 2.048583984375, 2.17181396484375, 2.2950439453125, 2.41827392578125, 2.54150390625, 2.66473388671875, 2.7879638671875, 2.91119384765625, 3.034423828125, 3.15765380859375, 3.2808837890625, 3.40411376953125, 3.52734375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 11.0, 14.0, 12.0, 13.0, 25.0, 32.0, 33.0, 45.0, 44.0, 60.0, 93.0, 88.0, 118.0, 137.0, 160.0, 183.0, 183.0, 214.0, 236.0, 252.0, 241.0, 258.0, 233.0, 186.0, 204.0, 166.0, 132.0, 136.0, 107.0, 96.0, 70.0, 69.0, 47.0, 32.0, 28.0, 29.0, 17.0, 21.0, 15.0, 9.0, 5.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.650390625, -1.595611572265625, -1.54083251953125, -1.486053466796875, -1.4312744140625, -1.376495361328125, -1.32171630859375, -1.266937255859375, -1.212158203125, -1.157379150390625, -1.10260009765625, -1.047821044921875, -0.9930419921875, -0.938262939453125, -0.88348388671875, -0.828704833984375, -0.77392578125, -0.719146728515625, -0.66436767578125, -0.609588623046875, -0.5548095703125, -0.500030517578125, -0.44525146484375, -0.390472412109375, -0.335693359375, -0.280914306640625, -0.22613525390625, -0.171356201171875, -0.1165771484375, -0.061798095703125, -0.00701904296875, 0.047760009765625, 0.1025390625, 0.157318115234375, 0.21209716796875, 0.266876220703125, 0.3216552734375, 0.376434326171875, 0.43121337890625, 0.485992431640625, 0.540771484375, 0.595550537109375, 0.65032958984375, 0.705108642578125, 0.7598876953125, 0.814666748046875, 0.86944580078125, 0.924224853515625, 0.97900390625, 1.033782958984375, 1.08856201171875, 1.143341064453125, 1.1981201171875, 1.252899169921875, 1.30767822265625, 1.362457275390625, 1.417236328125, 1.472015380859375, 1.52679443359375, 1.581573486328125, 1.6363525390625, 1.691131591796875, 1.74591064453125, 1.800689697265625, 1.85546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 14.0, 17.0, 9.0, 16.0, 22.0, 30.0, 33.0, 36.0, 46.0, 35.0, 50.0, 43.0, 53.0, 56.0, 51.0, 52.0, 52.0, 39.0, 45.0, 36.0, 42.0, 39.0, 29.0, 22.0, 31.0, 15.0, 10.0, 15.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9960076808929443, -3.8486523628234863, -3.7012972831726074, -3.5539419651031494, -3.4065866470336914, -3.2592313289642334, -3.1118760108947754, -2.9645209312438965, -2.8171656131744385, -2.6698102951049805, -2.5224552154541016, -2.3750998973846436, -2.2277445793151855, -2.0803892612457275, -1.933034062385559, -1.7856788635253906, -1.6383235454559326, -1.4909682273864746, -1.3436130285263062, -1.1962578296661377, -1.0489025115966797, -0.9015472531318665, -0.7541919946670532, -0.6068367958068848, -0.45948147773742676, -0.3121262192726135, -0.1647709608078003, -0.01741570234298706, 0.12993955612182617, 0.2772948145866394, 0.42465007305145264, 0.5720052719116211, 0.7193608283996582, 0.8667160868644714, 1.0140713453292847, 1.1614265441894531, 1.3087818622589111, 1.4561371803283691, 1.6034923791885376, 1.750847578048706, 1.898202896118164, 2.045558214187622, 2.19291353225708, 2.340268611907959, 2.487623929977417, 2.634979248046875, 2.782334327697754, 2.929689645767212, 3.07704496383667, 3.224400281906128, 3.371755599975586, 3.519110679626465, 3.666465997695923, 3.813821315765381, 3.9611763954162598, 4.108531951904297, 4.255887031555176, 4.403242111206055, 4.550597667694092, 4.697952747344971, 4.845308303833008, 4.992663383483887, 5.140018463134766, 5.2873735427856445, 5.434729099273682]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 7.0, 11.0, 11.0, 8.0, 13.0, 14.0, 17.0, 14.0, 22.0, 28.0, 26.0, 27.0, 26.0, 32.0, 41.0, 43.0, 33.0, 49.0, 32.0, 38.0, 43.0, 48.0, 27.0, 49.0, 40.0, 39.0, 30.0, 34.0, 23.0, 30.0, 21.0, 18.0, 21.0, 13.0, 16.0, 9.0, 8.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.188475131988525, -4.064115047454834, -3.9397549629211426, -3.815394878387451, -3.6910347938537598, -3.5666747093200684, -3.442314624786377, -3.3179545402526855, -3.193594455718994, -3.0692343711853027, -2.9448742866516113, -2.82051420211792, -2.6961541175842285, -2.571794033050537, -2.4474339485168457, -2.3230738639831543, -2.198714017868042, -2.0743539333343506, -1.9499938488006592, -1.8256337642669678, -1.7012736797332764, -1.576913595199585, -1.452553629875183, -1.3281935453414917, -1.2038334608078003, -1.0794733762741089, -0.9551132917404175, -0.8307532668113708, -0.7063931822776794, -0.582033097743988, -0.4576730728149414, -0.33331298828125, -0.2089526653289795, -0.08459259569644928, 0.03976747393608093, 0.16412752866744995, 0.28848761320114136, 0.41284769773483276, 0.5372077226638794, 0.6615678071975708, 0.7859278917312622, 0.9102879762649536, 1.034648060798645, 1.1590080261230469, 1.2833681106567383, 1.4077281951904297, 1.532088279724121, 1.6564483642578125, 1.780808448791504, 1.9051685333251953, 2.0295286178588867, 2.153888702392578, 2.2782487869262695, 2.402608871459961, 2.5269689559936523, 2.6513290405273438, 2.775689125061035, 2.9000492095947266, 3.024409294128418, 3.1487693786621094, 3.273129463195801, 3.397489547729492, 3.5218496322631836, 3.646209716796875, 3.7705695629119873]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 12.0, 20.0, 21.0, 40.0, 43.0, 75.0, 118.0, 201.0, 270.0, 446.0, 753.0, 1254.0, 2168.0, 3897.0, 7795.0, 16462.0, 37349.0, 88790.0, 210077.0, 326745.0, 199994.0, 84234.0, 35627.0, 15628.0, 7339.0, 3846.0, 2159.0, 1229.0, 720.0, 419.0, 287.0, 169.0, 100.0, 91.0, 48.0, 36.0, 21.0, 17.0, 12.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.27288818359375, -5.0809326171875, -4.88897705078125, -4.697021484375, -4.50506591796875, -4.3131103515625, -4.12115478515625, -3.92919921875, -3.73724365234375, -3.5452880859375, -3.35333251953125, -3.161376953125, -2.96942138671875, -2.7774658203125, -2.58551025390625, -2.3935546875, -2.20159912109375, -2.0096435546875, -1.81768798828125, -1.625732421875, -1.43377685546875, -1.2418212890625, -1.04986572265625, -0.85791015625, -0.66595458984375, -0.4739990234375, -0.28204345703125, -0.090087890625, 0.10186767578125, 0.2938232421875, 0.48577880859375, 0.677734375, 0.86968994140625, 1.0616455078125, 1.25360107421875, 1.445556640625, 1.63751220703125, 1.8294677734375, 2.02142333984375, 2.21337890625, 2.40533447265625, 2.5972900390625, 2.78924560546875, 2.981201171875, 3.17315673828125, 3.3651123046875, 3.55706787109375, 3.7490234375, 3.94097900390625, 4.1329345703125, 4.32489013671875, 4.516845703125, 4.70880126953125, 4.9007568359375, 5.09271240234375, 5.28466796875, 5.47662353515625, 5.6685791015625, 5.86053466796875, 6.052490234375, 6.24444580078125, 6.4364013671875, 6.62835693359375, 6.8203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 11.0, 13.0, 9.0, 20.0, 15.0, 14.0, 22.0, 34.0, 20.0, 32.0, 30.0, 25.0, 30.0, 31.0, 40.0, 40.0, 46.0, 44.0, 37.0, 33.0, 45.0, 44.0, 30.0, 35.0, 21.0, 31.0, 24.0, 22.0, 18.0, 22.0, 19.0, 21.0, 14.0, 19.0, 13.0, 6.0, 9.0, 10.0, 3.0, 1.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.728515625, -3.610595703125, -3.49267578125, -3.374755859375, -3.2568359375, -3.138916015625, -3.02099609375, -2.903076171875, -2.78515625, -2.667236328125, -2.54931640625, -2.431396484375, -2.3134765625, -2.195556640625, -2.07763671875, -1.959716796875, -1.841796875, -1.723876953125, -1.60595703125, -1.488037109375, -1.3701171875, -1.252197265625, -1.13427734375, -1.016357421875, -0.8984375, -0.780517578125, -0.66259765625, -0.544677734375, -0.4267578125, -0.308837890625, -0.19091796875, -0.072998046875, 0.044921875, 0.162841796875, 0.28076171875, 0.398681640625, 0.5166015625, 0.634521484375, 0.75244140625, 0.870361328125, 0.98828125, 1.106201171875, 1.22412109375, 1.342041015625, 1.4599609375, 1.577880859375, 1.69580078125, 1.813720703125, 1.931640625, 2.049560546875, 2.16748046875, 2.285400390625, 2.4033203125, 2.521240234375, 2.63916015625, 2.757080078125, 2.875, 2.992919921875, 3.11083984375, 3.228759765625, 3.3466796875, 3.464599609375, 3.58251953125, 3.700439453125, 3.818359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 12.0, 20.0, 27.0, 37.0, 52.0, 86.0, 98.0, 141.0, 180.0, 271.0, 363.0, 508.0, 722.0, 1086.0, 1759.0, 2833.0, 4528.0, 8055.0, 15187.0, 31146.0, 69167.0, 161390.0, 309219.0, 240138.0, 106288.0, 46141.0, 21544.0, 11107.0, 5991.0, 3616.0, 2211.0, 1424.0, 978.0, 662.0, 455.0, 333.0, 229.0, 148.0, 107.0, 80.0, 60.0, 48.0, 22.0, 23.0, 21.0, 11.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-4.29296875, -4.16943359375, -4.0458984375, -3.92236328125, -3.798828125, -3.67529296875, -3.5517578125, -3.42822265625, -3.3046875, -3.18115234375, -3.0576171875, -2.93408203125, -2.810546875, -2.68701171875, -2.5634765625, -2.43994140625, -2.31640625, -2.19287109375, -2.0693359375, -1.94580078125, -1.822265625, -1.69873046875, -1.5751953125, -1.45166015625, -1.328125, -1.20458984375, -1.0810546875, -0.95751953125, -0.833984375, -0.71044921875, -0.5869140625, -0.46337890625, -0.33984375, -0.21630859375, -0.0927734375, 0.03076171875, 0.154296875, 0.27783203125, 0.4013671875, 0.52490234375, 0.6484375, 0.77197265625, 0.8955078125, 1.01904296875, 1.142578125, 1.26611328125, 1.3896484375, 1.51318359375, 1.63671875, 1.76025390625, 1.8837890625, 2.00732421875, 2.130859375, 2.25439453125, 2.3779296875, 2.50146484375, 2.625, 2.74853515625, 2.8720703125, 2.99560546875, 3.119140625, 3.24267578125, 3.3662109375, 3.48974609375, 3.61328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 8.0, 10.0, 12.0, 13.0, 13.0, 19.0, 13.0, 20.0, 19.0, 28.0, 28.0, 18.0, 27.0, 32.0, 42.0, 43.0, 24.0, 33.0, 31.0, 32.0, 39.0, 48.0, 38.0, 40.0, 42.0, 34.0, 41.0, 24.0, 34.0, 24.0, 21.0, 19.0, 20.0, 14.0, 15.0, 17.0, 7.0, 14.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.32501220703125, -2.2457275390625, -2.16644287109375, -2.087158203125, -2.00787353515625, -1.9285888671875, -1.84930419921875, -1.77001953125, -1.69073486328125, -1.6114501953125, -1.53216552734375, -1.452880859375, -1.37359619140625, -1.2943115234375, -1.21502685546875, -1.1357421875, -1.05645751953125, -0.9771728515625, -0.89788818359375, -0.818603515625, -0.73931884765625, -0.6600341796875, -0.58074951171875, -0.50146484375, -0.42218017578125, -0.3428955078125, -0.26361083984375, -0.184326171875, -0.10504150390625, -0.0257568359375, 0.05352783203125, 0.1328125, 0.21209716796875, 0.2913818359375, 0.37066650390625, 0.449951171875, 0.52923583984375, 0.6085205078125, 0.68780517578125, 0.76708984375, 0.84637451171875, 0.9256591796875, 1.00494384765625, 1.084228515625, 1.16351318359375, 1.2427978515625, 1.32208251953125, 1.4013671875, 1.48065185546875, 1.5599365234375, 1.63922119140625, 1.718505859375, 1.79779052734375, 1.8770751953125, 1.95635986328125, 2.03564453125, 2.11492919921875, 2.1942138671875, 2.27349853515625, 2.352783203125, 2.43206787109375, 2.5113525390625, 2.59063720703125, 2.669921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 7.0, 16.0, 29.0, 47.0, 63.0, 104.0, 187.0, 272.0, 453.0, 649.0, 1083.0, 1812.0, 3224.0, 6522.0, 15726.0, 61687.0, 695563.0, 210619.0, 29825.0, 10017.0, 4678.0, 2360.0, 1365.0, 771.0, 487.0, 339.0, 234.0, 136.0, 105.0, 58.0, 35.0, 22.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.0645751953125, -5.867431640625, -5.6702880859375, -5.47314453125, -5.2760009765625, -5.078857421875, -4.8817138671875, -4.6845703125, -4.4874267578125, -4.290283203125, -4.0931396484375, -3.89599609375, -3.6988525390625, -3.501708984375, -3.3045654296875, -3.107421875, -2.9102783203125, -2.713134765625, -2.5159912109375, -2.31884765625, -2.1217041015625, -1.924560546875, -1.7274169921875, -1.5302734375, -1.3331298828125, -1.135986328125, -0.9388427734375, -0.74169921875, -0.5445556640625, -0.347412109375, -0.1502685546875, 0.046875, 0.2440185546875, 0.441162109375, 0.6383056640625, 0.83544921875, 1.0325927734375, 1.229736328125, 1.4268798828125, 1.6240234375, 1.8211669921875, 2.018310546875, 2.2154541015625, 2.41259765625, 2.6097412109375, 2.806884765625, 3.0040283203125, 3.201171875, 3.3983154296875, 3.595458984375, 3.7926025390625, 3.98974609375, 4.1868896484375, 4.384033203125, 4.5811767578125, 4.7783203125, 4.9754638671875, 5.172607421875, 5.3697509765625, 5.56689453125, 5.7640380859375, 5.961181640625, 6.1583251953125, 6.35546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 10.0, 9.0, 22.0, 27.0, 68.0, 142.0, 287.0, 206.0, 94.0, 51.0, 20.0, 22.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008754730224609375, -0.0008528754115104675, -0.0008302778005599976, -0.0008076801896095276, -0.0007850825786590576, -0.0007624849677085876, -0.0007398873567581177, -0.0007172897458076477, -0.0006946921348571777, -0.0006720945239067078, -0.0006494969129562378, -0.0006268993020057678, -0.0006043016910552979, -0.0005817040801048279, -0.0005591064691543579, -0.0005365088582038879, -0.000513911247253418, -0.000491313636302948, -0.00046871602535247803, -0.00044611841440200806, -0.0004235208034515381, -0.0004009231925010681, -0.00037832558155059814, -0.0003557279706001282, -0.0003331303596496582, -0.00031053274869918823, -0.00028793513774871826, -0.0002653375267982483, -0.00024273991584777832, -0.00022014230489730835, -0.00019754469394683838, -0.0001749470829963684, -0.00015234947204589844, -0.00012975186109542847, -0.0001071542501449585, -8.455663919448853e-05, -6.195902824401855e-05, -3.9361417293548584e-05, -1.6763806343078613e-05, 5.833804607391357e-06, 2.8431415557861328e-05, 5.10290265083313e-05, 7.362663745880127e-05, 9.622424840927124e-05, 0.00011882185935974121, 0.00014141947031021118, 0.00016401708126068115, 0.00018661469221115112, 0.0002092123031616211, 0.00023180991411209106, 0.00025440752506256104, 0.000277005136013031, 0.000299602746963501, 0.00032220035791397095, 0.0003447979688644409, 0.0003673955798149109, 0.00038999319076538086, 0.00041259080171585083, 0.0004351884126663208, 0.00045778602361679077, 0.00048038363456726074, 0.0005029812455177307, 0.0005255788564682007, 0.0005481764674186707, 0.0005707740783691406]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 16.0, 23.0, 32.0, 48.0, 52.0, 85.0, 126.0, 179.0, 230.0, 373.0, 496.0, 657.0, 986.0, 1409.0, 2205.0, 3412.0, 5424.0, 9344.0, 18558.0, 42486.0, 120809.0, 370820.0, 304261.0, 93817.0, 34234.0, 15770.0, 8360.0, 4780.0, 3125.0, 2008.0, 1319.0, 909.0, 615.0, 477.0, 316.0, 236.0, 145.0, 121.0, 87.0, 65.0, 37.0, 27.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.935546875, -3.808135986328125, -3.68072509765625, -3.553314208984375, -3.4259033203125, -3.298492431640625, -3.17108154296875, -3.043670654296875, -2.916259765625, -2.788848876953125, -2.66143798828125, -2.534027099609375, -2.4066162109375, -2.279205322265625, -2.15179443359375, -2.024383544921875, -1.89697265625, -1.769561767578125, -1.64215087890625, -1.514739990234375, -1.3873291015625, -1.259918212890625, -1.13250732421875, -1.005096435546875, -0.877685546875, -0.750274658203125, -0.62286376953125, -0.495452880859375, -0.3680419921875, -0.240631103515625, -0.11322021484375, 0.014190673828125, 0.1416015625, 0.269012451171875, 0.39642333984375, 0.523834228515625, 0.6512451171875, 0.778656005859375, 0.90606689453125, 1.033477783203125, 1.160888671875, 1.288299560546875, 1.41571044921875, 1.543121337890625, 1.6705322265625, 1.797943115234375, 1.92535400390625, 2.052764892578125, 2.18017578125, 2.307586669921875, 2.43499755859375, 2.562408447265625, 2.6898193359375, 2.817230224609375, 2.94464111328125, 3.072052001953125, 3.199462890625, 3.326873779296875, 3.45428466796875, 3.581695556640625, 3.7091064453125, 3.836517333984375, 3.96392822265625, 4.091339111328125, 4.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 4.0, 4.0, 4.0, 6.0, 15.0, 14.0, 19.0, 31.0, 40.0, 63.0, 49.0, 71.0, 72.0, 103.0, 92.0, 86.0, 69.0, 60.0, 46.0, 27.0, 25.0, 15.0, 13.0, 11.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.97802734375, -0.95001220703125, -0.9219970703125, -0.89398193359375, -0.865966796875, -0.83795166015625, -0.8099365234375, -0.78192138671875, -0.75390625, -0.72589111328125, -0.6978759765625, -0.66986083984375, -0.641845703125, -0.61383056640625, -0.5858154296875, -0.55780029296875, -0.52978515625, -0.50177001953125, -0.4737548828125, -0.44573974609375, -0.417724609375, -0.38970947265625, -0.3616943359375, -0.33367919921875, -0.3056640625, -0.27764892578125, -0.2496337890625, -0.22161865234375, -0.193603515625, -0.16558837890625, -0.1375732421875, -0.10955810546875, -0.08154296875, -0.05352783203125, -0.0255126953125, 0.00250244140625, 0.030517578125, 0.05853271484375, 0.0865478515625, 0.11456298828125, 0.142578125, 0.17059326171875, 0.1986083984375, 0.22662353515625, 0.254638671875, 0.28265380859375, 0.3106689453125, 0.33868408203125, 0.36669921875, 0.39471435546875, 0.4227294921875, 0.45074462890625, 0.478759765625, 0.50677490234375, 0.5347900390625, 0.56280517578125, 0.5908203125, 0.61883544921875, 0.6468505859375, 0.67486572265625, 0.702880859375, 0.73089599609375, 0.7589111328125, 0.78692626953125, 0.81494140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 18.0, 17.0, 30.0, 26.0, 30.0, 40.0, 45.0, 37.0, 37.0, 37.0, 35.0, 39.0, 49.0, 54.0, 49.0, 42.0, 33.0, 38.0, 24.0, 32.0, 32.0, 26.0, 31.0, 17.0, 24.0, 19.0, 11.0, 12.0, 6.0, 6.0, 13.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6007587909698486, -3.4782354831695557, -3.3557121753692627, -3.2331888675689697, -3.1106653213500977, -2.9881420135498047, -2.8656187057495117, -2.7430953979492188, -2.620572090148926, -2.498048782348633, -2.37552547454834, -2.253002166748047, -2.130478858947754, -2.007955551147461, -1.8854320049285889, -1.762908697128296, -1.640385389328003, -1.51786208152771, -1.395338773727417, -1.2728153467178345, -1.1502920389175415, -1.0277687311172485, -0.9052453637123108, -0.782721996307373, -0.6601986885070801, -0.5376753807067871, -0.41515201330184937, -0.292628675699234, -0.17010533809661865, -0.047582030296325684, 0.07494133710861206, 0.1974647045135498, 0.3199882507324219, 0.44251158833503723, 0.5650349259376526, 0.6875582933425903, 0.8100816011428833, 0.9326049089431763, 1.0551283359527588, 1.1776516437530518, 1.3001749515533447, 1.4226982593536377, 1.5452215671539307, 1.6677449941635132, 1.7902683019638062, 1.9127916097640991, 2.0353150367736816, 2.1578383445739746, 2.2803616523742676, 2.4028849601745605, 2.5254082679748535, 2.6479315757751465, 2.7704548835754395, 2.8929781913757324, 3.0155017375946045, 3.1380250453948975, 3.2605483531951904, 3.3830716609954834, 3.5055949687957764, 3.6281182765960693, 3.7506418228149414, 3.8731651306152344, 3.9956884384155273, 4.11821174621582, 4.240735054016113]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 13.0, 11.0, 7.0, 15.0, 12.0, 21.0, 12.0, 23.0, 17.0, 26.0, 25.0, 29.0, 33.0, 39.0, 30.0, 42.0, 40.0, 43.0, 52.0, 30.0, 38.0, 39.0, 41.0, 49.0, 39.0, 34.0, 34.0, 19.0, 25.0, 26.0, 23.0, 14.0, 15.0, 14.0, 12.0, 7.0, 3.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.016229152679443, -3.8973805904388428, -3.778532028198242, -3.6596834659576416, -3.540834903717041, -3.4219865798950195, -3.303138017654419, -3.1842894554138184, -3.0654408931732178, -2.946592330932617, -2.8277437686920166, -2.708895206451416, -2.5900468826293945, -2.471198081970215, -2.3523497581481934, -2.2335011959075928, -2.114652633666992, -1.9958040714263916, -1.876955509185791, -1.75810706615448, -1.6392585039138794, -1.5204099416732788, -1.4015614986419678, -1.2827129364013672, -1.1638643741607666, -1.045015811920166, -0.9261673092842102, -0.8073188066482544, -0.6884702444076538, -0.5696216821670532, -0.4507731795310974, -0.3319246768951416, -0.21307611465454102, -0.09422758221626282, 0.02462095022201538, 0.14346948266029358, 0.2623180150985718, 0.38116657733917236, 0.5000150799751282, 0.618863582611084, 0.7377121448516846, 0.8565607070922852, 0.975409209728241, 1.0942577123641968, 1.2131062746047974, 1.331954836845398, 1.450803279876709, 1.5696518421173096, 1.6885004043579102, 1.8073489665985107, 1.9261975288391113, 2.045046091079712, 2.1638946533203125, 2.282742977142334, 2.4015915393829346, 2.520440101623535, 2.6392886638641357, 2.7581372261047363, 2.876985788345337, 2.9958343505859375, 3.114682674407959, 3.2335314750671387, 3.35237979888916, 3.4712283611297607, 3.5900769233703613]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 31.0, 41.0, 61.0, 97.0, 136.0, 200.0, 310.0, 487.0, 710.0, 1082.0, 1701.0, 2751.0, 4259.0, 6712.0, 10392.0, 16315.0, 24860.0, 37364.0, 53346.0, 72787.0, 92835.0, 110228.0, 118796.0, 115629.0, 102177.0, 82811.0, 62211.0, 44310.0, 30027.0, 19990.0, 12816.0, 8378.0, 5220.0, 3376.0, 2107.0, 1356.0, 857.0, 602.0, 352.0, 246.0, 183.0, 134.0, 65.0, 48.0, 36.0, 20.0, 19.0, 13.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 9.0, 16.0, 12.0, 15.0, 18.0, 30.0, 18.0, 19.0, 39.0, 23.0, 26.0, 35.0, 41.0, 40.0, 32.0, 43.0, 41.0, 42.0, 42.0, 46.0, 36.0, 46.0, 41.0, 38.0, 29.0, 26.0, 36.0, 26.0, 18.0, 16.0, 14.0, 14.0, 10.0, 10.0, 7.0, 4.0, 8.0, 1.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.865234375, -3.747894287109375, -3.63055419921875, -3.513214111328125, -3.3958740234375, -3.278533935546875, -3.16119384765625, -3.043853759765625, -2.926513671875, -2.809173583984375, -2.69183349609375, -2.574493408203125, -2.4571533203125, -2.339813232421875, -2.22247314453125, -2.105133056640625, -1.98779296875, -1.870452880859375, -1.75311279296875, -1.635772705078125, -1.5184326171875, -1.401092529296875, -1.28375244140625, -1.166412353515625, -1.049072265625, -0.931732177734375, -0.81439208984375, -0.697052001953125, -0.5797119140625, -0.462371826171875, -0.34503173828125, -0.227691650390625, -0.1103515625, 0.006988525390625, 0.12432861328125, 0.241668701171875, 0.3590087890625, 0.476348876953125, 0.59368896484375, 0.711029052734375, 0.828369140625, 0.945709228515625, 1.06304931640625, 1.180389404296875, 1.2977294921875, 1.415069580078125, 1.53240966796875, 1.649749755859375, 1.76708984375, 1.884429931640625, 2.00177001953125, 2.119110107421875, 2.2364501953125, 2.353790283203125, 2.47113037109375, 2.588470458984375, 2.705810546875, 2.823150634765625, 2.94049072265625, 3.057830810546875, 3.1751708984375, 3.292510986328125, 3.40985107421875, 3.527191162109375, 3.64453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 13.0, 14.0, 29.0, 43.0, 79.0, 125.0, 191.0, 292.0, 549.0, 790.0, 1393.0, 2312.0, 3759.0, 6144.0, 10282.0, 16606.0, 26349.0, 40187.0, 58723.0, 81777.0, 105485.0, 121920.0, 126443.0, 118413.0, 99664.0, 76025.0, 53878.0, 35964.0, 23340.0, 14671.0, 9080.0, 5587.0, 3328.0, 2023.0, 1261.0, 683.0, 440.0, 285.0, 152.0, 82.0, 72.0, 40.0, 23.0, 15.0, 10.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.0194091796875, -3.882568359375, -3.7457275390625, -3.60888671875, -3.4720458984375, -3.335205078125, -3.1983642578125, -3.0615234375, -2.9246826171875, -2.787841796875, -2.6510009765625, -2.51416015625, -2.3773193359375, -2.240478515625, -2.1036376953125, -1.966796875, -1.8299560546875, -1.693115234375, -1.5562744140625, -1.41943359375, -1.2825927734375, -1.145751953125, -1.0089111328125, -0.8720703125, -0.7352294921875, -0.598388671875, -0.4615478515625, -0.32470703125, -0.1878662109375, -0.051025390625, 0.0858154296875, 0.22265625, 0.3594970703125, 0.496337890625, 0.6331787109375, 0.77001953125, 0.9068603515625, 1.043701171875, 1.1805419921875, 1.3173828125, 1.4542236328125, 1.591064453125, 1.7279052734375, 1.86474609375, 2.0015869140625, 2.138427734375, 2.2752685546875, 2.412109375, 2.5489501953125, 2.685791015625, 2.8226318359375, 2.95947265625, 3.0963134765625, 3.233154296875, 3.3699951171875, 3.5068359375, 3.6436767578125, 3.780517578125, 3.9173583984375, 4.05419921875, 4.1910400390625, 4.327880859375, 4.4647216796875, 4.6015625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 10.0, 11.0, 18.0, 8.0, 11.0, 14.0, 22.0, 21.0, 31.0, 28.0, 31.0, 39.0, 36.0, 24.0, 37.0, 41.0, 41.0, 46.0, 44.0, 38.0, 44.0, 53.0, 29.0, 41.0, 36.0, 27.0, 20.0, 29.0, 25.0, 17.0, 18.0, 15.0, 21.0, 18.0, 11.0, 8.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.303192138671875, -2.22552490234375, -2.147857666015625, -2.0701904296875, -1.992523193359375, -1.91485595703125, -1.837188720703125, -1.759521484375, -1.681854248046875, -1.60418701171875, -1.526519775390625, -1.4488525390625, -1.371185302734375, -1.29351806640625, -1.215850830078125, -1.13818359375, -1.060516357421875, -0.98284912109375, -0.905181884765625, -0.8275146484375, -0.749847412109375, -0.67218017578125, -0.594512939453125, -0.516845703125, -0.439178466796875, -0.36151123046875, -0.283843994140625, -0.2061767578125, -0.128509521484375, -0.05084228515625, 0.026824951171875, 0.1044921875, 0.182159423828125, 0.25982666015625, 0.337493896484375, 0.4151611328125, 0.492828369140625, 0.57049560546875, 0.648162841796875, 0.725830078125, 0.803497314453125, 0.88116455078125, 0.958831787109375, 1.0364990234375, 1.114166259765625, 1.19183349609375, 1.269500732421875, 1.34716796875, 1.424835205078125, 1.50250244140625, 1.580169677734375, 1.6578369140625, 1.735504150390625, 1.81317138671875, 1.890838623046875, 1.968505859375, 2.046173095703125, 2.12384033203125, 2.201507568359375, 2.2791748046875, 2.356842041015625, 2.43450927734375, 2.512176513671875, 2.58984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 13.0, 22.0, 19.0, 42.0, 54.0, 78.0, 110.0, 167.0, 191.0, 348.0, 452.0, 686.0, 991.0, 1628.0, 2673.0, 4959.0, 9748.0, 21169.0, 48439.0, 111224.0, 213081.0, 267553.0, 191670.0, 95153.0, 40639.0, 17735.0, 8366.0, 4438.0, 2430.0, 1563.0, 908.0, 598.0, 430.0, 284.0, 207.0, 155.0, 81.0, 72.0, 44.0, 36.0, 22.0, 20.0, 15.0, 15.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.25616455078125, -3.1490478515625, -3.04193115234375, -2.934814453125, -2.82769775390625, -2.7205810546875, -2.61346435546875, -2.50634765625, -2.39923095703125, -2.2921142578125, -2.18499755859375, -2.077880859375, -1.97076416015625, -1.8636474609375, -1.75653076171875, -1.6494140625, -1.54229736328125, -1.4351806640625, -1.32806396484375, -1.220947265625, -1.11383056640625, -1.0067138671875, -0.89959716796875, -0.79248046875, -0.68536376953125, -0.5782470703125, -0.47113037109375, -0.364013671875, -0.25689697265625, -0.1497802734375, -0.04266357421875, 0.064453125, 0.17156982421875, 0.2786865234375, 0.38580322265625, 0.492919921875, 0.60003662109375, 0.7071533203125, 0.81427001953125, 0.92138671875, 1.02850341796875, 1.1356201171875, 1.24273681640625, 1.349853515625, 1.45697021484375, 1.5640869140625, 1.67120361328125, 1.7783203125, 1.88543701171875, 1.9925537109375, 2.09967041015625, 2.206787109375, 2.31390380859375, 2.4210205078125, 2.52813720703125, 2.63525390625, 2.74237060546875, 2.8494873046875, 2.95660400390625, 3.063720703125, 3.17083740234375, 3.2779541015625, 3.38507080078125, 3.4921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 13.0, 9.0, 9.0, 31.0, 27.0, 32.0, 57.0, 61.0, 71.0, 70.0, 68.0, 78.0, 82.0, 59.0, 62.0, 53.0, 31.0, 39.0, 28.0, 30.0, 22.0, 21.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003304481506347656, -0.00032163411378860474, -0.00031282007694244385, -0.00030400604009628296, -0.00029519200325012207, -0.0002863779664039612, -0.0002775639295578003, -0.0002687498927116394, -0.0002599358558654785, -0.0002511218190193176, -0.00024230778217315674, -0.00023349374532699585, -0.00022467970848083496, -0.00021586567163467407, -0.00020705163478851318, -0.0001982375979423523, -0.0001894235610961914, -0.00018060952425003052, -0.00017179548740386963, -0.00016298145055770874, -0.00015416741371154785, -0.00014535337686538696, -0.00013653934001922607, -0.00012772530317306519, -0.0001189112663269043, -0.00011009722948074341, -0.00010128319263458252, -9.246915578842163e-05, -8.365511894226074e-05, -7.484108209609985e-05, -6.602704524993896e-05, -5.7213008403778076e-05, -4.839897155761719e-05, -3.95849347114563e-05, -3.077089786529541e-05, -2.195686101913452e-05, -1.3142824172973633e-05, -4.328787326812744e-06, 4.4852495193481445e-06, 1.3299286365509033e-05, 2.2113323211669922e-05, 3.092736005783081e-05, 3.97413969039917e-05, 4.855543375015259e-05, 5.7369470596313477e-05, 6.618350744247437e-05, 7.499754428863525e-05, 8.381158113479614e-05, 9.262561798095703e-05, 0.00010143965482711792, 0.00011025369167327881, 0.0001190677285194397, 0.00012788176536560059, 0.00013669580221176147, 0.00014550983905792236, 0.00015432387590408325, 0.00016313791275024414, 0.00017195194959640503, 0.00018076598644256592, 0.0001895800232887268, 0.0001983940601348877, 0.00020720809698104858, 0.00021602213382720947, 0.00022483617067337036, 0.00023365020751953125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 20.0, 23.0, 54.0, 61.0, 86.0, 168.0, 233.0, 325.0, 496.0, 722.0, 1231.0, 2039.0, 3574.0, 6433.0, 11765.0, 22186.0, 41990.0, 77182.0, 129225.0, 180852.0, 194642.0, 155637.0, 98937.0, 55483.0, 29726.0, 15757.0, 8454.0, 4484.0, 2549.0, 1542.0, 862.0, 593.0, 395.0, 220.0, 184.0, 134.0, 81.0, 64.0, 42.0, 25.0, 21.0, 15.0, 13.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4609375, -2.386871337890625, -2.31280517578125, -2.238739013671875, -2.1646728515625, -2.090606689453125, -2.01654052734375, -1.942474365234375, -1.868408203125, -1.794342041015625, -1.72027587890625, -1.646209716796875, -1.5721435546875, -1.498077392578125, -1.42401123046875, -1.349945068359375, -1.27587890625, -1.201812744140625, -1.12774658203125, -1.053680419921875, -0.9796142578125, -0.905548095703125, -0.83148193359375, -0.757415771484375, -0.683349609375, -0.609283447265625, -0.53521728515625, -0.461151123046875, -0.3870849609375, -0.313018798828125, -0.23895263671875, -0.164886474609375, -0.0908203125, -0.016754150390625, 0.05731201171875, 0.131378173828125, 0.2054443359375, 0.279510498046875, 0.35357666015625, 0.427642822265625, 0.501708984375, 0.575775146484375, 0.64984130859375, 0.723907470703125, 0.7979736328125, 0.872039794921875, 0.94610595703125, 1.020172119140625, 1.09423828125, 1.168304443359375, 1.24237060546875, 1.316436767578125, 1.3905029296875, 1.464569091796875, 1.53863525390625, 1.612701416015625, 1.686767578125, 1.760833740234375, 1.83489990234375, 1.908966064453125, 1.9830322265625, 2.057098388671875, 2.13116455078125, 2.205230712890625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 15.0, 12.0, 16.0, 13.0, 23.0, 22.0, 28.0, 31.0, 46.0, 37.0, 50.0, 47.0, 60.0, 49.0, 53.0, 49.0, 54.0, 60.0, 47.0, 46.0, 32.0, 36.0, 30.0, 24.0, 19.0, 15.0, 15.0, 9.0, 8.0, 5.0, 4.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79541015625, -0.7714614868164062, -0.7475128173828125, -0.7235641479492188, -0.699615478515625, -0.6756668090820312, -0.6517181396484375, -0.6277694702148438, -0.60382080078125, -0.5798721313476562, -0.5559234619140625, -0.5319747924804688, -0.508026123046875, -0.48407745361328125, -0.4601287841796875, -0.43618011474609375, -0.4122314453125, -0.38828277587890625, -0.3643341064453125, -0.34038543701171875, -0.316436767578125, -0.29248809814453125, -0.2685394287109375, -0.24459075927734375, -0.22064208984375, -0.19669342041015625, -0.1727447509765625, -0.14879608154296875, -0.124847412109375, -0.10089874267578125, -0.0769500732421875, -0.05300140380859375, -0.029052734375, -0.00510406494140625, 0.0188446044921875, 0.04279327392578125, 0.066741943359375, 0.09069061279296875, 0.1146392822265625, 0.13858795166015625, 0.16253662109375, 0.18648529052734375, 0.2104339599609375, 0.23438262939453125, 0.258331298828125, 0.28227996826171875, 0.3062286376953125, 0.33017730712890625, 0.3541259765625, 0.37807464599609375, 0.4020233154296875, 0.42597198486328125, 0.449920654296875, 0.47386932373046875, 0.4978179931640625, 0.5217666625976562, 0.54571533203125, 0.5696640014648438, 0.5936126708984375, 0.6175613403320312, 0.641510009765625, 0.6654586791992188, 0.6894073486328125, 0.7133560180664062, 0.7373046875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 9.0, 8.0, 11.0, 12.0, 18.0, 22.0, 28.0, 24.0, 22.0, 37.0, 40.0, 45.0, 44.0, 44.0, 53.0, 47.0, 41.0, 45.0, 44.0, 46.0, 29.0, 41.0, 39.0, 22.0, 27.0, 25.0, 23.0, 21.0, 22.0, 11.0, 16.0, 13.0, 7.0, 9.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6092023849487305, -3.489184856414795, -3.3691673278808594, -3.249149799346924, -3.1291322708129883, -3.0091147422790527, -2.889097213745117, -2.7690794467926025, -2.649061918258667, -2.5290443897247314, -2.409026861190796, -2.2890093326568604, -2.168991804122925, -2.04897403717041, -1.9289566278457642, -1.808938980102539, -1.688921570777893, -1.5689040422439575, -1.448886513710022, -1.3288688659667969, -1.2088513374328613, -1.0888338088989258, -0.9688162803649902, -0.8487986922264099, -0.7287811636924744, -0.6087636351585388, -0.4887460470199585, -0.36872851848602295, -0.24871096014976501, -0.12869340181350708, -0.008675873279571533, 0.11134171485900879, 0.23135924339294434, 0.35137680172920227, 0.4713943600654602, 0.5914118885993958, 0.7114294767379761, 0.8314470052719116, 0.9514645338058472, 1.0714821815490723, 1.1914997100830078, 1.3115172386169434, 1.431534767150879, 1.5515522956848145, 1.6715699434280396, 1.791587471961975, 1.9116050004959106, 2.0316226482391357, 2.151639938354492, 2.2716574668884277, 2.3916749954223633, 2.511692523956299, 2.6317100524902344, 2.75172758102417, 2.8717451095581055, 2.99176287651062, 3.1117804050445557, 3.231797933578491, 3.3518154621124268, 3.4718329906463623, 3.591850519180298, 3.7118682861328125, 3.831885814666748, 3.9519033432006836, 4.071920871734619]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 9.0, 8.0, 9.0, 15.0, 12.0, 14.0, 10.0, 10.0, 15.0, 23.0, 19.0, 34.0, 30.0, 37.0, 32.0, 44.0, 49.0, 31.0, 42.0, 45.0, 45.0, 35.0, 38.0, 36.0, 42.0, 33.0, 42.0, 26.0, 32.0, 17.0, 23.0, 20.0, 16.0, 22.0, 9.0, 12.0, 8.0, 14.0, 11.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.8113772869110107, -3.691875696182251, -3.572374105453491, -3.4528725147247314, -3.3333709239959717, -3.213869333267212, -3.094367742538452, -2.9748661518096924, -2.8553645610809326, -2.735862970352173, -2.616361379623413, -2.4968597888946533, -2.3773581981658936, -2.257856607437134, -2.138355016708374, -2.0188534259796143, -1.8993518352508545, -1.7798502445220947, -1.660348653793335, -1.5408470630645752, -1.4213454723358154, -1.3018438816070557, -1.182342290878296, -1.0628407001495361, -0.9433391094207764, -0.8238375186920166, -0.7043359279632568, -0.5848343372344971, -0.4653327465057373, -0.34583115577697754, -0.22632956504821777, -0.10682797431945801, 0.012673377990722656, 0.13217496871948242, 0.2516765594482422, 0.37117815017700195, 0.4906797409057617, 0.6101813316345215, 0.7296829223632812, 0.849184513092041, 0.9686861038208008, 1.0881876945495605, 1.2076892852783203, 1.32719087600708, 1.4466924667358398, 1.5661940574645996, 1.6856956481933594, 1.8051972389221191, 1.924698829650879, 2.0442004203796387, 2.1637020111083984, 2.283203601837158, 2.402705192565918, 2.5222067832946777, 2.6417083740234375, 2.7612099647521973, 2.880711555480957, 3.000213146209717, 3.1197147369384766, 3.2392163276672363, 3.358717918395996, 3.478219509124756, 3.5977210998535156, 3.7172226905822754, 3.836724281311035]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 8.0, 19.0, 29.0, 41.0, 71.0, 147.0, 202.0, 342.0, 498.0, 861.0, 1453.0, 2343.0, 3724.0, 6109.0, 9958.0, 16278.0, 26585.0, 42211.0, 67967.0, 107281.0, 166552.0, 249078.0, 354256.0, 459905.0, 533483.0, 541889.0, 477075.0, 374384.0, 267073.0, 179271.0, 115153.0, 72621.0, 45410.0, 28037.0, 16967.0, 10563.0, 6354.0, 3959.0, 2421.0, 1408.0, 870.0, 564.0, 318.0, 201.0, 123.0, 85.0, 52.0, 30.0, 14.0, 16.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.919921875, -2.826019287109375, -2.73211669921875, -2.638214111328125, -2.5443115234375, -2.450408935546875, -2.35650634765625, -2.262603759765625, -2.168701171875, -2.074798583984375, -1.98089599609375, -1.886993408203125, -1.7930908203125, -1.699188232421875, -1.60528564453125, -1.511383056640625, -1.41748046875, -1.323577880859375, -1.22967529296875, -1.135772705078125, -1.0418701171875, -0.947967529296875, -0.85406494140625, -0.760162353515625, -0.666259765625, -0.572357177734375, -0.47845458984375, -0.384552001953125, -0.2906494140625, -0.196746826171875, -0.10284423828125, -0.008941650390625, 0.0849609375, 0.178863525390625, 0.27276611328125, 0.366668701171875, 0.4605712890625, 0.554473876953125, 0.64837646484375, 0.742279052734375, 0.836181640625, 0.930084228515625, 1.02398681640625, 1.117889404296875, 1.2117919921875, 1.305694580078125, 1.39959716796875, 1.493499755859375, 1.58740234375, 1.681304931640625, 1.77520751953125, 1.869110107421875, 1.9630126953125, 2.056915283203125, 2.15081787109375, 2.244720458984375, 2.338623046875, 2.432525634765625, 2.52642822265625, 2.620330810546875, 2.7142333984375, 2.808135986328125, 2.90203857421875, 2.995941162109375, 3.08984375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 2.0, 7.0, 12.0, 10.0, 16.0, 8.0, 14.0, 13.0, 21.0, 20.0, 18.0, 27.0, 31.0, 44.0, 36.0, 37.0, 33.0, 38.0, 35.0, 42.0, 33.0, 51.0, 44.0, 40.0, 38.0, 29.0, 28.0, 27.0, 27.0, 24.0, 29.0, 20.0, 17.0, 22.0, 21.0, 21.0, 8.0, 12.0, 9.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.526580810546875, -2.43597412109375, -2.345367431640625, -2.2547607421875, -2.164154052734375, -2.07354736328125, -1.982940673828125, -1.892333984375, -1.801727294921875, -1.71112060546875, -1.620513916015625, -1.5299072265625, -1.439300537109375, -1.34869384765625, -1.258087158203125, -1.16748046875, -1.076873779296875, -0.98626708984375, -0.895660400390625, -0.8050537109375, -0.714447021484375, -0.62384033203125, -0.533233642578125, -0.442626953125, -0.352020263671875, -0.26141357421875, -0.170806884765625, -0.0802001953125, 0.010406494140625, 0.10101318359375, 0.191619873046875, 0.2822265625, 0.372833251953125, 0.46343994140625, 0.554046630859375, 0.6446533203125, 0.735260009765625, 0.82586669921875, 0.916473388671875, 1.007080078125, 1.097686767578125, 1.18829345703125, 1.278900146484375, 1.3695068359375, 1.460113525390625, 1.55072021484375, 1.641326904296875, 1.73193359375, 1.822540283203125, 1.91314697265625, 2.003753662109375, 2.0943603515625, 2.184967041015625, 2.27557373046875, 2.366180419921875, 2.456787109375, 2.547393798828125, 2.63800048828125, 2.728607177734375, 2.8192138671875, 2.909820556640625, 3.00042724609375, 3.091033935546875, 3.181640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 24.0, 29.0, 41.0, 67.0, 145.0, 267.0, 450.0, 807.0, 1671.0, 3110.0, 6082.0, 11950.0, 22364.0, 41566.0, 76856.0, 134260.0, 224595.0, 348208.0, 488313.0, 596026.0, 619137.0, 544317.0, 410737.0, 275480.0, 171091.0, 98577.0, 55544.0, 29649.0, 15491.0, 8332.0, 4204.0, 2271.0, 1262.0, 618.0, 307.0, 188.0, 102.0, 57.0, 37.0, 21.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.998046875, -3.8812255859375, -3.764404296875, -3.6475830078125, -3.53076171875, -3.4139404296875, -3.297119140625, -3.1802978515625, -3.0634765625, -2.9466552734375, -2.829833984375, -2.7130126953125, -2.59619140625, -2.4793701171875, -2.362548828125, -2.2457275390625, -2.12890625, -2.0120849609375, -1.895263671875, -1.7784423828125, -1.66162109375, -1.5447998046875, -1.427978515625, -1.3111572265625, -1.1943359375, -1.0775146484375, -0.960693359375, -0.8438720703125, -0.72705078125, -0.6102294921875, -0.493408203125, -0.3765869140625, -0.259765625, -0.1429443359375, -0.026123046875, 0.0906982421875, 0.20751953125, 0.3243408203125, 0.441162109375, 0.5579833984375, 0.6748046875, 0.7916259765625, 0.908447265625, 1.0252685546875, 1.14208984375, 1.2589111328125, 1.375732421875, 1.4925537109375, 1.609375, 1.7261962890625, 1.843017578125, 1.9598388671875, 2.07666015625, 2.1934814453125, 2.310302734375, 2.4271240234375, 2.5439453125, 2.6607666015625, 2.777587890625, 2.8944091796875, 3.01123046875, 3.1280517578125, 3.244873046875, 3.3616943359375, 3.478515625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 14.0, 25.0, 28.0, 27.0, 54.0, 54.0, 71.0, 96.0, 82.0, 128.0, 155.0, 168.0, 216.0, 235.0, 258.0, 247.0, 242.0, 253.0, 255.0, 245.0, 203.0, 192.0, 173.0, 128.0, 123.0, 86.0, 73.0, 65.0, 35.0, 37.0, 26.0, 23.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6337890625, -1.582061767578125, -1.53033447265625, -1.478607177734375, -1.4268798828125, -1.375152587890625, -1.32342529296875, -1.271697998046875, -1.219970703125, -1.168243408203125, -1.11651611328125, -1.064788818359375, -1.0130615234375, -0.961334228515625, -0.90960693359375, -0.857879638671875, -0.80615234375, -0.754425048828125, -0.70269775390625, -0.650970458984375, -0.5992431640625, -0.547515869140625, -0.49578857421875, -0.444061279296875, -0.392333984375, -0.340606689453125, -0.28887939453125, -0.237152099609375, -0.1854248046875, -0.133697509765625, -0.08197021484375, -0.030242919921875, 0.021484375, 0.073211669921875, 0.12493896484375, 0.176666259765625, 0.2283935546875, 0.280120849609375, 0.33184814453125, 0.383575439453125, 0.435302734375, 0.487030029296875, 0.53875732421875, 0.590484619140625, 0.6422119140625, 0.693939208984375, 0.74566650390625, 0.797393798828125, 0.84912109375, 0.900848388671875, 0.95257568359375, 1.004302978515625, 1.0560302734375, 1.107757568359375, 1.15948486328125, 1.211212158203125, 1.262939453125, 1.314666748046875, 1.36639404296875, 1.418121337890625, 1.4698486328125, 1.521575927734375, 1.57330322265625, 1.625030517578125, 1.6767578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 6.0, 11.0, 8.0, 5.0, 9.0, 14.0, 16.0, 20.0, 27.0, 30.0, 16.0, 27.0, 49.0, 35.0, 40.0, 43.0, 49.0, 50.0, 49.0, 45.0, 39.0, 47.0, 53.0, 38.0, 43.0, 32.0, 35.0, 25.0, 18.0, 19.0, 20.0, 18.0, 18.0, 13.0, 6.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.854025363922119, -3.737438917160034, -3.620852470397949, -3.5042660236358643, -3.3876795768737793, -3.2710931301116943, -3.1545066833496094, -3.0379204750061035, -2.9213337898254395, -2.8047473430633545, -2.6881608963012695, -2.5715744495391846, -2.4549880027770996, -2.3384015560150146, -2.2218151092529297, -2.105228900909424, -1.9886424541473389, -1.872056007385254, -1.755469560623169, -1.638883113861084, -1.522296667098999, -1.405710220336914, -1.2891238927841187, -1.1725374460220337, -1.0559509992599487, -0.9393645524978638, -0.8227781057357788, -0.7061917185783386, -0.5896052718162537, -0.4730188250541687, -0.3564324378967285, -0.23984599113464355, -0.1232595443725586, -0.006673112511634827, 0.10991331934928894, 0.2264997363090515, 0.3430861830711365, 0.45967262983322144, 0.5762590169906616, 0.6928454637527466, 0.8094319105148315, 0.9260183572769165, 1.0426048040390015, 1.1591911315917969, 1.2757775783538818, 1.3923640251159668, 1.5089504718780518, 1.6255369186401367, 1.7421233654022217, 1.8587098121643066, 1.9752962589263916, 2.0918827056884766, 2.2084691524505615, 2.3250555992126465, 2.4416418075561523, 2.5582284927368164, 2.6748147010803223, 2.7914011478424072, 2.907987594604492, 3.024574041366577, 3.141160488128662, 3.257746934890747, 3.374333381652832, 3.490919589996338, 3.607506275177002]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 3.0, 5.0, 10.0, 8.0, 16.0, 14.0, 8.0, 17.0, 20.0, 20.0, 24.0, 27.0, 31.0, 34.0, 42.0, 29.0, 33.0, 36.0, 42.0, 40.0, 44.0, 50.0, 45.0, 44.0, 31.0, 33.0, 42.0, 34.0, 21.0, 32.0, 23.0, 24.0, 24.0, 14.0, 9.0, 10.0, 11.0, 12.0, 5.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.6561279296875, -3.55086612701416, -3.4456043243408203, -3.3403425216674805, -3.2350807189941406, -3.129818916320801, -3.024557113647461, -2.919295310974121, -2.8140335083007812, -2.7087717056274414, -2.6035099029541016, -2.4982481002807617, -2.392986297607422, -2.287724494934082, -2.182462692260742, -2.0772008895874023, -1.9719388484954834, -1.8666770458221436, -1.7614152431488037, -1.6561534404754639, -1.550891637802124, -1.4456298351287842, -1.3403679132461548, -1.235106110572815, -1.129844307899475, -1.0245825052261353, -0.9193207025527954, -0.8140588402748108, -0.708797037601471, -0.6035352349281311, -0.4982733726501465, -0.39301156997680664, -0.2877495288848877, -0.18248771131038666, -0.07722589373588562, 0.02803593873977661, 0.13329774141311646, 0.2385595440864563, 0.3438214063644409, 0.44908320903778076, 0.5543450117111206, 0.6596068143844604, 0.7648686170578003, 0.8701304793357849, 0.9753922820091248, 1.0806541442871094, 1.1859159469604492, 1.291177749633789, 1.396439552307129, 1.5017013549804688, 1.6069631576538086, 1.7122249603271484, 1.8174867630004883, 1.9227485656738281, 2.028010368347168, 2.133272171020508, 2.2385339736938477, 2.3437957763671875, 2.4490575790405273, 2.554319381713867, 2.659581184387207, 2.764842987060547, 2.8701047897338867, 2.9753665924072266, 3.0806286334991455]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 19.0, 26.0, 49.0, 63.0, 96.0, 146.0, 222.0, 302.0, 430.0, 629.0, 925.0, 1337.0, 1958.0, 2953.0, 4453.0, 6807.0, 10514.0, 16383.0, 26178.0, 41741.0, 67147.0, 105428.0, 155079.0, 182426.0, 149921.0, 100633.0, 63528.0, 39225.0, 24912.0, 15551.0, 10067.0, 6485.0, 4162.0, 2790.0, 1890.0, 1256.0, 839.0, 613.0, 435.0, 278.0, 202.0, 164.0, 105.0, 62.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.613372802734375, -2.52752685546875, -2.441680908203125, -2.3558349609375, -2.269989013671875, -2.18414306640625, -2.098297119140625, -2.012451171875, -1.926605224609375, -1.84075927734375, -1.754913330078125, -1.6690673828125, -1.583221435546875, -1.49737548828125, -1.411529541015625, -1.32568359375, -1.239837646484375, -1.15399169921875, -1.068145751953125, -0.9822998046875, -0.896453857421875, -0.81060791015625, -0.724761962890625, -0.638916015625, -0.553070068359375, -0.46722412109375, -0.381378173828125, -0.2955322265625, -0.209686279296875, -0.12384033203125, -0.037994384765625, 0.0478515625, 0.133697509765625, 0.21954345703125, 0.305389404296875, 0.3912353515625, 0.477081298828125, 0.56292724609375, 0.648773193359375, 0.734619140625, 0.820465087890625, 0.90631103515625, 0.992156982421875, 1.0780029296875, 1.163848876953125, 1.24969482421875, 1.335540771484375, 1.42138671875, 1.507232666015625, 1.59307861328125, 1.678924560546875, 1.7647705078125, 1.850616455078125, 1.93646240234375, 2.022308349609375, 2.108154296875, 2.194000244140625, 2.27984619140625, 2.365692138671875, 2.4515380859375, 2.537384033203125, 2.62322998046875, 2.709075927734375, 2.794921875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 11.0, 8.0, 15.0, 14.0, 17.0, 26.0, 20.0, 13.0, 27.0, 30.0, 27.0, 33.0, 37.0, 35.0, 45.0, 40.0, 47.0, 43.0, 40.0, 29.0, 46.0, 29.0, 39.0, 32.0, 31.0, 35.0, 25.0, 26.0, 32.0, 22.0, 22.0, 8.0, 14.0, 10.0, 7.0, 8.0, 11.0, 10.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.5625, -3.45538330078125, -3.3482666015625, -3.24114990234375, -3.134033203125, -3.02691650390625, -2.9197998046875, -2.81268310546875, -2.70556640625, -2.59844970703125, -2.4913330078125, -2.38421630859375, -2.277099609375, -2.16998291015625, -2.0628662109375, -1.95574951171875, -1.8486328125, -1.74151611328125, -1.6343994140625, -1.52728271484375, -1.420166015625, -1.31304931640625, -1.2059326171875, -1.09881591796875, -0.99169921875, -0.88458251953125, -0.7774658203125, -0.67034912109375, -0.563232421875, -0.45611572265625, -0.3489990234375, -0.24188232421875, -0.134765625, -0.02764892578125, 0.0794677734375, 0.18658447265625, 0.293701171875, 0.40081787109375, 0.5079345703125, 0.61505126953125, 0.72216796875, 0.82928466796875, 0.9364013671875, 1.04351806640625, 1.150634765625, 1.25775146484375, 1.3648681640625, 1.47198486328125, 1.5791015625, 1.68621826171875, 1.7933349609375, 1.90045166015625, 2.007568359375, 2.11468505859375, 2.2218017578125, 2.32891845703125, 2.43603515625, 2.54315185546875, 2.6502685546875, 2.75738525390625, 2.864501953125, 2.97161865234375, 3.0787353515625, 3.18585205078125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 13.0, 6.0, 13.0, 30.0, 29.0, 47.0, 73.0, 107.0, 177.0, 238.0, 378.0, 578.0, 1010.0, 1621.0, 2760.0, 4887.0, 8876.0, 16460.0, 33230.0, 70466.0, 153697.0, 283381.0, 241621.0, 118397.0, 54255.0, 25792.0, 13323.0, 7056.0, 3998.0, 2349.0, 1389.0, 799.0, 488.0, 352.0, 199.0, 136.0, 98.0, 70.0, 45.0, 32.0, 16.0, 13.0, 12.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.973846435546875, -2.87738037109375, -2.780914306640625, -2.6844482421875, -2.587982177734375, -2.49151611328125, -2.395050048828125, -2.298583984375, -2.202117919921875, -2.10565185546875, -2.009185791015625, -1.9127197265625, -1.816253662109375, -1.71978759765625, -1.623321533203125, -1.52685546875, -1.430389404296875, -1.33392333984375, -1.237457275390625, -1.1409912109375, -1.044525146484375, -0.94805908203125, -0.851593017578125, -0.755126953125, -0.658660888671875, -0.56219482421875, -0.465728759765625, -0.3692626953125, -0.272796630859375, -0.17633056640625, -0.079864501953125, 0.0166015625, 0.113067626953125, 0.20953369140625, 0.305999755859375, 0.4024658203125, 0.498931884765625, 0.59539794921875, 0.691864013671875, 0.788330078125, 0.884796142578125, 0.98126220703125, 1.077728271484375, 1.1741943359375, 1.270660400390625, 1.36712646484375, 1.463592529296875, 1.56005859375, 1.656524658203125, 1.75299072265625, 1.849456787109375, 1.9459228515625, 2.042388916015625, 2.13885498046875, 2.235321044921875, 2.331787109375, 2.428253173828125, 2.52471923828125, 2.621185302734375, 2.7176513671875, 2.814117431640625, 2.91058349609375, 3.007049560546875, 3.103515625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 11.0, 7.0, 10.0, 10.0, 14.0, 11.0, 11.0, 26.0, 22.0, 20.0, 19.0, 43.0, 23.0, 30.0, 30.0, 31.0, 35.0, 30.0, 39.0, 39.0, 47.0, 37.0, 34.0, 44.0, 44.0, 41.0, 26.0, 40.0, 26.0, 25.0, 20.0, 26.0, 21.0, 11.0, 16.0, 12.0, 12.0, 10.0, 6.0, 6.0, 9.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.01171875, -1.9432373046875, -1.874755859375, -1.8062744140625, -1.73779296875, -1.6693115234375, -1.600830078125, -1.5323486328125, -1.4638671875, -1.3953857421875, -1.326904296875, -1.2584228515625, -1.18994140625, -1.1214599609375, -1.052978515625, -0.9844970703125, -0.916015625, -0.8475341796875, -0.779052734375, -0.7105712890625, -0.64208984375, -0.5736083984375, -0.505126953125, -0.4366455078125, -0.3681640625, -0.2996826171875, -0.231201171875, -0.1627197265625, -0.09423828125, -0.0257568359375, 0.042724609375, 0.1112060546875, 0.1796875, 0.2481689453125, 0.316650390625, 0.3851318359375, 0.45361328125, 0.5220947265625, 0.590576171875, 0.6590576171875, 0.7275390625, 0.7960205078125, 0.864501953125, 0.9329833984375, 1.00146484375, 1.0699462890625, 1.138427734375, 1.2069091796875, 1.275390625, 1.3438720703125, 1.412353515625, 1.4808349609375, 1.54931640625, 1.6177978515625, 1.686279296875, 1.7547607421875, 1.8232421875, 1.8917236328125, 1.960205078125, 2.0286865234375, 2.09716796875, 2.1656494140625, 2.234130859375, 2.3026123046875, 2.37109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 10.0, 9.0, 13.0, 11.0, 25.0, 47.0, 61.0, 75.0, 98.0, 133.0, 199.0, 269.0, 348.0, 497.0, 724.0, 1111.0, 1626.0, 2412.0, 3848.0, 6490.0, 11274.0, 22789.0, 59159.0, 281531.0, 497077.0, 92870.0, 30456.0, 14030.0, 7763.0, 4579.0, 2891.0, 1921.0, 1232.0, 837.0, 602.0, 451.0, 302.0, 198.0, 160.0, 132.0, 70.0, 62.0, 41.0, 40.0, 24.0, 16.0, 8.0, 11.0, 5.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.455078125, -3.340576171875, -3.22607421875, -3.111572265625, -2.9970703125, -2.882568359375, -2.76806640625, -2.653564453125, -2.5390625, -2.424560546875, -2.31005859375, -2.195556640625, -2.0810546875, -1.966552734375, -1.85205078125, -1.737548828125, -1.623046875, -1.508544921875, -1.39404296875, -1.279541015625, -1.1650390625, -1.050537109375, -0.93603515625, -0.821533203125, -0.70703125, -0.592529296875, -0.47802734375, -0.363525390625, -0.2490234375, -0.134521484375, -0.02001953125, 0.094482421875, 0.208984375, 0.323486328125, 0.43798828125, 0.552490234375, 0.6669921875, 0.781494140625, 0.89599609375, 1.010498046875, 1.125, 1.239501953125, 1.35400390625, 1.468505859375, 1.5830078125, 1.697509765625, 1.81201171875, 1.926513671875, 2.041015625, 2.155517578125, 2.27001953125, 2.384521484375, 2.4990234375, 2.613525390625, 2.72802734375, 2.842529296875, 2.95703125, 3.071533203125, 3.18603515625, 3.300537109375, 3.4150390625, 3.529541015625, 3.64404296875, 3.758544921875, 3.873046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 0.0, 7.0, 6.0, 4.0, 6.0, 7.0, 16.0, 12.0, 23.0, 39.0, 40.0, 58.0, 94.0, 160.0, 164.0, 111.0, 69.0, 39.0, 31.0, 23.0, 13.0, 15.0, 8.0, 12.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003421306610107422, -0.00032897666096687317, -0.00031582266092300415, -0.00030266866087913513, -0.0002895146608352661, -0.0002763606607913971, -0.0002632066607475281, -0.00025005266070365906, -0.00023689866065979004, -0.00022374466061592102, -0.000210590660572052, -0.00019743666052818298, -0.00018428266048431396, -0.00017112866044044495, -0.00015797466039657593, -0.0001448206603527069, -0.0001316666603088379, -0.00011851266026496887, -0.00010535866022109985, -9.220466017723083e-05, -7.905066013336182e-05, -6.58966600894928e-05, -5.274266004562378e-05, -3.958866000175476e-05, -2.6434659957885742e-05, -1.3280659914016724e-05, -1.2665987014770508e-07, 1.3027340173721313e-05, 2.6181340217590332e-05, 3.933534026145935e-05, 5.248934030532837e-05, 6.564334034919739e-05, 7.87973403930664e-05, 9.195134043693542e-05, 0.00010510534048080444, 0.00011825934052467346, 0.00013141334056854248, 0.0001445673406124115, 0.00015772134065628052, 0.00017087534070014954, 0.00018402934074401855, 0.00019718334078788757, 0.0002103373408317566, 0.0002234913408756256, 0.00023664534091949463, 0.00024979934096336365, 0.00026295334100723267, 0.0002761073410511017, 0.0002892613410949707, 0.0003024153411388397, 0.00031556934118270874, 0.00032872334122657776, 0.0003418773412704468, 0.0003550313413143158, 0.0003681853413581848, 0.00038133934140205383, 0.00039449334144592285, 0.00040764734148979187, 0.0004208013415336609, 0.0004339553415775299, 0.0004471093416213989, 0.00046026334166526794, 0.00047341734170913696, 0.000486571341753006, 0.000499725341796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 11.0, 9.0, 16.0, 24.0, 49.0, 55.0, 81.0, 102.0, 168.0, 244.0, 350.0, 533.0, 827.0, 1240.0, 1911.0, 3218.0, 5084.0, 8338.0, 14519.0, 27435.0, 61338.0, 165420.0, 393606.0, 213638.0, 76011.0, 32646.0, 16700.0, 9547.0, 5602.0, 3580.0, 2175.0, 1437.0, 942.0, 560.0, 351.0, 257.0, 155.0, 103.0, 73.0, 63.0, 45.0, 29.0, 22.0, 11.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.375, -3.26824951171875, -3.1614990234375, -3.05474853515625, -2.947998046875, -2.84124755859375, -2.7344970703125, -2.62774658203125, -2.52099609375, -2.41424560546875, -2.3074951171875, -2.20074462890625, -2.093994140625, -1.98724365234375, -1.8804931640625, -1.77374267578125, -1.6669921875, -1.56024169921875, -1.4534912109375, -1.34674072265625, -1.239990234375, -1.13323974609375, -1.0264892578125, -0.91973876953125, -0.81298828125, -0.70623779296875, -0.5994873046875, -0.49273681640625, -0.385986328125, -0.27923583984375, -0.1724853515625, -0.06573486328125, 0.041015625, 0.14776611328125, 0.2545166015625, 0.36126708984375, 0.468017578125, 0.57476806640625, 0.6815185546875, 0.78826904296875, 0.89501953125, 1.00177001953125, 1.1085205078125, 1.21527099609375, 1.322021484375, 1.42877197265625, 1.5355224609375, 1.64227294921875, 1.7490234375, 1.85577392578125, 1.9625244140625, 2.06927490234375, 2.176025390625, 2.28277587890625, 2.3895263671875, 2.49627685546875, 2.60302734375, 2.70977783203125, 2.8165283203125, 2.92327880859375, 3.030029296875, 3.13677978515625, 3.2435302734375, 3.35028076171875, 3.45703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 5.0, 12.0, 14.0, 14.0, 27.0, 20.0, 21.0, 37.0, 30.0, 47.0, 74.0, 63.0, 89.0, 115.0, 86.0, 54.0, 54.0, 38.0, 48.0, 25.0, 17.0, 29.0, 12.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.7531204223632812, -0.7288970947265625, -0.7046737670898438, -0.680450439453125, -0.6562271118164062, -0.6320037841796875, -0.6077804565429688, -0.58355712890625, -0.5593338012695312, -0.5351104736328125, -0.5108871459960938, -0.486663818359375, -0.46244049072265625, -0.4382171630859375, -0.41399383544921875, -0.3897705078125, -0.36554718017578125, -0.3413238525390625, -0.31710052490234375, -0.292877197265625, -0.26865386962890625, -0.2444305419921875, -0.22020721435546875, -0.19598388671875, -0.17176055908203125, -0.1475372314453125, -0.12331390380859375, -0.099090576171875, -0.07486724853515625, -0.0506439208984375, -0.02642059326171875, -0.002197265625, 0.02202606201171875, 0.0462493896484375, 0.07047271728515625, 0.094696044921875, 0.11891937255859375, 0.1431427001953125, 0.16736602783203125, 0.19158935546875, 0.21581268310546875, 0.2400360107421875, 0.26425933837890625, 0.288482666015625, 0.31270599365234375, 0.3369293212890625, 0.36115264892578125, 0.3853759765625, 0.40959930419921875, 0.4338226318359375, 0.45804595947265625, 0.482269287109375, 0.5064926147460938, 0.5307159423828125, 0.5549392700195312, 0.57916259765625, 0.6033859252929688, 0.6276092529296875, 0.6518325805664062, 0.676055908203125, 0.7002792358398438, 0.7245025634765625, 0.7487258911132812, 0.77294921875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 15.0, 15.0, 17.0, 24.0, 34.0, 27.0, 23.0, 43.0, 46.0, 44.0, 48.0, 42.0, 54.0, 56.0, 53.0, 57.0, 54.0, 53.0, 43.0, 32.0, 45.0, 27.0, 21.0, 20.0, 17.0, 16.0, 8.0, 7.0, 7.0, 5.0, 3.0, 8.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982191801071167, -3.8511953353881836, -3.7201988697052, -3.589202404022217, -3.4582056999206543, -3.327209234237671, -3.1962127685546875, -3.065216302871704, -2.9342198371887207, -2.8032233715057373, -2.672226905822754, -2.5412302017211914, -2.410233736038208, -2.2792372703552246, -2.148240804672241, -2.017244338989258, -1.8862476348876953, -1.755251169204712, -1.624254584312439, -1.4932581186294556, -1.3622615337371826, -1.2312650680541992, -1.1002686023712158, -0.9692720770835876, -0.8382755517959595, -0.7072790265083313, -0.5762825012207031, -0.4452860355377197, -0.31428951025009155, -0.18329298496246338, -0.05229651927947998, 0.0787000060081482, 0.20969676971435547, 0.34069329500198364, 0.47168979048728943, 0.6026862859725952, 0.7336828112602234, 0.8646793365478516, 0.995675802230835, 1.1266722679138184, 1.2576688528060913, 1.3886653184890747, 1.5196619033813477, 1.650658369064331, 1.7816548347473145, 1.9126514196395874, 2.0436477661132812, 2.1746444702148438, 2.305640935897827, 2.4366374015808105, 2.567633867263794, 2.6986303329467773, 2.82962703704834, 2.9606235027313232, 3.0916199684143066, 3.22261643409729, 3.3536128997802734, 3.484609365463257, 3.6156058311462402, 3.7466025352478027, 3.877599000930786, 4.0085954666137695, 4.139592170715332, 4.270588397979736, 4.401585102081299]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 3.0, 6.0, 13.0, 15.0, 16.0, 11.0, 12.0, 21.0, 27.0, 24.0, 25.0, 35.0, 37.0, 26.0, 43.0, 33.0, 39.0, 41.0, 47.0, 46.0, 46.0, 42.0, 40.0, 36.0, 27.0, 39.0, 34.0, 19.0, 31.0, 17.0, 32.0, 12.0, 22.0, 14.0, 9.0, 13.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.6701035499572754, -3.5632424354553223, -3.4563815593719482, -3.349520444869995, -3.242659330368042, -3.135798454284668, -3.028937339782715, -2.9220762252807617, -2.8152151107788086, -2.7083539962768555, -2.6014931201934814, -2.4946320056915283, -2.387770891189575, -2.280910015106201, -2.174048900604248, -2.067187786102295, -1.960326910018921, -1.8534659147262573, -1.7466048002243042, -1.6397438049316406, -1.5328826904296875, -1.426021695137024, -1.3191606998443604, -1.2122995853424072, -1.1054385900497437, -0.9985775351524353, -0.891716480255127, -0.7848554849624634, -0.677994430065155, -0.5711333751678467, -0.4642723798751831, -0.35741132497787476, -0.2505500316619873, -0.14368899166584015, -0.03682795166969299, 0.07003307342529297, 0.17689412832260132, 0.28375518321990967, 0.39061617851257324, 0.4974772334098816, 0.6043382883071899, 0.7111993432044983, 0.8180603981018066, 0.9249213933944702, 1.0317823886871338, 1.138643503189087, 1.2455044984817505, 1.352365493774414, 1.4592266082763672, 1.5660876035690308, 1.6729487180709839, 1.7798097133636475, 1.8866708278656006, 1.9935318231582642, 2.1003928184509277, 2.207253932952881, 2.314115047454834, 2.420976161956787, 2.527837038040161, 2.6346981525421143, 2.7415592670440674, 2.8484201431274414, 2.9552812576293945, 3.0621423721313477, 3.1690032482147217]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 9.0, 3.0, 2.0, 19.0, 13.0, 41.0, 60.0, 88.0, 153.0, 186.0, 323.0, 506.0, 689.0, 1133.0, 1786.0, 2650.0, 4091.0, 6081.0, 9229.0, 13578.0, 19701.0, 27911.0, 39051.0, 51711.0, 67357.0, 82172.0, 94945.0, 102395.0, 102096.0, 94698.0, 82118.0, 66362.0, 51554.0, 38081.0, 27809.0, 19560.0, 13222.0, 9183.0, 6142.0, 4073.0, 2701.0, 1830.0, 1139.0, 728.0, 537.0, 295.0, 193.0, 122.0, 88.0, 52.0, 34.0, 25.0, 19.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.361328125, -3.259429931640625, -3.15753173828125, -3.055633544921875, -2.9537353515625, -2.851837158203125, -2.74993896484375, -2.648040771484375, -2.546142578125, -2.444244384765625, -2.34234619140625, -2.240447998046875, -2.1385498046875, -2.036651611328125, -1.93475341796875, -1.832855224609375, -1.73095703125, -1.629058837890625, -1.52716064453125, -1.425262451171875, -1.3233642578125, -1.221466064453125, -1.11956787109375, -1.017669677734375, -0.915771484375, -0.813873291015625, -0.71197509765625, -0.610076904296875, -0.5081787109375, -0.406280517578125, -0.30438232421875, -0.202484130859375, -0.1005859375, 0.001312255859375, 0.10321044921875, 0.205108642578125, 0.3070068359375, 0.408905029296875, 0.51080322265625, 0.612701416015625, 0.714599609375, 0.816497802734375, 0.91839599609375, 1.020294189453125, 1.1221923828125, 1.224090576171875, 1.32598876953125, 1.427886962890625, 1.52978515625, 1.631683349609375, 1.73358154296875, 1.835479736328125, 1.9373779296875, 2.039276123046875, 2.14117431640625, 2.243072509765625, 2.344970703125, 2.446868896484375, 2.54876708984375, 2.650665283203125, 2.7525634765625, 2.854461669921875, 2.95635986328125, 3.058258056640625, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 13.0, 15.0, 21.0, 14.0, 23.0, 32.0, 39.0, 26.0, 33.0, 36.0, 32.0, 30.0, 33.0, 36.0, 38.0, 53.0, 39.0, 45.0, 36.0, 38.0, 34.0, 28.0, 41.0, 25.0, 32.0, 22.0, 29.0, 15.0, 21.0, 17.0, 10.0, 9.0, 18.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.447265625, -3.344970703125, -3.24267578125, -3.140380859375, -3.0380859375, -2.935791015625, -2.83349609375, -2.731201171875, -2.62890625, -2.526611328125, -2.42431640625, -2.322021484375, -2.2197265625, -2.117431640625, -2.01513671875, -1.912841796875, -1.810546875, -1.708251953125, -1.60595703125, -1.503662109375, -1.4013671875, -1.299072265625, -1.19677734375, -1.094482421875, -0.9921875, -0.889892578125, -0.78759765625, -0.685302734375, -0.5830078125, -0.480712890625, -0.37841796875, -0.276123046875, -0.173828125, -0.071533203125, 0.03076171875, 0.133056640625, 0.2353515625, 0.337646484375, 0.43994140625, 0.542236328125, 0.64453125, 0.746826171875, 0.84912109375, 0.951416015625, 1.0537109375, 1.156005859375, 1.25830078125, 1.360595703125, 1.462890625, 1.565185546875, 1.66748046875, 1.769775390625, 1.8720703125, 1.974365234375, 2.07666015625, 2.178955078125, 2.28125, 2.383544921875, 2.48583984375, 2.588134765625, 2.6904296875, 2.792724609375, 2.89501953125, 2.997314453125, 3.099609375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 25.0, 23.0, 54.0, 83.0, 93.0, 195.0, 318.0, 519.0, 810.0, 1446.0, 2322.0, 3945.0, 6564.0, 10437.0, 16807.0, 26084.0, 39631.0, 57727.0, 78152.0, 99556.0, 115591.0, 121551.0, 116269.0, 100996.0, 79646.0, 58073.0, 40366.0, 26835.0, 17084.0, 10741.0, 6526.0, 3997.0, 2389.0, 1450.0, 866.0, 535.0, 337.0, 198.0, 123.0, 66.0, 49.0, 19.0, 14.0, 14.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.681640625, -3.564849853515625, -3.44805908203125, -3.331268310546875, -3.2144775390625, -3.097686767578125, -2.98089599609375, -2.864105224609375, -2.747314453125, -2.630523681640625, -2.51373291015625, -2.396942138671875, -2.2801513671875, -2.163360595703125, -2.04656982421875, -1.929779052734375, -1.81298828125, -1.696197509765625, -1.57940673828125, -1.462615966796875, -1.3458251953125, -1.229034423828125, -1.11224365234375, -0.995452880859375, -0.878662109375, -0.761871337890625, -0.64508056640625, -0.528289794921875, -0.4114990234375, -0.294708251953125, -0.17791748046875, -0.061126708984375, 0.0556640625, 0.172454833984375, 0.28924560546875, 0.406036376953125, 0.5228271484375, 0.639617919921875, 0.75640869140625, 0.873199462890625, 0.989990234375, 1.106781005859375, 1.22357177734375, 1.340362548828125, 1.4571533203125, 1.573944091796875, 1.69073486328125, 1.807525634765625, 1.92431640625, 2.041107177734375, 2.15789794921875, 2.274688720703125, 2.3914794921875, 2.508270263671875, 2.62506103515625, 2.741851806640625, 2.858642578125, 2.975433349609375, 3.09222412109375, 3.209014892578125, 3.3258056640625, 3.442596435546875, 3.55938720703125, 3.676177978515625, 3.79296875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 1.0, 8.0, 12.0, 10.0, 10.0, 12.0, 21.0, 17.0, 24.0, 21.0, 25.0, 16.0, 29.0, 36.0, 32.0, 46.0, 37.0, 43.0, 37.0, 43.0, 50.0, 36.0, 43.0, 41.0, 40.0, 39.0, 28.0, 33.0, 31.0, 26.0, 19.0, 27.0, 15.0, 12.0, 15.0, 14.0, 6.0, 10.0, 9.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.103607177734375, -2.03533935546875, -1.967071533203125, -1.8988037109375, -1.830535888671875, -1.76226806640625, -1.694000244140625, -1.625732421875, -1.557464599609375, -1.48919677734375, -1.420928955078125, -1.3526611328125, -1.284393310546875, -1.21612548828125, -1.147857666015625, -1.07958984375, -1.011322021484375, -0.94305419921875, -0.874786376953125, -0.8065185546875, -0.738250732421875, -0.66998291015625, -0.601715087890625, -0.533447265625, -0.465179443359375, -0.39691162109375, -0.328643798828125, -0.2603759765625, -0.192108154296875, -0.12384033203125, -0.055572509765625, 0.0126953125, 0.080963134765625, 0.14923095703125, 0.217498779296875, 0.2857666015625, 0.354034423828125, 0.42230224609375, 0.490570068359375, 0.558837890625, 0.627105712890625, 0.69537353515625, 0.763641357421875, 0.8319091796875, 0.900177001953125, 0.96844482421875, 1.036712646484375, 1.10498046875, 1.173248291015625, 1.24151611328125, 1.309783935546875, 1.3780517578125, 1.446319580078125, 1.51458740234375, 1.582855224609375, 1.651123046875, 1.719390869140625, 1.78765869140625, 1.855926513671875, 1.9241943359375, 1.992462158203125, 2.06072998046875, 2.128997802734375, 2.197265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 7.0, 9.0, 14.0, 26.0, 35.0, 54.0, 74.0, 114.0, 171.0, 214.0, 309.0, 464.0, 659.0, 1069.0, 1631.0, 2518.0, 4450.0, 8460.0, 17438.0, 38248.0, 89579.0, 190745.0, 277061.0, 217166.0, 107261.0, 46866.0, 20808.0, 9741.0, 5282.0, 2869.0, 1758.0, 1043.0, 773.0, 482.0, 371.0, 228.0, 183.0, 123.0, 83.0, 43.0, 30.0, 25.0, 27.0, 17.0, 12.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.968170166015625, -3.84649658203125, -3.724822998046875, -3.6031494140625, -3.481475830078125, -3.35980224609375, -3.238128662109375, -3.116455078125, -2.994781494140625, -2.87310791015625, -2.751434326171875, -2.6297607421875, -2.508087158203125, -2.38641357421875, -2.264739990234375, -2.14306640625, -2.021392822265625, -1.89971923828125, -1.778045654296875, -1.6563720703125, -1.534698486328125, -1.41302490234375, -1.291351318359375, -1.169677734375, -1.048004150390625, -0.92633056640625, -0.804656982421875, -0.6829833984375, -0.561309814453125, -0.43963623046875, -0.317962646484375, -0.1962890625, -0.074615478515625, 0.04705810546875, 0.168731689453125, 0.2904052734375, 0.412078857421875, 0.53375244140625, 0.655426025390625, 0.777099609375, 0.898773193359375, 1.02044677734375, 1.142120361328125, 1.2637939453125, 1.385467529296875, 1.50714111328125, 1.628814697265625, 1.75048828125, 1.872161865234375, 1.99383544921875, 2.115509033203125, 2.2371826171875, 2.358856201171875, 2.48052978515625, 2.602203369140625, 2.723876953125, 2.845550537109375, 2.96722412109375, 3.088897705078125, 3.2105712890625, 3.332244873046875, 3.45391845703125, 3.575592041015625, 3.697265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 23.0, 20.0, 38.0, 32.0, 57.0, 57.0, 95.0, 85.0, 123.0, 93.0, 78.0, 56.0, 70.0, 35.0, 29.0, 25.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0005211830139160156, -0.0005088746547698975, -0.0004965662956237793, -0.00048425793647766113, -0.00047194957733154297, -0.0004596412181854248, -0.00044733285903930664, -0.0004350244998931885, -0.0004227161407470703, -0.00041040778160095215, -0.000398099422454834, -0.0003857910633087158, -0.00037348270416259766, -0.0003611743450164795, -0.00034886598587036133, -0.00033655762672424316, -0.000324249267578125, -0.00031194090843200684, -0.00029963254928588867, -0.0002873241901397705, -0.00027501583099365234, -0.0002627074718475342, -0.000250399112701416, -0.00023809075355529785, -0.0002257823944091797, -0.00021347403526306152, -0.00020116567611694336, -0.0001888573169708252, -0.00017654895782470703, -0.00016424059867858887, -0.0001519322395324707, -0.00013962388038635254, -0.00012731552124023438, -0.00011500716209411621, -0.00010269880294799805, -9.039044380187988e-05, -7.808208465576172e-05, -6.577372550964355e-05, -5.346536636352539e-05, -4.1157007217407227e-05, -2.8848648071289062e-05, -1.65402889251709e-05, -4.231929779052734e-06, 8.07642936706543e-06, 2.0384788513183594e-05, 3.269314765930176e-05, 4.500150680541992e-05, 5.7309865951538086e-05, 6.961822509765625e-05, 8.192658424377441e-05, 9.423494338989258e-05, 0.00010654330253601074, 0.0001188516616821289, 0.00013116002082824707, 0.00014346837997436523, 0.0001557767391204834, 0.00016808509826660156, 0.00018039345741271973, 0.0001927018165588379, 0.00020501017570495605, 0.00021731853485107422, 0.00022962689399719238, 0.00024193525314331055, 0.0002542436122894287, 0.0002665519714355469]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 20.0, 27.0, 33.0, 48.0, 85.0, 124.0, 174.0, 317.0, 464.0, 704.0, 1134.0, 1798.0, 3086.0, 5074.0, 8710.0, 14711.0, 24937.0, 41823.0, 68069.0, 102617.0, 138919.0, 159228.0, 150393.0, 117837.0, 81310.0, 51355.0, 30510.0, 18253.0, 10589.0, 6284.0, 3758.0, 2324.0, 1433.0, 816.0, 580.0, 329.0, 230.0, 150.0, 95.0, 63.0, 52.0, 26.0, 18.0, 14.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.0050048828125, -1.939697265625, -1.8743896484375, -1.80908203125, -1.7437744140625, -1.678466796875, -1.6131591796875, -1.5478515625, -1.4825439453125, -1.417236328125, -1.3519287109375, -1.28662109375, -1.2213134765625, -1.156005859375, -1.0906982421875, -1.025390625, -0.9600830078125, -0.894775390625, -0.8294677734375, -0.76416015625, -0.6988525390625, -0.633544921875, -0.5682373046875, -0.5029296875, -0.4376220703125, -0.372314453125, -0.3070068359375, -0.24169921875, -0.1763916015625, -0.111083984375, -0.0457763671875, 0.01953125, 0.0848388671875, 0.150146484375, 0.2154541015625, 0.28076171875, 0.3460693359375, 0.411376953125, 0.4766845703125, 0.5419921875, 0.6072998046875, 0.672607421875, 0.7379150390625, 0.80322265625, 0.8685302734375, 0.933837890625, 0.9991455078125, 1.064453125, 1.1297607421875, 1.195068359375, 1.2603759765625, 1.32568359375, 1.3909912109375, 1.456298828125, 1.5216064453125, 1.5869140625, 1.6522216796875, 1.717529296875, 1.7828369140625, 1.84814453125, 1.9134521484375, 1.978759765625, 2.0440673828125, 2.109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 7.0, 23.0, 14.0, 19.0, 19.0, 25.0, 28.0, 42.0, 45.0, 67.0, 62.0, 57.0, 51.0, 63.0, 66.0, 62.0, 56.0, 50.0, 41.0, 29.0, 35.0, 25.0, 19.0, 17.0, 19.0, 12.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.750335693359375, -0.72283935546875, -0.695343017578125, -0.6678466796875, -0.640350341796875, -0.61285400390625, -0.585357666015625, -0.557861328125, -0.530364990234375, -0.50286865234375, -0.475372314453125, -0.4478759765625, -0.420379638671875, -0.39288330078125, -0.365386962890625, -0.337890625, -0.310394287109375, -0.28289794921875, -0.255401611328125, -0.2279052734375, -0.200408935546875, -0.17291259765625, -0.145416259765625, -0.117919921875, -0.090423583984375, -0.06292724609375, -0.035430908203125, -0.0079345703125, 0.019561767578125, 0.04705810546875, 0.074554443359375, 0.10205078125, 0.129547119140625, 0.15704345703125, 0.184539794921875, 0.2120361328125, 0.239532470703125, 0.26702880859375, 0.294525146484375, 0.322021484375, 0.349517822265625, 0.37701416015625, 0.404510498046875, 0.4320068359375, 0.459503173828125, 0.48699951171875, 0.514495849609375, 0.5419921875, 0.569488525390625, 0.59698486328125, 0.624481201171875, 0.6519775390625, 0.679473876953125, 0.70697021484375, 0.734466552734375, 0.761962890625, 0.789459228515625, 0.81695556640625, 0.844451904296875, 0.8719482421875, 0.899444580078125, 0.92694091796875, 0.954437255859375, 0.98193359375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 8.0, 8.0, 12.0, 16.0, 12.0, 11.0, 9.0, 20.0, 20.0, 26.0, 29.0, 31.0, 44.0, 31.0, 44.0, 47.0, 43.0, 34.0, 38.0, 56.0, 45.0, 43.0, 42.0, 34.0, 39.0, 44.0, 30.0, 23.0, 20.0, 15.0, 23.0, 18.0, 13.0, 10.0, 12.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3753297328948975, -3.2676143646240234, -3.1598987579345703, -3.0521833896636963, -2.9444680213928223, -2.8367526531219482, -2.729037284851074, -2.621321678161621, -2.513606309890747, -2.405890941619873, -2.29817533493042, -2.190459966659546, -2.082744598388672, -1.9750292301177979, -1.8673137426376343, -1.7595982551574707, -1.6518828868865967, -1.5441675186157227, -1.436452031135559, -1.3287365436553955, -1.2210211753845215, -1.1133058071136475, -1.0055903196334839, -0.8978748917579651, -0.7901594638824463, -0.6824440360069275, -0.5747286081314087, -0.4670131802558899, -0.3592977523803711, -0.2515823245048523, -0.1438668966293335, -0.0361514687538147, 0.0715641975402832, 0.179279625415802, 0.2869950532913208, 0.3947104811668396, 0.5024259090423584, 0.6101413369178772, 0.717856764793396, 0.8255721926689148, 0.9332876205444336, 1.0410029888153076, 1.1487184762954712, 1.2564339637756348, 1.3641493320465088, 1.4718647003173828, 1.5795801877975464, 1.68729567527771, 1.795011043548584, 1.902726411819458, 2.010441780090332, 2.118157386779785, 2.225872755050659, 2.333588123321533, 2.4413037300109863, 2.5490190982818604, 2.6567344665527344, 2.7644498348236084, 2.8721652030944824, 2.9798808097839355, 3.0875961780548096, 3.1953115463256836, 3.3030271530151367, 3.4107425212860107, 3.5184578895568848]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 7.0, 13.0, 15.0, 25.0, 21.0, 14.0, 22.0, 27.0, 29.0, 25.0, 34.0, 38.0, 31.0, 39.0, 52.0, 41.0, 37.0, 47.0, 37.0, 49.0, 57.0, 22.0, 32.0, 34.0, 26.0, 19.0, 26.0, 23.0, 21.0, 12.0, 10.0, 19.0, 19.0, 12.0, 8.0, 9.0, 5.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.945760726928711, -2.8403706550598145, -2.734980583190918, -2.6295905113220215, -2.524200677871704, -2.4188106060028076, -2.313420534133911, -2.2080304622650146, -2.1026406288146973, -1.9972505569458008, -1.8918606042861938, -1.7864705324172974, -1.6810805797576904, -1.575690507888794, -1.4703004360198975, -1.364910364151001, -1.2595202922821045, -1.154130220413208, -1.048740267753601, -0.9433501958847046, -0.8379601836204529, -0.7325701713562012, -0.6271800994873047, -0.521790087223053, -0.41640007495880127, -0.31101006269454956, -0.20562002062797546, -0.10022997856140137, 0.005160033702850342, 0.11055004596710205, 0.21594011783599854, 0.32133013010025024, 0.42672038078308105, 0.5321103930473328, 0.6375004053115845, 0.742890477180481, 0.8482804894447327, 0.9536705017089844, 1.0590605735778809, 1.1644506454467773, 1.2698405981063843, 1.3752306699752808, 1.4806206226348877, 1.5860106945037842, 1.6914007663726807, 1.7967907190322876, 1.902180790901184, 2.007570743560791, 2.1129608154296875, 2.218350887298584, 2.3237409591674805, 2.429131031036377, 2.5345208644866943, 2.639910936355591, 2.7453010082244873, 2.850691080093384, 2.956080913543701, 3.0614709854125977, 3.166861057281494, 3.2722511291503906, 3.377640962600708, 3.4830310344696045, 3.588421106338501, 3.6938111782073975, 3.799201250076294]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 13.0, 42.0, 50.0, 90.0, 144.0, 253.0, 415.0, 766.0, 1288.0, 2212.0, 3723.0, 6901.0, 12516.0, 22660.0, 40935.0, 75409.0, 135952.0, 239532.0, 395004.0, 572624.0, 692871.0, 669715.0, 520854.0, 343113.0, 202895.0, 114621.0, 62913.0, 34303.0, 18776.0, 10421.0, 5706.0, 3186.0, 1796.0, 1026.0, 627.0, 345.0, 204.0, 152.0, 86.0, 39.0, 32.0, 23.0, 12.0, 7.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.263671875, -3.15789794921875, -3.0521240234375, -2.94635009765625, -2.840576171875, -2.73480224609375, -2.6290283203125, -2.52325439453125, -2.41748046875, -2.31170654296875, -2.2059326171875, -2.10015869140625, -1.994384765625, -1.88861083984375, -1.7828369140625, -1.67706298828125, -1.5712890625, -1.46551513671875, -1.3597412109375, -1.25396728515625, -1.148193359375, -1.04241943359375, -0.9366455078125, -0.83087158203125, -0.72509765625, -0.61932373046875, -0.5135498046875, -0.40777587890625, -0.302001953125, -0.19622802734375, -0.0904541015625, 0.01531982421875, 0.12109375, 0.22686767578125, 0.3326416015625, 0.43841552734375, 0.544189453125, 0.64996337890625, 0.7557373046875, 0.86151123046875, 0.96728515625, 1.07305908203125, 1.1788330078125, 1.28460693359375, 1.390380859375, 1.49615478515625, 1.6019287109375, 1.70770263671875, 1.8134765625, 1.91925048828125, 2.0250244140625, 2.13079833984375, 2.236572265625, 2.34234619140625, 2.4481201171875, 2.55389404296875, 2.65966796875, 2.76544189453125, 2.8712158203125, 2.97698974609375, 3.082763671875, 3.18853759765625, 3.2943115234375, 3.40008544921875, 3.505859375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 6.0, 18.0, 16.0, 17.0, 16.0, 21.0, 21.0, 17.0, 23.0, 33.0, 27.0, 42.0, 40.0, 32.0, 45.0, 51.0, 40.0, 53.0, 42.0, 36.0, 51.0, 48.0, 40.0, 26.0, 27.0, 27.0, 23.0, 15.0, 23.0, 16.0, 23.0, 13.0, 12.0, 7.0, 8.0, 4.0, 6.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.29656982421875, -2.2122802734375, -2.12799072265625, -2.043701171875, -1.95941162109375, -1.8751220703125, -1.79083251953125, -1.70654296875, -1.62225341796875, -1.5379638671875, -1.45367431640625, -1.369384765625, -1.28509521484375, -1.2008056640625, -1.11651611328125, -1.0322265625, -0.94793701171875, -0.8636474609375, -0.77935791015625, -0.695068359375, -0.61077880859375, -0.5264892578125, -0.44219970703125, -0.35791015625, -0.27362060546875, -0.1893310546875, -0.10504150390625, -0.020751953125, 0.06353759765625, 0.1478271484375, 0.23211669921875, 0.31640625, 0.40069580078125, 0.4849853515625, 0.56927490234375, 0.653564453125, 0.73785400390625, 0.8221435546875, 0.90643310546875, 0.99072265625, 1.07501220703125, 1.1593017578125, 1.24359130859375, 1.327880859375, 1.41217041015625, 1.4964599609375, 1.58074951171875, 1.6650390625, 1.74932861328125, 1.8336181640625, 1.91790771484375, 2.002197265625, 2.08648681640625, 2.1707763671875, 2.25506591796875, 2.33935546875, 2.42364501953125, 2.5079345703125, 2.59222412109375, 2.676513671875, 2.76080322265625, 2.8450927734375, 2.92938232421875, 3.013671875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 28.0, 29.0, 44.0, 66.0, 110.0, 171.0, 317.0, 460.0, 730.0, 1145.0, 1851.0, 3119.0, 4697.0, 7517.0, 11720.0, 18551.0, 28126.0, 44187.0, 65869.0, 98796.0, 142659.0, 201026.0, 270242.0, 344086.0, 409945.0, 450180.0, 448690.0, 407470.0, 342459.0, 268034.0, 197844.0, 140808.0, 96534.0, 65353.0, 43292.0, 28456.0, 17860.0, 11682.0, 7422.0, 4683.0, 2922.0, 1929.0, 1211.0, 743.0, 440.0, 297.0, 170.0, 104.0, 83.0, 37.0, 30.0, 24.0, 10.0, 10.0, 5.0, 5.0, 1.0], "bins": [-2.427734375, -2.3541259765625, -2.280517578125, -2.2069091796875, -2.13330078125, -2.0596923828125, -1.986083984375, -1.9124755859375, -1.8388671875, -1.7652587890625, -1.691650390625, -1.6180419921875, -1.54443359375, -1.4708251953125, -1.397216796875, -1.3236083984375, -1.25, -1.1763916015625, -1.102783203125, -1.0291748046875, -0.95556640625, -0.8819580078125, -0.808349609375, -0.7347412109375, -0.6611328125, -0.5875244140625, -0.513916015625, -0.4403076171875, -0.36669921875, -0.2930908203125, -0.219482421875, -0.1458740234375, -0.072265625, 0.0013427734375, 0.074951171875, 0.1485595703125, 0.22216796875, 0.2957763671875, 0.369384765625, 0.4429931640625, 0.5166015625, 0.5902099609375, 0.663818359375, 0.7374267578125, 0.81103515625, 0.8846435546875, 0.958251953125, 1.0318603515625, 1.10546875, 1.1790771484375, 1.252685546875, 1.3262939453125, 1.39990234375, 1.4735107421875, 1.547119140625, 1.6207275390625, 1.6943359375, 1.7679443359375, 1.841552734375, 1.9151611328125, 1.98876953125, 2.0623779296875, 2.135986328125, 2.2095947265625, 2.283203125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 1.0, 6.0, 8.0, 13.0, 20.0, 15.0, 15.0, 32.0, 43.0, 63.0, 44.0, 59.0, 69.0, 90.0, 91.0, 114.0, 138.0, 152.0, 169.0, 176.0, 178.0, 220.0, 212.0, 223.0, 223.0, 204.0, 178.0, 187.0, 160.0, 173.0, 117.0, 122.0, 101.0, 71.0, 77.0, 70.0, 59.0, 44.0, 23.0, 23.0, 20.0, 18.0, 14.0, 11.0, 6.0, 10.0, 4.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.195556640625, -1.15966796875, -1.123779296875, -1.087890625, -1.052001953125, -1.01611328125, -0.980224609375, -0.9443359375, -0.908447265625, -0.87255859375, -0.836669921875, -0.80078125, -0.764892578125, -0.72900390625, -0.693115234375, -0.6572265625, -0.621337890625, -0.58544921875, -0.549560546875, -0.513671875, -0.477783203125, -0.44189453125, -0.406005859375, -0.3701171875, -0.334228515625, -0.29833984375, -0.262451171875, -0.2265625, -0.190673828125, -0.15478515625, -0.118896484375, -0.0830078125, -0.047119140625, -0.01123046875, 0.024658203125, 0.060546875, 0.096435546875, 0.13232421875, 0.168212890625, 0.2041015625, 0.239990234375, 0.27587890625, 0.311767578125, 0.34765625, 0.383544921875, 0.41943359375, 0.455322265625, 0.4912109375, 0.527099609375, 0.56298828125, 0.598876953125, 0.634765625, 0.670654296875, 0.70654296875, 0.742431640625, 0.7783203125, 0.814208984375, 0.85009765625, 0.885986328125, 0.921875, 0.957763671875, 0.99365234375, 1.029541015625, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 1.0, 3.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 17.0, 19.0, 15.0, 28.0, 27.0, 31.0, 30.0, 35.0, 31.0, 37.0, 34.0, 41.0, 34.0, 47.0, 40.0, 45.0, 38.0, 33.0, 41.0, 40.0, 42.0, 24.0, 25.0, 27.0, 25.0, 19.0, 17.0, 12.0, 10.0, 12.0, 16.0, 8.0, 7.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.152416706085205, -3.0596210956573486, -2.966825485229492, -2.874030113220215, -2.7812345027923584, -2.688438892364502, -2.5956432819366455, -2.502847671508789, -2.4100522994995117, -2.3172566890716553, -2.224461078643799, -2.1316657066345215, -2.038870096206665, -1.9460744857788086, -1.8532788753509521, -1.7604832649230957, -1.6676876544952393, -1.5748920440673828, -1.482096552848816, -1.3893009424209595, -1.2965054512023926, -1.2037098407745361, -1.1109142303466797, -1.0181186199188232, -0.9253231287002563, -0.8325275778770447, -0.739732027053833, -0.6469364166259766, -0.5541408658027649, -0.4613453149795532, -0.3685497045516968, -0.2757541537284851, -0.18295836448669434, -0.09016279876232147, 0.0026327669620513916, 0.09542834758758545, 0.18822389841079712, 0.2810194492340088, 0.37381505966186523, 0.4666106104850769, 0.5594061613082886, 0.6522017121315002, 0.7449972629547119, 0.8377928733825684, 0.93058842420578, 1.0233839750289917, 1.1161795854568481, 1.208975076675415, 1.3017706871032715, 1.394566297531128, 1.4873617887496948, 1.5801573991775513, 1.6729528903961182, 1.7657485008239746, 1.858544111251831, 1.9513397216796875, 2.044135093688965, 2.1369307041168213, 2.2297263145446777, 2.322521686553955, 2.4153172969818115, 2.508112907409668, 2.6009085178375244, 2.693704128265381, 2.7864997386932373]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 22.0, 14.0, 19.0, 14.0, 15.0, 28.0, 24.0, 26.0, 32.0, 35.0, 34.0, 39.0, 39.0, 36.0, 40.0, 42.0, 51.0, 39.0, 33.0, 33.0, 41.0, 32.0, 40.0, 24.0, 20.0, 30.0, 16.0, 23.0, 21.0, 17.0, 13.0, 13.0, 15.0, 7.0, 9.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.8398711681365967, -2.7512996196746826, -2.6627280712127686, -2.5741565227508545, -2.4855849742889404, -2.3970134258270264, -2.3084418773651123, -2.2198703289031982, -2.131298780441284, -2.04272723197937, -1.954155683517456, -1.865584135055542, -1.777012586593628, -1.6884410381317139, -1.5998694896697998, -1.5112979412078857, -1.4227263927459717, -1.3341548442840576, -1.2455832958221436, -1.1570117473602295, -1.0684401988983154, -0.9798686504364014, -0.8912971019744873, -0.8027255535125732, -0.7141540050506592, -0.6255824565887451, -0.537010908126831, -0.448439359664917, -0.35986781120300293, -0.27129626274108887, -0.1827247142791748, -0.09415316581726074, -0.005581855773925781, 0.08298969268798828, 0.17156124114990234, 0.2601327896118164, 0.34870433807373047, 0.43727588653564453, 0.5258474349975586, 0.6144189834594727, 0.7029905319213867, 0.7915620803833008, 0.8801336288452148, 0.9687051773071289, 1.057276725769043, 1.145848274230957, 1.234419822692871, 1.3229913711547852, 1.4115629196166992, 1.5001344680786133, 1.5887060165405273, 1.6772775650024414, 1.7658491134643555, 1.8544206619262695, 1.9429922103881836, 2.0315637588500977, 2.1201353073120117, 2.208706855773926, 2.29727840423584, 2.385849952697754, 2.474421501159668, 2.562993049621582, 2.651564598083496, 2.74013614654541, 2.828707695007324]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 2.0, 2.0, 4.0, 13.0, 21.0, 22.0, 29.0, 49.0, 68.0, 92.0, 115.0, 192.0, 271.0, 337.0, 484.0, 699.0, 1083.0, 1524.0, 2506.0, 3839.0, 6468.0, 11483.0, 22072.0, 46646.0, 104451.0, 237465.0, 313001.0, 157298.0, 68453.0, 31705.0, 15762.0, 8478.0, 4894.0, 3008.0, 1921.0, 1273.0, 818.0, 602.0, 399.0, 289.0, 204.0, 131.0, 117.0, 73.0, 55.0, 37.0, 32.0, 12.0, 17.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.9017333984375, -3.768310546875, -3.6348876953125, -3.50146484375, -3.3680419921875, -3.234619140625, -3.1011962890625, -2.9677734375, -2.8343505859375, -2.700927734375, -2.5675048828125, -2.43408203125, -2.3006591796875, -2.167236328125, -2.0338134765625, -1.900390625, -1.7669677734375, -1.633544921875, -1.5001220703125, -1.36669921875, -1.2332763671875, -1.099853515625, -0.9664306640625, -0.8330078125, -0.6995849609375, -0.566162109375, -0.4327392578125, -0.29931640625, -0.1658935546875, -0.032470703125, 0.1009521484375, 0.234375, 0.3677978515625, 0.501220703125, 0.6346435546875, 0.76806640625, 0.9014892578125, 1.034912109375, 1.1683349609375, 1.3017578125, 1.4351806640625, 1.568603515625, 1.7020263671875, 1.83544921875, 1.9688720703125, 2.102294921875, 2.2357177734375, 2.369140625, 2.5025634765625, 2.635986328125, 2.7694091796875, 2.90283203125, 3.0362548828125, 3.169677734375, 3.3031005859375, 3.4365234375, 3.5699462890625, 3.703369140625, 3.8367919921875, 3.97021484375, 4.1036376953125, 4.237060546875, 4.3704833984375, 4.50390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 10.0, 6.0, 11.0, 16.0, 16.0, 16.0, 19.0, 23.0, 38.0, 32.0, 21.0, 33.0, 30.0, 28.0, 46.0, 38.0, 36.0, 42.0, 35.0, 39.0, 42.0, 39.0, 22.0, 46.0, 29.0, 31.0, 32.0, 27.0, 22.0, 20.0, 21.0, 13.0, 14.0, 14.0, 14.0, 8.0, 8.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.80859375, -2.71929931640625, -2.6300048828125, -2.54071044921875, -2.451416015625, -2.36212158203125, -2.2728271484375, -2.18353271484375, -2.09423828125, -2.00494384765625, -1.9156494140625, -1.82635498046875, -1.737060546875, -1.64776611328125, -1.5584716796875, -1.46917724609375, -1.3798828125, -1.29058837890625, -1.2012939453125, -1.11199951171875, -1.022705078125, -0.93341064453125, -0.8441162109375, -0.75482177734375, -0.66552734375, -0.57623291015625, -0.4869384765625, -0.39764404296875, -0.308349609375, -0.21905517578125, -0.1297607421875, -0.04046630859375, 0.048828125, 0.13812255859375, 0.2274169921875, 0.31671142578125, 0.406005859375, 0.49530029296875, 0.5845947265625, 0.67388916015625, 0.76318359375, 0.85247802734375, 0.9417724609375, 1.03106689453125, 1.120361328125, 1.20965576171875, 1.2989501953125, 1.38824462890625, 1.4775390625, 1.56683349609375, 1.6561279296875, 1.74542236328125, 1.834716796875, 1.92401123046875, 2.0133056640625, 2.10260009765625, 2.19189453125, 2.28118896484375, 2.3704833984375, 2.45977783203125, 2.549072265625, 2.63836669921875, 2.7276611328125, 2.81695556640625, 2.90625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 14.0, 27.0, 29.0, 42.0, 56.0, 89.0, 127.0, 200.0, 265.0, 501.0, 719.0, 1161.0, 1938.0, 3525.0, 6547.0, 13789.0, 31677.0, 84733.0, 254156.0, 391021.0, 159702.0, 54669.0, 21714.0, 9856.0, 5035.0, 2731.0, 1539.0, 979.0, 544.0, 339.0, 236.0, 173.0, 116.0, 85.0, 56.0, 34.0, 30.0, 20.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.539306640625, -3.41845703125, -3.297607421875, -3.1767578125, -3.055908203125, -2.93505859375, -2.814208984375, -2.693359375, -2.572509765625, -2.45166015625, -2.330810546875, -2.2099609375, -2.089111328125, -1.96826171875, -1.847412109375, -1.7265625, -1.605712890625, -1.48486328125, -1.364013671875, -1.2431640625, -1.122314453125, -1.00146484375, -0.880615234375, -0.759765625, -0.638916015625, -0.51806640625, -0.397216796875, -0.2763671875, -0.155517578125, -0.03466796875, 0.086181640625, 0.20703125, 0.327880859375, 0.44873046875, 0.569580078125, 0.6904296875, 0.811279296875, 0.93212890625, 1.052978515625, 1.173828125, 1.294677734375, 1.41552734375, 1.536376953125, 1.6572265625, 1.778076171875, 1.89892578125, 2.019775390625, 2.140625, 2.261474609375, 2.38232421875, 2.503173828125, 2.6240234375, 2.744873046875, 2.86572265625, 2.986572265625, 3.107421875, 3.228271484375, 3.34912109375, 3.469970703125, 3.5908203125, 3.711669921875, 3.83251953125, 3.953369140625, 4.07421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 8.0, 10.0, 10.0, 16.0, 23.0, 28.0, 23.0, 31.0, 35.0, 32.0, 40.0, 44.0, 29.0, 52.0, 55.0, 45.0, 45.0, 41.0, 42.0, 47.0, 33.0, 37.0, 47.0, 33.0, 28.0, 31.0, 21.0, 22.0, 18.0, 17.0, 15.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.701263427734375, -2.62518310546875, -2.549102783203125, -2.4730224609375, -2.396942138671875, -2.32086181640625, -2.244781494140625, -2.168701171875, -2.092620849609375, -2.01654052734375, -1.940460205078125, -1.8643798828125, -1.788299560546875, -1.71221923828125, -1.636138916015625, -1.56005859375, -1.483978271484375, -1.40789794921875, -1.331817626953125, -1.2557373046875, -1.179656982421875, -1.10357666015625, -1.027496337890625, -0.951416015625, -0.875335693359375, -0.79925537109375, -0.723175048828125, -0.6470947265625, -0.571014404296875, -0.49493408203125, -0.418853759765625, -0.3427734375, -0.266693115234375, -0.19061279296875, -0.114532470703125, -0.0384521484375, 0.037628173828125, 0.11370849609375, 0.189788818359375, 0.265869140625, 0.341949462890625, 0.41802978515625, 0.494110107421875, 0.5701904296875, 0.646270751953125, 0.72235107421875, 0.798431396484375, 0.87451171875, 0.950592041015625, 1.02667236328125, 1.102752685546875, 1.1788330078125, 1.254913330078125, 1.33099365234375, 1.407073974609375, 1.483154296875, 1.559234619140625, 1.63531494140625, 1.711395263671875, 1.7874755859375, 1.863555908203125, 1.93963623046875, 2.015716552734375, 2.091796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 19.0, 19.0, 15.0, 37.0, 43.0, 56.0, 83.0, 112.0, 133.0, 146.0, 205.0, 248.0, 409.0, 535.0, 765.0, 1223.0, 2007.0, 3742.0, 7620.0, 20970.0, 106441.0, 767546.0, 98922.0, 20142.0, 7623.0, 3575.0, 1962.0, 1206.0, 739.0, 500.0, 370.0, 270.0, 219.0, 165.0, 119.0, 88.0, 60.0, 49.0, 40.0, 22.0, 23.0, 16.0, 18.0, 5.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.41796875, -5.25616455078125, -5.0943603515625, -4.93255615234375, -4.770751953125, -4.60894775390625, -4.4471435546875, -4.28533935546875, -4.12353515625, -3.96173095703125, -3.7999267578125, -3.63812255859375, -3.476318359375, -3.31451416015625, -3.1527099609375, -2.99090576171875, -2.8291015625, -2.66729736328125, -2.5054931640625, -2.34368896484375, -2.181884765625, -2.02008056640625, -1.8582763671875, -1.69647216796875, -1.53466796875, -1.37286376953125, -1.2110595703125, -1.04925537109375, -0.887451171875, -0.72564697265625, -0.5638427734375, -0.40203857421875, -0.240234375, -0.07843017578125, 0.0833740234375, 0.24517822265625, 0.406982421875, 0.56878662109375, 0.7305908203125, 0.89239501953125, 1.05419921875, 1.21600341796875, 1.3778076171875, 1.53961181640625, 1.701416015625, 1.86322021484375, 2.0250244140625, 2.18682861328125, 2.3486328125, 2.51043701171875, 2.6722412109375, 2.83404541015625, 2.995849609375, 3.15765380859375, 3.3194580078125, 3.48126220703125, 3.64306640625, 3.80487060546875, 3.9666748046875, 4.12847900390625, 4.290283203125, 4.45208740234375, 4.6138916015625, 4.77569580078125, 4.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 3.0, 12.0, 19.0, 30.0, 55.0, 110.0, 185.0, 244.0, 125.0, 73.0, 43.0, 28.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004253387451171875, -0.00041211768984794617, -0.00039889663457870483, -0.0003856755793094635, -0.00037245452404022217, -0.00035923346877098083, -0.0003460124135017395, -0.00033279135823249817, -0.00031957030296325684, -0.0003063492476940155, -0.00029312819242477417, -0.00027990713715553284, -0.0002666860818862915, -0.00025346502661705017, -0.00024024397134780884, -0.0002270229160785675, -0.00021380186080932617, -0.00020058080554008484, -0.0001873597502708435, -0.00017413869500160217, -0.00016091763973236084, -0.0001476965844631195, -0.00013447552919387817, -0.00012125447392463684, -0.00010803341865539551, -9.481236338615417e-05, -8.159130811691284e-05, -6.837025284767151e-05, -5.5149197578430176e-05, -4.192814230918884e-05, -2.870708703994751e-05, -1.5486031770706177e-05, -2.2649765014648438e-06, 1.095607876777649e-05, 2.4177134037017822e-05, 3.7398189306259155e-05, 5.061924457550049e-05, 6.384029984474182e-05, 7.706135511398315e-05, 9.028241038322449e-05, 0.00010350346565246582, 0.00011672452092170715, 0.00012994557619094849, 0.00014316663146018982, 0.00015638768672943115, 0.00016960874199867249, 0.00018282979726791382, 0.00019605085253715515, 0.00020927190780639648, 0.00022249296307563782, 0.00023571401834487915, 0.0002489350736141205, 0.0002621561288833618, 0.00027537718415260315, 0.0002885982394218445, 0.0003018192946910858, 0.00031504034996032715, 0.0003282614052295685, 0.0003414824604988098, 0.00035470351576805115, 0.0003679245710372925, 0.0003811456263065338, 0.00039436668157577515, 0.0004075877368450165, 0.0004208087921142578]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 11.0, 19.0, 33.0, 56.0, 72.0, 88.0, 133.0, 163.0, 199.0, 288.0, 435.0, 678.0, 1041.0, 1640.0, 2424.0, 3801.0, 6716.0, 12820.0, 29486.0, 90729.0, 436349.0, 337131.0, 71840.0, 24842.0, 11313.0, 6151.0, 3524.0, 2198.0, 1399.0, 947.0, 586.0, 403.0, 274.0, 211.0, 149.0, 116.0, 83.0, 54.0, 44.0, 36.0, 22.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.721282958984375, -3.59686279296875, -3.472442626953125, -3.3480224609375, -3.223602294921875, -3.09918212890625, -2.974761962890625, -2.850341796875, -2.725921630859375, -2.60150146484375, -2.477081298828125, -2.3526611328125, -2.228240966796875, -2.10382080078125, -1.979400634765625, -1.85498046875, -1.730560302734375, -1.60614013671875, -1.481719970703125, -1.3572998046875, -1.232879638671875, -1.10845947265625, -0.984039306640625, -0.859619140625, -0.735198974609375, -0.61077880859375, -0.486358642578125, -0.3619384765625, -0.237518310546875, -0.11309814453125, 0.011322021484375, 0.1357421875, 0.260162353515625, 0.38458251953125, 0.509002685546875, 0.6334228515625, 0.757843017578125, 0.88226318359375, 1.006683349609375, 1.131103515625, 1.255523681640625, 1.37994384765625, 1.504364013671875, 1.6287841796875, 1.753204345703125, 1.87762451171875, 2.002044677734375, 2.12646484375, 2.250885009765625, 2.37530517578125, 2.499725341796875, 2.6241455078125, 2.748565673828125, 2.87298583984375, 2.997406005859375, 3.121826171875, 3.246246337890625, 3.37066650390625, 3.495086669921875, 3.6195068359375, 3.743927001953125, 3.86834716796875, 3.992767333984375, 4.1171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 9.0, 14.0, 13.0, 9.0, 29.0, 42.0, 55.0, 104.0, 188.0, 165.0, 107.0, 62.0, 55.0, 32.0, 20.0, 21.0, 14.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.9459228515625, -0.917236328125, -0.8885498046875, -0.85986328125, -0.8311767578125, -0.802490234375, -0.7738037109375, -0.7451171875, -0.7164306640625, -0.687744140625, -0.6590576171875, -0.63037109375, -0.6016845703125, -0.572998046875, -0.5443115234375, -0.515625, -0.4869384765625, -0.458251953125, -0.4295654296875, -0.40087890625, -0.3721923828125, -0.343505859375, -0.3148193359375, -0.2861328125, -0.2574462890625, -0.228759765625, -0.2000732421875, -0.17138671875, -0.1427001953125, -0.114013671875, -0.0853271484375, -0.056640625, -0.0279541015625, 0.000732421875, 0.0294189453125, 0.05810546875, 0.0867919921875, 0.115478515625, 0.1441650390625, 0.1728515625, 0.2015380859375, 0.230224609375, 0.2589111328125, 0.28759765625, 0.3162841796875, 0.344970703125, 0.3736572265625, 0.40234375, 0.4310302734375, 0.459716796875, 0.4884033203125, 0.51708984375, 0.5457763671875, 0.574462890625, 0.6031494140625, 0.6318359375, 0.6605224609375, 0.689208984375, 0.7178955078125, 0.74658203125, 0.7752685546875, 0.803955078125, 0.8326416015625, 0.861328125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 13.0, 12.0, 6.0, 15.0, 13.0, 26.0, 23.0, 26.0, 27.0, 27.0, 32.0, 28.0, 35.0, 32.0, 36.0, 34.0, 42.0, 32.0, 57.0, 52.0, 44.0, 34.0, 37.0, 32.0, 28.0, 24.0, 33.0, 25.0, 17.0, 17.0, 19.0, 21.0, 19.0, 10.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.174232006072998, -3.0808262825012207, -2.9874205589294434, -2.894014596939087, -2.8006088733673096, -2.7072031497955322, -2.613797426223755, -2.5203914642333984, -2.426985740661621, -2.3335800170898438, -2.2401742935180664, -2.14676833152771, -2.0533626079559326, -1.9599568843841553, -1.866551160812378, -1.773145318031311, -1.6797395944595337, -1.5863338708877563, -1.4929280281066895, -1.399522304534912, -1.3061164617538452, -1.2127107381820679, -1.119304895401001, -1.0258991718292236, -0.9324933886528015, -0.8390876054763794, -0.7456818222999573, -0.6522760391235352, -0.5588703155517578, -0.4654645025730133, -0.3720587491989136, -0.27865296602249146, -0.18524718284606934, -0.09184140712022781, 0.0015643686056137085, 0.09497013688087463, 0.18837592005729675, 0.28178170323371887, 0.3751874566078186, 0.4685932397842407, 0.5619990229606628, 0.655404806137085, 0.7488105893135071, 0.8422163724899292, 0.9356220960617065, 1.0290279388427734, 1.1224336624145508, 1.2158393859863281, 1.309245228767395, 1.4026509523391724, 1.4960567951202393, 1.5894625186920166, 1.6828683614730835, 1.7762740850448608, 1.8696799278259277, 1.963085651397705, 2.0564913749694824, 2.1498970985412598, 2.243302822113037, 2.3367087841033936, 2.430114507675171, 2.5235202312469482, 2.6169259548187256, 2.710331916809082, 2.8037376403808594]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 2.0, 20.0, 16.0, 15.0, 11.0, 15.0, 19.0, 20.0, 28.0, 32.0, 28.0, 29.0, 28.0, 48.0, 49.0, 27.0, 36.0, 45.0, 37.0, 44.0, 39.0, 37.0, 48.0, 34.0, 41.0, 25.0, 20.0, 18.0, 22.0, 29.0, 12.0, 21.0, 21.0, 12.0, 11.0, 13.0, 10.0, 3.0, 9.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.7933664321899414, -2.7040176391601562, -2.614668846130371, -2.525320053100586, -2.4359710216522217, -2.3466222286224365, -2.2572734355926514, -2.167924642562866, -2.078575611114502, -1.9892268180847168, -1.899877905845642, -1.810529112815857, -1.7211802005767822, -1.631831407546997, -1.542482614517212, -1.4531338214874268, -1.3637850284576416, -1.2744362354278564, -1.1850873231887817, -1.0957385301589966, -1.0063896179199219, -0.9170408248901367, -0.8276920318603516, -0.7383431792259216, -0.6489943265914917, -0.5596454739570618, -0.4702966511249542, -0.3809478282928467, -0.29159897565841675, -0.20225012302398682, -0.11290132999420166, -0.02355247735977173, 0.0657963752746582, 0.15514521300792694, 0.24449405074119568, 0.3338428735733032, 0.42319172620773315, 0.5125405788421631, 0.6018893718719482, 0.6912382245063782, 0.7805870771408081, 0.869935929775238, 0.959284782409668, 1.0486335754394531, 1.1379823684692383, 1.227331280708313, 1.3166800737380981, 1.4060289859771729, 1.495377779006958, 1.5847265720367432, 1.6740754842758179, 1.763424277305603, 1.8527731895446777, 1.942121982574463, 2.031470775604248, 2.120819568634033, 2.2101683616638184, 2.2995171546936035, 2.3888659477233887, 2.478214740753174, 2.567563772201538, 2.6569125652313232, 2.7462613582611084, 2.8356101512908936, 2.924959182739258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 14.0, 23.0, 45.0, 66.0, 93.0, 130.0, 221.0, 299.0, 523.0, 730.0, 1283.0, 1939.0, 3103.0, 4794.0, 7696.0, 11811.0, 18349.0, 28291.0, 41647.0, 58858.0, 79424.0, 100235.0, 115517.0, 119991.0, 112949.0, 96590.0, 76039.0, 55562.0, 38503.0, 26410.0, 17105.0, 10993.0, 7077.0, 4440.0, 2772.0, 1825.0, 1125.0, 730.0, 506.0, 347.0, 192.0, 104.0, 62.0, 41.0, 41.0, 22.0, 16.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.765625, -3.65618896484375, -3.5467529296875, -3.43731689453125, -3.327880859375, -3.21844482421875, -3.1090087890625, -2.99957275390625, -2.89013671875, -2.78070068359375, -2.6712646484375, -2.56182861328125, -2.452392578125, -2.34295654296875, -2.2335205078125, -2.12408447265625, -2.0146484375, -1.90521240234375, -1.7957763671875, -1.68634033203125, -1.576904296875, -1.46746826171875, -1.3580322265625, -1.24859619140625, -1.13916015625, -1.02972412109375, -0.9202880859375, -0.81085205078125, -0.701416015625, -0.59197998046875, -0.4825439453125, -0.37310791015625, -0.263671875, -0.15423583984375, -0.0447998046875, 0.06463623046875, 0.174072265625, 0.28350830078125, 0.3929443359375, 0.50238037109375, 0.61181640625, 0.72125244140625, 0.8306884765625, 0.94012451171875, 1.049560546875, 1.15899658203125, 1.2684326171875, 1.37786865234375, 1.4873046875, 1.59674072265625, 1.7061767578125, 1.81561279296875, 1.925048828125, 2.03448486328125, 2.1439208984375, 2.25335693359375, 2.36279296875, 2.47222900390625, 2.5816650390625, 2.69110107421875, 2.800537109375, 2.90997314453125, 3.0194091796875, 3.12884521484375, 3.23828125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 15.0, 16.0, 11.0, 26.0, 23.0, 25.0, 24.0, 24.0, 37.0, 29.0, 34.0, 31.0, 45.0, 39.0, 36.0, 44.0, 37.0, 43.0, 45.0, 31.0, 36.0, 39.0, 39.0, 27.0, 17.0, 29.0, 25.0, 20.0, 15.0, 15.0, 16.0, 11.0, 12.0, 13.0, 9.0, 12.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.330169677734375, -2.24432373046875, -2.158477783203125, -2.0726318359375, -1.986785888671875, -1.90093994140625, -1.815093994140625, -1.729248046875, -1.643402099609375, -1.55755615234375, -1.471710205078125, -1.3858642578125, -1.300018310546875, -1.21417236328125, -1.128326416015625, -1.04248046875, -0.956634521484375, -0.87078857421875, -0.784942626953125, -0.6990966796875, -0.613250732421875, -0.52740478515625, -0.441558837890625, -0.355712890625, -0.269866943359375, -0.18402099609375, -0.098175048828125, -0.0123291015625, 0.073516845703125, 0.15936279296875, 0.245208740234375, 0.3310546875, 0.416900634765625, 0.50274658203125, 0.588592529296875, 0.6744384765625, 0.760284423828125, 0.84613037109375, 0.931976318359375, 1.017822265625, 1.103668212890625, 1.18951416015625, 1.275360107421875, 1.3612060546875, 1.447052001953125, 1.53289794921875, 1.618743896484375, 1.70458984375, 1.790435791015625, 1.87628173828125, 1.962127685546875, 2.0479736328125, 2.133819580078125, 2.21966552734375, 2.305511474609375, 2.391357421875, 2.477203369140625, 2.56304931640625, 2.648895263671875, 2.7347412109375, 2.820587158203125, 2.90643310546875, 2.992279052734375, 3.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 16.0, 21.0, 31.0, 45.0, 95.0, 123.0, 188.0, 301.0, 490.0, 748.0, 1207.0, 1884.0, 3011.0, 4532.0, 7134.0, 11006.0, 16454.0, 25095.0, 36265.0, 50526.0, 67738.0, 85888.0, 101337.0, 110327.0, 110202.0, 101222.0, 85537.0, 67968.0, 50687.0, 35781.0, 24820.0, 16604.0, 11159.0, 7252.0, 4701.0, 2849.0, 1895.0, 1226.0, 820.0, 481.0, 309.0, 207.0, 136.0, 86.0, 51.0, 40.0, 20.0, 14.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.984375, -2.89111328125, -2.7978515625, -2.70458984375, -2.611328125, -2.51806640625, -2.4248046875, -2.33154296875, -2.23828125, -2.14501953125, -2.0517578125, -1.95849609375, -1.865234375, -1.77197265625, -1.6787109375, -1.58544921875, -1.4921875, -1.39892578125, -1.3056640625, -1.21240234375, -1.119140625, -1.02587890625, -0.9326171875, -0.83935546875, -0.74609375, -0.65283203125, -0.5595703125, -0.46630859375, -0.373046875, -0.27978515625, -0.1865234375, -0.09326171875, 0.0, 0.09326171875, 0.1865234375, 0.27978515625, 0.373046875, 0.46630859375, 0.5595703125, 0.65283203125, 0.74609375, 0.83935546875, 0.9326171875, 1.02587890625, 1.119140625, 1.21240234375, 1.3056640625, 1.39892578125, 1.4921875, 1.58544921875, 1.6787109375, 1.77197265625, 1.865234375, 1.95849609375, 2.0517578125, 2.14501953125, 2.23828125, 2.33154296875, 2.4248046875, 2.51806640625, 2.611328125, 2.70458984375, 2.7978515625, 2.89111328125, 2.984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 14.0, 13.0, 15.0, 23.0, 20.0, 23.0, 33.0, 36.0, 44.0, 28.0, 42.0, 27.0, 38.0, 33.0, 43.0, 37.0, 42.0, 43.0, 34.0, 41.0, 37.0, 38.0, 25.0, 26.0, 22.0, 24.0, 20.0, 27.0, 20.0, 17.0, 9.0, 13.0, 10.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7958984375, -1.739959716796875, -1.68402099609375, -1.628082275390625, -1.5721435546875, -1.516204833984375, -1.46026611328125, -1.404327392578125, -1.348388671875, -1.292449951171875, -1.23651123046875, -1.180572509765625, -1.1246337890625, -1.068695068359375, -1.01275634765625, -0.956817626953125, -0.90087890625, -0.844940185546875, -0.78900146484375, -0.733062744140625, -0.6771240234375, -0.621185302734375, -0.56524658203125, -0.509307861328125, -0.453369140625, -0.397430419921875, -0.34149169921875, -0.285552978515625, -0.2296142578125, -0.173675537109375, -0.11773681640625, -0.061798095703125, -0.005859375, 0.050079345703125, 0.10601806640625, 0.161956787109375, 0.2178955078125, 0.273834228515625, 0.32977294921875, 0.385711669921875, 0.441650390625, 0.497589111328125, 0.55352783203125, 0.609466552734375, 0.6654052734375, 0.721343994140625, 0.77728271484375, 0.833221435546875, 0.88916015625, 0.945098876953125, 1.00103759765625, 1.056976318359375, 1.1129150390625, 1.168853759765625, 1.22479248046875, 1.280731201171875, 1.336669921875, 1.392608642578125, 1.44854736328125, 1.504486083984375, 1.5604248046875, 1.616363525390625, 1.67230224609375, 1.728240966796875, 1.7841796875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 16.0, 21.0, 34.0, 35.0, 56.0, 69.0, 114.0, 148.0, 228.0, 311.0, 460.0, 663.0, 1018.0, 1496.0, 2350.0, 3549.0, 5894.0, 9731.0, 17415.0, 33431.0, 66910.0, 132532.0, 217598.0, 231647.0, 153825.0, 79651.0, 39736.0, 20362.0, 11113.0, 6506.0, 3977.0, 2474.0, 1688.0, 1082.0, 768.0, 524.0, 347.0, 229.0, 160.0, 111.0, 89.0, 76.0, 32.0, 19.0, 25.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.34783935546875, -3.2366943359375, -3.12554931640625, -3.014404296875, -2.90325927734375, -2.7921142578125, -2.68096923828125, -2.56982421875, -2.45867919921875, -2.3475341796875, -2.23638916015625, -2.125244140625, -2.01409912109375, -1.9029541015625, -1.79180908203125, -1.6806640625, -1.56951904296875, -1.4583740234375, -1.34722900390625, -1.236083984375, -1.12493896484375, -1.0137939453125, -0.90264892578125, -0.79150390625, -0.68035888671875, -0.5692138671875, -0.45806884765625, -0.346923828125, -0.23577880859375, -0.1246337890625, -0.01348876953125, 0.09765625, 0.20880126953125, 0.3199462890625, 0.43109130859375, 0.542236328125, 0.65338134765625, 0.7645263671875, 0.87567138671875, 0.98681640625, 1.09796142578125, 1.2091064453125, 1.32025146484375, 1.431396484375, 1.54254150390625, 1.6536865234375, 1.76483154296875, 1.8759765625, 1.98712158203125, 2.0982666015625, 2.20941162109375, 2.320556640625, 2.43170166015625, 2.5428466796875, 2.65399169921875, 2.76513671875, 2.87628173828125, 2.9874267578125, 3.09857177734375, 3.209716796875, 3.32086181640625, 3.4320068359375, 3.54315185546875, 3.654296875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 10.0, 15.0, 27.0, 32.0, 42.0, 79.0, 85.0, 96.0, 111.0, 94.0, 71.0, 81.0, 63.0, 47.0, 38.0, 19.0, 18.0, 13.0, 13.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047779083251953125, -0.00046325474977493286, -0.00044871866703033447, -0.0004341825842857361, -0.0004196465015411377, -0.0004051104187965393, -0.0003905743360519409, -0.00037603825330734253, -0.00036150217056274414, -0.00034696608781814575, -0.00033243000507354736, -0.000317893922328949, -0.0003033578395843506, -0.0002888217568397522, -0.0002742856740951538, -0.0002597495913505554, -0.00024521350860595703, -0.00023067742586135864, -0.00021614134311676025, -0.00020160526037216187, -0.00018706917762756348, -0.0001725330948829651, -0.0001579970121383667, -0.0001434609293937683, -0.00012892484664916992, -0.00011438876390457153, -9.985268115997314e-05, -8.531659841537476e-05, -7.078051567077637e-05, -5.624443292617798e-05, -4.170835018157959e-05, -2.71722674369812e-05, -1.2636184692382812e-05, 1.8998980522155762e-06, 1.6435980796813965e-05, 3.0972063541412354e-05, 4.550814628601074e-05, 6.004422903060913e-05, 7.458031177520752e-05, 8.911639451980591e-05, 0.0001036524772644043, 0.00011818856000900269, 0.00013272464275360107, 0.00014726072549819946, 0.00016179680824279785, 0.00017633289098739624, 0.00019086897373199463, 0.00020540505647659302, 0.0002199411392211914, 0.0002344772219657898, 0.0002490133047103882, 0.00026354938745498657, 0.00027808547019958496, 0.00029262155294418335, 0.00030715763568878174, 0.0003216937184333801, 0.0003362298011779785, 0.0003507658839225769, 0.0003653019666671753, 0.0003798380494117737, 0.00039437413215637207, 0.00040891021490097046, 0.00042344629764556885, 0.00043798238039016724, 0.0004525184631347656]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 14.0, 22.0, 27.0, 33.0, 35.0, 64.0, 112.0, 168.0, 228.0, 360.0, 512.0, 842.0, 1307.0, 2104.0, 3298.0, 5192.0, 8411.0, 14035.0, 23373.0, 38006.0, 61430.0, 93142.0, 128271.0, 152090.0, 150744.0, 124570.0, 88632.0, 58383.0, 36039.0, 22086.0, 13382.0, 8056.0, 4998.0, 3038.0, 1966.0, 1197.0, 777.0, 552.0, 328.0, 222.0, 150.0, 123.0, 67.0, 48.0, 35.0, 26.0, 14.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-2.1484375, -2.083221435546875, -2.01800537109375, -1.952789306640625, -1.8875732421875, -1.822357177734375, -1.75714111328125, -1.691925048828125, -1.626708984375, -1.561492919921875, -1.49627685546875, -1.431060791015625, -1.3658447265625, -1.300628662109375, -1.23541259765625, -1.170196533203125, -1.10498046875, -1.039764404296875, -0.97454833984375, -0.909332275390625, -0.8441162109375, -0.778900146484375, -0.71368408203125, -0.648468017578125, -0.583251953125, -0.518035888671875, -0.45281982421875, -0.387603759765625, -0.3223876953125, -0.257171630859375, -0.19195556640625, -0.126739501953125, -0.0615234375, 0.003692626953125, 0.06890869140625, 0.134124755859375, 0.1993408203125, 0.264556884765625, 0.32977294921875, 0.394989013671875, 0.460205078125, 0.525421142578125, 0.59063720703125, 0.655853271484375, 0.7210693359375, 0.786285400390625, 0.85150146484375, 0.916717529296875, 0.98193359375, 1.047149658203125, 1.11236572265625, 1.177581787109375, 1.2427978515625, 1.308013916015625, 1.37322998046875, 1.438446044921875, 1.503662109375, 1.568878173828125, 1.63409423828125, 1.699310302734375, 1.7645263671875, 1.829742431640625, 1.89495849609375, 1.960174560546875, 2.025390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 8.0, 5.0, 8.0, 7.0, 9.0, 7.0, 11.0, 13.0, 18.0, 13.0, 15.0, 23.0, 32.0, 20.0, 35.0, 44.0, 49.0, 44.0, 47.0, 40.0, 47.0, 53.0, 39.0, 45.0, 46.0, 43.0, 45.0, 30.0, 42.0, 22.0, 25.0, 17.0, 19.0, 18.0, 10.0, 12.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.88916015625, -0.86395263671875, -0.8387451171875, -0.81353759765625, -0.788330078125, -0.76312255859375, -0.7379150390625, -0.71270751953125, -0.6875, -0.66229248046875, -0.6370849609375, -0.61187744140625, -0.586669921875, -0.56146240234375, -0.5362548828125, -0.51104736328125, -0.48583984375, -0.46063232421875, -0.4354248046875, -0.41021728515625, -0.385009765625, -0.35980224609375, -0.3345947265625, -0.30938720703125, -0.2841796875, -0.25897216796875, -0.2337646484375, -0.20855712890625, -0.183349609375, -0.15814208984375, -0.1329345703125, -0.10772705078125, -0.08251953125, -0.05731201171875, -0.0321044921875, -0.00689697265625, 0.018310546875, 0.04351806640625, 0.0687255859375, 0.09393310546875, 0.119140625, 0.14434814453125, 0.1695556640625, 0.19476318359375, 0.219970703125, 0.24517822265625, 0.2703857421875, 0.29559326171875, 0.32080078125, 0.34600830078125, 0.3712158203125, 0.39642333984375, 0.421630859375, 0.44683837890625, 0.4720458984375, 0.49725341796875, 0.5224609375, 0.54766845703125, 0.5728759765625, 0.59808349609375, 0.623291015625, 0.64849853515625, 0.6737060546875, 0.69891357421875, 0.72412109375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 13.0, 23.0, 23.0, 18.0, 20.0, 31.0, 27.0, 28.0, 23.0, 28.0, 30.0, 45.0, 36.0, 44.0, 45.0, 43.0, 45.0, 44.0, 40.0, 45.0, 33.0, 49.0, 31.0, 27.0, 22.0, 29.0, 26.0, 16.0, 20.0, 17.0, 3.0, 11.0, 10.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.302363872528076, -3.2079219818115234, -3.1134800910949707, -3.019038200378418, -2.924596071243286, -2.8301541805267334, -2.7357122898101807, -2.641270399093628, -2.546828269958496, -2.4523863792419434, -2.3579444885253906, -2.263502597808838, -2.169060468673706, -2.0746185779571533, -1.9801766872406006, -1.8857347965240479, -1.7912929058074951, -1.6968510150909424, -1.6024090051651, -1.5079671144485474, -1.413525104522705, -1.3190832138061523, -1.2246413230895996, -1.1301994323730469, -1.0357574224472046, -0.9413154721260071, -0.8468735218048096, -0.7524316310882568, -0.6579896807670593, -0.5635477304458618, -0.4691058397293091, -0.3746638894081116, -0.28022170066833496, -0.18577976524829865, -0.09133782982826233, 0.003104090690612793, 0.0975460410118103, 0.1919879913330078, 0.28642988204956055, 0.38087183237075806, 0.47531378269195557, 0.5697557330131531, 0.6641976833343506, 0.7586395740509033, 0.8530815243721008, 0.9475234746932983, 1.041965365409851, 1.1364073753356934, 1.230849266052246, 1.3252911567687988, 1.4197331666946411, 1.5141750574111938, 1.6086170673370361, 1.7030589580535889, 1.7975008487701416, 1.8919427394866943, 1.9863847494125366, 2.080826759338379, 2.1752686500549316, 2.2697105407714844, 2.364152431488037, 2.45859432220459, 2.5530362129211426, 2.6474783420562744, 2.741920232772827]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 11.0, 11.0, 10.0, 13.0, 14.0, 18.0, 23.0, 24.0, 28.0, 28.0, 32.0, 32.0, 26.0, 51.0, 42.0, 41.0, 41.0, 37.0, 44.0, 47.0, 34.0, 29.0, 43.0, 32.0, 30.0, 39.0, 30.0, 30.0, 21.0, 14.0, 16.0, 17.0, 15.0, 18.0, 9.0, 2.0, 10.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.664181709289551, -2.571289300918579, -2.4783968925476074, -2.3855044841766357, -2.292612075805664, -2.1997196674346924, -2.1068272590637207, -2.01393461227417, -1.9210423231124878, -1.8281499147415161, -1.7352575063705444, -1.6423649787902832, -1.5494725704193115, -1.4565801620483398, -1.3636877536773682, -1.2707953453063965, -1.1779029369354248, -1.0850105285644531, -0.9921181201934814, -0.899225652217865, -0.8063332438468933, -0.7134408354759216, -0.6205483675003052, -0.5276559591293335, -0.4347635507583618, -0.34187114238739014, -0.24897870421409607, -0.156086266040802, -0.06319385766983032, 0.029698550701141357, 0.12259101867675781, 0.2154834270477295, 0.30837583541870117, 0.40126824378967285, 0.4941606819629669, 0.587053120136261, 0.6799455285072327, 0.7728379368782043, 0.8657304048538208, 0.9586228132247925, 1.0515152215957642, 1.1444076299667358, 1.2373000383377075, 1.3301925659179688, 1.4230849742889404, 1.515977382659912, 1.6088697910308838, 1.7017621994018555, 1.7946546077728271, 1.8875470161437988, 1.9804394245147705, 2.073331832885742, 2.166224241256714, 2.2591166496276855, 2.3520092964172363, 2.444901466369629, 2.5377941131591797, 2.6306865215301514, 2.723578929901123, 2.8164713382720947, 2.9093637466430664, 3.002256155014038, 3.0951485633850098, 3.1880412101745605, 3.280933380126953]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 13.0, 25.0, 31.0, 42.0, 62.0, 136.0, 215.0, 377.0, 618.0, 1086.0, 1722.0, 3036.0, 5018.0, 8500.0, 14598.0, 24543.0, 41199.0, 69894.0, 114159.0, 185315.0, 285838.0, 412390.0, 531399.0, 593869.0, 560884.0, 454996.0, 326476.0, 217120.0, 135424.0, 83259.0, 49723.0, 29332.0, 17410.0, 10443.0, 6141.0, 3608.0, 2082.0, 1373.0, 757.0, 475.0, 251.0, 164.0, 106.0, 69.0, 40.0, 22.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.6796875, -2.600067138671875, -2.52044677734375, -2.440826416015625, -2.3612060546875, -2.281585693359375, -2.20196533203125, -2.122344970703125, -2.042724609375, -1.963104248046875, -1.88348388671875, -1.803863525390625, -1.7242431640625, -1.644622802734375, -1.56500244140625, -1.485382080078125, -1.40576171875, -1.326141357421875, -1.24652099609375, -1.166900634765625, -1.0872802734375, -1.007659912109375, -0.92803955078125, -0.848419189453125, -0.768798828125, -0.689178466796875, -0.60955810546875, -0.529937744140625, -0.4503173828125, -0.370697021484375, -0.29107666015625, -0.211456298828125, -0.1318359375, -0.052215576171875, 0.02740478515625, 0.107025146484375, 0.1866455078125, 0.266265869140625, 0.34588623046875, 0.425506591796875, 0.505126953125, 0.584747314453125, 0.66436767578125, 0.743988037109375, 0.8236083984375, 0.903228759765625, 0.98284912109375, 1.062469482421875, 1.14208984375, 1.221710205078125, 1.30133056640625, 1.380950927734375, 1.4605712890625, 1.540191650390625, 1.61981201171875, 1.699432373046875, 1.779052734375, 1.858673095703125, 1.93829345703125, 2.017913818359375, 2.0975341796875, 2.177154541015625, 2.25677490234375, 2.336395263671875, 2.416015625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 12.0, 9.0, 17.0, 16.0, 13.0, 21.0, 25.0, 27.0, 27.0, 34.0, 38.0, 32.0, 41.0, 46.0, 37.0, 39.0, 48.0, 33.0, 46.0, 44.0, 40.0, 36.0, 38.0, 38.0, 35.0, 33.0, 23.0, 23.0, 17.0, 14.0, 12.0, 14.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.029296875, -1.95849609375, -1.8876953125, -1.81689453125, -1.74609375, -1.67529296875, -1.6044921875, -1.53369140625, -1.462890625, -1.39208984375, -1.3212890625, -1.25048828125, -1.1796875, -1.10888671875, -1.0380859375, -0.96728515625, -0.896484375, -0.82568359375, -0.7548828125, -0.68408203125, -0.61328125, -0.54248046875, -0.4716796875, -0.40087890625, -0.330078125, -0.25927734375, -0.1884765625, -0.11767578125, -0.046875, 0.02392578125, 0.0947265625, 0.16552734375, 0.236328125, 0.30712890625, 0.3779296875, 0.44873046875, 0.51953125, 0.59033203125, 0.6611328125, 0.73193359375, 0.802734375, 0.87353515625, 0.9443359375, 1.01513671875, 1.0859375, 1.15673828125, 1.2275390625, 1.29833984375, 1.369140625, 1.43994140625, 1.5107421875, 1.58154296875, 1.65234375, 1.72314453125, 1.7939453125, 1.86474609375, 1.935546875, 2.00634765625, 2.0771484375, 2.14794921875, 2.21875, 2.28955078125, 2.3603515625, 2.43115234375, 2.501953125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 33.0, 41.0, 71.0, 126.0, 200.0, 358.0, 611.0, 1054.0, 1768.0, 3103.0, 5271.0, 9154.0, 16049.0, 27037.0, 45753.0, 75324.0, 122266.0, 189562.0, 278947.0, 383194.0, 481017.0, 535683.0, 526642.0, 454338.0, 353029.0, 250271.0, 167287.0, 106250.0, 65386.0, 38969.0, 23369.0, 13525.0, 7743.0, 4542.0, 2602.0, 1592.0, 848.0, 530.0, 286.0, 184.0, 106.0, 70.0, 39.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.511444091796875, -2.43499755859375, -2.358551025390625, -2.2821044921875, -2.205657958984375, -2.12921142578125, -2.052764892578125, -1.976318359375, -1.899871826171875, -1.82342529296875, -1.746978759765625, -1.6705322265625, -1.594085693359375, -1.51763916015625, -1.441192626953125, -1.36474609375, -1.288299560546875, -1.21185302734375, -1.135406494140625, -1.0589599609375, -0.982513427734375, -0.90606689453125, -0.829620361328125, -0.753173828125, -0.676727294921875, -0.60028076171875, -0.523834228515625, -0.4473876953125, -0.370941162109375, -0.29449462890625, -0.218048095703125, -0.1416015625, -0.065155029296875, 0.01129150390625, 0.087738037109375, 0.1641845703125, 0.240631103515625, 0.31707763671875, 0.393524169921875, 0.469970703125, 0.546417236328125, 0.62286376953125, 0.699310302734375, 0.7757568359375, 0.852203369140625, 0.92864990234375, 1.005096435546875, 1.08154296875, 1.157989501953125, 1.23443603515625, 1.310882568359375, 1.3873291015625, 1.463775634765625, 1.54022216796875, 1.616668701171875, 1.693115234375, 1.769561767578125, 1.84600830078125, 1.922454833984375, 1.9989013671875, 2.075347900390625, 2.15179443359375, 2.228240966796875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 12.0, 7.0, 14.0, 20.0, 31.0, 41.0, 40.0, 61.0, 53.0, 82.0, 100.0, 112.0, 117.0, 142.0, 137.0, 182.0, 187.0, 213.0, 232.0, 185.0, 211.0, 206.0, 201.0, 193.0, 172.0, 167.0, 151.0, 115.0, 114.0, 108.0, 93.0, 78.0, 58.0, 52.0, 44.0, 28.0, 33.0, 21.0, 15.0, 16.0, 3.0, 6.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0595703125, -1.0271148681640625, -0.994659423828125, -0.9622039794921875, -0.92974853515625, -0.8972930908203125, -0.864837646484375, -0.8323822021484375, -0.7999267578125, -0.7674713134765625, -0.735015869140625, -0.7025604248046875, -0.67010498046875, -0.6376495361328125, -0.605194091796875, -0.5727386474609375, -0.540283203125, -0.5078277587890625, -0.475372314453125, -0.4429168701171875, -0.41046142578125, -0.3780059814453125, -0.345550537109375, -0.3130950927734375, -0.2806396484375, -0.2481842041015625, -0.215728759765625, -0.1832733154296875, -0.15081787109375, -0.1183624267578125, -0.085906982421875, -0.0534515380859375, -0.02099609375, 0.0114593505859375, 0.043914794921875, 0.0763702392578125, 0.10882568359375, 0.1412811279296875, 0.173736572265625, 0.2061920166015625, 0.2386474609375, 0.2711029052734375, 0.303558349609375, 0.3360137939453125, 0.36846923828125, 0.4009246826171875, 0.433380126953125, 0.4658355712890625, 0.498291015625, 0.5307464599609375, 0.563201904296875, 0.5956573486328125, 0.62811279296875, 0.6605682373046875, 0.693023681640625, 0.7254791259765625, 0.7579345703125, 0.7903900146484375, 0.822845458984375, 0.8553009033203125, 0.88775634765625, 0.9202117919921875, 0.952667236328125, 0.9851226806640625, 1.017578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 6.0, 10.0, 7.0, 16.0, 17.0, 23.0, 23.0, 32.0, 34.0, 28.0, 41.0, 36.0, 40.0, 53.0, 62.0, 46.0, 46.0, 54.0, 47.0, 53.0, 45.0, 38.0, 36.0, 33.0, 31.0, 23.0, 21.0, 12.0, 14.0, 17.0, 14.0, 5.0, 8.0, 9.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3508079051971436, -3.2532224655151367, -3.155637264251709, -3.0580520629882812, -2.9604666233062744, -2.8628811836242676, -2.76529598236084, -2.667710781097412, -2.5701253414154053, -2.4725399017333984, -2.3749547004699707, -2.277369499206543, -2.179784059524536, -2.0821986198425293, -1.9846134185791016, -1.8870280981063843, -1.789442777633667, -1.6918574571609497, -1.5942721366882324, -1.4966868162155151, -1.3991014957427979, -1.3015161752700806, -1.2039308547973633, -1.106345534324646, -1.0087602138519287, -0.9111748933792114, -0.8135895729064941, -0.7160042524337769, -0.6184189319610596, -0.5208336114883423, -0.423248291015625, -0.3256629705429077, -0.22807741165161133, -0.13049209117889404, -0.03290677070617676, 0.06467854976654053, 0.1622638702392578, 0.2598491907119751, 0.3574345111846924, 0.45501983165740967, 0.552605152130127, 0.6501904726028442, 0.7477757930755615, 0.8453611135482788, 0.9429464340209961, 1.0405317544937134, 1.1381170749664307, 1.235702395439148, 1.3332877159118652, 1.4308730363845825, 1.5284583568572998, 1.626043677330017, 1.7236289978027344, 1.8212143182754517, 1.918799638748169, 2.016385078430176, 2.1139702796936035, 2.2115554809570312, 2.309140920639038, 2.406726360321045, 2.5043115615844727, 2.6018967628479004, 2.6994822025299072, 2.797067642211914, 2.894652843475342]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 2.0, 3.0, 6.0, 16.0, 14.0, 8.0, 16.0, 30.0, 23.0, 27.0, 27.0, 28.0, 34.0, 26.0, 32.0, 49.0, 49.0, 48.0, 42.0, 41.0, 34.0, 30.0, 39.0, 29.0, 39.0, 40.0, 33.0, 30.0, 30.0, 26.0, 18.0, 25.0, 19.0, 17.0, 12.0, 8.0, 6.0, 12.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.750286102294922, -2.670217990875244, -2.5901501178741455, -2.5100820064544678, -2.430014133453369, -2.3499460220336914, -2.2698781490325928, -2.189810037612915, -2.1097421646118164, -2.0296740531921387, -1.94960618019104, -1.8695381879806519, -1.7894701957702637, -1.7094022035598755, -1.6293342113494873, -1.5492660999298096, -1.4691981077194214, -1.3891301155090332, -1.309062123298645, -1.2289941310882568, -1.1489261388778687, -1.0688581466674805, -0.9887900948524475, -0.9087221026420593, -0.8286541104316711, -0.748586118221283, -0.6685181260108948, -0.5884500741958618, -0.5083820819854736, -0.42831411957740784, -0.34824609756469727, -0.2681781053543091, -0.1881101131439209, -0.10804211348295212, -0.027974113821983337, 0.05209389328956604, 0.13216188549995422, 0.2122298777103424, 0.292297899723053, 0.37236589193344116, 0.45243388414382935, 0.5325018763542175, 0.6125698685646057, 0.6926379203796387, 0.7727059125900269, 0.852773904800415, 0.9328418970108032, 1.0129098892211914, 1.0929778814315796, 1.1730458736419678, 1.253113865852356, 1.3331818580627441, 1.4132498502731323, 1.4933178424835205, 1.5733859539031982, 1.6534538269042969, 1.7335219383239746, 1.8135899305343628, 1.893657922744751, 1.9737259149551392, 2.0537939071655273, 2.133862018585205, 2.2139298915863037, 2.2939980030059814, 2.37406587600708]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 17.0, 27.0, 25.0, 36.0, 45.0, 76.0, 119.0, 178.0, 251.0, 441.0, 734.0, 1246.0, 2374.0, 4394.0, 8666.0, 18709.0, 39206.0, 83009.0, 169491.0, 265414.0, 223873.0, 120114.0, 57149.0, 26871.0, 12506.0, 6161.0, 3138.0, 1664.0, 974.0, 584.0, 362.0, 238.0, 150.0, 97.0, 69.0, 48.0, 28.0, 13.0, 7.0, 12.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.46484375, -2.38720703125, -2.3095703125, -2.23193359375, -2.154296875, -2.07666015625, -1.9990234375, -1.92138671875, -1.84375, -1.76611328125, -1.6884765625, -1.61083984375, -1.533203125, -1.45556640625, -1.3779296875, -1.30029296875, -1.22265625, -1.14501953125, -1.0673828125, -0.98974609375, -0.912109375, -0.83447265625, -0.7568359375, -0.67919921875, -0.6015625, -0.52392578125, -0.4462890625, -0.36865234375, -0.291015625, -0.21337890625, -0.1357421875, -0.05810546875, 0.01953125, 0.09716796875, 0.1748046875, 0.25244140625, 0.330078125, 0.40771484375, 0.4853515625, 0.56298828125, 0.640625, 0.71826171875, 0.7958984375, 0.87353515625, 0.951171875, 1.02880859375, 1.1064453125, 1.18408203125, 1.26171875, 1.33935546875, 1.4169921875, 1.49462890625, 1.572265625, 1.64990234375, 1.7275390625, 1.80517578125, 1.8828125, 1.96044921875, 2.0380859375, 2.11572265625, 2.193359375, 2.27099609375, 2.3486328125, 2.42626953125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 5.0, 11.0, 6.0, 12.0, 16.0, 10.0, 20.0, 22.0, 24.0, 18.0, 18.0, 39.0, 33.0, 39.0, 35.0, 38.0, 45.0, 44.0, 39.0, 40.0, 39.0, 38.0, 31.0, 32.0, 40.0, 35.0, 28.0, 23.0, 30.0, 33.0, 31.0, 19.0, 12.0, 15.0, 13.0, 10.0, 12.0, 11.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71484375, -2.633209228515625, -2.55157470703125, -2.469940185546875, -2.3883056640625, -2.306671142578125, -2.22503662109375, -2.143402099609375, -2.061767578125, -1.980133056640625, -1.89849853515625, -1.816864013671875, -1.7352294921875, -1.653594970703125, -1.57196044921875, -1.490325927734375, -1.40869140625, -1.327056884765625, -1.24542236328125, -1.163787841796875, -1.0821533203125, -1.000518798828125, -0.91888427734375, -0.837249755859375, -0.755615234375, -0.673980712890625, -0.59234619140625, -0.510711669921875, -0.4290771484375, -0.347442626953125, -0.26580810546875, -0.184173583984375, -0.1025390625, -0.020904541015625, 0.06072998046875, 0.142364501953125, 0.2239990234375, 0.305633544921875, 0.38726806640625, 0.468902587890625, 0.550537109375, 0.632171630859375, 0.71380615234375, 0.795440673828125, 0.8770751953125, 0.958709716796875, 1.04034423828125, 1.121978759765625, 1.20361328125, 1.285247802734375, 1.36688232421875, 1.448516845703125, 1.5301513671875, 1.611785888671875, 1.69342041015625, 1.775054931640625, 1.856689453125, 1.938323974609375, 2.01995849609375, 2.101593017578125, 2.1832275390625, 2.264862060546875, 2.34649658203125, 2.428131103515625, 2.509765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 22.0, 25.0, 37.0, 51.0, 73.0, 114.0, 174.0, 279.0, 396.0, 624.0, 976.0, 1635.0, 2886.0, 5246.0, 9743.0, 19743.0, 41563.0, 89975.0, 191591.0, 294144.0, 203112.0, 96953.0, 44387.0, 21044.0, 10648.0, 5398.0, 2984.0, 1767.0, 1083.0, 633.0, 440.0, 234.0, 206.0, 118.0, 64.0, 58.0, 33.0, 26.0, 17.0, 11.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.669525146484375, -1.60662841796875, -1.543731689453125, -1.4808349609375, -1.417938232421875, -1.35504150390625, -1.292144775390625, -1.229248046875, -1.166351318359375, -1.10345458984375, -1.040557861328125, -0.9776611328125, -0.914764404296875, -0.85186767578125, -0.788970947265625, -0.72607421875, -0.663177490234375, -0.60028076171875, -0.537384033203125, -0.4744873046875, -0.411590576171875, -0.34869384765625, -0.285797119140625, -0.222900390625, -0.160003662109375, -0.09710693359375, -0.034210205078125, 0.0286865234375, 0.091583251953125, 0.15447998046875, 0.217376708984375, 0.2802734375, 0.343170166015625, 0.40606689453125, 0.468963623046875, 0.5318603515625, 0.594757080078125, 0.65765380859375, 0.720550537109375, 0.783447265625, 0.846343994140625, 0.90924072265625, 0.972137451171875, 1.0350341796875, 1.097930908203125, 1.16082763671875, 1.223724365234375, 1.28662109375, 1.349517822265625, 1.41241455078125, 1.475311279296875, 1.5382080078125, 1.601104736328125, 1.66400146484375, 1.726898193359375, 1.789794921875, 1.852691650390625, 1.91558837890625, 1.978485107421875, 2.0413818359375, 2.104278564453125, 2.16717529296875, 2.230072021484375, 2.29296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 3.0, 6.0, 11.0, 9.0, 17.0, 15.0, 16.0, 20.0, 30.0, 27.0, 36.0, 38.0, 31.0, 44.0, 39.0, 42.0, 46.0, 48.0, 46.0, 35.0, 44.0, 41.0, 36.0, 32.0, 30.0, 41.0, 27.0, 29.0, 22.0, 22.0, 16.0, 19.0, 11.0, 14.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.61602783203125, -1.5562744140625, -1.49652099609375, -1.436767578125, -1.37701416015625, -1.3172607421875, -1.25750732421875, -1.19775390625, -1.13800048828125, -1.0782470703125, -1.01849365234375, -0.958740234375, -0.89898681640625, -0.8392333984375, -0.77947998046875, -0.7197265625, -0.65997314453125, -0.6002197265625, -0.54046630859375, -0.480712890625, -0.42095947265625, -0.3612060546875, -0.30145263671875, -0.24169921875, -0.18194580078125, -0.1221923828125, -0.06243896484375, -0.002685546875, 0.05706787109375, 0.1168212890625, 0.17657470703125, 0.236328125, 0.29608154296875, 0.3558349609375, 0.41558837890625, 0.475341796875, 0.53509521484375, 0.5948486328125, 0.65460205078125, 0.71435546875, 0.77410888671875, 0.8338623046875, 0.89361572265625, 0.953369140625, 1.01312255859375, 1.0728759765625, 1.13262939453125, 1.1923828125, 1.25213623046875, 1.3118896484375, 1.37164306640625, 1.431396484375, 1.49114990234375, 1.5509033203125, 1.61065673828125, 1.67041015625, 1.73016357421875, 1.7899169921875, 1.84967041015625, 1.909423828125, 1.96917724609375, 2.0289306640625, 2.08868408203125, 2.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 14.0, 16.0, 23.0, 17.0, 20.0, 37.0, 44.0, 53.0, 71.0, 87.0, 132.0, 177.0, 209.0, 313.0, 436.0, 599.0, 1003.0, 1487.0, 2583.0, 4692.0, 10438.0, 31674.0, 187744.0, 665094.0, 101128.0, 22067.0, 8155.0, 3914.0, 2080.0, 1276.0, 855.0, 547.0, 417.0, 290.0, 186.0, 156.0, 113.0, 98.0, 61.0, 51.0, 48.0, 38.0, 19.0, 16.0, 16.0, 10.0, 11.0, 10.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.28515625, -2.2122802734375, -2.139404296875, -2.0665283203125, -1.99365234375, -1.9207763671875, -1.847900390625, -1.7750244140625, -1.7021484375, -1.6292724609375, -1.556396484375, -1.4835205078125, -1.41064453125, -1.3377685546875, -1.264892578125, -1.1920166015625, -1.119140625, -1.0462646484375, -0.973388671875, -0.9005126953125, -0.82763671875, -0.7547607421875, -0.681884765625, -0.6090087890625, -0.5361328125, -0.4632568359375, -0.390380859375, -0.3175048828125, -0.24462890625, -0.1717529296875, -0.098876953125, -0.0260009765625, 0.046875, 0.1197509765625, 0.192626953125, 0.2655029296875, 0.33837890625, 0.4112548828125, 0.484130859375, 0.5570068359375, 0.6298828125, 0.7027587890625, 0.775634765625, 0.8485107421875, 0.92138671875, 0.9942626953125, 1.067138671875, 1.1400146484375, 1.212890625, 1.2857666015625, 1.358642578125, 1.4315185546875, 1.50439453125, 1.5772705078125, 1.650146484375, 1.7230224609375, 1.7958984375, 1.8687744140625, 1.941650390625, 2.0145263671875, 2.08740234375, 2.1602783203125, 2.233154296875, 2.3060302734375, 2.37890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 14.0, 16.0, 26.0, 52.0, 55.0, 113.0, 118.0, 114.0, 126.0, 92.0, 86.0, 44.0, 35.0, 16.0, 10.0, 12.0, 11.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00014328956604003906, -0.00013889558613300323, -0.0001345016062259674, -0.00013010762631893158, -0.00012571364641189575, -0.00012131966650485992, -0.0001169256865978241, -0.00011253170669078827, -0.00010813772678375244, -0.00010374374687671661, -9.934976696968079e-05, -9.495578706264496e-05, -9.056180715560913e-05, -8.61678272485733e-05, -8.177384734153748e-05, -7.737986743450165e-05, -7.298588752746582e-05, -6.859190762042999e-05, -6.419792771339417e-05, -5.980394780635834e-05, -5.540996789932251e-05, -5.101598799228668e-05, -4.6622008085250854e-05, -4.222802817821503e-05, -3.78340482711792e-05, -3.344006836414337e-05, -2.9046088457107544e-05, -2.4652108550071716e-05, -2.025812864303589e-05, -1.586414873600006e-05, -1.1470168828964233e-05, -7.076188921928406e-06, -2.682209014892578e-06, 1.7117708921432495e-06, 6.105750799179077e-06, 1.0499730706214905e-05, 1.4893710613250732e-05, 1.928769052028656e-05, 2.3681670427322388e-05, 2.8075650334358215e-05, 3.246963024139404e-05, 3.686361014842987e-05, 4.12575900554657e-05, 4.5651569962501526e-05, 5.0045549869537354e-05, 5.443952977657318e-05, 5.883350968360901e-05, 6.322748959064484e-05, 6.762146949768066e-05, 7.201544940471649e-05, 7.640942931175232e-05, 8.080340921878815e-05, 8.519738912582397e-05, 8.95913690328598e-05, 9.398534893989563e-05, 9.837932884693146e-05, 0.00010277330875396729, 0.00010716728866100311, 0.00011156126856803894, 0.00011595524847507477, 0.0001203492283821106, 0.00012474320828914642, 0.00012913718819618225, 0.00013353116810321808, 0.0001379251480102539]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 13.0, 16.0, 17.0, 37.0, 36.0, 42.0, 64.0, 103.0, 157.0, 179.0, 245.0, 329.0, 498.0, 680.0, 924.0, 1231.0, 1853.0, 2985.0, 4684.0, 8207.0, 17532.0, 44549.0, 130059.0, 336648.0, 308034.0, 113843.0, 39050.0, 15756.0, 7590.0, 4355.0, 2657.0, 1758.0, 1201.0, 914.0, 620.0, 461.0, 338.0, 223.0, 175.0, 137.0, 94.0, 72.0, 66.0, 31.0, 20.0, 17.0, 18.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.455291748046875, -1.40667724609375, -1.358062744140625, -1.3094482421875, -1.260833740234375, -1.21221923828125, -1.163604736328125, -1.114990234375, -1.066375732421875, -1.01776123046875, -0.969146728515625, -0.9205322265625, -0.871917724609375, -0.82330322265625, -0.774688720703125, -0.72607421875, -0.677459716796875, -0.62884521484375, -0.580230712890625, -0.5316162109375, -0.483001708984375, -0.43438720703125, -0.385772705078125, -0.337158203125, -0.288543701171875, -0.23992919921875, -0.191314697265625, -0.1427001953125, -0.094085693359375, -0.04547119140625, 0.003143310546875, 0.0517578125, 0.100372314453125, 0.14898681640625, 0.197601318359375, 0.2462158203125, 0.294830322265625, 0.34344482421875, 0.392059326171875, 0.440673828125, 0.489288330078125, 0.53790283203125, 0.586517333984375, 0.6351318359375, 0.683746337890625, 0.73236083984375, 0.780975341796875, 0.82958984375, 0.878204345703125, 0.92681884765625, 0.975433349609375, 1.0240478515625, 1.072662353515625, 1.12127685546875, 1.169891357421875, 1.218505859375, 1.267120361328125, 1.31573486328125, 1.364349365234375, 1.4129638671875, 1.461578369140625, 1.51019287109375, 1.558807373046875, 1.607421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 5.0, 13.0, 12.0, 10.0, 28.0, 20.0, 31.0, 44.0, 63.0, 68.0, 76.0, 105.0, 103.0, 76.0, 69.0, 56.0, 45.0, 39.0, 21.0, 18.0, 13.0, 12.0, 11.0, 7.0, 2.0, 2.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.365966796875, -0.3542289733886719, -0.34249114990234375, -0.3307533264160156, -0.3190155029296875, -0.3072776794433594, -0.29553985595703125, -0.2838020324707031, -0.272064208984375, -0.2603263854980469, -0.24858856201171875, -0.23685073852539062, -0.2251129150390625, -0.21337509155273438, -0.20163726806640625, -0.18989944458007812, -0.17816162109375, -0.16642379760742188, -0.15468597412109375, -0.14294815063476562, -0.1312103271484375, -0.11947250366210938, -0.10773468017578125, -0.09599685668945312, -0.084259033203125, -0.07252120971679688, -0.06078338623046875, -0.049045562744140625, -0.0373077392578125, -0.025569915771484375, -0.01383209228515625, -0.002094268798828125, 0.0096435546875, 0.021381378173828125, 0.03311920166015625, 0.044857025146484375, 0.0565948486328125, 0.06833267211914062, 0.08007049560546875, 0.09180831909179688, 0.103546142578125, 0.11528396606445312, 0.12702178955078125, 0.13875961303710938, 0.1504974365234375, 0.16223526000976562, 0.17397308349609375, 0.18571090698242188, 0.19744873046875, 0.20918655395507812, 0.22092437744140625, 0.23266220092773438, 0.2444000244140625, 0.2561378479003906, 0.26787567138671875, 0.2796134948730469, 0.291351318359375, 0.3030891418457031, 0.31482696533203125, 0.3265647888183594, 0.3383026123046875, 0.3500404357910156, 0.36177825927734375, 0.3735160827636719, 0.38525390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 10.0, 18.0, 20.0, 12.0, 20.0, 32.0, 27.0, 27.0, 31.0, 30.0, 33.0, 56.0, 55.0, 62.0, 51.0, 46.0, 54.0, 43.0, 46.0, 46.0, 42.0, 39.0, 26.0, 31.0, 34.0, 20.0, 9.0, 12.0, 13.0, 16.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265214204788208, -3.1674351692199707, -3.0696561336517334, -2.971877098083496, -2.874098062515259, -2.7763190269470215, -2.678539991378784, -2.580760955810547, -2.4829819202423096, -2.3852028846740723, -2.287423849105835, -2.1896448135375977, -2.0918657779693604, -1.994086742401123, -1.8963077068328857, -1.7985286712646484, -1.7007497549057007, -1.6029707193374634, -1.505191683769226, -1.4074126482009888, -1.3096336126327515, -1.2118545770645142, -1.1140756607055664, -1.016296625137329, -0.918517529964447, -0.8207384943962097, -0.7229594588279724, -0.6251804828643799, -0.5274014472961426, -0.4296223819255829, -0.33184337615966797, -0.23406434059143066, -0.13628530502319336, -0.03850627690553665, 0.059272751212120056, 0.15705177187919617, 0.25483080744743347, 0.3526098430156708, 0.4503888487815857, 0.548167884349823, 0.6459469199180603, 0.7437259554862976, 0.8415049910545349, 0.9392839670181274, 1.0370630025863647, 1.134842038154602, 1.2326210737228394, 1.3304001092910767, 1.428179144859314, 1.5259581804275513, 1.6237372159957886, 1.7215162515640259, 1.8192952871322632, 1.9170743227005005, 2.0148532390594482, 2.1126322746276855, 2.210411310195923, 2.30819034576416, 2.4059693813323975, 2.5037484169006348, 2.601527452468872, 2.6993064880371094, 2.7970855236053467, 2.894864559173584, 2.9926435947418213]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 7.0, 13.0, 12.0, 11.0, 18.0, 20.0, 30.0, 31.0, 23.0, 27.0, 25.0, 28.0, 39.0, 48.0, 48.0, 38.0, 34.0, 45.0, 48.0, 28.0, 33.0, 31.0, 35.0, 38.0, 35.0, 30.0, 23.0, 36.0, 20.0, 23.0, 19.0, 19.0, 16.0, 10.0, 4.0, 12.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.642449140548706, -2.5643460750579834, -2.4862427711486816, -2.408139705657959, -2.3300366401672363, -2.2519335746765137, -2.173830270767212, -2.0957272052764893, -2.0176239013671875, -1.9395207166671753, -1.8614176511764526, -1.7833144664764404, -1.7052114009857178, -1.6271082162857056, -1.5490050315856934, -1.4709019660949707, -1.392798900604248, -1.3146957159042358, -1.2365926504135132, -1.158489465713501, -1.0803864002227783, -1.0022832155227661, -0.9241800308227539, -0.8460769057273865, -0.767973780632019, -0.6898706555366516, -0.6117675304412842, -0.533664345741272, -0.45556122064590454, -0.3774580955505371, -0.2993549406528473, -0.22125178575515747, -0.14314889907836914, -0.06504575908184052, 0.01305738091468811, 0.09116052091121674, 0.16926366090774536, 0.2473667860031128, 0.3254699409008026, 0.40357309579849243, 0.48167622089385986, 0.5597793459892273, 0.6378824710845947, 0.7159856557846069, 0.7940887808799744, 0.8721919059753418, 0.950295090675354, 1.0283982753753662, 1.1065013408660889, 1.184604525566101, 1.2627075910568237, 1.340810775756836, 1.4189138412475586, 1.4970170259475708, 1.575120210647583, 1.6532232761383057, 1.7313264608383179, 1.80942964553833, 1.8875327110290527, 1.965635895729065, 2.043739080429077, 2.1218421459198, 2.1999452114105225, 2.278048515319824, 2.356151580810547]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 13.0, 17.0, 37.0, 36.0, 61.0, 97.0, 158.0, 210.0, 363.0, 574.0, 894.0, 1542.0, 2436.0, 3994.0, 6380.0, 9952.0, 15611.0, 23825.0, 35609.0, 51795.0, 70984.0, 91955.0, 110038.0, 119786.0, 117408.0, 104729.0, 84257.0, 63918.0, 45160.0, 30615.0, 20240.0, 13445.0, 8208.0, 5314.0, 3329.0, 2143.0, 1316.0, 769.0, 509.0, 328.0, 169.0, 115.0, 80.0, 53.0, 33.0, 24.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.826171875, -2.74005126953125, -2.6539306640625, -2.56781005859375, -2.481689453125, -2.39556884765625, -2.3094482421875, -2.22332763671875, -2.13720703125, -2.05108642578125, -1.9649658203125, -1.87884521484375, -1.792724609375, -1.70660400390625, -1.6204833984375, -1.53436279296875, -1.4482421875, -1.36212158203125, -1.2760009765625, -1.18988037109375, -1.103759765625, -1.01763916015625, -0.9315185546875, -0.84539794921875, -0.75927734375, -0.67315673828125, -0.5870361328125, -0.50091552734375, -0.414794921875, -0.32867431640625, -0.2425537109375, -0.15643310546875, -0.0703125, 0.01580810546875, 0.1019287109375, 0.18804931640625, 0.274169921875, 0.36029052734375, 0.4464111328125, 0.53253173828125, 0.61865234375, 0.70477294921875, 0.7908935546875, 0.87701416015625, 0.963134765625, 1.04925537109375, 1.1353759765625, 1.22149658203125, 1.3076171875, 1.39373779296875, 1.4798583984375, 1.56597900390625, 1.652099609375, 1.73822021484375, 1.8243408203125, 1.91046142578125, 1.99658203125, 2.08270263671875, 2.1688232421875, 2.25494384765625, 2.341064453125, 2.42718505859375, 2.5133056640625, 2.59942626953125, 2.685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 10.0, 4.0, 16.0, 14.0, 17.0, 22.0, 17.0, 27.0, 27.0, 36.0, 32.0, 32.0, 35.0, 45.0, 32.0, 44.0, 47.0, 34.0, 37.0, 38.0, 48.0, 36.0, 38.0, 23.0, 34.0, 35.0, 21.0, 23.0, 29.0, 19.0, 24.0, 22.0, 14.0, 10.0, 10.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.6484375, -2.57012939453125, -2.4918212890625, -2.41351318359375, -2.335205078125, -2.25689697265625, -2.1785888671875, -2.10028076171875, -2.02197265625, -1.94366455078125, -1.8653564453125, -1.78704833984375, -1.708740234375, -1.63043212890625, -1.5521240234375, -1.47381591796875, -1.3955078125, -1.31719970703125, -1.2388916015625, -1.16058349609375, -1.082275390625, -1.00396728515625, -0.9256591796875, -0.84735107421875, -0.76904296875, -0.69073486328125, -0.6124267578125, -0.53411865234375, -0.455810546875, -0.37750244140625, -0.2991943359375, -0.22088623046875, -0.142578125, -0.06427001953125, 0.0140380859375, 0.09234619140625, 0.170654296875, 0.24896240234375, 0.3272705078125, 0.40557861328125, 0.48388671875, 0.56219482421875, 0.6405029296875, 0.71881103515625, 0.797119140625, 0.87542724609375, 0.9537353515625, 1.03204345703125, 1.1103515625, 1.18865966796875, 1.2669677734375, 1.34527587890625, 1.423583984375, 1.50189208984375, 1.5802001953125, 1.65850830078125, 1.73681640625, 1.81512451171875, 1.8934326171875, 1.97174072265625, 2.050048828125, 2.12835693359375, 2.2066650390625, 2.28497314453125, 2.36328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 13.0, 13.0, 10.0, 16.0, 33.0, 48.0, 86.0, 86.0, 128.0, 190.0, 325.0, 462.0, 739.0, 1079.0, 1589.0, 2474.0, 3640.0, 5332.0, 8377.0, 12243.0, 18133.0, 26326.0, 37081.0, 51792.0, 67703.0, 84323.0, 98260.0, 107617.0, 107504.0, 98450.0, 83229.0, 66027.0, 49940.0, 36218.0, 25937.0, 17412.0, 11973.0, 8121.0, 5262.0, 3438.0, 2274.0, 1558.0, 1041.0, 623.0, 485.0, 303.0, 195.0, 132.0, 107.0, 71.0, 59.0, 28.0, 10.0, 20.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0], "bins": [-2.330078125, -2.257171630859375, -2.18426513671875, -2.111358642578125, -2.0384521484375, -1.965545654296875, -1.89263916015625, -1.819732666015625, -1.746826171875, -1.673919677734375, -1.60101318359375, -1.528106689453125, -1.4552001953125, -1.382293701171875, -1.30938720703125, -1.236480712890625, -1.16357421875, -1.090667724609375, -1.01776123046875, -0.944854736328125, -0.8719482421875, -0.799041748046875, -0.72613525390625, -0.653228759765625, -0.580322265625, -0.507415771484375, -0.43450927734375, -0.361602783203125, -0.2886962890625, -0.215789794921875, -0.14288330078125, -0.069976806640625, 0.0029296875, 0.075836181640625, 0.14874267578125, 0.221649169921875, 0.2945556640625, 0.367462158203125, 0.44036865234375, 0.513275146484375, 0.586181640625, 0.659088134765625, 0.73199462890625, 0.804901123046875, 0.8778076171875, 0.950714111328125, 1.02362060546875, 1.096527099609375, 1.16943359375, 1.242340087890625, 1.31524658203125, 1.388153076171875, 1.4610595703125, 1.533966064453125, 1.60687255859375, 1.679779052734375, 1.752685546875, 1.825592041015625, 1.89849853515625, 1.971405029296875, 2.0443115234375, 2.117218017578125, 2.19012451171875, 2.263031005859375, 2.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 5.0, 5.0, 9.0, 9.0, 7.0, 16.0, 14.0, 11.0, 17.0, 21.0, 25.0, 20.0, 33.0, 26.0, 38.0, 35.0, 40.0, 32.0, 32.0, 40.0, 45.0, 37.0, 50.0, 38.0, 28.0, 30.0, 33.0, 30.0, 29.0, 17.0, 20.0, 22.0, 18.0, 20.0, 20.0, 26.0, 12.0, 13.0, 14.0, 13.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.43359375, -1.387115478515625, -1.34063720703125, -1.294158935546875, -1.2476806640625, -1.201202392578125, -1.15472412109375, -1.108245849609375, -1.061767578125, -1.015289306640625, -0.96881103515625, -0.922332763671875, -0.8758544921875, -0.829376220703125, -0.78289794921875, -0.736419677734375, -0.68994140625, -0.643463134765625, -0.59698486328125, -0.550506591796875, -0.5040283203125, -0.457550048828125, -0.41107177734375, -0.364593505859375, -0.318115234375, -0.271636962890625, -0.22515869140625, -0.178680419921875, -0.1322021484375, -0.085723876953125, -0.03924560546875, 0.007232666015625, 0.0537109375, 0.100189208984375, 0.14666748046875, 0.193145751953125, 0.2396240234375, 0.286102294921875, 0.33258056640625, 0.379058837890625, 0.425537109375, 0.472015380859375, 0.51849365234375, 0.564971923828125, 0.6114501953125, 0.657928466796875, 0.70440673828125, 0.750885009765625, 0.79736328125, 0.843841552734375, 0.89031982421875, 0.936798095703125, 0.9832763671875, 1.029754638671875, 1.07623291015625, 1.122711181640625, 1.169189453125, 1.215667724609375, 1.26214599609375, 1.308624267578125, 1.3551025390625, 1.401580810546875, 1.44805908203125, 1.494537353515625, 1.541015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 20.0, 28.0, 47.0, 56.0, 70.0, 116.0, 175.0, 244.0, 368.0, 528.0, 736.0, 1116.0, 1884.0, 3040.0, 5412.0, 9753.0, 19544.0, 43548.0, 100710.0, 209204.0, 280337.0, 198141.0, 92559.0, 40248.0, 18322.0, 9207.0, 5009.0, 2899.0, 1810.0, 1038.0, 726.0, 498.0, 348.0, 254.0, 167.0, 114.0, 81.0, 52.0, 31.0, 21.0, 22.0, 13.0, 16.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.954742431640625, -2.85089111328125, -2.747039794921875, -2.6431884765625, -2.539337158203125, -2.43548583984375, -2.331634521484375, -2.227783203125, -2.123931884765625, -2.02008056640625, -1.916229248046875, -1.8123779296875, -1.708526611328125, -1.60467529296875, -1.500823974609375, -1.39697265625, -1.293121337890625, -1.18927001953125, -1.085418701171875, -0.9815673828125, -0.877716064453125, -0.77386474609375, -0.670013427734375, -0.566162109375, -0.462310791015625, -0.35845947265625, -0.254608154296875, -0.1507568359375, -0.046905517578125, 0.05694580078125, 0.160797119140625, 0.2646484375, 0.368499755859375, 0.47235107421875, 0.576202392578125, 0.6800537109375, 0.783905029296875, 0.88775634765625, 0.991607666015625, 1.095458984375, 1.199310302734375, 1.30316162109375, 1.407012939453125, 1.5108642578125, 1.614715576171875, 1.71856689453125, 1.822418212890625, 1.92626953125, 2.030120849609375, 2.13397216796875, 2.237823486328125, 2.3416748046875, 2.445526123046875, 2.54937744140625, 2.653228759765625, 2.757080078125, 2.860931396484375, 2.96478271484375, 3.068634033203125, 3.1724853515625, 3.276336669921875, 3.38018798828125, 3.484039306640625, 3.587890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 6.0, 14.0, 8.0, 20.0, 38.0, 64.0, 75.0, 109.0, 111.0, 107.0, 124.0, 91.0, 65.0, 52.0, 33.0, 23.0, 20.0, 4.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004410743713378906, -0.0004278421401977539, -0.0004146099090576172, -0.00040137767791748047, -0.00038814544677734375, -0.00037491321563720703, -0.0003616809844970703, -0.0003484487533569336, -0.0003352165222167969, -0.00032198429107666016, -0.00030875205993652344, -0.0002955198287963867, -0.00028228759765625, -0.0002690553665161133, -0.00025582313537597656, -0.00024259090423583984, -0.00022935867309570312, -0.0002161264419555664, -0.0002028942108154297, -0.00018966197967529297, -0.00017642974853515625, -0.00016319751739501953, -0.0001499652862548828, -0.0001367330551147461, -0.00012350082397460938, -0.00011026859283447266, -9.703636169433594e-05, -8.380413055419922e-05, -7.05718994140625e-05, -5.733966827392578e-05, -4.410743713378906e-05, -3.0875205993652344e-05, -1.7642974853515625e-05, -4.410743713378906e-06, 8.821487426757812e-06, 2.205371856689453e-05, 3.528594970703125e-05, 4.851818084716797e-05, 6.175041198730469e-05, 7.49826431274414e-05, 8.821487426757812e-05, 0.00010144710540771484, 0.00011467933654785156, 0.00012791156768798828, 0.000141143798828125, 0.00015437602996826172, 0.00016760826110839844, 0.00018084049224853516, 0.00019407272338867188, 0.0002073049545288086, 0.0002205371856689453, 0.00023376941680908203, 0.00024700164794921875, 0.00026023387908935547, 0.0002734661102294922, 0.0002866983413696289, 0.0002999305725097656, 0.00031316280364990234, 0.00032639503479003906, 0.0003396272659301758, 0.0003528594970703125, 0.0003660917282104492, 0.00037932395935058594, 0.00039255619049072266, 0.0004057884216308594]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 7.0, 16.0, 21.0, 36.0, 39.0, 55.0, 59.0, 115.0, 178.0, 278.0, 408.0, 621.0, 940.0, 1536.0, 2281.0, 3789.0, 6237.0, 10406.0, 18017.0, 30099.0, 50877.0, 83858.0, 126549.0, 163657.0, 169286.0, 138581.0, 94878.0, 58745.0, 35242.0, 20592.0, 11919.0, 7235.0, 4366.0, 2700.0, 1789.0, 1070.0, 684.0, 459.0, 290.0, 195.0, 135.0, 99.0, 58.0, 51.0, 29.0, 20.0, 16.0, 6.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.78515625, -1.7278289794921875, -1.670501708984375, -1.6131744384765625, -1.55584716796875, -1.4985198974609375, -1.441192626953125, -1.3838653564453125, -1.3265380859375, -1.2692108154296875, -1.211883544921875, -1.1545562744140625, -1.09722900390625, -1.0399017333984375, -0.982574462890625, -0.9252471923828125, -0.867919921875, -0.8105926513671875, -0.753265380859375, -0.6959381103515625, -0.63861083984375, -0.5812835693359375, -0.523956298828125, -0.4666290283203125, -0.4093017578125, -0.3519744873046875, -0.294647216796875, -0.2373199462890625, -0.17999267578125, -0.1226654052734375, -0.065338134765625, -0.0080108642578125, 0.04931640625, 0.1066436767578125, 0.163970947265625, 0.2212982177734375, 0.27862548828125, 0.3359527587890625, 0.393280029296875, 0.4506072998046875, 0.5079345703125, 0.5652618408203125, 0.622589111328125, 0.6799163818359375, 0.73724365234375, 0.7945709228515625, 0.851898193359375, 0.9092254638671875, 0.966552734375, 1.0238800048828125, 1.081207275390625, 1.1385345458984375, 1.19586181640625, 1.2531890869140625, 1.310516357421875, 1.3678436279296875, 1.4251708984375, 1.4824981689453125, 1.539825439453125, 1.5971527099609375, 1.65447998046875, 1.7118072509765625, 1.769134521484375, 1.8264617919921875, 1.8837890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 6.0, 8.0, 15.0, 14.0, 15.0, 23.0, 22.0, 32.0, 37.0, 31.0, 38.0, 51.0, 49.0, 39.0, 45.0, 45.0, 50.0, 60.0, 58.0, 34.0, 33.0, 31.0, 39.0, 31.0, 23.0, 21.0, 24.0, 8.0, 19.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.51513671875, -0.49948883056640625, -0.4838409423828125, -0.46819305419921875, -0.452545166015625, -0.43689727783203125, -0.4212493896484375, -0.40560150146484375, -0.38995361328125, -0.37430572509765625, -0.3586578369140625, -0.34300994873046875, -0.327362060546875, -0.31171417236328125, -0.2960662841796875, -0.28041839599609375, -0.2647705078125, -0.24912261962890625, -0.2334747314453125, -0.21782684326171875, -0.202178955078125, -0.18653106689453125, -0.1708831787109375, -0.15523529052734375, -0.13958740234375, -0.12393951416015625, -0.1082916259765625, -0.09264373779296875, -0.076995849609375, -0.06134796142578125, -0.0457000732421875, -0.03005218505859375, -0.014404296875, 0.00124359130859375, 0.0168914794921875, 0.03253936767578125, 0.048187255859375, 0.06383514404296875, 0.0794830322265625, 0.09513092041015625, 0.11077880859375, 0.12642669677734375, 0.1420745849609375, 0.15772247314453125, 0.173370361328125, 0.18901824951171875, 0.2046661376953125, 0.22031402587890625, 0.2359619140625, 0.25160980224609375, 0.2672576904296875, 0.28290557861328125, 0.298553466796875, 0.31420135498046875, 0.3298492431640625, 0.34549713134765625, 0.36114501953125, 0.37679290771484375, 0.3924407958984375, 0.40808868408203125, 0.423736572265625, 0.43938446044921875, 0.4550323486328125, 0.47068023681640625, 0.486328125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 9.0, 12.0, 18.0, 20.0, 20.0, 18.0, 23.0, 25.0, 30.0, 27.0, 40.0, 38.0, 53.0, 49.0, 32.0, 47.0, 50.0, 56.0, 43.0, 36.0, 44.0, 40.0, 33.0, 25.0, 26.0, 30.0, 24.0, 17.0, 18.0, 13.0, 17.0, 11.0, 2.0, 9.0, 8.0, 5.0, 2.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.74275541305542, -2.6544618606567383, -2.5661680698394775, -2.477874279022217, -2.389580726623535, -2.3012871742248535, -2.2129933834075928, -2.124699592590332, -2.0364060401916504, -1.9481123685836792, -1.859818696975708, -1.7715250253677368, -1.6832313537597656, -1.5949376821517944, -1.5066440105438232, -1.418350338935852, -1.3300566673278809, -1.2417629957199097, -1.1534693241119385, -1.0651756525039673, -0.9768819808959961, -0.8885883092880249, -0.8002946376800537, -0.7120009660720825, -0.6237072944641113, -0.5354136228561401, -0.44711995124816895, -0.35882627964019775, -0.27053260803222656, -0.18223893642425537, -0.09394526481628418, -0.005651593208312988, 0.0826418399810791, 0.1709355115890503, 0.2592291831970215, 0.3475228548049927, 0.43581652641296387, 0.5241101980209351, 0.6124038696289062, 0.7006975412368774, 0.7889912128448486, 0.8772848844528198, 0.965578556060791, 1.0538722276687622, 1.1421658992767334, 1.2304595708847046, 1.3187532424926758, 1.407046914100647, 1.4953405857086182, 1.5836342573165894, 1.6719279289245605, 1.7602216005325317, 1.848515272140503, 1.9368089437484741, 2.0251026153564453, 2.113396167755127, 2.2016899585723877, 2.2899837493896484, 2.37827730178833, 2.4665708541870117, 2.5548646450042725, 2.643158435821533, 2.731451988220215, 2.8197455406188965, 2.9080393314361572]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 12.0, 17.0, 13.0, 12.0, 18.0, 18.0, 11.0, 21.0, 21.0, 22.0, 29.0, 25.0, 35.0, 44.0, 31.0, 45.0, 38.0, 35.0, 41.0, 38.0, 50.0, 36.0, 35.0, 30.0, 35.0, 29.0, 31.0, 25.0, 26.0, 20.0, 23.0, 24.0, 17.0, 17.0, 13.0, 9.0, 7.0, 8.0, 1.0, 7.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5127570629119873, -2.4362292289733887, -2.35970139503479, -2.2831737995147705, -2.206645965576172, -2.1301181316375732, -2.0535902976989746, -1.977062463760376, -1.900534749031067, -1.8240069150924683, -1.7474792003631592, -1.6709513664245605, -1.594423532485962, -1.5178958177566528, -1.4413679838180542, -1.3648402690887451, -1.2883124351501465, -1.2117846012115479, -1.1352568864822388, -1.0587290525436401, -0.9822012782096863, -0.9056735038757324, -0.8291456699371338, -0.7526178956031799, -0.6760901212692261, -0.5995623469352722, -0.5230345726013184, -0.4465067386627197, -0.36997896432876587, -0.293451189994812, -0.21692338585853577, -0.14039558172225952, -0.06386804580688477, 0.012659743428230286, 0.08918753266334534, 0.1657153218984604, 0.24224311113357544, 0.3187708854675293, 0.39529868960380554, 0.4718264937400818, 0.5483542680740356, 0.6248820424079895, 0.7014098167419434, 0.777937650680542, 0.8544654250144958, 0.9309931993484497, 1.0075210332870483, 1.0840487480163574, 1.160576581954956, 1.2371044158935547, 1.3136321306228638, 1.3901599645614624, 1.4666876792907715, 1.5432155132293701, 1.6197433471679688, 1.6962711811065674, 1.7727988958358765, 1.849326729774475, 1.9258544445037842, 2.002382278442383, 2.0789101123809814, 2.15543794631958, 2.2319655418395996, 2.3084933757781982, 2.385021209716797]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 6.0, 10.0, 21.0, 21.0, 41.0, 82.0, 159.0, 239.0, 390.0, 668.0, 1130.0, 1920.0, 3135.0, 5245.0, 8943.0, 15356.0, 26283.0, 43784.0, 73951.0, 121924.0, 195773.0, 300346.0, 427972.0, 543121.0, 593948.0, 550498.0, 439748.0, 312250.0, 205893.0, 128274.0, 78963.0, 46810.0, 27504.0, 16233.0, 9442.0, 5712.0, 3344.0, 2006.0, 1213.0, 724.0, 465.0, 299.0, 164.0, 114.0, 60.0, 31.0, 42.0, 11.0, 8.0, 1.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8932037353515625, -1.824493408203125, -1.7557830810546875, -1.68707275390625, -1.6183624267578125, -1.549652099609375, -1.4809417724609375, -1.4122314453125, -1.3435211181640625, -1.274810791015625, -1.2061004638671875, -1.13739013671875, -1.0686798095703125, -0.999969482421875, -0.9312591552734375, -0.862548828125, -0.7938385009765625, -0.725128173828125, -0.6564178466796875, -0.58770751953125, -0.5189971923828125, -0.450286865234375, -0.3815765380859375, -0.3128662109375, -0.2441558837890625, -0.175445556640625, -0.1067352294921875, -0.03802490234375, 0.0306854248046875, 0.099395751953125, 0.1681060791015625, 0.23681640625, 0.3055267333984375, 0.374237060546875, 0.4429473876953125, 0.51165771484375, 0.5803680419921875, 0.649078369140625, 0.7177886962890625, 0.7864990234375, 0.8552093505859375, 0.923919677734375, 0.9926300048828125, 1.06134033203125, 1.1300506591796875, 1.198760986328125, 1.2674713134765625, 1.336181640625, 1.4048919677734375, 1.473602294921875, 1.5423126220703125, 1.61102294921875, 1.6797332763671875, 1.748443603515625, 1.8171539306640625, 1.8858642578125, 1.9545745849609375, 2.023284912109375, 2.0919952392578125, 2.16070556640625, 2.2294158935546875, 2.298126220703125, 2.3668365478515625, 2.435546875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 12.0, 13.0, 19.0, 8.0, 17.0, 29.0, 30.0, 17.0, 36.0, 35.0, 32.0, 40.0, 40.0, 38.0, 45.0, 37.0, 45.0, 44.0, 46.0, 44.0, 38.0, 34.0, 35.0, 26.0, 31.0, 24.0, 26.0, 26.0, 15.0, 20.0, 12.0, 16.0, 16.0, 11.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9421234130859375, -1.882293701171875, -1.8224639892578125, -1.76263427734375, -1.7028045654296875, -1.642974853515625, -1.5831451416015625, -1.5233154296875, -1.4634857177734375, -1.403656005859375, -1.3438262939453125, -1.28399658203125, -1.2241668701171875, -1.164337158203125, -1.1045074462890625, -1.044677734375, -0.9848480224609375, -0.925018310546875, -0.8651885986328125, -0.80535888671875, -0.7455291748046875, -0.685699462890625, -0.6258697509765625, -0.5660400390625, -0.5062103271484375, -0.446380615234375, -0.3865509033203125, -0.32672119140625, -0.2668914794921875, -0.207061767578125, -0.1472320556640625, -0.08740234375, -0.0275726318359375, 0.032257080078125, 0.0920867919921875, 0.15191650390625, 0.2117462158203125, 0.271575927734375, 0.3314056396484375, 0.3912353515625, 0.4510650634765625, 0.510894775390625, 0.5707244873046875, 0.63055419921875, 0.6903839111328125, 0.750213623046875, 0.8100433349609375, 0.869873046875, 0.9297027587890625, 0.989532470703125, 1.0493621826171875, 1.10919189453125, 1.1690216064453125, 1.228851318359375, 1.2886810302734375, 1.3485107421875, 1.4083404541015625, 1.468170166015625, 1.5279998779296875, 1.58782958984375, 1.6476593017578125, 1.707489013671875, 1.7673187255859375, 1.8271484375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 9.0, 8.0, 19.0, 37.0, 48.0, 70.0, 121.0, 167.0, 305.0, 522.0, 747.0, 1175.0, 1888.0, 3016.0, 4639.0, 7535.0, 11887.0, 18713.0, 29477.0, 45899.0, 70096.0, 105526.0, 151809.0, 214589.0, 287922.0, 365575.0, 428604.0, 462047.0, 449901.0, 399661.0, 328065.0, 250259.0, 182285.0, 127444.0, 85086.0, 57148.0, 37173.0, 23739.0, 15027.0, 9676.0, 5978.0, 3814.0, 2405.0, 1584.0, 941.0, 611.0, 388.0, 230.0, 144.0, 83.0, 92.0, 36.0, 26.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0], "bins": [-1.8271484375, -1.7713623046875, -1.715576171875, -1.6597900390625, -1.60400390625, -1.5482177734375, -1.492431640625, -1.4366455078125, -1.380859375, -1.3250732421875, -1.269287109375, -1.2135009765625, -1.15771484375, -1.1019287109375, -1.046142578125, -0.9903564453125, -0.9345703125, -0.8787841796875, -0.822998046875, -0.7672119140625, -0.71142578125, -0.6556396484375, -0.599853515625, -0.5440673828125, -0.48828125, -0.4324951171875, -0.376708984375, -0.3209228515625, -0.26513671875, -0.2093505859375, -0.153564453125, -0.0977783203125, -0.0419921875, 0.0137939453125, 0.069580078125, 0.1253662109375, 0.18115234375, 0.2369384765625, 0.292724609375, 0.3485107421875, 0.404296875, 0.4600830078125, 0.515869140625, 0.5716552734375, 0.62744140625, 0.6832275390625, 0.739013671875, 0.7947998046875, 0.8505859375, 0.9063720703125, 0.962158203125, 1.0179443359375, 1.07373046875, 1.1295166015625, 1.185302734375, 1.2410888671875, 1.296875, 1.3526611328125, 1.408447265625, 1.4642333984375, 1.52001953125, 1.5758056640625, 1.631591796875, 1.6873779296875, 1.7431640625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 17.0, 15.0, 19.0, 14.0, 21.0, 18.0, 38.0, 35.0, 45.0, 55.0, 65.0, 106.0, 108.0, 117.0, 120.0, 146.0, 155.0, 174.0, 173.0, 199.0, 202.0, 188.0, 197.0, 193.0, 198.0, 167.0, 179.0, 164.0, 144.0, 129.0, 104.0, 106.0, 79.0, 56.0, 84.0, 58.0, 39.0, 27.0, 20.0, 23.0, 21.0, 9.0, 8.0, 12.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.88037109375, -0.8539810180664062, -0.8275909423828125, -0.8012008666992188, -0.774810791015625, -0.7484207153320312, -0.7220306396484375, -0.6956405639648438, -0.66925048828125, -0.6428604125976562, -0.6164703369140625, -0.5900802612304688, -0.563690185546875, -0.5373001098632812, -0.5109100341796875, -0.48451995849609375, -0.4581298828125, -0.43173980712890625, -0.4053497314453125, -0.37895965576171875, -0.352569580078125, -0.32617950439453125, -0.2997894287109375, -0.27339935302734375, -0.24700927734375, -0.22061920166015625, -0.1942291259765625, -0.16783905029296875, -0.141448974609375, -0.11505889892578125, -0.0886688232421875, -0.06227874755859375, -0.035888671875, -0.00949859619140625, 0.0168914794921875, 0.04328155517578125, 0.069671630859375, 0.09606170654296875, 0.1224517822265625, 0.14884185791015625, 0.17523193359375, 0.20162200927734375, 0.2280120849609375, 0.25440216064453125, 0.280792236328125, 0.30718231201171875, 0.3335723876953125, 0.35996246337890625, 0.3863525390625, 0.41274261474609375, 0.4391326904296875, 0.46552276611328125, 0.491912841796875, 0.5183029174804688, 0.5446929931640625, 0.5710830688476562, 0.59747314453125, 0.6238632202148438, 0.6502532958984375, 0.6766433715820312, 0.703033447265625, 0.7294235229492188, 0.7558135986328125, 0.7822036743164062, 0.80859375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 11.0, 18.0, 21.0, 28.0, 26.0, 25.0, 44.0, 35.0, 38.0, 41.0, 48.0, 41.0, 53.0, 54.0, 62.0, 55.0, 44.0, 40.0, 44.0, 34.0, 41.0, 40.0, 27.0, 22.0, 13.0, 16.0, 12.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.011713743209839, -2.9235851764678955, -2.835456609725952, -2.747328042984009, -2.6591994762420654, -2.571070909500122, -2.482942581176758, -2.3948140144348145, -2.306685447692871, -2.2185568809509277, -2.1304283142089844, -2.042299747467041, -1.9541711807250977, -1.8660426139831543, -1.7779141664505005, -1.6897855997085571, -1.6016569137573242, -1.5135283470153809, -1.4253997802734375, -1.3372712135314941, -1.2491426467895508, -1.1610140800476074, -1.0728856325149536, -0.9847570657730103, -0.8966284990310669, -0.8084999322891235, -0.7203713655471802, -0.6322428584098816, -0.5441142916679382, -0.4559857249259949, -0.3678572177886963, -0.27972865104675293, -0.19160032272338867, -0.1034717708826065, -0.01534321904182434, 0.07278531789779663, 0.16091388463974, 0.24904245138168335, 0.33717095851898193, 0.4252995252609253, 0.5134280920028687, 0.601556658744812, 0.6896852254867554, 0.777813732624054, 0.8659422993659973, 0.9540708661079407, 1.0421993732452393, 1.1303279399871826, 1.218456506729126, 1.3065850734710693, 1.3947136402130127, 1.482842206954956, 1.5709707736968994, 1.6590993404388428, 1.7472277879714966, 1.83535635471344, 1.9234849214553833, 2.011613368988037, 2.0997419357299805, 2.187870502471924, 2.275999069213867, 2.3641276359558105, 2.452256202697754, 2.5403847694396973, 2.6285133361816406]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 6.0, 12.0, 12.0, 14.0, 12.0, 15.0, 16.0, 16.0, 22.0, 19.0, 35.0, 35.0, 24.0, 23.0, 22.0, 24.0, 34.0, 42.0, 40.0, 31.0, 47.0, 35.0, 44.0, 37.0, 34.0, 27.0, 35.0, 27.0, 32.0, 26.0, 15.0, 26.0, 20.0, 15.0, 13.0, 16.0, 16.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.096761703491211, -2.035475492477417, -1.9741891622543335, -1.91290283203125, -1.851616621017456, -1.790330410003662, -1.7290440797805786, -1.6677577495574951, -1.6064715385437012, -1.5451853275299072, -1.4838989973068237, -1.4226126670837402, -1.3613264560699463, -1.3000402450561523, -1.2387539148330688, -1.1774675846099854, -1.1161813735961914, -1.0548951625823975, -0.993608832359314, -0.9323225617408752, -0.8710362911224365, -0.8097500205039978, -0.7484637498855591, -0.6871774792671204, -0.6258912086486816, -0.5646049380302429, -0.5033186674118042, -0.4420323967933655, -0.38074612617492676, -0.31945985555648804, -0.2581735849380493, -0.1968873143196106, -0.13560104370117188, -0.07431477308273315, -0.013028502464294434, 0.04825776815414429, 0.10954403877258301, 0.17083030939102173, 0.23211658000946045, 0.29340285062789917, 0.3546891212463379, 0.4159753918647766, 0.47726166248321533, 0.538547933101654, 0.5998342037200928, 0.6611204743385315, 0.7224067449569702, 0.7836930155754089, 0.8449792861938477, 0.9062655568122864, 0.9675518274307251, 1.0288381576538086, 1.0901243686676025, 1.1514105796813965, 1.21269690990448, 1.2739832401275635, 1.3352694511413574, 1.3965556621551514, 1.4578419923782349, 1.5191283226013184, 1.5804145336151123, 1.6417007446289062, 1.7029870748519897, 1.7642734050750732, 1.8255596160888672]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 10.0, 9.0, 20.0, 18.0, 25.0, 37.0, 46.0, 61.0, 91.0, 128.0, 177.0, 265.0, 417.0, 556.0, 812.0, 1361.0, 2705.0, 5607.0, 14257.0, 43241.0, 140649.0, 375635.0, 308765.0, 101030.0, 31303.0, 10988.0, 4435.0, 2184.0, 1269.0, 779.0, 503.0, 344.0, 251.0, 156.0, 122.0, 82.0, 51.0, 43.0, 29.0, 28.0, 20.0, 16.0, 6.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.629638671875, -2.54443359375, -2.459228515625, -2.3740234375, -2.288818359375, -2.20361328125, -2.118408203125, -2.033203125, -1.947998046875, -1.86279296875, -1.777587890625, -1.6923828125, -1.607177734375, -1.52197265625, -1.436767578125, -1.3515625, -1.266357421875, -1.18115234375, -1.095947265625, -1.0107421875, -0.925537109375, -0.84033203125, -0.755126953125, -0.669921875, -0.584716796875, -0.49951171875, -0.414306640625, -0.3291015625, -0.243896484375, -0.15869140625, -0.073486328125, 0.01171875, 0.096923828125, 0.18212890625, 0.267333984375, 0.3525390625, 0.437744140625, 0.52294921875, 0.608154296875, 0.693359375, 0.778564453125, 0.86376953125, 0.948974609375, 1.0341796875, 1.119384765625, 1.20458984375, 1.289794921875, 1.375, 1.460205078125, 1.54541015625, 1.630615234375, 1.7158203125, 1.801025390625, 1.88623046875, 1.971435546875, 2.056640625, 2.141845703125, 2.22705078125, 2.312255859375, 2.3974609375, 2.482666015625, 2.56787109375, 2.653076171875, 2.73828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 14.0, 9.0, 7.0, 10.0, 13.0, 21.0, 20.0, 21.0, 26.0, 28.0, 34.0, 31.0, 28.0, 30.0, 35.0, 32.0, 34.0, 35.0, 46.0, 47.0, 38.0, 38.0, 33.0, 33.0, 21.0, 30.0, 28.0, 24.0, 22.0, 14.0, 29.0, 15.0, 15.0, 22.0, 18.0, 10.0, 8.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-2.134765625, -2.0708160400390625, -2.006866455078125, -1.9429168701171875, -1.87896728515625, -1.8150177001953125, -1.751068115234375, -1.6871185302734375, -1.6231689453125, -1.5592193603515625, -1.495269775390625, -1.4313201904296875, -1.36737060546875, -1.3034210205078125, -1.239471435546875, -1.1755218505859375, -1.111572265625, -1.0476226806640625, -0.983673095703125, -0.9197235107421875, -0.85577392578125, -0.7918243408203125, -0.727874755859375, -0.6639251708984375, -0.5999755859375, -0.5360260009765625, -0.472076416015625, -0.4081268310546875, -0.34417724609375, -0.2802276611328125, -0.216278076171875, -0.1523284912109375, -0.08837890625, -0.0244293212890625, 0.039520263671875, 0.1034698486328125, 0.16741943359375, 0.2313690185546875, 0.295318603515625, 0.3592681884765625, 0.4232177734375, 0.4871673583984375, 0.551116943359375, 0.6150665283203125, 0.67901611328125, 0.7429656982421875, 0.806915283203125, 0.8708648681640625, 0.934814453125, 0.9987640380859375, 1.062713623046875, 1.1266632080078125, 1.19061279296875, 1.2545623779296875, 1.318511962890625, 1.3824615478515625, 1.4464111328125, 1.5103607177734375, 1.574310302734375, 1.6382598876953125, 1.70220947265625, 1.7661590576171875, 1.830108642578125, 1.8940582275390625, 1.9580078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 9.0, 5.0, 12.0, 15.0, 19.0, 20.0, 35.0, 42.0, 65.0, 84.0, 101.0, 149.0, 214.0, 318.0, 477.0, 797.0, 1312.0, 2466.0, 5516.0, 13967.0, 39360.0, 128808.0, 370817.0, 324835.0, 104280.0, 32704.0, 11659.0, 4724.0, 2312.0, 1175.0, 725.0, 433.0, 311.0, 216.0, 177.0, 96.0, 76.0, 49.0, 41.0, 24.0, 24.0, 21.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 3.0], "bins": [-2.76171875, -2.6826171875, -2.603515625, -2.5244140625, -2.4453125, -2.3662109375, -2.287109375, -2.2080078125, -2.12890625, -2.0498046875, -1.970703125, -1.8916015625, -1.8125, -1.7333984375, -1.654296875, -1.5751953125, -1.49609375, -1.4169921875, -1.337890625, -1.2587890625, -1.1796875, -1.1005859375, -1.021484375, -0.9423828125, -0.86328125, -0.7841796875, -0.705078125, -0.6259765625, -0.546875, -0.4677734375, -0.388671875, -0.3095703125, -0.23046875, -0.1513671875, -0.072265625, 0.0068359375, 0.0859375, 0.1650390625, 0.244140625, 0.3232421875, 0.40234375, 0.4814453125, 0.560546875, 0.6396484375, 0.71875, 0.7978515625, 0.876953125, 0.9560546875, 1.03515625, 1.1142578125, 1.193359375, 1.2724609375, 1.3515625, 1.4306640625, 1.509765625, 1.5888671875, 1.66796875, 1.7470703125, 1.826171875, 1.9052734375, 1.984375, 2.0634765625, 2.142578125, 2.2216796875, 2.30078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 8.0, 14.0, 11.0, 11.0, 14.0, 24.0, 22.0, 28.0, 26.0, 27.0, 22.0, 38.0, 39.0, 23.0, 30.0, 40.0, 43.0, 51.0, 49.0, 53.0, 40.0, 38.0, 34.0, 46.0, 36.0, 40.0, 23.0, 24.0, 19.0, 28.0, 18.0, 16.0, 7.0, 10.0, 10.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.734375, -1.6830291748046875, -1.631683349609375, -1.5803375244140625, -1.52899169921875, -1.4776458740234375, -1.426300048828125, -1.3749542236328125, -1.3236083984375, -1.2722625732421875, -1.220916748046875, -1.1695709228515625, -1.11822509765625, -1.0668792724609375, -1.015533447265625, -0.9641876220703125, -0.912841796875, -0.8614959716796875, -0.810150146484375, -0.7588043212890625, -0.70745849609375, -0.6561126708984375, -0.604766845703125, -0.5534210205078125, -0.5020751953125, -0.4507293701171875, -0.399383544921875, -0.3480377197265625, -0.29669189453125, -0.2453460693359375, -0.194000244140625, -0.1426544189453125, -0.09130859375, -0.0399627685546875, 0.011383056640625, 0.0627288818359375, 0.11407470703125, 0.1654205322265625, 0.216766357421875, 0.2681121826171875, 0.3194580078125, 0.3708038330078125, 0.422149658203125, 0.4734954833984375, 0.52484130859375, 0.5761871337890625, 0.627532958984375, 0.6788787841796875, 0.730224609375, 0.7815704345703125, 0.832916259765625, 0.8842620849609375, 0.93560791015625, 0.9869537353515625, 1.038299560546875, 1.0896453857421875, 1.1409912109375, 1.1923370361328125, 1.243682861328125, 1.2950286865234375, 1.34637451171875, 1.3977203369140625, 1.449066162109375, 1.5004119873046875, 1.5517578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 10.0, 9.0, 8.0, 19.0, 28.0, 21.0, 31.0, 52.0, 91.0, 116.0, 173.0, 269.0, 380.0, 556.0, 871.0, 1501.0, 2573.0, 4553.0, 10212.0, 30174.0, 135434.0, 560332.0, 229287.0, 44475.0, 13761.0, 5808.0, 3035.0, 1658.0, 1054.0, 670.0, 436.0, 302.0, 189.0, 126.0, 79.0, 66.0, 49.0, 40.0, 34.0, 16.0, 19.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.205078125, -1.1681671142578125, -1.131256103515625, -1.0943450927734375, -1.05743408203125, -1.0205230712890625, -0.983612060546875, -0.9467010498046875, -0.9097900390625, -0.8728790283203125, -0.835968017578125, -0.7990570068359375, -0.76214599609375, -0.7252349853515625, -0.688323974609375, -0.6514129638671875, -0.614501953125, -0.5775909423828125, -0.540679931640625, -0.5037689208984375, -0.46685791015625, -0.4299468994140625, -0.393035888671875, -0.3561248779296875, -0.3192138671875, -0.2823028564453125, -0.245391845703125, -0.2084808349609375, -0.17156982421875, -0.1346588134765625, -0.097747802734375, -0.0608367919921875, -0.02392578125, 0.0129852294921875, 0.049896240234375, 0.0868072509765625, 0.12371826171875, 0.1606292724609375, 0.197540283203125, 0.2344512939453125, 0.2713623046875, 0.3082733154296875, 0.345184326171875, 0.3820953369140625, 0.41900634765625, 0.4559173583984375, 0.492828369140625, 0.5297393798828125, 0.566650390625, 0.6035614013671875, 0.640472412109375, 0.6773834228515625, 0.71429443359375, 0.7512054443359375, 0.788116455078125, 0.8250274658203125, 0.8619384765625, 0.8988494873046875, 0.935760498046875, 0.9726715087890625, 1.00958251953125, 1.0464935302734375, 1.083404541015625, 1.1203155517578125, 1.1572265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 10.0, 20.0, 31.0, 34.0, 38.0, 54.0, 67.0, 70.0, 62.0, 74.0, 94.0, 76.0, 68.0, 47.0, 35.0, 41.0, 26.0, 30.0, 21.0, 18.0, 8.0, 9.0, 4.0, 4.0, 1.0, 7.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.99758529663086e-05, -6.81411474943161e-05, -6.630644202232361e-05, -6.447173655033112e-05, -6.263703107833862e-05, -6.080232560634613e-05, -5.896762013435364e-05, -5.7132914662361145e-05, -5.529820919036865e-05, -5.346350371837616e-05, -5.162879824638367e-05, -4.9794092774391174e-05, -4.795938730239868e-05, -4.612468183040619e-05, -4.4289976358413696e-05, -4.2455270886421204e-05, -4.062056541442871e-05, -3.878585994243622e-05, -3.6951154470443726e-05, -3.511644899845123e-05, -3.328174352645874e-05, -3.144703805446625e-05, -2.9612332582473755e-05, -2.7777627110481262e-05, -2.594292163848877e-05, -2.4108216166496277e-05, -2.2273510694503784e-05, -2.043880522251129e-05, -1.86040997505188e-05, -1.6769394278526306e-05, -1.4934688806533813e-05, -1.309998333454132e-05, -1.1265277862548828e-05, -9.430572390556335e-06, -7.595866918563843e-06, -5.76116144657135e-06, -3.926455974578857e-06, -2.0917505025863647e-06, -2.5704503059387207e-07, 1.5776604413986206e-06, 3.4123659133911133e-06, 5.247071385383606e-06, 7.081776857376099e-06, 8.916482329368591e-06, 1.0751187801361084e-05, 1.2585893273353577e-05, 1.442059874534607e-05, 1.6255304217338562e-05, 1.8090009689331055e-05, 1.9924715161323547e-05, 2.175942063331604e-05, 2.3594126105308533e-05, 2.5428831577301025e-05, 2.7263537049293518e-05, 2.909824252128601e-05, 3.0932947993278503e-05, 3.2767653465270996e-05, 3.460235893726349e-05, 3.643706440925598e-05, 3.8271769881248474e-05, 4.010647535324097e-05, 4.194118082523346e-05, 4.377588629722595e-05, 4.5610591769218445e-05, 4.744529724121094e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 14.0, 15.0, 30.0, 39.0, 55.0, 83.0, 105.0, 178.0, 249.0, 384.0, 560.0, 839.0, 1297.0, 1942.0, 3400.0, 5662.0, 10182.0, 19208.0, 38796.0, 81446.0, 169774.0, 276304.0, 218826.0, 110166.0, 52086.0, 25528.0, 13194.0, 7150.0, 4109.0, 2352.0, 1586.0, 958.0, 682.0, 441.0, 288.0, 199.0, 135.0, 95.0, 63.0, 40.0, 21.0, 16.0, 17.0, 6.0, 10.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7031707763671875, -0.680267333984375, -0.6573638916015625, -0.63446044921875, -0.6115570068359375, -0.588653564453125, -0.5657501220703125, -0.5428466796875, -0.5199432373046875, -0.497039794921875, -0.4741363525390625, -0.45123291015625, -0.4283294677734375, -0.405426025390625, -0.3825225830078125, -0.359619140625, -0.3367156982421875, -0.313812255859375, -0.2909088134765625, -0.26800537109375, -0.2451019287109375, -0.222198486328125, -0.1992950439453125, -0.1763916015625, -0.1534881591796875, -0.130584716796875, -0.1076812744140625, -0.08477783203125, -0.0618743896484375, -0.038970947265625, -0.0160675048828125, 0.0068359375, 0.0297393798828125, 0.052642822265625, 0.0755462646484375, 0.09844970703125, 0.1213531494140625, 0.144256591796875, 0.1671600341796875, 0.1900634765625, 0.2129669189453125, 0.235870361328125, 0.2587738037109375, 0.28167724609375, 0.3045806884765625, 0.327484130859375, 0.3503875732421875, 0.373291015625, 0.3961944580078125, 0.419097900390625, 0.4420013427734375, 0.46490478515625, 0.4878082275390625, 0.510711669921875, 0.5336151123046875, 0.5565185546875, 0.5794219970703125, 0.602325439453125, 0.6252288818359375, 0.64813232421875, 0.6710357666015625, 0.693939208984375, 0.7168426513671875, 0.73974609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 6.0, 12.0, 22.0, 28.0, 25.0, 55.0, 65.0, 77.0, 97.0, 116.0, 105.0, 97.0, 74.0, 64.0, 43.0, 22.0, 28.0, 9.0, 13.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2656707763671875, -0.254974365234375, -0.2442779541015625, -0.23358154296875, -0.2228851318359375, -0.212188720703125, -0.2014923095703125, -0.1907958984375, -0.1800994873046875, -0.169403076171875, -0.1587066650390625, -0.14801025390625, -0.1373138427734375, -0.126617431640625, -0.1159210205078125, -0.105224609375, -0.0945281982421875, -0.083831787109375, -0.0731353759765625, -0.06243896484375, -0.0517425537109375, -0.041046142578125, -0.0303497314453125, -0.0196533203125, -0.0089569091796875, 0.001739501953125, 0.0124359130859375, 0.02313232421875, 0.0338287353515625, 0.044525146484375, 0.0552215576171875, 0.06591796875, 0.0766143798828125, 0.087310791015625, 0.0980072021484375, 0.10870361328125, 0.1194000244140625, 0.130096435546875, 0.1407928466796875, 0.1514892578125, 0.1621856689453125, 0.172882080078125, 0.1835784912109375, 0.19427490234375, 0.2049713134765625, 0.215667724609375, 0.2263641357421875, 0.237060546875, 0.2477569580078125, 0.258453369140625, 0.2691497802734375, 0.27984619140625, 0.2905426025390625, 0.301239013671875, 0.3119354248046875, 0.3226318359375, 0.3333282470703125, 0.344024658203125, 0.3547210693359375, 0.36541748046875, 0.3761138916015625, 0.386810302734375, 0.3975067138671875, 0.408203125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 4.0, 7.0, 11.0, 6.0, 8.0, 18.0, 28.0, 29.0, 18.0, 41.0, 36.0, 43.0, 33.0, 42.0, 48.0, 54.0, 45.0, 73.0, 54.0, 51.0, 46.0, 39.0, 39.0, 42.0, 39.0, 28.0, 26.0, 16.0, 12.0, 16.0, 13.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.925477981567383, -2.8365590572357178, -2.7476401329040527, -2.6587212085723877, -2.5698022842407227, -2.4808833599090576, -2.3919644355773926, -2.3030452728271484, -2.2141265869140625, -2.1252076625823975, -2.0362887382507324, -1.9473698139190674, -1.8584508895874023, -1.7695319652557373, -1.6806129217147827, -1.5916939973831177, -1.502774953842163, -1.413856029510498, -1.324937105178833, -1.236018180847168, -1.147099256515503, -1.058180332183838, -0.9692612886428833, -0.8803423643112183, -0.7914234399795532, -0.7025045156478882, -0.6135855913162231, -0.5246666073799133, -0.4357476830482483, -0.34682875871658325, -0.25790977478027344, -0.1689908504486084, -0.08007168769836426, 0.008847251534461975, 0.09776619076728821, 0.18668514490127563, 0.2756040692329407, 0.3645229935646057, 0.4534419775009155, 0.5423609018325806, 0.6312798261642456, 0.7201987504959106, 0.8091176748275757, 0.8980366587638855, 0.9869555830955505, 1.0758745670318604, 1.1647934913635254, 1.2537124156951904, 1.3426313400268555, 1.4315502643585205, 1.5204691886901855, 1.6093881130218506, 1.6983070373535156, 1.7872259616851807, 1.8761450052261353, 1.9650639295578003, 2.053982734680176, 2.142901659011841, 2.231820583343506, 2.320739507675171, 2.409658432006836, 2.498577356338501, 2.587496280670166, 2.67641544342041, 2.765334367752075]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 6.0, 4.0, 12.0, 8.0, 10.0, 16.0, 10.0, 16.0, 11.0, 18.0, 32.0, 28.0, 22.0, 30.0, 34.0, 24.0, 16.0, 29.0, 36.0, 40.0, 47.0, 46.0, 40.0, 32.0, 41.0, 35.0, 39.0, 40.0, 33.0, 22.0, 21.0, 24.0, 22.0, 17.0, 22.0, 10.0, 15.0, 15.0, 16.0, 13.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.1321260929107666, -2.0693349838256836, -2.0065436363220215, -1.9437525272369385, -1.880961298942566, -1.8181700706481934, -1.7553788423538208, -1.6925876140594482, -1.6297965049743652, -1.5670052766799927, -1.5042140483856201, -1.441422939300537, -1.3786317110061646, -1.315840482711792, -1.2530492544174194, -1.1902580261230469, -1.1274667978286743, -1.0646755695343018, -1.0018843412399292, -0.9390931725502014, -0.8763020038604736, -0.8135107755661011, -0.7507195472717285, -0.687928318977356, -0.6251371502876282, -0.5623459219932556, -0.49955475330352783, -0.4367635250091553, -0.3739723265171051, -0.31118112802505493, -0.24838989973068237, -0.1855987012386322, -0.12280738353729248, -0.06001617759466171, 0.002775028347969055, 0.06556624174118042, 0.1283574402332306, 0.19114863872528076, 0.2539398670196533, 0.3167310655117035, 0.37952226400375366, 0.44231346249580383, 0.505104660987854, 0.5678958892822266, 0.6306871175765991, 0.6934782862663269, 0.7562695145606995, 0.8190606832504272, 0.8818519115447998, 0.9446431398391724, 1.007434368133545, 1.070225477218628, 1.1330167055130005, 1.195807933807373, 1.2585991621017456, 1.3213903903961182, 1.3841814994812012, 1.4469727277755737, 1.5097639560699463, 1.5725550651550293, 1.6353462934494019, 1.6981375217437744, 1.760928750038147, 1.8237199783325195, 1.886511206626892]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 13.0, 13.0, 15.0, 38.0, 58.0, 85.0, 113.0, 178.0, 277.0, 402.0, 590.0, 847.0, 1352.0, 1984.0, 2889.0, 4574.0, 6788.0, 9948.0, 15071.0, 21892.0, 31813.0, 44284.0, 60720.0, 79197.0, 95565.0, 108340.0, 111284.0, 104707.0, 90615.0, 73121.0, 55075.0, 39756.0, 27912.0, 19219.0, 13079.0, 8825.0, 5909.0, 4038.0, 2730.0, 1805.0, 1146.0, 801.0, 496.0, 345.0, 214.0, 139.0, 87.0, 65.0, 34.0, 39.0, 21.0, 8.0, 9.0, 10.0, 6.0, 5.0, 5.0], "bins": [-2.111328125, -2.0479888916015625, -1.984649658203125, -1.9213104248046875, -1.85797119140625, -1.7946319580078125, -1.731292724609375, -1.6679534912109375, -1.6046142578125, -1.5412750244140625, -1.477935791015625, -1.4145965576171875, -1.35125732421875, -1.2879180908203125, -1.224578857421875, -1.1612396240234375, -1.097900390625, -1.0345611572265625, -0.971221923828125, -0.9078826904296875, -0.84454345703125, -0.7812042236328125, -0.717864990234375, -0.6545257568359375, -0.5911865234375, -0.5278472900390625, -0.464508056640625, -0.4011688232421875, -0.33782958984375, -0.2744903564453125, -0.211151123046875, -0.1478118896484375, -0.08447265625, -0.0211334228515625, 0.042205810546875, 0.1055450439453125, 0.16888427734375, 0.2322235107421875, 0.295562744140625, 0.3589019775390625, 0.4222412109375, 0.4855804443359375, 0.548919677734375, 0.6122589111328125, 0.67559814453125, 0.7389373779296875, 0.802276611328125, 0.8656158447265625, 0.928955078125, 0.9922943115234375, 1.055633544921875, 1.1189727783203125, 1.18231201171875, 1.2456512451171875, 1.308990478515625, 1.3723297119140625, 1.4356689453125, 1.4990081787109375, 1.562347412109375, 1.6256866455078125, 1.68902587890625, 1.7523651123046875, 1.815704345703125, 1.8790435791015625, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 10.0, 19.0, 16.0, 19.0, 19.0, 17.0, 19.0, 34.0, 21.0, 30.0, 27.0, 35.0, 36.0, 40.0, 38.0, 51.0, 36.0, 40.0, 45.0, 52.0, 36.0, 39.0, 28.0, 34.0, 29.0, 18.0, 16.0, 29.0, 21.0, 21.0, 17.0, 16.0, 11.0, 7.0, 7.0, 13.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.974609375, -1.91070556640625, -1.8468017578125, -1.78289794921875, -1.718994140625, -1.65509033203125, -1.5911865234375, -1.52728271484375, -1.46337890625, -1.39947509765625, -1.3355712890625, -1.27166748046875, -1.207763671875, -1.14385986328125, -1.0799560546875, -1.01605224609375, -0.9521484375, -0.88824462890625, -0.8243408203125, -0.76043701171875, -0.696533203125, -0.63262939453125, -0.5687255859375, -0.50482177734375, -0.44091796875, -0.37701416015625, -0.3131103515625, -0.24920654296875, -0.185302734375, -0.12139892578125, -0.0574951171875, 0.00640869140625, 0.0703125, 0.13421630859375, 0.1981201171875, 0.26202392578125, 0.325927734375, 0.38983154296875, 0.4537353515625, 0.51763916015625, 0.58154296875, 0.64544677734375, 0.7093505859375, 0.77325439453125, 0.837158203125, 0.90106201171875, 0.9649658203125, 1.02886962890625, 1.0927734375, 1.15667724609375, 1.2205810546875, 1.28448486328125, 1.348388671875, 1.41229248046875, 1.4761962890625, 1.54010009765625, 1.60400390625, 1.66790771484375, 1.7318115234375, 1.79571533203125, 1.859619140625, 1.92352294921875, 1.9874267578125, 2.05133056640625, 2.115234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 7.0, 22.0, 20.0, 33.0, 57.0, 106.0, 160.0, 276.0, 439.0, 734.0, 1193.0, 2015.0, 3604.0, 5963.0, 9842.0, 16141.0, 26400.0, 40745.0, 60684.0, 85314.0, 110673.0, 128409.0, 131738.0, 120376.0, 97600.0, 72003.0, 49639.0, 32462.0, 20363.0, 12548.0, 7641.0, 4443.0, 2739.0, 1672.0, 993.0, 591.0, 340.0, 237.0, 144.0, 84.0, 45.0, 30.0, 9.0, 12.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.7716064453125, -1.701416015625, -1.6312255859375, -1.56103515625, -1.4908447265625, -1.420654296875, -1.3504638671875, -1.2802734375, -1.2100830078125, -1.139892578125, -1.0697021484375, -0.99951171875, -0.9293212890625, -0.859130859375, -0.7889404296875, -0.71875, -0.6485595703125, -0.578369140625, -0.5081787109375, -0.43798828125, -0.3677978515625, -0.297607421875, -0.2274169921875, -0.1572265625, -0.0870361328125, -0.016845703125, 0.0533447265625, 0.12353515625, 0.1937255859375, 0.263916015625, 0.3341064453125, 0.404296875, 0.4744873046875, 0.544677734375, 0.6148681640625, 0.68505859375, 0.7552490234375, 0.825439453125, 0.8956298828125, 0.9658203125, 1.0360107421875, 1.106201171875, 1.1763916015625, 1.24658203125, 1.3167724609375, 1.386962890625, 1.4571533203125, 1.52734375, 1.5975341796875, 1.667724609375, 1.7379150390625, 1.80810546875, 1.8782958984375, 1.948486328125, 2.0186767578125, 2.0888671875, 2.1590576171875, 2.229248046875, 2.2994384765625, 2.36962890625, 2.4398193359375, 2.510009765625, 2.5802001953125, 2.650390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 21.0, 17.0, 12.0, 23.0, 26.0, 25.0, 21.0, 39.0, 28.0, 45.0, 31.0, 39.0, 41.0, 39.0, 51.0, 43.0, 47.0, 46.0, 45.0, 34.0, 41.0, 46.0, 33.0, 29.0, 23.0, 13.0, 22.0, 10.0, 18.0, 14.0, 6.0, 13.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.344024658203125, -1.29742431640625, -1.250823974609375, -1.2042236328125, -1.157623291015625, -1.11102294921875, -1.064422607421875, -1.017822265625, -0.971221923828125, -0.92462158203125, -0.878021240234375, -0.8314208984375, -0.784820556640625, -0.73822021484375, -0.691619873046875, -0.64501953125, -0.598419189453125, -0.55181884765625, -0.505218505859375, -0.4586181640625, -0.412017822265625, -0.36541748046875, -0.318817138671875, -0.272216796875, -0.225616455078125, -0.17901611328125, -0.132415771484375, -0.0858154296875, -0.039215087890625, 0.00738525390625, 0.053985595703125, 0.1005859375, 0.147186279296875, 0.19378662109375, 0.240386962890625, 0.2869873046875, 0.333587646484375, 0.38018798828125, 0.426788330078125, 0.473388671875, 0.519989013671875, 0.56658935546875, 0.613189697265625, 0.6597900390625, 0.706390380859375, 0.75299072265625, 0.799591064453125, 0.84619140625, 0.892791748046875, 0.93939208984375, 0.985992431640625, 1.0325927734375, 1.079193115234375, 1.12579345703125, 1.172393798828125, 1.218994140625, 1.265594482421875, 1.31219482421875, 1.358795166015625, 1.4053955078125, 1.451995849609375, 1.49859619140625, 1.545196533203125, 1.591796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 24.0, 30.0, 38.0, 48.0, 91.0, 99.0, 190.0, 250.0, 426.0, 647.0, 917.0, 1489.0, 2503.0, 4192.0, 7742.0, 15272.0, 31301.0, 69323.0, 162597.0, 299850.0, 243930.0, 110974.0, 48205.0, 22566.0, 11142.0, 5880.0, 3379.0, 1930.0, 1237.0, 799.0, 476.0, 318.0, 227.0, 137.0, 91.0, 71.0, 48.0, 35.0, 23.0, 19.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.289764404296875, -3.17132568359375, -3.052886962890625, -2.9344482421875, -2.816009521484375, -2.69757080078125, -2.579132080078125, -2.460693359375, -2.342254638671875, -2.22381591796875, -2.105377197265625, -1.9869384765625, -1.868499755859375, -1.75006103515625, -1.631622314453125, -1.51318359375, -1.394744873046875, -1.27630615234375, -1.157867431640625, -1.0394287109375, -0.920989990234375, -0.80255126953125, -0.684112548828125, -0.565673828125, -0.447235107421875, -0.32879638671875, -0.210357666015625, -0.0919189453125, 0.026519775390625, 0.14495849609375, 0.263397216796875, 0.3818359375, 0.500274658203125, 0.61871337890625, 0.737152099609375, 0.8555908203125, 0.974029541015625, 1.09246826171875, 1.210906982421875, 1.329345703125, 1.447784423828125, 1.56622314453125, 1.684661865234375, 1.8031005859375, 1.921539306640625, 2.03997802734375, 2.158416748046875, 2.27685546875, 2.395294189453125, 2.51373291015625, 2.632171630859375, 2.7506103515625, 2.869049072265625, 2.98748779296875, 3.105926513671875, 3.224365234375, 3.342803955078125, 3.46124267578125, 3.579681396484375, 3.6981201171875, 3.816558837890625, 3.93499755859375, 4.053436279296875, 4.171875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 8.0, 15.0, 19.0, 17.0, 23.0, 31.0, 51.0, 59.0, 55.0, 66.0, 90.0, 70.0, 56.0, 76.0, 49.0, 52.0, 46.0, 42.0, 19.0, 27.0, 15.0, 18.0, 5.0, 12.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020325183868408203, -0.00019521452486515045, -0.00018717721104621887, -0.0001791398972272873, -0.0001711025834083557, -0.00016306526958942413, -0.00015502795577049255, -0.00014699064195156097, -0.0001389533281326294, -0.00013091601431369781, -0.00012287870049476624, -0.00011484138667583466, -0.00010680407285690308, -9.87667590379715e-05, -9.072944521903992e-05, -8.269213140010834e-05, -7.465481758117676e-05, -6.661750376224518e-05, -5.85801899433136e-05, -5.054287612438202e-05, -4.250556230545044e-05, -3.446824848651886e-05, -2.643093466758728e-05, -1.83936208486557e-05, -1.0356307029724121e-05, -2.3189932107925415e-06, 5.718320608139038e-06, 1.3755634427070618e-05, 2.1792948246002197e-05, 2.9830262064933777e-05, 3.7867575883865356e-05, 4.5904889702796936e-05, 5.3942203521728516e-05, 6.19795173406601e-05, 7.001683115959167e-05, 7.805414497852325e-05, 8.609145879745483e-05, 9.412877261638641e-05, 0.00010216608643531799, 0.00011020340025424957, 0.00011824071407318115, 0.00012627802789211273, 0.0001343153417110443, 0.0001423526555299759, 0.00015038996934890747, 0.00015842728316783905, 0.00016646459698677063, 0.0001745019108057022, 0.0001825392246246338, 0.00019057653844356537, 0.00019861385226249695, 0.00020665116608142853, 0.0002146884799003601, 0.0002227257937192917, 0.00023076310753822327, 0.00023880042135715485, 0.0002468377351760864, 0.000254875048995018, 0.0002629123628139496, 0.00027094967663288116, 0.00027898699045181274, 0.0002870243042707443, 0.0002950616180896759, 0.0003030989319086075, 0.00031113624572753906]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 12.0, 17.0, 24.0, 37.0, 43.0, 83.0, 109.0, 158.0, 232.0, 340.0, 500.0, 727.0, 1038.0, 1526.0, 2483.0, 3754.0, 6155.0, 10440.0, 17877.0, 32690.0, 60087.0, 108852.0, 175784.0, 213301.0, 172608.0, 105094.0, 58427.0, 31708.0, 17327.0, 10101.0, 6087.0, 3734.0, 2395.0, 1488.0, 1046.0, 702.0, 469.0, 319.0, 233.0, 151.0, 118.0, 76.0, 64.0, 42.0, 34.0, 16.0, 15.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.132720947265625, -2.06036376953125, -1.988006591796875, -1.9156494140625, -1.843292236328125, -1.77093505859375, -1.698577880859375, -1.626220703125, -1.553863525390625, -1.48150634765625, -1.409149169921875, -1.3367919921875, -1.264434814453125, -1.19207763671875, -1.119720458984375, -1.04736328125, -0.975006103515625, -0.90264892578125, -0.830291748046875, -0.7579345703125, -0.685577392578125, -0.61322021484375, -0.540863037109375, -0.468505859375, -0.396148681640625, -0.32379150390625, -0.251434326171875, -0.1790771484375, -0.106719970703125, -0.03436279296875, 0.037994384765625, 0.1103515625, 0.182708740234375, 0.25506591796875, 0.327423095703125, 0.3997802734375, 0.472137451171875, 0.54449462890625, 0.616851806640625, 0.689208984375, 0.761566162109375, 0.83392333984375, 0.906280517578125, 0.9786376953125, 1.050994873046875, 1.12335205078125, 1.195709228515625, 1.26806640625, 1.340423583984375, 1.41278076171875, 1.485137939453125, 1.5574951171875, 1.629852294921875, 1.70220947265625, 1.774566650390625, 1.846923828125, 1.919281005859375, 1.99163818359375, 2.063995361328125, 2.1363525390625, 2.208709716796875, 2.28106689453125, 2.353424072265625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 6.0, 10.0, 15.0, 14.0, 14.0, 28.0, 30.0, 28.0, 41.0, 47.0, 55.0, 89.0, 61.0, 77.0, 67.0, 65.0, 54.0, 47.0, 44.0, 44.0, 23.0, 30.0, 17.0, 14.0, 17.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8664016723632812, -0.8397369384765625, -0.8130722045898438, -0.786407470703125, -0.7597427368164062, -0.7330780029296875, -0.7064132690429688, -0.67974853515625, -0.6530838012695312, -0.6264190673828125, -0.5997543334960938, -0.573089599609375, -0.5464248657226562, -0.5197601318359375, -0.49309539794921875, -0.4664306640625, -0.43976593017578125, -0.4131011962890625, -0.38643646240234375, -0.359771728515625, -0.33310699462890625, -0.3064422607421875, -0.27977752685546875, -0.25311279296875, -0.22644805908203125, -0.1997833251953125, -0.17311859130859375, -0.146453857421875, -0.11978912353515625, -0.0931243896484375, -0.06645965576171875, -0.039794921875, -0.01313018798828125, 0.0135345458984375, 0.04019927978515625, 0.066864013671875, 0.09352874755859375, 0.1201934814453125, 0.14685821533203125, 0.17352294921875, 0.20018768310546875, 0.2268524169921875, 0.25351715087890625, 0.280181884765625, 0.30684661865234375, 0.3335113525390625, 0.36017608642578125, 0.3868408203125, 0.41350555419921875, 0.4401702880859375, 0.46683502197265625, 0.493499755859375, 0.5201644897460938, 0.5468292236328125, 0.5734939575195312, 0.60015869140625, 0.6268234252929688, 0.6534881591796875, 0.6801528930664062, 0.706817626953125, 0.7334823608398438, 0.7601470947265625, 0.7868118286132812, 0.8134765625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 16.0, 11.0, 13.0, 17.0, 31.0, 29.0, 35.0, 34.0, 33.0, 43.0, 31.0, 42.0, 48.0, 46.0, 47.0, 55.0, 52.0, 45.0, 47.0, 34.0, 47.0, 24.0, 25.0, 33.0, 31.0, 22.0, 11.0, 22.0, 16.0, 5.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6193525791168213, -2.537788152694702, -2.456223487854004, -2.3746590614318848, -2.2930946350097656, -2.2115302085876465, -2.1299655437469482, -2.048401117324829, -1.96683669090271, -1.8852721452713013, -1.8037077188491821, -1.7221431732177734, -1.6405787467956543, -1.5590142011642456, -1.477449655532837, -1.3958852291107178, -1.314320683479309, -1.2327561378479004, -1.1511917114257812, -1.0696271657943726, -0.9880627393722534, -0.9064981937408447, -0.8249337077140808, -0.7433692216873169, -0.661804735660553, -0.5802402496337891, -0.49867576360702515, -0.41711124777793884, -0.3355467617511749, -0.253982275724411, -0.1724177598953247, -0.09085327386856079, -0.009288787841796875, 0.07227570563554764, 0.15384019911289215, 0.23540470004081726, 0.3169691860675812, 0.3985336720943451, 0.4800981879234314, 0.5616626739501953, 0.6432271599769592, 0.7247916460037231, 0.8063561320304871, 0.887920618057251, 0.9694851636886597, 1.0510495901107788, 1.1326141357421875, 1.2141785621643066, 1.2957431077957153, 1.377307653427124, 1.4588720798492432, 1.5404366254806519, 1.622001051902771, 1.7035655975341797, 1.7851300239562988, 1.8666945695877075, 1.9482591152191162, 2.0298235416412354, 2.1113882064819336, 2.1929526329040527, 2.274517059326172, 2.356081485748291, 2.4376461505889893, 2.5192105770111084, 2.6007750034332275]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 4.0, 11.0, 11.0, 12.0, 13.0, 11.0, 21.0, 13.0, 20.0, 25.0, 30.0, 24.0, 30.0, 28.0, 33.0, 33.0, 34.0, 31.0, 42.0, 34.0, 41.0, 35.0, 43.0, 52.0, 32.0, 39.0, 29.0, 32.0, 29.0, 32.0, 20.0, 31.0, 18.0, 11.0, 12.0, 12.0, 9.0, 8.0, 8.0, 9.0, 5.0, 7.0, 1.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.2677392959594727, -2.201488494873047, -2.135237693786621, -2.0689868927001953, -2.0027360916137695, -1.9364852905273438, -1.870234489440918, -1.8039836883544922, -1.7377328872680664, -1.6714820861816406, -1.6052312850952148, -1.538980484008789, -1.4727296829223633, -1.4064788818359375, -1.3402280807495117, -1.273977279663086, -1.2077263593673706, -1.1414755582809448, -1.075224757194519, -1.0089739561080933, -0.9427231550216675, -0.8764723539352417, -0.8102214932441711, -0.7439706921577454, -0.6777198910713196, -0.6114690899848938, -0.545218288898468, -0.47896745800971985, -0.41271665692329407, -0.3464658558368683, -0.2802150249481201, -0.21396422386169434, -0.147713303565979, -0.08146249502897263, -0.015211686491966248, 0.05103912949562073, 0.11728993058204651, 0.1835407316684723, 0.24979156255722046, 0.31604236364364624, 0.382293164730072, 0.4485439658164978, 0.5147947669029236, 0.5810456275939941, 0.6472964286804199, 0.7135472297668457, 0.7797980308532715, 0.8460488319396973, 0.912299633026123, 0.9785504341125488, 1.0448012351989746, 1.1110520362854004, 1.1773028373718262, 1.243553638458252, 1.3098044395446777, 1.3760552406311035, 1.4423060417175293, 1.508556842803955, 1.5748076438903809, 1.6410584449768066, 1.7073092460632324, 1.7735600471496582, 1.839810848236084, 1.9060616493225098, 1.972312569618225]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 17.0, 27.0, 29.0, 62.0, 97.0, 121.0, 240.0, 347.0, 570.0, 910.0, 1470.0, 2229.0, 3561.0, 5886.0, 9420.0, 15350.0, 24762.0, 39929.0, 63640.0, 100979.0, 155739.0, 235136.0, 336935.0, 446928.0, 529459.0, 548992.0, 491119.0, 387947.0, 277860.0, 187169.0, 121414.0, 77488.0, 48558.0, 30053.0, 18491.0, 11992.0, 7183.0, 4417.0, 2896.0, 1747.0, 1111.0, 720.0, 448.0, 292.0, 170.0, 143.0, 85.0, 47.0, 30.0, 20.0, 14.0, 10.0, 5.0, 13.0, 1.0, 1.0, 2.0], "bins": [-1.78125, -1.7259368896484375, -1.670623779296875, -1.6153106689453125, -1.55999755859375, -1.5046844482421875, -1.449371337890625, -1.3940582275390625, -1.3387451171875, -1.2834320068359375, -1.228118896484375, -1.1728057861328125, -1.11749267578125, -1.0621795654296875, -1.006866455078125, -0.9515533447265625, -0.896240234375, -0.8409271240234375, -0.785614013671875, -0.7303009033203125, -0.67498779296875, -0.6196746826171875, -0.564361572265625, -0.5090484619140625, -0.4537353515625, -0.3984222412109375, -0.343109130859375, -0.2877960205078125, -0.23248291015625, -0.1771697998046875, -0.121856689453125, -0.0665435791015625, -0.01123046875, 0.0440826416015625, 0.099395751953125, 0.1547088623046875, 0.21002197265625, 0.2653350830078125, 0.320648193359375, 0.3759613037109375, 0.4312744140625, 0.4865875244140625, 0.541900634765625, 0.5972137451171875, 0.65252685546875, 0.7078399658203125, 0.763153076171875, 0.8184661865234375, 0.873779296875, 0.9290924072265625, 0.984405517578125, 1.0397186279296875, 1.09503173828125, 1.1503448486328125, 1.205657958984375, 1.2609710693359375, 1.3162841796875, 1.3715972900390625, 1.426910400390625, 1.4822235107421875, 1.53753662109375, 1.5928497314453125, 1.648162841796875, 1.7034759521484375, 1.7587890625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 13.0, 11.0, 13.0, 9.0, 19.0, 13.0, 25.0, 22.0, 32.0, 30.0, 30.0, 37.0, 30.0, 33.0, 45.0, 54.0, 43.0, 51.0, 43.0, 44.0, 41.0, 41.0, 51.0, 33.0, 28.0, 29.0, 30.0, 22.0, 25.0, 18.0, 13.0, 8.0, 14.0, 6.0, 10.0, 3.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9931640625, -1.9395599365234375, -1.885955810546875, -1.8323516845703125, -1.77874755859375, -1.7251434326171875, -1.671539306640625, -1.6179351806640625, -1.5643310546875, -1.5107269287109375, -1.457122802734375, -1.4035186767578125, -1.34991455078125, -1.2963104248046875, -1.242706298828125, -1.1891021728515625, -1.135498046875, -1.0818939208984375, -1.028289794921875, -0.9746856689453125, -0.92108154296875, -0.8674774169921875, -0.813873291015625, -0.7602691650390625, -0.7066650390625, -0.6530609130859375, -0.599456787109375, -0.5458526611328125, -0.49224853515625, -0.4386444091796875, -0.385040283203125, -0.3314361572265625, -0.27783203125, -0.2242279052734375, -0.170623779296875, -0.1170196533203125, -0.06341552734375, -0.0098114013671875, 0.043792724609375, 0.0973968505859375, 0.1510009765625, 0.2046051025390625, 0.258209228515625, 0.3118133544921875, 0.36541748046875, 0.4190216064453125, 0.472625732421875, 0.5262298583984375, 0.579833984375, 0.6334381103515625, 0.687042236328125, 0.7406463623046875, 0.79425048828125, 0.8478546142578125, 0.901458740234375, 0.9550628662109375, 1.0086669921875, 1.0622711181640625, 1.115875244140625, 1.1694793701171875, 1.22308349609375, 1.2766876220703125, 1.330291748046875, 1.3838958740234375, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 14.0, 18.0, 31.0, 43.0, 97.0, 110.0, 204.0, 326.0, 611.0, 993.0, 1628.0, 2723.0, 4560.0, 8034.0, 13451.0, 22727.0, 37434.0, 61894.0, 99186.0, 154213.0, 229733.0, 323447.0, 422384.0, 499957.0, 524608.0, 487044.0, 404648.0, 305777.0, 213974.0, 142143.0, 90702.0, 56274.0, 34481.0, 20740.0, 12222.0, 7384.0, 4226.0, 2523.0, 1455.0, 885.0, 548.0, 318.0, 183.0, 132.0, 69.0, 42.0, 35.0, 20.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6689453125, -1.6140594482421875, -1.559173583984375, -1.5042877197265625, -1.44940185546875, -1.3945159912109375, -1.339630126953125, -1.2847442626953125, -1.2298583984375, -1.1749725341796875, -1.120086669921875, -1.0652008056640625, -1.01031494140625, -0.9554290771484375, -0.900543212890625, -0.8456573486328125, -0.790771484375, -0.7358856201171875, -0.680999755859375, -0.6261138916015625, -0.57122802734375, -0.5163421630859375, -0.461456298828125, -0.4065704345703125, -0.3516845703125, -0.2967987060546875, -0.241912841796875, -0.1870269775390625, -0.13214111328125, -0.0772552490234375, -0.022369384765625, 0.0325164794921875, 0.08740234375, 0.1422882080078125, 0.197174072265625, 0.2520599365234375, 0.30694580078125, 0.3618316650390625, 0.416717529296875, 0.4716033935546875, 0.5264892578125, 0.5813751220703125, 0.636260986328125, 0.6911468505859375, 0.74603271484375, 0.8009185791015625, 0.855804443359375, 0.9106903076171875, 0.965576171875, 1.0204620361328125, 1.075347900390625, 1.1302337646484375, 1.18511962890625, 1.2400054931640625, 1.294891357421875, 1.3497772216796875, 1.4046630859375, 1.4595489501953125, 1.514434814453125, 1.5693206787109375, 1.62420654296875, 1.6790924072265625, 1.733978271484375, 1.7888641357421875, 1.84375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 11.0, 22.0, 21.0, 27.0, 27.0, 31.0, 52.0, 51.0, 75.0, 91.0, 83.0, 112.0, 130.0, 118.0, 152.0, 163.0, 176.0, 203.0, 191.0, 216.0, 231.0, 201.0, 204.0, 192.0, 181.0, 172.0, 140.0, 123.0, 115.0, 103.0, 74.0, 80.0, 57.0, 43.0, 47.0, 35.0, 27.0, 23.0, 13.0, 10.0, 5.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7119140625, -0.6884918212890625, -0.665069580078125, -0.6416473388671875, -0.61822509765625, -0.5948028564453125, -0.571380615234375, -0.5479583740234375, -0.5245361328125, -0.5011138916015625, -0.477691650390625, -0.4542694091796875, -0.43084716796875, -0.4074249267578125, -0.384002685546875, -0.3605804443359375, -0.337158203125, -0.3137359619140625, -0.290313720703125, -0.2668914794921875, -0.24346923828125, -0.2200469970703125, -0.196624755859375, -0.1732025146484375, -0.1497802734375, -0.1263580322265625, -0.102935791015625, -0.0795135498046875, -0.05609130859375, -0.0326690673828125, -0.009246826171875, 0.0141754150390625, 0.03759765625, 0.0610198974609375, 0.084442138671875, 0.1078643798828125, 0.13128662109375, 0.1547088623046875, 0.178131103515625, 0.2015533447265625, 0.2249755859375, 0.2483978271484375, 0.271820068359375, 0.2952423095703125, 0.31866455078125, 0.3420867919921875, 0.365509033203125, 0.3889312744140625, 0.412353515625, 0.4357757568359375, 0.459197998046875, 0.4826202392578125, 0.50604248046875, 0.5294647216796875, 0.552886962890625, 0.5763092041015625, 0.5997314453125, 0.6231536865234375, 0.646575927734375, 0.6699981689453125, 0.69342041015625, 0.7168426513671875, 0.740264892578125, 0.7636871337890625, 0.787109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 8.0, 6.0, 10.0, 9.0, 17.0, 16.0, 27.0, 31.0, 34.0, 30.0, 59.0, 60.0, 63.0, 60.0, 69.0, 70.0, 62.0, 38.0, 42.0, 43.0, 56.0, 33.0, 33.0, 22.0, 31.0, 24.0, 20.0, 7.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.988922595977783, -2.9013919830322266, -2.813861131668091, -2.726330518722534, -2.6387999057769775, -2.551269054412842, -2.463738441467285, -2.3762078285217285, -2.288677215576172, -2.2011466026306152, -2.1136157512664795, -2.026085138320923, -1.9385545253753662, -1.85102379322052, -1.7634930610656738, -1.6759624481201172, -1.5884315967559814, -1.5009008646011353, -1.4133702516555786, -1.3258395195007324, -1.2383089065551758, -1.1507781744003296, -1.0632474422454834, -0.975716769695282, -0.8881860971450806, -0.8006554245948792, -0.7131247520446777, -0.6255940198898315, -0.5380633473396301, -0.4505326747894287, -0.3630019426345825, -0.2754712700843811, -0.1879405975341797, -0.10040991008281708, -0.012879222631454468, 0.07465147972106934, 0.16218215227127075, 0.24971282482147217, 0.33724355697631836, 0.4247742295265198, 0.5123049020767212, 0.5998355746269226, 0.687366247177124, 0.7748969793319702, 0.8624276518821716, 0.949958324432373, 1.0374890565872192, 1.1250197887420654, 1.212550401687622, 1.3000811338424683, 1.387611746788025, 1.475142478942871, 1.5626730918884277, 1.650203824043274, 1.7377345561981201, 1.8252651691436768, 1.912795901298523, 2.000326633453369, 2.087857246398926, 2.1753878593444824, 2.262918710708618, 2.350449323654175, 2.4379801750183105, 2.525510787963867, 2.613041400909424]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 8.0, 6.0, 10.0, 11.0, 14.0, 15.0, 16.0, 15.0, 18.0, 28.0, 24.0, 21.0, 29.0, 31.0, 33.0, 34.0, 39.0, 34.0, 40.0, 30.0, 46.0, 30.0, 38.0, 35.0, 37.0, 26.0, 30.0, 30.0, 21.0, 24.0, 31.0, 21.0, 16.0, 21.0, 18.0, 14.0, 15.0, 13.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.6044965982437134, -1.5532957315444946, -1.5020948648452759, -1.4508939981460571, -1.3996931314468384, -1.3484922647476196, -1.2972913980484009, -1.2460905313491821, -1.1948896646499634, -1.1436887979507446, -1.0924879312515259, -1.0412870645523071, -0.9900861978530884, -0.9388853311538696, -0.8876844644546509, -0.8364835977554321, -0.7852827310562134, -0.7340818643569946, -0.6828809976577759, -0.6316801309585571, -0.5804792642593384, -0.5292783975601196, -0.4780775308609009, -0.42687666416168213, -0.3756757974624634, -0.32447493076324463, -0.2732740640640259, -0.22207319736480713, -0.17087233066558838, -0.11967146396636963, -0.06847059726715088, -0.01726973056793213, 0.03393101692199707, 0.08513188362121582, 0.13633275032043457, 0.18753361701965332, 0.23873448371887207, 0.2899353504180908, 0.34113621711730957, 0.3923370838165283, 0.44353795051574707, 0.4947388172149658, 0.5459396839141846, 0.5971405506134033, 0.6483414173126221, 0.6995422840118408, 0.7507431507110596, 0.8019440174102783, 0.8531448841094971, 0.9043457508087158, 0.9555466175079346, 1.0067474842071533, 1.057948350906372, 1.1091492176055908, 1.1603500843048096, 1.2115509510040283, 1.262751817703247, 1.3139526844024658, 1.3651535511016846, 1.4163544178009033, 1.467555284500122, 1.5187561511993408, 1.5699570178985596, 1.6211578845977783, 1.672358751296997]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 28.0, 18.0, 40.0, 55.0, 76.0, 81.0, 137.0, 178.0, 266.0, 399.0, 557.0, 779.0, 1109.0, 1719.0, 2903.0, 5997.0, 17535.0, 72549.0, 313259.0, 452580.0, 130021.0, 29278.0, 8687.0, 3818.0, 2127.0, 1303.0, 860.0, 690.0, 394.0, 329.0, 229.0, 160.0, 97.0, 80.0, 55.0, 37.0, 33.0, 20.0, 16.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84814453125, -2.7568359375, -2.66552734375, -2.57421875, -2.48291015625, -2.3916015625, -2.30029296875, -2.208984375, -2.11767578125, -2.0263671875, -1.93505859375, -1.84375, -1.75244140625, -1.6611328125, -1.56982421875, -1.478515625, -1.38720703125, -1.2958984375, -1.20458984375, -1.11328125, -1.02197265625, -0.9306640625, -0.83935546875, -0.748046875, -0.65673828125, -0.5654296875, -0.47412109375, -0.3828125, -0.29150390625, -0.2001953125, -0.10888671875, -0.017578125, 0.07373046875, 0.1650390625, 0.25634765625, 0.34765625, 0.43896484375, 0.5302734375, 0.62158203125, 0.712890625, 0.80419921875, 0.8955078125, 0.98681640625, 1.078125, 1.16943359375, 1.2607421875, 1.35205078125, 1.443359375, 1.53466796875, 1.6259765625, 1.71728515625, 1.80859375, 1.89990234375, 1.9912109375, 2.08251953125, 2.173828125, 2.26513671875, 2.3564453125, 2.44775390625, 2.5390625, 2.63037109375, 2.7216796875, 2.81298828125, 2.904296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 8.0, 12.0, 7.0, 12.0, 17.0, 17.0, 17.0, 23.0, 26.0, 22.0, 39.0, 28.0, 34.0, 35.0, 39.0, 33.0, 31.0, 29.0, 38.0, 47.0, 34.0, 46.0, 44.0, 31.0, 28.0, 32.0, 30.0, 31.0, 25.0, 18.0, 19.0, 24.0, 28.0, 19.0, 8.0, 7.0, 11.0, 3.0, 7.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7255859375, -1.6685028076171875, -1.611419677734375, -1.5543365478515625, -1.49725341796875, -1.4401702880859375, -1.383087158203125, -1.3260040283203125, -1.2689208984375, -1.2118377685546875, -1.154754638671875, -1.0976715087890625, -1.04058837890625, -0.9835052490234375, -0.926422119140625, -0.8693389892578125, -0.812255859375, -0.7551727294921875, -0.698089599609375, -0.6410064697265625, -0.58392333984375, -0.5268402099609375, -0.469757080078125, -0.4126739501953125, -0.3555908203125, -0.2985076904296875, -0.241424560546875, -0.1843414306640625, -0.12725830078125, -0.0701751708984375, -0.013092041015625, 0.0439910888671875, 0.10107421875, 0.1581573486328125, 0.215240478515625, 0.2723236083984375, 0.32940673828125, 0.3864898681640625, 0.443572998046875, 0.5006561279296875, 0.5577392578125, 0.6148223876953125, 0.671905517578125, 0.7289886474609375, 0.78607177734375, 0.8431549072265625, 0.900238037109375, 0.9573211669921875, 1.014404296875, 1.0714874267578125, 1.128570556640625, 1.1856536865234375, 1.24273681640625, 1.2998199462890625, 1.356903076171875, 1.4139862060546875, 1.4710693359375, 1.5281524658203125, 1.585235595703125, 1.6423187255859375, 1.69940185546875, 1.7564849853515625, 1.813568115234375, 1.8706512451171875, 1.927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 16.0, 17.0, 22.0, 29.0, 42.0, 51.0, 71.0, 94.0, 128.0, 167.0, 199.0, 293.0, 417.0, 628.0, 1095.0, 1970.0, 4683.0, 12812.0, 41546.0, 155245.0, 454129.0, 270118.0, 70632.0, 20574.0, 6905.0, 2748.0, 1354.0, 739.0, 480.0, 340.0, 235.0, 168.0, 150.0, 129.0, 75.0, 53.0, 50.0, 34.0, 18.0, 20.0, 20.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.1875, -2.113861083984375, -2.04022216796875, -1.966583251953125, -1.8929443359375, -1.819305419921875, -1.74566650390625, -1.672027587890625, -1.598388671875, -1.524749755859375, -1.45111083984375, -1.377471923828125, -1.3038330078125, -1.230194091796875, -1.15655517578125, -1.082916259765625, -1.00927734375, -0.935638427734375, -0.86199951171875, -0.788360595703125, -0.7147216796875, -0.641082763671875, -0.56744384765625, -0.493804931640625, -0.420166015625, -0.346527099609375, -0.27288818359375, -0.199249267578125, -0.1256103515625, -0.051971435546875, 0.02166748046875, 0.095306396484375, 0.1689453125, 0.242584228515625, 0.31622314453125, 0.389862060546875, 0.4635009765625, 0.537139892578125, 0.61077880859375, 0.684417724609375, 0.758056640625, 0.831695556640625, 0.90533447265625, 0.978973388671875, 1.0526123046875, 1.126251220703125, 1.19989013671875, 1.273529052734375, 1.34716796875, 1.420806884765625, 1.49444580078125, 1.568084716796875, 1.6417236328125, 1.715362548828125, 1.78900146484375, 1.862640380859375, 1.936279296875, 2.009918212890625, 2.08355712890625, 2.157196044921875, 2.2308349609375, 2.304473876953125, 2.37811279296875, 2.451751708984375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 7.0, 13.0, 16.0, 8.0, 8.0, 23.0, 11.0, 20.0, 19.0, 30.0, 28.0, 32.0, 26.0, 26.0, 38.0, 27.0, 41.0, 45.0, 42.0, 46.0, 41.0, 42.0, 45.0, 29.0, 36.0, 30.0, 32.0, 23.0, 24.0, 37.0, 21.0, 20.0, 15.0, 15.0, 18.0, 6.0, 14.0, 6.0, 12.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.072052001953125, -1.03472900390625, -0.997406005859375, -0.9600830078125, -0.922760009765625, -0.88543701171875, -0.848114013671875, -0.810791015625, -0.773468017578125, -0.73614501953125, -0.698822021484375, -0.6614990234375, -0.624176025390625, -0.58685302734375, -0.549530029296875, -0.51220703125, -0.474884033203125, -0.43756103515625, -0.400238037109375, -0.3629150390625, -0.325592041015625, -0.28826904296875, -0.250946044921875, -0.213623046875, -0.176300048828125, -0.13897705078125, -0.101654052734375, -0.0643310546875, -0.027008056640625, 0.01031494140625, 0.047637939453125, 0.0849609375, 0.122283935546875, 0.15960693359375, 0.196929931640625, 0.2342529296875, 0.271575927734375, 0.30889892578125, 0.346221923828125, 0.383544921875, 0.420867919921875, 0.45819091796875, 0.495513916015625, 0.5328369140625, 0.570159912109375, 0.60748291015625, 0.644805908203125, 0.68212890625, 0.719451904296875, 0.75677490234375, 0.794097900390625, 0.8314208984375, 0.868743896484375, 0.90606689453125, 0.943389892578125, 0.980712890625, 1.018035888671875, 1.05535888671875, 1.092681884765625, 1.1300048828125, 1.167327880859375, 1.20465087890625, 1.241973876953125, 1.279296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 9.0, 10.0, 12.0, 17.0, 25.0, 30.0, 53.0, 68.0, 118.0, 139.0, 197.0, 278.0, 422.0, 618.0, 959.0, 1456.0, 2382.0, 4098.0, 8088.0, 18773.0, 58960.0, 243558.0, 485528.0, 153105.0, 39866.0, 14057.0, 6401.0, 3440.0, 2025.0, 1266.0, 841.0, 496.0, 375.0, 259.0, 150.0, 113.0, 109.0, 61.0, 42.0, 29.0, 28.0, 26.0, 13.0, 12.0, 12.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.70556640625, -0.68231201171875, -0.6590576171875, -0.63580322265625, -0.612548828125, -0.58929443359375, -0.5660400390625, -0.54278564453125, -0.51953125, -0.49627685546875, -0.4730224609375, -0.44976806640625, -0.426513671875, -0.40325927734375, -0.3800048828125, -0.35675048828125, -0.33349609375, -0.31024169921875, -0.2869873046875, -0.26373291015625, -0.240478515625, -0.21722412109375, -0.1939697265625, -0.17071533203125, -0.1474609375, -0.12420654296875, -0.1009521484375, -0.07769775390625, -0.054443359375, -0.03118896484375, -0.0079345703125, 0.01531982421875, 0.03857421875, 0.06182861328125, 0.0850830078125, 0.10833740234375, 0.131591796875, 0.15484619140625, 0.1781005859375, 0.20135498046875, 0.224609375, 0.24786376953125, 0.2711181640625, 0.29437255859375, 0.317626953125, 0.34088134765625, 0.3641357421875, 0.38739013671875, 0.41064453125, 0.43389892578125, 0.4571533203125, 0.48040771484375, 0.503662109375, 0.52691650390625, 0.5501708984375, 0.57342529296875, 0.5966796875, 0.61993408203125, 0.6431884765625, 0.66644287109375, 0.689697265625, 0.71295166015625, 0.7362060546875, 0.75946044921875, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 34.0, 36.0, 59.0, 111.0, 151.0, 139.0, 136.0, 99.0, 74.0, 33.0, 25.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.861852645874023e-05, -7.612258195877075e-05, -7.362663745880127e-05, -7.113069295883179e-05, -6.86347484588623e-05, -6.613880395889282e-05, -6.364285945892334e-05, -6.114691495895386e-05, -5.8650970458984375e-05, -5.615502595901489e-05, -5.365908145904541e-05, -5.116313695907593e-05, -4.8667192459106445e-05, -4.617124795913696e-05, -4.367530345916748e-05, -4.1179358959198e-05, -3.8683414459228516e-05, -3.618746995925903e-05, -3.369152545928955e-05, -3.119558095932007e-05, -2.8699636459350586e-05, -2.6203691959381104e-05, -2.370774745941162e-05, -2.121180295944214e-05, -1.8715858459472656e-05, -1.6219913959503174e-05, -1.3723969459533691e-05, -1.1228024959564209e-05, -8.732080459594727e-06, -6.236135959625244e-06, -3.7401914596557617e-06, -1.2442469596862793e-06, 1.2516975402832031e-06, 3.7476420402526855e-06, 6.243586540222168e-06, 8.73953104019165e-06, 1.1235475540161133e-05, 1.3731420040130615e-05, 1.6227364540100098e-05, 1.872330904006958e-05, 2.1219253540039062e-05, 2.3715198040008545e-05, 2.6211142539978027e-05, 2.870708703994751e-05, 3.120303153991699e-05, 3.3698976039886475e-05, 3.619492053985596e-05, 3.869086503982544e-05, 4.118680953979492e-05, 4.3682754039764404e-05, 4.617869853973389e-05, 4.867464303970337e-05, 5.117058753967285e-05, 5.3666532039642334e-05, 5.6162476539611816e-05, 5.86584210395813e-05, 6.115436553955078e-05, 6.365031003952026e-05, 6.614625453948975e-05, 6.864219903945923e-05, 7.113814353942871e-05, 7.36340880393982e-05, 7.613003253936768e-05, 7.862597703933716e-05, 8.112192153930664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 3.0, 10.0, 25.0, 30.0, 54.0, 57.0, 88.0, 128.0, 172.0, 250.0, 389.0, 580.0, 783.0, 1313.0, 1985.0, 3159.0, 5028.0, 8559.0, 15204.0, 28684.0, 57454.0, 115493.0, 211057.0, 252402.0, 166083.0, 85360.0, 42431.0, 21734.0, 11677.0, 6845.0, 4109.0, 2504.0, 1643.0, 1078.0, 689.0, 489.0, 309.0, 196.0, 145.0, 126.0, 71.0, 51.0, 30.0, 16.0, 15.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5659637451171875, -0.548431396484375, -0.5308990478515625, -0.51336669921875, -0.4958343505859375, -0.478302001953125, -0.4607696533203125, -0.4432373046875, -0.4257049560546875, -0.408172607421875, -0.3906402587890625, -0.37310791015625, -0.3555755615234375, -0.338043212890625, -0.3205108642578125, -0.302978515625, -0.2854461669921875, -0.267913818359375, -0.2503814697265625, -0.23284912109375, -0.2153167724609375, -0.197784423828125, -0.1802520751953125, -0.1627197265625, -0.1451873779296875, -0.127655029296875, -0.1101226806640625, -0.09259033203125, -0.0750579833984375, -0.057525634765625, -0.0399932861328125, -0.0224609375, -0.0049285888671875, 0.012603759765625, 0.0301361083984375, 0.04766845703125, 0.0652008056640625, 0.082733154296875, 0.1002655029296875, 0.1177978515625, 0.1353302001953125, 0.152862548828125, 0.1703948974609375, 0.18792724609375, 0.2054595947265625, 0.222991943359375, 0.2405242919921875, 0.258056640625, 0.2755889892578125, 0.293121337890625, 0.3106536865234375, 0.32818603515625, 0.3457183837890625, 0.363250732421875, 0.3807830810546875, 0.3983154296875, 0.4158477783203125, 0.433380126953125, 0.4509124755859375, 0.46844482421875, 0.4859771728515625, 0.503509521484375, 0.5210418701171875, 0.53857421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 18.0, 17.0, 33.0, 52.0, 47.0, 93.0, 141.0, 148.0, 135.0, 88.0, 67.0, 48.0, 24.0, 25.0, 13.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.285369873046875, -0.27630615234375, -0.267242431640625, -0.2581787109375, -0.249114990234375, -0.24005126953125, -0.230987548828125, -0.221923828125, -0.212860107421875, -0.20379638671875, -0.194732666015625, -0.1856689453125, -0.176605224609375, -0.16754150390625, -0.158477783203125, -0.1494140625, -0.140350341796875, -0.13128662109375, -0.122222900390625, -0.1131591796875, -0.104095458984375, -0.09503173828125, -0.085968017578125, -0.076904296875, -0.067840576171875, -0.05877685546875, -0.049713134765625, -0.0406494140625, -0.031585693359375, -0.02252197265625, -0.013458251953125, -0.00439453125, 0.004669189453125, 0.01373291015625, 0.022796630859375, 0.0318603515625, 0.040924072265625, 0.04998779296875, 0.059051513671875, 0.068115234375, 0.077178955078125, 0.08624267578125, 0.095306396484375, 0.1043701171875, 0.113433837890625, 0.12249755859375, 0.131561279296875, 0.140625, 0.149688720703125, 0.15875244140625, 0.167816162109375, 0.1768798828125, 0.185943603515625, 0.19500732421875, 0.204071044921875, 0.213134765625, 0.222198486328125, 0.23126220703125, 0.240325927734375, 0.2493896484375, 0.258453369140625, 0.26751708984375, 0.276580810546875, 0.28564453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 14.0, 25.0, 18.0, 26.0, 32.0, 33.0, 50.0, 49.0, 60.0, 69.0, 62.0, 68.0, 49.0, 51.0, 47.0, 47.0, 52.0, 45.0, 43.0, 28.0, 19.0, 29.0, 16.0, 16.0, 9.0, 5.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.003823757171631, -2.9175076484680176, -2.8311917781829834, -2.74487566947937, -2.658559560775757, -2.5722436904907227, -2.4859275817871094, -2.399611473083496, -2.313295364379883, -2.2269792556762695, -2.1406633853912354, -2.054347276687622, -1.9680311679840088, -1.881715178489685, -1.7953991889953613, -1.709083080291748, -1.6227672100067139, -1.5364512205123901, -1.4501351118087769, -1.3638191223144531, -1.2775030136108398, -1.1911870241165161, -1.1048710346221924, -1.018554925918579, -0.9322389364242554, -0.8459228873252869, -0.7596068382263184, -0.6732908487319946, -0.5869747996330261, -0.5006587505340576, -0.4143427610397339, -0.3280267119407654, -0.24171066284179688, -0.15539462864398956, -0.06907859444618225, 0.017237424850463867, 0.10355347394943237, 0.18986952304840088, 0.2761855125427246, 0.3625015616416931, 0.4488176107406616, 0.5351336598396301, 0.6214497089385986, 0.7077656984329224, 0.7940817475318909, 0.8803977966308594, 0.9667137861251831, 1.0530297756195068, 1.1393458843231201, 1.2256618738174438, 1.3119779825210571, 1.3982939720153809, 1.4846100807189941, 1.5709260702133179, 1.6572420597076416, 1.7435581684112549, 1.8298741579055786, 1.9161901473999023, 2.0025062561035156, 2.088822364807129, 2.175138235092163, 2.2614543437957764, 2.3477702140808105, 2.434086322784424, 2.520402431488037]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 8.0, 8.0, 8.0, 15.0, 16.0, 12.0, 13.0, 16.0, 18.0, 19.0, 29.0, 24.0, 26.0, 27.0, 28.0, 37.0, 37.0, 46.0, 30.0, 41.0, 30.0, 37.0, 38.0, 38.0, 41.0, 17.0, 38.0, 24.0, 30.0, 22.0, 23.0, 21.0, 26.0, 16.0, 22.0, 12.0, 15.0, 12.0, 17.0, 4.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5719082355499268, -1.5209792852401733, -1.4700504541397095, -1.419121503829956, -1.3681925535202026, -1.3172636032104492, -1.2663347721099854, -1.215405821800232, -1.1644768714904785, -1.113547921180725, -1.0626190900802612, -1.0116901397705078, -0.9607611894607544, -0.9098322987556458, -0.8589034080505371, -0.8079744577407837, -0.7570456266403198, -0.7061167359352112, -0.6551877856254578, -0.6042588949203491, -0.5533299446105957, -0.5024010539054871, -0.4514721632003784, -0.4005432426929474, -0.34961432218551636, -0.2986854016780853, -0.2477564960718155, -0.19682759046554565, -0.14589866995811462, -0.0949697494506836, -0.04404085874557495, 0.006888061761856079, 0.05781710147857666, 0.1087460145354271, 0.15967492759227753, 0.21060383319854736, 0.2615327537059784, 0.3124616742134094, 0.36339056491851807, 0.4143194854259491, 0.4652484059333801, 0.5161772966384888, 0.5671062469482422, 0.6180351376533508, 0.6689640283584595, 0.7198929786682129, 0.7708218693733215, 0.8217507600784302, 0.8726797103881836, 0.9236086010932922, 0.9745375514030457, 1.0254664421081543, 1.0763953924179077, 1.1273243427276611, 1.178253173828125, 1.2291821241378784, 1.2801110744476318, 1.3310400247573853, 1.3819688558578491, 1.4328978061676025, 1.483826756477356, 1.5347557067871094, 1.5856845378875732, 1.6366134881973267, 1.6875423192977905]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 12.0, 23.0, 21.0, 36.0, 46.0, 68.0, 86.0, 141.0, 189.0, 324.0, 470.0, 663.0, 1151.0, 1766.0, 2768.0, 4536.0, 7436.0, 12099.0, 19240.0, 31222.0, 48183.0, 70618.0, 96769.0, 120000.0, 133898.0, 129632.0, 111419.0, 86059.0, 61073.0, 40393.0, 25955.0, 16270.0, 9791.0, 5963.0, 3684.0, 2295.0, 1468.0, 935.0, 576.0, 415.0, 255.0, 177.0, 120.0, 100.0, 71.0, 41.0, 34.0, 27.0, 12.0, 5.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.0078125, -1.944671630859375, -1.88153076171875, -1.818389892578125, -1.7552490234375, -1.692108154296875, -1.62896728515625, -1.565826416015625, -1.502685546875, -1.439544677734375, -1.37640380859375, -1.313262939453125, -1.2501220703125, -1.186981201171875, -1.12384033203125, -1.060699462890625, -0.99755859375, -0.934417724609375, -0.87127685546875, -0.808135986328125, -0.7449951171875, -0.681854248046875, -0.61871337890625, -0.555572509765625, -0.492431640625, -0.429290771484375, -0.36614990234375, -0.303009033203125, -0.2398681640625, -0.176727294921875, -0.11358642578125, -0.050445556640625, 0.0126953125, 0.075836181640625, 0.13897705078125, 0.202117919921875, 0.2652587890625, 0.328399658203125, 0.39154052734375, 0.454681396484375, 0.517822265625, 0.580963134765625, 0.64410400390625, 0.707244873046875, 0.7703857421875, 0.833526611328125, 0.89666748046875, 0.959808349609375, 1.02294921875, 1.086090087890625, 1.14923095703125, 1.212371826171875, 1.2755126953125, 1.338653564453125, 1.40179443359375, 1.464935302734375, 1.528076171875, 1.591217041015625, 1.65435791015625, 1.717498779296875, 1.7806396484375, 1.843780517578125, 1.90692138671875, 1.970062255859375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 8.0, 8.0, 13.0, 11.0, 8.0, 12.0, 19.0, 15.0, 19.0, 14.0, 23.0, 32.0, 27.0, 36.0, 29.0, 40.0, 37.0, 30.0, 37.0, 41.0, 35.0, 33.0, 43.0, 32.0, 29.0, 25.0, 39.0, 27.0, 21.0, 25.0, 28.0, 26.0, 23.0, 20.0, 20.0, 14.0, 16.0, 15.0, 12.0, 9.0, 9.0, 7.0, 1.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.716796875, -1.66448974609375, -1.6121826171875, -1.55987548828125, -1.507568359375, -1.45526123046875, -1.4029541015625, -1.35064697265625, -1.29833984375, -1.24603271484375, -1.1937255859375, -1.14141845703125, -1.089111328125, -1.03680419921875, -0.9844970703125, -0.93218994140625, -0.8798828125, -0.82757568359375, -0.7752685546875, -0.72296142578125, -0.670654296875, -0.61834716796875, -0.5660400390625, -0.51373291015625, -0.46142578125, -0.40911865234375, -0.3568115234375, -0.30450439453125, -0.252197265625, -0.19989013671875, -0.1475830078125, -0.09527587890625, -0.04296875, 0.00933837890625, 0.0616455078125, 0.11395263671875, 0.166259765625, 0.21856689453125, 0.2708740234375, 0.32318115234375, 0.37548828125, 0.42779541015625, 0.4801025390625, 0.53240966796875, 0.584716796875, 0.63702392578125, 0.6893310546875, 0.74163818359375, 0.7939453125, 0.84625244140625, 0.8985595703125, 0.95086669921875, 1.003173828125, 1.05548095703125, 1.1077880859375, 1.16009521484375, 1.21240234375, 1.26470947265625, 1.3170166015625, 1.36932373046875, 1.421630859375, 1.47393798828125, 1.5262451171875, 1.57855224609375, 1.630859375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 11.0, 14.0, 17.0, 40.0, 86.0, 105.0, 167.0, 279.0, 422.0, 730.0, 1154.0, 2061.0, 3396.0, 5667.0, 9379.0, 15524.0, 25357.0, 40040.0, 60773.0, 86530.0, 113300.0, 132039.0, 134892.0, 121972.0, 98041.0, 70846.0, 47234.0, 30604.0, 19060.0, 11476.0, 6904.0, 4156.0, 2483.0, 1509.0, 840.0, 532.0, 378.0, 210.0, 125.0, 64.0, 49.0, 37.0, 27.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.818359375, -1.758148193359375, -1.69793701171875, -1.637725830078125, -1.5775146484375, -1.517303466796875, -1.45709228515625, -1.396881103515625, -1.336669921875, -1.276458740234375, -1.21624755859375, -1.156036376953125, -1.0958251953125, -1.035614013671875, -0.97540283203125, -0.915191650390625, -0.85498046875, -0.794769287109375, -0.73455810546875, -0.674346923828125, -0.6141357421875, -0.553924560546875, -0.49371337890625, -0.433502197265625, -0.373291015625, -0.313079833984375, -0.25286865234375, -0.192657470703125, -0.1324462890625, -0.072235107421875, -0.01202392578125, 0.048187255859375, 0.1083984375, 0.168609619140625, 0.22882080078125, 0.289031982421875, 0.3492431640625, 0.409454345703125, 0.46966552734375, 0.529876708984375, 0.590087890625, 0.650299072265625, 0.71051025390625, 0.770721435546875, 0.8309326171875, 0.891143798828125, 0.95135498046875, 1.011566162109375, 1.07177734375, 1.131988525390625, 1.19219970703125, 1.252410888671875, 1.3126220703125, 1.372833251953125, 1.43304443359375, 1.493255615234375, 1.553466796875, 1.613677978515625, 1.67388916015625, 1.734100341796875, 1.7943115234375, 1.854522705078125, 1.91473388671875, 1.974945068359375, 2.03515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 4.0, 12.0, 13.0, 11.0, 26.0, 24.0, 23.0, 23.0, 28.0, 30.0, 42.0, 37.0, 32.0, 40.0, 35.0, 30.0, 46.0, 40.0, 45.0, 40.0, 40.0, 35.0, 41.0, 36.0, 28.0, 43.0, 41.0, 24.0, 26.0, 26.0, 7.0, 16.0, 11.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1051483154296875, -1.064788818359375, -1.0244293212890625, -0.98406982421875, -0.9437103271484375, -0.903350830078125, -0.8629913330078125, -0.8226318359375, -0.7822723388671875, -0.741912841796875, -0.7015533447265625, -0.66119384765625, -0.6208343505859375, -0.580474853515625, -0.5401153564453125, -0.499755859375, -0.4593963623046875, -0.419036865234375, -0.3786773681640625, -0.33831787109375, -0.2979583740234375, -0.257598876953125, -0.2172393798828125, -0.1768798828125, -0.1365203857421875, -0.096160888671875, -0.0558013916015625, -0.01544189453125, 0.0249176025390625, 0.065277099609375, 0.1056365966796875, 0.14599609375, 0.1863555908203125, 0.226715087890625, 0.2670745849609375, 0.30743408203125, 0.3477935791015625, 0.388153076171875, 0.4285125732421875, 0.4688720703125, 0.5092315673828125, 0.549591064453125, 0.5899505615234375, 0.63031005859375, 0.6706695556640625, 0.711029052734375, 0.7513885498046875, 0.791748046875, 0.8321075439453125, 0.872467041015625, 0.9128265380859375, 0.95318603515625, 0.9935455322265625, 1.033905029296875, 1.0742645263671875, 1.1146240234375, 1.1549835205078125, 1.195343017578125, 1.2357025146484375, 1.27606201171875, 1.3164215087890625, 1.356781005859375, 1.3971405029296875, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 6.0, 9.0, 7.0, 15.0, 18.0, 27.0, 42.0, 54.0, 91.0, 132.0, 244.0, 378.0, 561.0, 890.0, 1353.0, 2354.0, 4015.0, 7058.0, 13559.0, 27707.0, 62300.0, 142593.0, 264452.0, 261435.0, 140674.0, 60859.0, 27342.0, 13171.0, 7080.0, 3984.0, 2315.0, 1462.0, 827.0, 512.0, 349.0, 231.0, 150.0, 99.0, 49.0, 41.0, 33.0, 24.0, 20.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.766204833984375, -2.67694091796875, -2.587677001953125, -2.4984130859375, -2.409149169921875, -2.31988525390625, -2.230621337890625, -2.141357421875, -2.052093505859375, -1.96282958984375, -1.873565673828125, -1.7843017578125, -1.695037841796875, -1.60577392578125, -1.516510009765625, -1.42724609375, -1.337982177734375, -1.24871826171875, -1.159454345703125, -1.0701904296875, -0.980926513671875, -0.89166259765625, -0.802398681640625, -0.713134765625, -0.623870849609375, -0.53460693359375, -0.445343017578125, -0.3560791015625, -0.266815185546875, -0.17755126953125, -0.088287353515625, 0.0009765625, 0.090240478515625, 0.17950439453125, 0.268768310546875, 0.3580322265625, 0.447296142578125, 0.53656005859375, 0.625823974609375, 0.715087890625, 0.804351806640625, 0.89361572265625, 0.982879638671875, 1.0721435546875, 1.161407470703125, 1.25067138671875, 1.339935302734375, 1.42919921875, 1.518463134765625, 1.60772705078125, 1.696990966796875, 1.7862548828125, 1.875518798828125, 1.96478271484375, 2.054046630859375, 2.143310546875, 2.232574462890625, 2.32183837890625, 2.411102294921875, 2.5003662109375, 2.589630126953125, 2.67889404296875, 2.768157958984375, 2.857421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 1.0, 11.0, 12.0, 14.0, 19.0, 25.0, 27.0, 17.0, 26.0, 35.0, 50.0, 51.0, 47.0, 58.0, 64.0, 65.0, 59.0, 50.0, 43.0, 48.0, 37.0, 33.0, 40.0, 16.0, 22.0, 21.0, 11.0, 17.0, 11.0, 5.0, 4.0, 9.0, 4.0, 4.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.00013802573084831238, -0.00013347715139389038, -0.00012892857193946838, -0.0001243799924850464, -0.00011983141303062439, -0.00011528283357620239, -0.0001107342541217804, -0.0001061856746673584, -0.0001016370952129364, -9.70885157585144e-05, -9.253993630409241e-05, -8.799135684967041e-05, -8.344277739524841e-05, -7.889419794082642e-05, -7.434561848640442e-05, -6.979703903198242e-05, -6.524845957756042e-05, -6.069988012313843e-05, -5.615130066871643e-05, -5.1602721214294434e-05, -4.7054141759872437e-05, -4.250556230545044e-05, -3.795698285102844e-05, -3.3408403396606445e-05, -2.8859823942184448e-05, -2.431124448776245e-05, -1.9762665033340454e-05, -1.5214085578918457e-05, -1.066550612449646e-05, -6.116926670074463e-06, -1.5683472156524658e-06, 2.9802322387695312e-06, 7.528811693191528e-06, 1.2077391147613525e-05, 1.6625970602035522e-05, 2.117455005645752e-05, 2.5723129510879517e-05, 3.0271708965301514e-05, 3.482028841972351e-05, 3.936886787414551e-05, 4.3917447328567505e-05, 4.84660267829895e-05, 5.30146062374115e-05, 5.7563185691833496e-05, 6.211176514625549e-05, 6.666034460067749e-05, 7.120892405509949e-05, 7.575750350952148e-05, 8.030608296394348e-05, 8.485466241836548e-05, 8.940324187278748e-05, 9.395182132720947e-05, 9.850040078163147e-05, 0.00010304898023605347, 0.00010759755969047546, 0.00011214613914489746, 0.00011669471859931946, 0.00012124329805374146, 0.00012579187750816345, 0.00013034045696258545, 0.00013488903641700745, 0.00013943761587142944, 0.00014398619532585144, 0.00014853477478027344]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 16.0, 19.0, 27.0, 38.0, 75.0, 124.0, 186.0, 275.0, 481.0, 726.0, 1162.0, 1838.0, 3203.0, 5907.0, 11868.0, 25592.0, 61875.0, 151549.0, 284343.0, 266415.0, 133290.0, 53471.0, 22510.0, 10459.0, 5378.0, 3100.0, 1772.0, 1105.0, 631.0, 395.0, 250.0, 179.0, 100.0, 65.0, 41.0, 24.0, 22.0, 18.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.83880615234375, -2.7498779296875, -2.66094970703125, -2.572021484375, -2.48309326171875, -2.3941650390625, -2.30523681640625, -2.21630859375, -2.12738037109375, -2.0384521484375, -1.94952392578125, -1.860595703125, -1.77166748046875, -1.6827392578125, -1.59381103515625, -1.5048828125, -1.41595458984375, -1.3270263671875, -1.23809814453125, -1.149169921875, -1.06024169921875, -0.9713134765625, -0.88238525390625, -0.79345703125, -0.70452880859375, -0.6156005859375, -0.52667236328125, -0.437744140625, -0.34881591796875, -0.2598876953125, -0.17095947265625, -0.08203125, 0.00689697265625, 0.0958251953125, 0.18475341796875, 0.273681640625, 0.36260986328125, 0.4515380859375, 0.54046630859375, 0.62939453125, 0.71832275390625, 0.8072509765625, 0.89617919921875, 0.985107421875, 1.07403564453125, 1.1629638671875, 1.25189208984375, 1.3408203125, 1.42974853515625, 1.5186767578125, 1.60760498046875, 1.696533203125, 1.78546142578125, 1.8743896484375, 1.96331787109375, 2.05224609375, 2.14117431640625, 2.2301025390625, 2.31903076171875, 2.407958984375, 2.49688720703125, 2.5858154296875, 2.67474365234375, 2.763671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 5.0, 14.0, 15.0, 19.0, 22.0, 31.0, 36.0, 44.0, 55.0, 85.0, 65.0, 89.0, 70.0, 73.0, 63.0, 56.0, 43.0, 39.0, 29.0, 25.0, 31.0, 14.0, 12.0, 12.0, 7.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7098464965820312, -0.6843414306640625, -0.6588363647460938, -0.633331298828125, -0.6078262329101562, -0.5823211669921875, -0.5568161010742188, -0.53131103515625, -0.5058059692382812, -0.4803009033203125, -0.45479583740234375, -0.429290771484375, -0.40378570556640625, -0.3782806396484375, -0.35277557373046875, -0.3272705078125, -0.30176544189453125, -0.2762603759765625, -0.25075531005859375, -0.225250244140625, -0.19974517822265625, -0.1742401123046875, -0.14873504638671875, -0.12322998046875, -0.09772491455078125, -0.0722198486328125, -0.04671478271484375, -0.021209716796875, 0.00429534912109375, 0.0298004150390625, 0.05530548095703125, 0.080810546875, 0.10631561279296875, 0.1318206787109375, 0.15732574462890625, 0.182830810546875, 0.20833587646484375, 0.2338409423828125, 0.25934600830078125, 0.28485107421875, 0.31035614013671875, 0.3358612060546875, 0.36136627197265625, 0.386871337890625, 0.41237640380859375, 0.4378814697265625, 0.46338653564453125, 0.4888916015625, 0.5143966674804688, 0.5399017333984375, 0.5654067993164062, 0.590911865234375, 0.6164169311523438, 0.6419219970703125, 0.6674270629882812, 0.69293212890625, 0.7184371948242188, 0.7439422607421875, 0.7694473266601562, 0.794952392578125, 0.8204574584960938, 0.8459625244140625, 0.8714675903320312, 0.89697265625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 22.0, 18.0, 16.0, 25.0, 39.0, 45.0, 47.0, 59.0, 62.0, 77.0, 66.0, 69.0, 51.0, 45.0, 46.0, 53.0, 54.0, 35.0, 26.0, 22.0, 29.0, 19.0, 10.0, 15.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564897298812866, -2.4802913665771484, -2.3956854343414307, -2.311079502105713, -2.226473331451416, -2.1418673992156982, -2.0572614669799805, -1.9726555347442627, -1.8880494832992554, -1.8034435510635376, -1.7188374996185303, -1.6342315673828125, -1.5496256351470947, -1.4650195837020874, -1.3804136514663696, -1.2958076000213623, -1.2112016677856445, -1.1265957355499268, -1.0419896841049194, -0.9573837518692017, -0.8727777600288391, -0.7881717681884766, -0.7035658359527588, -0.6189598441123962, -0.5343538522720337, -0.44974786043167114, -0.365141898393631, -0.2805359363555908, -0.19592994451522827, -0.11132395267486572, -0.02671802043914795, 0.0578879714012146, 0.14249420166015625, 0.2271001785993576, 0.31170615553855896, 0.3963121175765991, 0.48091810941696167, 0.5655241012573242, 0.650130033493042, 0.7347360253334045, 0.8193420171737671, 0.9039480090141296, 0.9885540008544922, 1.07315993309021, 1.1577658653259277, 1.242371916770935, 1.3269778490066528, 1.4115839004516602, 1.496189832687378, 1.5807957649230957, 1.665401816368103, 1.7500077486038208, 1.8346138000488281, 1.919219732284546, 2.0038256645202637, 2.0884315967559814, 2.173037528991699, 2.257643461227417, 2.3422493934631348, 2.4268555641174316, 2.5114614963531494, 2.596067428588867, 2.680673360824585, 2.7652792930603027, 2.8498854637145996]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 1.0, 7.0, 6.0, 10.0, 10.0, 10.0, 6.0, 13.0, 19.0, 15.0, 18.0, 22.0, 20.0, 23.0, 26.0, 32.0, 37.0, 30.0, 22.0, 34.0, 31.0, 38.0, 39.0, 34.0, 33.0, 35.0, 27.0, 35.0, 37.0, 38.0, 25.0, 19.0, 20.0, 26.0, 24.0, 14.0, 20.0, 24.0, 10.0, 15.0, 10.0, 17.0, 11.0, 10.0, 5.0, 8.0, 10.0, 9.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.6389598846435547, -1.5876710414886475, -1.5363821983337402, -1.485093355178833, -1.4338045120239258, -1.3825156688690186, -1.3312268257141113, -1.279937982559204, -1.2286491394042969, -1.1773602962493896, -1.1260714530944824, -1.0747826099395752, -1.023493766784668, -0.9722049236297607, -0.9209160804748535, -0.8696272373199463, -0.8183384537696838, -0.7670496106147766, -0.7157607674598694, -0.6644719243049622, -0.6131830811500549, -0.5618942975997925, -0.5106054544448853, -0.45931658148765564, -0.4080277383327484, -0.3567388951778412, -0.30545005202293396, -0.2541612386703491, -0.2028723806142807, -0.15158355236053467, -0.10029470920562744, -0.049005866050720215, 0.0022829771041870117, 0.05357181653380394, 0.10486065596342087, 0.1561494916677475, 0.20743833482265472, 0.25872716307640076, 0.310016006231308, 0.3613048493862152, 0.41259369254112244, 0.46388253569602966, 0.5151713490486145, 0.5664601922035217, 0.617749035358429, 0.6690378785133362, 0.7203267216682434, 0.7716155648231506, 0.8229044079780579, 0.8741932511329651, 0.9254820942878723, 0.9767709374427795, 1.028059720993042, 1.0793485641479492, 1.1306374073028564, 1.1819262504577637, 1.233215093612671, 1.2845039367675781, 1.3357927799224854, 1.3870816230773926, 1.4383704662322998, 1.489659309387207, 1.5409481525421143, 1.5922369956970215, 1.6435258388519287]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 12.0, 11.0, 28.0, 59.0, 95.0, 174.0, 299.0, 496.0, 850.0, 1501.0, 2740.0, 4621.0, 8159.0, 14452.0, 25672.0, 45516.0, 82119.0, 141962.0, 240000.0, 379876.0, 542413.0, 655204.0, 643477.0, 518130.0, 357821.0, 222909.0, 131684.0, 75607.0, 42503.0, 23913.0, 13638.0, 7811.0, 4365.0, 2568.0, 1522.0, 867.0, 481.0, 291.0, 188.0, 86.0, 65.0, 44.0, 24.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7557373046875, -1.698974609375, -1.6422119140625, -1.58544921875, -1.5286865234375, -1.471923828125, -1.4151611328125, -1.3583984375, -1.3016357421875, -1.244873046875, -1.1881103515625, -1.13134765625, -1.0745849609375, -1.017822265625, -0.9610595703125, -0.904296875, -0.8475341796875, -0.790771484375, -0.7340087890625, -0.67724609375, -0.6204833984375, -0.563720703125, -0.5069580078125, -0.4501953125, -0.3934326171875, -0.336669921875, -0.2799072265625, -0.22314453125, -0.1663818359375, -0.109619140625, -0.0528564453125, 0.00390625, 0.0606689453125, 0.117431640625, 0.1741943359375, 0.23095703125, 0.2877197265625, 0.344482421875, 0.4012451171875, 0.4580078125, 0.5147705078125, 0.571533203125, 0.6282958984375, 0.68505859375, 0.7418212890625, 0.798583984375, 0.8553466796875, 0.912109375, 0.9688720703125, 1.025634765625, 1.0823974609375, 1.13916015625, 1.1959228515625, 1.252685546875, 1.3094482421875, 1.3662109375, 1.4229736328125, 1.479736328125, 1.5364990234375, 1.59326171875, 1.6500244140625, 1.706787109375, 1.7635498046875, 1.8203125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 3.0, 9.0, 11.0, 14.0, 12.0, 24.0, 19.0, 21.0, 25.0, 24.0, 28.0, 25.0, 29.0, 32.0, 44.0, 45.0, 28.0, 36.0, 37.0, 24.0, 35.0, 37.0, 32.0, 39.0, 40.0, 31.0, 38.0, 17.0, 14.0, 21.0, 32.0, 23.0, 19.0, 15.0, 21.0, 10.0, 15.0, 11.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.092803955078125, -1.05474853515625, -1.016693115234375, -0.9786376953125, -0.940582275390625, -0.90252685546875, -0.864471435546875, -0.826416015625, -0.788360595703125, -0.75030517578125, -0.712249755859375, -0.6741943359375, -0.636138916015625, -0.59808349609375, -0.560028076171875, -0.52197265625, -0.483917236328125, -0.44586181640625, -0.407806396484375, -0.3697509765625, -0.331695556640625, -0.29364013671875, -0.255584716796875, -0.217529296875, -0.179473876953125, -0.14141845703125, -0.103363037109375, -0.0653076171875, -0.027252197265625, 0.01080322265625, 0.048858642578125, 0.0869140625, 0.124969482421875, 0.16302490234375, 0.201080322265625, 0.2391357421875, 0.277191162109375, 0.31524658203125, 0.353302001953125, 0.391357421875, 0.429412841796875, 0.46746826171875, 0.505523681640625, 0.5435791015625, 0.581634521484375, 0.61968994140625, 0.657745361328125, 0.69580078125, 0.733856201171875, 0.77191162109375, 0.809967041015625, 0.8480224609375, 0.886077880859375, 0.92413330078125, 0.962188720703125, 1.000244140625, 1.038299560546875, 1.07635498046875, 1.114410400390625, 1.1524658203125, 1.190521240234375, 1.22857666015625, 1.266632080078125, 1.3046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 18.0, 20.0, 35.0, 40.0, 83.0, 141.0, 224.0, 346.0, 567.0, 926.0, 1627.0, 2772.0, 4575.0, 7682.0, 13066.0, 21424.0, 35434.0, 57835.0, 90700.0, 141182.0, 207486.0, 296111.0, 388439.0, 470461.0, 511125.0, 492721.0, 423943.0, 332004.0, 241209.0, 164834.0, 108412.0, 69008.0, 43399.0, 26501.0, 16049.0, 9531.0, 5809.0, 3382.0, 2065.0, 1233.0, 721.0, 473.0, 262.0, 159.0, 97.0, 57.0, 37.0, 31.0, 9.0, 9.0, 2.0, 6.0, 2.0, 0.0, 4.0], "bins": [-1.5302734375, -1.48486328125, -1.439453125, -1.39404296875, -1.3486328125, -1.30322265625, -1.2578125, -1.21240234375, -1.1669921875, -1.12158203125, -1.076171875, -1.03076171875, -0.9853515625, -0.93994140625, -0.89453125, -0.84912109375, -0.8037109375, -0.75830078125, -0.712890625, -0.66748046875, -0.6220703125, -0.57666015625, -0.53125, -0.48583984375, -0.4404296875, -0.39501953125, -0.349609375, -0.30419921875, -0.2587890625, -0.21337890625, -0.16796875, -0.12255859375, -0.0771484375, -0.03173828125, 0.013671875, 0.05908203125, 0.1044921875, 0.14990234375, 0.1953125, 0.24072265625, 0.2861328125, 0.33154296875, 0.376953125, 0.42236328125, 0.4677734375, 0.51318359375, 0.55859375, 0.60400390625, 0.6494140625, 0.69482421875, 0.740234375, 0.78564453125, 0.8310546875, 0.87646484375, 0.921875, 0.96728515625, 1.0126953125, 1.05810546875, 1.103515625, 1.14892578125, 1.1943359375, 1.23974609375, 1.28515625, 1.33056640625, 1.3759765625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 2.0, 10.0, 7.0, 7.0, 7.0, 14.0, 18.0, 15.0, 39.0, 41.0, 48.0, 42.0, 50.0, 51.0, 67.0, 84.0, 123.0, 133.0, 134.0, 176.0, 139.0, 160.0, 165.0, 195.0, 203.0, 204.0, 192.0, 195.0, 172.0, 183.0, 155.0, 145.0, 140.0, 136.0, 122.0, 70.0, 75.0, 77.0, 64.0, 46.0, 31.0, 32.0, 27.0, 16.0, 12.0, 12.0, 13.0, 14.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.55126953125, -0.5328826904296875, -0.514495849609375, -0.4961090087890625, -0.47772216796875, -0.4593353271484375, -0.440948486328125, -0.4225616455078125, -0.4041748046875, -0.3857879638671875, -0.367401123046875, -0.3490142822265625, -0.33062744140625, -0.3122406005859375, -0.293853759765625, -0.2754669189453125, -0.257080078125, -0.2386932373046875, -0.220306396484375, -0.2019195556640625, -0.18353271484375, -0.1651458740234375, -0.146759033203125, -0.1283721923828125, -0.1099853515625, -0.0915985107421875, -0.073211669921875, -0.0548248291015625, -0.03643798828125, -0.0180511474609375, 0.000335693359375, 0.0187225341796875, 0.037109375, 0.0554962158203125, 0.073883056640625, 0.0922698974609375, 0.11065673828125, 0.1290435791015625, 0.147430419921875, 0.1658172607421875, 0.1842041015625, 0.2025909423828125, 0.220977783203125, 0.2393646240234375, 0.25775146484375, 0.2761383056640625, 0.294525146484375, 0.3129119873046875, 0.331298828125, 0.3496856689453125, 0.368072509765625, 0.3864593505859375, 0.40484619140625, 0.4232330322265625, 0.441619873046875, 0.4600067138671875, 0.4783935546875, 0.4967803955078125, 0.515167236328125, 0.5335540771484375, 0.55194091796875, 0.5703277587890625, 0.588714599609375, 0.6071014404296875, 0.62548828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 13.0, 11.0, 24.0, 19.0, 20.0, 25.0, 26.0, 34.0, 47.0, 49.0, 48.0, 57.0, 55.0, 50.0, 56.0, 61.0, 58.0, 40.0, 39.0, 50.0, 35.0, 35.0, 24.0, 21.0, 16.0, 15.0, 13.0, 9.0, 5.0, 15.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2901968955993652, -2.22659969329834, -2.1630024909973145, -2.099405288696289, -2.0358080863952637, -1.9722108840942383, -1.9086135625839233, -1.845016360282898, -1.7814191579818726, -1.7178219556808472, -1.6542247533798218, -1.5906275510787964, -1.5270302295684814, -1.463433027267456, -1.3998358249664307, -1.3362386226654053, -1.2726414203643799, -1.2090442180633545, -1.145447015762329, -1.0818498134613037, -1.0182526111602783, -0.9546553492546082, -0.891058087348938, -0.8274608850479126, -0.7638636827468872, -0.7002664804458618, -0.6366692781448364, -0.5730720162391663, -0.5094748139381409, -0.4458776116371155, -0.3822803795337677, -0.3186831474304199, -0.25508618354797363, -0.19148896634578705, -0.12789174914360046, -0.06429453194141388, -0.0006973147392272949, 0.0628998875617981, 0.12649711966514587, 0.19009435176849365, 0.25369155406951904, 0.31728875637054443, 0.3808859884738922, 0.44448322057724, 0.5080804228782654, 0.5716776251792908, 0.6352748870849609, 0.6988720893859863, 0.7624692916870117, 0.8260664939880371, 0.8896636962890625, 0.9532609581947327, 1.0168581008911133, 1.0804553031921387, 1.1440526247024536, 1.207649827003479, 1.2712470293045044, 1.3348442316055298, 1.3984414339065552, 1.4620386362075806, 1.5256359577178955, 1.589233160018921, 1.6528303623199463, 1.7164275646209717, 1.780024766921997]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 8.0, 3.0, 7.0, 7.0, 8.0, 17.0, 18.0, 26.0, 24.0, 28.0, 19.0, 25.0, 34.0, 25.0, 25.0, 36.0, 37.0, 44.0, 40.0, 27.0, 42.0, 38.0, 41.0, 35.0, 38.0, 41.0, 32.0, 31.0, 25.0, 19.0, 19.0, 18.0, 25.0, 17.0, 13.0, 23.0, 14.0, 16.0, 6.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4026124477386475, -1.3561328649520874, -1.3096531629562378, -1.2631735801696777, -1.2166939973831177, -1.1702144145965576, -1.123734712600708, -1.077255129814148, -1.030775547027588, -0.9842959046363831, -0.937816321849823, -0.8913366794586182, -0.8448570966720581, -0.7983774542808533, -0.7518978118896484, -0.7054182291030884, -0.6589385867118835, -0.6124589443206787, -0.5659793615341187, -0.5194997191429138, -0.47302013635635376, -0.4265404939651489, -0.3800608813762665, -0.33358126878738403, -0.2871016561985016, -0.24062204360961914, -0.1941424310207367, -0.14766280353069305, -0.10118319094181061, -0.05470357835292816, -0.008223950862884521, 0.038255661725997925, 0.08473527431488037, 0.13121488690376282, 0.17769449949264526, 0.2241741269826889, 0.27065372467041016, 0.317133367061615, 0.36361297965049744, 0.4100925922393799, 0.45657220482826233, 0.5030518174171448, 0.5495314598083496, 0.5960110425949097, 0.6424906849861145, 0.6889702677726746, 0.7354499101638794, 0.7819294929504395, 0.8284091353416443, 0.8748887777328491, 0.9213683605194092, 0.967848002910614, 1.0143276453018188, 1.060807228088379, 1.107286810874939, 1.153766393661499, 1.2002460956573486, 1.2467256784439087, 1.2932053804397583, 1.3396849632263184, 1.3861645460128784, 1.4326441287994385, 1.479123830795288, 1.5256034135818481, 1.5720829963684082]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 10.0, 9.0, 11.0, 13.0, 28.0, 29.0, 61.0, 82.0, 121.0, 179.0, 248.0, 435.0, 640.0, 1021.0, 1576.0, 2510.0, 3968.0, 6737.0, 11412.0, 19522.0, 34020.0, 60081.0, 101959.0, 159776.0, 199411.0, 171531.0, 112984.0, 67200.0, 38475.0, 22061.0, 12841.0, 7491.0, 4485.0, 2777.0, 1767.0, 1038.0, 672.0, 470.0, 295.0, 191.0, 129.0, 93.0, 69.0, 46.0, 26.0, 18.0, 15.0, 4.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.78271484375, -0.7579498291015625, -0.733184814453125, -0.7084197998046875, -0.68365478515625, -0.6588897705078125, -0.634124755859375, -0.6093597412109375, -0.5845947265625, -0.5598297119140625, -0.535064697265625, -0.5102996826171875, -0.48553466796875, -0.4607696533203125, -0.436004638671875, -0.4112396240234375, -0.386474609375, -0.3617095947265625, -0.336944580078125, -0.3121795654296875, -0.28741455078125, -0.2626495361328125, -0.237884521484375, -0.2131195068359375, -0.1883544921875, -0.1635894775390625, -0.138824462890625, -0.1140594482421875, -0.08929443359375, -0.0645294189453125, -0.039764404296875, -0.0149993896484375, 0.009765625, 0.0345306396484375, 0.059295654296875, 0.0840606689453125, 0.10882568359375, 0.1335906982421875, 0.158355712890625, 0.1831207275390625, 0.2078857421875, 0.2326507568359375, 0.257415771484375, 0.2821807861328125, 0.30694580078125, 0.3317108154296875, 0.356475830078125, 0.3812408447265625, 0.406005859375, 0.4307708740234375, 0.455535888671875, 0.4803009033203125, 0.50506591796875, 0.5298309326171875, 0.554595947265625, 0.5793609619140625, 0.6041259765625, 0.6288909912109375, 0.653656005859375, 0.6784210205078125, 0.70318603515625, 0.7279510498046875, 0.752716064453125, 0.7774810791015625, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 6.0, 11.0, 10.0, 19.0, 20.0, 28.0, 24.0, 26.0, 37.0, 29.0, 26.0, 35.0, 36.0, 40.0, 35.0, 35.0, 41.0, 34.0, 40.0, 39.0, 37.0, 38.0, 36.0, 31.0, 40.0, 25.0, 28.0, 28.0, 10.0, 17.0, 20.0, 17.0, 14.0, 14.0, 8.0, 6.0, 6.0, 9.0, 10.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.46624755859375, -1.4149169921875, -1.36358642578125, -1.312255859375, -1.26092529296875, -1.2095947265625, -1.15826416015625, -1.10693359375, -1.05560302734375, -1.0042724609375, -0.95294189453125, -0.901611328125, -0.85028076171875, -0.7989501953125, -0.74761962890625, -0.6962890625, -0.64495849609375, -0.5936279296875, -0.54229736328125, -0.490966796875, -0.43963623046875, -0.3883056640625, -0.33697509765625, -0.28564453125, -0.23431396484375, -0.1829833984375, -0.13165283203125, -0.080322265625, -0.02899169921875, 0.0223388671875, 0.07366943359375, 0.125, 0.17633056640625, 0.2276611328125, 0.27899169921875, 0.330322265625, 0.38165283203125, 0.4329833984375, 0.48431396484375, 0.53564453125, 0.58697509765625, 0.6383056640625, 0.68963623046875, 0.740966796875, 0.79229736328125, 0.8436279296875, 0.89495849609375, 0.9462890625, 0.99761962890625, 1.0489501953125, 1.10028076171875, 1.151611328125, 1.20294189453125, 1.2542724609375, 1.30560302734375, 1.35693359375, 1.40826416015625, 1.4595947265625, 1.51092529296875, 1.562255859375, 1.61358642578125, 1.6649169921875, 1.71624755859375, 1.767578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 6.0, 7.0, 11.0, 39.0, 44.0, 68.0, 113.0, 178.0, 248.0, 425.0, 684.0, 1098.0, 1796.0, 3009.0, 5298.0, 9575.0, 17182.0, 32353.0, 61138.0, 115634.0, 201279.0, 240623.0, 164357.0, 89781.0, 46939.0, 25070.0, 13530.0, 7438.0, 4281.0, 2435.0, 1492.0, 917.0, 536.0, 357.0, 204.0, 153.0, 88.0, 70.0, 41.0, 27.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9951171875, -0.9669265747070312, -0.9387359619140625, -0.9105453491210938, -0.882354736328125, -0.8541641235351562, -0.8259735107421875, -0.7977828979492188, -0.76959228515625, -0.7414016723632812, -0.7132110595703125, -0.6850204467773438, -0.656829833984375, -0.6286392211914062, -0.6004486083984375, -0.5722579956054688, -0.5440673828125, -0.5158767700195312, -0.4876861572265625, -0.45949554443359375, -0.431304931640625, -0.40311431884765625, -0.3749237060546875, -0.34673309326171875, -0.31854248046875, -0.29035186767578125, -0.2621612548828125, -0.23397064208984375, -0.205780029296875, -0.17758941650390625, -0.1493988037109375, -0.12120819091796875, -0.093017578125, -0.06482696533203125, -0.0366363525390625, -0.00844573974609375, 0.019744873046875, 0.04793548583984375, 0.0761260986328125, 0.10431671142578125, 0.13250732421875, 0.16069793701171875, 0.1888885498046875, 0.21707916259765625, 0.245269775390625, 0.27346038818359375, 0.3016510009765625, 0.32984161376953125, 0.3580322265625, 0.38622283935546875, 0.4144134521484375, 0.44260406494140625, 0.470794677734375, 0.49898529052734375, 0.5271759033203125, 0.5553665161132812, 0.58355712890625, 0.6117477416992188, 0.6399383544921875, 0.6681289672851562, 0.696319580078125, 0.7245101928710938, 0.7527008056640625, 0.7808914184570312, 0.80908203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 5.0, 15.0, 11.0, 13.0, 15.0, 14.0, 19.0, 22.0, 37.0, 21.0, 20.0, 32.0, 26.0, 33.0, 34.0, 46.0, 49.0, 53.0, 36.0, 43.0, 47.0, 43.0, 33.0, 41.0, 36.0, 26.0, 29.0, 32.0, 25.0, 22.0, 15.0, 23.0, 14.0, 13.0, 6.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.222137451171875, -1.18548583984375, -1.148834228515625, -1.1121826171875, -1.075531005859375, -1.03887939453125, -1.002227783203125, -0.965576171875, -0.928924560546875, -0.89227294921875, -0.855621337890625, -0.8189697265625, -0.782318115234375, -0.74566650390625, -0.709014892578125, -0.67236328125, -0.635711669921875, -0.59906005859375, -0.562408447265625, -0.5257568359375, -0.489105224609375, -0.45245361328125, -0.415802001953125, -0.379150390625, -0.342498779296875, -0.30584716796875, -0.269195556640625, -0.2325439453125, -0.195892333984375, -0.15924072265625, -0.122589111328125, -0.0859375, -0.049285888671875, -0.01263427734375, 0.024017333984375, 0.0606689453125, 0.097320556640625, 0.13397216796875, 0.170623779296875, 0.207275390625, 0.243927001953125, 0.28057861328125, 0.317230224609375, 0.3538818359375, 0.390533447265625, 0.42718505859375, 0.463836669921875, 0.50048828125, 0.537139892578125, 0.57379150390625, 0.610443115234375, 0.6470947265625, 0.683746337890625, 0.72039794921875, 0.757049560546875, 0.793701171875, 0.830352783203125, 0.86700439453125, 0.903656005859375, 0.9403076171875, 0.976959228515625, 1.01361083984375, 1.050262451171875, 1.0869140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 55.0, 77.0, 57.0, 112.0, 134.0, 196.0, 289.0, 410.0, 652.0, 1003.0, 1492.0, 2554.0, 4423.0, 8168.0, 17700.0, 46551.0, 162096.0, 466474.0, 228420.0, 62504.0, 22321.0, 9739.0, 5028.0, 2895.0, 1729.0, 1072.0, 717.0, 507.0, 328.0, 220.0, 161.0, 104.0, 81.0, 50.0, 57.0, 26.0, 21.0, 14.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4549674987792969, -0.43849945068359375, -0.4220314025878906, -0.4055633544921875, -0.3890953063964844, -0.37262725830078125, -0.3561592102050781, -0.339691162109375, -0.3232231140136719, -0.30675506591796875, -0.2902870178222656, -0.2738189697265625, -0.2573509216308594, -0.24088287353515625, -0.22441482543945312, -0.20794677734375, -0.19147872924804688, -0.17501068115234375, -0.15854263305664062, -0.1420745849609375, -0.12560653686523438, -0.10913848876953125, -0.09267044067382812, -0.076202392578125, -0.059734344482421875, -0.04326629638671875, -0.026798248291015625, -0.0103302001953125, 0.006137847900390625, 0.02260589599609375, 0.039073944091796875, 0.0555419921875, 0.07201004028320312, 0.08847808837890625, 0.10494613647460938, 0.1214141845703125, 0.13788223266601562, 0.15435028076171875, 0.17081832885742188, 0.187286376953125, 0.20375442504882812, 0.22022247314453125, 0.23669052124023438, 0.2531585693359375, 0.2696266174316406, 0.28609466552734375, 0.3025627136230469, 0.31903076171875, 0.3354988098144531, 0.35196685791015625, 0.3684349060058594, 0.3849029541015625, 0.4013710021972656, 0.41783905029296875, 0.4343070983886719, 0.450775146484375, 0.4672431945800781, 0.48371124267578125, 0.5001792907714844, 0.5166473388671875, 0.5331153869628906, 0.5495834350585938, 0.5660514831542969, 0.58251953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 5.0, 4.0, 15.0, 14.0, 21.0, 18.0, 19.0, 26.0, 36.0, 25.0, 35.0, 36.0, 49.0, 42.0, 56.0, 46.0, 60.0, 43.0, 51.0, 63.0, 40.0, 41.0, 31.0, 40.0, 30.0, 23.0, 20.0, 21.0, 16.0, 10.0, 8.0, 9.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.1083280444145203e-05, -2.0410865545272827e-05, -1.973845064640045e-05, -1.9066035747528076e-05, -1.83936208486557e-05, -1.7721205949783325e-05, -1.704879105091095e-05, -1.6376376152038574e-05, -1.57039612531662e-05, -1.5031546354293823e-05, -1.4359131455421448e-05, -1.3686716556549072e-05, -1.3014301657676697e-05, -1.2341886758804321e-05, -1.1669471859931946e-05, -1.099705696105957e-05, -1.0324642062187195e-05, -9.65222716331482e-06, -8.979812264442444e-06, -8.307397365570068e-06, -7.634982466697693e-06, -6.962567567825317e-06, -6.290152668952942e-06, -5.617737770080566e-06, -4.945322871208191e-06, -4.2729079723358154e-06, -3.60049307346344e-06, -2.9280781745910645e-06, -2.255663275718689e-06, -1.5832483768463135e-06, -9.10833477973938e-07, -2.384185791015625e-07, 4.33996319770813e-07, 1.1064112186431885e-06, 1.778826117515564e-06, 2.4512410163879395e-06, 3.123655915260315e-06, 3.7960708141326904e-06, 4.468485713005066e-06, 5.140900611877441e-06, 5.813315510749817e-06, 6.485730409622192e-06, 7.158145308494568e-06, 7.830560207366943e-06, 8.502975106239319e-06, 9.175390005111694e-06, 9.84780490398407e-06, 1.0520219802856445e-05, 1.119263470172882e-05, 1.1865049600601196e-05, 1.2537464499473572e-05, 1.3209879398345947e-05, 1.3882294297218323e-05, 1.4554709196090698e-05, 1.5227124094963074e-05, 1.589953899383545e-05, 1.6571953892707825e-05, 1.72443687915802e-05, 1.7916783690452576e-05, 1.858919858932495e-05, 1.9261613488197327e-05, 1.9934028387069702e-05, 2.0606443285942078e-05, 2.1278858184814453e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 15.0, 10.0, 24.0, 39.0, 77.0, 104.0, 185.0, 273.0, 466.0, 835.0, 1397.0, 2392.0, 4420.0, 8511.0, 17373.0, 36830.0, 82607.0, 186052.0, 306803.0, 216254.0, 98906.0, 43293.0, 20199.0, 9900.0, 5053.0, 2725.0, 1492.0, 913.0, 550.0, 305.0, 206.0, 118.0, 59.0, 57.0, 36.0, 26.0, 13.0, 9.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4791755676269531, -0.46298980712890625, -0.4468040466308594, -0.4306182861328125, -0.4144325256347656, -0.39824676513671875, -0.3820610046386719, -0.365875244140625, -0.3496894836425781, -0.33350372314453125, -0.3173179626464844, -0.3011322021484375, -0.2849464416503906, -0.26876068115234375, -0.2525749206542969, -0.23638916015625, -0.22020339965820312, -0.20401763916015625, -0.18783187866210938, -0.1716461181640625, -0.15546035766601562, -0.13927459716796875, -0.12308883666992188, -0.106903076171875, -0.09071731567382812, -0.07453155517578125, -0.058345794677734375, -0.0421600341796875, -0.025974273681640625, -0.00978851318359375, 0.006397247314453125, 0.0225830078125, 0.038768768310546875, 0.05495452880859375, 0.07114028930664062, 0.0873260498046875, 0.10351181030273438, 0.11969757080078125, 0.13588333129882812, 0.152069091796875, 0.16825485229492188, 0.18444061279296875, 0.20062637329101562, 0.2168121337890625, 0.23299789428710938, 0.24918365478515625, 0.2653694152832031, 0.28155517578125, 0.2977409362792969, 0.31392669677734375, 0.3301124572753906, 0.3462982177734375, 0.3624839782714844, 0.37866973876953125, 0.3948554992675781, 0.411041259765625, 0.4272270202636719, 0.44341278076171875, 0.4595985412597656, 0.4757843017578125, 0.4919700622558594, 0.5081558227539062, 0.5243415832519531, 0.54052734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 14.0, 8.0, 7.0, 16.0, 9.0, 20.0, 18.0, 16.0, 24.0, 20.0, 24.0, 35.0, 42.0, 40.0, 65.0, 59.0, 51.0, 59.0, 55.0, 56.0, 54.0, 42.0, 38.0, 25.0, 29.0, 28.0, 19.0, 19.0, 18.0, 13.0, 10.0, 4.0, 9.0, 6.0, 12.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.097412109375, -0.09454917907714844, -0.09168624877929688, -0.08882331848144531, -0.08596038818359375, -0.08309745788574219, -0.08023452758789062, -0.07737159729003906, -0.0745086669921875, -0.07164573669433594, -0.06878280639648438, -0.06591987609863281, -0.06305694580078125, -0.06019401550292969, -0.057331085205078125, -0.05446815490722656, -0.051605224609375, -0.04874229431152344, -0.045879364013671875, -0.04301643371582031, -0.04015350341796875, -0.03729057312011719, -0.034427642822265625, -0.03156471252441406, -0.0287017822265625, -0.025838851928710938, -0.022975921630859375, -0.020112991333007812, -0.01725006103515625, -0.014387130737304688, -0.011524200439453125, -0.008661270141601562, -0.00579833984375, -0.0029354095458984375, -7.2479248046875e-05, 0.0027904510498046875, 0.00565338134765625, 0.008516311645507812, 0.011379241943359375, 0.014242172241210938, 0.0171051025390625, 0.019968032836914062, 0.022830963134765625, 0.025693893432617188, 0.02855682373046875, 0.03141975402832031, 0.034282684326171875, 0.03714561462402344, 0.040008544921875, 0.04287147521972656, 0.045734405517578125, 0.04859733581542969, 0.05146026611328125, 0.05432319641113281, 0.057186126708984375, 0.06004905700683594, 0.0629119873046875, 0.06577491760253906, 0.06863784790039062, 0.07150077819824219, 0.07436370849609375, 0.07722663879394531, 0.08008956909179688, 0.08295249938964844, 0.0858154296875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 9.0, 15.0, 21.0, 19.0, 28.0, 26.0, 36.0, 36.0, 31.0, 53.0, 37.0, 65.0, 50.0, 61.0, 55.0, 50.0, 43.0, 54.0, 44.0, 37.0, 43.0, 31.0, 19.0, 21.0, 19.0, 18.0, 11.0, 10.0, 9.0, 6.0, 3.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1656153202056885, -2.103355646133423, -2.041095733642578, -1.978835940361023, -1.9165761470794678, -1.8543163537979126, -1.7920565605163574, -1.7297967672348022, -1.667536973953247, -1.605277180671692, -1.5430173873901367, -1.4807575941085815, -1.4184978008270264, -1.3562380075454712, -1.293978214263916, -1.2317184209823608, -1.1694586277008057, -1.1071988344192505, -1.0449390411376953, -0.9826792478561401, -0.920419454574585, -0.8581596612930298, -0.7958998680114746, -0.7336400747299194, -0.6713804006576538, -0.6091206073760986, -0.5468608140945435, -0.4846010208129883, -0.4223412275314331, -0.3600814640522003, -0.29782167077064514, -0.23556187748908997, -0.1733020544052124, -0.11104226112365723, -0.04878247529268265, 0.013477310538291931, 0.0757371038198471, 0.1379968822002411, 0.20025667548179626, 0.26251646876335144, 0.3247762620449066, 0.3870360553264618, 0.44929584860801697, 0.5115556120872498, 0.5738154053688049, 0.6360751986503601, 0.6983349919319153, 0.7605947852134705, 0.8228545784950256, 0.8851143717765808, 0.947374165058136, 1.0096338987350464, 1.0718936920166016, 1.1341534852981567, 1.196413278579712, 1.258673071861267, 1.3209328651428223, 1.3831926584243774, 1.4454524517059326, 1.5077122449874878, 1.569972038269043, 1.6322318315505981, 1.6944916248321533, 1.7567514181137085, 1.8190112113952637]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 6.0, 5.0, 5.0, 11.0, 12.0, 9.0, 25.0, 27.0, 24.0, 21.0, 21.0, 30.0, 29.0, 28.0, 24.0, 29.0, 42.0, 43.0, 35.0, 32.0, 39.0, 48.0, 37.0, 34.0, 35.0, 42.0, 29.0, 27.0, 23.0, 20.0, 24.0, 22.0, 21.0, 16.0, 15.0, 15.0, 19.0, 13.0, 9.0, 8.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3607033491134644, -1.3150500059127808, -1.2693967819213867, -1.2237434387207031, -1.1780900955200195, -1.132436752319336, -1.0867834091186523, -1.0411301851272583, -0.9954768419265747, -0.9498234987258911, -0.9041702151298523, -0.8585169315338135, -0.8128635883331299, -0.7672102451324463, -0.7215569615364075, -0.6759036779403687, -0.6302503347396851, -0.5845969915390015, -0.5389437079429626, -0.49329039454460144, -0.44763708114624023, -0.40198376774787903, -0.3563304543495178, -0.3106771409511566, -0.2650238275527954, -0.2193705141544342, -0.173717200756073, -0.1280638873577118, -0.08241057395935059, -0.03675726056098938, 0.008896052837371826, 0.05454936623573303, 0.10020256042480469, 0.1458558738231659, 0.1915091872215271, 0.2371625006198883, 0.2828158140182495, 0.3284691274166107, 0.3741224408149719, 0.41977575421333313, 0.46542906761169434, 0.5110824108123779, 0.5567356944084167, 0.6023889780044556, 0.6480423212051392, 0.6936956644058228, 0.7393489480018616, 0.7850022315979004, 0.830655574798584, 0.8763089179992676, 0.9219622015953064, 0.9676154851913452, 1.0132688283920288, 1.0589221715927124, 1.1045753955841064, 1.15022873878479, 1.1958820819854736, 1.2415354251861572, 1.2871887683868408, 1.3328419923782349, 1.3784953355789185, 1.424148678779602, 1.469801902770996, 1.5154552459716797, 1.5611085891723633]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 12.0, 18.0, 23.0, 50.0, 54.0, 87.0, 139.0, 231.0, 361.0, 564.0, 839.0, 1272.0, 1955.0, 3119.0, 4894.0, 7515.0, 11383.0, 17296.0, 25425.0, 36209.0, 50124.0, 67055.0, 84012.0, 99669.0, 108911.0, 109134.0, 100086.0, 85735.0, 67929.0, 50990.0, 36845.0, 25873.0, 17287.0, 11838.0, 7746.0, 4876.0, 3256.0, 2045.0, 1343.0, 849.0, 535.0, 343.0, 226.0, 152.0, 95.0, 41.0, 33.0, 28.0, 28.0, 7.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2749176025390625, -1.232452392578125, -1.1899871826171875, -1.14752197265625, -1.1050567626953125, -1.062591552734375, -1.0201263427734375, -0.9776611328125, -0.9351959228515625, -0.892730712890625, -0.8502655029296875, -0.80780029296875, -0.7653350830078125, -0.722869873046875, -0.6804046630859375, -0.637939453125, -0.5954742431640625, -0.553009033203125, -0.5105438232421875, -0.46807861328125, -0.4256134033203125, -0.383148193359375, -0.3406829833984375, -0.2982177734375, -0.2557525634765625, -0.213287353515625, -0.1708221435546875, -0.12835693359375, -0.0858917236328125, -0.043426513671875, -0.0009613037109375, 0.04150390625, 0.0839691162109375, 0.126434326171875, 0.1688995361328125, 0.21136474609375, 0.2538299560546875, 0.296295166015625, 0.3387603759765625, 0.3812255859375, 0.4236907958984375, 0.466156005859375, 0.5086212158203125, 0.55108642578125, 0.5935516357421875, 0.636016845703125, 0.6784820556640625, 0.720947265625, 0.7634124755859375, 0.805877685546875, 0.8483428955078125, 0.89080810546875, 0.9332733154296875, 0.975738525390625, 1.0182037353515625, 1.0606689453125, 1.1031341552734375, 1.145599365234375, 1.1880645751953125, 1.23052978515625, 1.2729949951171875, 1.315460205078125, 1.3579254150390625, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 11.0, 13.0, 15.0, 22.0, 18.0, 20.0, 27.0, 29.0, 26.0, 18.0, 34.0, 25.0, 33.0, 40.0, 38.0, 40.0, 33.0, 48.0, 40.0, 40.0, 46.0, 31.0, 20.0, 27.0, 27.0, 23.0, 31.0, 17.0, 20.0, 24.0, 13.0, 17.0, 19.0, 16.0, 10.0, 8.0, 8.0, 4.0, 6.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.5146484375, -1.4691009521484375, -1.423553466796875, -1.3780059814453125, -1.33245849609375, -1.2869110107421875, -1.241363525390625, -1.1958160400390625, -1.1502685546875, -1.1047210693359375, -1.059173583984375, -1.0136260986328125, -0.96807861328125, -0.9225311279296875, -0.876983642578125, -0.8314361572265625, -0.785888671875, -0.7403411865234375, -0.694793701171875, -0.6492462158203125, -0.60369873046875, -0.5581512451171875, -0.512603759765625, -0.4670562744140625, -0.4215087890625, -0.3759613037109375, -0.330413818359375, -0.2848663330078125, -0.23931884765625, -0.1937713623046875, -0.148223876953125, -0.1026763916015625, -0.05712890625, -0.0115814208984375, 0.033966064453125, 0.0795135498046875, 0.12506103515625, 0.1706085205078125, 0.216156005859375, 0.2617034912109375, 0.3072509765625, 0.3527984619140625, 0.398345947265625, 0.4438934326171875, 0.48944091796875, 0.5349884033203125, 0.580535888671875, 0.6260833740234375, 0.671630859375, 0.7171783447265625, 0.762725830078125, 0.8082733154296875, 0.85382080078125, 0.8993682861328125, 0.944915771484375, 0.9904632568359375, 1.0360107421875, 1.0815582275390625, 1.127105712890625, 1.1726531982421875, 1.21820068359375, 1.2637481689453125, 1.309295654296875, 1.3548431396484375, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 26.0, 34.0, 64.0, 90.0, 154.0, 214.0, 373.0, 565.0, 886.0, 1422.0, 2326.0, 3504.0, 5587.0, 8588.0, 13287.0, 20391.0, 30099.0, 43180.0, 59122.0, 77582.0, 95084.0, 108012.0, 112504.0, 106995.0, 94487.0, 77092.0, 58695.0, 42529.0, 29508.0, 19641.0, 12991.0, 8564.0, 5412.0, 3494.0, 2273.0, 1331.0, 874.0, 569.0, 356.0, 229.0, 158.0, 90.0, 52.0, 33.0, 24.0, 12.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.40625, -1.3642425537109375, -1.322235107421875, -1.2802276611328125, -1.23822021484375, -1.1962127685546875, -1.154205322265625, -1.1121978759765625, -1.0701904296875, -1.0281829833984375, -0.986175537109375, -0.9441680908203125, -0.90216064453125, -0.8601531982421875, -0.818145751953125, -0.7761383056640625, -0.734130859375, -0.6921234130859375, -0.650115966796875, -0.6081085205078125, -0.56610107421875, -0.5240936279296875, -0.482086181640625, -0.4400787353515625, -0.3980712890625, -0.3560638427734375, -0.314056396484375, -0.2720489501953125, -0.23004150390625, -0.1880340576171875, -0.146026611328125, -0.1040191650390625, -0.06201171875, -0.0200042724609375, 0.022003173828125, 0.0640106201171875, 0.10601806640625, 0.1480255126953125, 0.190032958984375, 0.2320404052734375, 0.2740478515625, 0.3160552978515625, 0.358062744140625, 0.4000701904296875, 0.44207763671875, 0.4840850830078125, 0.526092529296875, 0.5680999755859375, 0.610107421875, 0.6521148681640625, 0.694122314453125, 0.7361297607421875, 0.77813720703125, 0.8201446533203125, 0.862152099609375, 0.9041595458984375, 0.9461669921875, 0.9881744384765625, 1.030181884765625, 1.0721893310546875, 1.11419677734375, 1.1562042236328125, 1.198211669921875, 1.2402191162109375, 1.2822265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 2.0, 8.0, 12.0, 5.0, 14.0, 10.0, 12.0, 19.0, 18.0, 16.0, 23.0, 27.0, 13.0, 33.0, 24.0, 30.0, 31.0, 31.0, 31.0, 35.0, 31.0, 33.0, 35.0, 42.0, 42.0, 42.0, 39.0, 21.0, 42.0, 25.0, 30.0, 31.0, 22.0, 23.0, 18.0, 21.0, 17.0, 17.0, 11.0, 9.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9072265625, -0.8786849975585938, -0.8501434326171875, -0.8216018676757812, -0.793060302734375, -0.7645187377929688, -0.7359771728515625, -0.7074356079101562, -0.67889404296875, -0.6503524780273438, -0.6218109130859375, -0.5932693481445312, -0.564727783203125, -0.5361862182617188, -0.5076446533203125, -0.47910308837890625, -0.4505615234375, -0.42201995849609375, -0.3934783935546875, -0.36493682861328125, -0.336395263671875, -0.30785369873046875, -0.2793121337890625, -0.25077056884765625, -0.22222900390625, -0.19368743896484375, -0.1651458740234375, -0.13660430908203125, -0.108062744140625, -0.07952117919921875, -0.0509796142578125, -0.02243804931640625, 0.006103515625, 0.03464508056640625, 0.0631866455078125, 0.09172821044921875, 0.120269775390625, 0.14881134033203125, 0.1773529052734375, 0.20589447021484375, 0.23443603515625, 0.26297760009765625, 0.2915191650390625, 0.32006072998046875, 0.348602294921875, 0.37714385986328125, 0.4056854248046875, 0.43422698974609375, 0.4627685546875, 0.49131011962890625, 0.5198516845703125, 0.5483932495117188, 0.576934814453125, 0.6054763793945312, 0.6340179443359375, 0.6625595092773438, 0.69110107421875, 0.7196426391601562, 0.7481842041015625, 0.7767257690429688, 0.805267333984375, 0.8338088989257812, 0.8623504638671875, 0.8908920288085938, 0.91943359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 8.0, 16.0, 14.0, 24.0, 38.0, 48.0, 80.0, 126.0, 185.0, 286.0, 466.0, 680.0, 1139.0, 1975.0, 3384.0, 5995.0, 11202.0, 21092.0, 39146.0, 73194.0, 124782.0, 182377.0, 200390.0, 159393.0, 100831.0, 55619.0, 30179.0, 15855.0, 8473.0, 4718.0, 2667.0, 1543.0, 925.0, 556.0, 346.0, 246.0, 158.0, 118.0, 61.0, 60.0, 40.0, 27.0, 26.0, 16.0, 6.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.2763671875, -1.2368316650390625, -1.197296142578125, -1.1577606201171875, -1.11822509765625, -1.0786895751953125, -1.039154052734375, -0.9996185302734375, -0.9600830078125, -0.9205474853515625, -0.881011962890625, -0.8414764404296875, -0.80194091796875, -0.7624053955078125, -0.722869873046875, -0.6833343505859375, -0.643798828125, -0.6042633056640625, -0.564727783203125, -0.5251922607421875, -0.48565673828125, -0.4461212158203125, -0.406585693359375, -0.3670501708984375, -0.3275146484375, -0.2879791259765625, -0.248443603515625, -0.2089080810546875, -0.16937255859375, -0.1298370361328125, -0.090301513671875, -0.0507659912109375, -0.01123046875, 0.0283050537109375, 0.067840576171875, 0.1073760986328125, 0.14691162109375, 0.1864471435546875, 0.225982666015625, 0.2655181884765625, 0.3050537109375, 0.3445892333984375, 0.384124755859375, 0.4236602783203125, 0.46319580078125, 0.5027313232421875, 0.542266845703125, 0.5818023681640625, 0.621337890625, 0.6608734130859375, 0.700408935546875, 0.7399444580078125, 0.77947998046875, 0.8190155029296875, 0.858551025390625, 0.8980865478515625, 0.9376220703125, 0.9771575927734375, 1.016693115234375, 1.0562286376953125, 1.09576416015625, 1.1352996826171875, 1.174835205078125, 1.2143707275390625, 1.25390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 3.0, 9.0, 12.0, 12.0, 12.0, 23.0, 34.0, 32.0, 38.0, 44.0, 49.0, 57.0, 48.0, 64.0, 60.0, 44.0, 61.0, 60.0, 52.0, 37.0, 46.0, 33.0, 40.0, 19.0, 19.0, 22.0, 13.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010466575622558594, -0.00010150019079446793, -9.833462536334991e-05, -9.51690599322319e-05, -9.200349450111389e-05, -8.883792906999588e-05, -8.567236363887787e-05, -8.250679820775986e-05, -7.934123277664185e-05, -7.617566734552383e-05, -7.301010191440582e-05, -6.984453648328781e-05, -6.66789710521698e-05, -6.351340562105179e-05, -6.034784018993378e-05, -5.7182274758815765e-05, -5.4016709327697754e-05, -5.085114389657974e-05, -4.768557846546173e-05, -4.452001303434372e-05, -4.135444760322571e-05, -3.8188882172107697e-05, -3.5023316740989685e-05, -3.1857751309871674e-05, -2.8692185878753662e-05, -2.552662044763565e-05, -2.236105501651764e-05, -1.9195489585399628e-05, -1.6029924154281616e-05, -1.2864358723163605e-05, -9.698793292045593e-06, -6.533227860927582e-06, -3.3676624298095703e-06, -2.0209699869155884e-07, 2.9634684324264526e-06, 6.129033863544464e-06, 9.294599294662476e-06, 1.2460164725780487e-05, 1.56257301568985e-05, 1.879129558801651e-05, 2.195686101913452e-05, 2.5122426450252533e-05, 2.8287991881370544e-05, 3.1453557312488556e-05, 3.461912274360657e-05, 3.778468817472458e-05, 4.095025360584259e-05, 4.41158190369606e-05, 4.728138446807861e-05, 5.0446949899196625e-05, 5.3612515330314636e-05, 5.677808076143265e-05, 5.994364619255066e-05, 6.310921162366867e-05, 6.627477705478668e-05, 6.94403424859047e-05, 7.26059079170227e-05, 7.577147334814072e-05, 7.893703877925873e-05, 8.210260421037674e-05, 8.526816964149475e-05, 8.843373507261276e-05, 9.159930050373077e-05, 9.476486593484879e-05, 9.79304313659668e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 11.0, 17.0, 17.0, 40.0, 38.0, 42.0, 63.0, 79.0, 145.0, 222.0, 301.0, 461.0, 755.0, 1174.0, 1822.0, 2861.0, 4667.0, 7651.0, 12413.0, 19913.0, 32585.0, 51298.0, 79006.0, 112705.0, 143082.0, 152351.0, 134546.0, 102270.0, 69718.0, 44877.0, 28237.0, 17182.0, 10528.0, 6524.0, 4006.0, 2549.0, 1504.0, 1038.0, 628.0, 403.0, 251.0, 179.0, 107.0, 81.0, 58.0, 49.0, 29.0, 23.0, 13.0, 14.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0], "bins": [-0.9375, -0.9085159301757812, -0.8795318603515625, -0.8505477905273438, -0.821563720703125, -0.7925796508789062, -0.7635955810546875, -0.7346115112304688, -0.70562744140625, -0.6766433715820312, -0.6476593017578125, -0.6186752319335938, -0.589691162109375, -0.5607070922851562, -0.5317230224609375, -0.5027389526367188, -0.4737548828125, -0.44477081298828125, -0.4157867431640625, -0.38680267333984375, -0.357818603515625, -0.32883453369140625, -0.2998504638671875, -0.27086639404296875, -0.24188232421875, -0.21289825439453125, -0.1839141845703125, -0.15493011474609375, -0.125946044921875, -0.09696197509765625, -0.0679779052734375, -0.03899383544921875, -0.010009765625, 0.01897430419921875, 0.0479583740234375, 0.07694244384765625, 0.105926513671875, 0.13491058349609375, 0.1638946533203125, 0.19287872314453125, 0.22186279296875, 0.25084686279296875, 0.2798309326171875, 0.30881500244140625, 0.337799072265625, 0.36678314208984375, 0.3957672119140625, 0.42475128173828125, 0.4537353515625, 0.48271942138671875, 0.5117034912109375, 0.5406875610351562, 0.569671630859375, 0.5986557006835938, 0.6276397705078125, 0.6566238403320312, 0.68560791015625, 0.7145919799804688, 0.7435760498046875, 0.7725601196289062, 0.801544189453125, 0.8305282592773438, 0.8595123291015625, 0.8884963989257812, 0.91748046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 7.0, 4.0, 10.0, 12.0, 20.0, 16.0, 22.0, 31.0, 28.0, 31.0, 32.0, 39.0, 44.0, 50.0, 60.0, 58.0, 63.0, 50.0, 54.0, 55.0, 57.0, 43.0, 35.0, 31.0, 30.0, 30.0, 21.0, 17.0, 11.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47867584228515625, -0.4656524658203125, -0.45262908935546875, -0.439605712890625, -0.42658233642578125, -0.4135589599609375, -0.40053558349609375, -0.38751220703125, -0.37448883056640625, -0.3614654541015625, -0.34844207763671875, -0.335418701171875, -0.32239532470703125, -0.3093719482421875, -0.29634857177734375, -0.2833251953125, -0.27030181884765625, -0.2572784423828125, -0.24425506591796875, -0.231231689453125, -0.21820831298828125, -0.2051849365234375, -0.19216156005859375, -0.17913818359375, -0.16611480712890625, -0.1530914306640625, -0.14006805419921875, -0.127044677734375, -0.11402130126953125, -0.1009979248046875, -0.08797454833984375, -0.074951171875, -0.06192779541015625, -0.0489044189453125, -0.03588104248046875, -0.022857666015625, -0.00983428955078125, 0.0031890869140625, 0.01621246337890625, 0.02923583984375, 0.04225921630859375, 0.0552825927734375, 0.06830596923828125, 0.081329345703125, 0.09435272216796875, 0.1073760986328125, 0.12039947509765625, 0.1334228515625, 0.14644622802734375, 0.1594696044921875, 0.17249298095703125, 0.185516357421875, 0.19853973388671875, 0.2115631103515625, 0.22458648681640625, 0.23760986328125, 0.25063323974609375, 0.2636566162109375, 0.27667999267578125, 0.289703369140625, 0.30272674560546875, 0.3157501220703125, 0.32877349853515625, 0.341796875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 13.0, 12.0, 15.0, 9.0, 26.0, 20.0, 29.0, 34.0, 40.0, 39.0, 37.0, 52.0, 46.0, 45.0, 56.0, 49.0, 57.0, 49.0, 38.0, 55.0, 48.0, 31.0, 31.0, 25.0, 20.0, 15.0, 24.0, 11.0, 12.0, 12.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8894098997116089, -1.829939365386963, -1.770468831062317, -1.710998296737671, -1.651527762413025, -1.592057228088379, -1.5325868129730225, -1.4731162786483765, -1.4136457443237305, -1.3541752099990845, -1.2947046756744385, -1.2352341413497925, -1.1757636070251465, -1.11629319190979, -1.0568225383758545, -0.997352123260498, -0.9378815293312073, -0.8784109950065613, -0.8189404606819153, -0.7594699859619141, -0.6999994516372681, -0.6405289173126221, -0.5810583829879761, -0.5215878486633301, -0.46211734414100647, -0.4026468098163605, -0.34317630529403687, -0.28370577096939087, -0.22423525154590607, -0.16476473212242126, -0.10529419779777527, -0.04582369327545166, 0.013646841049194336, 0.07311736047267914, 0.13258787989616394, 0.19205841422080994, 0.25152891874313354, 0.31099945306777954, 0.37046998739242554, 0.42994049191474915, 0.48941102623939514, 0.5488815307617188, 0.6083520650863647, 0.6678225994110107, 0.7272931337356567, 0.7867636680603027, 0.8462342023849487, 0.90570467710495, 0.965175211429596, 1.0246456861495972, 1.0841162204742432, 1.1435867547988892, 1.2030572891235352, 1.2625278234481812, 1.3219983577728271, 1.3814688920974731, 1.4409394264221191, 1.5004099607467651, 1.5598804950714111, 1.6193510293960571, 1.6788215637207031, 1.7382919788360596, 1.7977626323699951, 1.8572330474853516, 1.9167035818099976]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 1.0, 8.0, 9.0, 7.0, 12.0, 11.0, 9.0, 12.0, 13.0, 14.0, 35.0, 24.0, 17.0, 29.0, 31.0, 42.0, 30.0, 34.0, 35.0, 27.0, 41.0, 45.0, 41.0, 31.0, 41.0, 38.0, 39.0, 44.0, 29.0, 37.0, 26.0, 17.0, 21.0, 24.0, 21.0, 12.0, 10.0, 13.0, 17.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.371199607849121, -1.3224812746047974, -1.2737629413604736, -1.22504460811615, -1.1763262748718262, -1.1276079416275024, -1.0788896083831787, -1.0301713943481445, -0.981453001499176, -0.9327346682548523, -0.8840163350105286, -0.8352980613708496, -0.7865797281265259, -0.7378613948822021, -0.6891430616378784, -0.6404247283935547, -0.591706395149231, -0.5429880619049072, -0.4942697286605835, -0.44555142521858215, -0.3968330919742584, -0.3481147587299347, -0.29939645528793335, -0.2506781220436096, -0.2019597887992859, -0.15324145555496216, -0.10452313721179962, -0.055804818868637085, -0.0070864856243133545, 0.041631847620010376, 0.09035015106201172, 0.13906848430633545, 0.18778681755065918, 0.2365051507949829, 0.28522348403930664, 0.333941787481308, 0.3826601207256317, 0.43137845396995544, 0.4800967574119568, 0.5288150906562805, 0.5775334239006042, 0.626251757144928, 0.6749700903892517, 0.7236883640289307, 0.7724066972732544, 0.8211250305175781, 0.8698433637619019, 0.9185616970062256, 0.9672800302505493, 1.015998363494873, 1.0647166967391968, 1.1134350299835205, 1.1621533632278442, 1.210871696472168, 1.2595899105072021, 1.3083083629608154, 1.3570265769958496, 1.4057449102401733, 1.454463243484497, 1.5031815767288208, 1.5518999099731445, 1.6006182432174683, 1.649336576461792, 1.6980547904968262, 1.7467732429504395]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 12.0, 27.0, 39.0, 49.0, 79.0, 135.0, 225.0, 378.0, 655.0, 1170.0, 1907.0, 3451.0, 5958.0, 10651.0, 19230.0, 33416.0, 58904.0, 103499.0, 176924.0, 289343.0, 440194.0, 593615.0, 663971.0, 602063.0, 453475.0, 300291.0, 184695.0, 107892.0, 61816.0, 35026.0, 19654.0, 11040.0, 6208.0, 3646.0, 2000.0, 1098.0, 603.0, 379.0, 236.0, 125.0, 81.0, 51.0, 27.0, 23.0, 7.0, 10.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.609375, -1.559906005859375, -1.51043701171875, -1.460968017578125, -1.4114990234375, -1.362030029296875, -1.31256103515625, -1.263092041015625, -1.213623046875, -1.164154052734375, -1.11468505859375, -1.065216064453125, -1.0157470703125, -0.966278076171875, -0.91680908203125, -0.867340087890625, -0.81787109375, -0.768402099609375, -0.71893310546875, -0.669464111328125, -0.6199951171875, -0.570526123046875, -0.52105712890625, -0.471588134765625, -0.422119140625, -0.372650146484375, -0.32318115234375, -0.273712158203125, -0.2242431640625, -0.174774169921875, -0.12530517578125, -0.075836181640625, -0.0263671875, 0.023101806640625, 0.07257080078125, 0.122039794921875, 0.1715087890625, 0.220977783203125, 0.27044677734375, 0.319915771484375, 0.369384765625, 0.418853759765625, 0.46832275390625, 0.517791748046875, 0.5672607421875, 0.616729736328125, 0.66619873046875, 0.715667724609375, 0.76513671875, 0.814605712890625, 0.86407470703125, 0.913543701171875, 0.9630126953125, 1.012481689453125, 1.06195068359375, 1.111419677734375, 1.160888671875, 1.210357666015625, 1.25982666015625, 1.309295654296875, 1.3587646484375, 1.408233642578125, 1.45770263671875, 1.507171630859375, 1.556640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 6.0, 7.0, 13.0, 9.0, 13.0, 14.0, 26.0, 23.0, 30.0, 20.0, 35.0, 25.0, 39.0, 36.0, 27.0, 37.0, 35.0, 33.0, 41.0, 34.0, 40.0, 28.0, 40.0, 36.0, 31.0, 33.0, 32.0, 26.0, 22.0, 22.0, 20.0, 11.0, 14.0, 17.0, 21.0, 15.0, 11.0, 7.0, 12.0, 5.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9029006958007812, -0.8707427978515625, -0.8385848999023438, -0.806427001953125, -0.7742691040039062, -0.7421112060546875, -0.7099533081054688, -0.67779541015625, -0.6456375122070312, -0.6134796142578125, -0.5813217163085938, -0.549163818359375, -0.5170059204101562, -0.4848480224609375, -0.45269012451171875, -0.4205322265625, -0.38837432861328125, -0.3562164306640625, -0.32405853271484375, -0.291900634765625, -0.25974273681640625, -0.2275848388671875, -0.19542694091796875, -0.16326904296875, -0.13111114501953125, -0.0989532470703125, -0.06679534912109375, -0.034637451171875, -0.00247955322265625, 0.0296783447265625, 0.06183624267578125, 0.093994140625, 0.12615203857421875, 0.1583099365234375, 0.19046783447265625, 0.222625732421875, 0.25478363037109375, 0.2869415283203125, 0.31909942626953125, 0.35125732421875, 0.38341522216796875, 0.4155731201171875, 0.44773101806640625, 0.479888916015625, 0.5120468139648438, 0.5442047119140625, 0.5763626098632812, 0.6085205078125, 0.6406784057617188, 0.6728363037109375, 0.7049942016601562, 0.737152099609375, 0.7693099975585938, 0.8014678955078125, 0.8336257934570312, 0.86578369140625, 0.8979415893554688, 0.9300994873046875, 0.9622573852539062, 0.994415283203125, 1.0265731811523438, 1.0587310791015625, 1.0908889770507812, 1.123046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 10.0, 16.0, 18.0, 36.0, 67.0, 119.0, 149.0, 267.0, 470.0, 755.0, 1308.0, 2118.0, 3435.0, 5913.0, 9869.0, 16485.0, 27229.0, 44764.0, 72471.0, 113592.0, 175828.0, 255213.0, 352056.0, 443335.0, 506013.0, 513012.0, 463209.0, 375762.0, 278724.0, 193409.0, 128425.0, 81391.0, 50984.0, 30690.0, 18794.0, 11265.0, 6935.0, 4039.0, 2419.0, 1484.0, 884.0, 508.0, 314.0, 189.0, 113.0, 80.0, 58.0, 30.0, 14.0, 12.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.3486328125, -1.30792236328125, -1.2672119140625, -1.22650146484375, -1.185791015625, -1.14508056640625, -1.1043701171875, -1.06365966796875, -1.02294921875, -0.98223876953125, -0.9415283203125, -0.90081787109375, -0.860107421875, -0.81939697265625, -0.7786865234375, -0.73797607421875, -0.697265625, -0.65655517578125, -0.6158447265625, -0.57513427734375, -0.534423828125, -0.49371337890625, -0.4530029296875, -0.41229248046875, -0.37158203125, -0.33087158203125, -0.2901611328125, -0.24945068359375, -0.208740234375, -0.16802978515625, -0.1273193359375, -0.08660888671875, -0.0458984375, -0.00518798828125, 0.0355224609375, 0.07623291015625, 0.116943359375, 0.15765380859375, 0.1983642578125, 0.23907470703125, 0.27978515625, 0.32049560546875, 0.3612060546875, 0.40191650390625, 0.442626953125, 0.48333740234375, 0.5240478515625, 0.56475830078125, 0.60546875, 0.64617919921875, 0.6868896484375, 0.72760009765625, 0.768310546875, 0.80902099609375, 0.8497314453125, 0.89044189453125, 0.93115234375, 0.97186279296875, 1.0125732421875, 1.05328369140625, 1.093994140625, 1.13470458984375, 1.1754150390625, 1.21612548828125, 1.2568359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 5.0, 8.0, 13.0, 14.0, 28.0, 29.0, 25.0, 44.0, 61.0, 65.0, 83.0, 88.0, 90.0, 108.0, 127.0, 149.0, 176.0, 197.0, 186.0, 208.0, 228.0, 216.0, 199.0, 203.0, 173.0, 185.0, 173.0, 134.0, 138.0, 111.0, 111.0, 101.0, 67.0, 69.0, 46.0, 43.0, 43.0, 33.0, 21.0, 12.0, 13.0, 8.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5343780517578125, -0.516998291015625, -0.4996185302734375, -0.48223876953125, -0.4648590087890625, -0.447479248046875, -0.4300994873046875, -0.4127197265625, -0.3953399658203125, -0.377960205078125, -0.3605804443359375, -0.34320068359375, -0.3258209228515625, -0.308441162109375, -0.2910614013671875, -0.273681640625, -0.2563018798828125, -0.238922119140625, -0.2215423583984375, -0.20416259765625, -0.1867828369140625, -0.169403076171875, -0.1520233154296875, -0.1346435546875, -0.1172637939453125, -0.099884033203125, -0.0825042724609375, -0.06512451171875, -0.0477447509765625, -0.030364990234375, -0.0129852294921875, 0.00439453125, 0.0217742919921875, 0.039154052734375, 0.0565338134765625, 0.07391357421875, 0.0912933349609375, 0.108673095703125, 0.1260528564453125, 0.1434326171875, 0.1608123779296875, 0.178192138671875, 0.1955718994140625, 0.21295166015625, 0.2303314208984375, 0.247711181640625, 0.2650909423828125, 0.282470703125, 0.2998504638671875, 0.317230224609375, 0.3346099853515625, 0.35198974609375, 0.3693695068359375, 0.386749267578125, 0.4041290283203125, 0.4215087890625, 0.4388885498046875, 0.456268310546875, 0.4736480712890625, 0.49102783203125, 0.5084075927734375, 0.525787353515625, 0.5431671142578125, 0.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 8.0, 6.0, 15.0, 15.0, 29.0, 25.0, 38.0, 39.0, 42.0, 46.0, 48.0, 69.0, 72.0, 57.0, 68.0, 53.0, 69.0, 53.0, 46.0, 38.0, 34.0, 21.0, 19.0, 28.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8024777173995972, -1.7369765043258667, -1.6714752912521362, -1.6059740781784058, -1.5404728651046753, -1.4749716520309448, -1.409470558166504, -1.3439693450927734, -1.278468132019043, -1.2129669189453125, -1.147465705871582, -1.0819644927978516, -1.016463279724121, -0.9509620666503906, -0.8854609131813049, -0.8199597001075745, -0.7544584274291992, -0.6889572143554688, -0.6234560012817383, -0.5579547882080078, -0.49245360493659973, -0.42695239186286926, -0.3614512085914612, -0.2959499955177307, -0.23044878244400024, -0.16494756937026978, -0.0994463711977005, -0.033945173025131226, 0.03155604004859924, 0.09705725312232971, 0.1625584363937378, 0.22805964946746826, 0.2935607433319092, 0.35906195640563965, 0.4245631694793701, 0.4900643527507782, 0.555565595626831, 0.6210668087005615, 0.6865679621696472, 0.7520691752433777, 0.8175703883171082, 0.8830716013908386, 0.9485728144645691, 1.0140739679336548, 1.0795751810073853, 1.1450763940811157, 1.2105776071548462, 1.2760788202285767, 1.3415800333023071, 1.4070812463760376, 1.472582459449768, 1.5380836725234985, 1.603584885597229, 1.6690860986709595, 1.7345871925354004, 1.8000884056091309, 1.8655896186828613, 1.9310908317565918, 1.9965920448303223, 2.0620932579040527, 2.127594470977783, 2.1930956840515137, 2.258596897125244, 2.3240981101989746, 2.389599323272705]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 4.0, 3.0, 8.0, 8.0, 17.0, 11.0, 10.0, 22.0, 13.0, 21.0, 24.0, 29.0, 29.0, 30.0, 35.0, 30.0, 35.0, 38.0, 29.0, 33.0, 35.0, 43.0, 43.0, 33.0, 40.0, 41.0, 38.0, 33.0, 34.0, 28.0, 24.0, 26.0, 25.0, 17.0, 11.0, 7.0, 12.0, 19.0, 13.0, 10.0, 10.0, 2.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.269423007965088, -1.2290480136871338, -1.1886730194091797, -1.1482980251312256, -1.1079230308532715, -1.0675479173660278, -1.0271729230880737, -0.9867979288101196, -0.9464229345321655, -0.9060479402542114, -0.8656729459762573, -0.8252978920936584, -0.7849228978157043, -0.7445479035377502, -0.7041728496551514, -0.6637978553771973, -0.6234228610992432, -0.5830478668212891, -0.542672872543335, -0.5022978186607361, -0.461922824382782, -0.4215478301048279, -0.3811728060245514, -0.3407977819442749, -0.3004227876663208, -0.2600477933883667, -0.2196727693080902, -0.17929776012897491, -0.13892275094985962, -0.09854774177074432, -0.05817273259162903, -0.01779770851135254, 0.022577285766601562, 0.06295229494571686, 0.10332730412483215, 0.14370231330394745, 0.18407732248306274, 0.22445233166217804, 0.26482734084129333, 0.3052023649215698, 0.3455773591995239, 0.385952353477478, 0.4263273775577545, 0.466702401638031, 0.5070773959159851, 0.5474523901939392, 0.5878274440765381, 0.6282024383544922, 0.6685774326324463, 0.7089524269104004, 0.7493274211883545, 0.7897024750709534, 0.8300774693489075, 0.8704524636268616, 0.9108275175094604, 0.9512025117874146, 0.9915775060653687, 1.0319525003433228, 1.0723274946212769, 1.112702488899231, 1.1530776023864746, 1.1934525966644287, 1.2338275909423828, 1.274202585220337, 1.314577579498291]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 12.0, 20.0, 43.0, 38.0, 70.0, 96.0, 146.0, 195.0, 279.0, 424.0, 633.0, 875.0, 1368.0, 2180.0, 3483.0, 5805.0, 9731.0, 16791.0, 29913.0, 52774.0, 91020.0, 147701.0, 200017.0, 184602.0, 124050.0, 74536.0, 42984.0, 23994.0, 13773.0, 7985.0, 4761.0, 2828.0, 1706.0, 1259.0, 759.0, 508.0, 339.0, 253.0, 174.0, 131.0, 97.0, 60.0, 36.0, 32.0, 19.0, 14.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.72021484375, -0.69891357421875, -0.6776123046875, -0.65631103515625, -0.635009765625, -0.61370849609375, -0.5924072265625, -0.57110595703125, -0.5498046875, -0.52850341796875, -0.5072021484375, -0.48590087890625, -0.464599609375, -0.44329833984375, -0.4219970703125, -0.40069580078125, -0.37939453125, -0.35809326171875, -0.3367919921875, -0.31549072265625, -0.294189453125, -0.27288818359375, -0.2515869140625, -0.23028564453125, -0.208984375, -0.18768310546875, -0.1663818359375, -0.14508056640625, -0.123779296875, -0.10247802734375, -0.0811767578125, -0.05987548828125, -0.03857421875, -0.01727294921875, 0.0040283203125, 0.02532958984375, 0.046630859375, 0.06793212890625, 0.0892333984375, 0.11053466796875, 0.1318359375, 0.15313720703125, 0.1744384765625, 0.19573974609375, 0.217041015625, 0.23834228515625, 0.2596435546875, 0.28094482421875, 0.30224609375, 0.32354736328125, 0.3448486328125, 0.36614990234375, 0.387451171875, 0.40875244140625, 0.4300537109375, 0.45135498046875, 0.47265625, 0.49395751953125, 0.5152587890625, 0.53656005859375, 0.557861328125, 0.57916259765625, 0.6004638671875, 0.62176513671875, 0.64306640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 9.0, 6.0, 8.0, 13.0, 11.0, 15.0, 17.0, 12.0, 24.0, 24.0, 32.0, 21.0, 30.0, 31.0, 30.0, 37.0, 46.0, 36.0, 34.0, 42.0, 48.0, 31.0, 33.0, 48.0, 36.0, 42.0, 34.0, 32.0, 20.0, 22.0, 25.0, 23.0, 12.0, 24.0, 14.0, 13.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.36297607421875, -1.3177490234375, -1.27252197265625, -1.227294921875, -1.18206787109375, -1.1368408203125, -1.09161376953125, -1.04638671875, -1.00115966796875, -0.9559326171875, -0.91070556640625, -0.865478515625, -0.82025146484375, -0.7750244140625, -0.72979736328125, -0.6845703125, -0.63934326171875, -0.5941162109375, -0.54888916015625, -0.503662109375, -0.45843505859375, -0.4132080078125, -0.36798095703125, -0.32275390625, -0.27752685546875, -0.2322998046875, -0.18707275390625, -0.141845703125, -0.09661865234375, -0.0513916015625, -0.00616455078125, 0.0390625, 0.08428955078125, 0.1295166015625, 0.17474365234375, 0.219970703125, 0.26519775390625, 0.3104248046875, 0.35565185546875, 0.40087890625, 0.44610595703125, 0.4913330078125, 0.53656005859375, 0.581787109375, 0.62701416015625, 0.6722412109375, 0.71746826171875, 0.7626953125, 0.80792236328125, 0.8531494140625, 0.89837646484375, 0.943603515625, 0.98883056640625, 1.0340576171875, 1.07928466796875, 1.12451171875, 1.16973876953125, 1.2149658203125, 1.26019287109375, 1.305419921875, 1.35064697265625, 1.3958740234375, 1.44110107421875, 1.486328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 1.0, 11.0, 12.0, 24.0, 34.0, 52.0, 66.0, 105.0, 138.0, 231.0, 358.0, 622.0, 1085.0, 2223.0, 4879.0, 12454.0, 38183.0, 130315.0, 389692.0, 322990.0, 97387.0, 29203.0, 10148.0, 4073.0, 1819.0, 936.0, 549.0, 348.0, 215.0, 117.0, 93.0, 62.0, 29.0, 31.0, 24.0, 17.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4833984375, -1.4396209716796875, -1.395843505859375, -1.3520660400390625, -1.30828857421875, -1.2645111083984375, -1.220733642578125, -1.1769561767578125, -1.1331787109375, -1.0894012451171875, -1.045623779296875, -1.0018463134765625, -0.95806884765625, -0.9142913818359375, -0.870513916015625, -0.8267364501953125, -0.782958984375, -0.7391815185546875, -0.695404052734375, -0.6516265869140625, -0.60784912109375, -0.5640716552734375, -0.520294189453125, -0.4765167236328125, -0.4327392578125, -0.3889617919921875, -0.345184326171875, -0.3014068603515625, -0.25762939453125, -0.2138519287109375, -0.170074462890625, -0.1262969970703125, -0.08251953125, -0.0387420654296875, 0.005035400390625, 0.0488128662109375, 0.09259033203125, 0.1363677978515625, 0.180145263671875, 0.2239227294921875, 0.2677001953125, 0.3114776611328125, 0.355255126953125, 0.3990325927734375, 0.44281005859375, 0.4865875244140625, 0.530364990234375, 0.5741424560546875, 0.617919921875, 0.6616973876953125, 0.705474853515625, 0.7492523193359375, 0.79302978515625, 0.8368072509765625, 0.880584716796875, 0.9243621826171875, 0.9681396484375, 1.0119171142578125, 1.055694580078125, 1.0994720458984375, 1.14324951171875, 1.1870269775390625, 1.230804443359375, 1.2745819091796875, 1.318359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 8.0, 13.0, 12.0, 13.0, 14.0, 16.0, 14.0, 17.0, 18.0, 27.0, 26.0, 20.0, 33.0, 27.0, 38.0, 45.0, 34.0, 29.0, 35.0, 44.0, 41.0, 46.0, 42.0, 27.0, 27.0, 37.0, 33.0, 25.0, 24.0, 22.0, 19.0, 22.0, 27.0, 19.0, 17.0, 17.0, 11.0, 11.0, 7.0, 5.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9482421875, -0.9193344116210938, -0.8904266357421875, -0.8615188598632812, -0.832611083984375, -0.8037033081054688, -0.7747955322265625, -0.7458877563476562, -0.71697998046875, -0.6880722045898438, -0.6591644287109375, -0.6302566528320312, -0.601348876953125, -0.5724411010742188, -0.5435333251953125, -0.5146255493164062, -0.4857177734375, -0.45680999755859375, -0.4279022216796875, -0.39899444580078125, -0.370086669921875, -0.34117889404296875, -0.3122711181640625, -0.28336334228515625, -0.25445556640625, -0.22554779052734375, -0.1966400146484375, -0.16773223876953125, -0.138824462890625, -0.10991668701171875, -0.0810089111328125, -0.05210113525390625, -0.023193359375, 0.00571441650390625, 0.0346221923828125, 0.06352996826171875, 0.092437744140625, 0.12134552001953125, 0.1502532958984375, 0.17916107177734375, 0.20806884765625, 0.23697662353515625, 0.2658843994140625, 0.29479217529296875, 0.323699951171875, 0.35260772705078125, 0.3815155029296875, 0.41042327880859375, 0.4393310546875, 0.46823883056640625, 0.4971466064453125, 0.5260543823242188, 0.554962158203125, 0.5838699340820312, 0.6127777099609375, 0.6416854858398438, 0.67059326171875, 0.6995010375976562, 0.7284088134765625, 0.7573165893554688, 0.786224365234375, 0.8151321411132812, 0.8440399169921875, 0.8729476928710938, 0.90185546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 9.0, 12.0, 16.0, 23.0, 31.0, 49.0, 56.0, 78.0, 100.0, 157.0, 193.0, 277.0, 382.0, 552.0, 923.0, 1438.0, 2798.0, 6708.0, 28105.0, 601080.0, 371774.0, 21285.0, 5694.0, 2531.0, 1413.0, 835.0, 544.0, 383.0, 292.0, 191.0, 170.0, 102.0, 89.0, 64.0, 48.0, 41.0, 19.0, 23.0, 21.0, 14.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2080078125, -1.1662445068359375, -1.124481201171875, -1.0827178955078125, -1.04095458984375, -0.9991912841796875, -0.957427978515625, -0.9156646728515625, -0.8739013671875, -0.8321380615234375, -0.790374755859375, -0.7486114501953125, -0.70684814453125, -0.6650848388671875, -0.623321533203125, -0.5815582275390625, -0.539794921875, -0.4980316162109375, -0.456268310546875, -0.4145050048828125, -0.37274169921875, -0.3309783935546875, -0.289215087890625, -0.2474517822265625, -0.2056884765625, -0.1639251708984375, -0.122161865234375, -0.0803985595703125, -0.03863525390625, 0.0031280517578125, 0.044891357421875, 0.0866546630859375, 0.12841796875, 0.1701812744140625, 0.211944580078125, 0.2537078857421875, 0.29547119140625, 0.3372344970703125, 0.378997802734375, 0.4207611083984375, 0.4625244140625, 0.5042877197265625, 0.546051025390625, 0.5878143310546875, 0.62957763671875, 0.6713409423828125, 0.713104248046875, 0.7548675537109375, 0.796630859375, 0.8383941650390625, 0.880157470703125, 0.9219207763671875, 0.96368408203125, 1.0054473876953125, 1.047210693359375, 1.0889739990234375, 1.1307373046875, 1.1725006103515625, 1.214263916015625, 1.2560272216796875, 1.29779052734375, 1.3395538330078125, 1.381317138671875, 1.4230804443359375, 1.46484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 10.0, 7.0, 37.0, 166.0, 378.0, 271.0, 90.0, 23.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017905235290527344, -0.00017454568296670914, -0.00017003901302814484, -0.00016553234308958054, -0.00016102567315101624, -0.00015651900321245193, -0.00015201233327388763, -0.00014750566333532333, -0.00014299899339675903, -0.00013849232345819473, -0.00013398565351963043, -0.00012947898358106613, -0.00012497231364250183, -0.00012046564370393753, -0.00011595897376537323, -0.00011145230382680893, -0.00010694563388824463, -0.00010243896394968033, -9.793229401111603e-05, -9.342562407255173e-05, -8.891895413398743e-05, -8.441228419542313e-05, -7.990561425685883e-05, -7.539894431829453e-05, -7.089227437973022e-05, -6.638560444116592e-05, -6.187893450260162e-05, -5.737226456403732e-05, -5.286559462547302e-05, -4.835892468690872e-05, -4.385225474834442e-05, -3.934558480978012e-05, -3.483891487121582e-05, -3.033224493265152e-05, -2.582557499408722e-05, -2.131890505552292e-05, -1.6812235116958618e-05, -1.2305565178394318e-05, -7.798895239830017e-06, -3.2922253012657166e-06, 1.214444637298584e-06, 5.7211145758628845e-06, 1.0227784514427185e-05, 1.4734454452991486e-05, 1.9241124391555786e-05, 2.3747794330120087e-05, 2.8254464268684387e-05, 3.276113420724869e-05, 3.726780414581299e-05, 4.177447408437729e-05, 4.628114402294159e-05, 5.078781396150589e-05, 5.529448390007019e-05, 5.980115383863449e-05, 6.430782377719879e-05, 6.881449371576309e-05, 7.332116365432739e-05, 7.782783359289169e-05, 8.2334503531456e-05, 8.68411734700203e-05, 9.13478434085846e-05, 9.58545133471489e-05, 0.0001003611832857132, 0.0001048678532242775, 0.0001093745231628418]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 18.0, 22.0, 33.0, 32.0, 56.0, 84.0, 101.0, 159.0, 233.0, 403.0, 732.0, 1164.0, 2207.0, 4459.0, 10179.0, 27892.0, 102862.0, 413747.0, 356340.0, 85602.0, 24236.0, 9093.0, 3952.0, 2007.0, 1109.0, 622.0, 392.0, 254.0, 155.0, 96.0, 66.0, 53.0, 42.0, 29.0, 25.0, 18.0, 9.0, 5.0, 5.0, 5.0, 5.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.75830078125, -0.7359542846679688, -0.7136077880859375, -0.6912612915039062, -0.668914794921875, -0.6465682983398438, -0.6242218017578125, -0.6018753051757812, -0.57952880859375, -0.5571823120117188, -0.5348358154296875, -0.5124893188476562, -0.490142822265625, -0.46779632568359375, -0.4454498291015625, -0.42310333251953125, -0.4007568359375, -0.37841033935546875, -0.3560638427734375, -0.33371734619140625, -0.311370849609375, -0.28902435302734375, -0.2666778564453125, -0.24433135986328125, -0.22198486328125, -0.19963836669921875, -0.1772918701171875, -0.15494537353515625, -0.132598876953125, -0.11025238037109375, -0.0879058837890625, -0.06555938720703125, -0.043212890625, -0.02086639404296875, 0.0014801025390625, 0.02382659912109375, 0.046173095703125, 0.06851959228515625, 0.0908660888671875, 0.11321258544921875, 0.13555908203125, 0.15790557861328125, 0.1802520751953125, 0.20259857177734375, 0.224945068359375, 0.24729156494140625, 0.2696380615234375, 0.29198455810546875, 0.3143310546875, 0.33667755126953125, 0.3590240478515625, 0.38137054443359375, 0.403717041015625, 0.42606353759765625, 0.4484100341796875, 0.47075653076171875, 0.49310302734375, 0.5154495239257812, 0.5377960205078125, 0.5601425170898438, 0.582489013671875, 0.6048355102539062, 0.6271820068359375, 0.6495285034179688, 0.671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 15.0, 18.0, 20.0, 35.0, 60.0, 128.0, 212.0, 219.0, 114.0, 70.0, 35.0, 33.0, 12.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.343505859375, -0.33570098876953125, -0.3278961181640625, -0.32009124755859375, -0.312286376953125, -0.30448150634765625, -0.2966766357421875, -0.28887176513671875, -0.28106689453125, -0.27326202392578125, -0.2654571533203125, -0.25765228271484375, -0.249847412109375, -0.24204254150390625, -0.2342376708984375, -0.22643280029296875, -0.2186279296875, -0.21082305908203125, -0.2030181884765625, -0.19521331787109375, -0.187408447265625, -0.17960357666015625, -0.1717987060546875, -0.16399383544921875, -0.15618896484375, -0.14838409423828125, -0.1405792236328125, -0.13277435302734375, -0.124969482421875, -0.11716461181640625, -0.1093597412109375, -0.10155487060546875, -0.09375, -0.08594512939453125, -0.0781402587890625, -0.07033538818359375, -0.062530517578125, -0.05472564697265625, -0.0469207763671875, -0.03911590576171875, -0.03131103515625, -0.02350616455078125, -0.0157012939453125, -0.00789642333984375, -9.1552734375e-05, 0.00771331787109375, 0.0155181884765625, 0.02332305908203125, 0.0311279296875, 0.03893280029296875, 0.0467376708984375, 0.05454254150390625, 0.062347412109375, 0.07015228271484375, 0.0779571533203125, 0.08576202392578125, 0.09356689453125, 0.10137176513671875, 0.1091766357421875, 0.11698150634765625, 0.124786376953125, 0.13259124755859375, 0.1403961181640625, 0.14820098876953125, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 12.0, 11.0, 11.0, 17.0, 20.0, 25.0, 34.0, 35.0, 37.0, 45.0, 50.0, 59.0, 78.0, 57.0, 64.0, 53.0, 62.0, 65.0, 46.0, 43.0, 33.0, 33.0, 20.0, 15.0, 20.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7161957025527954, -1.6523724794387817, -1.5885493755340576, -1.524726152420044, -1.4609029293060303, -1.3970797061920166, -1.333256483078003, -1.2694333791732788, -1.2056101560592651, -1.1417869329452515, -1.0779638290405273, -1.0141406059265137, -0.9503173828125, -0.8864941596984863, -0.8226709961891174, -0.7588478326797485, -0.6950246095657349, -0.6312013864517212, -0.5673782229423523, -0.5035550594329834, -0.4397318363189697, -0.37590864300727844, -0.31208544969558716, -0.24826225638389587, -0.1844390630722046, -0.1206158697605133, -0.05679267644882202, 0.007030516862869263, 0.07085371017456055, 0.13467690348625183, 0.19850009679794312, 0.2623232901096344, 0.32614636421203613, 0.3899695575237274, 0.4537927508354187, 0.5176159143447876, 0.5814391374588013, 0.6452623605728149, 0.7090855240821838, 0.7729086875915527, 0.8367319107055664, 0.9005551338195801, 0.964378297328949, 1.0282014608383179, 1.0920246839523315, 1.1558479070663452, 1.2196710109710693, 1.283494234085083, 1.3473174571990967, 1.4111406803131104, 1.474963903427124, 1.5387870073318481, 1.6026102304458618, 1.6664334535598755, 1.7302565574645996, 1.7940797805786133, 1.857903003692627, 1.9217262268066406, 1.9855494499206543, 2.049372673034668, 2.1131958961486816, 2.177018880844116, 2.24084210395813, 2.3046653270721436, 2.3684885501861572]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 3.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 15.0, 12.0, 22.0, 29.0, 29.0, 24.0, 28.0, 35.0, 30.0, 38.0, 37.0, 31.0, 33.0, 34.0, 46.0, 40.0, 37.0, 42.0, 38.0, 35.0, 31.0, 35.0, 28.0, 28.0, 21.0, 31.0, 12.0, 13.0, 12.0, 10.0, 16.0, 11.0, 12.0, 10.0, 2.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2592148780822754, -1.2190552949905396, -1.1788957118988037, -1.1387361288070679, -1.098576545715332, -1.0584168434143066, -1.0182572603225708, -0.978097677230835, -0.9379380941390991, -0.8977785110473633, -0.8576189279556274, -0.8174592852592468, -0.777299702167511, -0.7371401190757751, -0.6969804763793945, -0.6568208932876587, -0.6166613101959229, -0.576501727104187, -0.5363421440124512, -0.49618250131607056, -0.4560229182243347, -0.4158633351325989, -0.37570372223854065, -0.3355441093444824, -0.2953845262527466, -0.25522494316101074, -0.21506533026695251, -0.17490573227405548, -0.13474613428115845, -0.09458653628826141, -0.05442693829536438, -0.014267325401306152, 0.025892257690429688, 0.06605185568332672, 0.10621145367622375, 0.1463710516691208, 0.18653064966201782, 0.22669024765491486, 0.2668498456478119, 0.3070094585418701, 0.34716904163360596, 0.3873286247253418, 0.4274882376194, 0.46764785051345825, 0.5078074336051941, 0.5479670166969299, 0.5881266593933105, 0.6282862424850464, 0.6684458255767822, 0.7086054086685181, 0.7487649917602539, 0.7889246344566345, 0.8290842175483704, 0.8692438006401062, 0.9094034433364868, 0.9495630264282227, 0.9897226095199585, 1.0298821926116943, 1.0700417757034302, 1.110201358795166, 1.1503610610961914, 1.1905206441879272, 1.230680227279663, 1.270839810371399, 1.3109993934631348]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 8.0, 10.0, 23.0, 29.0, 54.0, 75.0, 126.0, 178.0, 292.0, 452.0, 695.0, 1067.0, 1650.0, 2535.0, 3781.0, 5759.0, 8684.0, 12999.0, 19103.0, 27869.0, 38388.0, 52981.0, 69031.0, 84784.0, 98282.0, 105789.0, 104631.0, 96323.0, 82034.0, 65992.0, 49762.0, 36587.0, 25666.0, 17795.0, 12116.0, 7964.0, 5170.0, 3386.0, 2239.0, 1430.0, 974.0, 638.0, 414.0, 273.0, 177.0, 131.0, 65.0, 60.0, 36.0, 13.0, 8.0, 10.0, 14.0, 8.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1064453125, -1.0717620849609375, -1.037078857421875, -1.0023956298828125, -0.96771240234375, -0.9330291748046875, -0.898345947265625, -0.8636627197265625, -0.8289794921875, -0.7942962646484375, -0.759613037109375, -0.7249298095703125, -0.69024658203125, -0.6555633544921875, -0.620880126953125, -0.5861968994140625, -0.551513671875, -0.5168304443359375, -0.482147216796875, -0.4474639892578125, -0.41278076171875, -0.3780975341796875, -0.343414306640625, -0.3087310791015625, -0.2740478515625, -0.2393646240234375, -0.204681396484375, -0.1699981689453125, -0.13531494140625, -0.1006317138671875, -0.065948486328125, -0.0312652587890625, 0.00341796875, 0.0381011962890625, 0.072784423828125, 0.1074676513671875, 0.14215087890625, 0.1768341064453125, 0.211517333984375, 0.2462005615234375, 0.2808837890625, 0.3155670166015625, 0.350250244140625, 0.3849334716796875, 0.41961669921875, 0.4542999267578125, 0.488983154296875, 0.5236663818359375, 0.558349609375, 0.5930328369140625, 0.627716064453125, 0.6623992919921875, 0.69708251953125, 0.7317657470703125, 0.766448974609375, 0.8011322021484375, 0.8358154296875, 0.8704986572265625, 0.905181884765625, 0.9398651123046875, 0.97454833984375, 1.0092315673828125, 1.043914794921875, 1.0785980224609375, 1.11328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 8.0, 18.0, 13.0, 18.0, 25.0, 13.0, 33.0, 36.0, 38.0, 26.0, 30.0, 42.0, 38.0, 31.0, 33.0, 33.0, 40.0, 44.0, 33.0, 45.0, 38.0, 28.0, 40.0, 28.0, 30.0, 21.0, 21.0, 25.0, 16.0, 8.0, 19.0, 12.0, 9.0, 10.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2978515625, -1.257110595703125, -1.21636962890625, -1.175628662109375, -1.1348876953125, -1.094146728515625, -1.05340576171875, -1.012664794921875, -0.971923828125, -0.931182861328125, -0.89044189453125, -0.849700927734375, -0.8089599609375, -0.768218994140625, -0.72747802734375, -0.686737060546875, -0.64599609375, -0.605255126953125, -0.56451416015625, -0.523773193359375, -0.4830322265625, -0.442291259765625, -0.40155029296875, -0.360809326171875, -0.320068359375, -0.279327392578125, -0.23858642578125, -0.197845458984375, -0.1571044921875, -0.116363525390625, -0.07562255859375, -0.034881591796875, 0.005859375, 0.046600341796875, 0.08734130859375, 0.128082275390625, 0.1688232421875, 0.209564208984375, 0.25030517578125, 0.291046142578125, 0.331787109375, 0.372528076171875, 0.41326904296875, 0.454010009765625, 0.4947509765625, 0.535491943359375, 0.57623291015625, 0.616973876953125, 0.65771484375, 0.698455810546875, 0.73919677734375, 0.779937744140625, 0.8206787109375, 0.861419677734375, 0.90216064453125, 0.942901611328125, 0.983642578125, 1.024383544921875, 1.06512451171875, 1.105865478515625, 1.1466064453125, 1.187347412109375, 1.22808837890625, 1.268829345703125, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 10.0, 22.0, 27.0, 39.0, 58.0, 90.0, 129.0, 171.0, 314.0, 443.0, 744.0, 1100.0, 1716.0, 2556.0, 3836.0, 6056.0, 8960.0, 13489.0, 19406.0, 27707.0, 38876.0, 52246.0, 68236.0, 83640.0, 96278.0, 103027.0, 102151.0, 94264.0, 82405.0, 66456.0, 51550.0, 37958.0, 27116.0, 19018.0, 12697.0, 8868.0, 5848.0, 3931.0, 2471.0, 1627.0, 1030.0, 683.0, 464.0, 296.0, 204.0, 121.0, 78.0, 45.0, 48.0, 21.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0], "bins": [-1.1064453125, -1.0728759765625, -1.039306640625, -1.0057373046875, -0.97216796875, -0.9385986328125, -0.905029296875, -0.8714599609375, -0.837890625, -0.8043212890625, -0.770751953125, -0.7371826171875, -0.70361328125, -0.6700439453125, -0.636474609375, -0.6029052734375, -0.5693359375, -0.5357666015625, -0.502197265625, -0.4686279296875, -0.43505859375, -0.4014892578125, -0.367919921875, -0.3343505859375, -0.30078125, -0.2672119140625, -0.233642578125, -0.2000732421875, -0.16650390625, -0.1329345703125, -0.099365234375, -0.0657958984375, -0.0322265625, 0.0013427734375, 0.034912109375, 0.0684814453125, 0.10205078125, 0.1356201171875, 0.169189453125, 0.2027587890625, 0.236328125, 0.2698974609375, 0.303466796875, 0.3370361328125, 0.37060546875, 0.4041748046875, 0.437744140625, 0.4713134765625, 0.5048828125, 0.5384521484375, 0.572021484375, 0.6055908203125, 0.63916015625, 0.6727294921875, 0.706298828125, 0.7398681640625, 0.7734375, 0.8070068359375, 0.840576171875, 0.8741455078125, 0.90771484375, 0.9412841796875, 0.974853515625, 1.0084228515625, 1.0419921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 15.0, 18.0, 17.0, 12.0, 21.0, 18.0, 22.0, 23.0, 18.0, 36.0, 30.0, 36.0, 39.0, 44.0, 40.0, 34.0, 43.0, 37.0, 35.0, 47.0, 37.0, 43.0, 49.0, 33.0, 30.0, 23.0, 38.0, 14.0, 24.0, 24.0, 14.0, 10.0, 11.0, 10.0, 3.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7753677368164062, -0.7480010986328125, -0.7206344604492188, -0.693267822265625, -0.6659011840820312, -0.6385345458984375, -0.6111679077148438, -0.58380126953125, -0.5564346313476562, -0.5290679931640625, -0.5017013549804688, -0.474334716796875, -0.44696807861328125, -0.4196014404296875, -0.39223480224609375, -0.3648681640625, -0.33750152587890625, -0.3101348876953125, -0.28276824951171875, -0.255401611328125, -0.22803497314453125, -0.2006683349609375, -0.17330169677734375, -0.14593505859375, -0.11856842041015625, -0.0912017822265625, -0.06383514404296875, -0.036468505859375, -0.00910186767578125, 0.0182647705078125, 0.04563140869140625, 0.072998046875, 0.10036468505859375, 0.1277313232421875, 0.15509796142578125, 0.182464599609375, 0.20983123779296875, 0.2371978759765625, 0.26456451416015625, 0.29193115234375, 0.31929779052734375, 0.3466644287109375, 0.37403106689453125, 0.401397705078125, 0.42876434326171875, 0.4561309814453125, 0.48349761962890625, 0.5108642578125, 0.5382308959960938, 0.5655975341796875, 0.5929641723632812, 0.620330810546875, 0.6476974487304688, 0.6750640869140625, 0.7024307250976562, 0.72979736328125, 0.7571640014648438, 0.7845306396484375, 0.8118972778320312, 0.839263916015625, 0.8666305541992188, 0.8939971923828125, 0.9213638305664062, 0.94873046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 9.0, 13.0, 31.0, 42.0, 61.0, 91.0, 178.0, 238.0, 365.0, 583.0, 965.0, 1513.0, 2474.0, 4178.0, 7039.0, 12463.0, 21956.0, 39284.0, 68589.0, 112228.0, 163587.0, 187293.0, 160961.0, 109378.0, 66472.0, 37843.0, 21280.0, 12082.0, 6906.0, 4105.0, 2366.0, 1444.0, 928.0, 562.0, 376.0, 210.0, 155.0, 95.0, 72.0, 41.0, 29.0, 20.0, 12.0, 15.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.92236328125, -0.894805908203125, -0.86724853515625, -0.839691162109375, -0.8121337890625, -0.784576416015625, -0.75701904296875, -0.729461669921875, -0.701904296875, -0.674346923828125, -0.64678955078125, -0.619232177734375, -0.5916748046875, -0.564117431640625, -0.53656005859375, -0.509002685546875, -0.4814453125, -0.453887939453125, -0.42633056640625, -0.398773193359375, -0.3712158203125, -0.343658447265625, -0.31610107421875, -0.288543701171875, -0.260986328125, -0.233428955078125, -0.20587158203125, -0.178314208984375, -0.1507568359375, -0.123199462890625, -0.09564208984375, -0.068084716796875, -0.04052734375, -0.012969970703125, 0.01458740234375, 0.042144775390625, 0.0697021484375, 0.097259521484375, 0.12481689453125, 0.152374267578125, 0.179931640625, 0.207489013671875, 0.23504638671875, 0.262603759765625, 0.2901611328125, 0.317718505859375, 0.34527587890625, 0.372833251953125, 0.400390625, 0.427947998046875, 0.45550537109375, 0.483062744140625, 0.5106201171875, 0.538177490234375, 0.56573486328125, 0.593292236328125, 0.620849609375, 0.648406982421875, 0.67596435546875, 0.703521728515625, 0.7310791015625, 0.758636474609375, 0.78619384765625, 0.813751220703125, 0.84130859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 25.0, 27.0, 29.0, 28.0, 27.0, 45.0, 38.0, 42.0, 42.0, 62.0, 62.0, 72.0, 48.0, 51.0, 43.0, 48.0, 47.0, 32.0, 29.0, 33.0, 23.0, 18.0, 14.0, 14.0, 12.0, 8.0, 5.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.390975952148438e-05, -7.155537605285645e-05, -6.920099258422852e-05, -6.684660911560059e-05, -6.449222564697266e-05, -6.213784217834473e-05, -5.97834587097168e-05, -5.742907524108887e-05, -5.507469177246094e-05, -5.272030830383301e-05, -5.036592483520508e-05, -4.801154136657715e-05, -4.565715789794922e-05, -4.330277442932129e-05, -4.094839096069336e-05, -3.859400749206543e-05, -3.62396240234375e-05, -3.388524055480957e-05, -3.153085708618164e-05, -2.917647361755371e-05, -2.682209014892578e-05, -2.446770668029785e-05, -2.2113323211669922e-05, -1.9758939743041992e-05, -1.7404556274414062e-05, -1.5050172805786133e-05, -1.2695789337158203e-05, -1.0341405868530273e-05, -7.987022399902344e-06, -5.632638931274414e-06, -3.2782554626464844e-06, -9.238719940185547e-07, 1.430511474609375e-06, 3.7848949432373047e-06, 6.139278411865234e-06, 8.493661880493164e-06, 1.0848045349121094e-05, 1.3202428817749023e-05, 1.5556812286376953e-05, 1.7911195755004883e-05, 2.0265579223632812e-05, 2.2619962692260742e-05, 2.4974346160888672e-05, 2.73287296295166e-05, 2.968311309814453e-05, 3.203749656677246e-05, 3.439188003540039e-05, 3.674626350402832e-05, 3.910064697265625e-05, 4.145503044128418e-05, 4.380941390991211e-05, 4.616379737854004e-05, 4.851818084716797e-05, 5.08725643157959e-05, 5.322694778442383e-05, 5.558133125305176e-05, 5.793571472167969e-05, 6.029009819030762e-05, 6.264448165893555e-05, 6.499886512756348e-05, 6.73532485961914e-05, 6.970763206481934e-05, 7.206201553344727e-05, 7.44163990020752e-05, 7.677078247070312e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 16.0, 20.0, 27.0, 49.0, 58.0, 104.0, 154.0, 224.0, 366.0, 613.0, 1018.0, 1768.0, 2840.0, 4807.0, 8372.0, 14733.0, 25419.0, 44505.0, 75655.0, 118628.0, 159821.0, 174986.0, 149433.0, 106494.0, 66374.0, 39158.0, 22162.0, 12750.0, 7421.0, 4107.0, 2534.0, 1479.0, 924.0, 536.0, 363.0, 232.0, 154.0, 92.0, 55.0, 35.0, 18.0, 18.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.84765625, -0.82147216796875, -0.7952880859375, -0.76910400390625, -0.742919921875, -0.71673583984375, -0.6905517578125, -0.66436767578125, -0.63818359375, -0.61199951171875, -0.5858154296875, -0.55963134765625, -0.533447265625, -0.50726318359375, -0.4810791015625, -0.45489501953125, -0.4287109375, -0.40252685546875, -0.3763427734375, -0.35015869140625, -0.323974609375, -0.29779052734375, -0.2716064453125, -0.24542236328125, -0.21923828125, -0.19305419921875, -0.1668701171875, -0.14068603515625, -0.114501953125, -0.08831787109375, -0.0621337890625, -0.03594970703125, -0.009765625, 0.01641845703125, 0.0426025390625, 0.06878662109375, 0.094970703125, 0.12115478515625, 0.1473388671875, 0.17352294921875, 0.19970703125, 0.22589111328125, 0.2520751953125, 0.27825927734375, 0.304443359375, 0.33062744140625, 0.3568115234375, 0.38299560546875, 0.4091796875, 0.43536376953125, 0.4615478515625, 0.48773193359375, 0.513916015625, 0.54010009765625, 0.5662841796875, 0.59246826171875, 0.61865234375, 0.64483642578125, 0.6710205078125, 0.69720458984375, 0.723388671875, 0.74957275390625, 0.7757568359375, 0.80194091796875, 0.828125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 10.0, 17.0, 12.0, 22.0, 25.0, 27.0, 44.0, 46.0, 56.0, 54.0, 65.0, 75.0, 68.0, 78.0, 64.0, 67.0, 43.0, 42.0, 35.0, 27.0, 22.0, 17.0, 22.0, 13.0, 11.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38722991943359375, -0.3760223388671875, -0.36481475830078125, -0.353607177734375, -0.34239959716796875, -0.3311920166015625, -0.31998443603515625, -0.30877685546875, -0.29756927490234375, -0.2863616943359375, -0.27515411376953125, -0.263946533203125, -0.25273895263671875, -0.2415313720703125, -0.23032379150390625, -0.2191162109375, -0.20790863037109375, -0.1967010498046875, -0.18549346923828125, -0.174285888671875, -0.16307830810546875, -0.1518707275390625, -0.14066314697265625, -0.12945556640625, -0.11824798583984375, -0.1070404052734375, -0.09583282470703125, -0.084625244140625, -0.07341766357421875, -0.0622100830078125, -0.05100250244140625, -0.039794921875, -0.02858734130859375, -0.0173797607421875, -0.00617218017578125, 0.005035400390625, 0.01624298095703125, 0.0274505615234375, 0.03865814208984375, 0.04986572265625, 0.06107330322265625, 0.0722808837890625, 0.08348846435546875, 0.094696044921875, 0.10590362548828125, 0.1171112060546875, 0.12831878662109375, 0.1395263671875, 0.15073394775390625, 0.1619415283203125, 0.17314910888671875, 0.184356689453125, 0.19556427001953125, 0.2067718505859375, 0.21797943115234375, 0.22918701171875, 0.24039459228515625, 0.2516021728515625, 0.26280975341796875, 0.274017333984375, 0.28522491455078125, 0.2964324951171875, 0.30764007568359375, 0.31884765625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 11.0, 7.0, 12.0, 19.0, 26.0, 30.0, 35.0, 33.0, 33.0, 57.0, 59.0, 64.0, 63.0, 70.0, 61.0, 64.0, 71.0, 52.0, 47.0, 38.0, 30.0, 23.0, 17.0, 18.0, 23.0, 9.0, 4.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96602463722229, -1.89926016330719, -1.8324956893920898, -1.7657313346862793, -1.6989668607711792, -1.632202386856079, -1.5654380321502686, -1.4986735582351685, -1.4319090843200684, -1.3651446104049683, -1.2983801364898682, -1.2316157817840576, -1.1648513078689575, -1.0980868339538574, -1.0313224792480469, -0.9645580053329468, -0.8977935314178467, -0.8310290575027466, -0.7642646431922913, -0.6975002288818359, -0.6307357549667358, -0.5639712810516357, -0.4972068667411804, -0.4304424226284027, -0.363677978515625, -0.2969135344028473, -0.23014909029006958, -0.16338464617729187, -0.09662020206451416, -0.02985575795173645, 0.03690868616104126, 0.10367313027381897, 0.17043781280517578, 0.2372022569179535, 0.3039667010307312, 0.3707311451435089, 0.4374955892562866, 0.5042600631713867, 0.571024477481842, 0.6377888917922974, 0.7045533657073975, 0.7713178396224976, 0.8380822539329529, 0.9048466682434082, 0.9716111421585083, 1.0383756160736084, 1.105139970779419, 1.171904444694519, 1.2386689186096191, 1.3054333925247192, 1.3721978664398193, 1.4389622211456299, 1.50572669506073, 1.57249116897583, 1.6392555236816406, 1.7060199975967407, 1.7727844715118408, 1.839548945426941, 1.906313419342041, 1.9730777740478516, 2.039842128753662, 2.1066067218780518, 2.1733710765838623, 2.240135669708252, 2.3069000244140625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 2.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 9.0, 8.0, 12.0, 9.0, 14.0, 17.0, 17.0, 29.0, 22.0, 20.0, 30.0, 22.0, 25.0, 29.0, 36.0, 37.0, 30.0, 24.0, 41.0, 46.0, 43.0, 31.0, 30.0, 40.0, 40.0, 33.0, 32.0, 33.0, 18.0, 14.0, 23.0, 16.0, 25.0, 13.0, 12.0, 16.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1299009323120117, -1.0913114547729492, -1.0527218580245972, -1.0141323804855347, -0.9755429029464722, -0.9369533658027649, -0.8983638286590576, -0.8597743511199951, -0.8211848139762878, -0.7825952768325806, -0.7440057992935181, -0.7054162621498108, -0.6668267250061035, -0.628237247467041, -0.5896477103233337, -0.5510581731796265, -0.512468695640564, -0.4738791882991791, -0.4352896809577942, -0.3967001438140869, -0.358110636472702, -0.31952112913131714, -0.28093159198760986, -0.24234208464622498, -0.2037525773048401, -0.1651630699634552, -0.12657354772090912, -0.08798403292894363, -0.04939451813697815, -0.010805010795593262, 0.02778451144695282, 0.0663740336894989, 0.10496342182159424, 0.14355292916297913, 0.1821424514055252, 0.2207319736480713, 0.2593214809894562, 0.29791098833084106, 0.33650052547454834, 0.3750900328159332, 0.4136795401573181, 0.452269047498703, 0.4908585548400879, 0.5294480919837952, 0.5680376291275024, 0.6066271066665649, 0.6452166438102722, 0.6838061809539795, 0.722395658493042, 0.7609851956367493, 0.7995746731758118, 0.838164210319519, 0.8767536878585815, 0.9153432250022888, 0.9539327621459961, 0.9925222396850586, 1.031111717224121, 1.0697011947631836, 1.1082907915115356, 1.1468802690505981, 1.1854697465896606, 1.2240593433380127, 1.2626488208770752, 1.3012382984161377, 1.3398278951644897]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 11.0, 22.0, 35.0, 56.0, 97.0, 163.0, 267.0, 412.0, 617.0, 1047.0, 1675.0, 2741.0, 4423.0, 7275.0, 11679.0, 19559.0, 31746.0, 52151.0, 84917.0, 136164.0, 215054.0, 320890.0, 445944.0, 551682.0, 584934.0, 526040.0, 409265.0, 287414.0, 189352.0, 119317.0, 73346.0, 45020.0, 27438.0, 16638.0, 10245.0, 6144.0, 3970.0, 2380.0, 1519.0, 949.0, 625.0, 398.0, 268.0, 156.0, 81.0, 64.0, 39.0, 22.0, 18.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.0457611083984375, -1.007537841796875, -0.9693145751953125, -0.93109130859375, -0.8928680419921875, -0.854644775390625, -0.8164215087890625, -0.7781982421875, -0.7399749755859375, -0.701751708984375, -0.6635284423828125, -0.62530517578125, -0.5870819091796875, -0.548858642578125, -0.5106353759765625, -0.472412109375, -0.4341888427734375, -0.395965576171875, -0.3577423095703125, -0.31951904296875, -0.2812957763671875, -0.243072509765625, -0.2048492431640625, -0.1666259765625, -0.1284027099609375, -0.090179443359375, -0.0519561767578125, -0.01373291015625, 0.0244903564453125, 0.062713623046875, 0.1009368896484375, 0.13916015625, 0.1773834228515625, 0.215606689453125, 0.2538299560546875, 0.29205322265625, 0.3302764892578125, 0.368499755859375, 0.4067230224609375, 0.4449462890625, 0.4831695556640625, 0.521392822265625, 0.5596160888671875, 0.59783935546875, 0.6360626220703125, 0.674285888671875, 0.7125091552734375, 0.750732421875, 0.7889556884765625, 0.827178955078125, 0.8654022216796875, 0.90362548828125, 0.9418487548828125, 0.980072021484375, 1.0182952880859375, 1.0565185546875, 1.0947418212890625, 1.132965087890625, 1.1711883544921875, 1.20941162109375, 1.2476348876953125, 1.285858154296875, 1.3240814208984375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 11.0, 17.0, 21.0, 18.0, 16.0, 24.0, 27.0, 33.0, 26.0, 30.0, 40.0, 44.0, 41.0, 32.0, 40.0, 50.0, 46.0, 38.0, 39.0, 36.0, 48.0, 39.0, 33.0, 31.0, 18.0, 24.0, 22.0, 20.0, 21.0, 19.0, 12.0, 8.0, 5.0, 9.0, 11.0, 4.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0205078125, -0.987518310546875, -0.95452880859375, -0.921539306640625, -0.8885498046875, -0.855560302734375, -0.82257080078125, -0.789581298828125, -0.756591796875, -0.723602294921875, -0.69061279296875, -0.657623291015625, -0.6246337890625, -0.591644287109375, -0.55865478515625, -0.525665283203125, -0.49267578125, -0.459686279296875, -0.42669677734375, -0.393707275390625, -0.3607177734375, -0.327728271484375, -0.29473876953125, -0.261749267578125, -0.228759765625, -0.195770263671875, -0.16278076171875, -0.129791259765625, -0.0968017578125, -0.063812255859375, -0.03082275390625, 0.002166748046875, 0.03515625, 0.068145751953125, 0.10113525390625, 0.134124755859375, 0.1671142578125, 0.200103759765625, 0.23309326171875, 0.266082763671875, 0.299072265625, 0.332061767578125, 0.36505126953125, 0.398040771484375, 0.4310302734375, 0.464019775390625, 0.49700927734375, 0.529998779296875, 0.56298828125, 0.595977783203125, 0.62896728515625, 0.661956787109375, 0.6949462890625, 0.727935791015625, 0.76092529296875, 0.793914794921875, 0.826904296875, 0.859893798828125, 0.89288330078125, 0.925872802734375, 0.9588623046875, 0.991851806640625, 1.02484130859375, 1.057830810546875, 1.0908203125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 7.0, 8.0, 10.0, 21.0, 33.0, 42.0, 81.0, 86.0, 161.0, 251.0, 405.0, 686.0, 1126.0, 1752.0, 2789.0, 4616.0, 7535.0, 12585.0, 20347.0, 33214.0, 53900.0, 85864.0, 132855.0, 197985.0, 282884.0, 376772.0, 460876.0, 508345.0, 497358.0, 434073.0, 344207.0, 251626.0, 174302.0, 115185.0, 73336.0, 45993.0, 28355.0, 17249.0, 10592.0, 6422.0, 3939.0, 2386.0, 1518.0, 959.0, 563.0, 398.0, 211.0, 131.0, 89.0, 68.0, 40.0, 15.0, 19.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.070556640625, -1.03466796875, -0.998779296875, -0.962890625, -0.927001953125, -0.89111328125, -0.855224609375, -0.8193359375, -0.783447265625, -0.74755859375, -0.711669921875, -0.67578125, -0.639892578125, -0.60400390625, -0.568115234375, -0.5322265625, -0.496337890625, -0.46044921875, -0.424560546875, -0.388671875, -0.352783203125, -0.31689453125, -0.281005859375, -0.2451171875, -0.209228515625, -0.17333984375, -0.137451171875, -0.1015625, -0.065673828125, -0.02978515625, 0.006103515625, 0.0419921875, 0.077880859375, 0.11376953125, 0.149658203125, 0.185546875, 0.221435546875, 0.25732421875, 0.293212890625, 0.3291015625, 0.364990234375, 0.40087890625, 0.436767578125, 0.47265625, 0.508544921875, 0.54443359375, 0.580322265625, 0.6162109375, 0.652099609375, 0.68798828125, 0.723876953125, 0.759765625, 0.795654296875, 0.83154296875, 0.867431640625, 0.9033203125, 0.939208984375, 0.97509765625, 1.010986328125, 1.046875, 1.082763671875, 1.11865234375, 1.154541015625, 1.1904296875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 6.0, 11.0, 12.0, 17.0, 34.0, 34.0, 33.0, 42.0, 49.0, 46.0, 72.0, 80.0, 107.0, 120.0, 154.0, 151.0, 166.0, 190.0, 192.0, 201.0, 213.0, 230.0, 240.0, 201.0, 206.0, 165.0, 164.0, 153.0, 132.0, 119.0, 100.0, 88.0, 67.0, 49.0, 58.0, 34.0, 23.0, 25.0, 18.0, 9.0, 10.0, 12.0, 11.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4644126892089844, -0.44860076904296875, -0.4327888488769531, -0.4169769287109375, -0.4011650085449219, -0.38535308837890625, -0.3695411682128906, -0.353729248046875, -0.3379173278808594, -0.32210540771484375, -0.3062934875488281, -0.2904815673828125, -0.2746696472167969, -0.25885772705078125, -0.24304580688476562, -0.22723388671875, -0.21142196655273438, -0.19561004638671875, -0.17979812622070312, -0.1639862060546875, -0.14817428588867188, -0.13236236572265625, -0.11655044555664062, -0.100738525390625, -0.08492660522460938, -0.06911468505859375, -0.053302764892578125, -0.0374908447265625, -0.021678924560546875, -0.00586700439453125, 0.009944915771484375, 0.0257568359375, 0.041568756103515625, 0.05738067626953125, 0.07319259643554688, 0.0890045166015625, 0.10481643676757812, 0.12062835693359375, 0.13644027709960938, 0.152252197265625, 0.16806411743164062, 0.18387603759765625, 0.19968795776367188, 0.2154998779296875, 0.23131179809570312, 0.24712371826171875, 0.2629356384277344, 0.27874755859375, 0.2945594787597656, 0.31037139892578125, 0.3261833190917969, 0.3419952392578125, 0.3578071594238281, 0.37361907958984375, 0.3894309997558594, 0.405242919921875, 0.4210548400878906, 0.43686676025390625, 0.4526786804199219, 0.4684906005859375, 0.4843025207519531, 0.5001144409179688, 0.5159263610839844, 0.53173828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 7.0, 9.0, 9.0, 10.0, 14.0, 18.0, 24.0, 23.0, 32.0, 37.0, 44.0, 46.0, 51.0, 66.0, 67.0, 52.0, 71.0, 53.0, 52.0, 37.0, 42.0, 38.0, 35.0, 31.0, 27.0, 20.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 4.0, 8.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5019704103469849, -1.4478763341903687, -1.393782377243042, -1.3396883010864258, -1.2855942249298096, -1.231500267982483, -1.1774061918258667, -1.12331223487854, -1.0692181587219238, -1.0151240825653076, -0.961030125617981, -0.9069360494613647, -0.8528420329093933, -0.7987480163574219, -0.7446539402008057, -0.6905599236488342, -0.6364659070968628, -0.5823718905448914, -0.5282778739929199, -0.4741837978363037, -0.4200897812843323, -0.36599576473236084, -0.311901718378067, -0.2578076720237732, -0.20371365547180176, -0.14961962401866913, -0.0955255925655365, -0.04143156111240387, 0.01266247034072876, 0.0667564868927002, 0.12085053324699402, 0.17494457960128784, 0.22903847694396973, 0.28313249349594116, 0.337226539850235, 0.3913205862045288, 0.44541460275650024, 0.4995086193084717, 0.5536026954650879, 0.6076967120170593, 0.6617907285690308, 0.7158847451210022, 0.7699787616729736, 0.8240728378295898, 0.8781668543815613, 0.9322608709335327, 0.9863549470901489, 1.0404489040374756, 1.0945429801940918, 1.148637056350708, 1.2027310132980347, 1.2568250894546509, 1.3109190464019775, 1.3650131225585938, 1.41910719871521, 1.4732012748718262, 1.5272952318191528, 1.581389307975769, 1.6354832649230957, 1.689577341079712, 1.7436714172363281, 1.7977653741836548, 1.851859450340271, 1.9059534072875977, 1.9600474834442139]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 14.0, 12.0, 4.0, 7.0, 9.0, 20.0, 15.0, 15.0, 21.0, 20.0, 38.0, 21.0, 32.0, 28.0, 28.0, 35.0, 37.0, 38.0, 42.0, 44.0, 29.0, 30.0, 35.0, 37.0, 34.0, 27.0, 29.0, 34.0, 34.0, 22.0, 25.0, 23.0, 23.0, 20.0, 11.0, 15.0, 16.0, 17.0, 16.0, 6.0, 6.0, 4.0, 8.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.111849308013916, -1.0768101215362549, -1.0417709350585938, -1.0067317485809326, -0.9716925621032715, -0.9366533756256104, -0.9016141295433044, -0.8665749430656433, -0.8315357565879822, -0.796496570110321, -0.7614573836326599, -0.7264181971549988, -0.6913789510726929, -0.6563397645950317, -0.6213005781173706, -0.5862613916397095, -0.5512222051620483, -0.5161830186843872, -0.4811438322067261, -0.44610461592674255, -0.4110654294490814, -0.3760262429714203, -0.34098702669143677, -0.30594784021377563, -0.2709086537361145, -0.23586946725845337, -0.20083026587963104, -0.16579106450080872, -0.13075187802314758, -0.09571269154548645, -0.060673490166664124, -0.025634288787841797, 0.009405016899108887, 0.044444210827350616, 0.07948340475559235, 0.11452259868383408, 0.1495617926120758, 0.18460097908973694, 0.21964018046855927, 0.2546793818473816, 0.2897185683250427, 0.32475775480270386, 0.359796941280365, 0.3948361575603485, 0.42987534403800964, 0.4649145305156708, 0.4999537467956543, 0.5349929332733154, 0.5700321197509766, 0.6050713062286377, 0.6401104927062988, 0.67514967918396, 0.7101888656616211, 0.7452280521392822, 0.7802672982215881, 0.8153064846992493, 0.8503456711769104, 0.8853848576545715, 0.9204240441322327, 0.9554632306098938, 0.9905024766921997, 1.0255416631698608, 1.060580849647522, 1.095620036125183, 1.1306592226028442]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 1.0, 10.0, 8.0, 15.0, 21.0, 24.0, 22.0, 54.0, 63.0, 88.0, 141.0, 198.0, 277.0, 439.0, 731.0, 1047.0, 1769.0, 2715.0, 4535.0, 7041.0, 11846.0, 19658.0, 32748.0, 53931.0, 87933.0, 135080.0, 176522.0, 173044.0, 127677.0, 82773.0, 50333.0, 30352.0, 18346.0, 11088.0, 6773.0, 4067.0, 2531.0, 1661.0, 1032.0, 662.0, 406.0, 300.0, 183.0, 128.0, 91.0, 45.0, 59.0, 29.0, 19.0, 11.0, 9.0, 10.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416748046875, -0.40234375, -0.387939453125, -0.37353515625, -0.359130859375, -0.3447265625, -0.330322265625, -0.31591796875, -0.301513671875, -0.287109375, -0.272705078125, -0.25830078125, -0.243896484375, -0.2294921875, -0.215087890625, -0.20068359375, -0.186279296875, -0.171875, -0.157470703125, -0.14306640625, -0.128662109375, -0.1142578125, -0.099853515625, -0.08544921875, -0.071044921875, -0.056640625, -0.042236328125, -0.02783203125, -0.013427734375, 0.0009765625, 0.015380859375, 0.02978515625, 0.044189453125, 0.05859375, 0.072998046875, 0.08740234375, 0.101806640625, 0.1162109375, 0.130615234375, 0.14501953125, 0.159423828125, 0.173828125, 0.188232421875, 0.20263671875, 0.217041015625, 0.2314453125, 0.245849609375, 0.26025390625, 0.274658203125, 0.2890625, 0.303466796875, 0.31787109375, 0.332275390625, 0.3466796875, 0.361083984375, 0.37548828125, 0.389892578125, 0.404296875, 0.418701171875, 0.43310546875, 0.447509765625, 0.4619140625, 0.476318359375, 0.49072265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 11.0, 12.0, 14.0, 10.0, 16.0, 12.0, 18.0, 33.0, 23.0, 27.0, 36.0, 27.0, 27.0, 46.0, 35.0, 41.0, 43.0, 40.0, 38.0, 45.0, 30.0, 42.0, 42.0, 36.0, 31.0, 25.0, 32.0, 23.0, 31.0, 20.0, 24.0, 12.0, 19.0, 11.0, 13.0, 7.0, 13.0, 6.0, 2.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2594757080078125, -1.219146728515625, -1.1788177490234375, -1.13848876953125, -1.0981597900390625, -1.057830810546875, -1.0175018310546875, -0.9771728515625, -0.9368438720703125, -0.896514892578125, -0.8561859130859375, -0.81585693359375, -0.7755279541015625, -0.735198974609375, -0.6948699951171875, -0.654541015625, -0.6142120361328125, -0.573883056640625, -0.5335540771484375, -0.49322509765625, -0.4528961181640625, -0.412567138671875, -0.3722381591796875, -0.3319091796875, -0.2915802001953125, -0.251251220703125, -0.2109222412109375, -0.17059326171875, -0.1302642822265625, -0.089935302734375, -0.0496063232421875, -0.00927734375, 0.0310516357421875, 0.071380615234375, 0.1117095947265625, 0.15203857421875, 0.1923675537109375, 0.232696533203125, 0.2730255126953125, 0.3133544921875, 0.3536834716796875, 0.394012451171875, 0.4343414306640625, 0.47467041015625, 0.5149993896484375, 0.555328369140625, 0.5956573486328125, 0.635986328125, 0.6763153076171875, 0.716644287109375, 0.7569732666015625, 0.79730224609375, 0.8376312255859375, 0.877960205078125, 0.9182891845703125, 0.9586181640625, 0.9989471435546875, 1.039276123046875, 1.0796051025390625, 1.11993408203125, 1.1602630615234375, 1.200592041015625, 1.2409210205078125, 1.28125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 10.0, 10.0, 20.0, 36.0, 42.0, 66.0, 105.0, 174.0, 210.0, 367.0, 569.0, 1026.0, 1787.0, 3248.0, 6200.0, 11638.0, 23402.0, 47637.0, 96681.0, 184208.0, 259963.0, 198395.0, 106425.0, 52593.0, 25850.0, 12901.0, 6659.0, 3507.0, 1894.0, 1119.0, 631.0, 464.0, 264.0, 163.0, 99.0, 68.0, 48.0, 26.0, 20.0, 14.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6123046875, -0.593505859375, -0.57470703125, -0.555908203125, -0.537109375, -0.518310546875, -0.49951171875, -0.480712890625, -0.4619140625, -0.443115234375, -0.42431640625, -0.405517578125, -0.38671875, -0.367919921875, -0.34912109375, -0.330322265625, -0.3115234375, -0.292724609375, -0.27392578125, -0.255126953125, -0.236328125, -0.217529296875, -0.19873046875, -0.179931640625, -0.1611328125, -0.142333984375, -0.12353515625, -0.104736328125, -0.0859375, -0.067138671875, -0.04833984375, -0.029541015625, -0.0107421875, 0.008056640625, 0.02685546875, 0.045654296875, 0.064453125, 0.083251953125, 0.10205078125, 0.120849609375, 0.1396484375, 0.158447265625, 0.17724609375, 0.196044921875, 0.21484375, 0.233642578125, 0.25244140625, 0.271240234375, 0.2900390625, 0.308837890625, 0.32763671875, 0.346435546875, 0.365234375, 0.384033203125, 0.40283203125, 0.421630859375, 0.4404296875, 0.459228515625, 0.47802734375, 0.496826171875, 0.515625, 0.534423828125, 0.55322265625, 0.572021484375, 0.5908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 7.0, 17.0, 19.0, 17.0, 26.0, 31.0, 35.0, 34.0, 29.0, 32.0, 39.0, 34.0, 40.0, 41.0, 42.0, 47.0, 42.0, 37.0, 44.0, 51.0, 30.0, 34.0, 34.0, 32.0, 23.0, 18.0, 17.0, 17.0, 21.0, 16.0, 11.0, 7.0, 14.0, 2.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7228012084960938, -0.6951141357421875, -0.6674270629882812, -0.639739990234375, -0.6120529174804688, -0.5843658447265625, -0.5566787719726562, -0.52899169921875, -0.5013046264648438, -0.4736175537109375, -0.44593048095703125, -0.418243408203125, -0.39055633544921875, -0.3628692626953125, -0.33518218994140625, -0.3074951171875, -0.27980804443359375, -0.2521209716796875, -0.22443389892578125, -0.196746826171875, -0.16905975341796875, -0.1413726806640625, -0.11368560791015625, -0.08599853515625, -0.05831146240234375, -0.0306243896484375, -0.00293731689453125, 0.024749755859375, 0.05243682861328125, 0.0801239013671875, 0.10781097412109375, 0.135498046875, 0.16318511962890625, 0.1908721923828125, 0.21855926513671875, 0.246246337890625, 0.27393341064453125, 0.3016204833984375, 0.32930755615234375, 0.35699462890625, 0.38468170166015625, 0.4123687744140625, 0.44005584716796875, 0.467742919921875, 0.49542999267578125, 0.5231170654296875, 0.5508041381835938, 0.5784912109375, 0.6061782836914062, 0.6338653564453125, 0.6615524291992188, 0.689239501953125, 0.7169265747070312, 0.7446136474609375, 0.7723007202148438, 0.79998779296875, 0.8276748657226562, 0.8553619384765625, 0.8830490112304688, 0.910736083984375, 0.9384231567382812, 0.9661102294921875, 0.9937973022460938, 1.021484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 18.0, 21.0, 29.0, 32.0, 45.0, 78.0, 123.0, 131.0, 184.0, 244.0, 346.0, 439.0, 569.0, 871.0, 1205.0, 1694.0, 2662.0, 3800.0, 5977.0, 9812.0, 16993.0, 31692.0, 65999.0, 149403.0, 301991.0, 238409.0, 105710.0, 48787.0, 24321.0, 13262.0, 8045.0, 5030.0, 3163.0, 2192.0, 1452.0, 1065.0, 732.0, 555.0, 368.0, 308.0, 209.0, 185.0, 84.0, 92.0, 64.0, 43.0, 29.0, 26.0, 19.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0], "bins": [-0.2322998046875, -0.22542572021484375, -0.2185516357421875, -0.21167755126953125, -0.204803466796875, -0.19792938232421875, -0.1910552978515625, -0.18418121337890625, -0.17730712890625, -0.17043304443359375, -0.1635589599609375, -0.15668487548828125, -0.149810791015625, -0.14293670654296875, -0.1360626220703125, -0.12918853759765625, -0.122314453125, -0.11544036865234375, -0.1085662841796875, -0.10169219970703125, -0.094818115234375, -0.08794403076171875, -0.0810699462890625, -0.07419586181640625, -0.06732177734375, -0.06044769287109375, -0.0535736083984375, -0.04669952392578125, -0.039825439453125, -0.03295135498046875, -0.0260772705078125, -0.01920318603515625, -0.0123291015625, -0.00545501708984375, 0.0014190673828125, 0.00829315185546875, 0.015167236328125, 0.02204132080078125, 0.0289154052734375, 0.03578948974609375, 0.04266357421875, 0.04953765869140625, 0.0564117431640625, 0.06328582763671875, 0.070159912109375, 0.07703399658203125, 0.0839080810546875, 0.09078216552734375, 0.09765625, 0.10453033447265625, 0.1114044189453125, 0.11827850341796875, 0.125152587890625, 0.13202667236328125, 0.1389007568359375, 0.14577484130859375, 0.15264892578125, 0.15952301025390625, 0.1663970947265625, 0.17327117919921875, 0.180145263671875, 0.18701934814453125, 0.1938934326171875, 0.20076751708984375, 0.2076416015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 13.0, 5.0, 13.0, 19.0, 15.0, 26.0, 30.0, 31.0, 39.0, 70.0, 64.0, 76.0, 85.0, 82.0, 72.0, 78.0, 62.0, 53.0, 24.0, 27.0, 24.0, 15.0, 17.0, 10.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.2709369659423828e-05, -2.2079795598983765e-05, -2.14502215385437e-05, -2.0820647478103638e-05, -2.0191073417663574e-05, -1.956149935722351e-05, -1.8931925296783447e-05, -1.8302351236343384e-05, -1.767277717590332e-05, -1.7043203115463257e-05, -1.6413629055023193e-05, -1.578405499458313e-05, -1.5154480934143066e-05, -1.4524906873703003e-05, -1.389533281326294e-05, -1.3265758752822876e-05, -1.2636184692382812e-05, -1.2006610631942749e-05, -1.1377036571502686e-05, -1.0747462511062622e-05, -1.0117888450622559e-05, -9.488314390182495e-06, -8.858740329742432e-06, -8.229166269302368e-06, -7.599592208862305e-06, -6.970018148422241e-06, -6.340444087982178e-06, -5.710870027542114e-06, -5.081295967102051e-06, -4.451721906661987e-06, -3.822147846221924e-06, -3.1925737857818604e-06, -2.562999725341797e-06, -1.9334256649017334e-06, -1.30385160446167e-06, -6.742775440216064e-07, -4.470348358154297e-08, 5.848705768585205e-07, 1.214444637298584e-06, 1.8440186977386475e-06, 2.473592758178711e-06, 3.1031668186187744e-06, 3.732740879058838e-06, 4.362314939498901e-06, 4.991888999938965e-06, 5.621463060379028e-06, 6.251037120819092e-06, 6.880611181259155e-06, 7.510185241699219e-06, 8.139759302139282e-06, 8.769333362579346e-06, 9.39890742301941e-06, 1.0028481483459473e-05, 1.0658055543899536e-05, 1.12876296043396e-05, 1.1917203664779663e-05, 1.2546777725219727e-05, 1.317635178565979e-05, 1.3805925846099854e-05, 1.4435499906539917e-05, 1.506507396697998e-05, 1.5694648027420044e-05, 1.6324222087860107e-05, 1.695379614830017e-05, 1.7583370208740234e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 3.0, 18.0, 12.0, 25.0, 32.0, 40.0, 72.0, 115.0, 160.0, 248.0, 414.0, 642.0, 935.0, 1456.0, 2144.0, 3403.0, 5216.0, 8202.0, 13302.0, 21351.0, 34753.0, 58266.0, 99458.0, 161448.0, 206357.0, 166801.0, 104936.0, 61770.0, 36595.0, 22115.0, 13847.0, 8758.0, 5522.0, 3507.0, 2361.0, 1517.0, 1005.0, 611.0, 377.0, 267.0, 154.0, 114.0, 73.0, 40.0, 38.0, 21.0, 28.0, 7.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.2200927734375, -0.21372222900390625, -0.2073516845703125, -0.20098114013671875, -0.194610595703125, -0.18824005126953125, -0.1818695068359375, -0.17549896240234375, -0.16912841796875, -0.16275787353515625, -0.1563873291015625, -0.15001678466796875, -0.143646240234375, -0.13727569580078125, -0.1309051513671875, -0.12453460693359375, -0.1181640625, -0.11179351806640625, -0.1054229736328125, -0.09905242919921875, -0.092681884765625, -0.08631134033203125, -0.0799407958984375, -0.07357025146484375, -0.06719970703125, -0.06082916259765625, -0.0544586181640625, -0.04808807373046875, -0.041717529296875, -0.03534698486328125, -0.0289764404296875, -0.02260589599609375, -0.0162353515625, -0.00986480712890625, -0.0034942626953125, 0.00287628173828125, 0.009246826171875, 0.01561737060546875, 0.0219879150390625, 0.02835845947265625, 0.03472900390625, 0.04109954833984375, 0.0474700927734375, 0.05384063720703125, 0.060211181640625, 0.06658172607421875, 0.0729522705078125, 0.07932281494140625, 0.085693359375, 0.09206390380859375, 0.0984344482421875, 0.10480499267578125, 0.111175537109375, 0.11754608154296875, 0.1239166259765625, 0.13028717041015625, 0.13665771484375, 0.14302825927734375, 0.1493988037109375, 0.15576934814453125, 0.162139892578125, 0.16851043701171875, 0.1748809814453125, 0.18125152587890625, 0.1876220703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 14.0, 26.0, 34.0, 25.0, 36.0, 58.0, 62.0, 73.0, 79.0, 84.0, 93.0, 54.0, 63.0, 51.0, 29.0, 42.0, 37.0, 29.0, 17.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.0648794174194336, -0.06225395202636719, -0.05962848663330078, -0.057003021240234375, -0.05437755584716797, -0.05175209045410156, -0.049126625061035156, -0.04650115966796875, -0.043875694274902344, -0.04125022888183594, -0.03862476348876953, -0.035999298095703125, -0.03337383270263672, -0.030748367309570312, -0.028122901916503906, -0.0254974365234375, -0.022871971130371094, -0.020246505737304688, -0.01762104034423828, -0.014995574951171875, -0.012370109558105469, -0.009744644165039062, -0.007119178771972656, -0.00449371337890625, -0.0018682479858398438, 0.0007572174072265625, 0.0033826828002929688, 0.006008148193359375, 0.008633613586425781, 0.011259078979492188, 0.013884544372558594, 0.016510009765625, 0.019135475158691406, 0.021760940551757812, 0.02438640594482422, 0.027011871337890625, 0.02963733673095703, 0.03226280212402344, 0.034888267517089844, 0.03751373291015625, 0.040139198303222656, 0.04276466369628906, 0.04539012908935547, 0.048015594482421875, 0.05064105987548828, 0.05326652526855469, 0.055891990661621094, 0.0585174560546875, 0.061142921447753906, 0.06376838684082031, 0.06639385223388672, 0.06901931762695312, 0.07164478302001953, 0.07427024841308594, 0.07689571380615234, 0.07952117919921875, 0.08214664459228516, 0.08477210998535156, 0.08739757537841797, 0.09002304077148438, 0.09264850616455078, 0.09527397155761719, 0.0978994369506836, 0.10052490234375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 11.0, 11.0, 19.0, 22.0, 29.0, 35.0, 22.0, 51.0, 42.0, 63.0, 50.0, 69.0, 59.0, 54.0, 65.0, 42.0, 47.0, 49.0, 36.0, 25.0, 34.0, 28.0, 21.0, 16.0, 18.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4869941473007202, -1.433651328086853, -1.3803086280822754, -1.3269658088684082, -1.273622989654541, -1.2202801704406738, -1.1669373512268066, -1.113594651222229, -1.0602518320083618, -1.0069090127944946, -0.9535662531852722, -0.9002234935760498, -0.8468806743621826, -0.7935378551483154, -0.740195095539093, -0.6868523359298706, -0.6335095167160034, -0.5801666975021362, -0.5268239378929138, -0.473481148481369, -0.4201383590698242, -0.3667955696582794, -0.3134527802467346, -0.2601099908351898, -0.20676720142364502, -0.15342441201210022, -0.10008162260055542, -0.04673883318901062, 0.00660395622253418, 0.05994674563407898, 0.11328953504562378, 0.16663232445716858, 0.21997511386871338, 0.2733179032802582, 0.326660692691803, 0.3800034821033478, 0.4333462715148926, 0.4866890609264374, 0.5400318503379822, 0.5933746099472046, 0.6467174291610718, 0.700060248374939, 0.7534030079841614, 0.8067457675933838, 0.860088586807251, 0.9134314060211182, 0.9667741656303406, 1.020116925239563, 1.0734597444534302, 1.1268025636672974, 1.180145263671875, 1.2334880828857422, 1.2868309020996094, 1.3401737213134766, 1.3935165405273438, 1.4468592405319214, 1.5002020597457886, 1.5535448789596558, 1.6068875789642334, 1.6602303981781006, 1.7135732173919678, 1.766916036605835, 1.8202588558197021, 1.8736015558242798, 1.926944375038147]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 4.0, 12.0, 13.0, 5.0, 8.0, 7.0, 17.0, 17.0, 19.0, 17.0, 24.0, 28.0, 29.0, 26.0, 30.0, 36.0, 35.0, 33.0, 40.0, 43.0, 30.0, 45.0, 29.0, 37.0, 36.0, 32.0, 22.0, 34.0, 33.0, 36.0, 23.0, 21.0, 26.0, 21.0, 17.0, 16.0, 12.0, 23.0, 10.0, 16.0, 7.0, 5.0, 7.0, 2.0, 5.0, 2.0, 8.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.1195793151855469, -1.0842653512954712, -1.048951506614685, -1.0136375427246094, -0.9783235788345337, -0.9430096745491028, -0.9076957702636719, -0.8723818063735962, -0.8370679020881653, -0.8017539978027344, -0.7664400339126587, -0.7311261296272278, -0.6958122253417969, -0.6604982614517212, -0.6251843571662903, -0.5898704528808594, -0.5545564889907837, -0.5192425847053528, -0.4839286208152771, -0.4486147165298462, -0.4133007824420929, -0.3779868483543396, -0.3426729440689087, -0.3073590099811554, -0.2720450758934021, -0.2367311418056488, -0.2014172226190567, -0.1661033034324646, -0.1307893693447113, -0.09547543525695801, -0.060161516070365906, -0.024847596883773804, 0.010466217994689941, 0.04578014463186264, 0.08109407126903534, 0.11640799790620804, 0.15172192454338074, 0.18703585863113403, 0.22234977781772614, 0.25766369700431824, 0.29297763109207153, 0.32829156517982483, 0.3636054992675781, 0.39891940355300903, 0.43423333764076233, 0.4695472717285156, 0.5048611760139465, 0.5401750802993774, 0.5754890441894531, 0.610802948474884, 0.6461169123649597, 0.6814308166503906, 0.7167447805404663, 0.7520586848258972, 0.7873725891113281, 0.8226865530014038, 0.8580004572868347, 0.8933143615722656, 0.9286283254623413, 0.9639422297477722, 0.9992561340332031, 1.0345700979232788, 1.0698840618133545, 1.1051979064941406, 1.1405118703842163]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 9.0, 9.0, 21.0, 23.0, 26.0, 35.0, 58.0, 78.0, 145.0, 182.0, 279.0, 420.0, 617.0, 833.0, 1273.0, 1946.0, 2980.0, 4437.0, 6468.0, 9511.0, 14122.0, 20150.0, 28597.0, 39687.0, 52228.0, 67427.0, 81790.0, 93884.0, 100042.0, 99973.0, 92837.0, 81267.0, 66285.0, 51557.0, 38564.0, 28347.0, 19676.0, 13907.0, 9248.0, 6521.0, 4258.0, 2877.0, 1954.0, 1284.0, 899.0, 561.0, 425.0, 268.0, 168.0, 130.0, 77.0, 68.0, 40.0, 37.0, 20.0, 12.0, 11.0, 10.0, 2.0, 0.0, 2.0], "bins": [-0.9580078125, -0.9280471801757812, -0.8980865478515625, -0.8681259155273438, -0.838165283203125, -0.8082046508789062, -0.7782440185546875, -0.7482833862304688, -0.71832275390625, -0.6883621215820312, -0.6584014892578125, -0.6284408569335938, -0.598480224609375, -0.5685195922851562, -0.5385589599609375, -0.5085983276367188, -0.4786376953125, -0.44867706298828125, -0.4187164306640625, -0.38875579833984375, -0.358795166015625, -0.32883453369140625, -0.2988739013671875, -0.26891326904296875, -0.23895263671875, -0.20899200439453125, -0.1790313720703125, -0.14907073974609375, -0.119110107421875, -0.08914947509765625, -0.0591888427734375, -0.02922821044921875, 0.000732421875, 0.03069305419921875, 0.0606536865234375, 0.09061431884765625, 0.120574951171875, 0.15053558349609375, 0.1804962158203125, 0.21045684814453125, 0.24041748046875, 0.27037811279296875, 0.3003387451171875, 0.33029937744140625, 0.360260009765625, 0.39022064208984375, 0.4201812744140625, 0.45014190673828125, 0.4801025390625, 0.5100631713867188, 0.5400238037109375, 0.5699844360351562, 0.599945068359375, 0.6299057006835938, 0.6598663330078125, 0.6898269653320312, 0.71978759765625, 0.7497482299804688, 0.7797088623046875, 0.8096694946289062, 0.839630126953125, 0.8695907592773438, 0.8995513916015625, 0.9295120239257812, 0.95947265625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 9.0, 15.0, 9.0, 14.0, 18.0, 16.0, 18.0, 32.0, 18.0, 27.0, 27.0, 35.0, 32.0, 39.0, 38.0, 42.0, 42.0, 35.0, 45.0, 34.0, 30.0, 40.0, 39.0, 31.0, 31.0, 29.0, 32.0, 36.0, 20.0, 22.0, 28.0, 14.0, 24.0, 15.0, 13.0, 6.0, 7.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.2323455810546875, -1.193206787109375, -1.1540679931640625, -1.11492919921875, -1.0757904052734375, -1.036651611328125, -0.9975128173828125, -0.9583740234375, -0.9192352294921875, -0.880096435546875, -0.8409576416015625, -0.80181884765625, -0.7626800537109375, -0.723541259765625, -0.6844024658203125, -0.645263671875, -0.6061248779296875, -0.566986083984375, -0.5278472900390625, -0.48870849609375, -0.4495697021484375, -0.410430908203125, -0.3712921142578125, -0.3321533203125, -0.2930145263671875, -0.253875732421875, -0.2147369384765625, -0.17559814453125, -0.1364593505859375, -0.097320556640625, -0.0581817626953125, -0.01904296875, 0.0200958251953125, 0.059234619140625, 0.0983734130859375, 0.13751220703125, 0.1766510009765625, 0.215789794921875, 0.2549285888671875, 0.2940673828125, 0.3332061767578125, 0.372344970703125, 0.4114837646484375, 0.45062255859375, 0.4897613525390625, 0.528900146484375, 0.5680389404296875, 0.607177734375, 0.6463165283203125, 0.685455322265625, 0.7245941162109375, 0.76373291015625, 0.8028717041015625, 0.842010498046875, 0.8811492919921875, 0.9202880859375, 0.9594268798828125, 0.998565673828125, 1.0377044677734375, 1.07684326171875, 1.1159820556640625, 1.155120849609375, 1.1942596435546875, 1.2333984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 29.0, 68.0, 67.0, 119.0, 184.0, 317.0, 494.0, 762.0, 1152.0, 2022.0, 3092.0, 4905.0, 8088.0, 12717.0, 20001.0, 30216.0, 44584.0, 62767.0, 83348.0, 102451.0, 116277.0, 118908.0, 110914.0, 93998.0, 73122.0, 53166.0, 37010.0, 24681.0, 15944.0, 10088.0, 6514.0, 3982.0, 2479.0, 1537.0, 959.0, 526.0, 366.0, 207.0, 155.0, 102.0, 67.0, 40.0, 28.0, 19.0, 9.0, 14.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.1669921875, -1.13189697265625, -1.0968017578125, -1.06170654296875, -1.026611328125, -0.99151611328125, -0.9564208984375, -0.92132568359375, -0.88623046875, -0.85113525390625, -0.8160400390625, -0.78094482421875, -0.745849609375, -0.71075439453125, -0.6756591796875, -0.64056396484375, -0.60546875, -0.57037353515625, -0.5352783203125, -0.50018310546875, -0.465087890625, -0.42999267578125, -0.3948974609375, -0.35980224609375, -0.32470703125, -0.28961181640625, -0.2545166015625, -0.21942138671875, -0.184326171875, -0.14923095703125, -0.1141357421875, -0.07904052734375, -0.0439453125, -0.00885009765625, 0.0262451171875, 0.06134033203125, 0.096435546875, 0.13153076171875, 0.1666259765625, 0.20172119140625, 0.23681640625, 0.27191162109375, 0.3070068359375, 0.34210205078125, 0.377197265625, 0.41229248046875, 0.4473876953125, 0.48248291015625, 0.517578125, 0.55267333984375, 0.5877685546875, 0.62286376953125, 0.657958984375, 0.69305419921875, 0.7281494140625, 0.76324462890625, 0.79833984375, 0.83343505859375, 0.8685302734375, 0.90362548828125, 0.938720703125, 0.97381591796875, 1.0089111328125, 1.04400634765625, 1.0791015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 8.0, 17.0, 23.0, 19.0, 23.0, 29.0, 28.0, 30.0, 29.0, 28.0, 31.0, 34.0, 40.0, 48.0, 45.0, 29.0, 33.0, 38.0, 35.0, 42.0, 32.0, 40.0, 26.0, 29.0, 29.0, 31.0, 19.0, 22.0, 13.0, 16.0, 16.0, 13.0, 17.0, 3.0, 14.0, 11.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.701171875, -0.6784591674804688, -0.6557464599609375, -0.6330337524414062, -0.610321044921875, -0.5876083374023438, -0.5648956298828125, -0.5421829223632812, -0.51947021484375, -0.49675750732421875, -0.4740447998046875, -0.45133209228515625, -0.428619384765625, -0.40590667724609375, -0.3831939697265625, -0.36048126220703125, -0.3377685546875, -0.31505584716796875, -0.2923431396484375, -0.26963043212890625, -0.246917724609375, -0.22420501708984375, -0.2014923095703125, -0.17877960205078125, -0.15606689453125, -0.13335418701171875, -0.1106414794921875, -0.08792877197265625, -0.065216064453125, -0.04250335693359375, -0.0197906494140625, 0.00292205810546875, 0.025634765625, 0.04834747314453125, 0.0710601806640625, 0.09377288818359375, 0.116485595703125, 0.13919830322265625, 0.1619110107421875, 0.18462371826171875, 0.20733642578125, 0.23004913330078125, 0.2527618408203125, 0.27547454833984375, 0.298187255859375, 0.32089996337890625, 0.3436126708984375, 0.36632537841796875, 0.3890380859375, 0.41175079345703125, 0.4344635009765625, 0.45717620849609375, 0.479888916015625, 0.5026016235351562, 0.5253143310546875, 0.5480270385742188, 0.57073974609375, 0.5934524536132812, 0.6161651611328125, 0.6388778686523438, 0.661590576171875, 0.6843032836914062, 0.7070159912109375, 0.7297286987304688, 0.75244140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 9.0, 7.0, 13.0, 16.0, 29.0, 39.0, 43.0, 82.0, 137.0, 235.0, 319.0, 584.0, 978.0, 1580.0, 2731.0, 4820.0, 8641.0, 16403.0, 31157.0, 58939.0, 107061.0, 169935.0, 206219.0, 179453.0, 117424.0, 66069.0, 34905.0, 18197.0, 9790.0, 5309.0, 2977.0, 1718.0, 1037.0, 649.0, 366.0, 227.0, 145.0, 88.0, 66.0, 43.0, 32.0, 20.0, 18.0, 11.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.98583984375, -0.95733642578125, -0.9288330078125, -0.90032958984375, -0.871826171875, -0.84332275390625, -0.8148193359375, -0.78631591796875, -0.7578125, -0.72930908203125, -0.7008056640625, -0.67230224609375, -0.643798828125, -0.61529541015625, -0.5867919921875, -0.55828857421875, -0.52978515625, -0.50128173828125, -0.4727783203125, -0.44427490234375, -0.415771484375, -0.38726806640625, -0.3587646484375, -0.33026123046875, -0.3017578125, -0.27325439453125, -0.2447509765625, -0.21624755859375, -0.187744140625, -0.15924072265625, -0.1307373046875, -0.10223388671875, -0.07373046875, -0.04522705078125, -0.0167236328125, 0.01177978515625, 0.040283203125, 0.06878662109375, 0.0972900390625, 0.12579345703125, 0.154296875, 0.18280029296875, 0.2113037109375, 0.23980712890625, 0.268310546875, 0.29681396484375, 0.3253173828125, 0.35382080078125, 0.38232421875, 0.41082763671875, 0.4393310546875, 0.46783447265625, 0.496337890625, 0.52484130859375, 0.5533447265625, 0.58184814453125, 0.6103515625, 0.63885498046875, 0.6673583984375, 0.69586181640625, 0.724365234375, 0.75286865234375, 0.7813720703125, 0.80987548828125, 0.83837890625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 20.0, 14.0, 20.0, 22.0, 32.0, 29.0, 37.0, 50.0, 51.0, 50.0, 70.0, 48.0, 48.0, 61.0, 46.0, 69.0, 51.0, 41.0, 33.0, 38.0, 27.0, 18.0, 13.0, 19.0, 12.0, 14.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.426738739013672e-05, -7.211044430732727e-05, -6.995350122451782e-05, -6.779655814170837e-05, -6.563961505889893e-05, -6.348267197608948e-05, -6.132572889328003e-05, -5.916878581047058e-05, -5.701184272766113e-05, -5.4854899644851685e-05, -5.2697956562042236e-05, -5.054101347923279e-05, -4.838407039642334e-05, -4.622712731361389e-05, -4.407018423080444e-05, -4.1913241147994995e-05, -3.975629806518555e-05, -3.75993549823761e-05, -3.544241189956665e-05, -3.32854688167572e-05, -3.1128525733947754e-05, -2.8971582651138306e-05, -2.6814639568328857e-05, -2.465769648551941e-05, -2.250075340270996e-05, -2.0343810319900513e-05, -1.8186867237091064e-05, -1.6029924154281616e-05, -1.3872981071472168e-05, -1.171603798866272e-05, -9.559094905853271e-06, -7.402151823043823e-06, -5.245208740234375e-06, -3.0882656574249268e-06, -9.313225746154785e-07, 1.2256205081939697e-06, 3.382563591003418e-06, 5.539506673812866e-06, 7.696449756622314e-06, 9.853392839431763e-06, 1.2010335922241211e-05, 1.416727900505066e-05, 1.6324222087860107e-05, 1.8481165170669556e-05, 2.0638108253479004e-05, 2.2795051336288452e-05, 2.49519944190979e-05, 2.710893750190735e-05, 2.9265880584716797e-05, 3.1422823667526245e-05, 3.357976675033569e-05, 3.573670983314514e-05, 3.789365291595459e-05, 4.005059599876404e-05, 4.2207539081573486e-05, 4.4364482164382935e-05, 4.652142524719238e-05, 4.867836833000183e-05, 5.083531141281128e-05, 5.299225449562073e-05, 5.5149197578430176e-05, 5.7306140661239624e-05, 5.946308374404907e-05, 6.162002682685852e-05, 6.377696990966797e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 12.0, 15.0, 23.0, 36.0, 44.0, 74.0, 99.0, 142.0, 203.0, 282.0, 478.0, 713.0, 1120.0, 1600.0, 2595.0, 3883.0, 6021.0, 9513.0, 15378.0, 24343.0, 37686.0, 56452.0, 82289.0, 110634.0, 132661.0, 137119.0, 123755.0, 98314.0, 70054.0, 47818.0, 30862.0, 19866.0, 12479.0, 7609.0, 5040.0, 3219.0, 2080.0, 1329.0, 904.0, 634.0, 387.0, 257.0, 175.0, 117.0, 75.0, 63.0, 32.0, 24.0, 13.0, 12.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5724029541015625, -0.553497314453125, -0.5345916748046875, -0.51568603515625, -0.4967803955078125, -0.477874755859375, -0.4589691162109375, -0.4400634765625, -0.4211578369140625, -0.402252197265625, -0.3833465576171875, -0.36444091796875, -0.3455352783203125, -0.326629638671875, -0.3077239990234375, -0.288818359375, -0.2699127197265625, -0.251007080078125, -0.2321014404296875, -0.21319580078125, -0.1942901611328125, -0.175384521484375, -0.1564788818359375, -0.1375732421875, -0.1186676025390625, -0.099761962890625, -0.0808563232421875, -0.06195068359375, -0.0430450439453125, -0.024139404296875, -0.0052337646484375, 0.013671875, 0.0325775146484375, 0.051483154296875, 0.0703887939453125, 0.08929443359375, 0.1082000732421875, 0.127105712890625, 0.1460113525390625, 0.1649169921875, 0.1838226318359375, 0.202728271484375, 0.2216339111328125, 0.24053955078125, 0.2594451904296875, 0.278350830078125, 0.2972564697265625, 0.316162109375, 0.3350677490234375, 0.353973388671875, 0.3728790283203125, 0.39178466796875, 0.4106903076171875, 0.429595947265625, 0.4485015869140625, 0.4674072265625, 0.4863128662109375, 0.505218505859375, 0.5241241455078125, 0.54302978515625, 0.5619354248046875, 0.580841064453125, 0.5997467041015625, 0.61865234375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 3.0, 10.0, 7.0, 6.0, 5.0, 12.0, 18.0, 18.0, 29.0, 26.0, 26.0, 40.0, 30.0, 51.0, 35.0, 58.0, 45.0, 55.0, 52.0, 60.0, 53.0, 48.0, 51.0, 38.0, 40.0, 39.0, 19.0, 19.0, 23.0, 13.0, 16.0, 10.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22766685485839844, -0.21961593627929688, -0.2115650177001953, -0.20351409912109375, -0.1954631805419922, -0.18741226196289062, -0.17936134338378906, -0.1713104248046875, -0.16325950622558594, -0.15520858764648438, -0.1471576690673828, -0.13910675048828125, -0.1310558319091797, -0.12300491333007812, -0.11495399475097656, -0.106903076171875, -0.09885215759277344, -0.09080123901367188, -0.08275032043457031, -0.07469940185546875, -0.06664848327636719, -0.058597564697265625, -0.05054664611816406, -0.0424957275390625, -0.03444480895996094, -0.026393890380859375, -0.018342971801757812, -0.01029205322265625, -0.0022411346435546875, 0.005809783935546875, 0.013860702514648438, 0.02191162109375, 0.029962539672851562, 0.038013458251953125, 0.04606437683105469, 0.05411529541015625, 0.06216621398925781, 0.07021713256835938, 0.07826805114746094, 0.0863189697265625, 0.09436988830566406, 0.10242080688476562, 0.11047172546386719, 0.11852264404296875, 0.1265735626220703, 0.13462448120117188, 0.14267539978027344, 0.150726318359375, 0.15877723693847656, 0.16682815551757812, 0.1748790740966797, 0.18292999267578125, 0.1909809112548828, 0.19903182983398438, 0.20708274841308594, 0.2151336669921875, 0.22318458557128906, 0.23123550415039062, 0.2392864227294922, 0.24733734130859375, 0.2553882598876953, 0.2634391784667969, 0.27149009704589844, 0.279541015625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 9.0, 5.0, 6.0, 7.0, 16.0, 15.0, 21.0, 23.0, 38.0, 29.0, 47.0, 48.0, 44.0, 52.0, 50.0, 56.0, 71.0, 50.0, 58.0, 47.0, 43.0, 42.0, 35.0, 32.0, 27.0, 22.0, 22.0, 16.0, 13.0, 5.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4840911626815796, -1.4314384460449219, -1.3787857294082642, -1.3261330127716064, -1.2734804153442383, -1.2208276987075806, -1.1681749820709229, -1.1155222654342651, -1.0628695487976074, -1.0102168321609497, -0.9575641751289368, -0.904911458492279, -0.8522588014602661, -0.7996060848236084, -0.7469533681869507, -0.694300651550293, -0.6416480541229248, -0.5889953374862671, -0.5363426804542542, -0.48368996381759644, -0.4310372769832611, -0.3783845901489258, -0.32573187351226807, -0.27307918667793274, -0.2204264998435974, -0.16777381300926208, -0.11512111127376556, -0.06246840953826904, -0.009815722703933716, 0.04283696413040161, 0.09548968076705933, 0.14814236760139465, 0.20079493522644043, 0.25344762206077576, 0.3061003088951111, 0.3587530255317688, 0.4114057123661041, 0.46405839920043945, 0.5167111158370972, 0.5693638324737549, 0.6220164895057678, 0.6746692061424255, 0.7273218631744385, 0.7799745798110962, 0.8326272964477539, 0.8852799534797668, 0.9379326701164246, 0.9905853271484375, 1.0432380437850952, 1.095890760421753, 1.1485434770584106, 1.2011961936950684, 1.2538487911224365, 1.3065015077590942, 1.359154224395752, 1.4118069410324097, 1.4644596576690674, 1.517112374305725, 1.5697650909423828, 1.622417688369751, 1.6750704050064087, 1.7277231216430664, 1.7803758382797241, 1.8330285549163818, 1.88568115234375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 8.0, 13.0, 18.0, 16.0, 12.0, 27.0, 26.0, 29.0, 25.0, 37.0, 28.0, 26.0, 41.0, 37.0, 37.0, 37.0, 42.0, 36.0, 30.0, 32.0, 38.0, 39.0, 31.0, 26.0, 25.0, 30.0, 23.0, 27.0, 26.0, 17.0, 14.0, 14.0, 13.0, 13.0, 11.0, 12.0, 15.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-1.2504222393035889, -1.2146520614624023, -1.1788820028305054, -1.1431118249893188, -1.1073417663574219, -1.0715715885162354, -1.0358015298843384, -1.0000313520431519, -0.9642612934112549, -0.9284911751747131, -0.8927210569381714, -0.8569509387016296, -0.8211808204650879, -0.7854107022285461, -0.7496405839920044, -0.7138704061508179, -0.6781002879142761, -0.6423301696777344, -0.6065600514411926, -0.5707899332046509, -0.5350198149681091, -0.4992496967315674, -0.46347954869270325, -0.4277094304561615, -0.39193931221961975, -0.356169193983078, -0.32039907574653625, -0.2846289277076721, -0.24885882437229156, -0.21308870613574982, -0.17731857299804688, -0.14154845476150513, -0.10577833652496338, -0.07000821828842163, -0.034238092601299286, 0.001532033085823059, 0.03730215132236481, 0.07307226955890656, 0.1088424026966095, 0.14461252093315125, 0.180382639169693, 0.21615275740623474, 0.2519228756427765, 0.2876930236816406, 0.3234631419181824, 0.3592332601547241, 0.39500337839126587, 0.4307734966278076, 0.46654361486434937, 0.5023137331008911, 0.5380838513374329, 0.5738539695739746, 0.6096240878105164, 0.6453942060470581, 0.6811643838882446, 0.7169344425201416, 0.7527046203613281, 0.7884747385978699, 0.8242448568344116, 0.8600149750709534, 0.8957850933074951, 0.9315552115440369, 0.9673253297805786, 1.0030955076217651, 1.038865566253662]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 27.0, 51.0, 55.0, 87.0, 141.0, 202.0, 342.0, 526.0, 773.0, 1209.0, 1954.0, 3154.0, 5054.0, 8268.0, 13544.0, 22511.0, 37272.0, 62087.0, 102599.0, 165864.0, 261436.0, 385996.0, 514907.0, 595147.0, 580517.0, 478583.0, 348549.0, 230901.0, 146224.0, 89542.0, 53929.0, 32804.0, 19336.0, 11745.0, 7175.0, 4370.0, 2751.0, 1632.0, 1050.0, 640.0, 454.0, 287.0, 210.0, 126.0, 83.0, 46.0, 35.0, 22.0, 13.0, 6.0, 9.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0], "bins": [-1.1181640625, -1.0819244384765625, -1.045684814453125, -1.0094451904296875, -0.97320556640625, -0.9369659423828125, -0.900726318359375, -0.8644866943359375, -0.8282470703125, -0.7920074462890625, -0.755767822265625, -0.7195281982421875, -0.68328857421875, -0.6470489501953125, -0.610809326171875, -0.5745697021484375, -0.538330078125, -0.5020904541015625, -0.465850830078125, -0.4296112060546875, -0.39337158203125, -0.3571319580078125, -0.320892333984375, -0.2846527099609375, -0.2484130859375, -0.2121734619140625, -0.175933837890625, -0.1396942138671875, -0.10345458984375, -0.0672149658203125, -0.030975341796875, 0.0052642822265625, 0.04150390625, 0.0777435302734375, 0.113983154296875, 0.1502227783203125, 0.18646240234375, 0.2227020263671875, 0.258941650390625, 0.2951812744140625, 0.3314208984375, 0.3676605224609375, 0.403900146484375, 0.4401397705078125, 0.47637939453125, 0.5126190185546875, 0.548858642578125, 0.5850982666015625, 0.621337890625, 0.6575775146484375, 0.693817138671875, 0.7300567626953125, 0.76629638671875, 0.8025360107421875, 0.838775634765625, 0.8750152587890625, 0.9112548828125, 0.9474945068359375, 0.983734130859375, 1.0199737548828125, 1.05621337890625, 1.0924530029296875, 1.128692626953125, 1.1649322509765625, 1.201171875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 3.0, 13.0, 10.0, 10.0, 11.0, 10.0, 17.0, 22.0, 17.0, 31.0, 25.0, 39.0, 40.0, 33.0, 28.0, 37.0, 26.0, 43.0, 40.0, 39.0, 29.0, 39.0, 39.0, 39.0, 26.0, 35.0, 31.0, 33.0, 25.0, 28.0, 16.0, 23.0, 23.0, 18.0, 11.0, 11.0, 12.0, 16.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.842926025390625, -0.81622314453125, -0.789520263671875, -0.7628173828125, -0.736114501953125, -0.70941162109375, -0.682708740234375, -0.656005859375, -0.629302978515625, -0.60260009765625, -0.575897216796875, -0.5491943359375, -0.522491455078125, -0.49578857421875, -0.469085693359375, -0.4423828125, -0.415679931640625, -0.38897705078125, -0.362274169921875, -0.3355712890625, -0.308868408203125, -0.28216552734375, -0.255462646484375, -0.228759765625, -0.202056884765625, -0.17535400390625, -0.148651123046875, -0.1219482421875, -0.095245361328125, -0.06854248046875, -0.041839599609375, -0.01513671875, 0.011566162109375, 0.03826904296875, 0.064971923828125, 0.0916748046875, 0.118377685546875, 0.14508056640625, 0.171783447265625, 0.198486328125, 0.225189208984375, 0.25189208984375, 0.278594970703125, 0.3052978515625, 0.332000732421875, 0.35870361328125, 0.385406494140625, 0.412109375, 0.438812255859375, 0.46551513671875, 0.492218017578125, 0.5189208984375, 0.545623779296875, 0.57232666015625, 0.599029541015625, 0.625732421875, 0.652435302734375, 0.67913818359375, 0.705841064453125, 0.7325439453125, 0.759246826171875, 0.78594970703125, 0.812652587890625, 0.83935546875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 10.0, 18.0, 27.0, 53.0, 75.0, 140.0, 176.0, 299.0, 464.0, 772.0, 1244.0, 2035.0, 3147.0, 5348.0, 8621.0, 14054.0, 23110.0, 37565.0, 58740.0, 92549.0, 141389.0, 208076.0, 289879.0, 379392.0, 455817.0, 496042.0, 482191.0, 420586.0, 337083.0, 247941.0, 173525.0, 115371.0, 75168.0, 47425.0, 29394.0, 18006.0, 11169.0, 6637.0, 4120.0, 2539.0, 1571.0, 950.0, 580.0, 356.0, 231.0, 139.0, 93.0, 60.0, 42.0, 26.0, 20.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.001953125, -0.9693756103515625, -0.936798095703125, -0.9042205810546875, -0.87164306640625, -0.8390655517578125, -0.806488037109375, -0.7739105224609375, -0.7413330078125, -0.7087554931640625, -0.676177978515625, -0.6436004638671875, -0.61102294921875, -0.5784454345703125, -0.545867919921875, -0.5132904052734375, -0.480712890625, -0.4481353759765625, -0.415557861328125, -0.3829803466796875, -0.35040283203125, -0.3178253173828125, -0.285247802734375, -0.2526702880859375, -0.2200927734375, -0.1875152587890625, -0.154937744140625, -0.1223602294921875, -0.08978271484375, -0.0572052001953125, -0.024627685546875, 0.0079498291015625, 0.04052734375, 0.0731048583984375, 0.105682373046875, 0.1382598876953125, 0.17083740234375, 0.2034149169921875, 0.235992431640625, 0.2685699462890625, 0.3011474609375, 0.3337249755859375, 0.366302490234375, 0.3988800048828125, 0.43145751953125, 0.4640350341796875, 0.496612548828125, 0.5291900634765625, 0.561767578125, 0.5943450927734375, 0.626922607421875, 0.6595001220703125, 0.69207763671875, 0.7246551513671875, 0.757232666015625, 0.7898101806640625, 0.8223876953125, 0.8549652099609375, 0.887542724609375, 0.9201202392578125, 0.95269775390625, 0.9852752685546875, 1.017852783203125, 1.0504302978515625, 1.0830078125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 8.0, 10.0, 21.0, 28.0, 31.0, 37.0, 62.0, 68.0, 64.0, 92.0, 124.0, 139.0, 153.0, 184.0, 233.0, 217.0, 261.0, 220.0, 245.0, 226.0, 217.0, 203.0, 190.0, 163.0, 163.0, 134.0, 131.0, 121.0, 73.0, 54.0, 43.0, 46.0, 23.0, 18.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5153656005859375, -0.499481201171875, -0.4835968017578125, -0.46771240234375, -0.4518280029296875, -0.435943603515625, -0.4200592041015625, -0.4041748046875, -0.3882904052734375, -0.372406005859375, -0.3565216064453125, -0.34063720703125, -0.3247528076171875, -0.308868408203125, -0.2929840087890625, -0.277099609375, -0.2612152099609375, -0.245330810546875, -0.2294464111328125, -0.21356201171875, -0.1976776123046875, -0.181793212890625, -0.1659088134765625, -0.1500244140625, -0.1341400146484375, -0.118255615234375, -0.1023712158203125, -0.08648681640625, -0.0706024169921875, -0.054718017578125, -0.0388336181640625, -0.02294921875, -0.0070648193359375, 0.008819580078125, 0.0247039794921875, 0.04058837890625, 0.0564727783203125, 0.072357177734375, 0.0882415771484375, 0.1041259765625, 0.1200103759765625, 0.135894775390625, 0.1517791748046875, 0.16766357421875, 0.1835479736328125, 0.199432373046875, 0.2153167724609375, 0.231201171875, 0.2470855712890625, 0.262969970703125, 0.2788543701171875, 0.29473876953125, 0.3106231689453125, 0.326507568359375, 0.3423919677734375, 0.3582763671875, 0.3741607666015625, 0.390045166015625, 0.4059295654296875, 0.42181396484375, 0.4376983642578125, 0.453582763671875, 0.4694671630859375, 0.4853515625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 18.0, 17.0, 25.0, 29.0, 38.0, 34.0, 45.0, 47.0, 45.0, 56.0, 63.0, 65.0, 61.0, 46.0, 63.0, 40.0, 35.0, 31.0, 29.0, 30.0, 31.0, 18.0, 23.0, 22.0, 7.0, 7.0, 10.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7404402494430542, -1.6902867555618286, -1.6401333808898926, -1.589979887008667, -1.5398263931274414, -1.4896728992462158, -1.4395195245742798, -1.3893660306930542, -1.3392125368118286, -1.289059042930603, -1.238905668258667, -1.1887521743774414, -1.1385986804962158, -1.0884451866149902, -1.0382918119430542, -0.9881383180618286, -0.9379848837852478, -0.887831449508667, -0.8376779556274414, -0.7875245213508606, -0.737371027469635, -0.6872175931930542, -0.6370640993118286, -0.5869106650352478, -0.536757230758667, -0.4866037666797638, -0.4364503026008606, -0.3862968683242798, -0.3361433744430542, -0.2859899401664734, -0.2358364760875702, -0.185683012008667, -0.1355295181274414, -0.08537605404853821, -0.03522259742021561, 0.014930859208106995, 0.06508432328701019, 0.1152377724647522, 0.1653912365436554, 0.2155447006225586, 0.2656981647014618, 0.315851628780365, 0.3660050928592682, 0.4161585569381714, 0.4663119912147522, 0.516465425491333, 0.5666189193725586, 0.6167724132537842, 0.666925847530365, 0.7170792818069458, 0.7672327756881714, 0.8173862099647522, 0.8675397038459778, 0.9176931381225586, 0.9678466320037842, 1.0180001258850098, 1.0681535005569458, 1.1183069944381714, 1.1684603691101074, 1.218613862991333, 1.2687673568725586, 1.3189208507537842, 1.3690742254257202, 1.4192277193069458, 1.4693812131881714]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 33.0, 31.0, 49.0, 32.0, 43.0, 33.0, 42.0, 45.0, 38.0, 41.0, 46.0, 48.0, 35.0, 43.0, 32.0, 41.0, 34.0, 29.0, 22.0, 29.0, 18.0, 22.0, 18.0, 18.0, 10.0, 13.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1312960386276245, -1.0931018590927124, -1.0549076795578003, -1.0167135000228882, -0.9785193204879761, -0.940325140953064, -0.9021309614181519, -0.8639367818832397, -0.8257426023483276, -0.7875484228134155, -0.7493542432785034, -0.7111600637435913, -0.6729658842086792, -0.6347717046737671, -0.596577525138855, -0.5583833456039429, -0.520189106464386, -0.4819949269294739, -0.44380074739456177, -0.40560656785964966, -0.36741238832473755, -0.32921820878982544, -0.29102399945259094, -0.25282981991767883, -0.21463564038276672, -0.17644146084785461, -0.1382472813129425, -0.1000530868768692, -0.06185890734195709, -0.023664727807044983, 0.01452946662902832, 0.05272364616394043, 0.09091782569885254, 0.12911200523376465, 0.16730618476867676, 0.20550037920475006, 0.24369455873966217, 0.2818887233734131, 0.3200829327106476, 0.3582771122455597, 0.3964712917804718, 0.4346654713153839, 0.472859650850296, 0.5110538601875305, 0.5492480397224426, 0.5874422192573547, 0.6256363987922668, 0.663830578327179, 0.7020247578620911, 0.7402189373970032, 0.7784131169319153, 0.8166072964668274, 0.8548014760017395, 0.8929956555366516, 0.9311898946762085, 0.9693840742111206, 1.0075782537460327, 1.0457724332809448, 1.083966612815857, 1.122160792350769, 1.1603549718856812, 1.1985491514205933, 1.2367433309555054, 1.2749375104904175, 1.3131316900253296]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 11.0, 22.0, 16.0, 46.0, 63.0, 92.0, 134.0, 198.0, 265.0, 442.0, 722.0, 1011.0, 1595.0, 2449.0, 3737.0, 5824.0, 8756.0, 13578.0, 20997.0, 32060.0, 48982.0, 73299.0, 105470.0, 140775.0, 155347.0, 133909.0, 99948.0, 68504.0, 45225.0, 29942.0, 19296.0, 12498.0, 8209.0, 5180.0, 3422.0, 2184.0, 1536.0, 928.0, 632.0, 396.0, 281.0, 194.0, 134.0, 76.0, 51.0, 37.0, 31.0, 26.0, 8.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.358642578125, -0.3485145568847656, -0.33838653564453125, -0.3282585144042969, -0.3181304931640625, -0.3080024719238281, -0.29787445068359375, -0.2877464294433594, -0.277618408203125, -0.2674903869628906, -0.25736236572265625, -0.24723434448242188, -0.2371063232421875, -0.22697830200195312, -0.21685028076171875, -0.20672225952148438, -0.19659423828125, -0.18646621704101562, -0.17633819580078125, -0.16621017456054688, -0.1560821533203125, -0.14595413208007812, -0.13582611083984375, -0.12569808959960938, -0.115570068359375, -0.10544204711914062, -0.09531402587890625, -0.08518600463867188, -0.0750579833984375, -0.06492996215820312, -0.05480194091796875, -0.044673919677734375, -0.0345458984375, -0.024417877197265625, -0.01428985595703125, -0.004161834716796875, 0.0059661865234375, 0.016094207763671875, 0.02622222900390625, 0.036350250244140625, 0.046478271484375, 0.056606292724609375, 0.06673431396484375, 0.07686233520507812, 0.0869903564453125, 0.09711837768554688, 0.10724639892578125, 0.11737442016601562, 0.12750244140625, 0.13763046264648438, 0.14775848388671875, 0.15788650512695312, 0.1680145263671875, 0.17814254760742188, 0.18827056884765625, 0.19839859008789062, 0.208526611328125, 0.21865463256835938, 0.22878265380859375, 0.23891067504882812, 0.2490386962890625, 0.2591667175292969, 0.26929473876953125, 0.2794227600097656, 0.28955078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 5.0, 8.0, 5.0, 8.0, 10.0, 13.0, 9.0, 18.0, 18.0, 27.0, 19.0, 31.0, 35.0, 35.0, 35.0, 29.0, 52.0, 31.0, 33.0, 46.0, 38.0, 42.0, 42.0, 45.0, 38.0, 40.0, 38.0, 26.0, 26.0, 32.0, 22.0, 31.0, 13.0, 18.0, 14.0, 10.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0423736572265625, -1.005645751953125, -0.9689178466796875, -0.93218994140625, -0.8954620361328125, -0.858734130859375, -0.8220062255859375, -0.7852783203125, -0.7485504150390625, -0.711822509765625, -0.6750946044921875, -0.63836669921875, -0.6016387939453125, -0.564910888671875, -0.5281829833984375, -0.491455078125, -0.4547271728515625, -0.417999267578125, -0.3812713623046875, -0.34454345703125, -0.3078155517578125, -0.271087646484375, -0.2343597412109375, -0.1976318359375, -0.1609039306640625, -0.124176025390625, -0.0874481201171875, -0.05072021484375, -0.0139923095703125, 0.022735595703125, 0.0594635009765625, 0.09619140625, 0.1329193115234375, 0.169647216796875, 0.2063751220703125, 0.24310302734375, 0.2798309326171875, 0.316558837890625, 0.3532867431640625, 0.3900146484375, 0.4267425537109375, 0.463470458984375, 0.5001983642578125, 0.53692626953125, 0.5736541748046875, 0.610382080078125, 0.6471099853515625, 0.683837890625, 0.7205657958984375, 0.757293701171875, 0.7940216064453125, 0.83074951171875, 0.8674774169921875, 0.904205322265625, 0.9409332275390625, 0.9776611328125, 1.0143890380859375, 1.051116943359375, 1.0878448486328125, 1.12457275390625, 1.1613006591796875, 1.198028564453125, 1.2347564697265625, 1.271484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 20.0, 13.0, 23.0, 29.0, 55.0, 75.0, 119.0, 169.0, 306.0, 486.0, 820.0, 1418.0, 2535.0, 4501.0, 8335.0, 16166.0, 31751.0, 62708.0, 120147.0, 204119.0, 236822.0, 167482.0, 92455.0, 47155.0, 23902.0, 12360.0, 6375.0, 3495.0, 1908.0, 1073.0, 645.0, 373.0, 215.0, 137.0, 120.0, 68.0, 51.0, 33.0, 17.0, 12.0, 14.0, 5.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.50390625, -0.48876953125, -0.4736328125, -0.45849609375, -0.443359375, -0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 7.0, 7.0, 13.0, 13.0, 25.0, 18.0, 19.0, 25.0, 24.0, 26.0, 45.0, 29.0, 31.0, 34.0, 42.0, 34.0, 33.0, 38.0, 32.0, 39.0, 35.0, 33.0, 28.0, 29.0, 28.0, 31.0, 28.0, 29.0, 23.0, 29.0, 19.0, 23.0, 21.0, 14.0, 14.0, 16.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6994247436523438, -0.6766815185546875, -0.6539382934570312, -0.631195068359375, -0.6084518432617188, -0.5857086181640625, -0.5629653930664062, -0.54022216796875, -0.5174789428710938, -0.4947357177734375, -0.47199249267578125, -0.449249267578125, -0.42650604248046875, -0.4037628173828125, -0.38101959228515625, -0.3582763671875, -0.33553314208984375, -0.3127899169921875, -0.29004669189453125, -0.267303466796875, -0.24456024169921875, -0.2218170166015625, -0.19907379150390625, -0.17633056640625, -0.15358734130859375, -0.1308441162109375, -0.10810089111328125, -0.085357666015625, -0.06261444091796875, -0.0398712158203125, -0.01712799072265625, 0.005615234375, 0.02835845947265625, 0.0511016845703125, 0.07384490966796875, 0.096588134765625, 0.11933135986328125, 0.1420745849609375, 0.16481781005859375, 0.18756103515625, 0.21030426025390625, 0.2330474853515625, 0.25579071044921875, 0.278533935546875, 0.30127716064453125, 0.3240203857421875, 0.34676361083984375, 0.3695068359375, 0.39225006103515625, 0.4149932861328125, 0.43773651123046875, 0.460479736328125, 0.48322296142578125, 0.5059661865234375, 0.5287094116210938, 0.55145263671875, 0.5741958618164062, 0.5969390869140625, 0.6196823120117188, 0.642425537109375, 0.6651687622070312, 0.6879119873046875, 0.7106552124023438, 0.7333984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 19.0, 26.0, 30.0, 53.0, 92.0, 94.0, 129.0, 178.0, 271.0, 372.0, 490.0, 724.0, 1016.0, 1391.0, 2200.0, 3264.0, 5237.0, 8778.0, 16545.0, 32888.0, 73867.0, 178310.0, 335355.0, 214488.0, 88057.0, 38656.0, 18903.0, 9985.0, 5853.0, 3593.0, 2335.0, 1601.0, 1055.0, 700.0, 542.0, 389.0, 279.0, 215.0, 158.0, 110.0, 77.0, 58.0, 36.0, 25.0, 26.0, 14.0, 15.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.19970703125, -0.1933879852294922, -0.18706893920898438, -0.18074989318847656, -0.17443084716796875, -0.16811180114746094, -0.16179275512695312, -0.1554737091064453, -0.1491546630859375, -0.1428356170654297, -0.13651657104492188, -0.13019752502441406, -0.12387847900390625, -0.11755943298339844, -0.11124038696289062, -0.10492134094238281, -0.098602294921875, -0.09228324890136719, -0.08596420288085938, -0.07964515686035156, -0.07332611083984375, -0.06700706481933594, -0.060688018798828125, -0.05436897277832031, -0.0480499267578125, -0.04173088073730469, -0.035411834716796875, -0.029092788696289062, -0.02277374267578125, -0.016454696655273438, -0.010135650634765625, -0.0038166046142578125, 0.00250244140625, 0.008821487426757812, 0.015140533447265625, 0.021459579467773438, 0.02777862548828125, 0.03409767150878906, 0.040416717529296875, 0.04673576354980469, 0.0530548095703125, 0.05937385559082031, 0.06569290161132812, 0.07201194763183594, 0.07833099365234375, 0.08465003967285156, 0.09096908569335938, 0.09728813171386719, 0.103607177734375, 0.10992622375488281, 0.11624526977539062, 0.12256431579589844, 0.12888336181640625, 0.13520240783691406, 0.14152145385742188, 0.1478404998779297, 0.1541595458984375, 0.1604785919189453, 0.16679763793945312, 0.17311668395996094, 0.17943572998046875, 0.18575477600097656, 0.19207382202148438, 0.1983928680419922, 0.2047119140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 10.0, 2.0, 7.0, 17.0, 15.0, 16.0, 17.0, 30.0, 33.0, 58.0, 68.0, 59.0, 72.0, 71.0, 74.0, 83.0, 72.0, 62.0, 52.0, 38.0, 43.0, 20.0, 23.0, 12.0, 16.0, 9.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.3930723071098328e-05, -1.3377517461776733e-05, -1.282431185245514e-05, -1.2271106243133545e-05, -1.171790063381195e-05, -1.1164695024490356e-05, -1.0611489415168762e-05, -1.0058283805847168e-05, -9.505078196525574e-06, -8.95187258720398e-06, -8.398666977882385e-06, -7.845461368560791e-06, -7.292255759239197e-06, -6.7390501499176025e-06, -6.185844540596008e-06, -5.632638931274414e-06, -5.07943332195282e-06, -4.526227712631226e-06, -3.973022103309631e-06, -3.419816493988037e-06, -2.866610884666443e-06, -2.3134052753448486e-06, -1.7601996660232544e-06, -1.2069940567016602e-06, -6.537884473800659e-07, -1.0058283805847168e-07, 4.5262277126312256e-07, 1.0058283805847168e-06, 1.559033989906311e-06, 2.1122395992279053e-06, 2.6654452085494995e-06, 3.2186508178710938e-06, 3.771856427192688e-06, 4.325062036514282e-06, 4.8782676458358765e-06, 5.431473255157471e-06, 5.984678864479065e-06, 6.537884473800659e-06, 7.091090083122253e-06, 7.644295692443848e-06, 8.197501301765442e-06, 8.750706911087036e-06, 9.30391252040863e-06, 9.857118129730225e-06, 1.0410323739051819e-05, 1.0963529348373413e-05, 1.1516734957695007e-05, 1.2069940567016602e-05, 1.2623146176338196e-05, 1.317635178565979e-05, 1.3729557394981384e-05, 1.4282763004302979e-05, 1.4835968613624573e-05, 1.5389174222946167e-05, 1.594237983226776e-05, 1.6495585441589355e-05, 1.704879105091095e-05, 1.7601996660232544e-05, 1.8155202269554138e-05, 1.8708407878875732e-05, 1.9261613488197327e-05, 1.981481909751892e-05, 2.0368024706840515e-05, 2.092123031616211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 4.0, 15.0, 24.0, 26.0, 34.0, 50.0, 94.0, 146.0, 233.0, 368.0, 577.0, 898.0, 1420.0, 2468.0, 3811.0, 6526.0, 11684.0, 21027.0, 39899.0, 75922.0, 139346.0, 220519.0, 220420.0, 138690.0, 75217.0, 39763.0, 20831.0, 11654.0, 6795.0, 3905.0, 2368.0, 1410.0, 832.0, 564.0, 334.0, 217.0, 133.0, 123.0, 55.0, 35.0, 43.0, 23.0, 15.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1708984375, -0.16500473022460938, -0.15911102294921875, -0.15321731567382812, -0.1473236083984375, -0.14142990112304688, -0.13553619384765625, -0.12964248657226562, -0.123748779296875, -0.11785507202148438, -0.11196136474609375, -0.10606765747070312, -0.1001739501953125, -0.09428024291992188, -0.08838653564453125, -0.08249282836914062, -0.07659912109375, -0.07070541381835938, -0.06481170654296875, -0.058917999267578125, -0.0530242919921875, -0.047130584716796875, -0.04123687744140625, -0.035343170166015625, -0.029449462890625, -0.023555755615234375, -0.01766204833984375, -0.011768341064453125, -0.0058746337890625, 1.9073486328125e-05, 0.00591278076171875, 0.011806488037109375, 0.0177001953125, 0.023593902587890625, 0.02948760986328125, 0.035381317138671875, 0.0412750244140625, 0.047168731689453125, 0.05306243896484375, 0.058956146240234375, 0.064849853515625, 0.07074356079101562, 0.07663726806640625, 0.08253097534179688, 0.0884246826171875, 0.09431838989257812, 0.10021209716796875, 0.10610580444335938, 0.11199951171875, 0.11789321899414062, 0.12378692626953125, 0.12968063354492188, 0.1355743408203125, 0.14146804809570312, 0.14736175537109375, 0.15325546264648438, 0.159149169921875, 0.16504287719726562, 0.17093658447265625, 0.17683029174804688, 0.1827239990234375, 0.18861770629882812, 0.19451141357421875, 0.20040512084960938, 0.206298828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 18.0, 15.0, 20.0, 21.0, 20.0, 21.0, 30.0, 32.0, 31.0, 49.0, 52.0, 58.0, 52.0, 51.0, 58.0, 55.0, 56.0, 43.0, 37.0, 33.0, 40.0, 26.0, 34.0, 22.0, 19.0, 14.0, 6.0, 15.0, 3.0, 11.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03614616394042969, -0.034938812255859375, -0.03373146057128906, -0.03252410888671875, -0.03131675720214844, -0.030109405517578125, -0.028902053833007812, -0.0276947021484375, -0.026487350463867188, -0.025279998779296875, -0.024072647094726562, -0.02286529541015625, -0.021657943725585938, -0.020450592041015625, -0.019243240356445312, -0.018035888671875, -0.016828536987304688, -0.015621185302734375, -0.014413833618164062, -0.01320648193359375, -0.011999130249023438, -0.010791778564453125, -0.009584426879882812, -0.0083770751953125, -0.0071697235107421875, -0.005962371826171875, -0.0047550201416015625, -0.00354766845703125, -0.0023403167724609375, -0.001132965087890625, 7.43865966796875e-05, 0.00128173828125, 0.0024890899658203125, 0.003696441650390625, 0.0049037933349609375, 0.00611114501953125, 0.0073184967041015625, 0.008525848388671875, 0.009733200073242188, 0.0109405517578125, 0.012147903442382812, 0.013355255126953125, 0.014562606811523438, 0.01576995849609375, 0.016977310180664062, 0.018184661865234375, 0.019392013549804688, 0.020599365234375, 0.021806716918945312, 0.023014068603515625, 0.024221420288085938, 0.02542877197265625, 0.026636123657226562, 0.027843475341796875, 0.029050827026367188, 0.0302581787109375, 0.03146553039550781, 0.032672882080078125, 0.03388023376464844, 0.03508758544921875, 0.03629493713378906, 0.037502288818359375, 0.03870964050292969, 0.0399169921875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 8.0, 16.0, 19.0, 25.0, 28.0, 39.0, 41.0, 36.0, 45.0, 47.0, 68.0, 58.0, 65.0, 56.0, 54.0, 53.0, 37.0, 33.0, 34.0, 24.0, 37.0, 28.0, 29.0, 18.0, 18.0, 10.0, 4.0, 8.0, 8.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8160393238067627, -1.7665389776229858, -1.717038631439209, -1.6675382852554321, -1.6180379390716553, -1.5685375928878784, -1.5190372467041016, -1.4695369005203247, -1.4200365543365479, -1.370536208152771, -1.3210358619689941, -1.2715355157852173, -1.2220351696014404, -1.1725348234176636, -1.1230344772338867, -1.0735341310501099, -1.024033784866333, -0.9745334386825562, -0.9250330924987793, -0.8755327463150024, -0.8260324001312256, -0.7765320539474487, -0.7270317077636719, -0.677531361579895, -0.6280310153961182, -0.5785306692123413, -0.5290303230285645, -0.4795299768447876, -0.43002963066101074, -0.3805292844772339, -0.33102893829345703, -0.2815285921096802, -0.23202836513519287, -0.18252801895141602, -0.13302767276763916, -0.0835273265838623, -0.03402698040008545, 0.015473365783691406, 0.06497371196746826, 0.11447405815124512, 0.16397440433502197, 0.21347475051879883, 0.2629750967025757, 0.31247544288635254, 0.3619757890701294, 0.41147613525390625, 0.4609764814376831, 0.51047682762146, 0.5599771738052368, 0.6094775199890137, 0.6589778661727905, 0.7084782123565674, 0.7579785585403442, 0.8074789047241211, 0.856979250907898, 0.9064795970916748, 0.9559799432754517, 1.0054802894592285, 1.0549806356430054, 1.1044809818267822, 1.153981328010559, 1.203481674194336, 1.2529820203781128, 1.3024823665618896, 1.3519827127456665]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 7.0, 9.0, 15.0, 18.0, 16.0, 24.0, 37.0, 28.0, 43.0, 36.0, 39.0, 40.0, 34.0, 42.0, 44.0, 35.0, 42.0, 51.0, 42.0, 36.0, 42.0, 31.0, 41.0, 35.0, 26.0, 28.0, 22.0, 20.0, 20.0, 21.0, 14.0, 10.0, 14.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1101436614990234, -1.0721240043640137, -1.0341042280197144, -0.9960845112800598, -0.9580647945404053, -0.9200450778007507, -0.8820253610610962, -0.8440056443214417, -0.8059859275817871, -0.7679662108421326, -0.729946494102478, -0.6919267773628235, -0.653907060623169, -0.6158873438835144, -0.5778676271438599, -0.5398479104042053, -0.5018281936645508, -0.46380847692489624, -0.4257887601852417, -0.38776904344558716, -0.3497493267059326, -0.3117296099662781, -0.27370989322662354, -0.235690176486969, -0.19767045974731445, -0.1596507430076599, -0.12163102626800537, -0.08361130952835083, -0.04559159278869629, -0.007571876049041748, 0.030447840690612793, 0.06846755743026733, 0.10648727416992188, 0.14450699090957642, 0.18252670764923096, 0.2205464243888855, 0.25856614112854004, 0.2965858578681946, 0.3346055746078491, 0.37262529134750366, 0.4106450080871582, 0.44866472482681274, 0.4866844415664673, 0.5247041583061218, 0.5627238750457764, 0.6007435917854309, 0.6387633085250854, 0.67678302526474, 0.7148027420043945, 0.7528224587440491, 0.7908421754837036, 0.8288618922233582, 0.8668816089630127, 0.9049013257026672, 0.9429210424423218, 0.9809407591819763, 1.0189604759216309, 1.0569801330566406, 1.09499990940094, 1.1330196857452393, 1.171039342880249, 1.2090590000152588, 1.247078776359558, 1.2850985527038574, 1.3231182098388672]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 26.0, 32.0, 50.0, 89.0, 123.0, 213.0, 307.0, 545.0, 957.0, 1324.0, 2135.0, 3391.0, 5303.0, 8356.0, 12820.0, 19623.0, 28643.0, 41411.0, 56893.0, 74877.0, 91945.0, 104753.0, 111172.0, 106640.0, 95520.0, 79605.0, 61970.0, 45297.0, 32077.0, 21696.0, 14627.0, 9602.0, 6132.0, 3790.0, 2364.0, 1580.0, 979.0, 593.0, 399.0, 286.0, 143.0, 86.0, 69.0, 29.0, 27.0, 21.0, 11.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.94384765625, -0.9149322509765625, -0.886016845703125, -0.8571014404296875, -0.82818603515625, -0.7992706298828125, -0.770355224609375, -0.7414398193359375, -0.7125244140625, -0.6836090087890625, -0.654693603515625, -0.6257781982421875, -0.59686279296875, -0.5679473876953125, -0.539031982421875, -0.5101165771484375, -0.481201171875, -0.4522857666015625, -0.423370361328125, -0.3944549560546875, -0.36553955078125, -0.3366241455078125, -0.307708740234375, -0.2787933349609375, -0.2498779296875, -0.2209625244140625, -0.192047119140625, -0.1631317138671875, -0.13421630859375, -0.1053009033203125, -0.076385498046875, -0.0474700927734375, -0.0185546875, 0.0103607177734375, 0.039276123046875, 0.0681915283203125, 0.09710693359375, 0.1260223388671875, 0.154937744140625, 0.1838531494140625, 0.2127685546875, 0.2416839599609375, 0.270599365234375, 0.2995147705078125, 0.32843017578125, 0.3573455810546875, 0.386260986328125, 0.4151763916015625, 0.444091796875, 0.4730072021484375, 0.501922607421875, 0.5308380126953125, 0.55975341796875, 0.5886688232421875, 0.617584228515625, 0.6464996337890625, 0.6754150390625, 0.7043304443359375, 0.733245849609375, 0.7621612548828125, 0.79107666015625, 0.8199920654296875, 0.848907470703125, 0.8778228759765625, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 16.0, 11.0, 19.0, 17.0, 34.0, 24.0, 28.0, 44.0, 40.0, 36.0, 35.0, 45.0, 46.0, 40.0, 49.0, 59.0, 46.0, 45.0, 35.0, 36.0, 32.0, 34.0, 42.0, 31.0, 20.0, 20.0, 15.0, 20.0, 15.0, 14.0, 6.0, 12.0, 8.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0507049560546875, -1.008636474609375, -0.9665679931640625, -0.92449951171875, -0.8824310302734375, -0.840362548828125, -0.7982940673828125, -0.7562255859375, -0.7141571044921875, -0.672088623046875, -0.6300201416015625, -0.58795166015625, -0.5458831787109375, -0.503814697265625, -0.4617462158203125, -0.419677734375, -0.3776092529296875, -0.335540771484375, -0.2934722900390625, -0.25140380859375, -0.2093353271484375, -0.167266845703125, -0.1251983642578125, -0.0831298828125, -0.0410614013671875, 0.001007080078125, 0.0430755615234375, 0.08514404296875, 0.1272125244140625, 0.169281005859375, 0.2113494873046875, 0.25341796875, 0.2954864501953125, 0.337554931640625, 0.3796234130859375, 0.42169189453125, 0.4637603759765625, 0.505828857421875, 0.5478973388671875, 0.5899658203125, 0.6320343017578125, 0.674102783203125, 0.7161712646484375, 0.75823974609375, 0.8003082275390625, 0.842376708984375, 0.8844451904296875, 0.926513671875, 0.9685821533203125, 1.010650634765625, 1.0527191162109375, 1.09478759765625, 1.1368560791015625, 1.178924560546875, 1.2209930419921875, 1.2630615234375, 1.3051300048828125, 1.347198486328125, 1.3892669677734375, 1.43133544921875, 1.4734039306640625, 1.515472412109375, 1.5575408935546875, 1.599609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 11.0, 20.0, 30.0, 46.0, 59.0, 118.0, 220.0, 298.0, 528.0, 846.0, 1370.0, 2109.0, 3427.0, 5542.0, 8731.0, 13722.0, 20852.0, 31190.0, 44331.0, 61992.0, 80846.0, 97880.0, 110067.0, 113781.0, 106870.0, 93017.0, 74861.0, 56971.0, 40357.0, 27822.0, 18451.0, 12064.0, 7561.0, 4733.0, 2944.0, 1789.0, 1118.0, 739.0, 457.0, 305.0, 193.0, 100.0, 69.0, 30.0, 30.0, 15.0, 14.0, 8.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0], "bins": [-0.994140625, -0.9643325805664062, -0.9345245361328125, -0.9047164916992188, -0.874908447265625, -0.8451004028320312, -0.8152923583984375, -0.7854843139648438, -0.75567626953125, -0.7258682250976562, -0.6960601806640625, -0.6662521362304688, -0.636444091796875, -0.6066360473632812, -0.5768280029296875, -0.5470199584960938, -0.5172119140625, -0.48740386962890625, -0.4575958251953125, -0.42778778076171875, -0.397979736328125, -0.36817169189453125, -0.3383636474609375, -0.30855560302734375, -0.27874755859375, -0.24893951416015625, -0.2191314697265625, -0.18932342529296875, -0.159515380859375, -0.12970733642578125, -0.0998992919921875, -0.07009124755859375, -0.040283203125, -0.01047515869140625, 0.0193328857421875, 0.04914093017578125, 0.078948974609375, 0.10875701904296875, 0.1385650634765625, 0.16837310791015625, 0.19818115234375, 0.22798919677734375, 0.2577972412109375, 0.28760528564453125, 0.317413330078125, 0.34722137451171875, 0.3770294189453125, 0.40683746337890625, 0.4366455078125, 0.46645355224609375, 0.4962615966796875, 0.5260696411132812, 0.555877685546875, 0.5856857299804688, 0.6154937744140625, 0.6453018188476562, 0.67510986328125, 0.7049179077148438, 0.7347259521484375, 0.7645339965820312, 0.794342041015625, 0.8241500854492188, 0.8539581298828125, 0.8837661743164062, 0.91357421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 15.0, 13.0, 21.0, 20.0, 18.0, 36.0, 26.0, 24.0, 36.0, 28.0, 25.0, 32.0, 38.0, 37.0, 47.0, 38.0, 49.0, 39.0, 31.0, 40.0, 36.0, 32.0, 33.0, 33.0, 20.0, 23.0, 31.0, 22.0, 14.0, 22.0, 16.0, 18.0, 8.0, 7.0, 10.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64013671875, -0.6192398071289062, -0.5983428955078125, -0.5774459838867188, -0.556549072265625, -0.5356521606445312, -0.5147552490234375, -0.49385833740234375, -0.47296142578125, -0.45206451416015625, -0.4311676025390625, -0.41027069091796875, -0.389373779296875, -0.36847686767578125, -0.3475799560546875, -0.32668304443359375, -0.3057861328125, -0.28488922119140625, -0.2639923095703125, -0.24309539794921875, -0.222198486328125, -0.20130157470703125, -0.1804046630859375, -0.15950775146484375, -0.13861083984375, -0.11771392822265625, -0.0968170166015625, -0.07592010498046875, -0.055023193359375, -0.03412628173828125, -0.0132293701171875, 0.00766754150390625, 0.028564453125, 0.04946136474609375, 0.0703582763671875, 0.09125518798828125, 0.112152099609375, 0.13304901123046875, 0.1539459228515625, 0.17484283447265625, 0.19573974609375, 0.21663665771484375, 0.2375335693359375, 0.25843048095703125, 0.279327392578125, 0.30022430419921875, 0.3211212158203125, 0.34201812744140625, 0.3629150390625, 0.38381195068359375, 0.4047088623046875, 0.42560577392578125, 0.446502685546875, 0.46739959716796875, 0.4882965087890625, 0.5091934204101562, 0.53009033203125, 0.5509872436523438, 0.5718841552734375, 0.5927810668945312, 0.613677978515625, 0.6345748901367188, 0.6554718017578125, 0.6763687133789062, 0.697265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 9.0, 13.0, 28.0, 39.0, 57.0, 80.0, 105.0, 176.0, 293.0, 362.0, 572.0, 869.0, 1393.0, 2049.0, 3130.0, 4786.0, 7342.0, 11471.0, 17431.0, 26727.0, 40727.0, 60185.0, 85102.0, 109918.0, 128765.0, 131837.0, 117383.0, 93379.0, 68122.0, 46839.0, 31012.0, 20376.0, 13225.0, 8566.0, 5604.0, 3639.0, 2322.0, 1581.0, 1031.0, 674.0, 448.0, 314.0, 190.0, 130.0, 89.0, 53.0, 45.0, 26.0, 14.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4667091369628906, -0.45124053955078125, -0.4357719421386719, -0.4203033447265625, -0.4048347473144531, -0.38936614990234375, -0.3738975524902344, -0.358428955078125, -0.3429603576660156, -0.32749176025390625, -0.3120231628417969, -0.2965545654296875, -0.2810859680175781, -0.26561737060546875, -0.2501487731933594, -0.23468017578125, -0.21921157836914062, -0.20374298095703125, -0.18827438354492188, -0.1728057861328125, -0.15733718872070312, -0.14186859130859375, -0.12639999389648438, -0.110931396484375, -0.09546279907226562, -0.07999420166015625, -0.06452560424804688, -0.0490570068359375, -0.033588409423828125, -0.01811981201171875, -0.002651214599609375, 0.0128173828125, 0.028285980224609375, 0.04375457763671875, 0.059223175048828125, 0.0746917724609375, 0.09016036987304688, 0.10562896728515625, 0.12109756469726562, 0.136566162109375, 0.15203475952148438, 0.16750335693359375, 0.18297195434570312, 0.1984405517578125, 0.21390914916992188, 0.22937774658203125, 0.24484634399414062, 0.26031494140625, 0.2757835388183594, 0.29125213623046875, 0.3067207336425781, 0.3221893310546875, 0.3376579284667969, 0.35312652587890625, 0.3685951232910156, 0.384063720703125, 0.3995323181152344, 0.41500091552734375, 0.4304695129394531, 0.4459381103515625, 0.4614067077636719, 0.47687530517578125, 0.4923439025878906, 0.5078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 12.0, 16.0, 12.0, 15.0, 31.0, 29.0, 23.0, 29.0, 22.0, 39.0, 46.0, 54.0, 41.0, 65.0, 65.0, 37.0, 56.0, 56.0, 42.0, 33.0, 39.0, 30.0, 32.0, 28.0, 24.0, 16.0, 13.0, 20.0, 7.0, 5.0, 7.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.251169204711914e-05, -5.0866976380348206e-05, -4.922226071357727e-05, -4.7577545046806335e-05, -4.59328293800354e-05, -4.4288113713264465e-05, -4.264339804649353e-05, -4.0998682379722595e-05, -3.935396671295166e-05, -3.7709251046180725e-05, -3.606453537940979e-05, -3.4419819712638855e-05, -3.277510404586792e-05, -3.1130388379096985e-05, -2.948567271232605e-05, -2.7840957045555115e-05, -2.619624137878418e-05, -2.4551525712013245e-05, -2.290681004524231e-05, -2.1262094378471375e-05, -1.961737871170044e-05, -1.7972663044929504e-05, -1.632794737815857e-05, -1.4683231711387634e-05, -1.30385160446167e-05, -1.1393800377845764e-05, -9.749084711074829e-06, -8.104369044303894e-06, -6.459653377532959e-06, -4.814937710762024e-06, -3.170222043991089e-06, -1.5255063772201538e-06, 1.1920928955078125e-07, 1.7639249563217163e-06, 3.4086406230926514e-06, 5.0533562898635864e-06, 6.6980719566345215e-06, 8.342787623405457e-06, 9.987503290176392e-06, 1.1632218956947327e-05, 1.3276934623718262e-05, 1.4921650290489197e-05, 1.6566365957260132e-05, 1.8211081624031067e-05, 1.9855797290802002e-05, 2.1500512957572937e-05, 2.3145228624343872e-05, 2.4789944291114807e-05, 2.6434659957885742e-05, 2.8079375624656677e-05, 2.9724091291427612e-05, 3.136880695819855e-05, 3.301352262496948e-05, 3.465823829174042e-05, 3.630295395851135e-05, 3.794766962528229e-05, 3.959238529205322e-05, 4.123710095882416e-05, 4.288181662559509e-05, 4.452653229236603e-05, 4.617124795913696e-05, 4.78159636259079e-05, 4.946067929267883e-05, 5.110539495944977e-05, 5.27501106262207e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 16.0, 39.0, 50.0, 65.0, 134.0, 187.0, 283.0, 476.0, 726.0, 1181.0, 1872.0, 2903.0, 4727.0, 7476.0, 11813.0, 18170.0, 29183.0, 44470.0, 66653.0, 92804.0, 118968.0, 135421.0, 133745.0, 115551.0, 86846.0, 61254.0, 40689.0, 26670.0, 17076.0, 10621.0, 6882.0, 4290.0, 2694.0, 1713.0, 1105.0, 652.0, 429.0, 271.0, 167.0, 97.0, 64.0, 44.0, 27.0, 12.0, 11.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.490478515625, -0.4746055603027344, -0.45873260498046875, -0.4428596496582031, -0.4269866943359375, -0.4111137390136719, -0.39524078369140625, -0.3793678283691406, -0.363494873046875, -0.3476219177246094, -0.33174896240234375, -0.3158760070800781, -0.3000030517578125, -0.2841300964355469, -0.26825714111328125, -0.2523841857910156, -0.23651123046875, -0.22063827514648438, -0.20476531982421875, -0.18889236450195312, -0.1730194091796875, -0.15714645385742188, -0.14127349853515625, -0.12540054321289062, -0.109527587890625, -0.09365463256835938, -0.07778167724609375, -0.061908721923828125, -0.0460357666015625, -0.030162811279296875, -0.01428985595703125, 0.001583099365234375, 0.0174560546875, 0.033329010009765625, 0.04920196533203125, 0.06507492065429688, 0.0809478759765625, 0.09682083129882812, 0.11269378662109375, 0.12856674194335938, 0.144439697265625, 0.16031265258789062, 0.17618560791015625, 0.19205856323242188, 0.2079315185546875, 0.22380447387695312, 0.23967742919921875, 0.2555503845214844, 0.27142333984375, 0.2872962951660156, 0.30316925048828125, 0.3190422058105469, 0.3349151611328125, 0.3507881164550781, 0.36666107177734375, 0.3825340270996094, 0.398406982421875, 0.4142799377441406, 0.43015289306640625, 0.4460258483886719, 0.4618988037109375, 0.4777717590332031, 0.49364471435546875, 0.5095176696777344, 0.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 2.0, 14.0, 13.0, 24.0, 11.0, 17.0, 27.0, 24.0, 21.0, 28.0, 42.0, 51.0, 46.0, 50.0, 50.0, 59.0, 42.0, 53.0, 42.0, 57.0, 41.0, 32.0, 41.0, 28.0, 20.0, 30.0, 23.0, 22.0, 15.0, 10.0, 11.0, 11.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15713119506835938, -0.15166473388671875, -0.14619827270507812, -0.1407318115234375, -0.13526535034179688, -0.12979888916015625, -0.12433242797851562, -0.118865966796875, -0.11339950561523438, -0.10793304443359375, -0.10246658325195312, -0.0970001220703125, -0.09153366088867188, -0.08606719970703125, -0.08060073852539062, -0.07513427734375, -0.06966781616210938, -0.06420135498046875, -0.058734893798828125, -0.0532684326171875, -0.047801971435546875, -0.04233551025390625, -0.036869049072265625, -0.031402587890625, -0.025936126708984375, -0.02046966552734375, -0.015003204345703125, -0.0095367431640625, -0.004070281982421875, 0.00139617919921875, 0.006862640380859375, 0.0123291015625, 0.017795562744140625, 0.02326202392578125, 0.028728485107421875, 0.0341949462890625, 0.039661407470703125, 0.04512786865234375, 0.050594329833984375, 0.056060791015625, 0.061527252197265625, 0.06699371337890625, 0.07246017456054688, 0.0779266357421875, 0.08339309692382812, 0.08885955810546875, 0.09432601928710938, 0.09979248046875, 0.10525894165039062, 0.11072540283203125, 0.11619186401367188, 0.1216583251953125, 0.12712478637695312, 0.13259124755859375, 0.13805770874023438, 0.143524169921875, 0.14899063110351562, 0.15445709228515625, 0.15992355346679688, 0.1653900146484375, 0.17085647583007812, 0.17632293701171875, 0.18178939819335938, 0.187255859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 16.0, 14.0, 26.0, 29.0, 39.0, 40.0, 32.0, 54.0, 54.0, 50.0, 51.0, 63.0, 69.0, 47.0, 55.0, 34.0, 36.0, 35.0, 30.0, 34.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.7850890159606934, -1.737668514251709, -1.6902481317520142, -1.6428276300430298, -1.5954071283340454, -1.5479867458343506, -1.5005662441253662, -1.4531457424163818, -1.4057252407073975, -1.358304738998413, -1.3108843564987183, -1.2634638547897339, -1.2160433530807495, -1.1686229705810547, -1.1212024688720703, -1.073781967163086, -1.0263615846633911, -0.9789411425590515, -0.9315206408500671, -0.8841001987457275, -0.8366796970367432, -0.7892592549324036, -0.741838812828064, -0.6944183111190796, -0.64699786901474, -0.5995774269104004, -0.552156925201416, -0.5047364830970764, -0.45731601119041443, -0.40989553928375244, -0.36247509717941284, -0.31505462527275085, -0.2676340341567993, -0.22021356225013733, -0.17279310524463654, -0.12537264823913574, -0.07795217633247375, -0.030531704425811768, 0.016888737678527832, 0.06430920958518982, 0.1117296814918518, 0.1591501533985138, 0.2065706104040146, 0.2539910674095154, 0.30141153931617737, 0.34883201122283936, 0.39625245332717896, 0.44367292523384094, 0.49109339714050293, 0.5385138392448425, 0.5859343409538269, 0.6333547830581665, 0.6807752847671509, 0.7281957268714905, 0.7756161689758301, 0.8230366706848145, 0.870457112789154, 0.9178775548934937, 0.965298056602478, 1.0127184391021729, 1.0601389408111572, 1.1075594425201416, 1.154979944229126, 1.2024003267288208, 1.2498208284378052]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 4.0, 13.0, 13.0, 15.0, 23.0, 22.0, 22.0, 45.0, 25.0, 33.0, 36.0, 41.0, 47.0, 27.0, 28.0, 49.0, 44.0, 39.0, 46.0, 38.0, 50.0, 39.0, 27.0, 35.0, 34.0, 28.0, 18.0, 20.0, 23.0, 17.0, 17.0, 21.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1418660879135132, -1.1035720109939575, -1.0652778148651123, -1.0269837379455566, -0.988689661026001, -0.9503955841064453, -0.9121014475822449, -0.8738073110580444, -0.8355132341384888, -0.7972191572189331, -0.7589250206947327, -0.7206308841705322, -0.6823368072509766, -0.6440427303314209, -0.6057485938072205, -0.56745445728302, -0.5291603803634644, -0.4908662736415863, -0.45257216691970825, -0.4142780601978302, -0.37598395347595215, -0.3376898467540741, -0.29939574003219604, -0.261101633310318, -0.22280752658843994, -0.1845134198665619, -0.14621931314468384, -0.10792520642280579, -0.06963109970092773, -0.03133699297904968, 0.006957113742828369, 0.04525122046470642, 0.08354544639587402, 0.12183955311775208, 0.16013365983963013, 0.19842776656150818, 0.23672187328338623, 0.2750159800052643, 0.31331008672714233, 0.3516041934490204, 0.38989830017089844, 0.4281924068927765, 0.46648651361465454, 0.504780650138855, 0.5430747270584106, 0.5813688039779663, 0.6196629405021667, 0.6579570770263672, 0.6962511539459229, 0.7345452308654785, 0.772839367389679, 0.8111335039138794, 0.8494275808334351, 0.8877216577529907, 0.9260157942771912, 0.9643099308013916, 1.0026040077209473, 1.040898084640503, 1.0791921615600586, 1.1174863576889038, 1.1557804346084595, 1.1940745115280151, 1.2323687076568604, 1.270662784576416, 1.3089568614959717]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 12.0, 19.0, 27.0, 56.0, 92.0, 177.0, 259.0, 522.0, 890.0, 1499.0, 2833.0, 5345.0, 9825.0, 18294.0, 34720.0, 65267.0, 122446.0, 224053.0, 385772.0, 589798.0, 738902.0, 710247.0, 533755.0, 335285.0, 191041.0, 104108.0, 55782.0, 29337.0, 15295.0, 8283.0, 4550.0, 2502.0, 1361.0, 812.0, 426.0, 246.0, 168.0, 84.0, 74.0, 40.0, 26.0, 17.0, 20.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.4482421875, -1.405487060546875, -1.36273193359375, -1.319976806640625, -1.2772216796875, -1.234466552734375, -1.19171142578125, -1.148956298828125, -1.106201171875, -1.063446044921875, -1.02069091796875, -0.977935791015625, -0.9351806640625, -0.892425537109375, -0.84967041015625, -0.806915283203125, -0.76416015625, -0.721405029296875, -0.67864990234375, -0.635894775390625, -0.5931396484375, -0.550384521484375, -0.50762939453125, -0.464874267578125, -0.422119140625, -0.379364013671875, -0.33660888671875, -0.293853759765625, -0.2510986328125, -0.208343505859375, -0.16558837890625, -0.122833251953125, -0.080078125, -0.037322998046875, 0.00543212890625, 0.048187255859375, 0.0909423828125, 0.133697509765625, 0.17645263671875, 0.219207763671875, 0.261962890625, 0.304718017578125, 0.34747314453125, 0.390228271484375, 0.4329833984375, 0.475738525390625, 0.51849365234375, 0.561248779296875, 0.60400390625, 0.646759033203125, 0.68951416015625, 0.732269287109375, 0.7750244140625, 0.817779541015625, 0.86053466796875, 0.903289794921875, 0.946044921875, 0.988800048828125, 1.03155517578125, 1.074310302734375, 1.1170654296875, 1.159820556640625, 1.20257568359375, 1.245330810546875, 1.2880859375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 15.0, 17.0, 25.0, 27.0, 21.0, 19.0, 21.0, 32.0, 40.0, 38.0, 42.0, 29.0, 26.0, 51.0, 42.0, 52.0, 33.0, 46.0, 47.0, 39.0, 43.0, 25.0, 31.0, 29.0, 31.0, 20.0, 20.0, 29.0, 21.0, 7.0, 18.0, 10.0, 10.0, 5.0, 1.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.8899612426757812, -0.8619537353515625, -0.8339462280273438, -0.805938720703125, -0.7779312133789062, -0.7499237060546875, -0.7219161987304688, -0.69390869140625, -0.6659011840820312, -0.6378936767578125, -0.6098861694335938, -0.581878662109375, -0.5538711547851562, -0.5258636474609375, -0.49785614013671875, -0.4698486328125, -0.44184112548828125, -0.4138336181640625, -0.38582611083984375, -0.357818603515625, -0.32981109619140625, -0.3018035888671875, -0.27379608154296875, -0.24578857421875, -0.21778106689453125, -0.1897735595703125, -0.16176605224609375, -0.133758544921875, -0.10575103759765625, -0.0777435302734375, -0.04973602294921875, -0.021728515625, 0.00627899169921875, 0.0342864990234375, 0.06229400634765625, 0.090301513671875, 0.11830902099609375, 0.1463165283203125, 0.17432403564453125, 0.20233154296875, 0.23033905029296875, 0.2583465576171875, 0.28635406494140625, 0.314361572265625, 0.34236907958984375, 0.3703765869140625, 0.39838409423828125, 0.4263916015625, 0.45439910888671875, 0.4824066162109375, 0.5104141235351562, 0.538421630859375, 0.5664291381835938, 0.5944366455078125, 0.6224441528320312, 0.65045166015625, 0.6784591674804688, 0.7064666748046875, 0.7344741821289062, 0.762481689453125, 0.7904891967773438, 0.8184967041015625, 0.8465042114257812, 0.87451171875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 7.0, 18.0, 25.0, 51.0, 72.0, 67.0, 141.0, 243.0, 335.0, 561.0, 1030.0, 1663.0, 2766.0, 4650.0, 8010.0, 13360.0, 22186.0, 37924.0, 62782.0, 101553.0, 160775.0, 241775.0, 344058.0, 448981.0, 525655.0, 539371.0, 487189.0, 392118.0, 285105.0, 193315.0, 124145.0, 77481.0, 47066.0, 28337.0, 16965.0, 9878.0, 5880.0, 3423.0, 2081.0, 1253.0, 748.0, 466.0, 281.0, 191.0, 98.0, 94.0, 32.0, 29.0, 17.0, 9.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0810546875, -1.0475006103515625, -1.013946533203125, -0.9803924560546875, -0.94683837890625, -0.9132843017578125, -0.879730224609375, -0.8461761474609375, -0.8126220703125, -0.7790679931640625, -0.745513916015625, -0.7119598388671875, -0.67840576171875, -0.6448516845703125, -0.611297607421875, -0.5777435302734375, -0.544189453125, -0.5106353759765625, -0.477081298828125, -0.4435272216796875, -0.40997314453125, -0.3764190673828125, -0.342864990234375, -0.3093109130859375, -0.2757568359375, -0.2422027587890625, -0.208648681640625, -0.1750946044921875, -0.14154052734375, -0.1079864501953125, -0.074432373046875, -0.0408782958984375, -0.00732421875, 0.0262298583984375, 0.059783935546875, 0.0933380126953125, 0.12689208984375, 0.1604461669921875, 0.194000244140625, 0.2275543212890625, 0.2611083984375, 0.2946624755859375, 0.328216552734375, 0.3617706298828125, 0.39532470703125, 0.4288787841796875, 0.462432861328125, 0.4959869384765625, 0.529541015625, 0.5630950927734375, 0.596649169921875, 0.6302032470703125, 0.66375732421875, 0.6973114013671875, 0.730865478515625, 0.7644195556640625, 0.7979736328125, 0.8315277099609375, 0.865081787109375, 0.8986358642578125, 0.93218994140625, 0.9657440185546875, 0.999298095703125, 1.0328521728515625, 1.06640625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 24.0, 41.0, 53.0, 59.0, 85.0, 88.0, 123.0, 118.0, 134.0, 151.0, 188.0, 166.0, 209.0, 222.0, 229.0, 237.0, 239.0, 211.0, 209.0, 209.0, 158.0, 149.0, 123.0, 124.0, 94.0, 85.0, 55.0, 47.0, 40.0, 32.0, 26.0, 10.0, 19.0, 13.0, 7.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42724609375, -0.4130363464355469, -0.39882659912109375, -0.3846168518066406, -0.3704071044921875, -0.3561973571777344, -0.34198760986328125, -0.3277778625488281, -0.313568115234375, -0.2993583679199219, -0.28514862060546875, -0.2709388732910156, -0.2567291259765625, -0.24251937866210938, -0.22830963134765625, -0.21409988403320312, -0.19989013671875, -0.18568038940429688, -0.17147064208984375, -0.15726089477539062, -0.1430511474609375, -0.12884140014648438, -0.11463165283203125, -0.10042190551757812, -0.086212158203125, -0.07200241088867188, -0.05779266357421875, -0.043582916259765625, -0.0293731689453125, -0.015163421630859375, -0.00095367431640625, 0.013256072998046875, 0.0274658203125, 0.041675567626953125, 0.05588531494140625, 0.07009506225585938, 0.0843048095703125, 0.09851455688476562, 0.11272430419921875, 0.12693405151367188, 0.141143798828125, 0.15535354614257812, 0.16956329345703125, 0.18377304077148438, 0.1979827880859375, 0.21219253540039062, 0.22640228271484375, 0.24061203002929688, 0.25482177734375, 0.2690315246582031, 0.28324127197265625, 0.2974510192871094, 0.3116607666015625, 0.3258705139160156, 0.34008026123046875, 0.3542900085449219, 0.368499755859375, 0.3827095031738281, 0.39691925048828125, 0.4111289978027344, 0.4253387451171875, 0.4395484924316406, 0.45375823974609375, 0.4679679870605469, 0.482177734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 9.0, 14.0, 20.0, 25.0, 24.0, 28.0, 39.0, 43.0, 30.0, 36.0, 57.0, 52.0, 59.0, 59.0, 58.0, 53.0, 52.0, 48.0, 29.0, 37.0, 35.0, 20.0, 32.0, 22.0, 15.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.469054102897644, -1.4224615097045898, -1.3758689165115356, -1.3292763233184814, -1.2826837301254272, -1.236091136932373, -1.1894984245300293, -1.1429059505462646, -1.096313238143921, -1.0497206449508667, -1.0031280517578125, -0.9565354585647583, -0.9099428653717041, -0.8633502721786499, -0.8167576193809509, -0.7701650261878967, -0.7235724925994873, -0.6769798994064331, -0.6303873062133789, -0.5837947130203247, -0.5372021198272705, -0.4906094968318939, -0.44401687383651733, -0.39742428064346313, -0.35083168745040894, -0.30423909425735474, -0.25764650106430054, -0.21105387806892395, -0.16446128487586975, -0.11786869168281555, -0.07127606868743896, -0.024683475494384766, 0.021908998489379883, 0.06850159913301468, 0.11509419977664948, 0.16168680787086487, 0.20827940106391907, 0.25487199425697327, 0.30146461725234985, 0.34805721044540405, 0.39464980363845825, 0.44124239683151245, 0.48783499002456665, 0.5344276428222656, 0.5810202360153198, 0.627612829208374, 0.6742054224014282, 0.7207980155944824, 0.7673906087875366, 0.8139832019805908, 0.860575795173645, 0.9071683883666992, 0.9537609815597534, 1.0003535747528076, 1.0469462871551514, 1.093538761138916, 1.1401314735412598, 1.186724066734314, 1.2333166599273682, 1.2799092531204224, 1.3265018463134766, 1.3730944395065308, 1.419687032699585, 1.4662797451019287, 1.5128722190856934]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 10.0, 17.0, 10.0, 19.0, 20.0, 32.0, 23.0, 33.0, 33.0, 26.0, 35.0, 41.0, 45.0, 48.0, 43.0, 38.0, 35.0, 42.0, 29.0, 45.0, 32.0, 40.0, 36.0, 29.0, 24.0, 29.0, 20.0, 24.0, 19.0, 24.0, 12.0, 9.0, 11.0, 8.0, 13.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.993068277835846, -0.9603825807571411, -0.927696943283081, -0.8950112462043762, -0.8623255491256714, -0.8296399116516113, -0.7969542145729065, -0.7642685174942017, -0.7315828800201416, -0.6988971829414368, -0.6662115454673767, -0.6335258483886719, -0.6008402109146118, -0.568154513835907, -0.5354688167572021, -0.5027831792831421, -0.47009748220443726, -0.4374118149280548, -0.40472614765167236, -0.37204045057296753, -0.3393547832965851, -0.30666911602020264, -0.2739834189414978, -0.24129775166511536, -0.2086120843887329, -0.17592641711235046, -0.14324073493480682, -0.11055506020784378, -0.07786938548088074, -0.04518371820449829, -0.012498036026954651, 0.02018764615058899, 0.05287337303161621, 0.08555904775857925, 0.1182447224855423, 0.15093040466308594, 0.18361607193946838, 0.21630173921585083, 0.24898742139339447, 0.2816731035709381, 0.31435877084732056, 0.347044438123703, 0.37973010540008545, 0.4124158024787903, 0.44510146975517273, 0.4777871370315552, 0.51047283411026, 0.5431585311889648, 0.5758441686630249, 0.6085298657417297, 0.6412155032157898, 0.6739012002944946, 0.7065868377685547, 0.7392725348472595, 0.7719582319259644, 0.8046438694000244, 0.8373295664787292, 0.8700152635574341, 0.9027009010314941, 0.935386598110199, 0.9680722951889038, 1.0007579326629639, 1.033443570137024, 1.0661293268203735, 1.0988149642944336]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 8.0, 12.0, 21.0, 21.0, 49.0, 48.0, 90.0, 155.0, 191.0, 355.0, 591.0, 955.0, 1472.0, 2410.0, 4068.0, 6547.0, 10696.0, 17770.0, 29482.0, 48878.0, 79344.0, 122158.0, 168576.0, 177988.0, 138252.0, 91985.0, 57556.0, 34994.0, 21108.0, 12825.0, 7760.0, 4588.0, 2954.0, 1733.0, 1023.0, 651.0, 440.0, 287.0, 167.0, 119.0, 69.0, 50.0, 25.0, 24.0, 16.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.315673828125, -0.3061561584472656, -0.29663848876953125, -0.2871208190917969, -0.2776031494140625, -0.2680854797363281, -0.25856781005859375, -0.24905014038085938, -0.239532470703125, -0.23001480102539062, -0.22049713134765625, -0.21097946166992188, -0.2014617919921875, -0.19194412231445312, -0.18242645263671875, -0.17290878295898438, -0.16339111328125, -0.15387344360351562, -0.14435577392578125, -0.13483810424804688, -0.1253204345703125, -0.11580276489257812, -0.10628509521484375, -0.09676742553710938, -0.087249755859375, -0.07773208618164062, -0.06821441650390625, -0.058696746826171875, -0.0491790771484375, -0.039661407470703125, -0.03014373779296875, -0.020626068115234375, -0.0111083984375, -0.001590728759765625, 0.00792694091796875, 0.017444610595703125, 0.0269622802734375, 0.036479949951171875, 0.04599761962890625, 0.055515289306640625, 0.065032958984375, 0.07455062866210938, 0.08406829833984375, 0.09358596801757812, 0.1031036376953125, 0.11262130737304688, 0.12213897705078125, 0.13165664672851562, 0.14117431640625, 0.15069198608398438, 0.16020965576171875, 0.16972732543945312, 0.1792449951171875, 0.18876266479492188, 0.19828033447265625, 0.20779800415039062, 0.217315673828125, 0.22683334350585938, 0.23635101318359375, 0.24586868286132812, 0.2553863525390625, 0.2649040222167969, 0.27442169189453125, 0.2839393615722656, 0.29345703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 11.0, 23.0, 14.0, 18.0, 18.0, 30.0, 24.0, 38.0, 27.0, 50.0, 61.0, 48.0, 46.0, 41.0, 48.0, 55.0, 45.0, 42.0, 39.0, 41.0, 37.0, 36.0, 32.0, 21.0, 23.0, 19.0, 19.0, 11.0, 11.0, 15.0, 5.0, 8.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.23504638671875, -1.1947021484375, -1.15435791015625, -1.114013671875, -1.07366943359375, -1.0333251953125, -0.99298095703125, -0.95263671875, -0.91229248046875, -0.8719482421875, -0.83160400390625, -0.791259765625, -0.75091552734375, -0.7105712890625, -0.67022705078125, -0.6298828125, -0.58953857421875, -0.5491943359375, -0.50885009765625, -0.468505859375, -0.42816162109375, -0.3878173828125, -0.34747314453125, -0.30712890625, -0.26678466796875, -0.2264404296875, -0.18609619140625, -0.145751953125, -0.10540771484375, -0.0650634765625, -0.02471923828125, 0.015625, 0.05596923828125, 0.0963134765625, 0.13665771484375, 0.177001953125, 0.21734619140625, 0.2576904296875, 0.29803466796875, 0.33837890625, 0.37872314453125, 0.4190673828125, 0.45941162109375, 0.499755859375, 0.54010009765625, 0.5804443359375, 0.62078857421875, 0.6611328125, 0.70147705078125, 0.7418212890625, 0.78216552734375, 0.822509765625, 0.86285400390625, 0.9031982421875, 0.94354248046875, 0.98388671875, 1.02423095703125, 1.0645751953125, 1.10491943359375, 1.145263671875, 1.18560791015625, 1.2259521484375, 1.26629638671875, 1.306640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 6.0, 6.0, 20.0, 21.0, 41.0, 53.0, 90.0, 135.0, 224.0, 344.0, 597.0, 1046.0, 1847.0, 3292.0, 6116.0, 11655.0, 22439.0, 44921.0, 88282.0, 165038.0, 245352.0, 209021.0, 120249.0, 62166.0, 31260.0, 15929.0, 8079.0, 4618.0, 2368.0, 1313.0, 770.0, 460.0, 283.0, 157.0, 109.0, 81.0, 48.0, 30.0, 17.0, 10.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4267578125, -0.4141082763671875, -0.401458740234375, -0.3888092041015625, -0.37615966796875, -0.3635101318359375, -0.350860595703125, -0.3382110595703125, -0.3255615234375, -0.3129119873046875, -0.300262451171875, -0.2876129150390625, -0.27496337890625, -0.2623138427734375, -0.249664306640625, -0.2370147705078125, -0.224365234375, -0.2117156982421875, -0.199066162109375, -0.1864166259765625, -0.17376708984375, -0.1611175537109375, -0.148468017578125, -0.1358184814453125, -0.1231689453125, -0.1105194091796875, -0.097869873046875, -0.0852203369140625, -0.07257080078125, -0.0599212646484375, -0.047271728515625, -0.0346221923828125, -0.02197265625, -0.0093231201171875, 0.003326416015625, 0.0159759521484375, 0.02862548828125, 0.0412750244140625, 0.053924560546875, 0.0665740966796875, 0.0792236328125, 0.0918731689453125, 0.104522705078125, 0.1171722412109375, 0.12982177734375, 0.1424713134765625, 0.155120849609375, 0.1677703857421875, 0.180419921875, 0.1930694580078125, 0.205718994140625, 0.2183685302734375, 0.23101806640625, 0.2436676025390625, 0.256317138671875, 0.2689666748046875, 0.2816162109375, 0.2942657470703125, 0.306915283203125, 0.3195648193359375, 0.33221435546875, 0.3448638916015625, 0.357513427734375, 0.3701629638671875, 0.3828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 11.0, 10.0, 10.0, 14.0, 23.0, 16.0, 19.0, 23.0, 21.0, 26.0, 28.0, 26.0, 37.0, 38.0, 40.0, 47.0, 38.0, 41.0, 49.0, 32.0, 43.0, 33.0, 35.0, 32.0, 42.0, 35.0, 23.0, 25.0, 19.0, 16.0, 30.0, 10.0, 18.0, 12.0, 14.0, 7.0, 5.0, 5.0, 3.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6044921875, -0.5842742919921875, -0.564056396484375, -0.5438385009765625, -0.52362060546875, -0.5034027099609375, -0.483184814453125, -0.4629669189453125, -0.4427490234375, -0.4225311279296875, -0.402313232421875, -0.3820953369140625, -0.36187744140625, -0.3416595458984375, -0.321441650390625, -0.3012237548828125, -0.281005859375, -0.2607879638671875, -0.240570068359375, -0.2203521728515625, -0.20013427734375, -0.1799163818359375, -0.159698486328125, -0.1394805908203125, -0.1192626953125, -0.0990447998046875, -0.078826904296875, -0.0586090087890625, -0.03839111328125, -0.0181732177734375, 0.002044677734375, 0.0222625732421875, 0.04248046875, 0.0626983642578125, 0.082916259765625, 0.1031341552734375, 0.12335205078125, 0.1435699462890625, 0.163787841796875, 0.1840057373046875, 0.2042236328125, 0.2244415283203125, 0.244659423828125, 0.2648773193359375, 0.28509521484375, 0.3053131103515625, 0.325531005859375, 0.3457489013671875, 0.365966796875, 0.3861846923828125, 0.406402587890625, 0.4266204833984375, 0.44683837890625, 0.4670562744140625, 0.487274169921875, 0.5074920654296875, 0.5277099609375, 0.5479278564453125, 0.568145751953125, 0.5883636474609375, 0.60858154296875, 0.6287994384765625, 0.649017333984375, 0.6692352294921875, 0.689453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 19.0, 18.0, 40.0, 40.0, 82.0, 99.0, 191.0, 249.0, 411.0, 609.0, 887.0, 1549.0, 2450.0, 4303.0, 7593.0, 15093.0, 32191.0, 78715.0, 214299.0, 377292.0, 185032.0, 67972.0, 28689.0, 13487.0, 7011.0, 3928.0, 2280.0, 1451.0, 886.0, 561.0, 391.0, 219.0, 154.0, 104.0, 63.0, 66.0, 41.0, 14.0, 18.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.19189453125, -0.18615341186523438, -0.18041229248046875, -0.17467117309570312, -0.1689300537109375, -0.16318893432617188, -0.15744781494140625, -0.15170669555664062, -0.145965576171875, -0.14022445678710938, -0.13448333740234375, -0.12874221801757812, -0.1230010986328125, -0.11725997924804688, -0.11151885986328125, -0.10577774047851562, -0.10003662109375, -0.09429550170898438, -0.08855438232421875, -0.08281326293945312, -0.0770721435546875, -0.07133102416992188, -0.06558990478515625, -0.059848785400390625, -0.054107666015625, -0.048366546630859375, -0.04262542724609375, -0.036884307861328125, -0.0311431884765625, -0.025402069091796875, -0.01966094970703125, -0.013919830322265625, -0.0081787109375, -0.002437591552734375, 0.00330352783203125, 0.009044647216796875, 0.0147857666015625, 0.020526885986328125, 0.02626800537109375, 0.032009124755859375, 0.037750244140625, 0.043491363525390625, 0.04923248291015625, 0.054973602294921875, 0.0607147216796875, 0.06645584106445312, 0.07219696044921875, 0.07793807983398438, 0.08367919921875, 0.08942031860351562, 0.09516143798828125, 0.10090255737304688, 0.1066436767578125, 0.11238479614257812, 0.11812591552734375, 0.12386703491210938, 0.129608154296875, 0.13534927368164062, 0.14109039306640625, 0.14683151245117188, 0.1525726318359375, 0.15831375122070312, 0.16405487060546875, 0.16979598999023438, 0.175537109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 6.0, 3.0, 14.0, 12.0, 21.0, 24.0, 33.0, 28.0, 30.0, 38.0, 42.0, 46.0, 45.0, 51.0, 39.0, 55.0, 46.0, 45.0, 64.0, 40.0, 55.0, 32.0, 24.0, 25.0, 22.0, 18.0, 19.0, 23.0, 17.0, 13.0, 12.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -8.977949619293213e-06, -8.657574653625488e-06, -8.337199687957764e-06, -8.016824722290039e-06, -7.696449756622314e-06, -7.37607479095459e-06, -7.055699825286865e-06, -6.735324859619141e-06, -6.414949893951416e-06, -6.094574928283691e-06, -5.774199962615967e-06, -5.453824996948242e-06, -5.133450031280518e-06, -4.813075065612793e-06, -4.492700099945068e-06, -4.172325134277344e-06, -3.851950168609619e-06, -3.5315752029418945e-06, -3.21120023727417e-06, -2.8908252716064453e-06, -2.5704503059387207e-06, -2.250075340270996e-06, -1.9297003746032715e-06, -1.6093254089355469e-06, -1.2889504432678223e-06, -9.685754776000977e-07, -6.48200511932373e-07, -3.2782554626464844e-07, -7.450580596923828e-09, 3.129243850708008e-07, 6.332993507385254e-07, 9.5367431640625e-07, 1.2740492820739746e-06, 1.5944242477416992e-06, 1.914799213409424e-06, 2.2351741790771484e-06, 2.555549144744873e-06, 2.8759241104125977e-06, 3.1962990760803223e-06, 3.516674041748047e-06, 3.8370490074157715e-06, 4.157423973083496e-06, 4.477798938751221e-06, 4.798173904418945e-06, 5.11854887008667e-06, 5.4389238357543945e-06, 5.759298801422119e-06, 6.079673767089844e-06, 6.400048732757568e-06, 6.720423698425293e-06, 7.040798664093018e-06, 7.361173629760742e-06, 7.681548595428467e-06, 8.001923561096191e-06, 8.322298526763916e-06, 8.64267349243164e-06, 8.963048458099365e-06, 9.28342342376709e-06, 9.603798389434814e-06, 9.924173355102539e-06, 1.0244548320770264e-05, 1.0564923286437988e-05, 1.0885298252105713e-05, 1.1205673217773438e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 10.0, 15.0, 33.0, 26.0, 45.0, 79.0, 95.0, 147.0, 187.0, 331.0, 554.0, 788.0, 1247.0, 2113.0, 3588.0, 6208.0, 10415.0, 18253.0, 31186.0, 56630.0, 100991.0, 169169.0, 219709.0, 177462.0, 108321.0, 60437.0, 34049.0, 19150.0, 11045.0, 6387.0, 3707.0, 2269.0, 1410.0, 887.0, 534.0, 371.0, 254.0, 142.0, 105.0, 65.0, 45.0, 22.0, 23.0, 24.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12136077880859375, -0.1171112060546875, -0.11286163330078125, -0.108612060546875, -0.10436248779296875, -0.1001129150390625, -0.09586334228515625, -0.09161376953125, -0.08736419677734375, -0.0831146240234375, -0.07886505126953125, -0.074615478515625, -0.07036590576171875, -0.0661163330078125, -0.06186676025390625, -0.0576171875, -0.05336761474609375, -0.0491180419921875, -0.04486846923828125, -0.040618896484375, -0.03636932373046875, -0.0321197509765625, -0.02787017822265625, -0.02362060546875, -0.01937103271484375, -0.0151214599609375, -0.01087188720703125, -0.006622314453125, -0.00237274169921875, 0.0018768310546875, 0.00612640380859375, 0.0103759765625, 0.01462554931640625, 0.0188751220703125, 0.02312469482421875, 0.027374267578125, 0.03162384033203125, 0.0358734130859375, 0.04012298583984375, 0.04437255859375, 0.04862213134765625, 0.0528717041015625, 0.05712127685546875, 0.061370849609375, 0.06562042236328125, 0.0698699951171875, 0.07411956787109375, 0.078369140625, 0.08261871337890625, 0.0868682861328125, 0.09111785888671875, 0.095367431640625, 0.09961700439453125, 0.1038665771484375, 0.10811614990234375, 0.11236572265625, 0.11661529541015625, 0.1208648681640625, 0.12511444091796875, 0.129364013671875, 0.13361358642578125, 0.1378631591796875, 0.14211273193359375, 0.1463623046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 6.0, 13.0, 4.0, 16.0, 12.0, 15.0, 17.0, 14.0, 14.0, 24.0, 30.0, 33.0, 31.0, 36.0, 45.0, 53.0, 70.0, 78.0, 55.0, 48.0, 44.0, 42.0, 44.0, 35.0, 35.0, 30.0, 31.0, 8.0, 21.0, 16.0, 11.0, 11.0, 5.0, 6.0, 2.0, 8.0, 5.0, 5.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0284576416015625, -0.027442216873168945, -0.02642679214477539, -0.025411367416381836, -0.02439594268798828, -0.023380517959594727, -0.022365093231201172, -0.021349668502807617, -0.020334243774414062, -0.019318819046020508, -0.018303394317626953, -0.0172879695892334, -0.016272544860839844, -0.015257120132446289, -0.014241695404052734, -0.01322627067565918, -0.012210845947265625, -0.01119542121887207, -0.010179996490478516, -0.009164571762084961, -0.008149147033691406, -0.0071337223052978516, -0.006118297576904297, -0.005102872848510742, -0.0040874481201171875, -0.003072023391723633, -0.002056598663330078, -0.0010411739349365234, -2.574920654296875e-05, 0.000989675521850586, 0.0020051002502441406, 0.0030205249786376953, 0.00403594970703125, 0.005051374435424805, 0.006066799163818359, 0.007082223892211914, 0.008097648620605469, 0.009113073348999023, 0.010128498077392578, 0.011143922805786133, 0.012159347534179688, 0.013174772262573242, 0.014190196990966797, 0.015205621719360352, 0.016221046447753906, 0.01723647117614746, 0.018251895904541016, 0.01926732063293457, 0.020282745361328125, 0.02129817008972168, 0.022313594818115234, 0.02332901954650879, 0.024344444274902344, 0.0253598690032959, 0.026375293731689453, 0.027390718460083008, 0.028406143188476562, 0.029421567916870117, 0.030436992645263672, 0.03145241737365723, 0.03246784210205078, 0.033483266830444336, 0.03449869155883789, 0.035514116287231445, 0.036529541015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 15.0, 8.0, 9.0, 23.0, 11.0, 28.0, 19.0, 31.0, 46.0, 32.0, 34.0, 35.0, 60.0, 57.0, 57.0, 56.0, 55.0, 57.0, 46.0, 49.0, 28.0, 33.0, 34.0, 23.0, 26.0, 28.0, 16.0, 17.0, 11.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.437822937965393, -1.3920657634735107, -1.3463085889816284, -1.300551414489746, -1.2547943592071533, -1.209037184715271, -1.1632800102233887, -1.1175228357315063, -1.071765661239624, -1.0260084867477417, -0.9802513718605042, -0.9344941973686218, -0.8887370824813843, -0.842979907989502, -0.7972227334976196, -0.7514655590057373, -0.7057085037231445, -0.6599513292312622, -0.6141942143440247, -0.5684370398521423, -0.5226799249649048, -0.47692275047302246, -0.43116557598114014, -0.3854084312915802, -0.33965128660202026, -0.2938941419124603, -0.2481369823217392, -0.20237982273101807, -0.15662267804145813, -0.1108655333518982, -0.06510835886001587, -0.019351214170455933, 0.026405811309814453, 0.07216296344995499, 0.11792011559009552, 0.16367727518081665, 0.2094344198703766, 0.2551915645599365, 0.30094873905181885, 0.3467058837413788, 0.3924630284309387, 0.43822017312049866, 0.4839773178100586, 0.5297344923019409, 0.5754916667938232, 0.6212487816810608, 0.6670059561729431, 0.7127630710601807, 0.758520245552063, 0.8042774200439453, 0.8500345349311829, 0.8957917094230652, 0.9415488243103027, 0.9873059988021851, 1.0330631732940674, 1.0788203477859497, 1.124577522277832, 1.1703346967697144, 1.2160918712615967, 1.2618489265441895, 1.3076061010360718, 1.353363275527954, 1.3991204500198364, 1.4448776245117188, 1.4906346797943115]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 3.0, 8.0, 13.0, 13.0, 14.0, 16.0, 22.0, 29.0, 23.0, 38.0, 32.0, 24.0, 34.0, 47.0, 47.0, 46.0, 38.0, 39.0, 40.0, 38.0, 26.0, 45.0, 36.0, 36.0, 41.0, 28.0, 27.0, 22.0, 21.0, 28.0, 21.0, 19.0, 9.0, 13.0, 12.0, 5.0, 12.0, 11.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9932097792625427, -0.960573136806488, -0.9279365539550781, -0.8952999114990234, -0.8626633286476135, -0.8300266861915588, -0.7973901033401489, -0.7647534608840942, -0.7321168184280396, -0.6994801759719849, -0.666843593120575, -0.6342069506645203, -0.6015703678131104, -0.5689337253570557, -0.536297082901001, -0.5036605000495911, -0.47102391719818115, -0.43838730454444885, -0.40575069189071655, -0.37311404943466187, -0.34047746658325195, -0.30784082412719727, -0.27520421147346497, -0.24256759881973267, -0.20993098616600037, -0.17729437351226807, -0.14465776085853577, -0.11202113330364227, -0.07938452064990997, -0.04674790799617767, -0.01411128044128418, 0.01852533221244812, 0.051161885261535645, 0.08379849791526794, 0.11643511801958084, 0.14907173812389374, 0.18170835077762604, 0.21434496343135834, 0.24698159098625183, 0.27961820363998413, 0.31225481629371643, 0.34489142894744873, 0.37752804160118103, 0.41016465425491333, 0.442801296710968, 0.47543787956237793, 0.5080745220184326, 0.5407111644744873, 0.5733477473258972, 0.6059843897819519, 0.6386209726333618, 0.6712576150894165, 0.7038941979408264, 0.7365308403968811, 0.769167423248291, 0.8018040657043457, 0.8344407081604004, 0.8670773506164551, 0.899713933467865, 0.9323505759239197, 0.9649871587753296, 0.9976238012313843, 1.030260443687439, 1.062896966934204, 1.0955336093902588]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 15.0, 25.0, 37.0, 39.0, 78.0, 130.0, 287.0, 484.0, 746.0, 1330.0, 2261.0, 3887.0, 6577.0, 11004.0, 18470.0, 30062.0, 46316.0, 69047.0, 95066.0, 118543.0, 132622.0, 130941.0, 114651.0, 89790.0, 64373.0, 42822.0, 27180.0, 17338.0, 9994.0, 6031.0, 3485.0, 2028.0, 1248.0, 667.0, 382.0, 222.0, 145.0, 84.0, 57.0, 37.0, 17.0, 11.0, 9.0, 4.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0747604370117188, -1.0420989990234375, -1.0094375610351562, -0.976776123046875, -0.9441146850585938, -0.9114532470703125, -0.8787918090820312, -0.84613037109375, -0.8134689331054688, -0.7808074951171875, -0.7481460571289062, -0.715484619140625, -0.6828231811523438, -0.6501617431640625, -0.6175003051757812, -0.5848388671875, -0.5521774291992188, -0.5195159912109375, -0.48685455322265625, -0.454193115234375, -0.42153167724609375, -0.3888702392578125, -0.35620880126953125, -0.32354736328125, -0.29088592529296875, -0.2582244873046875, -0.22556304931640625, -0.192901611328125, -0.16024017333984375, -0.1275787353515625, -0.09491729736328125, -0.062255859375, -0.02959442138671875, 0.0030670166015625, 0.03572845458984375, 0.068389892578125, 0.10105133056640625, 0.1337127685546875, 0.16637420654296875, 0.19903564453125, 0.23169708251953125, 0.2643585205078125, 0.29701995849609375, 0.329681396484375, 0.36234283447265625, 0.3950042724609375, 0.42766571044921875, 0.4603271484375, 0.49298858642578125, 0.5256500244140625, 0.5583114624023438, 0.590972900390625, 0.6236343383789062, 0.6562957763671875, 0.6889572143554688, 0.72161865234375, 0.7542800903320312, 0.7869415283203125, 0.8196029663085938, 0.852264404296875, 0.8849258422851562, 0.9175872802734375, 0.9502487182617188, 0.98291015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 7.0, 11.0, 12.0, 12.0, 32.0, 19.0, 39.0, 37.0, 38.0, 31.0, 39.0, 42.0, 59.0, 56.0, 54.0, 39.0, 58.0, 41.0, 41.0, 33.0, 47.0, 28.0, 29.0, 27.0, 28.0, 25.0, 15.0, 17.0, 14.0, 19.0, 6.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.11480712890625, -1.0753173828125, -1.03582763671875, -0.996337890625, -0.95684814453125, -0.9173583984375, -0.87786865234375, -0.83837890625, -0.79888916015625, -0.7593994140625, -0.71990966796875, -0.680419921875, -0.64093017578125, -0.6014404296875, -0.56195068359375, -0.5224609375, -0.48297119140625, -0.4434814453125, -0.40399169921875, -0.364501953125, -0.32501220703125, -0.2855224609375, -0.24603271484375, -0.20654296875, -0.16705322265625, -0.1275634765625, -0.08807373046875, -0.048583984375, -0.00909423828125, 0.0303955078125, 0.06988525390625, 0.109375, 0.14886474609375, 0.1883544921875, 0.22784423828125, 0.267333984375, 0.30682373046875, 0.3463134765625, 0.38580322265625, 0.42529296875, 0.46478271484375, 0.5042724609375, 0.54376220703125, 0.583251953125, 0.62274169921875, 0.6622314453125, 0.70172119140625, 0.7412109375, 0.78070068359375, 0.8201904296875, 0.85968017578125, 0.899169921875, 0.93865966796875, 0.9781494140625, 1.01763916015625, 1.05712890625, 1.09661865234375, 1.1361083984375, 1.17559814453125, 1.215087890625, 1.25457763671875, 1.2940673828125, 1.33355712890625, 1.373046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 15.0, 15.0, 25.0, 46.0, 61.0, 101.0, 151.0, 245.0, 404.0, 648.0, 984.0, 1589.0, 2513.0, 3897.0, 6072.0, 9312.0, 14391.0, 21976.0, 31910.0, 45404.0, 61562.0, 79713.0, 96118.0, 107680.0, 111343.0, 105211.0, 91511.0, 74286.0, 56345.0, 41036.0, 28749.0, 19406.0, 12786.0, 8361.0, 5350.0, 3397.0, 2147.0, 1382.0, 871.0, 543.0, 364.0, 248.0, 153.0, 76.0, 62.0, 38.0, 17.0, 13.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.847564697265625, -0.81964111328125, -0.791717529296875, -0.7637939453125, -0.735870361328125, -0.70794677734375, -0.680023193359375, -0.652099609375, -0.624176025390625, -0.59625244140625, -0.568328857421875, -0.5404052734375, -0.512481689453125, -0.48455810546875, -0.456634521484375, -0.4287109375, -0.400787353515625, -0.37286376953125, -0.344940185546875, -0.3170166015625, -0.289093017578125, -0.26116943359375, -0.233245849609375, -0.205322265625, -0.177398681640625, -0.14947509765625, -0.121551513671875, -0.0936279296875, -0.065704345703125, -0.03778076171875, -0.009857177734375, 0.01806640625, 0.045989990234375, 0.07391357421875, 0.101837158203125, 0.1297607421875, 0.157684326171875, 0.18560791015625, 0.213531494140625, 0.241455078125, 0.269378662109375, 0.29730224609375, 0.325225830078125, 0.3531494140625, 0.381072998046875, 0.40899658203125, 0.436920166015625, 0.46484375, 0.492767333984375, 0.52069091796875, 0.548614501953125, 0.5765380859375, 0.604461669921875, 0.63238525390625, 0.660308837890625, 0.688232421875, 0.716156005859375, 0.74407958984375, 0.772003173828125, 0.7999267578125, 0.827850341796875, 0.85577392578125, 0.883697509765625, 0.91162109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 12.0, 16.0, 20.0, 13.0, 32.0, 40.0, 31.0, 24.0, 45.0, 52.0, 52.0, 51.0, 56.0, 42.0, 44.0, 47.0, 48.0, 56.0, 41.0, 33.0, 50.0, 33.0, 26.0, 29.0, 24.0, 13.0, 11.0, 11.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6833038330078125, -0.657623291015625, -0.6319427490234375, -0.60626220703125, -0.5805816650390625, -0.554901123046875, -0.5292205810546875, -0.5035400390625, -0.4778594970703125, -0.452178955078125, -0.4264984130859375, -0.40081787109375, -0.3751373291015625, -0.349456787109375, -0.3237762451171875, -0.298095703125, -0.2724151611328125, -0.246734619140625, -0.2210540771484375, -0.19537353515625, -0.1696929931640625, -0.144012451171875, -0.1183319091796875, -0.0926513671875, -0.0669708251953125, -0.041290283203125, -0.0156097412109375, 0.01007080078125, 0.0357513427734375, 0.061431884765625, 0.0871124267578125, 0.11279296875, 0.1384735107421875, 0.164154052734375, 0.1898345947265625, 0.21551513671875, 0.2411956787109375, 0.266876220703125, 0.2925567626953125, 0.3182373046875, 0.3439178466796875, 0.369598388671875, 0.3952789306640625, 0.42095947265625, 0.4466400146484375, 0.472320556640625, 0.4980010986328125, 0.523681640625, 0.5493621826171875, 0.575042724609375, 0.6007232666015625, 0.62640380859375, 0.6520843505859375, 0.677764892578125, 0.7034454345703125, 0.7291259765625, 0.7548065185546875, 0.780487060546875, 0.8061676025390625, 0.83184814453125, 0.8575286865234375, 0.883209228515625, 0.9088897705078125, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 4.0, 9.0, 19.0, 29.0, 30.0, 37.0, 56.0, 82.0, 124.0, 215.0, 246.0, 403.0, 587.0, 869.0, 1309.0, 1976.0, 3057.0, 4616.0, 7145.0, 11384.0, 17593.0, 27230.0, 42210.0, 62524.0, 88929.0, 116502.0, 134577.0, 136402.0, 116924.0, 89630.0, 63299.0, 42319.0, 27685.0, 17843.0, 11367.0, 7256.0, 4924.0, 3130.0, 1965.0, 1289.0, 882.0, 565.0, 374.0, 276.0, 205.0, 132.0, 97.0, 66.0, 48.0, 39.0, 23.0, 21.0, 8.0, 11.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.46142578125, -0.44605255126953125, -0.4306793212890625, -0.41530609130859375, -0.399932861328125, -0.38455963134765625, -0.3691864013671875, -0.35381317138671875, -0.33843994140625, -0.32306671142578125, -0.3076934814453125, -0.29232025146484375, -0.276947021484375, -0.26157379150390625, -0.2462005615234375, -0.23082733154296875, -0.2154541015625, -0.20008087158203125, -0.1847076416015625, -0.16933441162109375, -0.153961181640625, -0.13858795166015625, -0.1232147216796875, -0.10784149169921875, -0.09246826171875, -0.07709503173828125, -0.0617218017578125, -0.04634857177734375, -0.030975341796875, -0.01560211181640625, -0.0002288818359375, 0.01514434814453125, 0.030517578125, 0.04589080810546875, 0.0612640380859375, 0.07663726806640625, 0.092010498046875, 0.10738372802734375, 0.1227569580078125, 0.13813018798828125, 0.15350341796875, 0.16887664794921875, 0.1842498779296875, 0.19962310791015625, 0.214996337890625, 0.23036956787109375, 0.2457427978515625, 0.26111602783203125, 0.2764892578125, 0.29186248779296875, 0.3072357177734375, 0.32260894775390625, 0.337982177734375, 0.35335540771484375, 0.3687286376953125, 0.38410186767578125, 0.39947509765625, 0.41484832763671875, 0.4302215576171875, 0.44559478759765625, 0.460968017578125, 0.47634124755859375, 0.4917144775390625, 0.5070877075195312, 0.5224609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 16.0, 22.0, 25.0, 28.0, 40.0, 35.0, 52.0, 48.0, 61.0, 59.0, 68.0, 65.0, 69.0, 50.0, 56.0, 50.0, 29.0, 46.0, 27.0, 16.0, 21.0, 16.0, 16.0, 13.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.340576171875e-05, -5.150400102138519e-05, -4.9602240324020386e-05, -4.770047962665558e-05, -4.579871892929077e-05, -4.3896958231925964e-05, -4.199519753456116e-05, -4.009343683719635e-05, -3.819167613983154e-05, -3.6289915442466736e-05, -3.438815474510193e-05, -3.248639404773712e-05, -3.0584633350372314e-05, -2.8682872653007507e-05, -2.67811119556427e-05, -2.4879351258277893e-05, -2.2977590560913086e-05, -2.107582986354828e-05, -1.917406916618347e-05, -1.7272308468818665e-05, -1.5370547771453857e-05, -1.346878707408905e-05, -1.1567026376724243e-05, -9.665265679359436e-06, -7.763504981994629e-06, -5.861744284629822e-06, -3.959983587265015e-06, -2.0582228899002075e-06, -1.564621925354004e-07, 1.7452985048294067e-06, 3.647059202194214e-06, 5.548819899559021e-06, 7.450580596923828e-06, 9.352341294288635e-06, 1.1254101991653442e-05, 1.315586268901825e-05, 1.5057623386383057e-05, 1.6959384083747864e-05, 1.886114478111267e-05, 2.0762905478477478e-05, 2.2664666175842285e-05, 2.4566426873207092e-05, 2.64681875705719e-05, 2.8369948267936707e-05, 3.0271708965301514e-05, 3.217346966266632e-05, 3.407523036003113e-05, 3.5976991057395935e-05, 3.787875175476074e-05, 3.978051245212555e-05, 4.1682273149490356e-05, 4.3584033846855164e-05, 4.548579454421997e-05, 4.738755524158478e-05, 4.9289315938949585e-05, 5.119107663631439e-05, 5.30928373336792e-05, 5.4994598031044006e-05, 5.6896358728408813e-05, 5.879811942577362e-05, 6.069988012313843e-05, 6.260164082050323e-05, 6.450340151786804e-05, 6.640516221523285e-05, 6.830692291259766e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 12.0, 8.0, 18.0, 28.0, 35.0, 41.0, 74.0, 106.0, 182.0, 280.0, 517.0, 771.0, 1402.0, 2447.0, 4601.0, 8304.0, 15893.0, 30309.0, 56366.0, 98206.0, 150535.0, 190416.0, 179239.0, 131875.0, 80131.0, 45044.0, 24030.0, 12518.0, 6665.0, 3629.0, 2037.0, 1047.0, 704.0, 403.0, 240.0, 147.0, 87.0, 85.0, 35.0, 31.0, 17.0, 20.0, 6.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5778579711914062, -0.5570831298828125, -0.5363082885742188, -0.515533447265625, -0.49475860595703125, -0.4739837646484375, -0.45320892333984375, -0.43243408203125, -0.41165924072265625, -0.3908843994140625, -0.37010955810546875, -0.349334716796875, -0.32855987548828125, -0.3077850341796875, -0.28701019287109375, -0.2662353515625, -0.24546051025390625, -0.2246856689453125, -0.20391082763671875, -0.183135986328125, -0.16236114501953125, -0.1415863037109375, -0.12081146240234375, -0.10003662109375, -0.07926177978515625, -0.0584869384765625, -0.03771209716796875, -0.016937255859375, 0.00383758544921875, 0.0246124267578125, 0.04538726806640625, 0.066162109375, 0.08693695068359375, 0.1077117919921875, 0.12848663330078125, 0.149261474609375, 0.17003631591796875, 0.1908111572265625, 0.21158599853515625, 0.23236083984375, 0.25313568115234375, 0.2739105224609375, 0.29468536376953125, 0.315460205078125, 0.33623504638671875, 0.3570098876953125, 0.37778472900390625, 0.3985595703125, 0.41933441162109375, 0.4401092529296875, 0.46088409423828125, 0.481658935546875, 0.5024337768554688, 0.5232086181640625, 0.5439834594726562, 0.56475830078125, 0.5855331420898438, 0.6063079833984375, 0.6270828247070312, 0.647857666015625, 0.6686325073242188, 0.6894073486328125, 0.7101821899414062, 0.73095703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 15.0, 8.0, 13.0, 12.0, 20.0, 18.0, 25.0, 31.0, 37.0, 31.0, 28.0, 35.0, 34.0, 39.0, 44.0, 48.0, 59.0, 45.0, 46.0, 36.0, 47.0, 43.0, 39.0, 35.0, 25.0, 24.0, 28.0, 15.0, 16.0, 15.0, 14.0, 7.0, 13.0, 11.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.154296875, -0.14919281005859375, -0.1440887451171875, -0.13898468017578125, -0.133880615234375, -0.12877655029296875, -0.1236724853515625, -0.11856842041015625, -0.11346435546875, -0.10836029052734375, -0.1032562255859375, -0.09815216064453125, -0.093048095703125, -0.08794403076171875, -0.0828399658203125, -0.07773590087890625, -0.0726318359375, -0.06752777099609375, -0.0624237060546875, -0.05731964111328125, -0.052215576171875, -0.04711151123046875, -0.0420074462890625, -0.03690338134765625, -0.03179931640625, -0.02669525146484375, -0.0215911865234375, -0.01648712158203125, -0.011383056640625, -0.00627899169921875, -0.0011749267578125, 0.00392913818359375, 0.009033203125, 0.01413726806640625, 0.0192413330078125, 0.02434539794921875, 0.029449462890625, 0.03455352783203125, 0.0396575927734375, 0.04476165771484375, 0.04986572265625, 0.05496978759765625, 0.0600738525390625, 0.06517791748046875, 0.070281982421875, 0.07538604736328125, 0.0804901123046875, 0.08559417724609375, 0.0906982421875, 0.09580230712890625, 0.1009063720703125, 0.10601043701171875, 0.111114501953125, 0.11621856689453125, 0.1213226318359375, 0.12642669677734375, 0.13153076171875, 0.13663482666015625, 0.1417388916015625, 0.14684295654296875, 0.151947021484375, 0.15705108642578125, 0.1621551513671875, 0.16725921630859375, 0.17236328125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 16.0, 6.0, 15.0, 20.0, 18.0, 33.0, 39.0, 30.0, 43.0, 39.0, 54.0, 55.0, 60.0, 48.0, 60.0, 65.0, 46.0, 48.0, 45.0, 50.0, 34.0, 18.0, 22.0, 22.0, 19.0, 14.0, 14.0, 21.0, 7.0, 4.0, 6.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.6769119501113892, -1.6277453899383545, -1.5785787105560303, -1.5294121503829956, -1.4802454710006714, -1.4310789108276367, -1.3819122314453125, -1.3327456712722778, -1.2835791110992432, -1.2344125509262085, -1.1852458715438843, -1.1360793113708496, -1.0869126319885254, -1.0377460718154907, -0.9885794520378113, -0.9394128322601318, -0.8902461528778076, -0.8410795331001282, -0.7919129133224487, -0.7427463531494141, -0.6935796737670898, -0.6444131135940552, -0.5952464938163757, -0.5460798740386963, -0.49691325426101685, -0.4477466344833374, -0.39858001470565796, -0.3494134247303009, -0.30024680495262146, -0.251080185174942, -0.20191359519958496, -0.15274697542190552, -0.10358047485351562, -0.05441386252641678, -0.005247250199317932, 0.04391935467720032, 0.09308597445487976, 0.1422525942325592, 0.19141918420791626, 0.2405858039855957, 0.28975242376327515, 0.3389190435409546, 0.38808566331863403, 0.4372522532939911, 0.48641887307167053, 0.5355855226516724, 0.584752082824707, 0.6339187026023865, 0.6830853223800659, 0.7322519421577454, 0.7814185619354248, 0.8305851221084595, 0.8797518014907837, 0.9289183616638184, 0.9780849814414978, 1.0272516012191772, 1.076418161392212, 1.1255847215652466, 1.1747514009475708, 1.2239179611206055, 1.2730846405029297, 1.3222512006759644, 1.371417760848999, 1.4205844402313232, 1.4697511196136475]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 9.0, 22.0, 16.0, 26.0, 21.0, 23.0, 30.0, 30.0, 41.0, 38.0, 37.0, 39.0, 51.0, 48.0, 35.0, 56.0, 37.0, 38.0, 33.0, 31.0, 28.0, 35.0, 27.0, 34.0, 31.0, 28.0, 27.0, 19.0, 11.0, 7.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.144634485244751, -1.109297513961792, -1.073960542678833, -1.0386236906051636, -1.0032867193222046, -0.9679497480392456, -0.9326127767562866, -0.8972758054733276, -0.8619388937950134, -0.8266019225120544, -0.7912650108337402, -0.7559280395507812, -0.7205910682678223, -0.6852541565895081, -0.6499171853065491, -0.6145802736282349, -0.5792433023452759, -0.5439063310623169, -0.5085694193840027, -0.4732324481010437, -0.4378955066204071, -0.4025585651397705, -0.3672215938568115, -0.3318846523761749, -0.29654771089553833, -0.26121076941490173, -0.22587381303310394, -0.19053685665130615, -0.15519991517066956, -0.11986297369003296, -0.08452601730823517, -0.04918906092643738, -0.013852119445800781, 0.021484829485416412, 0.056821778416633606, 0.0921587273478508, 0.127495676279068, 0.1628326177597046, 0.19816957414150238, 0.23350653052330017, 0.26884347200393677, 0.30418041348457336, 0.33951735496520996, 0.37485432624816895, 0.41019126772880554, 0.44552820920944214, 0.4808651804924011, 0.5162020921707153, 0.5515390634536743, 0.5868760347366333, 0.6222129464149475, 0.6575499176979065, 0.6928868293762207, 0.7282238006591797, 0.7635607719421387, 0.7988977432250977, 0.8342346549034119, 0.8695716261863708, 0.9049085378646851, 0.940245509147644, 0.975582480430603, 1.0109193325042725, 1.0462563037872314, 1.0815932750701904, 1.1169302463531494]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 13.0, 11.0, 15.0, 41.0, 46.0, 109.0, 174.0, 333.0, 568.0, 1207.0, 2272.0, 4708.0, 9716.0, 20627.0, 44025.0, 95672.0, 203285.0, 409970.0, 706146.0, 909909.0, 798348.0, 501046.0, 258374.0, 121932.0, 55986.0, 25905.0, 12256.0, 5804.0, 2836.0, 1409.0, 723.0, 384.0, 184.0, 94.0, 64.0, 39.0, 19.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.755859375, -1.7052001953125, -1.654541015625, -1.6038818359375, -1.55322265625, -1.5025634765625, -1.451904296875, -1.4012451171875, -1.3505859375, -1.2999267578125, -1.249267578125, -1.1986083984375, -1.14794921875, -1.0972900390625, -1.046630859375, -0.9959716796875, -0.9453125, -0.8946533203125, -0.843994140625, -0.7933349609375, -0.74267578125, -0.6920166015625, -0.641357421875, -0.5906982421875, -0.5400390625, -0.4893798828125, -0.438720703125, -0.3880615234375, -0.33740234375, -0.2867431640625, -0.236083984375, -0.1854248046875, -0.134765625, -0.0841064453125, -0.033447265625, 0.0172119140625, 0.06787109375, 0.1185302734375, 0.169189453125, 0.2198486328125, 0.2705078125, 0.3211669921875, 0.371826171875, 0.4224853515625, 0.47314453125, 0.5238037109375, 0.574462890625, 0.6251220703125, 0.67578125, 0.7264404296875, 0.777099609375, 0.8277587890625, 0.87841796875, 0.9290771484375, 0.979736328125, 1.0303955078125, 1.0810546875, 1.1317138671875, 1.182373046875, 1.2330322265625, 1.28369140625, 1.3343505859375, 1.385009765625, 1.4356689453125, 1.486328125]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 13.0, 9.0, 12.0, 10.0, 19.0, 31.0, 30.0, 29.0, 26.0, 49.0, 33.0, 41.0, 45.0, 49.0, 38.0, 35.0, 40.0, 45.0, 37.0, 43.0, 29.0, 45.0, 33.0, 27.0, 30.0, 25.0, 16.0, 29.0, 25.0, 18.0, 17.0, 10.0, 7.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.787078857421875, -0.76019287109375, -0.733306884765625, -0.7064208984375, -0.679534912109375, -0.65264892578125, -0.625762939453125, -0.598876953125, -0.571990966796875, -0.54510498046875, -0.518218994140625, -0.4913330078125, -0.464447021484375, -0.43756103515625, -0.410675048828125, -0.3837890625, -0.356903076171875, -0.33001708984375, -0.303131103515625, -0.2762451171875, -0.249359130859375, -0.22247314453125, -0.195587158203125, -0.168701171875, -0.141815185546875, -0.11492919921875, -0.088043212890625, -0.0611572265625, -0.034271240234375, -0.00738525390625, 0.019500732421875, 0.04638671875, 0.073272705078125, 0.10015869140625, 0.127044677734375, 0.1539306640625, 0.180816650390625, 0.20770263671875, 0.234588623046875, 0.261474609375, 0.288360595703125, 0.31524658203125, 0.342132568359375, 0.3690185546875, 0.395904541015625, 0.42279052734375, 0.449676513671875, 0.4765625, 0.503448486328125, 0.53033447265625, 0.557220458984375, 0.5841064453125, 0.610992431640625, 0.63787841796875, 0.664764404296875, 0.691650390625, 0.718536376953125, 0.74542236328125, 0.772308349609375, 0.7991943359375, 0.826080322265625, 0.85296630859375, 0.879852294921875, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 13.0, 15.0, 24.0, 32.0, 52.0, 98.0, 134.0, 218.0, 400.0, 645.0, 1104.0, 1712.0, 2976.0, 4915.0, 8323.0, 14300.0, 23989.0, 40635.0, 68420.0, 112730.0, 179049.0, 273481.0, 385726.0, 496175.0, 562167.0, 549921.0, 468452.0, 354587.0, 243655.0, 158411.0, 97473.0, 59054.0, 34842.0, 20728.0, 12034.0, 7288.0, 4193.0, 2548.0, 1474.0, 897.0, 544.0, 323.0, 208.0, 126.0, 71.0, 49.0, 17.0, 19.0, 16.0, 3.0, 3.0, 2.0, 5.0], "bins": [-1.2412109375, -1.2065963745117188, -1.1719818115234375, -1.1373672485351562, -1.102752685546875, -1.0681381225585938, -1.0335235595703125, -0.9989089965820312, -0.96429443359375, -0.9296798706054688, -0.8950653076171875, -0.8604507446289062, -0.825836181640625, -0.7912216186523438, -0.7566070556640625, -0.7219924926757812, -0.6873779296875, -0.6527633666992188, -0.6181488037109375, -0.5835342407226562, -0.548919677734375, -0.5143051147460938, -0.4796905517578125, -0.44507598876953125, -0.41046142578125, -0.37584686279296875, -0.3412322998046875, -0.30661773681640625, -0.272003173828125, -0.23738861083984375, -0.2027740478515625, -0.16815948486328125, -0.133544921875, -0.09893035888671875, -0.0643157958984375, -0.02970123291015625, 0.004913330078125, 0.03952789306640625, 0.0741424560546875, 0.10875701904296875, 0.14337158203125, 0.17798614501953125, 0.2126007080078125, 0.24721527099609375, 0.281829833984375, 0.31644439697265625, 0.3510589599609375, 0.38567352294921875, 0.4202880859375, 0.45490264892578125, 0.4895172119140625, 0.5241317749023438, 0.558746337890625, 0.5933609008789062, 0.6279754638671875, 0.6625900268554688, 0.69720458984375, 0.7318191528320312, 0.7664337158203125, 0.8010482788085938, 0.835662841796875, 0.8702774047851562, 0.9048919677734375, 0.9395065307617188, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 13.0, 10.0, 15.0, 11.0, 25.0, 26.0, 24.0, 32.0, 44.0, 62.0, 72.0, 77.0, 112.0, 123.0, 109.0, 142.0, 148.0, 164.0, 194.0, 216.0, 214.0, 193.0, 221.0, 194.0, 202.0, 178.0, 155.0, 176.0, 144.0, 127.0, 103.0, 82.0, 92.0, 73.0, 59.0, 41.0, 50.0, 29.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 2.0], "bins": [-0.425048828125, -0.4124870300292969, -0.39992523193359375, -0.3873634338378906, -0.3748016357421875, -0.3622398376464844, -0.34967803955078125, -0.3371162414550781, -0.324554443359375, -0.3119926452636719, -0.29943084716796875, -0.2868690490722656, -0.2743072509765625, -0.2617454528808594, -0.24918365478515625, -0.23662185668945312, -0.22406005859375, -0.21149826049804688, -0.19893646240234375, -0.18637466430664062, -0.1738128662109375, -0.16125106811523438, -0.14868927001953125, -0.13612747192382812, -0.123565673828125, -0.11100387573242188, -0.09844207763671875, -0.08588027954101562, -0.0733184814453125, -0.060756683349609375, -0.04819488525390625, -0.035633087158203125, -0.0230712890625, -0.010509490966796875, 0.00205230712890625, 0.014614105224609375, 0.0271759033203125, 0.039737701416015625, 0.05229949951171875, 0.06486129760742188, 0.077423095703125, 0.08998489379882812, 0.10254669189453125, 0.11510848999023438, 0.1276702880859375, 0.14023208618164062, 0.15279388427734375, 0.16535568237304688, 0.17791748046875, 0.19047927856445312, 0.20304107666015625, 0.21560287475585938, 0.2281646728515625, 0.24072647094726562, 0.25328826904296875, 0.2658500671386719, 0.278411865234375, 0.2909736633300781, 0.30353546142578125, 0.3160972595214844, 0.3286590576171875, 0.3412208557128906, 0.35378265380859375, 0.3663444519042969, 0.37890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 14.0, 20.0, 21.0, 23.0, 32.0, 42.0, 41.0, 47.0, 55.0, 63.0, 73.0, 64.0, 59.0, 70.0, 55.0, 55.0, 47.0, 50.0, 23.0, 22.0, 22.0, 17.0, 15.0, 12.0, 9.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7150763273239136, -1.6594101190567017, -1.6037440299987793, -1.5480778217315674, -1.4924116134643555, -1.4367454051971436, -1.3810791969299316, -1.3254131078720093, -1.2697468996047974, -1.2140806913375854, -1.158414602279663, -1.1027483940124512, -1.0470821857452393, -0.9914159774780273, -0.9357498288154602, -0.8800836801528931, -0.8244174718856812, -0.7687512636184692, -0.7130851149559021, -0.657418966293335, -0.601752758026123, -0.5460865497589111, -0.490420401096344, -0.43475422263145447, -0.37908804416656494, -0.3234218657016754, -0.2677556872367859, -0.21208950877189636, -0.15642333030700684, -0.10075715184211731, -0.04509097337722778, 0.010575205087661743, 0.06624150276184082, 0.12190768122673035, 0.17757385969161987, 0.2332400381565094, 0.2889062166213989, 0.34457239508628845, 0.400238573551178, 0.4559047520160675, 0.511570930480957, 0.567237138748169, 0.6229032874107361, 0.6785694360733032, 0.7342356443405151, 0.789901852607727, 0.8455680012702942, 0.9012341499328613, 0.9569003582000732, 1.0125665664672852, 1.068232774734497, 1.1238988637924194, 1.1795650720596313, 1.2352312803268433, 1.2908973693847656, 1.3465635776519775, 1.4022297859191895, 1.4578959941864014, 1.5135622024536133, 1.5692282915115356, 1.6248944997787476, 1.6805607080459595, 1.7362267971038818, 1.7918930053710938, 1.8475592136383057]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 12.0, 9.0, 17.0, 12.0, 14.0, 25.0, 23.0, 24.0, 23.0, 38.0, 36.0, 38.0, 33.0, 33.0, 38.0, 52.0, 30.0, 51.0, 30.0, 50.0, 43.0, 42.0, 31.0, 35.0, 34.0, 33.0, 28.0, 11.0, 27.0, 16.0, 11.0, 14.0, 10.0, 5.0, 9.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0477453470230103, -1.0165857076644897, -0.9854260087013245, -0.9542663097381592, -0.9231066703796387, -0.8919470310211182, -0.8607873320579529, -0.8296276330947876, -0.7984679937362671, -0.7673083543777466, -0.7361486554145813, -0.704988956451416, -0.6738293170928955, -0.642669677734375, -0.6115099787712097, -0.5803502798080444, -0.5491906404495239, -0.5180310010910034, -0.48687130212783813, -0.45571163296699524, -0.42455196380615234, -0.39339229464530945, -0.36223262548446655, -0.33107295632362366, -0.29991328716278076, -0.26875361800193787, -0.23759394884109497, -0.20643427968025208, -0.17527461051940918, -0.14411494135856628, -0.11295527219772339, -0.0817956030368805, -0.0506359338760376, -0.019476264715194702, 0.011683404445648193, 0.04284307360649109, 0.07400274276733398, 0.10516241192817688, 0.13632208108901978, 0.16748175024986267, 0.19864141941070557, 0.22980108857154846, 0.26096075773239136, 0.29212042689323425, 0.32328009605407715, 0.35443976521492004, 0.38559943437576294, 0.41675910353660583, 0.44791877269744873, 0.4790784418582916, 0.5102381110191345, 0.5413978099822998, 0.5725574493408203, 0.6037170886993408, 0.6348767876625061, 0.6660364866256714, 0.6971961259841919, 0.7283557653427124, 0.7595154643058777, 0.790675163269043, 0.8218348026275635, 0.852994441986084, 0.8841541409492493, 0.9153138399124146, 0.9464734792709351]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 7.0, 8.0, 17.0, 33.0, 33.0, 74.0, 89.0, 155.0, 243.0, 405.0, 644.0, 1115.0, 1781.0, 2826.0, 4627.0, 7473.0, 12351.0, 20138.0, 33082.0, 53694.0, 83657.0, 124547.0, 163936.0, 168373.0, 130924.0, 89435.0, 57114.0, 35471.0, 22043.0, 13466.0, 8199.0, 4824.0, 2978.0, 1825.0, 1112.0, 689.0, 447.0, 265.0, 164.0, 106.0, 72.0, 49.0, 38.0, 14.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21484375, -0.20660400390625, -0.1983642578125, -0.19012451171875, -0.181884765625, -0.17364501953125, -0.1654052734375, -0.15716552734375, -0.14892578125, -0.14068603515625, -0.1324462890625, -0.12420654296875, -0.115966796875, -0.10772705078125, -0.0994873046875, -0.09124755859375, -0.0830078125, -0.07476806640625, -0.0665283203125, -0.05828857421875, -0.050048828125, -0.04180908203125, -0.0335693359375, -0.02532958984375, -0.01708984375, -0.00885009765625, -0.0006103515625, 0.00762939453125, 0.015869140625, 0.02410888671875, 0.0323486328125, 0.04058837890625, 0.048828125, 0.05706787109375, 0.0653076171875, 0.07354736328125, 0.081787109375, 0.09002685546875, 0.0982666015625, 0.10650634765625, 0.11474609375, 0.12298583984375, 0.1312255859375, 0.13946533203125, 0.147705078125, 0.15594482421875, 0.1641845703125, 0.17242431640625, 0.1806640625, 0.18890380859375, 0.1971435546875, 0.20538330078125, 0.213623046875, 0.22186279296875, 0.2301025390625, 0.23834228515625, 0.24658203125, 0.25482177734375, 0.2630615234375, 0.27130126953125, 0.279541015625, 0.28778076171875, 0.2960205078125, 0.30426025390625, 0.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 5.0, 7.0, 16.0, 18.0, 14.0, 16.0, 22.0, 27.0, 31.0, 33.0, 41.0, 35.0, 36.0, 30.0, 44.0, 47.0, 42.0, 51.0, 44.0, 45.0, 31.0, 40.0, 37.0, 31.0, 27.0, 35.0, 14.0, 32.0, 27.0, 26.0, 8.0, 12.0, 15.0, 8.0, 5.0, 6.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.09375, -1.0586395263671875, -1.023529052734375, -0.9884185791015625, -0.95330810546875, -0.9181976318359375, -0.883087158203125, -0.8479766845703125, -0.8128662109375, -0.7777557373046875, -0.742645263671875, -0.7075347900390625, -0.67242431640625, -0.6373138427734375, -0.602203369140625, -0.5670928955078125, -0.531982421875, -0.4968719482421875, -0.461761474609375, -0.4266510009765625, -0.39154052734375, -0.3564300537109375, -0.321319580078125, -0.2862091064453125, -0.2510986328125, -0.2159881591796875, -0.180877685546875, -0.1457672119140625, -0.11065673828125, -0.0755462646484375, -0.040435791015625, -0.0053253173828125, 0.02978515625, 0.0648956298828125, 0.100006103515625, 0.1351165771484375, 0.17022705078125, 0.2053375244140625, 0.240447998046875, 0.2755584716796875, 0.3106689453125, 0.3457794189453125, 0.380889892578125, 0.4160003662109375, 0.45111083984375, 0.4862213134765625, 0.521331787109375, 0.5564422607421875, 0.591552734375, 0.6266632080078125, 0.661773681640625, 0.6968841552734375, 0.73199462890625, 0.7671051025390625, 0.802215576171875, 0.8373260498046875, 0.8724365234375, 0.9075469970703125, 0.942657470703125, 0.9777679443359375, 1.01287841796875, 1.0479888916015625, 1.083099365234375, 1.1182098388671875, 1.1533203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 16.0, 21.0, 26.0, 44.0, 65.0, 100.0, 151.0, 321.0, 527.0, 1001.0, 1953.0, 3783.0, 7899.0, 16429.0, 34407.0, 72623.0, 143544.0, 232116.0, 237087.0, 149841.0, 76474.0, 36324.0, 17294.0, 8163.0, 4082.0, 1903.0, 1014.0, 571.0, 291.0, 193.0, 83.0, 63.0, 48.0, 22.0, 25.0, 14.0, 8.0, 7.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.437255859375, -0.424407958984375, -0.41156005859375, -0.398712158203125, -0.3858642578125, -0.373016357421875, -0.36016845703125, -0.347320556640625, -0.33447265625, -0.321624755859375, -0.30877685546875, -0.295928955078125, -0.2830810546875, -0.270233154296875, -0.25738525390625, -0.244537353515625, -0.231689453125, -0.218841552734375, -0.20599365234375, -0.193145751953125, -0.1802978515625, -0.167449951171875, -0.15460205078125, -0.141754150390625, -0.12890625, -0.116058349609375, -0.10321044921875, -0.090362548828125, -0.0775146484375, -0.064666748046875, -0.05181884765625, -0.038970947265625, -0.026123046875, -0.013275146484375, -0.00042724609375, 0.012420654296875, 0.0252685546875, 0.038116455078125, 0.05096435546875, 0.063812255859375, 0.07666015625, 0.089508056640625, 0.10235595703125, 0.115203857421875, 0.1280517578125, 0.140899658203125, 0.15374755859375, 0.166595458984375, 0.179443359375, 0.192291259765625, 0.20513916015625, 0.217987060546875, 0.2308349609375, 0.243682861328125, 0.25653076171875, 0.269378662109375, 0.2822265625, 0.295074462890625, 0.30792236328125, 0.320770263671875, 0.3336181640625, 0.346466064453125, 0.35931396484375, 0.372161865234375, 0.385009765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 10.0, 22.0, 23.0, 25.0, 25.0, 32.0, 25.0, 40.0, 36.0, 36.0, 37.0, 44.0, 35.0, 36.0, 34.0, 47.0, 40.0, 39.0, 47.0, 42.0, 43.0, 25.0, 43.0, 29.0, 27.0, 31.0, 15.0, 14.0, 13.0, 12.0, 8.0, 8.0, 6.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.748046875, -0.7252426147460938, -0.7024383544921875, -0.6796340942382812, -0.656829833984375, -0.6340255737304688, -0.6112213134765625, -0.5884170532226562, -0.56561279296875, -0.5428085327148438, -0.5200042724609375, -0.49720001220703125, -0.474395751953125, -0.45159149169921875, -0.4287872314453125, -0.40598297119140625, -0.3831787109375, -0.36037445068359375, -0.3375701904296875, -0.31476593017578125, -0.291961669921875, -0.26915740966796875, -0.2463531494140625, -0.22354888916015625, -0.20074462890625, -0.17794036865234375, -0.1551361083984375, -0.13233184814453125, -0.109527587890625, -0.08672332763671875, -0.0639190673828125, -0.04111480712890625, -0.018310546875, 0.00449371337890625, 0.0272979736328125, 0.05010223388671875, 0.072906494140625, 0.09571075439453125, 0.1185150146484375, 0.14131927490234375, 0.16412353515625, 0.18692779541015625, 0.2097320556640625, 0.23253631591796875, 0.255340576171875, 0.27814483642578125, 0.3009490966796875, 0.32375335693359375, 0.3465576171875, 0.36936187744140625, 0.3921661376953125, 0.41497039794921875, 0.437774658203125, 0.46057891845703125, 0.4833831787109375, 0.5061874389648438, 0.52899169921875, 0.5517959594726562, 0.5746002197265625, 0.5974044799804688, 0.620208740234375, 0.6430130004882812, 0.6658172607421875, 0.6886215209960938, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 7.0, 15.0, 20.0, 30.0, 33.0, 39.0, 80.0, 106.0, 159.0, 253.0, 363.0, 540.0, 882.0, 1338.0, 2145.0, 3523.0, 5848.0, 10449.0, 19765.0, 42676.0, 104117.0, 275394.0, 334154.0, 138400.0, 53669.0, 24343.0, 12486.0, 6746.0, 4049.0, 2498.0, 1514.0, 985.0, 650.0, 397.0, 284.0, 186.0, 112.0, 71.0, 69.0, 46.0, 28.0, 23.0, 22.0, 12.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1417236328125, -0.13717269897460938, -0.13262176513671875, -0.12807083129882812, -0.1235198974609375, -0.11896896362304688, -0.11441802978515625, -0.10986709594726562, -0.105316162109375, -0.10076522827148438, -0.09621429443359375, -0.09166336059570312, -0.0871124267578125, -0.08256149291992188, -0.07801055908203125, -0.07345962524414062, -0.06890869140625, -0.06435775756835938, -0.05980682373046875, -0.055255889892578125, -0.0507049560546875, -0.046154022216796875, -0.04160308837890625, -0.037052154541015625, -0.032501220703125, -0.027950286865234375, -0.02339935302734375, -0.018848419189453125, -0.0142974853515625, -0.009746551513671875, -0.00519561767578125, -0.000644683837890625, 0.00390625, 0.008457183837890625, 0.01300811767578125, 0.017559051513671875, 0.0221099853515625, 0.026660919189453125, 0.03121185302734375, 0.035762786865234375, 0.040313720703125, 0.044864654541015625, 0.04941558837890625, 0.053966522216796875, 0.0585174560546875, 0.06306838989257812, 0.06761932373046875, 0.07217025756835938, 0.07672119140625, 0.08127212524414062, 0.08582305908203125, 0.09037399291992188, 0.0949249267578125, 0.09947586059570312, 0.10402679443359375, 0.10857772827148438, 0.113128662109375, 0.11767959594726562, 0.12223052978515625, 0.12678146362304688, 0.1313323974609375, 0.13588333129882812, 0.14043426513671875, 0.14498519897460938, 0.1495361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 12.0, 15.0, 12.0, 30.0, 30.0, 31.0, 34.0, 43.0, 42.0, 46.0, 42.0, 64.0, 59.0, 59.0, 50.0, 56.0, 43.0, 51.0, 38.0, 39.0, 29.0, 30.0, 27.0, 21.0, 10.0, 9.0, 11.0, 10.0, 7.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0132789611816406e-05, -9.812414646148682e-06, -9.492039680480957e-06, -9.171664714813232e-06, -8.851289749145508e-06, -8.530914783477783e-06, -8.210539817810059e-06, -7.890164852142334e-06, -7.569789886474609e-06, -7.249414920806885e-06, -6.92903995513916e-06, -6.6086649894714355e-06, -6.288290023803711e-06, -5.967915058135986e-06, -5.647540092468262e-06, -5.327165126800537e-06, -5.0067901611328125e-06, -4.686415195465088e-06, -4.366040229797363e-06, -4.045665264129639e-06, -3.725290298461914e-06, -3.4049153327941895e-06, -3.084540367126465e-06, -2.7641654014587402e-06, -2.4437904357910156e-06, -2.123415470123291e-06, -1.8030405044555664e-06, -1.4826655387878418e-06, -1.1622905731201172e-06, -8.419156074523926e-07, -5.21540641784668e-07, -2.0116567611694336e-07, 1.1920928955078125e-07, 4.3958425521850586e-07, 7.599592208862305e-07, 1.080334186553955e-06, 1.4007091522216797e-06, 1.7210841178894043e-06, 2.041459083557129e-06, 2.3618340492248535e-06, 2.682209014892578e-06, 3.0025839805603027e-06, 3.3229589462280273e-06, 3.643333911895752e-06, 3.9637088775634766e-06, 4.284083843231201e-06, 4.604458808898926e-06, 4.92483377456665e-06, 5.245208740234375e-06, 5.5655837059021e-06, 5.885958671569824e-06, 6.206333637237549e-06, 6.5267086029052734e-06, 6.847083568572998e-06, 7.167458534240723e-06, 7.487833499908447e-06, 7.808208465576172e-06, 8.128583431243896e-06, 8.448958396911621e-06, 8.769333362579346e-06, 9.08970832824707e-06, 9.410083293914795e-06, 9.73045825958252e-06, 1.0050833225250244e-05, 1.0371208190917969e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 0.0, 7.0, 18.0, 19.0, 27.0, 53.0, 80.0, 119.0, 212.0, 291.0, 476.0, 824.0, 1382.0, 2432.0, 4030.0, 7078.0, 12623.0, 23080.0, 43206.0, 84580.0, 157625.0, 234993.0, 210404.0, 124752.0, 64491.0, 33679.0, 18115.0, 10100.0, 5688.0, 3372.0, 1835.0, 1180.0, 700.0, 384.0, 259.0, 164.0, 100.0, 64.0, 42.0, 20.0, 19.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111572265625, -0.1075592041015625, -0.103546142578125, -0.0995330810546875, -0.09552001953125, -0.0915069580078125, -0.087493896484375, -0.0834808349609375, -0.0794677734375, -0.0754547119140625, -0.071441650390625, -0.0674285888671875, -0.06341552734375, -0.0594024658203125, -0.055389404296875, -0.0513763427734375, -0.04736328125, -0.0433502197265625, -0.039337158203125, -0.0353240966796875, -0.03131103515625, -0.0272979736328125, -0.023284912109375, -0.0192718505859375, -0.0152587890625, -0.0112457275390625, -0.007232666015625, -0.0032196044921875, 0.00079345703125, 0.0048065185546875, 0.008819580078125, 0.0128326416015625, 0.016845703125, 0.0208587646484375, 0.024871826171875, 0.0288848876953125, 0.03289794921875, 0.0369110107421875, 0.040924072265625, 0.0449371337890625, 0.0489501953125, 0.0529632568359375, 0.056976318359375, 0.0609893798828125, 0.06500244140625, 0.0690155029296875, 0.073028564453125, 0.0770416259765625, 0.0810546875, 0.0850677490234375, 0.089080810546875, 0.0930938720703125, 0.09710693359375, 0.1011199951171875, 0.105133056640625, 0.1091461181640625, 0.1131591796875, 0.1171722412109375, 0.121185302734375, 0.1251983642578125, 0.12921142578125, 0.1332244873046875, 0.137237548828125, 0.1412506103515625, 0.145263671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 8.0, 6.0, 9.0, 17.0, 23.0, 31.0, 40.0, 47.0, 59.0, 60.0, 76.0, 96.0, 70.0, 84.0, 81.0, 55.0, 50.0, 42.0, 27.0, 22.0, 19.0, 7.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.028400421142578125, -0.02716827392578125, -0.025936126708984375, -0.0247039794921875, -0.023471832275390625, -0.02223968505859375, -0.021007537841796875, -0.019775390625, -0.018543243408203125, -0.01731109619140625, -0.016078948974609375, -0.0148468017578125, -0.013614654541015625, -0.01238250732421875, -0.011150360107421875, -0.009918212890625, -0.008686065673828125, -0.00745391845703125, -0.006221771240234375, -0.0049896240234375, -0.003757476806640625, -0.00252532958984375, -0.001293182373046875, -6.103515625e-05, 0.001171112060546875, 0.00240325927734375, 0.003635406494140625, 0.0048675537109375, 0.006099700927734375, 0.00733184814453125, 0.008563995361328125, 0.009796142578125, 0.011028289794921875, 0.01226043701171875, 0.013492584228515625, 0.0147247314453125, 0.015956878662109375, 0.01718902587890625, 0.018421173095703125, 0.0196533203125, 0.020885467529296875, 0.02211761474609375, 0.023349761962890625, 0.0245819091796875, 0.025814056396484375, 0.02704620361328125, 0.028278350830078125, 0.029510498046875, 0.030742645263671875, 0.03197479248046875, 0.033206939697265625, 0.0344390869140625, 0.035671234130859375, 0.03690338134765625, 0.038135528564453125, 0.03936767578125, 0.040599822998046875, 0.04183197021484375, 0.043064117431640625, 0.0442962646484375, 0.045528411865234375, 0.04676055908203125, 0.047992706298828125, 0.049224853515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 7.0, 6.0, 6.0, 9.0, 10.0, 16.0, 19.0, 20.0, 28.0, 48.0, 30.0, 45.0, 46.0, 66.0, 55.0, 71.0, 69.0, 54.0, 70.0, 52.0, 47.0, 43.0, 45.0, 25.0, 23.0, 18.0, 18.0, 15.0, 9.0, 10.0, 10.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.644814133644104, -1.5906760692596436, -1.5365378856658936, -1.482399821281433, -1.428261637687683, -1.3741235733032227, -1.3199853897094727, -1.2658473253250122, -1.2117092609405518, -1.1575711965560913, -1.1034330129623413, -1.0492949485778809, -0.9951568245887756, -0.9410187005996704, -0.8868805766105652, -0.83274245262146, -0.7786043286323547, -0.7244662046432495, -0.6703280806541443, -0.6161899566650391, -0.5620518922805786, -0.5079137682914734, -0.45377564430236816, -0.3996375501155853, -0.3454994261264801, -0.2913613021373749, -0.23722320795059204, -0.18308508396148682, -0.12894697487354279, -0.07480886578559875, -0.02067074179649353, 0.03346735239028931, 0.08760547637939453, 0.14174358546733856, 0.1958816945552826, 0.2500198185443878, 0.30415791273117065, 0.3582960367202759, 0.4124341607093811, 0.46657225489616394, 0.5207103490829468, 0.574848473072052, 0.6289865970611572, 0.6831246614456177, 0.7372627854347229, 0.7914009094238281, 0.8455390334129333, 0.8996771574020386, 0.9538152813911438, 1.007953405380249, 1.0620914697647095, 1.1162296533584595, 1.17036771774292, 1.22450590133667, 1.2786439657211304, 1.3327820301055908, 1.3869202136993408, 1.4410582780838013, 1.4951964616775513, 1.5493345260620117, 1.6034727096557617, 1.6576107740402222, 1.7117488384246826, 1.7658870220184326, 1.820025086402893]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 16.0, 11.0, 14.0, 17.0, 27.0, 20.0, 24.0, 28.0, 41.0, 36.0, 33.0, 33.0, 37.0, 41.0, 44.0, 40.0, 41.0, 35.0, 49.0, 46.0, 33.0, 39.0, 36.0, 29.0, 29.0, 26.0, 14.0, 24.0, 15.0, 13.0, 12.0, 8.0, 7.0, 10.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0365345478057861, -1.0054458379745483, -0.9743571877479553, -0.9432684779167175, -0.9121797680854797, -0.8810911178588867, -0.8500024080276489, -0.8189136981964111, -0.7878249883651733, -0.7567362785339355, -0.7256476283073425, -0.6945589184761047, -0.6634702086448669, -0.6323815584182739, -0.6012928485870361, -0.5702041387557983, -0.5391154289245605, -0.5080267190933228, -0.47693803906440735, -0.44584935903549194, -0.41476064920425415, -0.38367196917533875, -0.35258328914642334, -0.32149457931518555, -0.29040592908859253, -0.2593172490596771, -0.22822853922843933, -0.19713985919952393, -0.16605114936828613, -0.13496246933937073, -0.10387377440929413, -0.07278507947921753, -0.041696369647979736, -0.010607676580548286, 0.020481016486883163, 0.051569707691669464, 0.08265840262174606, 0.11374709010124207, 0.14483578503131866, 0.17592447996139526, 0.20701317489147186, 0.23810186982154846, 0.26919054985046387, 0.30027925968170166, 0.33136793971061707, 0.36245661973953247, 0.39354532957077026, 0.42463403940200806, 0.45572271943092346, 0.48681139945983887, 0.5179001092910767, 0.5489888191223145, 0.5800774693489075, 0.6111661791801453, 0.6422548890113831, 0.6733435392379761, 0.7044322490692139, 0.7355209589004517, 0.7666096091270447, 0.7976983189582825, 0.8287870287895203, 0.8598756790161133, 0.8909643888473511, 0.9220530986785889, 0.9531418085098267]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 15.0, 13.0, 24.0, 35.0, 67.0, 98.0, 133.0, 251.0, 436.0, 672.0, 1159.0, 2024.0, 3361.0, 5546.0, 9478.0, 15526.0, 24875.0, 38559.0, 57642.0, 80537.0, 104299.0, 122948.0, 129396.0, 121257.0, 101697.0, 77271.0, 54921.0, 37020.0, 23107.0, 14401.0, 8788.0, 5247.0, 3018.0, 1896.0, 1153.0, 637.0, 369.0, 241.0, 147.0, 106.0, 59.0, 37.0, 27.0, 21.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 6.0], "bins": [-1.0537109375, -1.0231094360351562, -0.9925079345703125, -0.9619064331054688, -0.931304931640625, -0.9007034301757812, -0.8701019287109375, -0.8395004272460938, -0.80889892578125, -0.7782974243164062, -0.7476959228515625, -0.7170944213867188, -0.686492919921875, -0.6558914184570312, -0.6252899169921875, -0.5946884155273438, -0.5640869140625, -0.5334854125976562, -0.5028839111328125, -0.47228240966796875, -0.441680908203125, -0.41107940673828125, -0.3804779052734375, -0.34987640380859375, -0.31927490234375, -0.28867340087890625, -0.2580718994140625, -0.22747039794921875, -0.196868896484375, -0.16626739501953125, -0.1356658935546875, -0.10506439208984375, -0.074462890625, -0.04386138916015625, -0.0132598876953125, 0.01734161376953125, 0.047943115234375, 0.07854461669921875, 0.1091461181640625, 0.13974761962890625, 0.17034912109375, 0.20095062255859375, 0.2315521240234375, 0.26215362548828125, 0.292755126953125, 0.32335662841796875, 0.3539581298828125, 0.38455963134765625, 0.4151611328125, 0.44576263427734375, 0.4763641357421875, 0.5069656372070312, 0.537567138671875, 0.5681686401367188, 0.5987701416015625, 0.6293716430664062, 0.65997314453125, 0.6905746459960938, 0.7211761474609375, 0.7517776489257812, 0.782379150390625, 0.8129806518554688, 0.8435821533203125, 0.8741836547851562, 0.90478515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 12.0, 5.0, 14.0, 16.0, 11.0, 23.0, 35.0, 22.0, 33.0, 31.0, 30.0, 44.0, 49.0, 44.0, 60.0, 49.0, 53.0, 52.0, 37.0, 45.0, 44.0, 43.0, 30.0, 25.0, 28.0, 29.0, 25.0, 8.0, 16.0, 11.0, 15.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.22607421875, -1.1884765625, -1.15087890625, -1.11328125, -1.07568359375, -1.0380859375, -1.00048828125, -0.962890625, -0.92529296875, -0.8876953125, -0.85009765625, -0.8125, -0.77490234375, -0.7373046875, -0.69970703125, -0.662109375, -0.62451171875, -0.5869140625, -0.54931640625, -0.51171875, -0.47412109375, -0.4365234375, -0.39892578125, -0.361328125, -0.32373046875, -0.2861328125, -0.24853515625, -0.2109375, -0.17333984375, -0.1357421875, -0.09814453125, -0.060546875, -0.02294921875, 0.0146484375, 0.05224609375, 0.08984375, 0.12744140625, 0.1650390625, 0.20263671875, 0.240234375, 0.27783203125, 0.3154296875, 0.35302734375, 0.390625, 0.42822265625, 0.4658203125, 0.50341796875, 0.541015625, 0.57861328125, 0.6162109375, 0.65380859375, 0.69140625, 0.72900390625, 0.7666015625, 0.80419921875, 0.841796875, 0.87939453125, 0.9169921875, 0.95458984375, 0.9921875, 1.02978515625, 1.0673828125, 1.10498046875, 1.142578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 5.0, 13.0, 18.0, 27.0, 37.0, 68.0, 94.0, 179.0, 303.0, 486.0, 819.0, 1395.0, 2398.0, 3926.0, 6242.0, 10014.0, 16372.0, 25509.0, 38498.0, 55605.0, 75921.0, 97229.0, 114464.0, 121588.0, 117499.0, 101670.0, 80640.0, 59727.0, 42282.0, 27995.0, 18212.0, 11424.0, 6979.0, 4390.0, 2663.0, 1530.0, 971.0, 557.0, 339.0, 179.0, 129.0, 59.0, 41.0, 23.0, 12.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.97216796875, -0.9423599243164062, -0.9125518798828125, -0.8827438354492188, -0.852935791015625, -0.8231277465820312, -0.7933197021484375, -0.7635116577148438, -0.73370361328125, -0.7038955688476562, -0.6740875244140625, -0.6442794799804688, -0.614471435546875, -0.5846633911132812, -0.5548553466796875, -0.5250473022460938, -0.4952392578125, -0.46543121337890625, -0.4356231689453125, -0.40581512451171875, -0.376007080078125, -0.34619903564453125, -0.3163909912109375, -0.28658294677734375, -0.25677490234375, -0.22696685791015625, -0.1971588134765625, -0.16735076904296875, -0.137542724609375, -0.10773468017578125, -0.0779266357421875, -0.04811859130859375, -0.018310546875, 0.01149749755859375, 0.0413055419921875, 0.07111358642578125, 0.100921630859375, 0.13072967529296875, 0.1605377197265625, 0.19034576416015625, 0.22015380859375, 0.24996185302734375, 0.2797698974609375, 0.30957794189453125, 0.339385986328125, 0.36919403076171875, 0.3990020751953125, 0.42881011962890625, 0.4586181640625, 0.48842620849609375, 0.5182342529296875, 0.5480422973632812, 0.577850341796875, 0.6076583862304688, 0.6374664306640625, 0.6672744750976562, 0.69708251953125, 0.7268905639648438, 0.7566986083984375, 0.7865066528320312, 0.816314697265625, 0.8461227416992188, 0.8759307861328125, 0.9057388305664062, 0.935546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 7.0, 16.0, 12.0, 29.0, 22.0, 21.0, 28.0, 25.0, 44.0, 31.0, 42.0, 53.0, 47.0, 40.0, 41.0, 30.0, 41.0, 34.0, 44.0, 47.0, 38.0, 46.0, 28.0, 32.0, 26.0, 22.0, 23.0, 26.0, 18.0, 23.0, 10.0, 9.0, 8.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5962295532226562, -0.5747833251953125, -0.5533370971679688, -0.531890869140625, -0.5104446411132812, -0.4889984130859375, -0.46755218505859375, -0.44610595703125, -0.42465972900390625, -0.4032135009765625, -0.38176727294921875, -0.360321044921875, -0.33887481689453125, -0.3174285888671875, -0.29598236083984375, -0.2745361328125, -0.25308990478515625, -0.2316436767578125, -0.21019744873046875, -0.188751220703125, -0.16730499267578125, -0.1458587646484375, -0.12441253662109375, -0.10296630859375, -0.08152008056640625, -0.0600738525390625, -0.03862762451171875, -0.017181396484375, 0.00426483154296875, 0.0257110595703125, 0.04715728759765625, 0.068603515625, 0.09004974365234375, 0.1114959716796875, 0.13294219970703125, 0.154388427734375, 0.17583465576171875, 0.1972808837890625, 0.21872711181640625, 0.24017333984375, 0.26161956787109375, 0.2830657958984375, 0.30451202392578125, 0.325958251953125, 0.34740447998046875, 0.3688507080078125, 0.39029693603515625, 0.4117431640625, 0.43318939208984375, 0.4546356201171875, 0.47608184814453125, 0.497528076171875, 0.5189743041992188, 0.5404205322265625, 0.5618667602539062, 0.58331298828125, 0.6047592163085938, 0.6262054443359375, 0.6476516723632812, 0.669097900390625, 0.6905441284179688, 0.7119903564453125, 0.7334365844726562, 0.7548828125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 21.0, 26.0, 52.0, 71.0, 107.0, 147.0, 193.0, 351.0, 498.0, 812.0, 1331.0, 2348.0, 4114.0, 7777.0, 14953.0, 29138.0, 56813.0, 104569.0, 168142.0, 209219.0, 184407.0, 121519.0, 67684.0, 35248.0, 17903.0, 9201.0, 4971.0, 2733.0, 1586.0, 945.0, 573.0, 352.0, 242.0, 158.0, 103.0, 59.0, 48.0, 39.0, 21.0, 18.0, 15.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.70123291015625, -0.6783447265625, -0.65545654296875, -0.632568359375, -0.60968017578125, -0.5867919921875, -0.56390380859375, -0.541015625, -0.51812744140625, -0.4952392578125, -0.47235107421875, -0.449462890625, -0.42657470703125, -0.4036865234375, -0.38079833984375, -0.35791015625, -0.33502197265625, -0.3121337890625, -0.28924560546875, -0.266357421875, -0.24346923828125, -0.2205810546875, -0.19769287109375, -0.1748046875, -0.15191650390625, -0.1290283203125, -0.10614013671875, -0.083251953125, -0.06036376953125, -0.0374755859375, -0.01458740234375, 0.00830078125, 0.03118896484375, 0.0540771484375, 0.07696533203125, 0.099853515625, 0.12274169921875, 0.1456298828125, 0.16851806640625, 0.19140625, 0.21429443359375, 0.2371826171875, 0.26007080078125, 0.282958984375, 0.30584716796875, 0.3287353515625, 0.35162353515625, 0.37451171875, 0.39739990234375, 0.4202880859375, 0.44317626953125, 0.466064453125, 0.48895263671875, 0.5118408203125, 0.53472900390625, 0.5576171875, 0.58050537109375, 0.6033935546875, 0.62628173828125, 0.649169921875, 0.67205810546875, 0.6949462890625, 0.71783447265625, 0.74072265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 1.0, 5.0, 11.0, 7.0, 11.0, 15.0, 17.0, 24.0, 22.0, 23.0, 27.0, 45.0, 39.0, 34.0, 52.0, 51.0, 62.0, 47.0, 40.0, 69.0, 48.0, 53.0, 48.0, 52.0, 32.0, 32.0, 36.0, 17.0, 11.0, 18.0, 8.0, 8.0, 5.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.357099533081055e-05, -4.1943974792957306e-05, -4.0316954255104065e-05, -3.8689933717250824e-05, -3.706291317939758e-05, -3.543589264154434e-05, -3.38088721036911e-05, -3.218185156583786e-05, -3.055483102798462e-05, -2.8927810490131378e-05, -2.7300789952278137e-05, -2.5673769414424896e-05, -2.4046748876571655e-05, -2.2419728338718414e-05, -2.0792707800865173e-05, -1.9165687263011932e-05, -1.753866672515869e-05, -1.591164618730545e-05, -1.428462564945221e-05, -1.2657605111598969e-05, -1.1030584573745728e-05, -9.403564035892487e-06, -7.776543498039246e-06, -6.149522960186005e-06, -4.522502422332764e-06, -2.8954818844795227e-06, -1.2684613466262817e-06, 3.5855919122695923e-07, 1.9855797290802e-06, 3.612600266933441e-06, 5.239620804786682e-06, 6.866641342639923e-06, 8.493661880493164e-06, 1.0120682418346405e-05, 1.1747702956199646e-05, 1.3374723494052887e-05, 1.5001744031906128e-05, 1.662876456975937e-05, 1.825578510761261e-05, 1.988280564546585e-05, 2.1509826183319092e-05, 2.3136846721172333e-05, 2.4763867259025574e-05, 2.6390887796878815e-05, 2.8017908334732056e-05, 2.9644928872585297e-05, 3.127194941043854e-05, 3.289896994829178e-05, 3.452599048614502e-05, 3.615301102399826e-05, 3.77800315618515e-05, 3.940705209970474e-05, 4.1034072637557983e-05, 4.2661093175411224e-05, 4.4288113713264465e-05, 4.5915134251117706e-05, 4.754215478897095e-05, 4.916917532682419e-05, 5.079619586467743e-05, 5.242321640253067e-05, 5.405023694038391e-05, 5.567725747823715e-05, 5.730427801609039e-05, 5.8931298553943634e-05, 6.0558319091796875e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 3.0, 11.0, 9.0, 17.0, 30.0, 54.0, 70.0, 127.0, 189.0, 283.0, 545.0, 880.0, 1416.0, 2431.0, 3994.0, 6661.0, 11224.0, 19066.0, 31131.0, 49666.0, 75383.0, 106676.0, 134235.0, 147185.0, 136659.0, 108893.0, 78643.0, 51342.0, 32335.0, 19917.0, 11936.0, 7034.0, 4096.0, 2517.0, 1515.0, 903.0, 569.0, 323.0, 218.0, 131.0, 84.0, 63.0, 30.0, 29.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.580078125, -0.5642051696777344, -0.5483322143554688, -0.5324592590332031, -0.5165863037109375, -0.5007133483886719, -0.48484039306640625, -0.4689674377441406, -0.453094482421875, -0.4372215270996094, -0.42134857177734375, -0.4054756164550781, -0.3896026611328125, -0.3737297058105469, -0.35785675048828125, -0.3419837951660156, -0.32611083984375, -0.3102378845214844, -0.29436492919921875, -0.2784919738769531, -0.2626190185546875, -0.24674606323242188, -0.23087310791015625, -0.21500015258789062, -0.199127197265625, -0.18325424194335938, -0.16738128662109375, -0.15150833129882812, -0.1356353759765625, -0.11976242065429688, -0.10388946533203125, -0.08801651000976562, -0.0721435546875, -0.056270599365234375, -0.04039764404296875, -0.024524688720703125, -0.0086517333984375, 0.007221221923828125, 0.02309417724609375, 0.038967132568359375, 0.054840087890625, 0.07071304321289062, 0.08658599853515625, 0.10245895385742188, 0.1183319091796875, 0.13420486450195312, 0.15007781982421875, 0.16595077514648438, 0.18182373046875, 0.19769668579101562, 0.21356964111328125, 0.22944259643554688, 0.2453155517578125, 0.2611885070800781, 0.27706146240234375, 0.2929344177246094, 0.308807373046875, 0.3246803283691406, 0.34055328369140625, 0.3564262390136719, 0.3722991943359375, 0.3881721496582031, 0.40404510498046875, 0.4199180603027344, 0.435791015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 10.0, 10.0, 8.0, 13.0, 10.0, 17.0, 22.0, 15.0, 29.0, 32.0, 36.0, 39.0, 46.0, 40.0, 43.0, 30.0, 46.0, 46.0, 45.0, 40.0, 42.0, 40.0, 37.0, 33.0, 33.0, 30.0, 23.0, 21.0, 27.0, 21.0, 19.0, 20.0, 9.0, 10.0, 9.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12152099609375, -0.11739253997802734, -0.11326408386230469, -0.10913562774658203, -0.10500717163085938, -0.10087871551513672, -0.09675025939941406, -0.0926218032836914, -0.08849334716796875, -0.0843648910522461, -0.08023643493652344, -0.07610797882080078, -0.07197952270507812, -0.06785106658935547, -0.06372261047363281, -0.059594154357910156, -0.0554656982421875, -0.051337242126464844, -0.04720878601074219, -0.04308032989501953, -0.038951873779296875, -0.03482341766357422, -0.030694961547851562, -0.026566505432128906, -0.02243804931640625, -0.018309593200683594, -0.014181137084960938, -0.010052680969238281, -0.005924224853515625, -0.0017957687377929688, 0.0023326873779296875, 0.006461143493652344, 0.010589599609375, 0.014718055725097656, 0.018846511840820312, 0.02297496795654297, 0.027103424072265625, 0.03123188018798828, 0.03536033630371094, 0.039488792419433594, 0.04361724853515625, 0.047745704650878906, 0.05187416076660156, 0.05600261688232422, 0.060131072998046875, 0.06425952911376953, 0.06838798522949219, 0.07251644134521484, 0.0766448974609375, 0.08077335357666016, 0.08490180969238281, 0.08903026580810547, 0.09315872192382812, 0.09728717803955078, 0.10141563415527344, 0.1055440902709961, 0.10967254638671875, 0.1138010025024414, 0.11792945861816406, 0.12205791473388672, 0.12618637084960938, 0.13031482696533203, 0.1344432830810547, 0.13857173919677734, 0.1427001953125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 16.0, 22.0, 26.0, 35.0, 49.0, 46.0, 52.0, 66.0, 55.0, 63.0, 78.0, 63.0, 65.0, 57.0, 39.0, 32.0, 34.0, 38.0, 17.0, 22.0, 22.0, 15.0, 10.0, 5.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5396769046783447, -1.4855743646621704, -1.4314717054367065, -1.3773691654205322, -1.3232665061950684, -1.269163966178894, -1.2150613069534302, -1.1609587669372559, -1.106856107711792, -1.0527535676956177, -0.9986509084701538, -0.9445483088493347, -0.8904457092285156, -0.8363431692123413, -0.7822405099868774, -0.7281379699707031, -0.674035370349884, -0.6199327707290649, -0.5658301711082458, -0.5117275714874268, -0.45762497186660767, -0.40352240204811096, -0.34941980242729187, -0.2953172028064728, -0.2412146031856537, -0.1871120035648346, -0.1330094039440155, -0.0789068192243576, -0.024804219603538513, 0.029298365116119385, 0.08340096473693848, 0.13750356435775757, 0.19160616397857666, 0.24570876359939575, 0.29981136322021484, 0.35391396284103394, 0.408016562461853, 0.46211913228034973, 0.5162217617034912, 0.5703243017196655, 0.6244269609451294, 0.6785295605659485, 0.7326321601867676, 0.7867347598075867, 0.8408373594284058, 0.8949398994445801, 0.949042558670044, 1.0031450986862183, 1.0572476387023926, 1.111350178718567, 1.1654528379440308, 1.219555377960205, 1.273658037185669, 1.3277605772018433, 1.3818632364273071, 1.4359657764434814, 1.4900684356689453, 1.5441709756851196, 1.5982736349105835, 1.6523761749267578, 1.7064788341522217, 1.760581374168396, 1.8146840333938599, 1.8687865734100342, 1.922889232635498]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 14.0, 19.0, 21.0, 19.0, 30.0, 30.0, 31.0, 31.0, 48.0, 46.0, 24.0, 34.0, 41.0, 45.0, 34.0, 45.0, 47.0, 44.0, 46.0, 36.0, 42.0, 37.0, 23.0, 16.0, 24.0, 22.0, 16.0, 13.0, 15.0, 11.0, 7.0, 12.0, 6.0, 10.0, 10.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0716361999511719, -1.0388997793197632, -1.006163239479065, -0.9734268188476562, -0.9406903386116028, -0.9079538583755493, -0.8752174377441406, -0.8424809575080872, -0.8097444772720337, -0.7770079970359802, -0.7442715167999268, -0.7115350961685181, -0.6787986159324646, -0.6460621356964111, -0.6133257150650024, -0.580589234828949, -0.5478527545928955, -0.515116274356842, -0.48237982392311096, -0.4496433734893799, -0.4169068932533264, -0.38417041301727295, -0.35143396258354187, -0.3186975121498108, -0.2859610319137573, -0.25322455167770386, -0.22048810124397278, -0.1877516359090805, -0.15501517057418823, -0.12227870523929596, -0.08954223990440369, -0.056805774569511414, -0.02406930923461914, 0.008667156100273132, 0.041403621435165405, 0.07414008677005768, 0.10687655210494995, 0.13961301743984222, 0.1723494827747345, 0.20508594810962677, 0.23782241344451904, 0.2705588936805725, 0.3032953441143036, 0.33603179454803467, 0.36876827478408813, 0.4015047550201416, 0.4342412054538727, 0.46697765588760376, 0.4997141361236572, 0.5324506163597107, 0.5651870965957642, 0.5979235172271729, 0.6306599974632263, 0.6633964776992798, 0.6961328983306885, 0.7288693785667419, 0.7616058588027954, 0.7943423390388489, 0.8270788192749023, 0.859815239906311, 0.8925517201423645, 0.925288200378418, 0.9580246210098267, 0.9907611012458801, 1.0234975814819336]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 17.0, 36.0, 48.0, 96.0, 103.0, 175.0, 266.0, 446.0, 790.0, 1303.0, 2120.0, 3750.0, 6345.0, 11120.0, 19382.0, 34501.0, 62484.0, 111686.0, 196831.0, 326758.0, 499138.0, 653865.0, 691305.0, 579542.0, 404078.0, 250541.0, 146391.0, 82448.0, 46626.0, 26247.0, 14894.0, 8594.0, 4901.0, 2963.0, 1765.0, 1074.0, 615.0, 380.0, 226.0, 160.0, 99.0, 52.0, 43.0, 27.0, 11.0, 7.0, 3.0, 10.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1010284423828125, -1.063385009765625, -1.0257415771484375, -0.98809814453125, -0.9504547119140625, -0.912811279296875, -0.8751678466796875, -0.8375244140625, -0.7998809814453125, -0.762237548828125, -0.7245941162109375, -0.68695068359375, -0.6493072509765625, -0.611663818359375, -0.5740203857421875, -0.536376953125, -0.4987335205078125, -0.461090087890625, -0.4234466552734375, -0.38580322265625, -0.3481597900390625, -0.310516357421875, -0.2728729248046875, -0.2352294921875, -0.1975860595703125, -0.159942626953125, -0.1222991943359375, -0.08465576171875, -0.0470123291015625, -0.009368896484375, 0.0282745361328125, 0.06591796875, 0.1035614013671875, 0.141204833984375, 0.1788482666015625, 0.21649169921875, 0.2541351318359375, 0.291778564453125, 0.3294219970703125, 0.3670654296875, 0.4047088623046875, 0.442352294921875, 0.4799957275390625, 0.51763916015625, 0.5552825927734375, 0.592926025390625, 0.6305694580078125, 0.668212890625, 0.7058563232421875, 0.743499755859375, 0.7811431884765625, 0.81878662109375, 0.8564300537109375, 0.894073486328125, 0.9317169189453125, 0.9693603515625, 1.0070037841796875, 1.044647216796875, 1.0822906494140625, 1.11993408203125, 1.1575775146484375, 1.195220947265625, 1.2328643798828125, 1.2705078125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 15.0, 9.0, 16.0, 29.0, 29.0, 26.0, 34.0, 27.0, 38.0, 44.0, 47.0, 34.0, 48.0, 49.0, 42.0, 40.0, 39.0, 43.0, 32.0, 32.0, 36.0, 33.0, 28.0, 23.0, 21.0, 21.0, 23.0, 18.0, 11.0, 15.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.806640625, -0.7824478149414062, -0.7582550048828125, -0.7340621948242188, -0.709869384765625, -0.6856765747070312, -0.6614837646484375, -0.6372909545898438, -0.61309814453125, -0.5889053344726562, -0.5647125244140625, -0.5405197143554688, -0.516326904296875, -0.49213409423828125, -0.4679412841796875, -0.44374847412109375, -0.4195556640625, -0.39536285400390625, -0.3711700439453125, -0.34697723388671875, -0.322784423828125, -0.29859161376953125, -0.2743988037109375, -0.25020599365234375, -0.22601318359375, -0.20182037353515625, -0.1776275634765625, -0.15343475341796875, -0.129241943359375, -0.10504913330078125, -0.0808563232421875, -0.05666351318359375, -0.032470703125, -0.00827789306640625, 0.0159149169921875, 0.04010772705078125, 0.064300537109375, 0.08849334716796875, 0.1126861572265625, 0.13687896728515625, 0.16107177734375, 0.18526458740234375, 0.2094573974609375, 0.23365020751953125, 0.257843017578125, 0.28203582763671875, 0.3062286376953125, 0.33042144775390625, 0.3546142578125, 0.37880706787109375, 0.4029998779296875, 0.42719268798828125, 0.451385498046875, 0.47557830810546875, 0.4997711181640625, 0.5239639282226562, 0.54815673828125, 0.5723495483398438, 0.5965423583984375, 0.6207351684570312, 0.644927978515625, 0.6691207885742188, 0.6933135986328125, 0.7175064086914062, 0.74169921875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [6.0, 3.0, 7.0, 13.0, 11.0, 26.0, 38.0, 66.0, 103.0, 191.0, 282.0, 464.0, 703.0, 1231.0, 1892.0, 3184.0, 5404.0, 8628.0, 14278.0, 23079.0, 38163.0, 62887.0, 99300.0, 157117.0, 236270.0, 334758.0, 440439.0, 517329.0, 536276.0, 490242.0, 395143.0, 289910.0, 198909.0, 128821.0, 81100.0, 50081.0, 30506.0, 18710.0, 11388.0, 6685.0, 4119.0, 2481.0, 1566.0, 985.0, 567.0, 362.0, 205.0, 140.0, 78.0, 60.0, 40.0, 20.0, 16.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92919921875, -0.8963394165039062, -0.8634796142578125, -0.8306198120117188, -0.797760009765625, -0.7649002075195312, -0.7320404052734375, -0.6991806030273438, -0.66632080078125, -0.6334609985351562, -0.6006011962890625, -0.5677413940429688, -0.534881591796875, -0.5020217895507812, -0.4691619873046875, -0.43630218505859375, -0.4034423828125, -0.37058258056640625, -0.3377227783203125, -0.30486297607421875, -0.272003173828125, -0.23914337158203125, -0.2062835693359375, -0.17342376708984375, -0.14056396484375, -0.10770416259765625, -0.0748443603515625, -0.04198455810546875, -0.009124755859375, 0.02373504638671875, 0.0565948486328125, 0.08945465087890625, 0.122314453125, 0.15517425537109375, 0.1880340576171875, 0.22089385986328125, 0.253753662109375, 0.28661346435546875, 0.3194732666015625, 0.35233306884765625, 0.38519287109375, 0.41805267333984375, 0.4509124755859375, 0.48377227783203125, 0.516632080078125, 0.5494918823242188, 0.5823516845703125, 0.6152114868164062, 0.6480712890625, 0.6809310913085938, 0.7137908935546875, 0.7466506958007812, 0.779510498046875, 0.8123703002929688, 0.8452301025390625, 0.8780899047851562, 0.91094970703125, 0.9438095092773438, 0.9766693115234375, 1.0095291137695312, 1.042388916015625, 1.0752487182617188, 1.1081085205078125, 1.1409683227539062, 1.173828125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 6.0, 6.0, 15.0, 13.0, 14.0, 22.0, 28.0, 33.0, 45.0, 52.0, 67.0, 71.0, 84.0, 81.0, 112.0, 126.0, 145.0, 147.0, 154.0, 193.0, 200.0, 202.0, 189.0, 207.0, 213.0, 185.0, 194.0, 183.0, 155.0, 141.0, 136.0, 101.0, 89.0, 79.0, 82.0, 57.0, 49.0, 28.0, 42.0, 23.0, 22.0, 10.0, 15.0, 13.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.38671875, -0.374908447265625, -0.36309814453125, -0.351287841796875, -0.3394775390625, -0.327667236328125, -0.31585693359375, -0.304046630859375, -0.292236328125, -0.280426025390625, -0.26861572265625, -0.256805419921875, -0.2449951171875, -0.233184814453125, -0.22137451171875, -0.209564208984375, -0.19775390625, -0.185943603515625, -0.17413330078125, -0.162322998046875, -0.1505126953125, -0.138702392578125, -0.12689208984375, -0.115081787109375, -0.103271484375, -0.091461181640625, -0.07965087890625, -0.067840576171875, -0.0560302734375, -0.044219970703125, -0.03240966796875, -0.020599365234375, -0.0087890625, 0.003021240234375, 0.01483154296875, 0.026641845703125, 0.0384521484375, 0.050262451171875, 0.06207275390625, 0.073883056640625, 0.085693359375, 0.097503662109375, 0.10931396484375, 0.121124267578125, 0.1329345703125, 0.144744873046875, 0.15655517578125, 0.168365478515625, 0.18017578125, 0.191986083984375, 0.20379638671875, 0.215606689453125, 0.2274169921875, 0.239227294921875, 0.25103759765625, 0.262847900390625, 0.274658203125, 0.286468505859375, 0.29827880859375, 0.310089111328125, 0.3218994140625, 0.333709716796875, 0.34552001953125, 0.357330322265625, 0.369140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 13.0, 10.0, 20.0, 14.0, 20.0, 19.0, 37.0, 42.0, 42.0, 52.0, 44.0, 60.0, 63.0, 63.0, 52.0, 53.0, 43.0, 56.0, 47.0, 41.0, 34.0, 29.0, 22.0, 25.0, 24.0, 10.0, 7.0, 12.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6071772575378418, -1.5585997104644775, -1.5100221633911133, -1.461444616317749, -1.4128670692443848, -1.3642895221710205, -1.3157119750976562, -1.267134428024292, -1.2185568809509277, -1.1699793338775635, -1.1214017868041992, -1.072824239730835, -1.0242466926574707, -0.9756691455841064, -0.927091658115387, -0.8785141110420227, -0.8299366235733032, -0.781359076499939, -0.7327815294265747, -0.6842039823532104, -0.6356264352798462, -0.5870488882064819, -0.5384714007377625, -0.4898938536643982, -0.44131630659103394, -0.3927387595176697, -0.3441612124443054, -0.29558369517326355, -0.2470061480998993, -0.19842860102653503, -0.14985108375549316, -0.1012735366821289, -0.0526958703994751, -0.004118330776691437, 0.044459208846092224, 0.09303674101829529, 0.14161428809165955, 0.1901918351650238, 0.23876935243606567, 0.28734689950942993, 0.3359244465827942, 0.38450199365615845, 0.4330795407295227, 0.4816570580005646, 0.5302345752716064, 0.5788121223449707, 0.627389669418335, 0.6759672164916992, 0.7245447635650635, 0.7731223106384277, 0.821699857711792, 0.8702774047851562, 0.9188549518585205, 0.9674324989318848, 1.016010046005249, 1.0645875930786133, 1.1131651401519775, 1.1617426872253418, 1.210320234298706, 1.2588977813720703, 1.3074753284454346, 1.3560528755187988, 1.404630422592163, 1.4532079696655273, 1.501785397529602]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 11.0, 14.0, 18.0, 20.0, 20.0, 26.0, 32.0, 26.0, 32.0, 43.0, 39.0, 31.0, 38.0, 31.0, 41.0, 42.0, 40.0, 43.0, 40.0, 42.0, 36.0, 47.0, 33.0, 29.0, 16.0, 34.0, 27.0, 15.0, 19.0, 10.0, 16.0, 12.0, 11.0, 10.0, 3.0, 10.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.025536060333252, -0.9957210421562195, -0.9659060835838318, -0.9360910654067993, -0.9062761068344116, -0.8764610886573792, -0.8466460704803467, -0.816831111907959, -0.7870160937309265, -0.757201075553894, -0.7273861169815063, -0.6975710988044739, -0.6677560806274414, -0.6379411220550537, -0.6081261038780212, -0.5783110857009888, -0.5484961271286011, -0.5186811089515686, -0.4888661503791809, -0.45905113220214844, -0.42923614382743835, -0.39942115545272827, -0.3696061372756958, -0.3397911489009857, -0.30997616052627563, -0.28016117215156555, -0.25034618377685547, -0.220531165599823, -0.19071617722511292, -0.16090118885040283, -0.13108618557453156, -0.10127118229866028, -0.0714561939239502, -0.041641198098659515, -0.011826202273368835, 0.017988793551921844, 0.047803789377212524, 0.07761877775192261, 0.10743378102779388, 0.13724878430366516, 0.16706377267837524, 0.19687876105308533, 0.2266937643289566, 0.2565087676048279, 0.28632375597953796, 0.31613874435424805, 0.3459537625312805, 0.3757687509059906, 0.4055837392807007, 0.43539872765541077, 0.46521371603012085, 0.4950287342071533, 0.524843692779541, 0.5546587109565735, 0.584473729133606, 0.6142886877059937, 0.6441037058830261, 0.6739187240600586, 0.7037336826324463, 0.7335487008094788, 0.7633637189865112, 0.7931786775588989, 0.8229936957359314, 0.8528087139129639, 0.8826236724853516]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 15.0, 21.0, 27.0, 36.0, 40.0, 75.0, 102.0, 178.0, 234.0, 318.0, 522.0, 750.0, 1180.0, 1866.0, 2999.0, 4865.0, 8342.0, 14639.0, 26880.0, 50211.0, 94159.0, 166844.0, 231184.0, 192673.0, 114023.0, 60994.0, 32664.0, 17614.0, 9820.0, 5576.0, 3467.0, 2112.0, 1335.0, 899.0, 600.0, 390.0, 272.0, 192.0, 129.0, 86.0, 59.0, 41.0, 35.0, 23.0, 18.0, 13.0, 9.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.390869140625, -0.3785209655761719, -0.36617279052734375, -0.3538246154785156, -0.3414764404296875, -0.3291282653808594, -0.31678009033203125, -0.3044319152832031, -0.292083740234375, -0.2797355651855469, -0.26738739013671875, -0.2550392150878906, -0.2426910400390625, -0.23034286499023438, -0.21799468994140625, -0.20564651489257812, -0.19329833984375, -0.18095016479492188, -0.16860198974609375, -0.15625381469726562, -0.1439056396484375, -0.13155746459960938, -0.11920928955078125, -0.10686111450195312, -0.094512939453125, -0.08216476440429688, -0.06981658935546875, -0.057468414306640625, -0.0451202392578125, -0.032772064208984375, -0.02042388916015625, -0.008075714111328125, 0.0042724609375, 0.016620635986328125, 0.02896881103515625, 0.041316986083984375, 0.0536651611328125, 0.06601333618164062, 0.07836151123046875, 0.09070968627929688, 0.103057861328125, 0.11540603637695312, 0.12775421142578125, 0.14010238647460938, 0.1524505615234375, 0.16479873657226562, 0.17714691162109375, 0.18949508666992188, 0.20184326171875, 0.21419143676757812, 0.22653961181640625, 0.23888778686523438, 0.2512359619140625, 0.2635841369628906, 0.27593231201171875, 0.2882804870605469, 0.300628662109375, 0.3129768371582031, 0.32532501220703125, 0.3376731872558594, 0.3500213623046875, 0.3623695373535156, 0.37471771240234375, 0.3870658874511719, 0.3994140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 7.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 18.0, 15.0, 26.0, 19.0, 22.0, 19.0, 26.0, 39.0, 41.0, 37.0, 38.0, 48.0, 30.0, 41.0, 48.0, 40.0, 34.0, 30.0, 38.0, 36.0, 41.0, 29.0, 31.0, 20.0, 25.0, 23.0, 25.0, 18.0, 12.0, 5.0, 12.0, 12.0, 11.0, 5.0, 4.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0360031127929688, -1.0046234130859375, -0.9732437133789062, -0.941864013671875, -0.9104843139648438, -0.8791046142578125, -0.8477249145507812, -0.81634521484375, -0.7849655151367188, -0.7535858154296875, -0.7222061157226562, -0.690826416015625, -0.6594467163085938, -0.6280670166015625, -0.5966873168945312, -0.5653076171875, -0.5339279174804688, -0.5025482177734375, -0.47116851806640625, -0.439788818359375, -0.40840911865234375, -0.3770294189453125, -0.34564971923828125, -0.31427001953125, -0.28289031982421875, -0.2515106201171875, -0.22013092041015625, -0.188751220703125, -0.15737152099609375, -0.1259918212890625, -0.09461212158203125, -0.063232421875, -0.03185272216796875, -0.0004730224609375, 0.03090667724609375, 0.062286376953125, 0.09366607666015625, 0.1250457763671875, 0.15642547607421875, 0.18780517578125, 0.21918487548828125, 0.2505645751953125, 0.28194427490234375, 0.313323974609375, 0.34470367431640625, 0.3760833740234375, 0.40746307373046875, 0.4388427734375, 0.47022247314453125, 0.5016021728515625, 0.5329818725585938, 0.564361572265625, 0.5957412719726562, 0.6271209716796875, 0.6585006713867188, 0.68988037109375, 0.7212600708007812, 0.7526397705078125, 0.7840194702148438, 0.815399169921875, 0.8467788696289062, 0.8781585693359375, 0.9095382690429688, 0.94091796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 12.0, 16.0, 27.0, 53.0, 40.0, 76.0, 128.0, 191.0, 313.0, 408.0, 645.0, 1009.0, 1678.0, 3093.0, 6303.0, 13032.0, 30344.0, 75614.0, 189844.0, 330399.0, 231462.0, 94277.0, 37567.0, 15860.0, 7191.0, 3695.0, 2024.0, 1168.0, 682.0, 465.0, 307.0, 181.0, 135.0, 108.0, 64.0, 31.0, 36.0, 13.0, 9.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5599822998046875, -0.542816162109375, -0.5256500244140625, -0.50848388671875, -0.4913177490234375, -0.474151611328125, -0.4569854736328125, -0.4398193359375, -0.4226531982421875, -0.405487060546875, -0.3883209228515625, -0.37115478515625, -0.3539886474609375, -0.336822509765625, -0.3196563720703125, -0.302490234375, -0.2853240966796875, -0.268157958984375, -0.2509918212890625, -0.23382568359375, -0.2166595458984375, -0.199493408203125, -0.1823272705078125, -0.1651611328125, -0.1479949951171875, -0.130828857421875, -0.1136627197265625, -0.09649658203125, -0.0793304443359375, -0.062164306640625, -0.0449981689453125, -0.02783203125, -0.0106658935546875, 0.006500244140625, 0.0236663818359375, 0.04083251953125, 0.0579986572265625, 0.075164794921875, 0.0923309326171875, 0.1094970703125, 0.1266632080078125, 0.143829345703125, 0.1609954833984375, 0.17816162109375, 0.1953277587890625, 0.212493896484375, 0.2296600341796875, 0.246826171875, 0.2639923095703125, 0.281158447265625, 0.2983245849609375, 0.31549072265625, 0.3326568603515625, 0.349822998046875, 0.3669891357421875, 0.3841552734375, 0.4013214111328125, 0.418487548828125, 0.4356536865234375, 0.45281982421875, 0.4699859619140625, 0.487152099609375, 0.5043182373046875, 0.521484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 8.0, 6.0, 10.0, 11.0, 11.0, 16.0, 14.0, 19.0, 20.0, 26.0, 30.0, 29.0, 39.0, 47.0, 46.0, 39.0, 42.0, 38.0, 37.0, 45.0, 46.0, 38.0, 40.0, 40.0, 42.0, 45.0, 31.0, 39.0, 14.0, 19.0, 17.0, 24.0, 14.0, 6.0, 10.0, 7.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.66143798828125, -0.6402587890625, -0.61907958984375, -0.597900390625, -0.57672119140625, -0.5555419921875, -0.53436279296875, -0.51318359375, -0.49200439453125, -0.4708251953125, -0.44964599609375, -0.428466796875, -0.40728759765625, -0.3861083984375, -0.36492919921875, -0.34375, -0.32257080078125, -0.3013916015625, -0.28021240234375, -0.259033203125, -0.23785400390625, -0.2166748046875, -0.19549560546875, -0.17431640625, -0.15313720703125, -0.1319580078125, -0.11077880859375, -0.089599609375, -0.06842041015625, -0.0472412109375, -0.02606201171875, -0.0048828125, 0.01629638671875, 0.0374755859375, 0.05865478515625, 0.079833984375, 0.10101318359375, 0.1221923828125, 0.14337158203125, 0.16455078125, 0.18572998046875, 0.2069091796875, 0.22808837890625, 0.249267578125, 0.27044677734375, 0.2916259765625, 0.31280517578125, 0.333984375, 0.35516357421875, 0.3763427734375, 0.39752197265625, 0.418701171875, 0.43988037109375, 0.4610595703125, 0.48223876953125, 0.50341796875, 0.52459716796875, 0.5457763671875, 0.56695556640625, 0.588134765625, 0.60931396484375, 0.6304931640625, 0.65167236328125, 0.6728515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 13.0, 7.0, 14.0, 19.0, 19.0, 42.0, 45.0, 62.0, 102.0, 152.0, 202.0, 311.0, 483.0, 709.0, 1112.0, 2138.0, 3962.0, 9292.0, 33561.0, 534818.0, 414011.0, 29973.0, 8666.0, 3581.0, 1907.0, 1158.0, 675.0, 459.0, 317.0, 209.0, 165.0, 94.0, 73.0, 51.0, 48.0, 31.0, 18.0, 14.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5329666137695312, -0.5131988525390625, -0.49343109130859375, -0.473663330078125, -0.45389556884765625, -0.4341278076171875, -0.41436004638671875, -0.39459228515625, -0.37482452392578125, -0.3550567626953125, -0.33528900146484375, -0.315521240234375, -0.29575347900390625, -0.2759857177734375, -0.25621795654296875, -0.2364501953125, -0.21668243408203125, -0.1969146728515625, -0.17714691162109375, -0.157379150390625, -0.13761138916015625, -0.1178436279296875, -0.09807586669921875, -0.07830810546875, -0.05854034423828125, -0.0387725830078125, -0.01900482177734375, 0.000762939453125, 0.02053070068359375, 0.0402984619140625, 0.06006622314453125, 0.079833984375, 0.09960174560546875, 0.1193695068359375, 0.13913726806640625, 0.158905029296875, 0.17867279052734375, 0.1984405517578125, 0.21820831298828125, 0.23797607421875, 0.25774383544921875, 0.2775115966796875, 0.29727935791015625, 0.317047119140625, 0.33681488037109375, 0.3565826416015625, 0.37635040283203125, 0.3961181640625, 0.41588592529296875, 0.4356536865234375, 0.45542144775390625, 0.475189208984375, 0.49495697021484375, 0.5147247314453125, 0.5344924926757812, 0.55426025390625, 0.5740280151367188, 0.5937957763671875, 0.6135635375976562, 0.633331298828125, 0.6530990600585938, 0.6728668212890625, 0.6926345825195312, 0.71240234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 7.0, 6.0, 11.0, 17.0, 37.0, 71.0, 66.0, 130.0, 157.0, 140.0, 105.0, 87.0, 61.0, 30.0, 18.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.946518361568451e-05, -2.841278910636902e-05, -2.7360394597053528e-05, -2.6308000087738037e-05, -2.5255605578422546e-05, -2.4203211069107056e-05, -2.3150816559791565e-05, -2.2098422050476074e-05, -2.1046027541160583e-05, -1.9993633031845093e-05, -1.8941238522529602e-05, -1.788884401321411e-05, -1.683644950389862e-05, -1.578405499458313e-05, -1.473166048526764e-05, -1.3679265975952148e-05, -1.2626871466636658e-05, -1.1574476957321167e-05, -1.0522082448005676e-05, -9.469687938690186e-06, -8.417293429374695e-06, -7.364898920059204e-06, -6.312504410743713e-06, -5.260109901428223e-06, -4.207715392112732e-06, -3.155320882797241e-06, -2.1029263734817505e-06, -1.0505318641662598e-06, 1.862645149230957e-09, 1.0542571544647217e-06, 2.1066516637802124e-06, 3.159046173095703e-06, 4.211440682411194e-06, 5.2638351917266846e-06, 6.316229701042175e-06, 7.368624210357666e-06, 8.421018719673157e-06, 9.473413228988647e-06, 1.0525807738304138e-05, 1.1578202247619629e-05, 1.263059675693512e-05, 1.368299126625061e-05, 1.4735385775566101e-05, 1.5787780284881592e-05, 1.6840174794197083e-05, 1.7892569303512573e-05, 1.8944963812828064e-05, 1.9997358322143555e-05, 2.1049752831459045e-05, 2.2102147340774536e-05, 2.3154541850090027e-05, 2.4206936359405518e-05, 2.5259330868721008e-05, 2.63117253780365e-05, 2.736411988735199e-05, 2.841651439666748e-05, 2.946890890598297e-05, 3.052130341529846e-05, 3.157369792461395e-05, 3.262609243392944e-05, 3.3678486943244934e-05, 3.4730881452560425e-05, 3.5783275961875916e-05, 3.6835670471191406e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 17.0, 14.0, 18.0, 39.0, 40.0, 62.0, 55.0, 96.0, 145.0, 179.0, 267.0, 332.0, 432.0, 644.0, 936.0, 1340.0, 2043.0, 3175.0, 4984.0, 8638.0, 16254.0, 38430.0, 140454.0, 507221.0, 222042.0, 53205.0, 20443.0, 10299.0, 5884.0, 3522.0, 2204.0, 1464.0, 1079.0, 701.0, 518.0, 394.0, 233.0, 200.0, 126.0, 96.0, 81.0, 64.0, 50.0, 30.0, 26.0, 18.0, 15.0, 10.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.35888671875, -0.34789276123046875, -0.3368988037109375, -0.32590484619140625, -0.314910888671875, -0.30391693115234375, -0.2929229736328125, -0.28192901611328125, -0.27093505859375, -0.25994110107421875, -0.2489471435546875, -0.23795318603515625, -0.226959228515625, -0.21596527099609375, -0.2049713134765625, -0.19397735595703125, -0.1829833984375, -0.17198944091796875, -0.1609954833984375, -0.15000152587890625, -0.139007568359375, -0.12801361083984375, -0.1170196533203125, -0.10602569580078125, -0.09503173828125, -0.08403778076171875, -0.0730438232421875, -0.06204986572265625, -0.051055908203125, -0.04006195068359375, -0.0290679931640625, -0.01807403564453125, -0.007080078125, 0.00391387939453125, 0.0149078369140625, 0.02590179443359375, 0.036895751953125, 0.04788970947265625, 0.0588836669921875, 0.06987762451171875, 0.08087158203125, 0.09186553955078125, 0.1028594970703125, 0.11385345458984375, 0.124847412109375, 0.13584136962890625, 0.1468353271484375, 0.15782928466796875, 0.1688232421875, 0.17981719970703125, 0.1908111572265625, 0.20180511474609375, 0.212799072265625, 0.22379302978515625, 0.2347869873046875, 0.24578094482421875, 0.25677490234375, 0.26776885986328125, 0.2787628173828125, 0.28975677490234375, 0.300750732421875, 0.31174468994140625, 0.3227386474609375, 0.33373260498046875, 0.3447265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 9.0, 9.0, 18.0, 20.0, 34.0, 45.0, 97.0, 220.0, 235.0, 124.0, 65.0, 31.0, 28.0, 16.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14694595336914062, -0.14264678955078125, -0.13834762573242188, -0.1340484619140625, -0.12974929809570312, -0.12545013427734375, -0.12115097045898438, -0.116851806640625, -0.11255264282226562, -0.10825347900390625, -0.10395431518554688, -0.0996551513671875, -0.09535598754882812, -0.09105682373046875, -0.08675765991210938, -0.08245849609375, -0.07815933227539062, -0.07386016845703125, -0.06956100463867188, -0.0652618408203125, -0.060962677001953125, -0.05666351318359375, -0.052364349365234375, -0.048065185546875, -0.043766021728515625, -0.03946685791015625, -0.035167694091796875, -0.0308685302734375, -0.026569366455078125, -0.02227020263671875, -0.017971038818359375, -0.013671875, -0.009372711181640625, -0.00507354736328125, -0.000774383544921875, 0.0035247802734375, 0.007823944091796875, 0.01212310791015625, 0.016422271728515625, 0.020721435546875, 0.025020599365234375, 0.02931976318359375, 0.033618927001953125, 0.0379180908203125, 0.042217254638671875, 0.04651641845703125, 0.050815582275390625, 0.05511474609375, 0.059413909912109375, 0.06371307373046875, 0.06801223754882812, 0.0723114013671875, 0.07661056518554688, 0.08090972900390625, 0.08520889282226562, 0.089508056640625, 0.09380722045898438, 0.09810638427734375, 0.10240554809570312, 0.1067047119140625, 0.11100387573242188, 0.11530303955078125, 0.11960220336914062, 0.1239013671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 21.0, 10.0, 20.0, 22.0, 33.0, 29.0, 44.0, 48.0, 51.0, 52.0, 64.0, 59.0, 46.0, 58.0, 54.0, 46.0, 49.0, 41.0, 42.0, 37.0, 21.0, 23.0, 23.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5663504600524902, -1.518341064453125, -1.4703317880630493, -1.422322392463684, -1.3743131160736084, -1.3263037204742432, -1.2782944440841675, -1.2302850484848022, -1.1822757720947266, -1.1342663764953613, -1.0862571001052856, -1.0382477045059204, -0.9902384281158447, -0.9422290921211243, -0.8942197561264038, -0.8462103605270386, -0.7982010245323181, -0.7501916885375977, -0.7021823525428772, -0.6541730165481567, -0.6061636805534363, -0.5581543445587158, -0.5101449489593506, -0.4621356427669525, -0.41412630677223206, -0.3661169707775116, -0.31810763478279114, -0.2700982689857483, -0.22208894789218903, -0.17407961189746857, -0.12607026100158691, -0.07806092500686646, -0.030051589012145996, 0.01795775070786476, 0.06596709042787552, 0.11397643387317657, 0.16198576986789703, 0.2099951058626175, 0.25800445675849915, 0.3060137927532196, 0.35402312874794006, 0.4020324647426605, 0.450041800737381, 0.49805116653442383, 0.5460605025291443, 0.5940698385238647, 0.6420791745185852, 0.6900885105133057, 0.7380978465080261, 0.7861071825027466, 0.834116518497467, 0.8821258544921875, 0.930135190486908, 0.9781445264816284, 1.0261539220809937, 1.0741631984710693, 1.1221725940704346, 1.1701819896697998, 1.2181912660598755, 1.2662006616592407, 1.3142099380493164, 1.3622193336486816, 1.4102286100387573, 1.4582380056381226, 1.5062472820281982]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 18.0, 22.0, 23.0, 23.0, 29.0, 28.0, 34.0, 39.0, 43.0, 34.0, 30.0, 35.0, 38.0, 45.0, 41.0, 39.0, 34.0, 40.0, 43.0, 40.0, 36.0, 28.0, 18.0, 34.0, 23.0, 12.0, 23.0, 14.0, 10.0, 14.0, 15.0, 8.0, 4.0, 7.0, 11.0, 7.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.999873161315918, -0.9706754088401794, -0.9414777159690857, -0.9122799634933472, -0.8830822706222534, -0.8538845181465149, -0.8246867656707764, -0.7954890727996826, -0.7662913799285889, -0.7370936274528503, -0.7078959345817566, -0.6786981821060181, -0.6495004892349243, -0.6203027367591858, -0.5911049842834473, -0.5619072914123535, -0.532709538936615, -0.5035117864608765, -0.4743140935897827, -0.4451163411140442, -0.41591864824295044, -0.3867208957672119, -0.3575231730937958, -0.32832545042037964, -0.2991277277469635, -0.26993000507354736, -0.24073228240013123, -0.2115345448255539, -0.18233682215213776, -0.15313909947872162, -0.12394136190414429, -0.09474363923072815, -0.06554597616195679, -0.03634824976325035, -0.007150523364543915, 0.02204720675945282, 0.05124492943286896, 0.0804426521062851, 0.10964038968086243, 0.13883811235427856, 0.1680358350276947, 0.19723355770111084, 0.22643128037452698, 0.2556290030479431, 0.28482675552368164, 0.3140244483947754, 0.3432222008705139, 0.37241992354393005, 0.4016176462173462, 0.43081536889076233, 0.46001309156417847, 0.489210844039917, 0.5184085369110107, 0.5476062893867493, 0.5768040418624878, 0.6060017347335815, 0.6351994276046753, 0.6643971800804138, 0.6935948729515076, 0.7227926254272461, 0.7519903182983398, 0.7811880707740784, 0.8103858232498169, 0.8395835161209106, 0.8687812685966492]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 10.0, 11.0, 23.0, 48.0, 76.0, 86.0, 154.0, 228.0, 424.0, 616.0, 877.0, 1482.0, 2232.0, 3495.0, 5394.0, 8185.0, 12522.0, 18719.0, 26972.0, 38317.0, 52104.0, 68538.0, 84633.0, 98160.0, 105484.0, 106325.0, 97266.0, 83393.0, 66853.0, 50854.0, 37206.0, 25735.0, 17828.0, 11861.0, 7833.0, 5104.0, 3333.0, 2149.0, 1460.0, 932.0, 580.0, 362.0, 280.0, 153.0, 89.0, 65.0, 35.0, 29.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.81005859375, -0.7847061157226562, -0.7593536376953125, -0.7340011596679688, -0.708648681640625, -0.6832962036132812, -0.6579437255859375, -0.6325912475585938, -0.60723876953125, -0.5818862915039062, -0.5565338134765625, -0.5311813354492188, -0.505828857421875, -0.48047637939453125, -0.4551239013671875, -0.42977142333984375, -0.4044189453125, -0.37906646728515625, -0.3537139892578125, -0.32836151123046875, -0.303009033203125, -0.27765655517578125, -0.2523040771484375, -0.22695159912109375, -0.20159912109375, -0.17624664306640625, -0.1508941650390625, -0.12554168701171875, -0.100189208984375, -0.07483673095703125, -0.0494842529296875, -0.02413177490234375, 0.001220703125, 0.02657318115234375, 0.0519256591796875, 0.07727813720703125, 0.102630615234375, 0.12798309326171875, 0.1533355712890625, 0.17868804931640625, 0.20404052734375, 0.22939300537109375, 0.2547454833984375, 0.28009796142578125, 0.305450439453125, 0.33080291748046875, 0.3561553955078125, 0.38150787353515625, 0.4068603515625, 0.43221282958984375, 0.4575653076171875, 0.48291778564453125, 0.508270263671875, 0.5336227416992188, 0.5589752197265625, 0.5843276977539062, 0.60968017578125, 0.6350326538085938, 0.6603851318359375, 0.6857376098632812, 0.711090087890625, 0.7364425659179688, 0.7617950439453125, 0.7871475219726562, 0.8125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 14.0, 11.0, 13.0, 17.0, 17.0, 22.0, 19.0, 26.0, 24.0, 36.0, 34.0, 36.0, 34.0, 41.0, 37.0, 41.0, 41.0, 28.0, 54.0, 39.0, 34.0, 39.0, 49.0, 29.0, 28.0, 27.0, 20.0, 22.0, 24.0, 23.0, 15.0, 16.0, 10.0, 13.0, 14.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0791015625, -1.04779052734375, -1.0164794921875, -0.98516845703125, -0.953857421875, -0.92254638671875, -0.8912353515625, -0.85992431640625, -0.82861328125, -0.79730224609375, -0.7659912109375, -0.73468017578125, -0.703369140625, -0.67205810546875, -0.6407470703125, -0.60943603515625, -0.578125, -0.54681396484375, -0.5155029296875, -0.48419189453125, -0.452880859375, -0.42156982421875, -0.3902587890625, -0.35894775390625, -0.32763671875, -0.29632568359375, -0.2650146484375, -0.23370361328125, -0.202392578125, -0.17108154296875, -0.1397705078125, -0.10845947265625, -0.0771484375, -0.04583740234375, -0.0145263671875, 0.01678466796875, 0.048095703125, 0.07940673828125, 0.1107177734375, 0.14202880859375, 0.17333984375, 0.20465087890625, 0.2359619140625, 0.26727294921875, 0.298583984375, 0.32989501953125, 0.3612060546875, 0.39251708984375, 0.423828125, 0.45513916015625, 0.4864501953125, 0.51776123046875, 0.549072265625, 0.58038330078125, 0.6116943359375, 0.64300537109375, 0.67431640625, 0.70562744140625, 0.7369384765625, 0.76824951171875, 0.799560546875, 0.83087158203125, 0.8621826171875, 0.89349365234375, 0.9248046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 13.0, 20.0, 29.0, 44.0, 67.0, 101.0, 148.0, 276.0, 357.0, 662.0, 1004.0, 1583.0, 2454.0, 4004.0, 6099.0, 9600.0, 15093.0, 22473.0, 32911.0, 46223.0, 62955.0, 80810.0, 97359.0, 108282.0, 110793.0, 103765.0, 90898.0, 73331.0, 55579.0, 40128.0, 28018.0, 18925.0, 12409.0, 8120.0, 5110.0, 3319.0, 2035.0, 1259.0, 846.0, 519.0, 318.0, 219.0, 143.0, 86.0, 58.0, 45.0, 18.0, 13.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8521575927734375, -0.824920654296875, -0.7976837158203125, -0.77044677734375, -0.7432098388671875, -0.715972900390625, -0.6887359619140625, -0.6614990234375, -0.6342620849609375, -0.607025146484375, -0.5797882080078125, -0.55255126953125, -0.5253143310546875, -0.498077392578125, -0.4708404541015625, -0.443603515625, -0.4163665771484375, -0.389129638671875, -0.3618927001953125, -0.33465576171875, -0.3074188232421875, -0.280181884765625, -0.2529449462890625, -0.2257080078125, -0.1984710693359375, -0.171234130859375, -0.1439971923828125, -0.11676025390625, -0.0895233154296875, -0.062286376953125, -0.0350494384765625, -0.0078125, 0.0194244384765625, 0.046661376953125, 0.0738983154296875, 0.10113525390625, 0.1283721923828125, 0.155609130859375, 0.1828460693359375, 0.2100830078125, 0.2373199462890625, 0.264556884765625, 0.2917938232421875, 0.31903076171875, 0.3462677001953125, 0.373504638671875, 0.4007415771484375, 0.427978515625, 0.4552154541015625, 0.482452392578125, 0.5096893310546875, 0.53692626953125, 0.5641632080078125, 0.591400146484375, 0.6186370849609375, 0.6458740234375, 0.6731109619140625, 0.700347900390625, 0.7275848388671875, 0.75482177734375, 0.7820587158203125, 0.809295654296875, 0.8365325927734375, 0.86376953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 17.0, 12.0, 17.0, 18.0, 12.0, 18.0, 21.0, 23.0, 33.0, 25.0, 30.0, 18.0, 29.0, 42.0, 31.0, 35.0, 46.0, 48.0, 29.0, 45.0, 41.0, 33.0, 28.0, 36.0, 31.0, 30.0, 30.0, 33.0, 26.0, 22.0, 17.0, 19.0, 15.0, 9.0, 12.0, 4.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.546875, -0.5294418334960938, -0.5120086669921875, -0.49457550048828125, -0.477142333984375, -0.45970916748046875, -0.4422760009765625, -0.42484283447265625, -0.40740966796875, -0.38997650146484375, -0.3725433349609375, -0.35511016845703125, -0.337677001953125, -0.32024383544921875, -0.3028106689453125, -0.28537750244140625, -0.2679443359375, -0.25051116943359375, -0.2330780029296875, -0.21564483642578125, -0.198211669921875, -0.18077850341796875, -0.1633453369140625, -0.14591217041015625, -0.12847900390625, -0.11104583740234375, -0.0936126708984375, -0.07617950439453125, -0.058746337890625, -0.04131317138671875, -0.0238800048828125, -0.00644683837890625, 0.010986328125, 0.02841949462890625, 0.0458526611328125, 0.06328582763671875, 0.080718994140625, 0.09815216064453125, 0.1155853271484375, 0.13301849365234375, 0.15045166015625, 0.16788482666015625, 0.1853179931640625, 0.20275115966796875, 0.220184326171875, 0.23761749267578125, 0.2550506591796875, 0.27248382568359375, 0.2899169921875, 0.30735015869140625, 0.3247833251953125, 0.34221649169921875, 0.359649658203125, 0.37708282470703125, 0.3945159912109375, 0.41194915771484375, 0.42938232421875, 0.44681549072265625, 0.4642486572265625, 0.48168182373046875, 0.499114990234375, 0.5165481567382812, 0.5339813232421875, 0.5514144897460938, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 12.0, 23.0, 47.0, 69.0, 102.0, 148.0, 236.0, 362.0, 641.0, 980.0, 1418.0, 2274.0, 3591.0, 5607.0, 8773.0, 13739.0, 21428.0, 32919.0, 49663.0, 71792.0, 96924.0, 120999.0, 132617.0, 127312.0, 107304.0, 81767.0, 57413.0, 38751.0, 25680.0, 16575.0, 10579.0, 6772.0, 4415.0, 2838.0, 1642.0, 1159.0, 706.0, 486.0, 295.0, 164.0, 128.0, 68.0, 59.0, 26.0, 19.0, 11.0, 11.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45325469970703125, -0.4384918212890625, -0.42372894287109375, -0.408966064453125, -0.39420318603515625, -0.3794403076171875, -0.36467742919921875, -0.34991455078125, -0.33515167236328125, -0.3203887939453125, -0.30562591552734375, -0.290863037109375, -0.27610015869140625, -0.2613372802734375, -0.24657440185546875, -0.2318115234375, -0.21704864501953125, -0.2022857666015625, -0.18752288818359375, -0.172760009765625, -0.15799713134765625, -0.1432342529296875, -0.12847137451171875, -0.11370849609375, -0.09894561767578125, -0.0841827392578125, -0.06941986083984375, -0.054656982421875, -0.03989410400390625, -0.0251312255859375, -0.01036834716796875, 0.00439453125, 0.01915740966796875, 0.0339202880859375, 0.04868316650390625, 0.063446044921875, 0.07820892333984375, 0.0929718017578125, 0.10773468017578125, 0.12249755859375, 0.13726043701171875, 0.1520233154296875, 0.16678619384765625, 0.181549072265625, 0.19631195068359375, 0.2110748291015625, 0.22583770751953125, 0.2406005859375, 0.25536346435546875, 0.2701263427734375, 0.28488922119140625, 0.299652099609375, 0.31441497802734375, 0.3291778564453125, 0.34394073486328125, 0.35870361328125, 0.37346649169921875, 0.3882293701171875, 0.40299224853515625, 0.417755126953125, 0.43251800537109375, 0.4472808837890625, 0.46204376220703125, 0.476806640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 12.0, 7.0, 8.0, 3.0, 14.0, 16.0, 24.0, 21.0, 35.0, 26.0, 43.0, 54.0, 50.0, 47.0, 54.0, 48.0, 53.0, 57.0, 50.0, 47.0, 45.0, 49.0, 34.0, 37.0, 35.0, 26.0, 25.0, 18.0, 17.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.739927291870117e-05, -5.577225238084793e-05, -5.414523184299469e-05, -5.251821130514145e-05, -5.089119076728821e-05, -4.926417022943497e-05, -4.7637149691581726e-05, -4.6010129153728485e-05, -4.4383108615875244e-05, -4.2756088078022e-05, -4.112906754016876e-05, -3.950204700231552e-05, -3.787502646446228e-05, -3.624800592660904e-05, -3.46209853887558e-05, -3.299396485090256e-05, -3.1366944313049316e-05, -2.9739923775196075e-05, -2.8112903237342834e-05, -2.6485882699489594e-05, -2.4858862161636353e-05, -2.323184162378311e-05, -2.160482108592987e-05, -1.997780054807663e-05, -1.835078001022339e-05, -1.6723759472370148e-05, -1.5096738934516907e-05, -1.3469718396663666e-05, -1.1842697858810425e-05, -1.0215677320957184e-05, -8.588656783103943e-06, -6.961636245250702e-06, -5.334615707397461e-06, -3.70759516954422e-06, -2.080574631690979e-06, -4.5355409383773804e-07, 1.173466444015503e-06, 2.800486981868744e-06, 4.427507519721985e-06, 6.054528057575226e-06, 7.681548595428467e-06, 9.308569133281708e-06, 1.0935589671134949e-05, 1.256261020898819e-05, 1.418963074684143e-05, 1.581665128469467e-05, 1.7443671822547913e-05, 1.9070692360401154e-05, 2.0697712898254395e-05, 2.2324733436107635e-05, 2.3951753973960876e-05, 2.5578774511814117e-05, 2.720579504966736e-05, 2.88328155875206e-05, 3.045983612537384e-05, 3.208685666322708e-05, 3.371387720108032e-05, 3.534089773893356e-05, 3.6967918276786804e-05, 3.8594938814640045e-05, 4.0221959352493286e-05, 4.184897989034653e-05, 4.347600042819977e-05, 4.510302096605301e-05, 4.673004150390625e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 14.0, 27.0, 46.0, 61.0, 116.0, 195.0, 314.0, 435.0, 773.0, 1214.0, 2107.0, 3487.0, 5866.0, 9935.0, 16769.0, 27183.0, 43301.0, 66628.0, 94840.0, 123548.0, 142199.0, 140680.0, 118615.0, 88658.0, 60800.0, 39430.0, 24270.0, 14941.0, 8973.0, 5110.0, 3178.0, 1855.0, 1107.0, 713.0, 447.0, 244.0, 173.0, 109.0, 62.0, 42.0, 34.0, 17.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49330902099609375, -0.4773406982421875, -0.46137237548828125, -0.445404052734375, -0.42943572998046875, -0.4134674072265625, -0.39749908447265625, -0.38153076171875, -0.36556243896484375, -0.3495941162109375, -0.33362579345703125, -0.317657470703125, -0.30168914794921875, -0.2857208251953125, -0.26975250244140625, -0.2537841796875, -0.23781585693359375, -0.2218475341796875, -0.20587921142578125, -0.189910888671875, -0.17394256591796875, -0.1579742431640625, -0.14200592041015625, -0.12603759765625, -0.11006927490234375, -0.0941009521484375, -0.07813262939453125, -0.062164306640625, -0.04619598388671875, -0.0302276611328125, -0.01425933837890625, 0.001708984375, 0.01767730712890625, 0.0336456298828125, 0.04961395263671875, 0.065582275390625, 0.08155059814453125, 0.0975189208984375, 0.11348724365234375, 0.12945556640625, 0.14542388916015625, 0.1613922119140625, 0.17736053466796875, 0.193328857421875, 0.20929718017578125, 0.2252655029296875, 0.24123382568359375, 0.2572021484375, 0.27317047119140625, 0.2891387939453125, 0.30510711669921875, 0.321075439453125, 0.33704376220703125, 0.3530120849609375, 0.36898040771484375, 0.38494873046875, 0.40091705322265625, 0.4168853759765625, 0.43285369873046875, 0.448822021484375, 0.46479034423828125, 0.4807586669921875, 0.49672698974609375, 0.5126953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 17.0, 9.0, 11.0, 12.0, 19.0, 17.0, 23.0, 29.0, 24.0, 37.0, 37.0, 33.0, 32.0, 41.0, 34.0, 43.0, 53.0, 50.0, 48.0, 50.0, 45.0, 54.0, 36.0, 32.0, 28.0, 24.0, 26.0, 17.0, 20.0, 15.0, 11.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.1547374725341797, -0.15017318725585938, -0.14560890197753906, -0.14104461669921875, -0.13648033142089844, -0.13191604614257812, -0.1273517608642578, -0.1227874755859375, -0.11822319030761719, -0.11365890502929688, -0.10909461975097656, -0.10453033447265625, -0.09996604919433594, -0.09540176391601562, -0.09083747863769531, -0.086273193359375, -0.08170890808105469, -0.07714462280273438, -0.07258033752441406, -0.06801605224609375, -0.06345176696777344, -0.058887481689453125, -0.05432319641113281, -0.0497589111328125, -0.04519462585449219, -0.040630340576171875, -0.03606605529785156, -0.03150177001953125, -0.026937484741210938, -0.022373199462890625, -0.017808914184570312, -0.01324462890625, -0.008680343627929688, -0.004116058349609375, 0.0004482269287109375, 0.00501251220703125, 0.009576797485351562, 0.014141082763671875, 0.018705368041992188, 0.0232696533203125, 0.027833938598632812, 0.032398223876953125, 0.03696250915527344, 0.04152679443359375, 0.04609107971191406, 0.050655364990234375, 0.05521965026855469, 0.059783935546875, 0.06434822082519531, 0.06891250610351562, 0.07347679138183594, 0.07804107666015625, 0.08260536193847656, 0.08716964721679688, 0.09173393249511719, 0.0962982177734375, 0.10086250305175781, 0.10542678833007812, 0.10999107360839844, 0.11455535888671875, 0.11911964416503906, 0.12368392944335938, 0.1282482147216797, 0.1328125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 7.0, 8.0, 6.0, 11.0, 11.0, 18.0, 17.0, 22.0, 28.0, 35.0, 44.0, 45.0, 47.0, 43.0, 42.0, 49.0, 56.0, 61.0, 54.0, 46.0, 47.0, 38.0, 41.0, 40.0, 34.0, 27.0, 24.0, 23.0, 13.0, 15.0, 10.0, 6.0, 9.0, 5.0, 5.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.5691479444503784, -1.5247411727905273, -1.4803344011306763, -1.4359276294708252, -1.3915208578109741, -1.347114086151123, -1.302707314491272, -1.258300542831421, -1.2138937711715698, -1.1694869995117188, -1.1250802278518677, -1.0806734561920166, -1.0362666845321655, -0.9918599128723145, -0.9474531412124634, -0.9030463695526123, -0.858639657497406, -0.8142328858375549, -0.7698261141777039, -0.7254193425178528, -0.6810125708580017, -0.6366057991981506, -0.5921990871429443, -0.5477923154830933, -0.5033855438232422, -0.4589787721633911, -0.41457200050354004, -0.37016522884368896, -0.3257584571838379, -0.2813516855239868, -0.23694494366645813, -0.19253817200660706, -0.1481313705444336, -0.10372459888458252, -0.05931783467531204, -0.014911070466041565, 0.02949570119380951, 0.07390247285366058, 0.11830922961235046, 0.16271600127220154, 0.2071227729320526, 0.2515295445919037, 0.29593631625175476, 0.34034305810928345, 0.3847498297691345, 0.4291566014289856, 0.47356337308883667, 0.5179701447486877, 0.5623769164085388, 0.6067836880683899, 0.651190459728241, 0.695597231388092, 0.7400040030479431, 0.7844107747077942, 0.8288174867630005, 0.8732242584228516, 0.9176310300827026, 0.9620378017425537, 1.0064445734024048, 1.0508513450622559, 1.095258116722107, 1.139664888381958, 1.184071660041809, 1.2284784317016602, 1.2728852033615112]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 3.0, 1.0, 11.0, 7.0, 14.0, 14.0, 17.0, 23.0, 14.0, 32.0, 18.0, 27.0, 26.0, 38.0, 34.0, 32.0, 37.0, 31.0, 40.0, 43.0, 31.0, 47.0, 36.0, 26.0, 32.0, 33.0, 23.0, 25.0, 33.0, 29.0, 31.0, 23.0, 21.0, 28.0, 21.0, 19.0, 6.0, 7.0, 6.0, 10.0, 5.0, 9.0, 8.0, 8.0, 5.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8512454032897949, -0.823173463344574, -0.795101523399353, -0.7670295834541321, -0.7389576435089111, -0.7108856439590454, -0.6828137040138245, -0.6547417640686035, -0.6266698241233826, -0.5985978841781616, -0.5705259442329407, -0.5424540042877197, -0.514382004737854, -0.48631009459495544, -0.4582381248474121, -0.43016618490219116, -0.4020942449569702, -0.37402230501174927, -0.3459503650665283, -0.317878395318985, -0.28980645537376404, -0.2617345154285431, -0.23366256058216095, -0.2055906057357788, -0.17751866579055786, -0.14944672584533691, -0.12137477099895477, -0.09330282360315323, -0.06523087620735168, -0.03715893626213074, -0.009086981415748596, 0.018984973430633545, 0.04705685377120972, 0.07512880116701126, 0.1032007485628128, 0.13127270340919495, 0.1593446433544159, 0.18741658329963684, 0.21548853814601898, 0.24356049299240112, 0.27163243293762207, 0.299704372882843, 0.32777631282806396, 0.3558482825756073, 0.38392022252082825, 0.4119921624660492, 0.44006413221359253, 0.4681360721588135, 0.4962080121040344, 0.5242799520492554, 0.5523518919944763, 0.5804238319396973, 0.608495831489563, 0.6365677118301392, 0.6646397113800049, 0.6927116513252258, 0.7207835912704468, 0.7488555312156677, 0.7769274711608887, 0.8049994111061096, 0.8330713510513306, 0.8611433506011963, 0.8892152905464172, 0.9172872304916382, 0.9453591704368591]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 14.0, 13.0, 21.0, 48.0, 64.0, 116.0, 182.0, 321.0, 636.0, 1056.0, 1945.0, 3825.0, 7265.0, 14544.0, 28719.0, 57960.0, 116626.0, 230718.0, 419027.0, 664369.0, 820548.0, 738583.0, 502134.0, 286032.0, 149223.0, 74702.0, 37259.0, 18699.0, 9440.0, 4701.0, 2513.0, 1301.0, 746.0, 417.0, 191.0, 134.0, 85.0, 44.0, 21.0, 17.0, 7.0, 6.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5625, -1.5160980224609375, -1.469696044921875, -1.4232940673828125, -1.37689208984375, -1.3304901123046875, -1.284088134765625, -1.2376861572265625, -1.1912841796875, -1.1448822021484375, -1.098480224609375, -1.0520782470703125, -1.00567626953125, -0.9592742919921875, -0.912872314453125, -0.8664703369140625, -0.820068359375, -0.7736663818359375, -0.727264404296875, -0.6808624267578125, -0.63446044921875, -0.5880584716796875, -0.541656494140625, -0.4952545166015625, -0.4488525390625, -0.4024505615234375, -0.356048583984375, -0.3096466064453125, -0.26324462890625, -0.2168426513671875, -0.170440673828125, -0.1240386962890625, -0.07763671875, -0.0312347412109375, 0.015167236328125, 0.0615692138671875, 0.10797119140625, 0.1543731689453125, 0.200775146484375, 0.2471771240234375, 0.2935791015625, 0.3399810791015625, 0.386383056640625, 0.4327850341796875, 0.47918701171875, 0.5255889892578125, 0.571990966796875, 0.6183929443359375, 0.664794921875, 0.7111968994140625, 0.757598876953125, 0.8040008544921875, 0.85040283203125, 0.8968048095703125, 0.943206787109375, 0.9896087646484375, 1.0360107421875, 1.0824127197265625, 1.128814697265625, 1.1752166748046875, 1.22161865234375, 1.2680206298828125, 1.314422607421875, 1.3608245849609375, 1.4072265625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 14.0, 13.0, 15.0, 18.0, 37.0, 25.0, 29.0, 32.0, 29.0, 33.0, 33.0, 42.0, 39.0, 47.0, 38.0, 48.0, 35.0, 49.0, 52.0, 39.0, 34.0, 36.0, 28.0, 29.0, 32.0, 18.0, 22.0, 17.0, 14.0, 12.0, 8.0, 12.0, 14.0, 4.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.73187255859375, -0.7064208984375, -0.68096923828125, -0.655517578125, -0.63006591796875, -0.6046142578125, -0.57916259765625, -0.5537109375, -0.52825927734375, -0.5028076171875, -0.47735595703125, -0.451904296875, -0.42645263671875, -0.4010009765625, -0.37554931640625, -0.35009765625, -0.32464599609375, -0.2991943359375, -0.27374267578125, -0.248291015625, -0.22283935546875, -0.1973876953125, -0.17193603515625, -0.146484375, -0.12103271484375, -0.0955810546875, -0.07012939453125, -0.044677734375, -0.01922607421875, 0.0062255859375, 0.03167724609375, 0.05712890625, 0.08258056640625, 0.1080322265625, 0.13348388671875, 0.158935546875, 0.18438720703125, 0.2098388671875, 0.23529052734375, 0.2607421875, 0.28619384765625, 0.3116455078125, 0.33709716796875, 0.362548828125, 0.38800048828125, 0.4134521484375, 0.43890380859375, 0.46435546875, 0.48980712890625, 0.5152587890625, 0.54071044921875, 0.566162109375, 0.59161376953125, 0.6170654296875, 0.64251708984375, 0.66796875, 0.69342041015625, 0.7188720703125, 0.74432373046875, 0.769775390625, 0.79522705078125, 0.8206787109375, 0.84613037109375, 0.87158203125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 10.0, 15.0, 29.0, 49.0, 59.0, 101.0, 147.0, 208.0, 345.0, 565.0, 924.0, 1485.0, 2386.0, 3765.0, 5901.0, 9598.0, 15752.0, 25186.0, 39861.0, 63095.0, 98882.0, 148523.0, 217341.0, 302422.0, 391982.0, 468376.0, 502358.0, 479228.0, 411582.0, 320062.0, 232448.0, 160558.0, 105881.0, 69419.0, 43298.0, 27452.0, 16920.0, 10505.0, 6654.0, 4075.0, 2620.0, 1543.0, 991.0, 646.0, 381.0, 258.0, 134.0, 80.0, 75.0, 29.0, 29.0, 21.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.97314453125, -0.9413375854492188, -0.9095306396484375, -0.8777236938476562, -0.845916748046875, -0.8141098022460938, -0.7823028564453125, -0.7504959106445312, -0.71868896484375, -0.6868820190429688, -0.6550750732421875, -0.6232681274414062, -0.591461181640625, -0.5596542358398438, -0.5278472900390625, -0.49604034423828125, -0.4642333984375, -0.43242645263671875, -0.4006195068359375, -0.36881256103515625, -0.337005615234375, -0.30519866943359375, -0.2733917236328125, -0.24158477783203125, -0.20977783203125, -0.17797088623046875, -0.1461639404296875, -0.11435699462890625, -0.082550048828125, -0.05074310302734375, -0.0189361572265625, 0.01287078857421875, 0.044677734375, 0.07648468017578125, 0.1082916259765625, 0.14009857177734375, 0.171905517578125, 0.20371246337890625, 0.2355194091796875, 0.26732635498046875, 0.29913330078125, 0.33094024658203125, 0.3627471923828125, 0.39455413818359375, 0.426361083984375, 0.45816802978515625, 0.4899749755859375, 0.5217819213867188, 0.5535888671875, 0.5853958129882812, 0.6172027587890625, 0.6490097045898438, 0.680816650390625, 0.7126235961914062, 0.7444305419921875, 0.7762374877929688, 0.80804443359375, 0.8398513793945312, 0.8716583251953125, 0.9034652709960938, 0.935272216796875, 0.9670791625976562, 0.9988861083984375, 1.0306930541992188, 1.0625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 24.0, 16.0, 21.0, 33.0, 30.0, 47.0, 66.0, 62.0, 90.0, 85.0, 91.0, 122.0, 112.0, 157.0, 172.0, 160.0, 202.0, 196.0, 209.0, 175.0, 189.0, 207.0, 182.0, 204.0, 166.0, 154.0, 135.0, 126.0, 108.0, 84.0, 69.0, 65.0, 54.0, 41.0, 54.0, 28.0, 40.0, 20.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.392578125, -0.3801116943359375, -0.367645263671875, -0.3551788330078125, -0.34271240234375, -0.3302459716796875, -0.317779541015625, -0.3053131103515625, -0.2928466796875, -0.2803802490234375, -0.267913818359375, -0.2554473876953125, -0.24298095703125, -0.2305145263671875, -0.218048095703125, -0.2055816650390625, -0.193115234375, -0.1806488037109375, -0.168182373046875, -0.1557159423828125, -0.14324951171875, -0.1307830810546875, -0.118316650390625, -0.1058502197265625, -0.0933837890625, -0.0809173583984375, -0.068450927734375, -0.0559844970703125, -0.04351806640625, -0.0310516357421875, -0.018585205078125, -0.0061187744140625, 0.00634765625, 0.0188140869140625, 0.031280517578125, 0.0437469482421875, 0.05621337890625, 0.0686798095703125, 0.081146240234375, 0.0936126708984375, 0.1060791015625, 0.1185455322265625, 0.131011962890625, 0.1434783935546875, 0.15594482421875, 0.1684112548828125, 0.180877685546875, 0.1933441162109375, 0.205810546875, 0.2182769775390625, 0.230743408203125, 0.2432098388671875, 0.25567626953125, 0.2681427001953125, 0.280609130859375, 0.2930755615234375, 0.3055419921875, 0.3180084228515625, 0.330474853515625, 0.3429412841796875, 0.35540771484375, 0.3678741455078125, 0.380340576171875, 0.3928070068359375, 0.4052734375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 17.0, 32.0, 32.0, 19.0, 50.0, 41.0, 49.0, 57.0, 63.0, 61.0, 41.0, 55.0, 33.0, 43.0, 47.0, 27.0, 34.0, 34.0, 30.0, 18.0, 13.0, 19.0, 16.0, 10.0, 15.0, 13.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.5239067077636719, -1.4816919565200806, -1.4394772052764893, -1.397262454032898, -1.3550477027893066, -1.3128328323364258, -1.2706180810928345, -1.2284033298492432, -1.1861885786056519, -1.1439738273620605, -1.1017590761184692, -1.059544324874878, -1.017329454421997, -0.9751147627830505, -0.9328999519348145, -0.8906852006912231, -0.8484704494476318, -0.8062556982040405, -0.7640409469604492, -0.7218261361122131, -0.6796113848686218, -0.6373966336250305, -0.5951818227767944, -0.5529670715332031, -0.5107523202896118, -0.4685375690460205, -0.4263227880001068, -0.3841080069541931, -0.3418932557106018, -0.2996785044670105, -0.2574637234210968, -0.2152489423751831, -0.17303407192230225, -0.13081930577754974, -0.08860453963279724, -0.04638977348804474, -0.004175007343292236, 0.038039758801460266, 0.08025452494621277, 0.12246930599212646, 0.16468405723571777, 0.20689882338047028, 0.24911358952522278, 0.2913283705711365, 0.3335431218147278, 0.3757578730583191, 0.4179726541042328, 0.4601874351501465, 0.5024021863937378, 0.5446169376373291, 0.5868316888809204, 0.6290464997291565, 0.6712612509727478, 0.7134760022163391, 0.7556908130645752, 0.7979055643081665, 0.8401203155517578, 0.8823350667953491, 0.9245498180389404, 0.9667646288871765, 1.008979320526123, 1.051194190979004, 1.0934089422225952, 1.1356236934661865, 1.1778384447097778]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 22.0, 14.0, 18.0, 17.0, 24.0, 38.0, 25.0, 29.0, 32.0, 31.0, 44.0, 37.0, 43.0, 28.0, 41.0, 32.0, 44.0, 34.0, 46.0, 40.0, 34.0, 33.0, 35.0, 27.0, 32.0, 27.0, 20.0, 15.0, 16.0, 9.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8927128911018372, -0.8629211783409119, -0.8331294655799866, -0.8033376932144165, -0.7735459804534912, -0.7437542676925659, -0.7139625549316406, -0.6841708421707153, -0.65437912940979, -0.6245874166488647, -0.5947957038879395, -0.5650039911270142, -0.5352122187614441, -0.5054205060005188, -0.4756287932395935, -0.4458370804786682, -0.41604530811309814, -0.38625359535217285, -0.35646185278892517, -0.3266701400279999, -0.2968783974647522, -0.2670866847038269, -0.2372949719429016, -0.20750324428081512, -0.17771151661872864, -0.14791978895664215, -0.11812806874513626, -0.08833634853363037, -0.058544620871543884, -0.028752893209457397, 0.0010388195514678955, 0.030830547213554382, 0.060622334480285645, 0.09041406214237213, 0.12020578235387802, 0.1499975025653839, 0.1797892302274704, 0.20958095788955688, 0.23937267065048218, 0.26916438341140747, 0.29895612597465515, 0.32874783873558044, 0.3585395812988281, 0.3883312940597534, 0.4181230068206787, 0.4479147493839264, 0.4777064621448517, 0.5074982047080994, 0.5372899174690247, 0.56708163022995, 0.5968733429908752, 0.6266651153564453, 0.6564568281173706, 0.6862485408782959, 0.7160402536392212, 0.7458319664001465, 0.7756236791610718, 0.8054153919219971, 0.8352071046829224, 0.8649988174438477, 0.8947905898094177, 0.924582302570343, 0.9543740153312683, 0.9841657280921936, 1.0139575004577637]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 17.0, 36.0, 47.0, 64.0, 99.0, 135.0, 252.0, 363.0, 579.0, 888.0, 1426.0, 2285.0, 3651.0, 5875.0, 9740.0, 16518.0, 27680.0, 46405.0, 75989.0, 122123.0, 171544.0, 184211.0, 142336.0, 93330.0, 57356.0, 34168.0, 20107.0, 12079.0, 7463.0, 4430.0, 2690.0, 1632.0, 1083.0, 690.0, 426.0, 295.0, 154.0, 122.0, 75.0, 57.0, 37.0, 25.0, 16.0, 15.0, 5.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.287109375, -0.2779083251953125, -0.268707275390625, -0.2595062255859375, -0.25030517578125, -0.2411041259765625, -0.231903076171875, -0.2227020263671875, -0.2135009765625, -0.2042999267578125, -0.195098876953125, -0.1858978271484375, -0.17669677734375, -0.1674957275390625, -0.158294677734375, -0.1490936279296875, -0.139892578125, -0.1306915283203125, -0.121490478515625, -0.1122894287109375, -0.10308837890625, -0.0938873291015625, -0.084686279296875, -0.0754852294921875, -0.0662841796875, -0.0570831298828125, -0.047882080078125, -0.0386810302734375, -0.02947998046875, -0.0202789306640625, -0.011077880859375, -0.0018768310546875, 0.00732421875, 0.0165252685546875, 0.025726318359375, 0.0349273681640625, 0.04412841796875, 0.0533294677734375, 0.062530517578125, 0.0717315673828125, 0.0809326171875, 0.0901336669921875, 0.099334716796875, 0.1085357666015625, 0.11773681640625, 0.1269378662109375, 0.136138916015625, 0.1453399658203125, 0.154541015625, 0.1637420654296875, 0.172943115234375, 0.1821441650390625, 0.19134521484375, 0.2005462646484375, 0.209747314453125, 0.2189483642578125, 0.2281494140625, 0.2373504638671875, 0.246551513671875, 0.2557525634765625, 0.26495361328125, 0.2741546630859375, 0.283355712890625, 0.2925567626953125, 0.3017578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 5.0, 10.0, 8.0, 10.0, 15.0, 17.0, 18.0, 29.0, 31.0, 34.0, 31.0, 39.0, 38.0, 55.0, 50.0, 34.0, 43.0, 34.0, 47.0, 49.0, 50.0, 48.0, 47.0, 50.0, 32.0, 38.0, 18.0, 24.0, 28.0, 17.0, 9.0, 5.0, 10.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0746002197265625, -1.036895751953125, -0.9991912841796875, -0.96148681640625, -0.9237823486328125, -0.886077880859375, -0.8483734130859375, -0.8106689453125, -0.7729644775390625, -0.735260009765625, -0.6975555419921875, -0.65985107421875, -0.6221466064453125, -0.584442138671875, -0.5467376708984375, -0.509033203125, -0.4713287353515625, -0.433624267578125, -0.3959197998046875, -0.35821533203125, -0.3205108642578125, -0.282806396484375, -0.2451019287109375, -0.2073974609375, -0.1696929931640625, -0.131988525390625, -0.0942840576171875, -0.05657958984375, -0.0188751220703125, 0.018829345703125, 0.0565338134765625, 0.09423828125, 0.1319427490234375, 0.169647216796875, 0.2073516845703125, 0.24505615234375, 0.2827606201171875, 0.320465087890625, 0.3581695556640625, 0.3958740234375, 0.4335784912109375, 0.471282958984375, 0.5089874267578125, 0.54669189453125, 0.5843963623046875, 0.622100830078125, 0.6598052978515625, 0.697509765625, 0.7352142333984375, 0.772918701171875, 0.8106231689453125, 0.84832763671875, 0.8860321044921875, 0.923736572265625, 0.9614410400390625, 0.9991455078125, 1.0368499755859375, 1.074554443359375, 1.1122589111328125, 1.14996337890625, 1.1876678466796875, 1.225372314453125, 1.2630767822265625, 1.30078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 19.0, 26.0, 31.0, 48.0, 78.0, 92.0, 183.0, 287.0, 428.0, 713.0, 1215.0, 2119.0, 3675.0, 6701.0, 12524.0, 24172.0, 47481.0, 92232.0, 167658.0, 238107.0, 202878.0, 118327.0, 62149.0, 31329.0, 16273.0, 8631.0, 4754.0, 2584.0, 1481.0, 870.0, 511.0, 345.0, 192.0, 136.0, 91.0, 63.0, 40.0, 21.0, 21.0, 16.0, 8.0, 11.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.39501953125, -0.3829383850097656, -0.37085723876953125, -0.3587760925292969, -0.3466949462890625, -0.3346138000488281, -0.32253265380859375, -0.3104515075683594, -0.298370361328125, -0.2862892150878906, -0.27420806884765625, -0.2621269226074219, -0.2500457763671875, -0.23796463012695312, -0.22588348388671875, -0.21380233764648438, -0.20172119140625, -0.18964004516601562, -0.17755889892578125, -0.16547775268554688, -0.1533966064453125, -0.14131546020507812, -0.12923431396484375, -0.11715316772460938, -0.105072021484375, -0.09299087524414062, -0.08090972900390625, -0.06882858276367188, -0.0567474365234375, -0.044666290283203125, -0.03258514404296875, -0.020503997802734375, -0.0084228515625, 0.003658294677734375, 0.01573944091796875, 0.027820587158203125, 0.0399017333984375, 0.051982879638671875, 0.06406402587890625, 0.07614517211914062, 0.088226318359375, 0.10030746459960938, 0.11238861083984375, 0.12446975708007812, 0.1365509033203125, 0.14863204956054688, 0.16071319580078125, 0.17279434204101562, 0.18487548828125, 0.19695663452148438, 0.20903778076171875, 0.22111892700195312, 0.2332000732421875, 0.24528121948242188, 0.25736236572265625, 0.2694435119628906, 0.281524658203125, 0.2936058044433594, 0.30568695068359375, 0.3177680969238281, 0.3298492431640625, 0.3419303894042969, 0.35401153564453125, 0.3660926818847656, 0.378173828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 6.0, 4.0, 6.0, 1.0, 10.0, 11.0, 15.0, 17.0, 23.0, 20.0, 11.0, 32.0, 27.0, 31.0, 29.0, 39.0, 31.0, 37.0, 23.0, 50.0, 35.0, 32.0, 39.0, 45.0, 44.0, 27.0, 36.0, 28.0, 33.0, 29.0, 37.0, 25.0, 18.0, 22.0, 16.0, 13.0, 13.0, 10.0, 12.0, 11.0, 16.0, 5.0, 4.0, 9.0, 1.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.5888671875, -0.5704879760742188, -0.5521087646484375, -0.5337295532226562, -0.515350341796875, -0.49697113037109375, -0.4785919189453125, -0.46021270751953125, -0.44183349609375, -0.42345428466796875, -0.4050750732421875, -0.38669586181640625, -0.368316650390625, -0.34993743896484375, -0.3315582275390625, -0.31317901611328125, -0.2947998046875, -0.27642059326171875, -0.2580413818359375, -0.23966217041015625, -0.221282958984375, -0.20290374755859375, -0.1845245361328125, -0.16614532470703125, -0.14776611328125, -0.12938690185546875, -0.1110076904296875, -0.09262847900390625, -0.074249267578125, -0.05587005615234375, -0.0374908447265625, -0.01911163330078125, -0.000732421875, 0.01764678955078125, 0.0360260009765625, 0.05440521240234375, 0.072784423828125, 0.09116363525390625, 0.1095428466796875, 0.12792205810546875, 0.14630126953125, 0.16468048095703125, 0.1830596923828125, 0.20143890380859375, 0.219818115234375, 0.23819732666015625, 0.2565765380859375, 0.27495574951171875, 0.2933349609375, 0.31171417236328125, 0.3300933837890625, 0.34847259521484375, 0.366851806640625, 0.38523101806640625, 0.4036102294921875, 0.42198944091796875, 0.44036865234375, 0.45874786376953125, 0.4771270751953125, 0.49550628662109375, 0.513885498046875, 0.5322647094726562, 0.5506439208984375, 0.5690231323242188, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 16.0, 33.0, 24.0, 29.0, 84.0, 87.0, 135.0, 177.0, 268.0, 419.0, 613.0, 960.0, 1519.0, 2474.0, 4525.0, 8841.0, 21741.0, 72438.0, 375292.0, 430020.0, 83585.0, 23599.0, 9634.0, 4815.0, 2649.0, 1516.0, 1006.0, 651.0, 446.0, 278.0, 229.0, 142.0, 88.0, 57.0, 41.0, 30.0, 24.0, 14.0, 11.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2736091613769531, -0.26450347900390625, -0.2553977966308594, -0.2462921142578125, -0.23718643188476562, -0.22808074951171875, -0.21897506713867188, -0.209869384765625, -0.20076370239257812, -0.19165802001953125, -0.18255233764648438, -0.1734466552734375, -0.16434097290039062, -0.15523529052734375, -0.14612960815429688, -0.13702392578125, -0.12791824340820312, -0.11881256103515625, -0.10970687866210938, -0.1006011962890625, -0.09149551391601562, -0.08238983154296875, -0.07328414916992188, -0.064178466796875, -0.055072784423828125, -0.04596710205078125, -0.036861419677734375, -0.0277557373046875, -0.018650054931640625, -0.00954437255859375, -0.000438690185546875, 0.0086669921875, 0.017772674560546875, 0.02687835693359375, 0.035984039306640625, 0.0450897216796875, 0.054195404052734375, 0.06330108642578125, 0.07240676879882812, 0.081512451171875, 0.09061813354492188, 0.09972381591796875, 0.10882949829101562, 0.1179351806640625, 0.12704086303710938, 0.13614654541015625, 0.14525222778320312, 0.15435791015625, 0.16346359252929688, 0.17256927490234375, 0.18167495727539062, 0.1907806396484375, 0.19988632202148438, 0.20899200439453125, 0.21809768676757812, 0.227203369140625, 0.23630905151367188, 0.24541473388671875, 0.2545204162597656, 0.2636260986328125, 0.2727317810058594, 0.28183746337890625, 0.2909431457519531, 0.300048828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 16.0, 29.0, 65.0, 64.0, 88.0, 110.0, 125.0, 124.0, 115.0, 89.0, 52.0, 29.0, 26.0, 15.0, 10.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1655112504959106e-05, -2.0839273929595947e-05, -2.0023435354232788e-05, -1.920759677886963e-05, -1.839175820350647e-05, -1.757591962814331e-05, -1.676008105278015e-05, -1.5944242477416992e-05, -1.5128403902053833e-05, -1.4312565326690674e-05, -1.3496726751327515e-05, -1.2680888175964355e-05, -1.1865049600601196e-05, -1.1049211025238037e-05, -1.0233372449874878e-05, -9.417533874511719e-06, -8.60169529914856e-06, -7.7858567237854e-06, -6.970018148422241e-06, -6.154179573059082e-06, -5.338340997695923e-06, -4.522502422332764e-06, -3.7066638469696045e-06, -2.8908252716064453e-06, -2.074986696243286e-06, -1.259148120880127e-06, -4.4330954551696777e-07, 3.725290298461914e-07, 1.1883676052093506e-06, 2.0042061805725098e-06, 2.820044755935669e-06, 3.635883331298828e-06, 4.451721906661987e-06, 5.2675604820251465e-06, 6.083399057388306e-06, 6.899237632751465e-06, 7.715076208114624e-06, 8.530914783477783e-06, 9.346753358840942e-06, 1.0162591934204102e-05, 1.097843050956726e-05, 1.179426908493042e-05, 1.2610107660293579e-05, 1.3425946235656738e-05, 1.4241784811019897e-05, 1.5057623386383057e-05, 1.5873461961746216e-05, 1.6689300537109375e-05, 1.7505139112472534e-05, 1.8320977687835693e-05, 1.9136816263198853e-05, 1.9952654838562012e-05, 2.076849341392517e-05, 2.158433198928833e-05, 2.240017056465149e-05, 2.321600914001465e-05, 2.4031847715377808e-05, 2.4847686290740967e-05, 2.5663524866104126e-05, 2.6479363441467285e-05, 2.7295202016830444e-05, 2.8111040592193604e-05, 2.8926879167556763e-05, 2.9742717742919922e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 6.0, 16.0, 15.0, 9.0, 28.0, 42.0, 49.0, 69.0, 102.0, 174.0, 244.0, 368.0, 621.0, 935.0, 1592.0, 2658.0, 4724.0, 9444.0, 22645.0, 73713.0, 302116.0, 442906.0, 124475.0, 34270.0, 12918.0, 6156.0, 3245.0, 1832.0, 1072.0, 689.0, 449.0, 282.0, 209.0, 130.0, 93.0, 61.0, 50.0, 28.0, 25.0, 14.0, 15.0, 13.0, 11.0, 6.0, 3.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3310546875, -0.320770263671875, -0.31048583984375, -0.300201416015625, -0.2899169921875, -0.279632568359375, -0.26934814453125, -0.259063720703125, -0.248779296875, -0.238494873046875, -0.22821044921875, -0.217926025390625, -0.2076416015625, -0.197357177734375, -0.18707275390625, -0.176788330078125, -0.16650390625, -0.156219482421875, -0.14593505859375, -0.135650634765625, -0.1253662109375, -0.115081787109375, -0.10479736328125, -0.094512939453125, -0.084228515625, -0.073944091796875, -0.06365966796875, -0.053375244140625, -0.0430908203125, -0.032806396484375, -0.02252197265625, -0.012237548828125, -0.001953125, 0.008331298828125, 0.01861572265625, 0.028900146484375, 0.0391845703125, 0.049468994140625, 0.05975341796875, 0.070037841796875, 0.080322265625, 0.090606689453125, 0.10089111328125, 0.111175537109375, 0.1214599609375, 0.131744384765625, 0.14202880859375, 0.152313232421875, 0.16259765625, 0.172882080078125, 0.18316650390625, 0.193450927734375, 0.2037353515625, 0.214019775390625, 0.22430419921875, 0.234588623046875, 0.244873046875, 0.255157470703125, 0.26544189453125, 0.275726318359375, 0.2860107421875, 0.296295166015625, 0.30657958984375, 0.316864013671875, 0.3271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 3.0, 10.0, 4.0, 3.0, 7.0, 12.0, 10.0, 13.0, 18.0, 17.0, 21.0, 31.0, 44.0, 54.0, 74.0, 100.0, 93.0, 76.0, 80.0, 62.0, 42.0, 45.0, 26.0, 27.0, 19.0, 18.0, 14.0, 11.0, 7.0, 7.0, 7.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048370361328125, -0.04680013656616211, -0.04522991180419922, -0.04365968704223633, -0.04208946228027344, -0.04051923751831055, -0.038949012756347656, -0.037378787994384766, -0.035808563232421875, -0.034238338470458984, -0.032668113708496094, -0.031097888946533203, -0.029527664184570312, -0.027957439422607422, -0.02638721466064453, -0.02481698989868164, -0.02324676513671875, -0.02167654037475586, -0.02010631561279297, -0.018536090850830078, -0.016965866088867188, -0.015395641326904297, -0.013825416564941406, -0.012255191802978516, -0.010684967041015625, -0.009114742279052734, -0.007544517517089844, -0.005974292755126953, -0.0044040679931640625, -0.002833843231201172, -0.0012636184692382812, 0.0003066062927246094, 0.0018768310546875, 0.0034470558166503906, 0.005017280578613281, 0.006587505340576172, 0.008157730102539062, 0.009727954864501953, 0.011298179626464844, 0.012868404388427734, 0.014438629150390625, 0.016008853912353516, 0.017579078674316406, 0.019149303436279297, 0.020719528198242188, 0.022289752960205078, 0.02385997772216797, 0.02543020248413086, 0.02700042724609375, 0.02857065200805664, 0.03014087677001953, 0.03171110153198242, 0.03328132629394531, 0.0348515510559082, 0.036421775817871094, 0.037992000579833984, 0.039562225341796875, 0.041132450103759766, 0.042702674865722656, 0.04427289962768555, 0.04584312438964844, 0.04741334915161133, 0.04898357391357422, 0.05055379867553711, 0.0521240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 13.0, 19.0, 19.0, 17.0, 22.0, 21.0, 40.0, 24.0, 44.0, 43.0, 57.0, 52.0, 66.0, 56.0, 51.0, 45.0, 36.0, 50.0, 37.0, 30.0, 37.0, 36.0, 26.0, 18.0, 17.0, 13.0, 15.0, 14.0, 16.0, 6.0, 11.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.584175705909729, -1.5413509607315063, -1.4985262155532837, -1.455701470375061, -1.412876844406128, -1.3700520992279053, -1.3272273540496826, -1.28440260887146, -1.2415778636932373, -1.1987531185150146, -1.155928373336792, -1.1131036281585693, -1.0702788829803467, -1.0274542570114136, -0.9846295118331909, -0.9418047666549683, -0.8989800214767456, -0.856155276298523, -0.8133305311203003, -0.7705058455467224, -0.7276811003684998, -0.6848563551902771, -0.6420316696166992, -0.5992069244384766, -0.5563821792602539, -0.5135574340820312, -0.470732718706131, -0.4279080033302307, -0.38508325815200806, -0.3422585129737854, -0.29943379759788513, -0.25660908222198486, -0.21378445625305176, -0.1709597259759903, -0.12813499569892883, -0.08531026542186737, -0.04248553514480591, 0.0003391951322555542, 0.04316392540931702, 0.08598864078521729, 0.12881338596343994, 0.1716381162405014, 0.21446284651756287, 0.25728756189346313, 0.3001123070716858, 0.34293705224990845, 0.3857617676258087, 0.428586483001709, 0.47141122817993164, 0.5142359733581543, 0.557060718536377, 0.5998854041099548, 0.6427101492881775, 0.6855348944664001, 0.728359580039978, 0.7711843252182007, 0.8140090703964233, 0.856833815574646, 0.8996585607528687, 0.9424832463264465, 0.9853079915046692, 1.028132677078247, 1.0709574222564697, 1.1137821674346924, 1.156606912612915]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 18.0, 15.0, 15.0, 19.0, 20.0, 16.0, 30.0, 32.0, 25.0, 26.0, 39.0, 32.0, 42.0, 36.0, 43.0, 35.0, 38.0, 31.0, 44.0, 46.0, 34.0, 38.0, 38.0, 29.0, 32.0, 35.0, 30.0, 25.0, 16.0, 14.0, 14.0, 11.0, 18.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8862427473068237, -0.8564247488975525, -0.8266066908836365, -0.7967886924743652, -0.766970694065094, -0.7371526956558228, -0.7073346376419067, -0.6775166392326355, -0.6476986408233643, -0.617880642414093, -0.588062584400177, -0.5582445859909058, -0.5284265875816345, -0.4986085593700409, -0.46879053115844727, -0.438972532749176, -0.40915447473526, -0.3793364465236664, -0.34951844811439514, -0.3197004199028015, -0.2898824214935303, -0.26006439328193665, -0.23024636507034302, -0.20042835175991058, -0.17061033844947815, -0.14079232513904572, -0.11097430437803268, -0.08115628361701965, -0.05133827030658722, -0.021520256996154785, 0.008297771215438843, 0.03811578452587128, 0.06793379783630371, 0.09775181114673615, 0.12756982445716858, 0.1573878526687622, 0.18720586597919464, 0.21702387928962708, 0.2468419075012207, 0.27665990591049194, 0.30647793412208557, 0.3362959623336792, 0.36611396074295044, 0.39593198895454407, 0.4257500171661377, 0.45556801557540894, 0.48538604378700256, 0.5152040719985962, 0.5450220704078674, 0.5748400688171387, 0.6046581268310547, 0.6344761252403259, 0.6642941236495972, 0.6941121816635132, 0.7239301800727844, 0.7537481784820557, 0.7835662364959717, 0.8133842349052429, 0.8432022929191589, 0.8730202913284302, 0.9028382897377014, 0.9326562881469727, 0.9624743461608887, 0.9922923445701599, 1.0221103429794312]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 13.0, 18.0, 34.0, 43.0, 58.0, 99.0, 186.0, 260.0, 451.0, 641.0, 1063.0, 1744.0, 2757.0, 4522.0, 7418.0, 11858.0, 18801.0, 29105.0, 43605.0, 62628.0, 84486.0, 104622.0, 119193.0, 122436.0, 113746.0, 95058.0, 73044.0, 52177.0, 35877.0, 23411.0, 14931.0, 9292.0, 5736.0, 3542.0, 2141.0, 1317.0, 812.0, 582.0, 305.0, 192.0, 133.0, 86.0, 49.0, 22.0, 24.0, 21.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.984375, -0.9538497924804688, -0.9233245849609375, -0.8927993774414062, -0.862274169921875, -0.8317489624023438, -0.8012237548828125, -0.7706985473632812, -0.74017333984375, -0.7096481323242188, -0.6791229248046875, -0.6485977172851562, -0.618072509765625, -0.5875473022460938, -0.5570220947265625, -0.5264968872070312, -0.4959716796875, -0.46544647216796875, -0.4349212646484375, -0.40439605712890625, -0.373870849609375, -0.34334564208984375, -0.3128204345703125, -0.28229522705078125, -0.25177001953125, -0.22124481201171875, -0.1907196044921875, -0.16019439697265625, -0.129669189453125, -0.09914398193359375, -0.0686187744140625, -0.03809356689453125, -0.007568359375, 0.02295684814453125, 0.0534820556640625, 0.08400726318359375, 0.114532470703125, 0.14505767822265625, 0.1755828857421875, 0.20610809326171875, 0.23663330078125, 0.26715850830078125, 0.2976837158203125, 0.32820892333984375, 0.358734130859375, 0.38925933837890625, 0.4197845458984375, 0.45030975341796875, 0.4808349609375, 0.5113601684570312, 0.5418853759765625, 0.5724105834960938, 0.602935791015625, 0.6334609985351562, 0.6639862060546875, 0.6945114135742188, 0.72503662109375, 0.7555618286132812, 0.7860870361328125, 0.8166122436523438, 0.847137451171875, 0.8776626586914062, 0.9081878662109375, 0.9387130737304688, 0.96923828125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 11.0, 10.0, 16.0, 15.0, 24.0, 25.0, 24.0, 18.0, 29.0, 29.0, 33.0, 36.0, 35.0, 46.0, 43.0, 40.0, 48.0, 40.0, 42.0, 32.0, 59.0, 37.0, 30.0, 39.0, 28.0, 30.0, 31.0, 22.0, 22.0, 20.0, 8.0, 21.0, 12.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0275115966796875, -0.993499755859375, -0.9594879150390625, -0.92547607421875, -0.8914642333984375, -0.857452392578125, -0.8234405517578125, -0.7894287109375, -0.7554168701171875, -0.721405029296875, -0.6873931884765625, -0.65338134765625, -0.6193695068359375, -0.585357666015625, -0.5513458251953125, -0.517333984375, -0.4833221435546875, -0.449310302734375, -0.4152984619140625, -0.38128662109375, -0.3472747802734375, -0.313262939453125, -0.2792510986328125, -0.2452392578125, -0.2112274169921875, -0.177215576171875, -0.1432037353515625, -0.10919189453125, -0.0751800537109375, -0.041168212890625, -0.0071563720703125, 0.02685546875, 0.0608673095703125, 0.094879150390625, 0.1288909912109375, 0.16290283203125, 0.1969146728515625, 0.230926513671875, 0.2649383544921875, 0.2989501953125, 0.3329620361328125, 0.366973876953125, 0.4009857177734375, 0.43499755859375, 0.4690093994140625, 0.503021240234375, 0.5370330810546875, 0.571044921875, 0.6050567626953125, 0.639068603515625, 0.6730804443359375, 0.70709228515625, 0.7411041259765625, 0.775115966796875, 0.8091278076171875, 0.8431396484375, 0.8771514892578125, 0.911163330078125, 0.9451751708984375, 0.97918701171875, 1.0131988525390625, 1.047210693359375, 1.0812225341796875, 1.115234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 25.0, 32.0, 48.0, 76.0, 93.0, 169.0, 258.0, 371.0, 583.0, 909.0, 1389.0, 2217.0, 3487.0, 5229.0, 7921.0, 11858.0, 17735.0, 25076.0, 35306.0, 48511.0, 62575.0, 77501.0, 91774.0, 99311.0, 101884.0, 97625.0, 86166.0, 72361.0, 57289.0, 42784.0, 31079.0, 22028.0, 15110.0, 10146.0, 6871.0, 4430.0, 2935.0, 1878.0, 1200.0, 805.0, 515.0, 330.0, 209.0, 163.0, 97.0, 74.0, 39.0, 26.0, 16.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.83984375, -0.8138504028320312, -0.7878570556640625, -0.7618637084960938, -0.735870361328125, -0.7098770141601562, -0.6838836669921875, -0.6578903198242188, -0.63189697265625, -0.6059036254882812, -0.5799102783203125, -0.5539169311523438, -0.527923583984375, -0.5019302368164062, -0.4759368896484375, -0.44994354248046875, -0.4239501953125, -0.39795684814453125, -0.3719635009765625, -0.34597015380859375, -0.319976806640625, -0.29398345947265625, -0.2679901123046875, -0.24199676513671875, -0.21600341796875, -0.19001007080078125, -0.1640167236328125, -0.13802337646484375, -0.112030029296875, -0.08603668212890625, -0.0600433349609375, -0.03404998779296875, -0.008056640625, 0.01793670654296875, 0.0439300537109375, 0.06992340087890625, 0.095916748046875, 0.12191009521484375, 0.1479034423828125, 0.17389678955078125, 0.19989013671875, 0.22588348388671875, 0.2518768310546875, 0.27787017822265625, 0.303863525390625, 0.32985687255859375, 0.3558502197265625, 0.38184356689453125, 0.4078369140625, 0.43383026123046875, 0.4598236083984375, 0.48581695556640625, 0.511810302734375, 0.5378036499023438, 0.5637969970703125, 0.5897903442382812, 0.61578369140625, 0.6417770385742188, 0.6677703857421875, 0.6937637329101562, 0.719757080078125, 0.7457504272460938, 0.7717437744140625, 0.7977371215820312, 0.82373046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 8.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 17.0, 8.0, 18.0, 20.0, 24.0, 21.0, 18.0, 28.0, 24.0, 37.0, 41.0, 42.0, 35.0, 34.0, 35.0, 39.0, 45.0, 25.0, 37.0, 31.0, 17.0, 29.0, 31.0, 35.0, 16.0, 30.0, 22.0, 25.0, 18.0, 18.0, 11.0, 8.0, 11.0, 13.0, 5.0, 10.0, 12.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.50830078125, -0.49228668212890625, -0.4762725830078125, -0.46025848388671875, -0.444244384765625, -0.42823028564453125, -0.4122161865234375, -0.39620208740234375, -0.38018798828125, -0.36417388916015625, -0.3481597900390625, -0.33214569091796875, -0.316131591796875, -0.30011749267578125, -0.2841033935546875, -0.26808929443359375, -0.2520751953125, -0.23606109619140625, -0.2200469970703125, -0.20403289794921875, -0.188018798828125, -0.17200469970703125, -0.1559906005859375, -0.13997650146484375, -0.12396240234375, -0.10794830322265625, -0.0919342041015625, -0.07592010498046875, -0.059906005859375, -0.04389190673828125, -0.0278778076171875, -0.01186370849609375, 0.004150390625, 0.02016448974609375, 0.0361785888671875, 0.05219268798828125, 0.068206787109375, 0.08422088623046875, 0.1002349853515625, 0.11624908447265625, 0.13226318359375, 0.14827728271484375, 0.1642913818359375, 0.18030548095703125, 0.196319580078125, 0.21233367919921875, 0.2283477783203125, 0.24436187744140625, 0.2603759765625, 0.27639007568359375, 0.2924041748046875, 0.30841827392578125, 0.324432373046875, 0.34044647216796875, 0.3564605712890625, 0.37247467041015625, 0.38848876953125, 0.40450286865234375, 0.4205169677734375, 0.43653106689453125, 0.452545166015625, 0.46855926513671875, 0.4845733642578125, 0.5005874633789062, 0.5166015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 17.0, 7.0, 26.0, 25.0, 39.0, 47.0, 53.0, 87.0, 127.0, 155.0, 224.0, 259.0, 396.0, 487.0, 733.0, 993.0, 1545.0, 2065.0, 3362.0, 5792.0, 14319.0, 62424.0, 326381.0, 465670.0, 120042.0, 23139.0, 7778.0, 3985.0, 2439.0, 1718.0, 1154.0, 826.0, 591.0, 425.0, 306.0, 235.0, 167.0, 123.0, 91.0, 74.0, 55.0, 41.0, 30.0, 23.0, 21.0, 16.0, 14.0, 7.0, 3.0, 5.0, 3.0], "bins": [-2.533203125, -2.46319580078125, -2.3931884765625, -2.32318115234375, -2.253173828125, -2.18316650390625, -2.1131591796875, -2.04315185546875, -1.97314453125, -1.90313720703125, -1.8331298828125, -1.76312255859375, -1.693115234375, -1.62310791015625, -1.5531005859375, -1.48309326171875, -1.4130859375, -1.34307861328125, -1.2730712890625, -1.20306396484375, -1.133056640625, -1.06304931640625, -0.9930419921875, -0.92303466796875, -0.85302734375, -0.78302001953125, -0.7130126953125, -0.64300537109375, -0.572998046875, -0.50299072265625, -0.4329833984375, -0.36297607421875, -0.29296875, -0.22296142578125, -0.1529541015625, -0.08294677734375, -0.012939453125, 0.05706787109375, 0.1270751953125, 0.19708251953125, 0.26708984375, 0.33709716796875, 0.4071044921875, 0.47711181640625, 0.547119140625, 0.61712646484375, 0.6871337890625, 0.75714111328125, 0.8271484375, 0.89715576171875, 0.9671630859375, 1.03717041015625, 1.107177734375, 1.17718505859375, 1.2471923828125, 1.31719970703125, 1.38720703125, 1.45721435546875, 1.5272216796875, 1.59722900390625, 1.667236328125, 1.73724365234375, 1.8072509765625, 1.87725830078125, 1.947265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 15.0, 28.0, 52.0, 81.0, 166.0, 194.0, 164.0, 116.0, 82.0, 34.0, 20.0, 11.0, 7.0, 6.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021147727966308594, -0.0002046283334493637, -0.00019777938723564148, -0.00019093044102191925, -0.00018408149480819702, -0.0001772325485944748, -0.00017038360238075256, -0.00016353465616703033, -0.0001566857099533081, -0.00014983676373958588, -0.00014298781752586365, -0.00013613887131214142, -0.0001292899250984192, -0.00012244097888469696, -0.00011559203267097473, -0.0001087430864572525, -0.00010189414024353027, -9.504519402980804e-05, -8.819624781608582e-05, -8.134730160236359e-05, -7.449835538864136e-05, -6.764940917491913e-05, -6.08004629611969e-05, -5.395151674747467e-05, -4.710257053375244e-05, -4.025362432003021e-05, -3.3404678106307983e-05, -2.6555731892585754e-05, -1.9706785678863525e-05, -1.2857839465141296e-05, -6.008893251419067e-06, 8.400529623031616e-07, 7.68899917602539e-06, 1.453794538974762e-05, 2.138689160346985e-05, 2.8235837817192078e-05, 3.508478403091431e-05, 4.1933730244636536e-05, 4.8782676458358765e-05, 5.5631622672080994e-05, 6.248056888580322e-05, 6.932951509952545e-05, 7.617846131324768e-05, 8.302740752696991e-05, 8.987635374069214e-05, 9.672529995441437e-05, 0.0001035742461681366, 0.00011042319238185883, 0.00011727213859558105, 0.00012412108480930328, 0.0001309700310230255, 0.00013781897723674774, 0.00014466792345046997, 0.0001515168696641922, 0.00015836581587791443, 0.00016521476209163666, 0.0001720637083053589, 0.00017891265451908112, 0.00018576160073280334, 0.00019261054694652557, 0.0001994594931602478, 0.00020630843937397003, 0.00021315738558769226, 0.0002200063318014145, 0.00022685527801513672]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 9.0, 8.0, 8.0, 20.0, 22.0, 34.0, 45.0, 82.0, 109.0, 167.0, 227.0, 401.0, 532.0, 804.0, 1270.0, 2045.0, 3555.0, 8269.0, 31062.0, 166683.0, 480473.0, 274360.0, 54881.0, 12088.0, 4607.0, 2537.0, 1476.0, 958.0, 593.0, 424.0, 236.0, 181.0, 107.0, 79.0, 47.0, 43.0, 32.0, 26.0, 19.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.306640625, -2.241973876953125, -2.17730712890625, -2.112640380859375, -2.0479736328125, -1.983306884765625, -1.91864013671875, -1.853973388671875, -1.789306640625, -1.724639892578125, -1.65997314453125, -1.595306396484375, -1.5306396484375, -1.465972900390625, -1.40130615234375, -1.336639404296875, -1.27197265625, -1.207305908203125, -1.14263916015625, -1.077972412109375, -1.0133056640625, -0.948638916015625, -0.88397216796875, -0.819305419921875, -0.754638671875, -0.689971923828125, -0.62530517578125, -0.560638427734375, -0.4959716796875, -0.431304931640625, -0.36663818359375, -0.301971435546875, -0.2373046875, -0.172637939453125, -0.10797119140625, -0.043304443359375, 0.0213623046875, 0.086029052734375, 0.15069580078125, 0.215362548828125, 0.280029296875, 0.344696044921875, 0.40936279296875, 0.474029541015625, 0.5386962890625, 0.603363037109375, 0.66802978515625, 0.732696533203125, 0.79736328125, 0.862030029296875, 0.92669677734375, 0.991363525390625, 1.0560302734375, 1.120697021484375, 1.18536376953125, 1.250030517578125, 1.314697265625, 1.379364013671875, 1.44403076171875, 1.508697509765625, 1.5733642578125, 1.638031005859375, 1.70269775390625, 1.767364501953125, 1.83203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 10.0, 7.0, 12.0, 16.0, 17.0, 26.0, 34.0, 42.0, 59.0, 56.0, 73.0, 74.0, 65.0, 84.0, 84.0, 82.0, 69.0, 46.0, 39.0, 21.0, 25.0, 14.0, 11.0, 9.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212646484375, -0.20475387573242188, -0.19686126708984375, -0.18896865844726562, -0.1810760498046875, -0.17318344116210938, -0.16529083251953125, -0.15739822387695312, -0.149505615234375, -0.14161300659179688, -0.13372039794921875, -0.12582778930664062, -0.1179351806640625, -0.11004257202148438, -0.10214996337890625, -0.09425735473632812, -0.08636474609375, -0.07847213745117188, -0.07057952880859375, -0.06268692016601562, -0.0547943115234375, -0.046901702880859375, -0.03900909423828125, -0.031116485595703125, -0.023223876953125, -0.015331268310546875, -0.00743865966796875, 0.000453948974609375, 0.0083465576171875, 0.016239166259765625, 0.02413177490234375, 0.032024383544921875, 0.0399169921875, 0.047809600830078125, 0.05570220947265625, 0.06359481811523438, 0.0714874267578125, 0.07938003540039062, 0.08727264404296875, 0.09516525268554688, 0.103057861328125, 0.11095046997070312, 0.11884307861328125, 0.12673568725585938, 0.1346282958984375, 0.14252090454101562, 0.15041351318359375, 0.15830612182617188, 0.16619873046875, 0.17409133911132812, 0.18198394775390625, 0.18987655639648438, 0.1977691650390625, 0.20566177368164062, 0.21355438232421875, 0.22144699096679688, 0.229339599609375, 0.23723220825195312, 0.24512481689453125, 0.2530174255371094, 0.2609100341796875, 0.2688026428222656, 0.27669525146484375, 0.2845878601074219, 0.29248046875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 29.0, 28.0, 28.0, 33.0, 39.0, 41.0, 51.0, 48.0, 54.0, 55.0, 65.0, 56.0, 51.0, 36.0, 51.0, 37.0, 39.0, 32.0, 22.0, 26.0, 21.0, 23.0, 17.0, 10.0, 8.0, 3.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.5890384912490845, -1.5426957607269287, -1.496353030204773, -1.4500102996826172, -1.4036675691604614, -1.3573248386383057, -1.3109819889068604, -1.2646393775939941, -1.2182965278625488, -1.171953797340393, -1.1256110668182373, -1.0792683362960815, -1.0329256057739258, -0.98658287525177, -0.9402400851249695, -0.8938973546028137, -0.8475546836853027, -0.801211953163147, -0.7548692226409912, -0.7085264921188354, -0.6621837615966797, -0.6158410310745239, -0.5694982409477234, -0.5231555104255676, -0.47681277990341187, -0.4304700493812561, -0.38412731885910034, -0.3377845585346222, -0.29144182801246643, -0.24509909749031067, -0.19875633716583252, -0.15241360664367676, -0.10607099533081055, -0.05972825735807419, -0.01338551938533783, 0.032957226037979126, 0.07929995656013489, 0.12564268708229065, 0.1719854474067688, 0.21832817792892456, 0.2646709084510803, 0.3110136389732361, 0.35735636949539185, 0.40369912981987, 0.45004186034202576, 0.4963845908641815, 0.5427273511886597, 0.5890700817108154, 0.6354128122329712, 0.681755542755127, 0.7280982732772827, 0.7744410037994385, 0.8207837343215942, 0.86712646484375, 0.9134692549705505, 0.9598119854927063, 1.0061547756195068, 1.0524975061416626, 1.0988402366638184, 1.1451829671859741, 1.1915256977081299, 1.2378684282302856, 1.2842111587524414, 1.3305540084838867, 1.376896619796753]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 8.0, 20.0, 21.0, 15.0, 34.0, 37.0, 23.0, 34.0, 48.0, 26.0, 46.0, 38.0, 27.0, 58.0, 38.0, 42.0, 47.0, 46.0, 47.0, 28.0, 34.0, 40.0, 38.0, 18.0, 27.0, 20.0, 19.0, 15.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.153900146484375, -1.1200770139694214, -1.0862538814544678, -1.0524308681488037, -1.01860773563385, -0.9847846031188965, -0.9509614706039429, -0.9171383380889893, -0.8833152651786804, -0.8494921326637268, -0.815669059753418, -0.7818459272384644, -0.7480227947235107, -0.7141997218132019, -0.6803765892982483, -0.6465535163879395, -0.6127303838729858, -0.5789072513580322, -0.5450841784477234, -0.5112610459327698, -0.47743794322013855, -0.4436148405075073, -0.4097917079925537, -0.3759686052799225, -0.34214550256729126, -0.30832239985466003, -0.2744992971420288, -0.2406761646270752, -0.20685306191444397, -0.17302995920181274, -0.13920684158802032, -0.1053837239742279, -0.07156062126159668, -0.03773751109838486, -0.003914400935173035, 0.029908709228038788, 0.06373181939125061, 0.09755492210388184, 0.13137803971767426, 0.16520115733146667, 0.1990242600440979, 0.23284736275672913, 0.26667046546936035, 0.30049359798431396, 0.3343167006969452, 0.3681398034095764, 0.40196293592453003, 0.43578603863716125, 0.4696091413497925, 0.5034322738647461, 0.5372553467750549, 0.5710784792900085, 0.6049015522003174, 0.638724684715271, 0.6725478172302246, 0.7063709497451782, 0.7401940226554871, 0.7740171551704407, 0.8078402280807495, 0.8416633605957031, 0.8754864931106567, 0.9093095660209656, 0.9431326985359192, 0.976955771446228, 1.0107789039611816]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 6.0, 12.0, 18.0, 34.0, 53.0, 88.0, 133.0, 229.0, 338.0, 530.0, 858.0, 1469.0, 2435.0, 4044.0, 6904.0, 11900.0, 20216.0, 35296.0, 61153.0, 104817.0, 176564.0, 285254.0, 423747.0, 563860.0, 633579.0, 591438.0, 462193.0, 318973.0, 200328.0, 120198.0, 69911.0, 40563.0, 23435.0, 13945.0, 7871.0, 4776.0, 2818.0, 1682.0, 1052.0, 608.0, 375.0, 231.0, 136.0, 88.0, 45.0, 27.0, 16.0, 14.0, 10.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.265625, -1.2279815673828125, -1.190338134765625, -1.1526947021484375, -1.11505126953125, -1.0774078369140625, -1.039764404296875, -1.0021209716796875, -0.9644775390625, -0.9268341064453125, -0.889190673828125, -0.8515472412109375, -0.81390380859375, -0.7762603759765625, -0.738616943359375, -0.7009735107421875, -0.663330078125, -0.6256866455078125, -0.588043212890625, -0.5503997802734375, -0.51275634765625, -0.4751129150390625, -0.437469482421875, -0.3998260498046875, -0.3621826171875, -0.3245391845703125, -0.286895751953125, -0.2492523193359375, -0.21160888671875, -0.1739654541015625, -0.136322021484375, -0.0986785888671875, -0.06103515625, -0.0233917236328125, 0.014251708984375, 0.0518951416015625, 0.08953857421875, 0.1271820068359375, 0.164825439453125, 0.2024688720703125, 0.2401123046875, 0.2777557373046875, 0.315399169921875, 0.3530426025390625, 0.39068603515625, 0.4283294677734375, 0.465972900390625, 0.5036163330078125, 0.541259765625, 0.5789031982421875, 0.616546630859375, 0.6541900634765625, 0.69183349609375, 0.7294769287109375, 0.767120361328125, 0.8047637939453125, 0.8424072265625, 0.8800506591796875, 0.917694091796875, 0.9553375244140625, 0.99298095703125, 1.0306243896484375, 1.068267822265625, 1.1059112548828125, 1.1435546875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 10.0, 15.0, 21.0, 19.0, 30.0, 28.0, 25.0, 26.0, 30.0, 28.0, 37.0, 45.0, 45.0, 44.0, 43.0, 47.0, 57.0, 51.0, 58.0, 36.0, 33.0, 30.0, 30.0, 23.0, 32.0, 25.0, 26.0, 13.0, 6.0, 17.0, 14.0, 8.0, 10.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9123153686523438, -0.8842010498046875, -0.8560867309570312, -0.827972412109375, -0.7998580932617188, -0.7717437744140625, -0.7436294555664062, -0.71551513671875, -0.6874008178710938, -0.6592864990234375, -0.6311721801757812, -0.603057861328125, -0.5749435424804688, -0.5468292236328125, -0.5187149047851562, -0.4906005859375, -0.46248626708984375, -0.4343719482421875, -0.40625762939453125, -0.378143310546875, -0.35002899169921875, -0.3219146728515625, -0.29380035400390625, -0.26568603515625, -0.23757171630859375, -0.2094573974609375, -0.18134307861328125, -0.153228759765625, -0.12511444091796875, -0.0970001220703125, -0.06888580322265625, -0.040771484375, -0.01265716552734375, 0.0154571533203125, 0.04357147216796875, 0.071685791015625, 0.09980010986328125, 0.1279144287109375, 0.15602874755859375, 0.18414306640625, 0.21225738525390625, 0.2403717041015625, 0.26848602294921875, 0.296600341796875, 0.32471466064453125, 0.3528289794921875, 0.38094329833984375, 0.4090576171875, 0.43717193603515625, 0.4652862548828125, 0.49340057373046875, 0.521514892578125, 0.5496292114257812, 0.5777435302734375, 0.6058578491210938, 0.63397216796875, 0.6620864868164062, 0.6902008056640625, 0.7183151245117188, 0.746429443359375, 0.7745437622070312, 0.8026580810546875, 0.8307723999023438, 0.85888671875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 21.0, 27.0, 57.0, 73.0, 166.0, 238.0, 393.0, 785.0, 1107.0, 2026.0, 3309.0, 5889.0, 10196.0, 17635.0, 30827.0, 53391.0, 91300.0, 149651.0, 236105.0, 349679.0, 470769.0, 561428.0, 579443.0, 510425.0, 397337.0, 277121.0, 179294.0, 110597.0, 64992.0, 38232.0, 22053.0, 12648.0, 7146.0, 4113.0, 2403.0, 1389.0, 786.0, 492.0, 306.0, 164.0, 119.0, 69.0, 31.0, 21.0, 10.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1825103759765625, -1.143341064453125, -1.1041717529296875, -1.06500244140625, -1.0258331298828125, -0.986663818359375, -0.9474945068359375, -0.9083251953125, -0.8691558837890625, -0.829986572265625, -0.7908172607421875, -0.75164794921875, -0.7124786376953125, -0.673309326171875, -0.6341400146484375, -0.594970703125, -0.5558013916015625, -0.516632080078125, -0.4774627685546875, -0.43829345703125, -0.3991241455078125, -0.359954833984375, -0.3207855224609375, -0.2816162109375, -0.2424468994140625, -0.203277587890625, -0.1641082763671875, -0.12493896484375, -0.0857696533203125, -0.046600341796875, -0.0074310302734375, 0.03173828125, 0.0709075927734375, 0.110076904296875, 0.1492462158203125, 0.18841552734375, 0.2275848388671875, 0.266754150390625, 0.3059234619140625, 0.3450927734375, 0.3842620849609375, 0.423431396484375, 0.4626007080078125, 0.50177001953125, 0.5409393310546875, 0.580108642578125, 0.6192779541015625, 0.658447265625, 0.6976165771484375, 0.736785888671875, 0.7759552001953125, 0.81512451171875, 0.8542938232421875, 0.893463134765625, 0.9326324462890625, 0.9718017578125, 1.0109710693359375, 1.050140380859375, 1.0893096923828125, 1.12847900390625, 1.1676483154296875, 1.206817626953125, 1.2459869384765625, 1.28515625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 36.0, 44.0, 40.0, 53.0, 71.0, 92.0, 107.0, 91.0, 145.0, 128.0, 168.0, 178.0, 196.0, 188.0, 209.0, 218.0, 199.0, 219.0, 220.0, 196.0, 173.0, 160.0, 141.0, 143.0, 105.0, 82.0, 75.0, 77.0, 69.0, 31.0, 26.0, 20.0, 26.0, 17.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.400146484375, -0.3865547180175781, -0.37296295166015625, -0.3593711853027344, -0.3457794189453125, -0.3321876525878906, -0.31859588623046875, -0.3050041198730469, -0.291412353515625, -0.2778205871582031, -0.26422882080078125, -0.2506370544433594, -0.2370452880859375, -0.22345352172851562, -0.20986175537109375, -0.19626998901367188, -0.18267822265625, -0.16908645629882812, -0.15549468994140625, -0.14190292358398438, -0.1283111572265625, -0.11471939086914062, -0.10112762451171875, -0.08753585815429688, -0.073944091796875, -0.060352325439453125, -0.04676055908203125, -0.033168792724609375, -0.0195770263671875, -0.005985260009765625, 0.00760650634765625, 0.021198272705078125, 0.0347900390625, 0.048381805419921875, 0.06197357177734375, 0.07556533813476562, 0.0891571044921875, 0.10274887084960938, 0.11634063720703125, 0.12993240356445312, 0.143524169921875, 0.15711593627929688, 0.17070770263671875, 0.18429946899414062, 0.1978912353515625, 0.21148300170898438, 0.22507476806640625, 0.23866653442382812, 0.25225830078125, 0.2658500671386719, 0.27944183349609375, 0.2930335998535156, 0.3066253662109375, 0.3202171325683594, 0.33380889892578125, 0.3474006652832031, 0.360992431640625, 0.3745841979980469, 0.38817596435546875, 0.4017677307128906, 0.4153594970703125, 0.4289512634277344, 0.44254302978515625, 0.4561347961425781, 0.4697265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 3.0, 1.0, 8.0, 13.0, 13.0, 14.0, 21.0, 20.0, 29.0, 31.0, 34.0, 49.0, 51.0, 42.0, 44.0, 43.0, 55.0, 61.0, 64.0, 59.0, 60.0, 48.0, 42.0, 34.0, 24.0, 24.0, 23.0, 15.0, 12.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5419496297836304, -1.49064040184021, -1.4393311738967896, -1.3880219459533691, -1.3367127180099487, -1.2854034900665283, -1.234094262123108, -1.1827850341796875, -1.131475806236267, -1.0801665782928467, -1.0288573503494263, -0.9775481224060059, -0.9262388944625854, -0.874929666519165, -0.8236204385757446, -0.7723112106323242, -0.721001923084259, -0.6696926951408386, -0.6183834671974182, -0.5670742392539978, -0.5157650113105774, -0.4644557535648346, -0.4131465256214142, -0.3618372976779938, -0.31052806973457336, -0.25921884179115295, -0.20790961384773254, -0.15660037100315094, -0.10529114305973053, -0.053981900215148926, -0.0026726722717285156, 0.048636555671691895, 0.0999457836151123, 0.15125501155853271, 0.20256423950195312, 0.25387346744537354, 0.30518269538879395, 0.35649195313453674, 0.40780118107795715, 0.45911040902137756, 0.5104196071624756, 0.561728835105896, 0.6130380630493164, 0.6643472909927368, 0.7156565189361572, 0.7669657468795776, 0.818274974822998, 0.8695842027664185, 0.9208934903144836, 0.972202718257904, 1.0235120058059692, 1.0748212337493896, 1.12613046169281, 1.1774396896362305, 1.2287489175796509, 1.2800581455230713, 1.3313673734664917, 1.382676601409912, 1.4339858293533325, 1.485295057296753, 1.5366042852401733, 1.5879135131835938, 1.6392227411270142, 1.6905319690704346, 1.741841197013855]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 0.0, 10.0, 7.0, 9.0, 7.0, 13.0, 8.0, 16.0, 18.0, 18.0, 23.0, 32.0, 38.0, 37.0, 31.0, 34.0, 29.0, 39.0, 33.0, 41.0, 39.0, 38.0, 24.0, 37.0, 25.0, 48.0, 47.0, 40.0, 33.0, 36.0, 22.0, 22.0, 16.0, 19.0, 16.0, 22.0, 15.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.0659161806106567, -1.0348045825958252, -1.0036929845809937, -0.9725813865661621, -0.9414697885513306, -0.910358190536499, -0.8792465329170227, -0.8481349349021912, -0.8170233368873596, -0.7859117388725281, -0.7548001408576965, -0.723688542842865, -0.6925768852233887, -0.6614652872085571, -0.6303536891937256, -0.599242091178894, -0.5681304931640625, -0.537018895149231, -0.5059072971343994, -0.4747956693172455, -0.44368407130241394, -0.4125724732875824, -0.38146084547042847, -0.3503492474555969, -0.3192376494407654, -0.28812605142593384, -0.2570144534111023, -0.22590282559394836, -0.19479122757911682, -0.16367962956428528, -0.13256801664829254, -0.1014564037322998, -0.07034474611282349, -0.039233140647411346, -0.008121535181999207, 0.022990070283412933, 0.05410167574882507, 0.08521327376365662, 0.11632488667964935, 0.1474364995956421, 0.17854809761047363, 0.20965969562530518, 0.2407713085412979, 0.27188292145729065, 0.3029945194721222, 0.33410611748695374, 0.36521774530410767, 0.3963293433189392, 0.42744094133377075, 0.4585525393486023, 0.48966413736343384, 0.5207757353782654, 0.5518873929977417, 0.5829989910125732, 0.6141105890274048, 0.6452221870422363, 0.6763337850570679, 0.7074453830718994, 0.738556981086731, 0.7696685791015625, 0.800780177116394, 0.8318917751312256, 0.8630034327507019, 0.8941150307655334, 0.925226628780365]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 5.0, 10.0, 21.0, 20.0, 36.0, 48.0, 81.0, 101.0, 197.0, 289.0, 464.0, 776.0, 1383.0, 2312.0, 4198.0, 7676.0, 14496.0, 28443.0, 54446.0, 105623.0, 185868.0, 241308.0, 183822.0, 104303.0, 53288.0, 27486.0, 14362.0, 7641.0, 4094.0, 2366.0, 1313.0, 816.0, 455.0, 271.0, 176.0, 127.0, 64.0, 51.0, 27.0, 23.0, 19.0, 13.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.404052734375, -0.3912200927734375, -0.378387451171875, -0.3655548095703125, -0.35272216796875, -0.3398895263671875, -0.327056884765625, -0.3142242431640625, -0.3013916015625, -0.2885589599609375, -0.275726318359375, -0.2628936767578125, -0.25006103515625, -0.2372283935546875, -0.224395751953125, -0.2115631103515625, -0.19873046875, -0.1858978271484375, -0.173065185546875, -0.1602325439453125, -0.14739990234375, -0.1345672607421875, -0.121734619140625, -0.1089019775390625, -0.0960693359375, -0.0832366943359375, -0.070404052734375, -0.0575714111328125, -0.04473876953125, -0.0319061279296875, -0.019073486328125, -0.0062408447265625, 0.006591796875, 0.0194244384765625, 0.032257080078125, 0.0450897216796875, 0.05792236328125, 0.0707550048828125, 0.083587646484375, 0.0964202880859375, 0.1092529296875, 0.1220855712890625, 0.134918212890625, 0.1477508544921875, 0.16058349609375, 0.1734161376953125, 0.186248779296875, 0.1990814208984375, 0.2119140625, 0.2247467041015625, 0.237579345703125, 0.2504119873046875, 0.26324462890625, 0.2760772705078125, 0.288909912109375, 0.3017425537109375, 0.3145751953125, 0.3274078369140625, 0.340240478515625, 0.3530731201171875, 0.36590576171875, 0.3787384033203125, 0.391571044921875, 0.4044036865234375, 0.417236328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 10.0, 8.0, 24.0, 25.0, 19.0, 31.0, 25.0, 32.0, 52.0, 36.0, 36.0, 43.0, 41.0, 42.0, 46.0, 41.0, 43.0, 44.0, 43.0, 44.0, 42.0, 41.0, 36.0, 38.0, 21.0, 19.0, 18.0, 19.0, 25.0, 8.0, 9.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.277587890625, -1.23681640625, -1.196044921875, -1.1552734375, -1.114501953125, -1.07373046875, -1.032958984375, -0.9921875, -0.951416015625, -0.91064453125, -0.869873046875, -0.8291015625, -0.788330078125, -0.74755859375, -0.706787109375, -0.666015625, -0.625244140625, -0.58447265625, -0.543701171875, -0.5029296875, -0.462158203125, -0.42138671875, -0.380615234375, -0.33984375, -0.299072265625, -0.25830078125, -0.217529296875, -0.1767578125, -0.135986328125, -0.09521484375, -0.054443359375, -0.013671875, 0.027099609375, 0.06787109375, 0.108642578125, 0.1494140625, 0.190185546875, 0.23095703125, 0.271728515625, 0.3125, 0.353271484375, 0.39404296875, 0.434814453125, 0.4755859375, 0.516357421875, 0.55712890625, 0.597900390625, 0.638671875, 0.679443359375, 0.72021484375, 0.760986328125, 0.8017578125, 0.842529296875, 0.88330078125, 0.924072265625, 0.96484375, 1.005615234375, 1.04638671875, 1.087158203125, 1.1279296875, 1.168701171875, 1.20947265625, 1.250244140625, 1.291015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 12.0, 24.0, 25.0, 58.0, 77.0, 111.0, 167.0, 244.0, 331.0, 498.0, 861.0, 1489.0, 2551.0, 5101.0, 9958.0, 21089.0, 45580.0, 99574.0, 198390.0, 276317.0, 197932.0, 99271.0, 46143.0, 21146.0, 10069.0, 4889.0, 2702.0, 1481.0, 866.0, 529.0, 335.0, 214.0, 157.0, 94.0, 70.0, 51.0, 31.0, 31.0, 20.0, 14.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.53369140625, -0.5190696716308594, -0.5044479370117188, -0.4898262023925781, -0.4752044677734375, -0.4605827331542969, -0.44596099853515625, -0.4313392639160156, -0.416717529296875, -0.4020957946777344, -0.38747406005859375, -0.3728523254394531, -0.3582305908203125, -0.3436088562011719, -0.32898712158203125, -0.3143653869628906, -0.29974365234375, -0.2851219177246094, -0.27050018310546875, -0.2558784484863281, -0.2412567138671875, -0.22663497924804688, -0.21201324462890625, -0.19739151000976562, -0.182769775390625, -0.16814804077148438, -0.15352630615234375, -0.13890457153320312, -0.1242828369140625, -0.10966110229492188, -0.09503936767578125, -0.08041763305664062, -0.0657958984375, -0.051174163818359375, -0.03655242919921875, -0.021930694580078125, -0.0073089599609375, 0.007312774658203125, 0.02193450927734375, 0.036556243896484375, 0.051177978515625, 0.06579971313476562, 0.08042144775390625, 0.09504318237304688, 0.1096649169921875, 0.12428665161132812, 0.13890838623046875, 0.15353012084960938, 0.16815185546875, 0.18277359008789062, 0.19739532470703125, 0.21201705932617188, 0.2266387939453125, 0.24126052856445312, 0.25588226318359375, 0.2705039978027344, 0.285125732421875, 0.2997474670410156, 0.31436920166015625, 0.3289909362792969, 0.3436126708984375, 0.3582344055175781, 0.37285614013671875, 0.3874778747558594, 0.402099609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 2.0, 9.0, 7.0, 13.0, 7.0, 20.0, 13.0, 31.0, 22.0, 28.0, 24.0, 21.0, 31.0, 22.0, 16.0, 33.0, 33.0, 33.0, 44.0, 38.0, 37.0, 46.0, 37.0, 39.0, 47.0, 31.0, 28.0, 27.0, 24.0, 25.0, 21.0, 26.0, 23.0, 18.0, 23.0, 12.0, 12.0, 14.0, 10.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56787109375, -0.5485000610351562, -0.5291290283203125, -0.5097579956054688, -0.490386962890625, -0.47101593017578125, -0.4516448974609375, -0.43227386474609375, -0.41290283203125, -0.39353179931640625, -0.3741607666015625, -0.35478973388671875, -0.335418701171875, -0.31604766845703125, -0.2966766357421875, -0.27730560302734375, -0.2579345703125, -0.23856353759765625, -0.2191925048828125, -0.19982147216796875, -0.180450439453125, -0.16107940673828125, -0.1417083740234375, -0.12233734130859375, -0.10296630859375, -0.08359527587890625, -0.0642242431640625, -0.04485321044921875, -0.025482177734375, -0.00611114501953125, 0.0132598876953125, 0.03263092041015625, 0.052001953125, 0.07137298583984375, 0.0907440185546875, 0.11011505126953125, 0.129486083984375, 0.14885711669921875, 0.1682281494140625, 0.18759918212890625, 0.20697021484375, 0.22634124755859375, 0.2457122802734375, 0.26508331298828125, 0.284454345703125, 0.30382537841796875, 0.3231964111328125, 0.34256744384765625, 0.3619384765625, 0.38130950927734375, 0.4006805419921875, 0.42005157470703125, 0.439422607421875, 0.45879364013671875, 0.4781646728515625, 0.49753570556640625, 0.51690673828125, 0.5362777709960938, 0.5556488037109375, 0.5750198364257812, 0.594390869140625, 0.6137619018554688, 0.6331329345703125, 0.6525039672851562, 0.671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 2.0, 16.0, 14.0, 34.0, 35.0, 45.0, 63.0, 93.0, 155.0, 224.0, 306.0, 520.0, 867.0, 1549.0, 3290.0, 8701.0, 36064.0, 429811.0, 509021.0, 40619.0, 9380.0, 3567.0, 1655.0, 952.0, 524.0, 364.0, 206.0, 135.0, 108.0, 70.0, 43.0, 32.0, 21.0, 13.0, 10.0, 9.0, 11.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.59375, -0.5768013000488281, -0.5598526000976562, -0.5429039001464844, -0.5259552001953125, -0.5090065002441406, -0.49205780029296875, -0.4751091003417969, -0.458160400390625, -0.4412117004394531, -0.42426300048828125, -0.4073143005371094, -0.3903656005859375, -0.3734169006347656, -0.35646820068359375, -0.3395195007324219, -0.32257080078125, -0.3056221008300781, -0.28867340087890625, -0.2717247009277344, -0.2547760009765625, -0.23782730102539062, -0.22087860107421875, -0.20392990112304688, -0.186981201171875, -0.17003250122070312, -0.15308380126953125, -0.13613510131835938, -0.1191864013671875, -0.10223770141601562, -0.08528900146484375, -0.06834030151367188, -0.0513916015625, -0.034442901611328125, -0.01749420166015625, -0.000545501708984375, 0.0164031982421875, 0.033351898193359375, 0.05030059814453125, 0.06724929809570312, 0.084197998046875, 0.10114669799804688, 0.11809539794921875, 0.13504409790039062, 0.1519927978515625, 0.16894149780273438, 0.18589019775390625, 0.20283889770507812, 0.21978759765625, 0.23673629760742188, 0.25368499755859375, 0.2706336975097656, 0.2875823974609375, 0.3045310974121094, 0.32147979736328125, 0.3384284973144531, 0.355377197265625, 0.3723258972167969, 0.38927459716796875, 0.4062232971191406, 0.4231719970703125, 0.4401206970214844, 0.45706939697265625, 0.4740180969238281, 0.490966796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 11.0, 12.0, 20.0, 54.0, 67.0, 94.0, 115.0, 132.0, 110.0, 125.0, 87.0, 68.0, 33.0, 26.0, 21.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7060508728027344e-05, -2.623721957206726e-05, -2.5413930416107178e-05, -2.4590641260147095e-05, -2.3767352104187012e-05, -2.294406294822693e-05, -2.2120773792266846e-05, -2.1297484636306763e-05, -2.047419548034668e-05, -1.9650906324386597e-05, -1.8827617168426514e-05, -1.800432801246643e-05, -1.7181038856506348e-05, -1.6357749700546265e-05, -1.553446054458618e-05, -1.4711171388626099e-05, -1.3887882232666016e-05, -1.3064593076705933e-05, -1.224130392074585e-05, -1.1418014764785767e-05, -1.0594725608825684e-05, -9.7714364528656e-06, -8.948147296905518e-06, -8.124858140945435e-06, -7.3015689849853516e-06, -6.4782798290252686e-06, -5.6549906730651855e-06, -4.8317015171051025e-06, -4.0084123611450195e-06, -3.1851232051849365e-06, -2.3618340492248535e-06, -1.5385448932647705e-06, -7.152557373046875e-07, 1.0803341865539551e-07, 9.313225746154785e-07, 1.7546117305755615e-06, 2.5779008865356445e-06, 3.4011900424957275e-06, 4.2244791984558105e-06, 5.0477683544158936e-06, 5.8710575103759766e-06, 6.6943466663360596e-06, 7.517635822296143e-06, 8.340924978256226e-06, 9.164214134216309e-06, 9.987503290176392e-06, 1.0810792446136475e-05, 1.1634081602096558e-05, 1.245737075805664e-05, 1.3280659914016724e-05, 1.4103949069976807e-05, 1.492723822593689e-05, 1.5750527381896973e-05, 1.6573816537857056e-05, 1.739710569381714e-05, 1.822039484977722e-05, 1.9043684005737305e-05, 1.9866973161697388e-05, 2.069026231765747e-05, 2.1513551473617554e-05, 2.2336840629577637e-05, 2.316012978553772e-05, 2.3983418941497803e-05, 2.4806708097457886e-05, 2.562999725341797e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 10.0, 7.0, 14.0, 26.0, 21.0, 38.0, 59.0, 56.0, 104.0, 129.0, 162.0, 249.0, 270.0, 353.0, 460.0, 659.0, 885.0, 1273.0, 1744.0, 2701.0, 4083.0, 7419.0, 15063.0, 36196.0, 98868.0, 284753.0, 360898.0, 139700.0, 48294.0, 19614.0, 9155.0, 5025.0, 3056.0, 1934.0, 1379.0, 998.0, 696.0, 548.0, 439.0, 302.0, 224.0, 178.0, 109.0, 118.0, 72.0, 68.0, 41.0, 34.0, 25.0, 19.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2734375, -0.2649345397949219, -0.25643157958984375, -0.24792861938476562, -0.2394256591796875, -0.23092269897460938, -0.22241973876953125, -0.21391677856445312, -0.205413818359375, -0.19691085815429688, -0.18840789794921875, -0.17990493774414062, -0.1714019775390625, -0.16289901733398438, -0.15439605712890625, -0.14589309692382812, -0.13739013671875, -0.12888717651367188, -0.12038421630859375, -0.11188125610351562, -0.1033782958984375, -0.09487533569335938, -0.08637237548828125, -0.07786941528320312, -0.069366455078125, -0.060863494873046875, -0.05236053466796875, -0.043857574462890625, -0.0353546142578125, -0.026851654052734375, -0.01834869384765625, -0.009845733642578125, -0.0013427734375, 0.007160186767578125, 0.01566314697265625, 0.024166107177734375, 0.0326690673828125, 0.041172027587890625, 0.04967498779296875, 0.058177947998046875, 0.066680908203125, 0.07518386840820312, 0.08368682861328125, 0.09218978881835938, 0.1006927490234375, 0.10919570922851562, 0.11769866943359375, 0.12620162963867188, 0.13470458984375, 0.14320755004882812, 0.15171051025390625, 0.16021347045898438, 0.1687164306640625, 0.17721939086914062, 0.18572235107421875, 0.19422531127929688, 0.202728271484375, 0.21123123168945312, 0.21973419189453125, 0.22823715209960938, 0.2367401123046875, 0.24524307250976562, 0.25374603271484375, 0.2622489929199219, 0.270751953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 12.0, 16.0, 25.0, 65.0, 80.0, 151.0, 188.0, 150.0, 119.0, 59.0, 40.0, 23.0, 15.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10774517059326172, -0.10434532165527344, -0.10094547271728516, -0.09754562377929688, -0.0941457748413086, -0.09074592590332031, -0.08734607696533203, -0.08394622802734375, -0.08054637908935547, -0.07714653015136719, -0.0737466812133789, -0.07034683227539062, -0.06694698333740234, -0.06354713439941406, -0.06014728546142578, -0.0567474365234375, -0.05334758758544922, -0.04994773864746094, -0.046547889709472656, -0.043148040771484375, -0.039748191833496094, -0.03634834289550781, -0.03294849395751953, -0.02954864501953125, -0.02614879608154297, -0.022748947143554688, -0.019349098205566406, -0.015949249267578125, -0.012549400329589844, -0.009149551391601562, -0.005749702453613281, -0.002349853515625, 0.0010499954223632812, 0.0044498443603515625, 0.007849693298339844, 0.011249542236328125, 0.014649391174316406, 0.018049240112304688, 0.02144908905029297, 0.02484893798828125, 0.02824878692626953, 0.03164863586425781, 0.035048484802246094, 0.038448333740234375, 0.041848182678222656, 0.04524803161621094, 0.04864788055419922, 0.0520477294921875, 0.05544757843017578, 0.05884742736816406, 0.062247276306152344, 0.06564712524414062, 0.0690469741821289, 0.07244682312011719, 0.07584667205810547, 0.07924652099609375, 0.08264636993408203, 0.08604621887207031, 0.0894460678100586, 0.09284591674804688, 0.09624576568603516, 0.09964561462402344, 0.10304546356201172, 0.1064453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 3.0, 9.0, 10.0, 17.0, 13.0, 16.0, 27.0, 27.0, 23.0, 40.0, 51.0, 56.0, 40.0, 43.0, 40.0, 57.0, 57.0, 69.0, 62.0, 64.0, 47.0, 32.0, 33.0, 28.0, 18.0, 27.0, 16.0, 11.0, 12.0, 11.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5451518297195435, -1.4936035871505737, -1.442055344581604, -1.3905071020126343, -1.3389588594436646, -1.2874106168746948, -1.2358622550964355, -1.1843140125274658, -1.132765769958496, -1.0812175273895264, -1.0296692848205566, -0.9781210422515869, -0.9265727996826172, -0.8750245571136475, -0.823476254940033, -0.7719280123710632, -0.7203798294067383, -0.6688315868377686, -0.6172833442687988, -0.5657351016998291, -0.5141868591308594, -0.46263858675956726, -0.41109031438827515, -0.3595420718193054, -0.3079938292503357, -0.25644558668136597, -0.20489732921123505, -0.15334907174110413, -0.1018008291721344, -0.05025258660316467, 0.0012956857681274414, 0.05284392833709717, 0.10439229011535645, 0.15594053268432617, 0.2074887901544571, 0.259037047624588, 0.31058529019355774, 0.36213353276252747, 0.4136818051338196, 0.4652300477027893, 0.516778290271759, 0.5683265328407288, 0.6198747754096985, 0.671423077583313, 0.7229713201522827, 0.7745195627212524, 0.8260678052902222, 0.8776160478591919, 0.9291642904281616, 0.9807125329971313, 1.032260775566101, 1.0838090181350708, 1.1353572607040405, 1.1869055032730103, 1.2384538650512695, 1.2900021076202393, 1.341550350189209, 1.3930985927581787, 1.4446468353271484, 1.4961950778961182, 1.547743320465088, 1.5992915630340576, 1.6508398056030273, 1.702388048171997, 1.7539362907409668]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 9.0, 5.0, 8.0, 8.0, 9.0, 10.0, 15.0, 23.0, 14.0, 26.0, 29.0, 34.0, 39.0, 35.0, 38.0, 22.0, 40.0, 37.0, 42.0, 35.0, 41.0, 28.0, 32.0, 28.0, 50.0, 43.0, 40.0, 39.0, 31.0, 30.0, 14.0, 25.0, 14.0, 17.0, 19.0, 15.0, 14.0, 5.0, 6.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.084733486175537, -1.0531185865402222, -1.0215036869049072, -0.9898887872695923, -0.9582739472389221, -0.9266590476036072, -0.8950441479682922, -0.8634292483329773, -0.8318144083023071, -0.8001995086669922, -0.7685846090316772, -0.7369697093963623, -0.7053548693656921, -0.6737399697303772, -0.6421250700950623, -0.6105101704597473, -0.5788952708244324, -0.5472803711891174, -0.5156654715538025, -0.48405060172080994, -0.4524357318878174, -0.42082083225250244, -0.3892059326171875, -0.35759103298187256, -0.32597616314888, -0.29436126351356506, -0.2627463936805725, -0.23113149404525757, -0.19951660931110382, -0.16790172457695007, -0.13628682494163513, -0.10467194020748138, -0.07305705547332764, -0.04144216701388359, -0.009827278554439545, 0.0217876136302948, 0.05340249836444855, 0.0850173830986023, 0.11663228273391724, 0.14824716746807098, 0.17986205220222473, 0.21147693693637848, 0.24309182167053223, 0.27470672130584717, 0.3063216209411621, 0.33793649077415466, 0.3695513904094696, 0.40116626024246216, 0.4327811598777771, 0.46439605951309204, 0.4960109293460846, 0.5276257991790771, 0.5592406988143921, 0.590855598449707, 0.622470498085022, 0.6540853977203369, 0.6857002973556519, 0.7173151969909668, 0.7489300966262817, 0.7805449962615967, 0.8121598362922668, 0.8437747359275818, 0.8753896355628967, 0.9070045351982117, 0.9386193752288818]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 6.0, 5.0, 12.0, 13.0, 12.0, 23.0, 36.0, 49.0, 92.0, 137.0, 210.0, 384.0, 712.0, 1241.0, 2273.0, 4014.0, 7296.0, 13048.0, 22807.0, 38352.0, 61084.0, 91232.0, 122152.0, 143329.0, 145623.0, 127589.0, 97427.0, 67908.0, 42830.0, 25478.0, 14627.0, 8248.0, 4399.0, 2518.0, 1425.0, 834.0, 477.0, 242.0, 149.0, 97.0, 50.0, 38.0, 25.0, 15.0, 15.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.015777587890625, -0.97686767578125, -0.937957763671875, -0.8990478515625, -0.860137939453125, -0.82122802734375, -0.782318115234375, -0.743408203125, -0.704498291015625, -0.66558837890625, -0.626678466796875, -0.5877685546875, -0.548858642578125, -0.50994873046875, -0.471038818359375, -0.43212890625, -0.393218994140625, -0.35430908203125, -0.315399169921875, -0.2764892578125, -0.237579345703125, -0.19866943359375, -0.159759521484375, -0.120849609375, -0.081939697265625, -0.04302978515625, -0.004119873046875, 0.0347900390625, 0.073699951171875, 0.11260986328125, 0.151519775390625, 0.1904296875, 0.229339599609375, 0.26824951171875, 0.307159423828125, 0.3460693359375, 0.384979248046875, 0.42388916015625, 0.462799072265625, 0.501708984375, 0.540618896484375, 0.57952880859375, 0.618438720703125, 0.6573486328125, 0.696258544921875, 0.73516845703125, 0.774078369140625, 0.81298828125, 0.851898193359375, 0.89080810546875, 0.929718017578125, 0.9686279296875, 1.007537841796875, 1.04644775390625, 1.085357666015625, 1.124267578125, 1.163177490234375, 1.20208740234375, 1.240997314453125, 1.2799072265625, 1.318817138671875, 1.35772705078125, 1.396636962890625, 1.435546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 3.0, 6.0, 10.0, 8.0, 9.0, 18.0, 15.0, 17.0, 14.0, 27.0, 23.0, 34.0, 29.0, 28.0, 26.0, 28.0, 35.0, 37.0, 33.0, 25.0, 34.0, 42.0, 36.0, 34.0, 34.0, 35.0, 40.0, 35.0, 22.0, 28.0, 32.0, 28.0, 21.0, 27.0, 15.0, 18.0, 13.0, 14.0, 11.0, 11.0, 7.0, 4.0, 8.0, 4.0, 10.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.99609375, -0.9644775390625, -0.932861328125, -0.9012451171875, -0.86962890625, -0.8380126953125, -0.806396484375, -0.7747802734375, -0.7431640625, -0.7115478515625, -0.679931640625, -0.6483154296875, -0.61669921875, -0.5850830078125, -0.553466796875, -0.5218505859375, -0.490234375, -0.4586181640625, -0.427001953125, -0.3953857421875, -0.36376953125, -0.3321533203125, -0.300537109375, -0.2689208984375, -0.2373046875, -0.2056884765625, -0.174072265625, -0.1424560546875, -0.11083984375, -0.0792236328125, -0.047607421875, -0.0159912109375, 0.015625, 0.0472412109375, 0.078857421875, 0.1104736328125, 0.14208984375, 0.1737060546875, 0.205322265625, 0.2369384765625, 0.2685546875, 0.3001708984375, 0.331787109375, 0.3634033203125, 0.39501953125, 0.4266357421875, 0.458251953125, 0.4898681640625, 0.521484375, 0.5531005859375, 0.584716796875, 0.6163330078125, 0.64794921875, 0.6795654296875, 0.711181640625, 0.7427978515625, 0.7744140625, 0.8060302734375, 0.837646484375, 0.8692626953125, 0.90087890625, 0.9324951171875, 0.964111328125, 0.9957275390625, 1.02734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 15.0, 26.0, 34.0, 56.0, 75.0, 121.0, 226.0, 399.0, 700.0, 1088.0, 1722.0, 3012.0, 4984.0, 8379.0, 13891.0, 21694.0, 33191.0, 48950.0, 69343.0, 91114.0, 110539.0, 121366.0, 120343.0, 108176.0, 88922.0, 67483.0, 47664.0, 31834.0, 20388.0, 12991.0, 7889.0, 4780.0, 2863.0, 1694.0, 1065.0, 628.0, 358.0, 208.0, 124.0, 84.0, 46.0, 31.0, 21.0, 14.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0368804931640625, -1.004425048828125, -0.9719696044921875, -0.93951416015625, -0.9070587158203125, -0.874603271484375, -0.8421478271484375, -0.8096923828125, -0.7772369384765625, -0.744781494140625, -0.7123260498046875, -0.67987060546875, -0.6474151611328125, -0.614959716796875, -0.5825042724609375, -0.550048828125, -0.5175933837890625, -0.485137939453125, -0.4526824951171875, -0.42022705078125, -0.3877716064453125, -0.355316162109375, -0.3228607177734375, -0.2904052734375, -0.2579498291015625, -0.225494384765625, -0.1930389404296875, -0.16058349609375, -0.1281280517578125, -0.095672607421875, -0.0632171630859375, -0.03076171875, 0.0016937255859375, 0.034149169921875, 0.0666046142578125, 0.09906005859375, 0.1315155029296875, 0.163970947265625, 0.1964263916015625, 0.2288818359375, 0.2613372802734375, 0.293792724609375, 0.3262481689453125, 0.35870361328125, 0.3911590576171875, 0.423614501953125, 0.4560699462890625, 0.488525390625, 0.5209808349609375, 0.553436279296875, 0.5858917236328125, 0.61834716796875, 0.6508026123046875, 0.683258056640625, 0.7157135009765625, 0.7481689453125, 0.7806243896484375, 0.813079833984375, 0.8455352783203125, 0.87799072265625, 0.9104461669921875, 0.942901611328125, 0.9753570556640625, 1.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 8.0, 6.0, 13.0, 16.0, 15.0, 15.0, 26.0, 22.0, 22.0, 28.0, 28.0, 39.0, 39.0, 32.0, 32.0, 38.0, 41.0, 40.0, 29.0, 44.0, 42.0, 56.0, 37.0, 22.0, 32.0, 32.0, 33.0, 31.0, 17.0, 22.0, 17.0, 21.0, 20.0, 15.0, 9.0, 8.0, 5.0, 5.0, 11.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.6943359375, -0.6731109619140625, -0.651885986328125, -0.6306610107421875, -0.60943603515625, -0.5882110595703125, -0.566986083984375, -0.5457611083984375, -0.5245361328125, -0.5033111572265625, -0.482086181640625, -0.4608612060546875, -0.43963623046875, -0.4184112548828125, -0.397186279296875, -0.3759613037109375, -0.354736328125, -0.3335113525390625, -0.312286376953125, -0.2910614013671875, -0.26983642578125, -0.2486114501953125, -0.227386474609375, -0.2061614990234375, -0.1849365234375, -0.1637115478515625, -0.142486572265625, -0.1212615966796875, -0.10003662109375, -0.0788116455078125, -0.057586669921875, -0.0363616943359375, -0.01513671875, 0.0060882568359375, 0.027313232421875, 0.0485382080078125, 0.06976318359375, 0.0909881591796875, 0.112213134765625, 0.1334381103515625, 0.1546630859375, 0.1758880615234375, 0.197113037109375, 0.2183380126953125, 0.23956298828125, 0.2607879638671875, 0.282012939453125, 0.3032379150390625, 0.324462890625, 0.3456878662109375, 0.366912841796875, 0.3881378173828125, 0.40936279296875, 0.4305877685546875, 0.451812744140625, 0.4730377197265625, 0.4942626953125, 0.5154876708984375, 0.536712646484375, 0.5579376220703125, 0.57916259765625, 0.6003875732421875, 0.621612548828125, 0.6428375244140625, 0.6640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 10.0, 12.0, 11.0, 9.0, 20.0, 23.0, 46.0, 50.0, 88.0, 131.0, 161.0, 282.0, 387.0, 716.0, 940.0, 1534.0, 2416.0, 3875.0, 7295.0, 22962.0, 200420.0, 637312.0, 135941.0, 17513.0, 6396.0, 3667.0, 2365.0, 1340.0, 876.0, 574.0, 380.0, 252.0, 153.0, 110.0, 93.0, 56.0, 47.0, 20.0, 23.0, 13.0, 13.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.880859375, -2.77947998046875, -2.6781005859375, -2.57672119140625, -2.475341796875, -2.37396240234375, -2.2725830078125, -2.17120361328125, -2.06982421875, -1.96844482421875, -1.8670654296875, -1.76568603515625, -1.664306640625, -1.56292724609375, -1.4615478515625, -1.36016845703125, -1.2587890625, -1.15740966796875, -1.0560302734375, -0.95465087890625, -0.853271484375, -0.75189208984375, -0.6505126953125, -0.54913330078125, -0.44775390625, -0.34637451171875, -0.2449951171875, -0.14361572265625, -0.042236328125, 0.05914306640625, 0.1605224609375, 0.26190185546875, 0.36328125, 0.46466064453125, 0.5660400390625, 0.66741943359375, 0.768798828125, 0.87017822265625, 0.9715576171875, 1.07293701171875, 1.17431640625, 1.27569580078125, 1.3770751953125, 1.47845458984375, 1.579833984375, 1.68121337890625, 1.7825927734375, 1.88397216796875, 1.9853515625, 2.08673095703125, 2.1881103515625, 2.28948974609375, 2.390869140625, 2.49224853515625, 2.5936279296875, 2.69500732421875, 2.79638671875, 2.89776611328125, 2.9991455078125, 3.10052490234375, 3.201904296875, 3.30328369140625, 3.4046630859375, 3.50604248046875, 3.607421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 27.0, 57.0, 98.0, 146.0, 205.0, 173.0, 135.0, 59.0, 35.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002510547637939453, -0.0002442058175802231, -0.00023735687136650085, -0.00023050792515277863, -0.0002236589789390564, -0.00021681003272533417, -0.00020996108651161194, -0.0002031121402978897, -0.00019626319408416748, -0.00018941424787044525, -0.00018256530165672302, -0.0001757163554430008, -0.00016886740922927856, -0.00016201846301555634, -0.0001551695168018341, -0.00014832057058811188, -0.00014147162437438965, -0.00013462267816066742, -0.0001277737319469452, -0.00012092478573322296, -0.00011407583951950073, -0.0001072268933057785, -0.00010037794709205627, -9.352900087833405e-05, -8.668005466461182e-05, -7.983110845088959e-05, -7.298216223716736e-05, -6.613321602344513e-05, -5.92842698097229e-05, -5.243532359600067e-05, -4.558637738227844e-05, -3.873743116855621e-05, -3.1888484954833984e-05, -2.5039538741111755e-05, -1.8190592527389526e-05, -1.1341646313667297e-05, -4.492700099945068e-06, 2.3562461137771606e-06, 9.20519232749939e-06, 1.605413854122162e-05, 2.2903084754943848e-05, 2.9752030968666077e-05, 3.6600977182388306e-05, 4.3449923396110535e-05, 5.0298869609832764e-05, 5.714781582355499e-05, 6.399676203727722e-05, 7.084570825099945e-05, 7.769465446472168e-05, 8.454360067844391e-05, 9.139254689216614e-05, 9.824149310588837e-05, 0.0001050904393196106, 0.00011193938553333282, 0.00011878833174705505, 0.00012563727796077728, 0.0001324862241744995, 0.00013933517038822174, 0.00014618411660194397, 0.0001530330628156662, 0.00015988200902938843, 0.00016673095524311066, 0.00017357990145683289, 0.00018042884767055511, 0.00018727779388427734]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 32.0, 38.0, 53.0, 65.0, 93.0, 137.0, 170.0, 295.0, 415.0, 596.0, 920.0, 1494.0, 2164.0, 3684.0, 7856.0, 29919.0, 198674.0, 553854.0, 199567.0, 30264.0, 7896.0, 3835.0, 2164.0, 1463.0, 918.0, 602.0, 404.0, 274.0, 185.0, 139.0, 95.0, 63.0, 55.0, 39.0, 23.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.76171875, -2.681671142578125, -2.60162353515625, -2.521575927734375, -2.4415283203125, -2.361480712890625, -2.28143310546875, -2.201385498046875, -2.121337890625, -2.041290283203125, -1.96124267578125, -1.881195068359375, -1.8011474609375, -1.721099853515625, -1.64105224609375, -1.561004638671875, -1.48095703125, -1.400909423828125, -1.32086181640625, -1.240814208984375, -1.1607666015625, -1.080718994140625, -1.00067138671875, -0.920623779296875, -0.840576171875, -0.760528564453125, -0.68048095703125, -0.600433349609375, -0.5203857421875, -0.440338134765625, -0.36029052734375, -0.280242919921875, -0.2001953125, -0.120147705078125, -0.04010009765625, 0.039947509765625, 0.1199951171875, 0.200042724609375, 0.28009033203125, 0.360137939453125, 0.440185546875, 0.520233154296875, 0.60028076171875, 0.680328369140625, 0.7603759765625, 0.840423583984375, 0.92047119140625, 1.000518798828125, 1.08056640625, 1.160614013671875, 1.24066162109375, 1.320709228515625, 1.4007568359375, 1.480804443359375, 1.56085205078125, 1.640899658203125, 1.720947265625, 1.800994873046875, 1.88104248046875, 1.961090087890625, 2.0411376953125, 2.121185302734375, 2.20123291015625, 2.281280517578125, 2.361328125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 9.0, 10.0, 13.0, 28.0, 25.0, 44.0, 32.0, 60.0, 69.0, 74.0, 74.0, 81.0, 88.0, 66.0, 70.0, 57.0, 37.0, 42.0, 23.0, 21.0, 10.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.292724609375, -0.28343963623046875, -0.2741546630859375, -0.26486968994140625, -0.255584716796875, -0.24629974365234375, -0.2370147705078125, -0.22772979736328125, -0.21844482421875, -0.20915985107421875, -0.1998748779296875, -0.19058990478515625, -0.181304931640625, -0.17201995849609375, -0.1627349853515625, -0.15345001220703125, -0.1441650390625, -0.13488006591796875, -0.1255950927734375, -0.11631011962890625, -0.107025146484375, -0.09774017333984375, -0.0884552001953125, -0.07917022705078125, -0.06988525390625, -0.06060028076171875, -0.0513153076171875, -0.04203033447265625, -0.032745361328125, -0.02346038818359375, -0.0141754150390625, -0.00489044189453125, 0.00439453125, 0.01367950439453125, 0.0229644775390625, 0.03224945068359375, 0.041534423828125, 0.05081939697265625, 0.0601043701171875, 0.06938934326171875, 0.07867431640625, 0.08795928955078125, 0.0972442626953125, 0.10652923583984375, 0.115814208984375, 0.12509918212890625, 0.1343841552734375, 0.14366912841796875, 0.1529541015625, 0.16223907470703125, 0.1715240478515625, 0.18080902099609375, 0.190093994140625, 0.19937896728515625, 0.2086639404296875, 0.21794891357421875, 0.22723388671875, 0.23651885986328125, 0.2458038330078125, 0.25508880615234375, 0.264373779296875, 0.27365875244140625, 0.2829437255859375, 0.29222869873046875, 0.301513671875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 7.0, 11.0, 10.0, 12.0, 16.0, 20.0, 31.0, 26.0, 29.0, 44.0, 40.0, 45.0, 46.0, 50.0, 49.0, 54.0, 76.0, 60.0, 41.0, 48.0, 51.0, 37.0, 35.0, 26.0, 20.0, 13.0, 12.0, 15.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4523892402648926, -1.4023908376693726, -1.352392554283142, -1.302394151687622, -1.2523958683013916, -1.2023974657058716, -1.1523990631103516, -1.102400779724121, -1.0524024963378906, -1.0024040937423706, -0.9524058103561401, -0.9024074077606201, -0.8524091243743896, -0.8024107217788696, -0.7524123787879944, -0.7024140357971191, -0.6524156332015991, -0.6024172902107239, -0.5524189472198486, -0.5024205446243286, -0.45242223143577576, -0.4024238884449005, -0.3524255156517029, -0.30242717266082764, -0.2524288296699524, -0.20243048667907715, -0.1524321287870407, -0.10243377089500427, -0.05243542790412903, -0.002437084913253784, 0.04756128787994385, 0.09755963087081909, 0.1475580930709839, 0.19755643606185913, 0.24755479395389557, 0.297553151845932, 0.34755149483680725, 0.3975498378276825, 0.4475482106208801, 0.49754655361175537, 0.5475448966026306, 0.5975432395935059, 0.6475415825843811, 0.6975399255752563, 0.7475383281707764, 0.7975366115570068, 0.8475350141525269, 0.8975333571434021, 0.9475317001342773, 0.9975300431251526, 1.0475283861160278, 1.0975267887115479, 1.1475250720977783, 1.1975234746932983, 1.2475218772888184, 1.2975201606750488, 1.3475184440612793, 1.3975168466567993, 1.4475151300430298, 1.4975135326385498, 1.5475118160247803, 1.5975102186203003, 1.6475086212158203, 1.6975069046020508, 1.7475053071975708]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 10.0, 14.0, 14.0, 15.0, 12.0, 11.0, 27.0, 39.0, 29.0, 22.0, 31.0, 40.0, 30.0, 48.0, 40.0, 41.0, 37.0, 46.0, 35.0, 38.0, 40.0, 37.0, 41.0, 46.0, 31.0, 30.0, 30.0, 19.0, 18.0, 16.0, 11.0, 18.0, 13.0, 10.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9461370706558228, -0.9124075770378113, -0.8786780834197998, -0.8449485898017883, -0.8112190961837769, -0.7774896025657654, -0.7437601089477539, -0.7100306153297424, -0.676301121711731, -0.6425716280937195, -0.608842134475708, -0.5751126408576965, -0.5413831472396851, -0.5076536536216736, -0.4739241600036621, -0.44019466638565063, -0.40646517276763916, -0.3727356791496277, -0.3390061855316162, -0.30527669191360474, -0.27154719829559326, -0.2378177046775818, -0.2040882110595703, -0.17035871744155884, -0.13662922382354736, -0.10289973020553589, -0.06917023658752441, -0.03544074296951294, -0.0017112493515014648, 0.03201824426651001, 0.06574773788452148, 0.09947723150253296, 0.13320660591125488, 0.16693609952926636, 0.20066559314727783, 0.2343950867652893, 0.2681245803833008, 0.30185407400131226, 0.33558356761932373, 0.3693130612373352, 0.4030425548553467, 0.43677204847335815, 0.47050154209136963, 0.5042310357093811, 0.5379605293273926, 0.571690022945404, 0.6054195165634155, 0.639149010181427, 0.6728785037994385, 0.70660799741745, 0.7403374910354614, 0.7740669846534729, 0.8077964782714844, 0.8415259718894958, 0.8752554655075073, 0.9089849591255188, 0.9427144527435303, 0.9764439463615417, 1.0101734399795532, 1.04390287399292, 1.0776324272155762, 1.1113619804382324, 1.1450914144515991, 1.1788208484649658, 1.212550401687622]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 14.0, 20.0, 47.0, 74.0, 134.0, 214.0, 368.0, 632.0, 1061.0, 1799.0, 3203.0, 6021.0, 11090.0, 20479.0, 39249.0, 72928.0, 136052.0, 243458.0, 407757.0, 595266.0, 715323.0, 678755.0, 515434.0, 330522.0, 191268.0, 104274.0, 55907.0, 29351.0, 15477.0, 8022.0, 4434.0, 2479.0, 1335.0, 711.0, 462.0, 249.0, 154.0, 102.0, 50.0, 36.0, 21.0, 9.0, 7.0, 11.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2174224853515625, -1.170196533203125, -1.1229705810546875, -1.07574462890625, -1.0285186767578125, -0.981292724609375, -0.9340667724609375, -0.8868408203125, -0.8396148681640625, -0.792388916015625, -0.7451629638671875, -0.69793701171875, -0.6507110595703125, -0.603485107421875, -0.5562591552734375, -0.509033203125, -0.4618072509765625, -0.414581298828125, -0.3673553466796875, -0.32012939453125, -0.2729034423828125, -0.225677490234375, -0.1784515380859375, -0.1312255859375, -0.0839996337890625, -0.036773681640625, 0.0104522705078125, 0.05767822265625, 0.1049041748046875, 0.152130126953125, 0.1993560791015625, 0.24658203125, 0.2938079833984375, 0.341033935546875, 0.3882598876953125, 0.43548583984375, 0.4827117919921875, 0.529937744140625, 0.5771636962890625, 0.6243896484375, 0.6716156005859375, 0.718841552734375, 0.7660675048828125, 0.81329345703125, 0.8605194091796875, 0.907745361328125, 0.9549713134765625, 1.002197265625, 1.0494232177734375, 1.096649169921875, 1.1438751220703125, 1.19110107421875, 1.2383270263671875, 1.285552978515625, 1.3327789306640625, 1.3800048828125, 1.4272308349609375, 1.474456787109375, 1.5216827392578125, 1.56890869140625, 1.6161346435546875, 1.663360595703125, 1.7105865478515625, 1.7578125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 10.0, 16.0, 14.0, 18.0, 17.0, 29.0, 27.0, 28.0, 41.0, 35.0, 49.0, 53.0, 46.0, 53.0, 54.0, 63.0, 47.0, 58.0, 40.0, 52.0, 32.0, 32.0, 36.0, 23.0, 28.0, 15.0, 17.0, 10.0, 19.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9773101806640625, -0.941925048828125, -0.9065399169921875, -0.87115478515625, -0.8357696533203125, -0.800384521484375, -0.7649993896484375, -0.7296142578125, -0.6942291259765625, -0.658843994140625, -0.6234588623046875, -0.58807373046875, -0.5526885986328125, -0.517303466796875, -0.4819183349609375, -0.446533203125, -0.4111480712890625, -0.375762939453125, -0.3403778076171875, -0.30499267578125, -0.2696075439453125, -0.234222412109375, -0.1988372802734375, -0.1634521484375, -0.1280670166015625, -0.092681884765625, -0.0572967529296875, -0.02191162109375, 0.0134735107421875, 0.048858642578125, 0.0842437744140625, 0.11962890625, 0.1550140380859375, 0.190399169921875, 0.2257843017578125, 0.26116943359375, 0.2965545654296875, 0.331939697265625, 0.3673248291015625, 0.4027099609375, 0.4380950927734375, 0.473480224609375, 0.5088653564453125, 0.54425048828125, 0.5796356201171875, 0.615020751953125, 0.6504058837890625, 0.685791015625, 0.7211761474609375, 0.756561279296875, 0.7919464111328125, 0.82733154296875, 0.8627166748046875, 0.898101806640625, 0.9334869384765625, 0.9688720703125, 1.0042572021484375, 1.039642333984375, 1.0750274658203125, 1.11041259765625, 1.1457977294921875, 1.181182861328125, 1.2165679931640625, 1.251953125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 15.0, 23.0, 38.0, 61.0, 103.0, 157.0, 284.0, 415.0, 661.0, 1177.0, 1817.0, 2773.0, 4503.0, 7114.0, 11331.0, 18261.0, 28860.0, 45113.0, 70205.0, 107095.0, 160165.0, 228873.0, 312064.0, 395004.0, 460143.0, 484807.0, 459232.0, 394357.0, 311583.0, 228009.0, 160185.0, 107599.0, 70442.0, 45002.0, 28526.0, 17976.0, 11296.0, 7058.0, 4404.0, 2856.0, 1727.0, 1111.0, 717.0, 424.0, 251.0, 182.0, 110.0, 59.0, 37.0, 30.0, 21.0, 11.0, 4.0, 4.0, 7.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0959014892578125, -1.059967041015625, -1.0240325927734375, -0.98809814453125, -0.9521636962890625, -0.916229248046875, -0.8802947998046875, -0.8443603515625, -0.8084259033203125, -0.772491455078125, -0.7365570068359375, -0.70062255859375, -0.6646881103515625, -0.628753662109375, -0.5928192138671875, -0.556884765625, -0.5209503173828125, -0.485015869140625, -0.4490814208984375, -0.41314697265625, -0.3772125244140625, -0.341278076171875, -0.3053436279296875, -0.2694091796875, -0.2334747314453125, -0.197540283203125, -0.1616058349609375, -0.12567138671875, -0.0897369384765625, -0.053802490234375, -0.0178680419921875, 0.01806640625, 0.0540008544921875, 0.089935302734375, 0.1258697509765625, 0.16180419921875, 0.1977386474609375, 0.233673095703125, 0.2696075439453125, 0.3055419921875, 0.3414764404296875, 0.377410888671875, 0.4133453369140625, 0.44927978515625, 0.4852142333984375, 0.521148681640625, 0.5570831298828125, 0.593017578125, 0.6289520263671875, 0.664886474609375, 0.7008209228515625, 0.73675537109375, 0.7726898193359375, 0.808624267578125, 0.8445587158203125, 0.8804931640625, 0.9164276123046875, 0.952362060546875, 0.9882965087890625, 1.02423095703125, 1.0601654052734375, 1.096099853515625, 1.1320343017578125, 1.16796875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 5.0, 15.0, 21.0, 19.0, 24.0, 41.0, 49.0, 56.0, 66.0, 72.0, 89.0, 86.0, 92.0, 140.0, 127.0, 155.0, 179.0, 191.0, 192.0, 222.0, 184.0, 216.0, 211.0, 202.0, 184.0, 167.0, 148.0, 143.0, 144.0, 97.0, 100.0, 61.0, 80.0, 69.0, 53.0, 36.0, 28.0, 25.0, 23.0, 9.0, 13.0, 6.0, 3.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.4287147521972656, -0.41431427001953125, -0.3999137878417969, -0.3855133056640625, -0.3711128234863281, -0.35671234130859375, -0.3423118591308594, -0.327911376953125, -0.3135108947753906, -0.29911041259765625, -0.2847099304199219, -0.2703094482421875, -0.2559089660644531, -0.24150848388671875, -0.22710800170898438, -0.21270751953125, -0.19830703735351562, -0.18390655517578125, -0.16950607299804688, -0.1551055908203125, -0.14070510864257812, -0.12630462646484375, -0.11190414428710938, -0.097503662109375, -0.08310317993164062, -0.06870269775390625, -0.054302215576171875, -0.0399017333984375, -0.025501251220703125, -0.01110076904296875, 0.003299713134765625, 0.0177001953125, 0.032100677490234375, 0.04650115966796875, 0.060901641845703125, 0.0753021240234375, 0.08970260620117188, 0.10410308837890625, 0.11850357055664062, 0.132904052734375, 0.14730453491210938, 0.16170501708984375, 0.17610549926757812, 0.1905059814453125, 0.20490646362304688, 0.21930694580078125, 0.23370742797851562, 0.24810791015625, 0.2625083923339844, 0.27690887451171875, 0.2913093566894531, 0.3057098388671875, 0.3201103210449219, 0.33451080322265625, 0.3489112854003906, 0.363311767578125, 0.3777122497558594, 0.39211273193359375, 0.4065132141113281, 0.4209136962890625, 0.4353141784667969, 0.44971466064453125, 0.4641151428222656, 0.478515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 7.0, 1.0, 3.0, 8.0, 9.0, 21.0, 4.0, 24.0, 27.0, 17.0, 29.0, 37.0, 31.0, 35.0, 49.0, 47.0, 49.0, 40.0, 48.0, 54.0, 40.0, 61.0, 48.0, 45.0, 51.0, 39.0, 34.0, 10.0, 22.0, 22.0, 11.0, 7.0, 11.0, 12.0, 9.0, 4.0, 2.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.58762526512146, -1.5393799543380737, -1.491134524345398, -1.4428892135620117, -1.394643783569336, -1.3463984727859497, -1.2981531620025635, -1.2499077320098877, -1.2016624212265015, -1.1534171104431152, -1.1051716804504395, -1.0569263696670532, -1.008681058883667, -0.9604356288909912, -0.912190318107605, -0.863944947719574, -0.815699577331543, -0.767454206943512, -0.719208836555481, -0.6709635257720947, -0.6227181553840637, -0.5744727849960327, -0.5262274742126465, -0.4779821038246155, -0.4297367334365845, -0.38149136304855347, -0.33324602246284485, -0.28500068187713623, -0.23675531148910522, -0.1885099560022354, -0.1402646005153656, -0.09201925992965698, -0.04377400875091553, 0.004471346735954285, 0.0527167022228241, 0.10096205770969391, 0.14920741319656372, 0.19745276868343353, 0.24569812417030334, 0.29394346475601196, 0.34218883514404297, 0.390434205532074, 0.4386795461177826, 0.4869248867034912, 0.5351702570915222, 0.5834156274795532, 0.6316609382629395, 0.6799063086509705, 0.7281516790390015, 0.7763970494270325, 0.8246424198150635, 0.8728877305984497, 0.9211331009864807, 0.9693784713745117, 1.017623782157898, 1.0658690929412842, 1.11411452293396, 1.1623598337173462, 1.210605263710022, 1.2588505744934082, 1.307096004486084, 1.3553413152694702, 1.4035866260528564, 1.4518320560455322, 1.5000773668289185]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 5.0, 8.0, 10.0, 14.0, 7.0, 19.0, 25.0, 15.0, 23.0, 26.0, 29.0, 31.0, 33.0, 30.0, 26.0, 41.0, 44.0, 38.0, 39.0, 40.0, 44.0, 33.0, 41.0, 34.0, 41.0, 33.0, 22.0, 33.0, 37.0, 34.0, 19.0, 18.0, 18.0, 15.0, 13.0, 7.0, 7.0, 13.0, 7.0, 3.0, 7.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9469460844993591, -0.91257643699646, -0.878206729888916, -0.8438370823860168, -0.8094674348831177, -0.7750977873802185, -0.7407281398773193, -0.7063584327697754, -0.6719887852668762, -0.637619137763977, -0.6032494306564331, -0.5688797831535339, -0.5345101356506348, -0.5001404881477356, -0.46577081084251404, -0.4314011335372925, -0.3970314860343933, -0.36266183853149414, -0.3282921612262726, -0.293922483921051, -0.25955283641815186, -0.2251831740140915, -0.19081351161003113, -0.15644384920597076, -0.1220741868019104, -0.08770452439785004, -0.05333486199378967, -0.01896519958972931, 0.015404462814331055, 0.04977412521839142, 0.08414378762245178, 0.11851345002651215, 0.15288305282592773, 0.1872527152299881, 0.22162237763404846, 0.25599205493927, 0.2903617024421692, 0.32473134994506836, 0.3591010272502899, 0.3934707045555115, 0.42784035205841064, 0.4622099995613098, 0.49657967686653137, 0.5309493541717529, 0.5653190016746521, 0.5996886491775513, 0.6340583562850952, 0.6684280037879944, 0.7027976512908936, 0.7371672987937927, 0.7715369462966919, 0.8059066534042358, 0.840276300907135, 0.8746459484100342, 0.9090156555175781, 0.9433853030204773, 0.9777549505233765, 1.0121246576309204, 1.0464942455291748, 1.0808639526367188, 1.1152336597442627, 1.149603247642517, 1.183972954750061, 1.2183425426483154, 1.2527122497558594]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 17.0, 29.0, 58.0, 80.0, 132.0, 217.0, 323.0, 509.0, 782.0, 1239.0, 1847.0, 2890.0, 4691.0, 7261.0, 11411.0, 17941.0, 28141.0, 44028.0, 66459.0, 97515.0, 131501.0, 153763.0, 144211.0, 110781.0, 78027.0, 51626.0, 33684.0, 21337.0, 13813.0, 8786.0, 5674.0, 3549.0, 2228.0, 1407.0, 933.0, 575.0, 392.0, 260.0, 143.0, 96.0, 64.0, 41.0, 31.0, 17.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22223663330078125, -0.2144927978515625, -0.20674896240234375, -0.199005126953125, -0.19126129150390625, -0.1835174560546875, -0.17577362060546875, -0.16802978515625, -0.16028594970703125, -0.1525421142578125, -0.14479827880859375, -0.137054443359375, -0.12931060791015625, -0.1215667724609375, -0.11382293701171875, -0.1060791015625, -0.09833526611328125, -0.0905914306640625, -0.08284759521484375, -0.075103759765625, -0.06735992431640625, -0.0596160888671875, -0.05187225341796875, -0.04412841796875, -0.03638458251953125, -0.0286407470703125, -0.02089691162109375, -0.013153076171875, -0.00540924072265625, 0.0023345947265625, 0.01007843017578125, 0.017822265625, 0.02556610107421875, 0.0333099365234375, 0.04105377197265625, 0.048797607421875, 0.05654144287109375, 0.0642852783203125, 0.07202911376953125, 0.07977294921875, 0.08751678466796875, 0.0952606201171875, 0.10300445556640625, 0.110748291015625, 0.11849212646484375, 0.1262359619140625, 0.13397979736328125, 0.1417236328125, 0.14946746826171875, 0.1572113037109375, 0.16495513916015625, 0.172698974609375, 0.18044281005859375, 0.1881866455078125, 0.19593048095703125, 0.20367431640625, 0.21141815185546875, 0.2191619873046875, 0.22690582275390625, 0.234649658203125, 0.24239349365234375, 0.2501373291015625, 0.25788116455078125, 0.265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 7.0, 4.0, 6.0, 3.0, 8.0, 10.0, 17.0, 16.0, 21.0, 29.0, 18.0, 30.0, 41.0, 39.0, 35.0, 35.0, 39.0, 43.0, 35.0, 40.0, 37.0, 54.0, 32.0, 39.0, 43.0, 32.0, 45.0, 27.0, 31.0, 37.0, 25.0, 23.0, 18.0, 12.0, 11.0, 12.0, 7.0, 9.0, 2.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2645416259765625, -1.225372314453125, -1.1862030029296875, -1.14703369140625, -1.1078643798828125, -1.068695068359375, -1.0295257568359375, -0.9903564453125, -0.9511871337890625, -0.912017822265625, -0.8728485107421875, -0.83367919921875, -0.7945098876953125, -0.755340576171875, -0.7161712646484375, -0.677001953125, -0.6378326416015625, -0.598663330078125, -0.5594940185546875, -0.52032470703125, -0.4811553955078125, -0.441986083984375, -0.4028167724609375, -0.3636474609375, -0.3244781494140625, -0.285308837890625, -0.2461395263671875, -0.20697021484375, -0.1678009033203125, -0.128631591796875, -0.0894622802734375, -0.05029296875, -0.0111236572265625, 0.028045654296875, 0.0672149658203125, 0.10638427734375, 0.1455535888671875, 0.184722900390625, 0.2238922119140625, 0.2630615234375, 0.3022308349609375, 0.341400146484375, 0.3805694580078125, 0.41973876953125, 0.4589080810546875, 0.498077392578125, 0.5372467041015625, 0.576416015625, 0.6155853271484375, 0.654754638671875, 0.6939239501953125, 0.73309326171875, 0.7722625732421875, 0.811431884765625, 0.8506011962890625, 0.8897705078125, 0.9289398193359375, 0.968109130859375, 1.0072784423828125, 1.04644775390625, 1.0856170654296875, 1.124786376953125, 1.1639556884765625, 1.203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 4.0, 13.0, 17.0, 16.0, 32.0, 70.0, 63.0, 132.0, 169.0, 250.0, 485.0, 729.0, 1315.0, 2065.0, 3783.0, 6854.0, 12615.0, 24199.0, 45849.0, 87053.0, 153431.0, 218223.0, 203564.0, 132397.0, 72529.0, 38114.0, 20149.0, 10826.0, 5734.0, 3248.0, 1827.0, 1050.0, 654.0, 389.0, 238.0, 164.0, 95.0, 54.0, 45.0, 30.0, 21.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3344306945800781, -0.32242584228515625, -0.3104209899902344, -0.2984161376953125, -0.2864112854003906, -0.27440643310546875, -0.2624015808105469, -0.250396728515625, -0.23839187622070312, -0.22638702392578125, -0.21438217163085938, -0.2023773193359375, -0.19037246704101562, -0.17836761474609375, -0.16636276245117188, -0.15435791015625, -0.14235305786132812, -0.13034820556640625, -0.11834335327148438, -0.1063385009765625, -0.09433364868164062, -0.08232879638671875, -0.07032394409179688, -0.058319091796875, -0.046314239501953125, -0.03430938720703125, -0.022304534912109375, -0.0102996826171875, 0.001705169677734375, 0.01371002197265625, 0.025714874267578125, 0.0377197265625, 0.049724578857421875, 0.06172943115234375, 0.07373428344726562, 0.0857391357421875, 0.09774398803710938, 0.10974884033203125, 0.12175369262695312, 0.133758544921875, 0.14576339721679688, 0.15776824951171875, 0.16977310180664062, 0.1817779541015625, 0.19378280639648438, 0.20578765869140625, 0.21779251098632812, 0.22979736328125, 0.24180221557617188, 0.25380706787109375, 0.2658119201660156, 0.2778167724609375, 0.2898216247558594, 0.30182647705078125, 0.3138313293457031, 0.325836181640625, 0.3378410339355469, 0.34984588623046875, 0.3618507385253906, 0.3738555908203125, 0.3858604431152344, 0.39786529541015625, 0.4098701477050781, 0.421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 15.0, 9.0, 12.0, 15.0, 18.0, 14.0, 20.0, 30.0, 21.0, 22.0, 25.0, 30.0, 25.0, 37.0, 48.0, 44.0, 34.0, 40.0, 42.0, 50.0, 34.0, 42.0, 43.0, 37.0, 32.0, 32.0, 43.0, 18.0, 36.0, 14.0, 14.0, 13.0, 11.0, 11.0, 8.0, 12.0, 9.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7030868530273438, -0.6800994873046875, -0.6571121215820312, -0.634124755859375, -0.6111373901367188, -0.5881500244140625, -0.5651626586914062, -0.54217529296875, -0.5191879272460938, -0.4962005615234375, -0.47321319580078125, -0.450225830078125, -0.42723846435546875, -0.4042510986328125, -0.38126373291015625, -0.3582763671875, -0.33528900146484375, -0.3123016357421875, -0.28931427001953125, -0.266326904296875, -0.24333953857421875, -0.2203521728515625, -0.19736480712890625, -0.17437744140625, -0.15139007568359375, -0.1284027099609375, -0.10541534423828125, -0.082427978515625, -0.05944061279296875, -0.0364532470703125, -0.01346588134765625, 0.009521484375, 0.03250885009765625, 0.0554962158203125, 0.07848358154296875, 0.101470947265625, 0.12445831298828125, 0.1474456787109375, 0.17043304443359375, 0.19342041015625, 0.21640777587890625, 0.2393951416015625, 0.26238250732421875, 0.285369873046875, 0.30835723876953125, 0.3313446044921875, 0.35433197021484375, 0.3773193359375, 0.40030670166015625, 0.4232940673828125, 0.44628143310546875, 0.469268798828125, 0.49225616455078125, 0.5152435302734375, 0.5382308959960938, 0.56121826171875, 0.5842056274414062, 0.6071929931640625, 0.6301803588867188, 0.653167724609375, 0.6761550903320312, 0.6991424560546875, 0.7221298217773438, 0.7451171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 32.0, 23.0, 46.0, 54.0, 102.0, 160.0, 184.0, 321.0, 511.0, 749.0, 1195.0, 1951.0, 3226.0, 5470.0, 10192.0, 20521.0, 47821.0, 132885.0, 374830.0, 283790.0, 92254.0, 35682.0, 16228.0, 8277.0, 4553.0, 2758.0, 1689.0, 1065.0, 693.0, 423.0, 242.0, 169.0, 99.0, 105.0, 70.0, 36.0, 26.0, 27.0, 15.0, 13.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.199462890625, -0.19373703002929688, -0.18801116943359375, -0.18228530883789062, -0.1765594482421875, -0.17083358764648438, -0.16510772705078125, -0.15938186645507812, -0.153656005859375, -0.14793014526367188, -0.14220428466796875, -0.13647842407226562, -0.1307525634765625, -0.12502670288085938, -0.11930084228515625, -0.11357498168945312, -0.10784912109375, -0.10212326049804688, -0.09639739990234375, -0.09067153930664062, -0.0849456787109375, -0.07921981811523438, -0.07349395751953125, -0.06776809692382812, -0.062042236328125, -0.056316375732421875, -0.05059051513671875, -0.044864654541015625, -0.0391387939453125, -0.033412933349609375, -0.02768707275390625, -0.021961212158203125, -0.0162353515625, -0.010509490966796875, -0.00478363037109375, 0.000942230224609375, 0.0066680908203125, 0.012393951416015625, 0.01811981201171875, 0.023845672607421875, 0.029571533203125, 0.035297393798828125, 0.04102325439453125, 0.046749114990234375, 0.0524749755859375, 0.058200836181640625, 0.06392669677734375, 0.06965255737304688, 0.07537841796875, 0.08110427856445312, 0.08683013916015625, 0.09255599975585938, 0.0982818603515625, 0.10400772094726562, 0.10973358154296875, 0.11545944213867188, 0.121185302734375, 0.12691116333007812, 0.13263702392578125, 0.13836288452148438, 0.1440887451171875, 0.14981460571289062, 0.15554046630859375, 0.16126632690429688, 0.1669921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 6.0, 12.0, 11.0, 6.0, 14.0, 20.0, 10.0, 15.0, 18.0, 15.0, 26.0, 30.0, 46.0, 36.0, 36.0, 37.0, 46.0, 37.0, 43.0, 44.0, 41.0, 32.0, 30.0, 40.0, 50.0, 46.0, 29.0, 26.0, 29.0, 27.0, 15.0, 21.0, 16.0, 15.0, 7.0, 15.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.445923984050751e-06, -7.202848792076111e-06, -6.959773600101471e-06, -6.716698408126831e-06, -6.473623216152191e-06, -6.230548024177551e-06, -5.987472832202911e-06, -5.7443976402282715e-06, -5.501322448253632e-06, -5.258247256278992e-06, -5.015172064304352e-06, -4.772096872329712e-06, -4.529021680355072e-06, -4.285946488380432e-06, -4.042871296405792e-06, -3.7997961044311523e-06, -3.5567209124565125e-06, -3.3136457204818726e-06, -3.0705705285072327e-06, -2.8274953365325928e-06, -2.584420144557953e-06, -2.341344952583313e-06, -2.098269760608673e-06, -1.8551945686340332e-06, -1.6121193766593933e-06, -1.3690441846847534e-06, -1.1259689927101135e-06, -8.828938007354736e-07, -6.398186087608337e-07, -3.9674341678619385e-07, -1.5366822481155396e-07, 8.940696716308594e-08, 3.3248215913772583e-07, 5.755573511123657e-07, 8.186325430870056e-07, 1.0617077350616455e-06, 1.3047829270362854e-06, 1.5478581190109253e-06, 1.7909333109855652e-06, 2.034008502960205e-06, 2.277083694934845e-06, 2.520158886909485e-06, 2.7632340788841248e-06, 3.0063092708587646e-06, 3.2493844628334045e-06, 3.4924596548080444e-06, 3.7355348467826843e-06, 3.978610038757324e-06, 4.221685230731964e-06, 4.464760422706604e-06, 4.707835614681244e-06, 4.950910806655884e-06, 5.193985998630524e-06, 5.4370611906051636e-06, 5.6801363825798035e-06, 5.923211574554443e-06, 6.166286766529083e-06, 6.409361958503723e-06, 6.652437150478363e-06, 6.895512342453003e-06, 7.138587534427643e-06, 7.381662726402283e-06, 7.624737918376923e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 12.0, 23.0, 30.0, 36.0, 62.0, 116.0, 164.0, 239.0, 424.0, 666.0, 1065.0, 1836.0, 3230.0, 5851.0, 11140.0, 22446.0, 46314.0, 101049.0, 209933.0, 286311.0, 186535.0, 88597.0, 40421.0, 19503.0, 10092.0, 5292.0, 2853.0, 1686.0, 985.0, 625.0, 366.0, 221.0, 153.0, 120.0, 59.0, 43.0, 16.0, 16.0, 7.0, 1.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.197998046875, -0.19256019592285156, -0.18712234497070312, -0.1816844940185547, -0.17624664306640625, -0.1708087921142578, -0.16537094116210938, -0.15993309020996094, -0.1544952392578125, -0.14905738830566406, -0.14361953735351562, -0.1381816864013672, -0.13274383544921875, -0.1273059844970703, -0.12186813354492188, -0.11643028259277344, -0.110992431640625, -0.10555458068847656, -0.10011672973632812, -0.09467887878417969, -0.08924102783203125, -0.08380317687988281, -0.07836532592773438, -0.07292747497558594, -0.0674896240234375, -0.06205177307128906, -0.056613922119140625, -0.05117607116699219, -0.04573822021484375, -0.04030036926269531, -0.034862518310546875, -0.029424667358398438, -0.02398681640625, -0.018548965454101562, -0.013111114501953125, -0.0076732635498046875, -0.00223541259765625, 0.0032024383544921875, 0.008640289306640625, 0.014078140258789062, 0.0195159912109375, 0.024953842163085938, 0.030391693115234375, 0.03582954406738281, 0.04126739501953125, 0.04670524597167969, 0.052143096923828125, 0.05758094787597656, 0.063018798828125, 0.06845664978027344, 0.07389450073242188, 0.07933235168457031, 0.08477020263671875, 0.09020805358886719, 0.09564590454101562, 0.10108375549316406, 0.1065216064453125, 0.11195945739746094, 0.11739730834960938, 0.12283515930175781, 0.12827301025390625, 0.1337108612060547, 0.13914871215820312, 0.14458656311035156, 0.1500244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 8.0, 5.0, 11.0, 14.0, 20.0, 12.0, 13.0, 18.0, 36.0, 37.0, 40.0, 36.0, 49.0, 58.0, 58.0, 65.0, 49.0, 57.0, 44.0, 44.0, 40.0, 41.0, 34.0, 31.0, 25.0, 25.0, 19.0, 17.0, 10.0, 7.0, 9.0, 13.0, 6.0, 8.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.036956787109375, -0.0358738899230957, -0.034790992736816406, -0.03370809555053711, -0.03262519836425781, -0.031542301177978516, -0.03045940399169922, -0.029376506805419922, -0.028293609619140625, -0.027210712432861328, -0.02612781524658203, -0.025044918060302734, -0.023962020874023438, -0.02287912368774414, -0.021796226501464844, -0.020713329315185547, -0.01963043212890625, -0.018547534942626953, -0.017464637756347656, -0.01638174057006836, -0.015298843383789062, -0.014215946197509766, -0.013133049011230469, -0.012050151824951172, -0.010967254638671875, -0.009884357452392578, -0.008801460266113281, -0.007718563079833984, -0.0066356658935546875, -0.005552768707275391, -0.004469871520996094, -0.003386974334716797, -0.0023040771484375, -0.0012211799621582031, -0.00013828277587890625, 0.0009446144104003906, 0.0020275115966796875, 0.0031104087829589844, 0.004193305969238281, 0.005276203155517578, 0.006359100341796875, 0.007441997528076172, 0.008524894714355469, 0.009607791900634766, 0.010690689086914062, 0.01177358627319336, 0.012856483459472656, 0.013939380645751953, 0.01502227783203125, 0.016105175018310547, 0.017188072204589844, 0.01827096939086914, 0.019353866577148438, 0.020436763763427734, 0.02151966094970703, 0.022602558135986328, 0.023685455322265625, 0.024768352508544922, 0.02585124969482422, 0.026934146881103516, 0.028017044067382812, 0.02909994125366211, 0.030182838439941406, 0.0312657356262207, 0.0323486328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 1.0, 1.0, 9.0, 8.0, 15.0, 14.0, 18.0, 26.0, 26.0, 23.0, 32.0, 25.0, 36.0, 49.0, 51.0, 45.0, 37.0, 51.0, 54.0, 48.0, 56.0, 47.0, 41.0, 46.0, 47.0, 32.0, 20.0, 21.0, 17.0, 16.0, 11.0, 9.0, 10.0, 11.0, 5.0, 3.0, 7.0, 3.0, 6.0, 5.0, 0.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.542368769645691, -1.4943792819976807, -1.44638991355896, -1.3984004259109497, -1.3504109382629395, -1.3024214506149292, -1.254431962966919, -1.2064425945281982, -1.158453106880188, -1.1104636192321777, -1.062474250793457, -1.0144847631454468, -0.9664952754974365, -0.9185057878494263, -0.8705163598060608, -0.8225269317626953, -0.7745374441146851, -0.7265479564666748, -0.6785585284233093, -0.6305691003799438, -0.5825796127319336, -0.5345901250839233, -0.48660069704055786, -0.43861123919487, -0.39062178134918213, -0.34263232350349426, -0.2946428656578064, -0.24665340781211853, -0.19866394996643066, -0.1506744921207428, -0.10268503427505493, -0.054695576429367065, -0.0067059993743896484, 0.04128345847129822, 0.08927291631698608, 0.13726237416267395, 0.18525183200836182, 0.23324128985404968, 0.28123074769973755, 0.3292202055454254, 0.3772096633911133, 0.42519912123680115, 0.473188579082489, 0.5211780071258545, 0.5691674947738647, 0.617156982421875, 0.6651464104652405, 0.713135838508606, 0.7611253261566162, 0.8091148138046265, 0.8571042418479919, 0.9050936698913574, 0.9530831575393677, 1.001072645187378, 1.0490620136260986, 1.0970515012741089, 1.1450409889221191, 1.1930304765701294, 1.2410199642181396, 1.2890093326568604, 1.3369988203048706, 1.3849883079528809, 1.4329776763916016, 1.4809671640396118, 1.528956651687622]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 10.0, 6.0, 7.0, 9.0, 8.0, 13.0, 8.0, 19.0, 25.0, 16.0, 24.0, 26.0, 27.0, 30.0, 31.0, 34.0, 26.0, 38.0, 40.0, 36.0, 50.0, 38.0, 41.0, 36.0, 34.0, 34.0, 42.0, 34.0, 27.0, 29.0, 35.0, 34.0, 25.0, 17.0, 18.0, 15.0, 13.0, 6.0, 8.0, 12.0, 7.0, 4.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9426308274269104, -0.908301591873169, -0.8739722967147827, -0.8396430611610413, -0.8053138256072998, -0.7709845900535583, -0.7366553544998169, -0.7023260593414307, -0.6679968237876892, -0.6336675882339478, -0.5993382930755615, -0.5650090575218201, -0.5306798219680786, -0.49635058641433716, -0.4620213210582733, -0.4276920557022095, -0.393362820148468, -0.35903358459472656, -0.3247043192386627, -0.2903750538825989, -0.2560458183288574, -0.22171656787395477, -0.18738731741905212, -0.15305806696414948, -0.11872881650924683, -0.08439956605434418, -0.05007031559944153, -0.01574106514453888, 0.01858818531036377, 0.05291743576526642, 0.08724668622016907, 0.12157593667507172, 0.1559051275253296, 0.19023437798023224, 0.2245636284351349, 0.25889289379119873, 0.2932221293449402, 0.32755136489868164, 0.3618806302547455, 0.3962098956108093, 0.4305391311645508, 0.46486836671829224, 0.4991976320743561, 0.5335268974304199, 0.5678561329841614, 0.6021853685379028, 0.6365146636962891, 0.6708438992500305, 0.705173134803772, 0.7395023703575134, 0.7738316059112549, 0.8081609010696411, 0.8424901366233826, 0.876819372177124, 0.9111486673355103, 0.9454779028892517, 0.9798071384429932, 1.0141364336013794, 1.048465609550476, 1.0827949047088623, 1.117124080657959, 1.1514533758163452, 1.1857826709747314, 1.2201118469238281, 1.2544411420822144]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 18.0, 10.0, 23.0, 45.0, 56.0, 101.0, 196.0, 313.0, 462.0, 797.0, 1301.0, 2144.0, 3470.0, 5554.0, 9074.0, 14025.0, 21432.0, 31929.0, 46236.0, 62590.0, 81074.0, 98146.0, 109613.0, 112145.0, 106358.0, 92312.0, 74645.0, 56736.0, 40207.0, 27881.0, 18387.0, 11884.0, 7364.0, 4746.0, 2857.0, 1695.0, 1077.0, 691.0, 396.0, 217.0, 130.0, 94.0, 48.0, 28.0, 21.0, 16.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.0693359375, -1.0381698608398438, -1.0070037841796875, -0.9758377075195312, -0.944671630859375, -0.9135055541992188, -0.8823394775390625, -0.8511734008789062, -0.82000732421875, -0.7888412475585938, -0.7576751708984375, -0.7265090942382812, -0.695343017578125, -0.6641769409179688, -0.6330108642578125, -0.6018447875976562, -0.5706787109375, -0.5395126342773438, -0.5083465576171875, -0.47718048095703125, -0.446014404296875, -0.41484832763671875, -0.3836822509765625, -0.35251617431640625, -0.32135009765625, -0.29018402099609375, -0.2590179443359375, -0.22785186767578125, -0.196685791015625, -0.16551971435546875, -0.1343536376953125, -0.10318756103515625, -0.072021484375, -0.04085540771484375, -0.0096893310546875, 0.02147674560546875, 0.052642822265625, 0.08380889892578125, 0.1149749755859375, 0.14614105224609375, 0.17730712890625, 0.20847320556640625, 0.2396392822265625, 0.27080535888671875, 0.301971435546875, 0.33313751220703125, 0.3643035888671875, 0.39546966552734375, 0.4266357421875, 0.45780181884765625, 0.4889678955078125, 0.5201339721679688, 0.551300048828125, 0.5824661254882812, 0.6136322021484375, 0.6447982788085938, 0.67596435546875, 0.7071304321289062, 0.7382965087890625, 0.7694625854492188, 0.800628662109375, 0.8317947387695312, 0.8629608154296875, 0.8941268920898438, 0.92529296875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 3.0, 9.0, 7.0, 13.0, 10.0, 19.0, 14.0, 21.0, 14.0, 16.0, 20.0, 20.0, 23.0, 25.0, 37.0, 24.0, 39.0, 31.0, 36.0, 32.0, 36.0, 47.0, 38.0, 40.0, 34.0, 45.0, 32.0, 35.0, 29.0, 18.0, 35.0, 30.0, 14.0, 26.0, 17.0, 14.0, 10.0, 19.0, 12.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.00390625, -0.969512939453125, -0.93511962890625, -0.900726318359375, -0.8663330078125, -0.831939697265625, -0.79754638671875, -0.763153076171875, -0.728759765625, -0.694366455078125, -0.65997314453125, -0.625579833984375, -0.5911865234375, -0.556793212890625, -0.52239990234375, -0.488006591796875, -0.45361328125, -0.419219970703125, -0.38482666015625, -0.350433349609375, -0.3160400390625, -0.281646728515625, -0.24725341796875, -0.212860107421875, -0.178466796875, -0.144073486328125, -0.10968017578125, -0.075286865234375, -0.0408935546875, -0.006500244140625, 0.02789306640625, 0.062286376953125, 0.0966796875, 0.131072998046875, 0.16546630859375, 0.199859619140625, 0.2342529296875, 0.268646240234375, 0.30303955078125, 0.337432861328125, 0.371826171875, 0.406219482421875, 0.44061279296875, 0.475006103515625, 0.5093994140625, 0.543792724609375, 0.57818603515625, 0.612579345703125, 0.64697265625, 0.681365966796875, 0.71575927734375, 0.750152587890625, 0.7845458984375, 0.818939208984375, 0.85333251953125, 0.887725830078125, 0.922119140625, 0.956512451171875, 0.99090576171875, 1.025299072265625, 1.0596923828125, 1.094085693359375, 1.12847900390625, 1.162872314453125, 1.197265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 9.0, 4.0, 9.0, 13.0, 26.0, 39.0, 72.0, 82.0, 121.0, 177.0, 266.0, 477.0, 676.0, 978.0, 1503.0, 2389.0, 3548.0, 5526.0, 8398.0, 12473.0, 18010.0, 26113.0, 36334.0, 48920.0, 63210.0, 77698.0, 89308.0, 97870.0, 99361.0, 95435.0, 84868.0, 71558.0, 57634.0, 43627.0, 32365.0, 22577.0, 15850.0, 10575.0, 7127.0, 4665.0, 2954.0, 2017.0, 1277.0, 825.0, 554.0, 376.0, 219.0, 164.0, 90.0, 83.0, 33.0, 30.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0], "bins": [-0.88916015625, -0.86163330078125, -0.8341064453125, -0.80657958984375, -0.779052734375, -0.75152587890625, -0.7239990234375, -0.69647216796875, -0.6689453125, -0.64141845703125, -0.6138916015625, -0.58636474609375, -0.558837890625, -0.53131103515625, -0.5037841796875, -0.47625732421875, -0.44873046875, -0.42120361328125, -0.3936767578125, -0.36614990234375, -0.338623046875, -0.31109619140625, -0.2835693359375, -0.25604248046875, -0.228515625, -0.20098876953125, -0.1734619140625, -0.14593505859375, -0.118408203125, -0.09088134765625, -0.0633544921875, -0.03582763671875, -0.00830078125, 0.01922607421875, 0.0467529296875, 0.07427978515625, 0.101806640625, 0.12933349609375, 0.1568603515625, 0.18438720703125, 0.2119140625, 0.23944091796875, 0.2669677734375, 0.29449462890625, 0.322021484375, 0.34954833984375, 0.3770751953125, 0.40460205078125, 0.43212890625, 0.45965576171875, 0.4871826171875, 0.51470947265625, 0.542236328125, 0.56976318359375, 0.5972900390625, 0.62481689453125, 0.65234375, 0.67987060546875, 0.7073974609375, 0.73492431640625, 0.762451171875, 0.78997802734375, 0.8175048828125, 0.84503173828125, 0.87255859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 8.0, 9.0, 6.0, 10.0, 15.0, 18.0, 18.0, 26.0, 32.0, 27.0, 33.0, 34.0, 35.0, 38.0, 47.0, 41.0, 43.0, 39.0, 51.0, 46.0, 33.0, 35.0, 25.0, 42.0, 33.0, 27.0, 24.0, 31.0, 25.0, 22.0, 24.0, 21.0, 9.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7119598388671875, -0.688568115234375, -0.6651763916015625, -0.64178466796875, -0.6183929443359375, -0.595001220703125, -0.5716094970703125, -0.5482177734375, -0.5248260498046875, -0.501434326171875, -0.4780426025390625, -0.45465087890625, -0.4312591552734375, -0.407867431640625, -0.3844757080078125, -0.361083984375, -0.3376922607421875, -0.314300537109375, -0.2909088134765625, -0.26751708984375, -0.2441253662109375, -0.220733642578125, -0.1973419189453125, -0.1739501953125, -0.1505584716796875, -0.127166748046875, -0.1037750244140625, -0.08038330078125, -0.0569915771484375, -0.033599853515625, -0.0102081298828125, 0.01318359375, 0.0365753173828125, 0.059967041015625, 0.0833587646484375, 0.10675048828125, 0.1301422119140625, 0.153533935546875, 0.1769256591796875, 0.2003173828125, 0.2237091064453125, 0.247100830078125, 0.2704925537109375, 0.29388427734375, 0.3172760009765625, 0.340667724609375, 0.3640594482421875, 0.387451171875, 0.4108428955078125, 0.434234619140625, 0.4576263427734375, 0.48101806640625, 0.5044097900390625, 0.527801513671875, 0.5511932373046875, 0.5745849609375, 0.5979766845703125, 0.621368408203125, 0.6447601318359375, 0.66815185546875, 0.6915435791015625, 0.714935302734375, 0.7383270263671875, 0.76171875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 26.0, 23.0, 34.0, 67.0, 91.0, 140.0, 204.0, 316.0, 442.0, 720.0, 1123.0, 1711.0, 2578.0, 4119.0, 6639.0, 10492.0, 16850.0, 27204.0, 43180.0, 67381.0, 97196.0, 128152.0, 145784.0, 140292.0, 115908.0, 84659.0, 56949.0, 36088.0, 22574.0, 13903.0, 8576.0, 5370.0, 3394.0, 2155.0, 1455.0, 917.0, 654.0, 435.0, 239.0, 160.0, 125.0, 72.0, 58.0, 33.0, 16.0, 18.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65234375, -0.6318283081054688, -0.6113128662109375, -0.5907974243164062, -0.570281982421875, -0.5497665405273438, -0.5292510986328125, -0.5087356567382812, -0.48822021484375, -0.46770477294921875, -0.4471893310546875, -0.42667388916015625, -0.406158447265625, -0.38564300537109375, -0.3651275634765625, -0.34461212158203125, -0.3240966796875, -0.30358123779296875, -0.2830657958984375, -0.26255035400390625, -0.242034912109375, -0.22151947021484375, -0.2010040283203125, -0.18048858642578125, -0.15997314453125, -0.13945770263671875, -0.1189422607421875, -0.09842681884765625, -0.077911376953125, -0.05739593505859375, -0.0368804931640625, -0.01636505126953125, 0.004150390625, 0.02466583251953125, 0.0451812744140625, 0.06569671630859375, 0.086212158203125, 0.10672760009765625, 0.1272430419921875, 0.14775848388671875, 0.16827392578125, 0.18878936767578125, 0.2093048095703125, 0.22982025146484375, 0.250335693359375, 0.27085113525390625, 0.2913665771484375, 0.31188201904296875, 0.3323974609375, 0.35291290283203125, 0.3734283447265625, 0.39394378662109375, 0.414459228515625, 0.43497467041015625, 0.4554901123046875, 0.47600555419921875, 0.49652099609375, 0.5170364379882812, 0.5375518798828125, 0.5580673217773438, 0.578582763671875, 0.5990982055664062, 0.6196136474609375, 0.6401290893554688, 0.66064453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 7.0, 9.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 30.0, 35.0, 46.0, 53.0, 49.0, 44.0, 57.0, 58.0, 58.0, 58.0, 49.0, 57.0, 52.0, 35.0, 46.0, 29.0, 26.0, 18.0, 16.0, 14.0, 11.0, 15.0, 11.0, 4.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.841868162155151e-05, -6.614625453948975e-05, -6.387382745742798e-05, -6.160140037536621e-05, -5.932897329330444e-05, -5.7056546211242676e-05, -5.478411912918091e-05, -5.251169204711914e-05, -5.023926496505737e-05, -4.7966837882995605e-05, -4.569441080093384e-05, -4.342198371887207e-05, -4.11495566368103e-05, -3.8877129554748535e-05, -3.660470247268677e-05, -3.4332275390625e-05, -3.205984830856323e-05, -2.9787421226501465e-05, -2.7514994144439697e-05, -2.524256706237793e-05, -2.2970139980316162e-05, -2.0697712898254395e-05, -1.8425285816192627e-05, -1.615285873413086e-05, -1.3880431652069092e-05, -1.1608004570007324e-05, -9.335577487945557e-06, -7.063150405883789e-06, -4.7907233238220215e-06, -2.518296241760254e-06, -2.4586915969848633e-07, 2.0265579223632812e-06, 4.298985004425049e-06, 6.571412086486816e-06, 8.843839168548584e-06, 1.1116266250610352e-05, 1.3388693332672119e-05, 1.5661120414733887e-05, 1.7933547496795654e-05, 2.0205974578857422e-05, 2.247840166091919e-05, 2.4750828742980957e-05, 2.7023255825042725e-05, 2.9295682907104492e-05, 3.156810998916626e-05, 3.384053707122803e-05, 3.6112964153289795e-05, 3.838539123535156e-05, 4.065781831741333e-05, 4.29302453994751e-05, 4.5202672481536865e-05, 4.747509956359863e-05, 4.97475266456604e-05, 5.201995372772217e-05, 5.4292380809783936e-05, 5.65648078918457e-05, 5.883723497390747e-05, 6.110966205596924e-05, 6.3382089138031e-05, 6.565451622009277e-05, 6.792694330215454e-05, 7.019937038421631e-05, 7.247179746627808e-05, 7.474422454833984e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 3.0, 15.0, 19.0, 29.0, 46.0, 42.0, 90.0, 113.0, 141.0, 227.0, 312.0, 487.0, 711.0, 1077.0, 1674.0, 2668.0, 4250.0, 6433.0, 10284.0, 16137.0, 24976.0, 38845.0, 57677.0, 81109.0, 107378.0, 127329.0, 132846.0, 120742.0, 98360.0, 72531.0, 49906.0, 32907.0, 21387.0, 13490.0, 8662.0, 5562.0, 3464.0, 2240.0, 1455.0, 980.0, 598.0, 416.0, 283.0, 193.0, 122.0, 95.0, 65.0, 56.0, 35.0, 22.0, 21.0, 10.0, 10.0, 10.0, 4.0, 4.0, 2.0, 5.0], "bins": [-0.60009765625, -0.5815277099609375, -0.562957763671875, -0.5443878173828125, -0.52581787109375, -0.5072479248046875, -0.488677978515625, -0.4701080322265625, -0.4515380859375, -0.4329681396484375, -0.414398193359375, -0.3958282470703125, -0.37725830078125, -0.3586883544921875, -0.340118408203125, -0.3215484619140625, -0.302978515625, -0.2844085693359375, -0.265838623046875, -0.2472686767578125, -0.22869873046875, -0.2101287841796875, -0.191558837890625, -0.1729888916015625, -0.1544189453125, -0.1358489990234375, -0.117279052734375, -0.0987091064453125, -0.08013916015625, -0.0615692138671875, -0.042999267578125, -0.0244293212890625, -0.005859375, 0.0127105712890625, 0.031280517578125, 0.0498504638671875, 0.06842041015625, 0.0869903564453125, 0.105560302734375, 0.1241302490234375, 0.1427001953125, 0.1612701416015625, 0.179840087890625, 0.1984100341796875, 0.21697998046875, 0.2355499267578125, 0.254119873046875, 0.2726898193359375, 0.291259765625, 0.3098297119140625, 0.328399658203125, 0.3469696044921875, 0.36553955078125, 0.3841094970703125, 0.402679443359375, 0.4212493896484375, 0.4398193359375, 0.4583892822265625, 0.476959228515625, 0.4955291748046875, 0.51409912109375, 0.5326690673828125, 0.551239013671875, 0.5698089599609375, 0.58837890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 18.0, 18.0, 21.0, 19.0, 27.0, 23.0, 30.0, 37.0, 37.0, 47.0, 44.0, 58.0, 50.0, 42.0, 56.0, 39.0, 45.0, 51.0, 28.0, 35.0, 42.0, 40.0, 33.0, 28.0, 15.0, 19.0, 15.0, 13.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 0.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2127685546875, -0.20659637451171875, -0.2004241943359375, -0.19425201416015625, -0.188079833984375, -0.18190765380859375, -0.1757354736328125, -0.16956329345703125, -0.16339111328125, -0.15721893310546875, -0.1510467529296875, -0.14487457275390625, -0.138702392578125, -0.13253021240234375, -0.1263580322265625, -0.12018585205078125, -0.114013671875, -0.10784149169921875, -0.1016693115234375, -0.09549713134765625, -0.089324951171875, -0.08315277099609375, -0.0769805908203125, -0.07080841064453125, -0.06463623046875, -0.05846405029296875, -0.0522918701171875, -0.04611968994140625, -0.039947509765625, -0.03377532958984375, -0.0276031494140625, -0.02143096923828125, -0.0152587890625, -0.00908660888671875, -0.0029144287109375, 0.00325775146484375, 0.009429931640625, 0.01560211181640625, 0.0217742919921875, 0.02794647216796875, 0.03411865234375, 0.04029083251953125, 0.0464630126953125, 0.05263519287109375, 0.058807373046875, 0.06497955322265625, 0.0711517333984375, 0.07732391357421875, 0.08349609375, 0.08966827392578125, 0.0958404541015625, 0.10201263427734375, 0.108184814453125, 0.11435699462890625, 0.1205291748046875, 0.12670135498046875, 0.13287353515625, 0.13904571533203125, 0.1452178955078125, 0.15139007568359375, 0.157562255859375, 0.16373443603515625, 0.1699066162109375, 0.17607879638671875, 0.1822509765625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 5.0, 10.0, 22.0, 28.0, 24.0, 28.0, 32.0, 47.0, 38.0, 48.0, 46.0, 44.0, 66.0, 51.0, 47.0, 59.0, 63.0, 50.0, 51.0, 39.0, 27.0, 36.0, 18.0, 14.0, 20.0, 11.0, 7.0, 13.0, 7.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67812180519104, -1.6232253313064575, -1.568328857421875, -1.513432264328003, -1.4585357904434204, -1.403639316558838, -1.3487428426742554, -1.2938463687896729, -1.2389497756958008, -1.1840533018112183, -1.1291568279266357, -1.0742602348327637, -1.0193637609481812, -0.9644672870635986, -0.9095708131790161, -0.8546743392944336, -0.7997778654098511, -0.7448813915252686, -0.6899848580360413, -0.6350883841514587, -0.5801918506622314, -0.5252953767776489, -0.4703989028930664, -0.4155023992061615, -0.3606058955192566, -0.3057093918323517, -0.2508128881454468, -0.19591641426086426, -0.14101991057395935, -0.08612340688705444, -0.031226933002471924, 0.023669570684432983, 0.07856607437133789, 0.1334625780582428, 0.1883590668439865, 0.24325555562973022, 0.29815205931663513, 0.35304856300354004, 0.40794503688812256, 0.46284154057502747, 0.5177380442619324, 0.5726345181465149, 0.6275310516357422, 0.6824275255203247, 0.7373239994049072, 0.7922205328941345, 0.847117006778717, 0.9020135402679443, 0.9569100141525269, 1.0118064880371094, 1.066702961921692, 1.1215994358062744, 1.1764960289001465, 1.231392502784729, 1.2862889766693115, 1.341185450553894, 1.3960819244384766, 1.450978398323059, 1.5058748722076416, 1.5607714653015137, 1.6156679391860962, 1.6705644130706787, 1.7254608869552612, 1.7803573608398438, 1.8352539539337158]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 9.0, 8.0, 8.0, 19.0, 20.0, 25.0, 13.0, 19.0, 25.0, 33.0, 29.0, 29.0, 41.0, 40.0, 35.0, 44.0, 31.0, 44.0, 44.0, 41.0, 44.0, 41.0, 37.0, 31.0, 44.0, 33.0, 25.0, 40.0, 22.0, 26.0, 19.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1000877618789673, -1.062829852104187, -1.0255720615386963, -0.988314151763916, -0.9510563015937805, -0.913798451423645, -0.8765405416488647, -0.8392826914787292, -0.8020248413085938, -0.7647669911384583, -0.7275091409683228, -0.6902512311935425, -0.652993381023407, -0.6157355308532715, -0.5784776210784912, -0.5412197709083557, -0.5039619207382202, -0.4667040705680847, -0.42944619059562683, -0.39218831062316895, -0.35493046045303345, -0.31767261028289795, -0.28041473031044006, -0.24315685033798218, -0.20589900016784668, -0.16864113509655, -0.1313832700252533, -0.0941254049539566, -0.05686753988265991, -0.01960967481136322, 0.01764819025993347, 0.05490607023239136, 0.0921638011932373, 0.129421666264534, 0.1666795313358307, 0.20393739640712738, 0.24119526147842407, 0.27845311164855957, 0.31571099162101746, 0.35296887159347534, 0.39022672176361084, 0.42748457193374634, 0.4647424519062042, 0.5020003318786621, 0.5392581820487976, 0.5765160322189331, 0.6137739419937134, 0.6510317921638489, 0.6882896423339844, 0.7255474925041199, 0.7628053426742554, 0.8000632524490356, 0.8373211026191711, 0.8745789527893066, 0.9118368625640869, 0.9490947127342224, 0.9863525629043579, 1.0236104726791382, 1.060868263244629, 1.0981261730194092, 1.1353840827941895, 1.1726418733596802, 1.2098997831344604, 1.2471575736999512, 1.2844154834747314]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 5.0, 13.0, 14.0, 29.0, 27.0, 59.0, 82.0, 137.0, 238.0, 369.0, 606.0, 1014.0, 1689.0, 2746.0, 4712.0, 7934.0, 13483.0, 23605.0, 40828.0, 69666.0, 118268.0, 195329.0, 304290.0, 438709.0, 559336.0, 611423.0, 561969.0, 443387.0, 306077.0, 197396.0, 120363.0, 71279.0, 41336.0, 24236.0, 13786.0, 8127.0, 4683.0, 2835.0, 1607.0, 979.0, 621.0, 346.0, 234.0, 141.0, 97.0, 76.0, 37.0, 18.0, 17.0, 16.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1665802001953125, -1.124176025390625, -1.0817718505859375, -1.03936767578125, -0.9969635009765625, -0.954559326171875, -0.9121551513671875, -0.8697509765625, -0.8273468017578125, -0.784942626953125, -0.7425384521484375, -0.70013427734375, -0.6577301025390625, -0.615325927734375, -0.5729217529296875, -0.530517578125, -0.4881134033203125, -0.445709228515625, -0.4033050537109375, -0.36090087890625, -0.3184967041015625, -0.276092529296875, -0.2336883544921875, -0.1912841796875, -0.1488800048828125, -0.106475830078125, -0.0640716552734375, -0.02166748046875, 0.0207366943359375, 0.063140869140625, 0.1055450439453125, 0.14794921875, 0.1903533935546875, 0.232757568359375, 0.2751617431640625, 0.31756591796875, 0.3599700927734375, 0.402374267578125, 0.4447784423828125, 0.4871826171875, 0.5295867919921875, 0.571990966796875, 0.6143951416015625, 0.65679931640625, 0.6992034912109375, 0.741607666015625, 0.7840118408203125, 0.826416015625, 0.8688201904296875, 0.911224365234375, 0.9536285400390625, 0.99603271484375, 1.0384368896484375, 1.080841064453125, 1.1232452392578125, 1.1656494140625, 1.2080535888671875, 1.250457763671875, 1.2928619384765625, 1.33526611328125, 1.3776702880859375, 1.420074462890625, 1.4624786376953125, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 3.0, 6.0, 5.0, 15.0, 11.0, 7.0, 11.0, 12.0, 10.0, 17.0, 20.0, 25.0, 16.0, 25.0, 26.0, 22.0, 30.0, 37.0, 35.0, 34.0, 41.0, 30.0, 39.0, 36.0, 40.0, 40.0, 32.0, 42.0, 40.0, 38.0, 29.0, 31.0, 32.0, 26.0, 19.0, 24.0, 14.0, 11.0, 13.0, 14.0, 12.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8059539794921875, -0.777923583984375, -0.7498931884765625, -0.72186279296875, -0.6938323974609375, -0.665802001953125, -0.6377716064453125, -0.6097412109375, -0.5817108154296875, -0.553680419921875, -0.5256500244140625, -0.49761962890625, -0.4695892333984375, -0.441558837890625, -0.4135284423828125, -0.385498046875, -0.3574676513671875, -0.329437255859375, -0.3014068603515625, -0.27337646484375, -0.2453460693359375, -0.217315673828125, -0.1892852783203125, -0.1612548828125, -0.1332244873046875, -0.105194091796875, -0.0771636962890625, -0.04913330078125, -0.0211029052734375, 0.006927490234375, 0.0349578857421875, 0.06298828125, 0.0910186767578125, 0.119049072265625, 0.1470794677734375, 0.17510986328125, 0.2031402587890625, 0.231170654296875, 0.2592010498046875, 0.2872314453125, 0.3152618408203125, 0.343292236328125, 0.3713226318359375, 0.39935302734375, 0.4273834228515625, 0.455413818359375, 0.4834442138671875, 0.511474609375, 0.5395050048828125, 0.567535400390625, 0.5955657958984375, 0.62359619140625, 0.6516265869140625, 0.679656982421875, 0.7076873779296875, 0.7357177734375, 0.7637481689453125, 0.791778564453125, 0.8198089599609375, 0.84783935546875, 0.8758697509765625, 0.903900146484375, 0.9319305419921875, 0.9599609375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 9.0, 13.0, 14.0, 22.0, 28.0, 48.0, 107.0, 162.0, 224.0, 382.0, 589.0, 933.0, 1483.0, 2336.0, 3826.0, 6323.0, 10166.0, 16238.0, 26151.0, 41231.0, 65015.0, 100398.0, 149506.0, 216368.0, 296933.0, 380937.0, 449834.0, 482505.0, 464970.0, 409577.0, 326725.0, 244496.0, 173521.0, 116501.0, 75851.0, 49122.0, 30594.0, 19613.0, 11908.0, 7454.0, 4564.0, 2829.0, 1779.0, 1123.0, 702.0, 443.0, 246.0, 170.0, 119.0, 77.0, 40.0, 32.0, 24.0, 17.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1.263671875, -1.225006103515625, -1.18634033203125, -1.147674560546875, -1.1090087890625, -1.070343017578125, -1.03167724609375, -0.993011474609375, -0.954345703125, -0.915679931640625, -0.87701416015625, -0.838348388671875, -0.7996826171875, -0.761016845703125, -0.72235107421875, -0.683685302734375, -0.64501953125, -0.606353759765625, -0.56768798828125, -0.529022216796875, -0.4903564453125, -0.451690673828125, -0.41302490234375, -0.374359130859375, -0.335693359375, -0.297027587890625, -0.25836181640625, -0.219696044921875, -0.1810302734375, -0.142364501953125, -0.10369873046875, -0.065032958984375, -0.0263671875, 0.012298583984375, 0.05096435546875, 0.089630126953125, 0.1282958984375, 0.166961669921875, 0.20562744140625, 0.244293212890625, 0.282958984375, 0.321624755859375, 0.36029052734375, 0.398956298828125, 0.4376220703125, 0.476287841796875, 0.51495361328125, 0.553619384765625, 0.59228515625, 0.630950927734375, 0.66961669921875, 0.708282470703125, 0.7469482421875, 0.785614013671875, 0.82427978515625, 0.862945556640625, 0.901611328125, 0.940277099609375, 0.97894287109375, 1.017608642578125, 1.0562744140625, 1.094940185546875, 1.13360595703125, 1.172271728515625, 1.2109375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 12.0, 15.0, 10.0, 16.0, 27.0, 26.0, 39.0, 36.0, 45.0, 64.0, 79.0, 91.0, 106.0, 135.0, 119.0, 128.0, 166.0, 171.0, 160.0, 187.0, 192.0, 185.0, 195.0, 188.0, 213.0, 169.0, 189.0, 167.0, 148.0, 126.0, 105.0, 91.0, 82.0, 72.0, 68.0, 40.0, 35.0, 32.0, 25.0, 17.0, 18.0, 20.0, 11.0, 4.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.50634765625, -0.4912910461425781, -0.47623443603515625, -0.4611778259277344, -0.4461212158203125, -0.4310646057128906, -0.41600799560546875, -0.4009513854980469, -0.385894775390625, -0.3708381652832031, -0.35578155517578125, -0.3407249450683594, -0.3256683349609375, -0.3106117248535156, -0.29555511474609375, -0.2804985046386719, -0.26544189453125, -0.2503852844238281, -0.23532867431640625, -0.22027206420898438, -0.2052154541015625, -0.19015884399414062, -0.17510223388671875, -0.16004562377929688, -0.144989013671875, -0.12993240356445312, -0.11487579345703125, -0.09981918334960938, -0.0847625732421875, -0.06970596313476562, -0.05464935302734375, -0.039592742919921875, -0.0245361328125, -0.009479522705078125, 0.00557708740234375, 0.020633697509765625, 0.0356903076171875, 0.050746917724609375, 0.06580352783203125, 0.08086013793945312, 0.095916748046875, 0.11097335815429688, 0.12602996826171875, 0.14108657836914062, 0.1561431884765625, 0.17119979858398438, 0.18625640869140625, 0.20131301879882812, 0.21636962890625, 0.23142623901367188, 0.24648284912109375, 0.2615394592285156, 0.2765960693359375, 0.2916526794433594, 0.30670928955078125, 0.3217658996582031, 0.336822509765625, 0.3518791198730469, 0.36693572998046875, 0.3819923400878906, 0.3970489501953125, 0.4121055603027344, 0.42716217041015625, 0.4422187805175781, 0.457275390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 5.0, 18.0, 17.0, 16.0, 16.0, 23.0, 26.0, 44.0, 34.0, 49.0, 50.0, 45.0, 51.0, 60.0, 58.0, 46.0, 55.0, 57.0, 40.0, 46.0, 46.0, 31.0, 22.0, 35.0, 25.0, 19.0, 8.0, 10.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8614811897277832, -1.8005732297897339, -1.7396652698516846, -1.6787573099136353, -1.617849349975586, -1.5569415092468262, -1.4960334300994873, -1.4351255893707275, -1.3742176294326782, -1.313309669494629, -1.2524017095565796, -1.1914937496185303, -1.130585789680481, -1.0696778297424316, -1.0087699890136719, -0.9478620290756226, -0.8869540095329285, -0.8260460495948792, -0.7651380896568298, -0.7042301893234253, -0.643322229385376, -0.5824142694473267, -0.5215063095092773, -0.4605983793735504, -0.3996904194355011, -0.3387824594974518, -0.27787452936172485, -0.21696656942367554, -0.15605862438678741, -0.09515067934989929, -0.034242719411849976, 0.026665210723876953, 0.08757317066192627, 0.1484811156988144, 0.20938906073570251, 0.27029702067375183, 0.33120495080947876, 0.3921129107475281, 0.4530208706855774, 0.5139287710189819, 0.5748367309570312, 0.6357446908950806, 0.6966526508331299, 0.7575606107711792, 0.8184685111045837, 0.8793764710426331, 0.9402844309806824, 1.001192331314087, 1.0621004104614258, 1.123008370399475, 1.1839163303375244, 1.2448242902755737, 1.305732250213623, 1.3666400909423828, 1.4275481700897217, 1.4884560108184814, 1.5493639707565308, 1.61027193069458, 1.6711798906326294, 1.7320878505706787, 1.792995810508728, 1.8539037704467773, 1.914811611175537, 1.9757195711135864, 2.0366275310516357]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 9.0, 7.0, 10.0, 12.0, 13.0, 19.0, 27.0, 17.0, 26.0, 37.0, 43.0, 49.0, 52.0, 42.0, 40.0, 48.0, 55.0, 45.0, 52.0, 41.0, 47.0, 39.0, 44.0, 46.0, 25.0, 23.0, 27.0, 16.0, 24.0, 17.0, 8.0, 7.0, 6.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4232420921325684, -1.3767975568771362, -1.3303531408309937, -1.2839086055755615, -1.237464189529419, -1.1910196542739868, -1.1445751190185547, -1.098130702972412, -1.0516862869262695, -1.0052417516708374, -0.9587973356246948, -0.9123528003692627, -0.8659083843231201, -0.819463849067688, -0.7730193734169006, -0.7265748977661133, -0.6801303625106812, -0.6336858868598938, -0.5872414112091064, -0.5407968759536743, -0.49435243010520935, -0.447907954454422, -0.40146344900131226, -0.3550189733505249, -0.30857449769973755, -0.2621300220489502, -0.21568553149700165, -0.1692410409450531, -0.12279656529426575, -0.0763520896434784, -0.029907584190368652, 0.0165368914604187, 0.06298136711120605, 0.109425850212574, 0.15587033331394196, 0.2023148238658905, 0.24875929951667786, 0.2952037751674652, 0.34164828062057495, 0.3880927562713623, 0.43453723192214966, 0.480981707572937, 0.5274261832237244, 0.5738706588745117, 0.6203151941299438, 0.6667596101760864, 0.7132041454315186, 0.7596486210823059, 0.8060930967330933, 0.8525375723838806, 0.898982048034668, 0.9454265832901001, 0.9918709993362427, 1.0383155345916748, 1.0847599506378174, 1.1312044858932495, 1.1776490211486816, 1.2240935564041138, 1.2705379724502563, 1.3169825077056885, 1.363426923751831, 1.4098714590072632, 1.4563159942626953, 1.502760410308838, 1.5492048263549805]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 12.0, 19.0, 29.0, 50.0, 48.0, 107.0, 147.0, 221.0, 325.0, 534.0, 786.0, 1106.0, 1828.0, 3008.0, 4740.0, 7689.0, 12914.0, 21252.0, 35628.0, 58930.0, 94956.0, 143121.0, 179111.0, 166344.0, 120305.0, 76739.0, 46917.0, 27907.0, 16792.0, 10252.0, 6125.0, 3879.0, 2443.0, 1487.0, 926.0, 641.0, 441.0, 263.0, 177.0, 102.0, 81.0, 55.0, 31.0, 19.0, 21.0, 11.0, 2.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.35888671875, -0.3479347229003906, -0.33698272705078125, -0.3260307312011719, -0.3150787353515625, -0.3041267395019531, -0.29317474365234375, -0.2822227478027344, -0.271270751953125, -0.2603187561035156, -0.24936676025390625, -0.23841476440429688, -0.2274627685546875, -0.21651077270507812, -0.20555877685546875, -0.19460678100585938, -0.18365478515625, -0.17270278930664062, -0.16175079345703125, -0.15079879760742188, -0.1398468017578125, -0.12889480590820312, -0.11794281005859375, -0.10699081420898438, -0.096038818359375, -0.08508682250976562, -0.07413482666015625, -0.06318283081054688, -0.0522308349609375, -0.041278839111328125, -0.03032684326171875, -0.019374847412109375, -0.0084228515625, 0.002529144287109375, 0.01348114013671875, 0.024433135986328125, 0.0353851318359375, 0.046337127685546875, 0.05728912353515625, 0.06824111938476562, 0.079193115234375, 0.09014511108398438, 0.10109710693359375, 0.11204910278320312, 0.1230010986328125, 0.13395309448242188, 0.14490509033203125, 0.15585708618164062, 0.16680908203125, 0.17776107788085938, 0.18871307373046875, 0.19966506958007812, 0.2106170654296875, 0.22156906127929688, 0.23252105712890625, 0.24347305297851562, 0.254425048828125, 0.2653770446777344, 0.27632904052734375, 0.2872810363769531, 0.2982330322265625, 0.3091850280761719, 0.32013702392578125, 0.3310890197753906, 0.342041015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 12.0, 13.0, 14.0, 15.0, 33.0, 17.0, 29.0, 49.0, 27.0, 40.0, 44.0, 51.0, 38.0, 33.0, 51.0, 46.0, 45.0, 47.0, 44.0, 52.0, 43.0, 42.0, 35.0, 27.0, 23.0, 16.0, 15.0, 17.0, 11.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4326171875, -1.384765625, -1.3369140625, -1.2890625, -1.2412109375, -1.193359375, -1.1455078125, -1.09765625, -1.0498046875, -1.001953125, -0.9541015625, -0.90625, -0.8583984375, -0.810546875, -0.7626953125, -0.71484375, -0.6669921875, -0.619140625, -0.5712890625, -0.5234375, -0.4755859375, -0.427734375, -0.3798828125, -0.33203125, -0.2841796875, -0.236328125, -0.1884765625, -0.140625, -0.0927734375, -0.044921875, 0.0029296875, 0.05078125, 0.0986328125, 0.146484375, 0.1943359375, 0.2421875, 0.2900390625, 0.337890625, 0.3857421875, 0.43359375, 0.4814453125, 0.529296875, 0.5771484375, 0.625, 0.6728515625, 0.720703125, 0.7685546875, 0.81640625, 0.8642578125, 0.912109375, 0.9599609375, 1.0078125, 1.0556640625, 1.103515625, 1.1513671875, 1.19921875, 1.2470703125, 1.294921875, 1.3427734375, 1.390625, 1.4384765625, 1.486328125, 1.5341796875, 1.58203125, 1.6298828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 12.0, 8.0, 7.0, 12.0, 13.0, 19.0, 25.0, 48.0, 63.0, 100.0, 141.0, 213.0, 288.0, 442.0, 691.0, 1057.0, 1655.0, 2696.0, 4574.0, 8210.0, 14611.0, 27187.0, 50959.0, 95104.0, 166356.0, 227233.0, 192001.0, 115673.0, 63178.0, 33557.0, 18064.0, 9982.0, 5562.0, 3213.0, 2044.0, 1256.0, 772.0, 470.0, 340.0, 213.0, 144.0, 103.0, 66.0, 62.0, 44.0, 18.0, 19.0, 14.0, 12.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-0.45361328125, -0.439727783203125, -0.42584228515625, -0.411956787109375, -0.3980712890625, -0.384185791015625, -0.37030029296875, -0.356414794921875, -0.342529296875, -0.328643798828125, -0.31475830078125, -0.300872802734375, -0.2869873046875, -0.273101806640625, -0.25921630859375, -0.245330810546875, -0.2314453125, -0.217559814453125, -0.20367431640625, -0.189788818359375, -0.1759033203125, -0.162017822265625, -0.14813232421875, -0.134246826171875, -0.120361328125, -0.106475830078125, -0.09259033203125, -0.078704833984375, -0.0648193359375, -0.050933837890625, -0.03704833984375, -0.023162841796875, -0.00927734375, 0.004608154296875, 0.01849365234375, 0.032379150390625, 0.0462646484375, 0.060150146484375, 0.07403564453125, 0.087921142578125, 0.101806640625, 0.115692138671875, 0.12957763671875, 0.143463134765625, 0.1573486328125, 0.171234130859375, 0.18511962890625, 0.199005126953125, 0.212890625, 0.226776123046875, 0.24066162109375, 0.254547119140625, 0.2684326171875, 0.282318115234375, 0.29620361328125, 0.310089111328125, 0.323974609375, 0.337860107421875, 0.35174560546875, 0.365631103515625, 0.3795166015625, 0.393402099609375, 0.40728759765625, 0.421173095703125, 0.43505859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 7.0, 8.0, 8.0, 18.0, 25.0, 29.0, 26.0, 26.0, 29.0, 33.0, 32.0, 40.0, 38.0, 35.0, 37.0, 50.0, 53.0, 40.0, 53.0, 28.0, 35.0, 29.0, 38.0, 34.0, 29.0, 26.0, 19.0, 29.0, 19.0, 26.0, 13.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8212203979492188, -0.7942962646484375, -0.7673721313476562, -0.740447998046875, -0.7135238647460938, -0.6865997314453125, -0.6596755981445312, -0.63275146484375, -0.6058273315429688, -0.5789031982421875, -0.5519790649414062, -0.525054931640625, -0.49813079833984375, -0.4712066650390625, -0.44428253173828125, -0.4173583984375, -0.39043426513671875, -0.3635101318359375, -0.33658599853515625, -0.309661865234375, -0.28273773193359375, -0.2558135986328125, -0.22888946533203125, -0.20196533203125, -0.17504119873046875, -0.1481170654296875, -0.12119293212890625, -0.094268798828125, -0.06734466552734375, -0.0404205322265625, -0.01349639892578125, 0.013427734375, 0.04035186767578125, 0.0672760009765625, 0.09420013427734375, 0.121124267578125, 0.14804840087890625, 0.1749725341796875, 0.20189666748046875, 0.22882080078125, 0.25574493408203125, 0.2826690673828125, 0.30959320068359375, 0.336517333984375, 0.36344146728515625, 0.3903656005859375, 0.41728973388671875, 0.4442138671875, 0.47113800048828125, 0.4980621337890625, 0.5249862670898438, 0.551910400390625, 0.5788345336914062, 0.6057586669921875, 0.6326828002929688, 0.65960693359375, 0.6865310668945312, 0.7134552001953125, 0.7403793334960938, 0.767303466796875, 0.7942276000976562, 0.8211517333984375, 0.8480758666992188, 0.875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 10.0, 11.0, 13.0, 21.0, 18.0, 24.0, 37.0, 43.0, 63.0, 79.0, 85.0, 175.0, 235.0, 393.0, 629.0, 959.0, 1778.0, 3458.0, 7204.0, 18633.0, 66772.0, 420814.0, 425475.0, 67459.0, 18764.0, 7329.0, 3400.0, 1820.0, 1036.0, 588.0, 393.0, 236.0, 185.0, 97.0, 80.0, 62.0, 34.0, 28.0, 24.0, 18.0, 20.0, 10.0, 9.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3502845764160156, -0.33777618408203125, -0.3252677917480469, -0.3127593994140625, -0.3002510070800781, -0.28774261474609375, -0.2752342224121094, -0.262725830078125, -0.2502174377441406, -0.23770904541015625, -0.22520065307617188, -0.2126922607421875, -0.20018386840820312, -0.18767547607421875, -0.17516708374023438, -0.16265869140625, -0.15015029907226562, -0.13764190673828125, -0.12513351440429688, -0.1126251220703125, -0.10011672973632812, -0.08760833740234375, -0.07509994506835938, -0.062591552734375, -0.050083160400390625, -0.03757476806640625, -0.025066375732421875, -0.0125579833984375, -4.9591064453125e-05, 0.01245880126953125, 0.024967193603515625, 0.0374755859375, 0.049983978271484375, 0.06249237060546875, 0.07500076293945312, 0.0875091552734375, 0.10001754760742188, 0.11252593994140625, 0.12503433227539062, 0.137542724609375, 0.15005111694335938, 0.16255950927734375, 0.17506790161132812, 0.1875762939453125, 0.20008468627929688, 0.21259307861328125, 0.22510147094726562, 0.23760986328125, 0.2501182556152344, 0.26262664794921875, 0.2751350402832031, 0.2876434326171875, 0.3001518249511719, 0.31266021728515625, 0.3251686096191406, 0.337677001953125, 0.3501853942871094, 0.36269378662109375, 0.3752021789550781, 0.3877105712890625, 0.4002189636230469, 0.41272735595703125, 0.4252357482910156, 0.437744140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 14.0, 15.0, 18.0, 22.0, 41.0, 39.0, 47.0, 44.0, 61.0, 72.0, 62.0, 76.0, 60.0, 67.0, 48.0, 63.0, 47.0, 38.0, 33.0, 19.0, 24.0, 18.0, 17.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5463680028915405e-05, -1.5012919902801514e-05, -1.4562159776687622e-05, -1.411139965057373e-05, -1.3660639524459839e-05, -1.3209879398345947e-05, -1.2759119272232056e-05, -1.2308359146118164e-05, -1.1857599020004272e-05, -1.1406838893890381e-05, -1.095607876777649e-05, -1.0505318641662598e-05, -1.0054558515548706e-05, -9.603798389434814e-06, -9.153038263320923e-06, -8.702278137207031e-06, -8.25151801109314e-06, -7.800757884979248e-06, -7.3499977588653564e-06, -6.899237632751465e-06, -6.448477506637573e-06, -5.997717380523682e-06, -5.54695725440979e-06, -5.0961971282958984e-06, -4.645437002182007e-06, -4.194676876068115e-06, -3.7439167499542236e-06, -3.293156623840332e-06, -2.8423964977264404e-06, -2.391636371612549e-06, -1.9408762454986572e-06, -1.4901161193847656e-06, -1.039355993270874e-06, -5.885958671569824e-07, -1.3783574104309082e-07, 3.129243850708008e-07, 7.636845111846924e-07, 1.214444637298584e-06, 1.6652047634124756e-06, 2.115964889526367e-06, 2.566725015640259e-06, 3.0174851417541504e-06, 3.468245267868042e-06, 3.919005393981934e-06, 4.369765520095825e-06, 4.820525646209717e-06, 5.271285772323608e-06, 5.7220458984375e-06, 6.172806024551392e-06, 6.623566150665283e-06, 7.074326276779175e-06, 7.525086402893066e-06, 7.975846529006958e-06, 8.42660665512085e-06, 8.877366781234741e-06, 9.328126907348633e-06, 9.778887033462524e-06, 1.0229647159576416e-05, 1.0680407285690308e-05, 1.11311674118042e-05, 1.158192753791809e-05, 1.2032687664031982e-05, 1.2483447790145874e-05, 1.2934207916259766e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 14.0, 10.0, 24.0, 30.0, 29.0, 39.0, 42.0, 60.0, 89.0, 146.0, 195.0, 269.0, 371.0, 540.0, 776.0, 1207.0, 1838.0, 2898.0, 4977.0, 8937.0, 17829.0, 40222.0, 100456.0, 249803.0, 332979.0, 164280.0, 63700.0, 26940.0, 12380.0, 6590.0, 3778.0, 2273.0, 1515.0, 1034.0, 663.0, 449.0, 341.0, 241.0, 177.0, 114.0, 95.0, 60.0, 43.0, 29.0, 18.0, 16.0, 9.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2736701965332031, -0.26462554931640625, -0.2555809020996094, -0.2465362548828125, -0.23749160766601562, -0.22844696044921875, -0.21940231323242188, -0.210357666015625, -0.20131301879882812, -0.19226837158203125, -0.18322372436523438, -0.1741790771484375, -0.16513442993164062, -0.15608978271484375, -0.14704513549804688, -0.13800048828125, -0.12895584106445312, -0.11991119384765625, -0.11086654663085938, -0.1018218994140625, -0.09277725219726562, -0.08373260498046875, -0.07468795776367188, -0.065643310546875, -0.056598663330078125, -0.04755401611328125, -0.038509368896484375, -0.0294647216796875, -0.020420074462890625, -0.01137542724609375, -0.002330780029296875, 0.0067138671875, 0.015758514404296875, 0.02480316162109375, 0.033847808837890625, 0.0428924560546875, 0.051937103271484375, 0.06098175048828125, 0.07002639770507812, 0.079071044921875, 0.08811569213867188, 0.09716033935546875, 0.10620498657226562, 0.1152496337890625, 0.12429428100585938, 0.13333892822265625, 0.14238357543945312, 0.15142822265625, 0.16047286987304688, 0.16951751708984375, 0.17856216430664062, 0.1876068115234375, 0.19665145874023438, 0.20569610595703125, 0.21474075317382812, 0.223785400390625, 0.23283004760742188, 0.24187469482421875, 0.2509193420410156, 0.2599639892578125, 0.2690086364746094, 0.27805328369140625, 0.2870979309082031, 0.296142578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 10.0, 14.0, 24.0, 33.0, 49.0, 69.0, 109.0, 129.0, 151.0, 145.0, 98.0, 52.0, 37.0, 18.0, 12.0, 7.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08376884460449219, -0.08056259155273438, -0.07735633850097656, -0.07415008544921875, -0.07094383239746094, -0.06773757934570312, -0.06453132629394531, -0.0613250732421875, -0.05811882019042969, -0.054912567138671875, -0.05170631408691406, -0.04850006103515625, -0.04529380798339844, -0.042087554931640625, -0.03888130187988281, -0.035675048828125, -0.03246879577636719, -0.029262542724609375, -0.026056289672851562, -0.02285003662109375, -0.019643783569335938, -0.016437530517578125, -0.013231277465820312, -0.0100250244140625, -0.0068187713623046875, -0.003612518310546875, -0.0004062652587890625, 0.00279998779296875, 0.0060062408447265625, 0.009212493896484375, 0.012418746948242188, 0.015625, 0.018831253051757812, 0.022037506103515625, 0.025243759155273438, 0.02845001220703125, 0.03165626525878906, 0.034862518310546875, 0.03806877136230469, 0.0412750244140625, 0.04448127746582031, 0.047687530517578125, 0.05089378356933594, 0.05410003662109375, 0.05730628967285156, 0.060512542724609375, 0.06371879577636719, 0.066925048828125, 0.07013130187988281, 0.07333755493164062, 0.07654380798339844, 0.07975006103515625, 0.08295631408691406, 0.08616256713867188, 0.08936882019042969, 0.0925750732421875, 0.09578132629394531, 0.09898757934570312, 0.10219383239746094, 0.10540008544921875, 0.10860633850097656, 0.11181259155273438, 0.11501884460449219, 0.11822509765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 1.0, 9.0, 3.0, 12.0, 12.0, 19.0, 14.0, 21.0, 27.0, 29.0, 42.0, 43.0, 47.0, 41.0, 52.0, 60.0, 60.0, 50.0, 56.0, 53.0, 54.0, 41.0, 49.0, 42.0, 23.0, 34.0, 24.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9357694387435913, -1.8736472129821777, -1.8115248680114746, -1.7494025230407715, -1.687280297279358, -1.6251580715179443, -1.5630357265472412, -1.500913381576538, -1.4387911558151245, -1.376668930053711, -1.3145465850830078, -1.2524242401123047, -1.1903020143508911, -1.1281797885894775, -1.0660574436187744, -1.0039350986480713, -0.9418128728866577, -0.8796905875205994, -0.817568302154541, -0.7554460167884827, -0.6933237314224243, -0.631201446056366, -0.5690791606903076, -0.5069568753242493, -0.4448345899581909, -0.38271230459213257, -0.3205900192260742, -0.25846773386001587, -0.19634544849395752, -0.13422316312789917, -0.07210087776184082, -0.00997859239578247, 0.05214381217956543, 0.11426609754562378, 0.17638838291168213, 0.23851066827774048, 0.30063295364379883, 0.3627552390098572, 0.4248775243759155, 0.4869998097419739, 0.5491220951080322, 0.6112443804740906, 0.6733666658401489, 0.7354889512062073, 0.7976112365722656, 0.859733521938324, 0.9218558073043823, 0.9839780926704407, 1.046100378036499, 1.1082227230072021, 1.1703449487686157, 1.2324671745300293, 1.2945895195007324, 1.3567118644714355, 1.4188340902328491, 1.4809563159942627, 1.5430786609649658, 1.605201005935669, 1.6673232316970825, 1.729445457458496, 1.7915678024291992, 1.8536901473999023, 1.915812373161316, 1.9779345989227295, 2.0400569438934326]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 9.0, 13.0, 5.0, 9.0, 9.0, 13.0, 12.0, 18.0, 29.0, 18.0, 27.0, 41.0, 40.0, 51.0, 52.0, 37.0, 46.0, 52.0, 50.0, 46.0, 47.0, 45.0, 48.0, 35.0, 46.0, 46.0, 25.0, 21.0, 31.0, 14.0, 19.0, 16.0, 10.0, 6.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4187204837799072, -1.3720732927322388, -1.3254261016845703, -1.2787789106369019, -1.2321317195892334, -1.1854846477508545, -1.1388373374938965, -1.0921902656555176, -1.0455430746078491, -0.9988958835601807, -0.9522486925125122, -0.9056015014648438, -0.8589543700218201, -0.8123071789741516, -0.7656599879264832, -0.7190128564834595, -0.6723656058311462, -0.6257184147834778, -0.5790712237358093, -0.5324240922927856, -0.4857769012451172, -0.43912971019744873, -0.3924825191497803, -0.3458353579044342, -0.29918816685676575, -0.2525409758090973, -0.20589381456375122, -0.15924662351608276, -0.1125994473695755, -0.06595227122306824, -0.01930508017539978, 0.02734208106994629, 0.07398927211761475, 0.12063644826412201, 0.16728362441062927, 0.21393081545829773, 0.2605779767036438, 0.30722516775131226, 0.3538723587989807, 0.4005195200443268, 0.44716671109199524, 0.4938139021396637, 0.5404610633850098, 0.5871082544326782, 0.6337554454803467, 0.6804026365280151, 0.7270498275756836, 0.7736969590187073, 0.8203441500663757, 0.8669913411140442, 0.9136385321617126, 0.9602856636047363, 1.0069328546524048, 1.0535800457000732, 1.1002272367477417, 1.1468744277954102, 1.1935216188430786, 1.240168809890747, 1.2868160009384155, 1.333463191986084, 1.3801103830337524, 1.426757574081421, 1.4734046459197998, 1.5200518369674683, 1.5666990280151367]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 21.0, 29.0, 59.0, 93.0, 115.0, 215.0, 357.0, 556.0, 914.0, 1436.0, 2456.0, 3962.0, 6272.0, 9967.0, 15798.0, 23710.0, 35374.0, 50109.0, 67737.0, 86839.0, 102476.0, 112177.0, 112537.0, 103339.0, 87901.0, 69103.0, 51012.0, 36121.0, 24443.0, 16034.0, 10233.0, 6615.0, 4023.0, 2534.0, 1472.0, 913.0, 580.0, 382.0, 253.0, 143.0, 83.0, 54.0, 30.0, 26.0, 7.0, 16.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.033203125, -0.999908447265625, -0.96661376953125, -0.933319091796875, -0.9000244140625, -0.866729736328125, -0.83343505859375, -0.800140380859375, -0.766845703125, -0.733551025390625, -0.70025634765625, -0.666961669921875, -0.6336669921875, -0.600372314453125, -0.56707763671875, -0.533782958984375, -0.50048828125, -0.467193603515625, -0.43389892578125, -0.400604248046875, -0.3673095703125, -0.334014892578125, -0.30072021484375, -0.267425537109375, -0.234130859375, -0.200836181640625, -0.16754150390625, -0.134246826171875, -0.1009521484375, -0.067657470703125, -0.03436279296875, -0.001068115234375, 0.0322265625, 0.065521240234375, 0.09881591796875, 0.132110595703125, 0.1654052734375, 0.198699951171875, 0.23199462890625, 0.265289306640625, 0.298583984375, 0.331878662109375, 0.36517333984375, 0.398468017578125, 0.4317626953125, 0.465057373046875, 0.49835205078125, 0.531646728515625, 0.56494140625, 0.598236083984375, 0.63153076171875, 0.664825439453125, 0.6981201171875, 0.731414794921875, 0.76470947265625, 0.798004150390625, 0.831298828125, 0.864593505859375, 0.89788818359375, 0.931182861328125, 0.9644775390625, 0.997772216796875, 1.03106689453125, 1.064361572265625, 1.09765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 9.0, 9.0, 25.0, 8.0, 13.0, 27.0, 31.0, 25.0, 28.0, 30.0, 48.0, 50.0, 44.0, 47.0, 55.0, 59.0, 42.0, 49.0, 54.0, 43.0, 54.0, 38.0, 31.0, 30.0, 31.0, 19.0, 16.0, 20.0, 20.0, 8.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6743927001953125, -1.623199462890625, -1.5720062255859375, -1.52081298828125, -1.4696197509765625, -1.418426513671875, -1.3672332763671875, -1.3160400390625, -1.2648468017578125, -1.213653564453125, -1.1624603271484375, -1.11126708984375, -1.0600738525390625, -1.008880615234375, -0.9576873779296875, -0.906494140625, -0.8553009033203125, -0.804107666015625, -0.7529144287109375, -0.70172119140625, -0.6505279541015625, -0.599334716796875, -0.5481414794921875, -0.4969482421875, -0.4457550048828125, -0.394561767578125, -0.3433685302734375, -0.29217529296875, -0.2409820556640625, -0.189788818359375, -0.1385955810546875, -0.08740234375, -0.0362091064453125, 0.014984130859375, 0.0661773681640625, 0.11737060546875, 0.1685638427734375, 0.219757080078125, 0.2709503173828125, 0.3221435546875, 0.3733367919921875, 0.424530029296875, 0.4757232666015625, 0.52691650390625, 0.5781097412109375, 0.629302978515625, 0.6804962158203125, 0.731689453125, 0.7828826904296875, 0.834075927734375, 0.8852691650390625, 0.93646240234375, 0.9876556396484375, 1.038848876953125, 1.0900421142578125, 1.1412353515625, 1.1924285888671875, 1.243621826171875, 1.2948150634765625, 1.34600830078125, 1.3972015380859375, 1.448394775390625, 1.4995880126953125, 1.55078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 37.0, 47.0, 80.0, 149.0, 207.0, 298.0, 477.0, 771.0, 1205.0, 1883.0, 2874.0, 4354.0, 6469.0, 9581.0, 14008.0, 20079.0, 28277.0, 38270.0, 49942.0, 63771.0, 76515.0, 86947.0, 94432.0, 95371.0, 91425.0, 82589.0, 70116.0, 56284.0, 44099.0, 33042.0, 23600.0, 16956.0, 11675.0, 7698.0, 5212.0, 3450.0, 2238.0, 1459.0, 972.0, 607.0, 346.0, 238.0, 160.0, 110.0, 68.0, 41.0, 24.0, 27.0, 14.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8673171997070312, -0.8386383056640625, -0.8099594116210938, -0.781280517578125, -0.7526016235351562, -0.7239227294921875, -0.6952438354492188, -0.66656494140625, -0.6378860473632812, -0.6092071533203125, -0.5805282592773438, -0.551849365234375, -0.5231704711914062, -0.4944915771484375, -0.46581268310546875, -0.4371337890625, -0.40845489501953125, -0.3797760009765625, -0.35109710693359375, -0.322418212890625, -0.29373931884765625, -0.2650604248046875, -0.23638153076171875, -0.20770263671875, -0.17902374267578125, -0.1503448486328125, -0.12166595458984375, -0.092987060546875, -0.06430816650390625, -0.0356292724609375, -0.00695037841796875, 0.021728515625, 0.05040740966796875, 0.0790863037109375, 0.10776519775390625, 0.136444091796875, 0.16512298583984375, 0.1938018798828125, 0.22248077392578125, 0.25115966796875, 0.27983856201171875, 0.3085174560546875, 0.33719635009765625, 0.365875244140625, 0.39455413818359375, 0.4232330322265625, 0.45191192626953125, 0.4805908203125, 0.5092697143554688, 0.5379486083984375, 0.5666275024414062, 0.595306396484375, 0.6239852905273438, 0.6526641845703125, 0.6813430786132812, 0.71002197265625, 0.7387008666992188, 0.7673797607421875, 0.7960586547851562, 0.824737548828125, 0.8534164428710938, 0.8820953369140625, 0.9107742309570312, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 13.0, 5.0, 14.0, 15.0, 11.0, 19.0, 19.0, 22.0, 21.0, 22.0, 34.0, 38.0, 25.0, 30.0, 36.0, 39.0, 37.0, 39.0, 28.0, 30.0, 40.0, 36.0, 29.0, 42.0, 38.0, 32.0, 33.0, 30.0, 26.0, 26.0, 26.0, 16.0, 20.0, 9.0, 19.0, 15.0, 10.0, 8.0, 7.0, 5.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.8330078125, -0.8095779418945312, -0.7861480712890625, -0.7627182006835938, -0.739288330078125, -0.7158584594726562, -0.6924285888671875, -0.6689987182617188, -0.64556884765625, -0.6221389770507812, -0.5987091064453125, -0.5752792358398438, -0.551849365234375, -0.5284194946289062, -0.5049896240234375, -0.48155975341796875, -0.4581298828125, -0.43470001220703125, -0.4112701416015625, -0.38784027099609375, -0.364410400390625, -0.34098052978515625, -0.3175506591796875, -0.29412078857421875, -0.27069091796875, -0.24726104736328125, -0.2238311767578125, -0.20040130615234375, -0.176971435546875, -0.15354156494140625, -0.1301116943359375, -0.10668182373046875, -0.083251953125, -0.05982208251953125, -0.0363922119140625, -0.01296234130859375, 0.010467529296875, 0.03389739990234375, 0.0573272705078125, 0.08075714111328125, 0.10418701171875, 0.12761688232421875, 0.1510467529296875, 0.17447662353515625, 0.197906494140625, 0.22133636474609375, 0.2447662353515625, 0.26819610595703125, 0.2916259765625, 0.31505584716796875, 0.3384857177734375, 0.36191558837890625, 0.385345458984375, 0.40877532958984375, 0.4322052001953125, 0.45563507080078125, 0.47906494140625, 0.5024948120117188, 0.5259246826171875, 0.5493545532226562, 0.572784423828125, 0.5962142944335938, 0.6196441650390625, 0.6430740356445312, 0.66650390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 13.0, 27.0, 30.0, 53.0, 72.0, 89.0, 119.0, 186.0, 221.0, 362.0, 500.0, 748.0, 1130.0, 1782.0, 2819.0, 5074.0, 9421.0, 18078.0, 34812.0, 65433.0, 114540.0, 168930.0, 195492.0, 170623.0, 115426.0, 65912.0, 35101.0, 18451.0, 9577.0, 5133.0, 2947.0, 1789.0, 1155.0, 753.0, 505.0, 362.0, 243.0, 165.0, 114.0, 116.0, 55.0, 62.0, 33.0, 22.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.9111328125, -0.8822174072265625, -0.853302001953125, -0.8243865966796875, -0.79547119140625, -0.7665557861328125, -0.737640380859375, -0.7087249755859375, -0.6798095703125, -0.6508941650390625, -0.621978759765625, -0.5930633544921875, -0.56414794921875, -0.5352325439453125, -0.506317138671875, -0.4774017333984375, -0.448486328125, -0.4195709228515625, -0.390655517578125, -0.3617401123046875, -0.33282470703125, -0.3039093017578125, -0.274993896484375, -0.2460784912109375, -0.2171630859375, -0.1882476806640625, -0.159332275390625, -0.1304168701171875, -0.10150146484375, -0.0725860595703125, -0.043670654296875, -0.0147552490234375, 0.01416015625, 0.0430755615234375, 0.071990966796875, 0.1009063720703125, 0.12982177734375, 0.1587371826171875, 0.187652587890625, 0.2165679931640625, 0.2454833984375, 0.2743988037109375, 0.303314208984375, 0.3322296142578125, 0.36114501953125, 0.3900604248046875, 0.418975830078125, 0.4478912353515625, 0.476806640625, 0.5057220458984375, 0.534637451171875, 0.5635528564453125, 0.59246826171875, 0.6213836669921875, 0.650299072265625, 0.6792144775390625, 0.7081298828125, 0.7370452880859375, 0.765960693359375, 0.7948760986328125, 0.82379150390625, 0.8527069091796875, 0.881622314453125, 0.9105377197265625, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 15.0, 32.0, 34.0, 52.0, 69.0, 104.0, 114.0, 99.0, 115.0, 98.0, 70.0, 53.0, 46.0, 29.0, 16.0, 12.0, 8.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010120868682861328, -9.655021131038666e-05, -9.189173579216003e-05, -8.723326027393341e-05, -8.257478475570679e-05, -7.791630923748016e-05, -7.325783371925354e-05, -6.859935820102692e-05, -6.394088268280029e-05, -5.928240716457367e-05, -5.4623931646347046e-05, -4.996545612812042e-05, -4.53069806098938e-05, -4.0648505091667175e-05, -3.599002957344055e-05, -3.133155405521393e-05, -2.6673078536987305e-05, -2.201460301876068e-05, -1.7356127500534058e-05, -1.2697651982307434e-05, -8.03917646408081e-06, -3.380700945854187e-06, 1.2777745723724365e-06, 5.93625009059906e-06, 1.0594725608825684e-05, 1.5253201127052307e-05, 1.991167664527893e-05, 2.4570152163505554e-05, 2.9228627681732178e-05, 3.38871031999588e-05, 3.8545578718185425e-05, 4.320405423641205e-05, 4.786252975463867e-05, 5.2521005272865295e-05, 5.717948079109192e-05, 6.183795630931854e-05, 6.649643182754517e-05, 7.115490734577179e-05, 7.581338286399841e-05, 8.047185838222504e-05, 8.513033390045166e-05, 8.978880941867828e-05, 9.444728493690491e-05, 9.910576045513153e-05, 0.00010376423597335815, 0.00010842271149158478, 0.0001130811870098114, 0.00011773966252803802, 0.00012239813804626465, 0.00012705661356449127, 0.0001317150890827179, 0.00013637356460094452, 0.00014103204011917114, 0.00014569051563739777, 0.0001503489911556244, 0.000155007466673851, 0.00015966594219207764, 0.00016432441771030426, 0.00016898289322853088, 0.0001736413687467575, 0.00017829984426498413, 0.00018295831978321075, 0.00018761679530143738, 0.000192275270819664, 0.00019693374633789062]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 8.0, 5.0, 7.0, 17.0, 10.0, 26.0, 35.0, 40.0, 62.0, 87.0, 135.0, 178.0, 259.0, 351.0, 536.0, 766.0, 1161.0, 1730.0, 2595.0, 4006.0, 6300.0, 10164.0, 17278.0, 28996.0, 49312.0, 79210.0, 115121.0, 147790.0, 158166.0, 139796.0, 105500.0, 69976.0, 42988.0, 25683.0, 14877.0, 9033.0, 5630.0, 3598.0, 2328.0, 1536.0, 975.0, 685.0, 483.0, 327.0, 240.0, 169.0, 111.0, 83.0, 58.0, 35.0, 36.0, 24.0, 13.0, 7.0, 11.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.73828125, -0.7147445678710938, -0.6912078857421875, -0.6676712036132812, -0.644134521484375, -0.6205978393554688, -0.5970611572265625, -0.5735244750976562, -0.54998779296875, -0.5264511108398438, -0.5029144287109375, -0.47937774658203125, -0.455841064453125, -0.43230438232421875, -0.4087677001953125, -0.38523101806640625, -0.3616943359375, -0.33815765380859375, -0.3146209716796875, -0.29108428955078125, -0.267547607421875, -0.24401092529296875, -0.2204742431640625, -0.19693756103515625, -0.17340087890625, -0.14986419677734375, -0.1263275146484375, -0.10279083251953125, -0.079254150390625, -0.05571746826171875, -0.0321807861328125, -0.00864410400390625, 0.014892578125, 0.03842926025390625, 0.0619659423828125, 0.08550262451171875, 0.109039306640625, 0.13257598876953125, 0.1561126708984375, 0.17964935302734375, 0.20318603515625, 0.22672271728515625, 0.2502593994140625, 0.27379608154296875, 0.297332763671875, 0.32086944580078125, 0.3444061279296875, 0.36794281005859375, 0.3914794921875, 0.41501617431640625, 0.4385528564453125, 0.46208953857421875, 0.485626220703125, 0.5091629028320312, 0.5326995849609375, 0.5562362670898438, 0.57977294921875, 0.6033096313476562, 0.6268463134765625, 0.6503829956054688, 0.673919677734375, 0.6974563598632812, 0.7209930419921875, 0.7445297241210938, 0.76806640625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 2.0, 8.0, 12.0, 6.0, 11.0, 25.0, 22.0, 31.0, 34.0, 34.0, 39.0, 50.0, 43.0, 52.0, 66.0, 65.0, 69.0, 64.0, 56.0, 43.0, 44.0, 43.0, 27.0, 25.0, 29.0, 20.0, 8.0, 6.0, 12.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.234619140625, -0.22672653198242188, -0.21883392333984375, -0.21094131469726562, -0.2030487060546875, -0.19515609741210938, -0.18726348876953125, -0.17937088012695312, -0.171478271484375, -0.16358566284179688, -0.15569305419921875, -0.14780044555664062, -0.1399078369140625, -0.13201522827148438, -0.12412261962890625, -0.11623001098632812, -0.10833740234375, -0.10044479370117188, -0.09255218505859375, -0.08465957641601562, -0.0767669677734375, -0.06887435913085938, -0.06098175048828125, -0.053089141845703125, -0.045196533203125, -0.037303924560546875, -0.02941131591796875, -0.021518707275390625, -0.0136260986328125, -0.005733489990234375, 0.00215911865234375, 0.010051727294921875, 0.0179443359375, 0.025836944580078125, 0.03372955322265625, 0.041622161865234375, 0.0495147705078125, 0.057407379150390625, 0.06529998779296875, 0.07319259643554688, 0.081085205078125, 0.08897781372070312, 0.09687042236328125, 0.10476303100585938, 0.1126556396484375, 0.12054824829101562, 0.12844085693359375, 0.13633346557617188, 0.14422607421875, 0.15211868286132812, 0.16001129150390625, 0.16790390014648438, 0.1757965087890625, 0.18368911743164062, 0.19158172607421875, 0.19947433471679688, 0.207366943359375, 0.21525955200195312, 0.22315216064453125, 0.23104476928710938, 0.2389373779296875, 0.24682998657226562, 0.25472259521484375, 0.2626152038574219, 0.2705078125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 11.0, 10.0, 14.0, 4.0, 14.0, 14.0, 15.0, 23.0, 26.0, 42.0, 51.0, 41.0, 34.0, 42.0, 54.0, 45.0, 47.0, 48.0, 51.0, 48.0, 40.0, 40.0, 44.0, 42.0, 32.0, 33.0, 23.0, 21.0, 16.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6329678297042847, -1.5764333009719849, -1.519898772239685, -1.4633642435073853, -1.4068297147750854, -1.3502951860427856, -1.2937607765197754, -1.2372262477874756, -1.1806917190551758, -1.124157190322876, -1.0676226615905762, -1.0110881328582764, -0.9545536041259766, -0.8980190753936768, -0.8414846062660217, -0.7849500775337219, -0.7284154891967773, -0.6718809604644775, -0.6153464317321777, -0.5588119029998779, -0.5022773742675781, -0.4457428753376007, -0.3892083764076233, -0.3326738476753235, -0.2761393189430237, -0.21960479021072388, -0.16307027637958527, -0.10653576254844666, -0.05000123381614685, 0.006533294916152954, 0.06306779384613037, 0.11960232257843018, 0.17613673210144043, 0.23267126083374023, 0.28920578956604004, 0.34574028849601746, 0.40227481722831726, 0.45880934596061707, 0.5153438448905945, 0.5718783736228943, 0.6284129023551941, 0.6849474310874939, 0.7414819598197937, 0.7980164289474487, 0.8545509576797485, 0.9110854864120483, 0.9676200151443481, 1.024154543876648, 1.0806890726089478, 1.1372236013412476, 1.1937581300735474, 1.2502926588058472, 1.306827187538147, 1.3633617162704468, 1.419896125793457, 1.4764306545257568, 1.5329651832580566, 1.5894997119903564, 1.6460342407226562, 1.702568769454956, 1.7591032981872559, 1.8156378269195557, 1.8721723556518555, 1.9287068843841553, 1.985241413116455]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 16.0, 6.0, 16.0, 16.0, 18.0, 22.0, 23.0, 22.0, 32.0, 30.0, 46.0, 34.0, 39.0, 52.0, 40.0, 35.0, 49.0, 42.0, 42.0, 46.0, 38.0, 35.0, 38.0, 32.0, 35.0, 30.0, 28.0, 21.0, 19.0, 17.0, 14.0, 15.0, 5.0, 6.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3978337049484253, -1.353912115097046, -1.309990406036377, -1.2660688161849976, -1.2221472263336182, -1.1782256364822388, -1.1343040466308594, -1.0903823375701904, -1.046460747718811, -1.0025391578674316, -0.9586175084114075, -0.9146958589553833, -0.8707742691040039, -0.8268526792526245, -0.7829310297966003, -0.7390093803405762, -0.6950877904891968, -0.6511662006378174, -0.6072445511817932, -0.563322901725769, -0.5194013118743896, -0.47547969222068787, -0.4315580725669861, -0.3876364529132843, -0.3437148332595825, -0.29979321360588074, -0.25587159395217896, -0.21194997429847717, -0.1680283546447754, -0.12410673499107361, -0.08018511533737183, -0.036263495683670044, 0.007658123970031738, 0.05157974362373352, 0.0955013632774353, 0.13942298293113708, 0.18334460258483887, 0.22726622223854065, 0.27118784189224243, 0.3151094615459442, 0.359031081199646, 0.4029527008533478, 0.44687432050704956, 0.49079594016075134, 0.5347175598144531, 0.5786391496658325, 0.6225607991218567, 0.6664824485778809, 0.7104040384292603, 0.7543256282806396, 0.7982472777366638, 0.842168927192688, 0.8860905170440674, 0.9300121068954468, 0.973933756351471, 1.0178554058074951, 1.0617769956588745, 1.105698585510254, 1.1496202945709229, 1.1935418844223022, 1.2374634742736816, 1.281385064125061, 1.3253066539764404, 1.3692283630371094, 1.4131499528884888]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 6.0, 13.0, 25.0, 33.0, 57.0, 92.0, 168.0, 263.0, 480.0, 773.0, 1243.0, 2205.0, 3993.0, 7227.0, 12803.0, 23414.0, 42565.0, 76368.0, 134845.0, 227770.0, 360197.0, 510090.0, 622073.0, 637597.0, 540215.0, 391226.0, 252904.0, 151390.0, 86177.0, 48244.0, 26735.0, 14644.0, 8074.0, 4462.0, 2513.0, 1424.0, 809.0, 477.0, 285.0, 168.0, 93.0, 50.0, 41.0, 21.0, 16.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4785308837890625, -1.427764892578125, -1.3769989013671875, -1.32623291015625, -1.2754669189453125, -1.224700927734375, -1.1739349365234375, -1.1231689453125, -1.0724029541015625, -1.021636962890625, -0.9708709716796875, -0.92010498046875, -0.8693389892578125, -0.818572998046875, -0.7678070068359375, -0.717041015625, -0.6662750244140625, -0.615509033203125, -0.5647430419921875, -0.51397705078125, -0.4632110595703125, -0.412445068359375, -0.3616790771484375, -0.3109130859375, -0.2601470947265625, -0.209381103515625, -0.1586151123046875, -0.10784912109375, -0.0570831298828125, -0.006317138671875, 0.0444488525390625, 0.09521484375, 0.1459808349609375, 0.196746826171875, 0.2475128173828125, 0.29827880859375, 0.3490447998046875, 0.399810791015625, 0.4505767822265625, 0.5013427734375, 0.5521087646484375, 0.602874755859375, 0.6536407470703125, 0.70440673828125, 0.7551727294921875, 0.805938720703125, 0.8567047119140625, 0.907470703125, 0.9582366943359375, 1.009002685546875, 1.0597686767578125, 1.11053466796875, 1.1613006591796875, 1.212066650390625, 1.2628326416015625, 1.3135986328125, 1.3643646240234375, 1.415130615234375, 1.4658966064453125, 1.51666259765625, 1.5674285888671875, 1.618194580078125, 1.6689605712890625, 1.7197265625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 8.0, 13.0, 13.0, 15.0, 18.0, 29.0, 25.0, 27.0, 19.0, 30.0, 26.0, 43.0, 40.0, 52.0, 27.0, 33.0, 51.0, 43.0, 37.0, 45.0, 37.0, 31.0, 34.0, 41.0, 40.0, 34.0, 31.0, 27.0, 13.0, 22.0, 14.0, 19.0, 11.0, 10.0, 4.0, 11.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1434173583984375, -1.108123779296875, -1.0728302001953125, -1.03753662109375, -1.0022430419921875, -0.966949462890625, -0.9316558837890625, -0.8963623046875, -0.8610687255859375, -0.825775146484375, -0.7904815673828125, -0.75518798828125, -0.7198944091796875, -0.684600830078125, -0.6493072509765625, -0.614013671875, -0.5787200927734375, -0.543426513671875, -0.5081329345703125, -0.47283935546875, -0.4375457763671875, -0.402252197265625, -0.3669586181640625, -0.3316650390625, -0.2963714599609375, -0.261077880859375, -0.2257843017578125, -0.19049072265625, -0.1551971435546875, -0.119903564453125, -0.0846099853515625, -0.04931640625, -0.0140228271484375, 0.021270751953125, 0.0565643310546875, 0.09185791015625, 0.1271514892578125, 0.162445068359375, 0.1977386474609375, 0.2330322265625, 0.2683258056640625, 0.303619384765625, 0.3389129638671875, 0.37420654296875, 0.4095001220703125, 0.444793701171875, 0.4800872802734375, 0.515380859375, 0.5506744384765625, 0.585968017578125, 0.6212615966796875, 0.65655517578125, 0.6918487548828125, 0.727142333984375, 0.7624359130859375, 0.7977294921875, 0.8330230712890625, 0.868316650390625, 0.9036102294921875, 0.93890380859375, 0.9741973876953125, 1.009490966796875, 1.0447845458984375, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 18.0, 18.0, 42.0, 58.0, 88.0, 126.0, 195.0, 327.0, 564.0, 890.0, 1364.0, 2316.0, 3681.0, 5795.0, 9585.0, 15446.0, 25553.0, 40369.0, 63993.0, 98149.0, 146268.0, 212878.0, 290699.0, 372180.0, 438707.0, 474247.0, 462564.0, 411738.0, 337848.0, 254038.0, 181491.0, 123446.0, 81500.0, 52030.0, 32834.0, 20388.0, 12460.0, 7816.0, 4756.0, 2940.0, 1811.0, 1181.0, 682.0, 464.0, 255.0, 188.0, 111.0, 65.0, 49.0, 28.0, 17.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.388671875, -1.344970703125, -1.30126953125, -1.257568359375, -1.2138671875, -1.170166015625, -1.12646484375, -1.082763671875, -1.0390625, -0.995361328125, -0.95166015625, -0.907958984375, -0.8642578125, -0.820556640625, -0.77685546875, -0.733154296875, -0.689453125, -0.645751953125, -0.60205078125, -0.558349609375, -0.5146484375, -0.470947265625, -0.42724609375, -0.383544921875, -0.33984375, -0.296142578125, -0.25244140625, -0.208740234375, -0.1650390625, -0.121337890625, -0.07763671875, -0.033935546875, 0.009765625, 0.053466796875, 0.09716796875, 0.140869140625, 0.1845703125, 0.228271484375, 0.27197265625, 0.315673828125, 0.359375, 0.403076171875, 0.44677734375, 0.490478515625, 0.5341796875, 0.577880859375, 0.62158203125, 0.665283203125, 0.708984375, 0.752685546875, 0.79638671875, 0.840087890625, 0.8837890625, 0.927490234375, 0.97119140625, 1.014892578125, 1.05859375, 1.102294921875, 1.14599609375, 1.189697265625, 1.2333984375, 1.277099609375, 1.32080078125, 1.364501953125, 1.408203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 14.0, 16.0, 19.0, 20.0, 32.0, 30.0, 31.0, 39.0, 49.0, 58.0, 71.0, 74.0, 109.0, 119.0, 122.0, 127.0, 154.0, 171.0, 174.0, 193.0, 206.0, 210.0, 168.0, 207.0, 190.0, 159.0, 157.0, 140.0, 148.0, 126.0, 119.0, 113.0, 82.0, 79.0, 68.0, 42.0, 45.0, 45.0, 30.0, 27.0, 20.0, 15.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.54931640625, -0.5322036743164062, -0.5150909423828125, -0.49797821044921875, -0.480865478515625, -0.46375274658203125, -0.4466400146484375, -0.42952728271484375, -0.41241455078125, -0.39530181884765625, -0.3781890869140625, -0.36107635498046875, -0.343963623046875, -0.32685089111328125, -0.3097381591796875, -0.29262542724609375, -0.2755126953125, -0.25839996337890625, -0.2412872314453125, -0.22417449951171875, -0.207061767578125, -0.18994903564453125, -0.1728363037109375, -0.15572357177734375, -0.13861083984375, -0.12149810791015625, -0.1043853759765625, -0.08727264404296875, -0.070159912109375, -0.05304718017578125, -0.0359344482421875, -0.01882171630859375, -0.001708984375, 0.01540374755859375, 0.0325164794921875, 0.04962921142578125, 0.066741943359375, 0.08385467529296875, 0.1009674072265625, 0.11808013916015625, 0.13519287109375, 0.15230560302734375, 0.1694183349609375, 0.18653106689453125, 0.203643798828125, 0.22075653076171875, 0.2378692626953125, 0.25498199462890625, 0.2720947265625, 0.28920745849609375, 0.3063201904296875, 0.32343292236328125, 0.340545654296875, 0.35765838623046875, 0.3747711181640625, 0.39188385009765625, 0.40899658203125, 0.42610931396484375, 0.4432220458984375, 0.46033477783203125, 0.477447509765625, 0.49456024169921875, 0.5116729736328125, 0.5287857055664062, 0.5458984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 7.0, 14.0, 15.0, 9.0, 17.0, 16.0, 26.0, 27.0, 28.0, 41.0, 41.0, 48.0, 55.0, 64.0, 52.0, 57.0, 49.0, 62.0, 42.0, 48.0, 49.0, 30.0, 28.0, 28.0, 23.0, 22.0, 24.0, 12.0, 17.0, 11.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.348088264465332, -2.280186176300049, -2.2122840881347656, -2.1443819999694824, -2.0764801502227783, -2.008578062057495, -1.940675973892212, -1.8727738857269287, -1.8048717975616455, -1.7369697093963623, -1.6690677404403687, -1.6011656522750854, -1.5332635641098022, -1.4653615951538086, -1.3974595069885254, -1.3295574188232422, -1.2616554498672485, -1.1937533617019653, -1.1258513927459717, -1.0579493045806885, -0.9900472164154053, -0.9221451878547668, -0.8542431592941284, -0.7863410711288452, -0.7184390425682068, -0.6505370140075684, -0.5826349258422852, -0.5147328972816467, -0.4468308389186859, -0.3789287805557251, -0.31102675199508667, -0.24312469363212585, -0.17522263526916504, -0.10732058435678482, -0.0394185334444046, 0.02848351001739502, 0.09638556838035583, 0.16428762674331665, 0.23218965530395508, 0.3000917136669159, 0.3679937720298767, 0.4358958303928375, 0.5037978887557983, 0.5716999173164368, 0.6396019458770752, 0.7075040340423584, 0.7754060626029968, 0.8433080911636353, 0.9112101793289185, 0.9791122078895569, 1.0470142364501953, 1.1149163246154785, 1.1828184127807617, 1.250720500946045, 1.3186224699020386, 1.3865245580673218, 1.4544265270233154, 1.5223286151885986, 1.5902305841445923, 1.6581326723098755, 1.7260347604751587, 1.7939367294311523, 1.8618388175964355, 1.9297409057617188, 1.997642993927002]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 12.0, 9.0, 12.0, 18.0, 15.0, 23.0, 14.0, 24.0, 18.0, 29.0, 36.0, 47.0, 40.0, 33.0, 39.0, 46.0, 42.0, 39.0, 41.0, 51.0, 44.0, 42.0, 49.0, 30.0, 27.0, 26.0, 26.0, 31.0, 19.0, 19.0, 16.0, 17.0, 11.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.7488301992416382, -1.7021123170852661, -1.6553945541381836, -1.6086766719818115, -1.561958909034729, -1.515241026878357, -1.4685232639312744, -1.4218053817749023, -1.3750876188278198, -1.3283697366714478, -1.2816519737243652, -1.2349340915679932, -1.1882163286209106, -1.1414984464645386, -1.094780683517456, -1.048062801361084, -1.001344919204712, -0.9546270966529846, -0.9079092741012573, -0.86119145154953, -0.8144736289978027, -0.7677558064460754, -0.7210379838943481, -0.6743201017379761, -0.6276023387908936, -0.5808845162391663, -0.534166693687439, -0.48744887113571167, -0.4407310485839844, -0.3940132260322571, -0.3472953736782074, -0.3005775511264801, -0.2538597583770752, -0.2071419358253479, -0.1604241132736206, -0.11370627582073212, -0.06698845326900482, -0.020270630717277527, 0.026447206735610962, 0.07316502928733826, 0.11988285183906555, 0.16660067439079285, 0.21331849694252014, 0.2600363492965698, 0.3067541718482971, 0.3534719944000244, 0.4001898169517517, 0.446907639503479, 0.4936254620552063, 0.5403432846069336, 0.5870611071586609, 0.6337789297103882, 0.6804967522621155, 0.7272145748138428, 0.7739324569702148, 0.8206502199172974, 0.8673681020736694, 0.9140859246253967, 0.960803747177124, 1.007521629333496, 1.0542393922805786, 1.1009572744369507, 1.1476750373840332, 1.1943929195404053, 1.2411106824874878]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 11.0, 23.0, 20.0, 47.0, 77.0, 111.0, 146.0, 239.0, 363.0, 558.0, 883.0, 1192.0, 2080.0, 3223.0, 4981.0, 8184.0, 13213.0, 21773.0, 36158.0, 58197.0, 92153.0, 137461.0, 174055.0, 164789.0, 121882.0, 78916.0, 49423.0, 30329.0, 18173.0, 11106.0, 6880.0, 4364.0, 2661.0, 1746.0, 1066.0, 699.0, 425.0, 289.0, 197.0, 147.0, 114.0, 68.0, 41.0, 25.0, 22.0, 12.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.343505859375, -0.3323631286621094, -0.32122039794921875, -0.3100776672363281, -0.2989349365234375, -0.2877922058105469, -0.27664947509765625, -0.2655067443847656, -0.254364013671875, -0.24322128295898438, -0.23207855224609375, -0.22093582153320312, -0.2097930908203125, -0.19865036010742188, -0.18750762939453125, -0.17636489868164062, -0.16522216796875, -0.15407943725585938, -0.14293670654296875, -0.13179397583007812, -0.1206512451171875, -0.10950851440429688, -0.09836578369140625, -0.08722305297851562, -0.076080322265625, -0.06493759155273438, -0.05379486083984375, -0.042652130126953125, -0.0315093994140625, -0.020366668701171875, -0.00922393798828125, 0.001918792724609375, 0.0130615234375, 0.024204254150390625, 0.03534698486328125, 0.046489715576171875, 0.0576324462890625, 0.06877517700195312, 0.07991790771484375, 0.09106063842773438, 0.102203369140625, 0.11334609985351562, 0.12448883056640625, 0.13563156127929688, 0.1467742919921875, 0.15791702270507812, 0.16905975341796875, 0.18020248413085938, 0.19134521484375, 0.20248794555664062, 0.21363067626953125, 0.22477340698242188, 0.2359161376953125, 0.24705886840820312, 0.25820159912109375, 0.2693443298339844, 0.280487060546875, 0.2916297912597656, 0.30277252197265625, 0.3139152526855469, 0.3250579833984375, 0.3362007141113281, 0.34734344482421875, 0.3584861755371094, 0.36962890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 8.0, 12.0, 12.0, 21.0, 19.0, 21.0, 30.0, 28.0, 34.0, 27.0, 26.0, 35.0, 42.0, 40.0, 52.0, 40.0, 38.0, 34.0, 51.0, 34.0, 43.0, 51.0, 43.0, 37.0, 28.0, 16.0, 30.0, 23.0, 16.0, 27.0, 10.0, 12.0, 12.0, 7.0, 6.0, 8.0, 1.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7933349609375, -1.741943359375, -1.6905517578125, -1.63916015625, -1.5877685546875, -1.536376953125, -1.4849853515625, -1.43359375, -1.3822021484375, -1.330810546875, -1.2794189453125, -1.22802734375, -1.1766357421875, -1.125244140625, -1.0738525390625, -1.0224609375, -0.9710693359375, -0.919677734375, -0.8682861328125, -0.81689453125, -0.7655029296875, -0.714111328125, -0.6627197265625, -0.611328125, -0.5599365234375, -0.508544921875, -0.4571533203125, -0.40576171875, -0.3543701171875, -0.302978515625, -0.2515869140625, -0.2001953125, -0.1488037109375, -0.097412109375, -0.0460205078125, 0.00537109375, 0.0567626953125, 0.108154296875, 0.1595458984375, 0.2109375, 0.2623291015625, 0.313720703125, 0.3651123046875, 0.41650390625, 0.4678955078125, 0.519287109375, 0.5706787109375, 0.6220703125, 0.6734619140625, 0.724853515625, 0.7762451171875, 0.82763671875, 0.8790283203125, 0.930419921875, 0.9818115234375, 1.033203125, 1.0845947265625, 1.135986328125, 1.1873779296875, 1.23876953125, 1.2901611328125, 1.341552734375, 1.3929443359375, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 9.0, 20.0, 31.0, 26.0, 39.0, 78.0, 102.0, 152.0, 248.0, 371.0, 628.0, 1072.0, 1912.0, 3275.0, 5853.0, 11076.0, 20867.0, 40352.0, 77504.0, 140286.0, 212390.0, 215760.0, 146346.0, 80335.0, 42153.0, 21871.0, 11529.0, 6166.0, 3297.0, 1877.0, 1071.0, 650.0, 395.0, 272.0, 172.0, 89.0, 75.0, 47.0, 47.0, 23.0, 10.0, 18.0, 11.0, 9.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49560546875, -0.4806022644042969, -0.46559906005859375, -0.4505958557128906, -0.4355926513671875, -0.4205894470214844, -0.40558624267578125, -0.3905830383300781, -0.375579833984375, -0.3605766296386719, -0.34557342529296875, -0.3305702209472656, -0.3155670166015625, -0.3005638122558594, -0.28556060791015625, -0.2705574035644531, -0.25555419921875, -0.24055099487304688, -0.22554779052734375, -0.21054458618164062, -0.1955413818359375, -0.18053817749023438, -0.16553497314453125, -0.15053176879882812, -0.135528564453125, -0.12052536010742188, -0.10552215576171875, -0.09051895141601562, -0.0755157470703125, -0.060512542724609375, -0.04550933837890625, -0.030506134033203125, -0.0155029296875, -0.000499725341796875, 0.01450347900390625, 0.029506683349609375, 0.0445098876953125, 0.059513092041015625, 0.07451629638671875, 0.08951950073242188, 0.104522705078125, 0.11952590942382812, 0.13452911376953125, 0.14953231811523438, 0.1645355224609375, 0.17953872680664062, 0.19454193115234375, 0.20954513549804688, 0.22454833984375, 0.23955154418945312, 0.25455474853515625, 0.2695579528808594, 0.2845611572265625, 0.2995643615722656, 0.31456756591796875, 0.3295707702636719, 0.344573974609375, 0.3595771789550781, 0.37458038330078125, 0.3895835876464844, 0.4045867919921875, 0.4195899963378906, 0.43459320068359375, 0.4495964050292969, 0.464599609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 9.0, 3.0, 15.0, 12.0, 10.0, 17.0, 16.0, 23.0, 12.0, 32.0, 34.0, 40.0, 34.0, 51.0, 44.0, 53.0, 38.0, 37.0, 48.0, 40.0, 50.0, 42.0, 34.0, 39.0, 35.0, 36.0, 32.0, 29.0, 26.0, 22.0, 17.0, 21.0, 11.0, 8.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9091796875, -0.8769073486328125, -0.844635009765625, -0.8123626708984375, -0.78009033203125, -0.7478179931640625, -0.715545654296875, -0.6832733154296875, -0.6510009765625, -0.6187286376953125, -0.586456298828125, -0.5541839599609375, -0.52191162109375, -0.4896392822265625, -0.457366943359375, -0.4250946044921875, -0.392822265625, -0.3605499267578125, -0.328277587890625, -0.2960052490234375, -0.26373291015625, -0.2314605712890625, -0.199188232421875, -0.1669158935546875, -0.1346435546875, -0.1023712158203125, -0.070098876953125, -0.0378265380859375, -0.00555419921875, 0.0267181396484375, 0.058990478515625, 0.0912628173828125, 0.12353515625, 0.1558074951171875, 0.188079833984375, 0.2203521728515625, 0.25262451171875, 0.2848968505859375, 0.317169189453125, 0.3494415283203125, 0.3817138671875, 0.4139862060546875, 0.446258544921875, 0.4785308837890625, 0.51080322265625, 0.5430755615234375, 0.575347900390625, 0.6076202392578125, 0.639892578125, 0.6721649169921875, 0.704437255859375, 0.7367095947265625, 0.76898193359375, 0.8012542724609375, 0.833526611328125, 0.8657989501953125, 0.8980712890625, 0.9303436279296875, 0.962615966796875, 0.9948883056640625, 1.02716064453125, 1.0594329833984375, 1.091705322265625, 1.1239776611328125, 1.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 4.0, 9.0, 6.0, 17.0, 19.0, 29.0, 34.0, 51.0, 65.0, 86.0, 133.0, 175.0, 242.0, 401.0, 768.0, 1356.0, 2700.0, 6069.0, 16988.0, 70262.0, 511066.0, 363189.0, 50721.0, 13666.0, 5096.0, 2273.0, 1161.0, 669.0, 425.0, 267.0, 157.0, 124.0, 79.0, 57.0, 33.0, 30.0, 23.0, 18.0, 17.0, 14.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.47998046875, -0.4662284851074219, -0.45247650146484375, -0.4387245178222656, -0.4249725341796875, -0.4112205505371094, -0.39746856689453125, -0.3837165832519531, -0.369964599609375, -0.3562126159667969, -0.34246063232421875, -0.3287086486816406, -0.3149566650390625, -0.3012046813964844, -0.28745269775390625, -0.2737007141113281, -0.25994873046875, -0.24619674682617188, -0.23244476318359375, -0.21869277954101562, -0.2049407958984375, -0.19118881225585938, -0.17743682861328125, -0.16368484497070312, -0.149932861328125, -0.13618087768554688, -0.12242889404296875, -0.10867691040039062, -0.0949249267578125, -0.08117294311523438, -0.06742095947265625, -0.053668975830078125, -0.0399169921875, -0.026165008544921875, -0.01241302490234375, 0.001338958740234375, 0.0150909423828125, 0.028842926025390625, 0.04259490966796875, 0.056346893310546875, 0.070098876953125, 0.08385086059570312, 0.09760284423828125, 0.11135482788085938, 0.1251068115234375, 0.13885879516601562, 0.15261077880859375, 0.16636276245117188, 0.18011474609375, 0.19386672973632812, 0.20761871337890625, 0.22137069702148438, 0.2351226806640625, 0.24887466430664062, 0.26262664794921875, 0.2763786315917969, 0.290130615234375, 0.3038825988769531, 0.31763458251953125, 0.3313865661621094, 0.3451385498046875, 0.3588905334472656, 0.37264251708984375, 0.3863945007324219, 0.400146484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 20.0, 21.0, 21.0, 43.0, 45.0, 60.0, 68.0, 90.0, 97.0, 97.0, 79.0, 96.0, 56.0, 61.0, 38.0, 34.0, 21.0, 8.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.907162368297577e-05, -1.841410994529724e-05, -1.7756596207618713e-05, -1.7099082469940186e-05, -1.6441568732261658e-05, -1.578405499458313e-05, -1.5126541256904602e-05, -1.4469027519226074e-05, -1.3811513781547546e-05, -1.3154000043869019e-05, -1.249648630619049e-05, -1.1838972568511963e-05, -1.1181458830833435e-05, -1.0523945093154907e-05, -9.86643135547638e-06, -9.208917617797852e-06, -8.551403880119324e-06, -7.893890142440796e-06, -7.236376404762268e-06, -6.57886266708374e-06, -5.921348929405212e-06, -5.2638351917266846e-06, -4.606321454048157e-06, -3.948807716369629e-06, -3.291293978691101e-06, -2.6337802410125732e-06, -1.9762665033340454e-06, -1.3187527656555176e-06, -6.612390279769897e-07, -3.725290298461914e-09, 6.537884473800659e-07, 1.3113021850585938e-06, 1.9688159227371216e-06, 2.6263296604156494e-06, 3.2838433980941772e-06, 3.941357135772705e-06, 4.598870873451233e-06, 5.256384611129761e-06, 5.9138983488082886e-06, 6.571412086486816e-06, 7.228925824165344e-06, 7.886439561843872e-06, 8.5439532995224e-06, 9.201467037200928e-06, 9.858980774879456e-06, 1.0516494512557983e-05, 1.1174008250236511e-05, 1.1831521987915039e-05, 1.2489035725593567e-05, 1.3146549463272095e-05, 1.3804063200950623e-05, 1.446157693862915e-05, 1.5119090676307678e-05, 1.5776604413986206e-05, 1.6434118151664734e-05, 1.7091631889343262e-05, 1.774914562702179e-05, 1.8406659364700317e-05, 1.9064173102378845e-05, 1.9721686840057373e-05, 2.03792005777359e-05, 2.103671431541443e-05, 2.1694228053092957e-05, 2.2351741790771484e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 19.0, 19.0, 34.0, 47.0, 37.0, 83.0, 87.0, 142.0, 181.0, 217.0, 326.0, 407.0, 591.0, 808.0, 1166.0, 1744.0, 3056.0, 6147.0, 14618.0, 44795.0, 169416.0, 469661.0, 238226.0, 60446.0, 18656.0, 7510.0, 3536.0, 2064.0, 1343.0, 893.0, 569.0, 415.0, 330.0, 246.0, 163.0, 148.0, 97.0, 81.0, 60.0, 39.0, 23.0, 28.0, 16.0, 17.0, 8.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.372314453125, -0.35930633544921875, -0.3462982177734375, -0.33329010009765625, -0.320281982421875, -0.30727386474609375, -0.2942657470703125, -0.28125762939453125, -0.26824951171875, -0.25524139404296875, -0.2422332763671875, -0.22922515869140625, -0.216217041015625, -0.20320892333984375, -0.1902008056640625, -0.17719268798828125, -0.1641845703125, -0.15117645263671875, -0.1381683349609375, -0.12516021728515625, -0.112152099609375, -0.09914398193359375, -0.0861358642578125, -0.07312774658203125, -0.06011962890625, -0.04711151123046875, -0.0341033935546875, -0.02109527587890625, -0.008087158203125, 0.00492095947265625, 0.0179290771484375, 0.03093719482421875, 0.0439453125, 0.05695343017578125, 0.0699615478515625, 0.08296966552734375, 0.095977783203125, 0.10898590087890625, 0.1219940185546875, 0.13500213623046875, 0.14801025390625, 0.16101837158203125, 0.1740264892578125, 0.18703460693359375, 0.200042724609375, 0.21305084228515625, 0.2260589599609375, 0.23906707763671875, 0.2520751953125, 0.26508331298828125, 0.2780914306640625, 0.29109954833984375, 0.304107666015625, 0.31711578369140625, 0.3301239013671875, 0.34313201904296875, 0.35614013671875, 0.36914825439453125, 0.3821563720703125, 0.39516448974609375, 0.408172607421875, 0.42118072509765625, 0.4341888427734375, 0.44719696044921875, 0.460205078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 10.0, 4.0, 10.0, 17.0, 22.0, 34.0, 32.0, 49.0, 59.0, 91.0, 123.0, 127.0, 113.0, 66.0, 53.0, 51.0, 26.0, 22.0, 16.0, 15.0, 9.0, 3.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07037353515625, -0.06778240203857422, -0.06519126892089844, -0.06260013580322266, -0.060009002685546875, -0.057417869567871094, -0.05482673645019531, -0.05223560333251953, -0.04964447021484375, -0.04705333709716797, -0.04446220397949219, -0.041871070861816406, -0.039279937744140625, -0.036688804626464844, -0.03409767150878906, -0.03150653839111328, -0.0289154052734375, -0.02632427215576172, -0.023733139038085938, -0.021142005920410156, -0.018550872802734375, -0.015959739685058594, -0.013368606567382812, -0.010777473449707031, -0.00818634033203125, -0.005595207214355469, -0.0030040740966796875, -0.00041294097900390625, 0.002178192138671875, 0.004769325256347656, 0.0073604583740234375, 0.009951591491699219, 0.012542724609375, 0.015133857727050781, 0.017724990844726562, 0.020316123962402344, 0.022907257080078125, 0.025498390197753906, 0.028089523315429688, 0.03068065643310547, 0.03327178955078125, 0.03586292266845703, 0.03845405578613281, 0.041045188903808594, 0.043636322021484375, 0.046227455139160156, 0.04881858825683594, 0.05140972137451172, 0.0540008544921875, 0.05659198760986328, 0.05918312072753906, 0.061774253845214844, 0.06436538696289062, 0.0669565200805664, 0.06954765319824219, 0.07213878631591797, 0.07472991943359375, 0.07732105255126953, 0.07991218566894531, 0.0825033187866211, 0.08509445190429688, 0.08768558502197266, 0.09027671813964844, 0.09286785125732422, 0.095458984375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 18.0, 11.0, 19.0, 15.0, 33.0, 24.0, 36.0, 47.0, 32.0, 59.0, 61.0, 55.0, 60.0, 58.0, 49.0, 56.0, 40.0, 53.0, 39.0, 26.0, 28.0, 24.0, 22.0, 28.0, 12.0, 12.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4011058807373047, -2.3326547145843506, -2.2642035484313965, -2.1957523822784424, -2.1273012161254883, -2.058850049972534, -1.9903987646102905, -1.9219475984573364, -1.8534964323043823, -1.7850452661514282, -1.7165940999984741, -1.64814293384552, -1.5796916484832764, -1.5112404823303223, -1.4427893161773682, -1.374338150024414, -1.30588698387146, -1.2374358177185059, -1.1689846515655518, -1.1005334854125977, -1.0320823192596436, -0.9636310935020447, -0.8951798677444458, -0.8267287015914917, -0.7582775354385376, -0.6898263692855835, -0.6213752031326294, -0.5529239773750305, -0.4844728112220764, -0.4160216450691223, -0.3475704491138458, -0.27911925315856934, -0.21066796779632568, -0.1422167867422104, -0.07376560568809509, -0.005314424633979797, 0.0631367564201355, 0.1315879225730896, 0.2000391185283661, 0.2684903144836426, 0.3369414806365967, 0.4053926467895508, 0.47384384274482727, 0.5422950387001038, 0.6107462048530579, 0.679197371006012, 0.7476485967636108, 0.8160997629165649, 0.884550929069519, 0.9530020952224731, 1.0214532613754272, 1.0899044275283813, 1.158355712890625, 1.226806879043579, 1.2952580451965332, 1.3637092113494873, 1.4321603775024414, 1.5006115436553955, 1.5690627098083496, 1.6375138759613037, 1.7059650421142578, 1.774416208267212, 1.8428674936294556, 1.9113186597824097, 1.9797698259353638]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 23.0, 15.0, 22.0, 15.0, 22.0, 19.0, 31.0, 35.0, 46.0, 43.0, 30.0, 41.0, 52.0, 41.0, 38.0, 51.0, 41.0, 44.0, 44.0, 47.0, 27.0, 26.0, 29.0, 31.0, 25.0, 17.0, 20.0, 18.0, 12.0, 14.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.7654094696044922, -1.7181633710861206, -1.6709171533584595, -1.623671054840088, -1.5764248371124268, -1.5291787385940552, -1.4819326400756836, -1.4346864223480225, -1.3874403238296509, -1.3401942253112793, -1.2929480075836182, -1.2457019090652466, -1.198455810546875, -1.1512095928192139, -1.1039634943008423, -1.0567173957824707, -1.0094711780548096, -0.9622250199317932, -0.9149788618087769, -0.8677327632904053, -0.8204866051673889, -0.7732404470443726, -0.725994348526001, -0.6787481904029846, -0.6315020322799683, -0.5842558741569519, -0.5370097160339355, -0.48976361751556396, -0.4425174593925476, -0.39527130126953125, -0.3480251729488373, -0.3007790446281433, -0.25353288650512695, -0.2062867432832718, -0.15904060006141663, -0.11179445683956146, -0.0645483136177063, -0.017302170395851135, 0.02994397282600403, 0.077190101146698, 0.12443625926971436, 0.17168240249156952, 0.21892854571342468, 0.26617467403411865, 0.313420832157135, 0.36066699028015137, 0.40791311860084534, 0.4551592469215393, 0.5024054050445557, 0.549651563167572, 0.5968977212905884, 0.64414381980896, 0.6913899779319763, 0.7386361360549927, 0.7858822345733643, 0.8331283926963806, 0.880374550819397, 0.9276207089424133, 0.9748668670654297, 1.0221129655838013, 1.0693590641021729, 1.116605281829834, 1.1638513803482056, 1.2110974788665771, 1.2583436965942383]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 8.0, 15.0, 14.0, 25.0, 55.0, 81.0, 128.0, 197.0, 338.0, 544.0, 797.0, 1232.0, 1752.0, 2857.0, 4235.0, 6360.0, 9471.0, 13672.0, 19373.0, 27283.0, 36458.0, 47943.0, 60727.0, 72949.0, 84306.0, 91300.0, 93304.0, 90939.0, 83174.0, 71981.0, 59448.0, 46977.0, 35271.0, 26278.0, 18658.0, 13315.0, 9156.0, 6069.0, 4165.0, 2670.0, 1849.0, 1127.0, 762.0, 437.0, 297.0, 231.0, 133.0, 78.0, 47.0, 33.0, 19.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8684616088867188, -0.8389739990234375, -0.8094863891601562, -0.779998779296875, -0.7505111694335938, -0.7210235595703125, -0.6915359497070312, -0.66204833984375, -0.6325607299804688, -0.6030731201171875, -0.5735855102539062, -0.544097900390625, -0.5146102905273438, -0.4851226806640625, -0.45563507080078125, -0.4261474609375, -0.39665985107421875, -0.3671722412109375, -0.33768463134765625, -0.308197021484375, -0.27870941162109375, -0.2492218017578125, -0.21973419189453125, -0.19024658203125, -0.16075897216796875, -0.1312713623046875, -0.10178375244140625, -0.072296142578125, -0.04280853271484375, -0.0133209228515625, 0.01616668701171875, 0.045654296875, 0.07514190673828125, 0.1046295166015625, 0.13411712646484375, 0.163604736328125, 0.19309234619140625, 0.2225799560546875, 0.25206756591796875, 0.28155517578125, 0.31104278564453125, 0.3405303955078125, 0.37001800537109375, 0.399505615234375, 0.42899322509765625, 0.4584808349609375, 0.48796844482421875, 0.5174560546875, 0.5469436645507812, 0.5764312744140625, 0.6059188842773438, 0.635406494140625, 0.6648941040039062, 0.6943817138671875, 0.7238693237304688, 0.75335693359375, 0.7828445434570312, 0.8123321533203125, 0.8418197631835938, 0.871307373046875, 0.9007949829101562, 0.9302825927734375, 0.9597702026367188, 0.9892578125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 9.0, 10.0, 6.0, 6.0, 5.0, 15.0, 15.0, 20.0, 16.0, 21.0, 26.0, 43.0, 33.0, 31.0, 40.0, 37.0, 50.0, 41.0, 45.0, 42.0, 37.0, 36.0, 48.0, 45.0, 41.0, 46.0, 32.0, 26.0, 29.0, 22.0, 16.0, 32.0, 9.0, 19.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.822265625, -1.7723846435546875, -1.722503662109375, -1.6726226806640625, -1.62274169921875, -1.5728607177734375, -1.522979736328125, -1.4730987548828125, -1.4232177734375, -1.3733367919921875, -1.323455810546875, -1.2735748291015625, -1.22369384765625, -1.1738128662109375, -1.123931884765625, -1.0740509033203125, -1.024169921875, -0.9742889404296875, -0.924407958984375, -0.8745269775390625, -0.82464599609375, -0.7747650146484375, -0.724884033203125, -0.6750030517578125, -0.6251220703125, -0.5752410888671875, -0.525360107421875, -0.4754791259765625, -0.42559814453125, -0.3757171630859375, -0.325836181640625, -0.2759552001953125, -0.22607421875, -0.1761932373046875, -0.126312255859375, -0.0764312744140625, -0.02655029296875, 0.0233306884765625, 0.073211669921875, 0.1230926513671875, 0.1729736328125, 0.2228546142578125, 0.272735595703125, 0.3226165771484375, 0.37249755859375, 0.4223785400390625, 0.472259521484375, 0.5221405029296875, 0.572021484375, 0.6219024658203125, 0.671783447265625, 0.7216644287109375, 0.77154541015625, 0.8214263916015625, 0.871307373046875, 0.9211883544921875, 0.9710693359375, 1.0209503173828125, 1.070831298828125, 1.1207122802734375, 1.17059326171875, 1.2204742431640625, 1.270355224609375, 1.3202362060546875, 1.3701171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 29.0, 34.0, 61.0, 110.0, 157.0, 240.0, 434.0, 709.0, 1150.0, 1840.0, 3092.0, 4683.0, 7584.0, 11518.0, 17911.0, 26462.0, 37853.0, 52354.0, 68496.0, 84795.0, 98785.0, 105512.0, 105893.0, 98562.0, 84539.0, 68253.0, 52906.0, 38203.0, 26530.0, 17758.0, 11975.0, 7527.0, 4816.0, 3004.0, 1841.0, 1144.0, 702.0, 449.0, 256.0, 144.0, 82.0, 57.0, 32.0, 23.0, 24.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9275665283203125, -0.893218994140625, -0.8588714599609375, -0.82452392578125, -0.7901763916015625, -0.755828857421875, -0.7214813232421875, -0.6871337890625, -0.6527862548828125, -0.618438720703125, -0.5840911865234375, -0.54974365234375, -0.5153961181640625, -0.481048583984375, -0.4467010498046875, -0.412353515625, -0.3780059814453125, -0.343658447265625, -0.3093109130859375, -0.27496337890625, -0.2406158447265625, -0.206268310546875, -0.1719207763671875, -0.1375732421875, -0.1032257080078125, -0.068878173828125, -0.0345306396484375, -0.00018310546875, 0.0341644287109375, 0.068511962890625, 0.1028594970703125, 0.13720703125, 0.1715545654296875, 0.205902099609375, 0.2402496337890625, 0.27459716796875, 0.3089447021484375, 0.343292236328125, 0.3776397705078125, 0.4119873046875, 0.4463348388671875, 0.480682373046875, 0.5150299072265625, 0.54937744140625, 0.5837249755859375, 0.618072509765625, 0.6524200439453125, 0.686767578125, 0.7211151123046875, 0.755462646484375, 0.7898101806640625, 0.82415771484375, 0.8585052490234375, 0.892852783203125, 0.9272003173828125, 0.9615478515625, 0.9958953857421875, 1.030242919921875, 1.0645904541015625, 1.09893798828125, 1.1332855224609375, 1.167633056640625, 1.2019805908203125, 1.236328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 13.0, 11.0, 23.0, 25.0, 24.0, 21.0, 35.0, 26.0, 33.0, 36.0, 44.0, 45.0, 40.0, 41.0, 44.0, 53.0, 36.0, 49.0, 40.0, 42.0, 31.0, 28.0, 26.0, 30.0, 31.0, 24.0, 22.0, 18.0, 16.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.9163818359375, -0.885986328125, -0.8555908203125, -0.8251953125, -0.7947998046875, -0.764404296875, -0.7340087890625, -0.70361328125, -0.6732177734375, -0.642822265625, -0.6124267578125, -0.58203125, -0.5516357421875, -0.521240234375, -0.4908447265625, -0.46044921875, -0.4300537109375, -0.399658203125, -0.3692626953125, -0.3388671875, -0.3084716796875, -0.278076171875, -0.2476806640625, -0.21728515625, -0.1868896484375, -0.156494140625, -0.1260986328125, -0.095703125, -0.0653076171875, -0.034912109375, -0.0045166015625, 0.02587890625, 0.0562744140625, 0.086669921875, 0.1170654296875, 0.1474609375, 0.1778564453125, 0.208251953125, 0.2386474609375, 0.26904296875, 0.2994384765625, 0.329833984375, 0.3602294921875, 0.390625, 0.4210205078125, 0.451416015625, 0.4818115234375, 0.51220703125, 0.5426025390625, 0.572998046875, 0.6033935546875, 0.6337890625, 0.6641845703125, 0.694580078125, 0.7249755859375, 0.75537109375, 0.7857666015625, 0.816162109375, 0.8465576171875, 0.876953125, 0.9073486328125, 0.937744140625, 0.9681396484375, 0.99853515625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 7.0, 13.0, 20.0, 28.0, 53.0, 79.0, 105.0, 174.0, 261.0, 406.0, 630.0, 997.0, 1690.0, 2523.0, 4260.0, 6978.0, 11316.0, 17798.0, 28071.0, 42237.0, 61801.0, 84552.0, 106911.0, 122931.0, 126065.0, 115297.0, 96278.0, 72106.0, 51564.0, 34392.0, 22055.0, 14036.0, 8641.0, 5505.0, 3283.0, 1967.0, 1261.0, 832.0, 511.0, 333.0, 210.0, 130.0, 85.0, 53.0, 46.0, 24.0, 17.0, 6.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.654296875, -0.634613037109375, -0.61492919921875, -0.595245361328125, -0.5755615234375, -0.555877685546875, -0.53619384765625, -0.516510009765625, -0.496826171875, -0.477142333984375, -0.45745849609375, -0.437774658203125, -0.4180908203125, -0.398406982421875, -0.37872314453125, -0.359039306640625, -0.33935546875, -0.319671630859375, -0.29998779296875, -0.280303955078125, -0.2606201171875, -0.240936279296875, -0.22125244140625, -0.201568603515625, -0.181884765625, -0.162200927734375, -0.14251708984375, -0.122833251953125, -0.1031494140625, -0.083465576171875, -0.06378173828125, -0.044097900390625, -0.0244140625, -0.004730224609375, 0.01495361328125, 0.034637451171875, 0.0543212890625, 0.074005126953125, 0.09368896484375, 0.113372802734375, 0.133056640625, 0.152740478515625, 0.17242431640625, 0.192108154296875, 0.2117919921875, 0.231475830078125, 0.25115966796875, 0.270843505859375, 0.29052734375, 0.310211181640625, 0.32989501953125, 0.349578857421875, 0.3692626953125, 0.388946533203125, 0.40863037109375, 0.428314208984375, 0.447998046875, 0.467681884765625, 0.48736572265625, 0.507049560546875, 0.5267333984375, 0.546417236328125, 0.56610107421875, 0.585784912109375, 0.60546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0, 9.0, 2.0, 10.0, 11.0, 16.0, 7.0, 16.0, 16.0, 21.0, 24.0, 36.0, 43.0, 44.0, 47.0, 47.0, 43.0, 38.0, 31.0, 49.0, 54.0, 54.0, 47.0, 47.0, 45.0, 33.0, 37.0, 34.0, 20.0, 22.0, 21.0, 16.0, 18.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.736682891845703e-05, -7.528718560934067e-05, -7.32075423002243e-05, -7.112789899110794e-05, -6.904825568199158e-05, -6.696861237287521e-05, -6.488896906375885e-05, -6.280932575464249e-05, -6.072968244552612e-05, -5.865003913640976e-05, -5.6570395827293396e-05, -5.449075251817703e-05, -5.241110920906067e-05, -5.0331465899944305e-05, -4.825182259082794e-05, -4.617217928171158e-05, -4.4092535972595215e-05, -4.201289266347885e-05, -3.993324935436249e-05, -3.7853606045246124e-05, -3.577396273612976e-05, -3.36943194270134e-05, -3.1614676117897034e-05, -2.953503280878067e-05, -2.7455389499664307e-05, -2.5375746190547943e-05, -2.329610288143158e-05, -2.1216459572315216e-05, -1.9136816263198853e-05, -1.705717295408249e-05, -1.4977529644966125e-05, -1.2897886335849762e-05, -1.0818243026733398e-05, -8.738599717617035e-06, -6.658956408500671e-06, -4.579313099384308e-06, -2.4996697902679443e-06, -4.200264811515808e-07, 1.6596168279647827e-06, 3.7392601370811462e-06, 5.81890344619751e-06, 7.898546755313873e-06, 9.978190064430237e-06, 1.20578333735466e-05, 1.4137476682662964e-05, 1.6217119991779327e-05, 1.829676330089569e-05, 2.0376406610012054e-05, 2.2456049919128418e-05, 2.453569322824478e-05, 2.6615336537361145e-05, 2.869497984647751e-05, 3.077462315559387e-05, 3.2854266464710236e-05, 3.49339097738266e-05, 3.701355308294296e-05, 3.9093196392059326e-05, 4.117283970117569e-05, 4.325248301029205e-05, 4.533212631940842e-05, 4.741176962852478e-05, 4.9491412937641144e-05, 5.157105624675751e-05, 5.365069955587387e-05, 5.5730342864990234e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 7.0, 17.0, 30.0, 34.0, 49.0, 73.0, 124.0, 189.0, 261.0, 408.0, 609.0, 955.0, 1427.0, 2153.0, 3295.0, 4967.0, 7789.0, 11594.0, 17740.0, 25976.0, 37427.0, 52088.0, 69389.0, 87052.0, 102017.0, 110650.0, 109008.0, 99364.0, 83872.0, 65065.0, 49103.0, 34702.0, 24081.0, 16095.0, 10594.0, 7042.0, 4707.0, 2985.0, 1938.0, 1269.0, 880.0, 544.0, 339.0, 236.0, 130.0, 91.0, 70.0, 41.0, 22.0, 20.0, 16.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.57080078125, -0.5529022216796875, -0.535003662109375, -0.5171051025390625, -0.49920654296875, -0.4813079833984375, -0.463409423828125, -0.4455108642578125, -0.4276123046875, -0.4097137451171875, -0.391815185546875, -0.3739166259765625, -0.35601806640625, -0.3381195068359375, -0.320220947265625, -0.3023223876953125, -0.284423828125, -0.2665252685546875, -0.248626708984375, -0.2307281494140625, -0.21282958984375, -0.1949310302734375, -0.177032470703125, -0.1591339111328125, -0.1412353515625, -0.1233367919921875, -0.105438232421875, -0.0875396728515625, -0.06964111328125, -0.0517425537109375, -0.033843994140625, -0.0159454345703125, 0.001953125, 0.0198516845703125, 0.037750244140625, 0.0556488037109375, 0.07354736328125, 0.0914459228515625, 0.109344482421875, 0.1272430419921875, 0.1451416015625, 0.1630401611328125, 0.180938720703125, 0.1988372802734375, 0.21673583984375, 0.2346343994140625, 0.252532958984375, 0.2704315185546875, 0.288330078125, 0.3062286376953125, 0.324127197265625, 0.3420257568359375, 0.35992431640625, 0.3778228759765625, 0.395721435546875, 0.4136199951171875, 0.4315185546875, 0.4494171142578125, 0.467315673828125, 0.4852142333984375, 0.50311279296875, 0.5210113525390625, 0.538909912109375, 0.5568084716796875, 0.57470703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 10.0, 19.0, 16.0, 18.0, 22.0, 29.0, 20.0, 31.0, 34.0, 35.0, 39.0, 40.0, 50.0, 38.0, 51.0, 52.0, 52.0, 55.0, 34.0, 49.0, 38.0, 42.0, 39.0, 38.0, 28.0, 21.0, 20.0, 8.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1801280975341797, -0.17263412475585938, -0.16514015197753906, -0.15764617919921875, -0.15015220642089844, -0.14265823364257812, -0.1351642608642578, -0.1276702880859375, -0.12017631530761719, -0.11268234252929688, -0.10518836975097656, -0.09769439697265625, -0.09020042419433594, -0.08270645141601562, -0.07521247863769531, -0.067718505859375, -0.06022453308105469, -0.052730560302734375, -0.04523658752441406, -0.03774261474609375, -0.030248641967773438, -0.022754669189453125, -0.015260696411132812, -0.0077667236328125, -0.0002727508544921875, 0.007221221923828125, 0.014715194702148438, 0.02220916748046875, 0.029703140258789062, 0.037197113037109375, 0.04469108581542969, 0.05218505859375, 0.05967903137207031, 0.06717300415039062, 0.07466697692871094, 0.08216094970703125, 0.08965492248535156, 0.09714889526367188, 0.10464286804199219, 0.1121368408203125, 0.11963081359863281, 0.12712478637695312, 0.13461875915527344, 0.14211273193359375, 0.14960670471191406, 0.15710067749023438, 0.1645946502685547, 0.172088623046875, 0.1795825958251953, 0.18707656860351562, 0.19457054138183594, 0.20206451416015625, 0.20955848693847656, 0.21705245971679688, 0.2245464324951172, 0.2320404052734375, 0.2395343780517578, 0.24702835083007812, 0.25452232360839844, 0.26201629638671875, 0.26951026916503906, 0.2770042419433594, 0.2844982147216797, 0.2919921875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 18.0, 17.0, 27.0, 16.0, 23.0, 25.0, 41.0, 26.0, 50.0, 58.0, 47.0, 53.0, 62.0, 71.0, 58.0, 40.0, 45.0, 51.0, 34.0, 36.0, 31.0, 28.0, 23.0, 20.0, 24.0, 18.0, 12.0, 10.0, 5.0, 3.0, 5.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052737236022949, -1.9824645519256592, -1.9121919870376587, -1.8419193029403687, -1.7716466188430786, -1.7013740539550781, -1.631101369857788, -1.560828685760498, -1.490556001663208, -1.420283317565918, -1.3500107526779175, -1.2797380685806274, -1.2094653844833374, -1.139192819595337, -1.0689201354980469, -0.9986474514007568, -0.9283748865127563, -0.8581022620201111, -0.787829577922821, -0.7175569534301758, -0.6472842693328857, -0.5770116448402405, -0.5067390203475952, -0.43646636605262756, -0.3661937117576599, -0.29592105746269226, -0.2256484180688858, -0.15537577867507935, -0.0851031243801117, -0.014830470085144043, 0.05544215440750122, 0.12571480870246887, 0.19598746299743652, 0.2662601172924042, 0.3365327715873718, 0.4068053960800171, 0.47707805037498474, 0.5473507046699524, 0.6176233291625977, 0.6878960132598877, 0.758168637752533, 0.8284412622451782, 0.8987139463424683, 0.9689865708351135, 1.0392591953277588, 1.1095318794250488, 1.1798045635223389, 1.2500771284103394, 1.3203498125076294, 1.3906224966049194, 1.46089506149292, 1.53116774559021, 1.6014404296875, 1.67171311378479, 1.7419856786727905, 1.8122583627700806, 1.882530927658081, 1.952803611755371, 2.023076295852661, 2.093348979949951, 2.163621425628662, 2.233894109725952, 2.304166793823242, 2.3744394779205322, 2.4447121620178223]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 10.0, 8.0, 7.0, 18.0, 9.0, 21.0, 15.0, 27.0, 24.0, 26.0, 31.0, 35.0, 28.0, 39.0, 49.0, 44.0, 54.0, 34.0, 40.0, 41.0, 37.0, 48.0, 31.0, 43.0, 36.0, 32.0, 33.0, 25.0, 25.0, 21.0, 19.0, 11.0, 16.0, 7.0, 10.0, 10.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6441646814346313, -1.5958521366119385, -1.547539472579956, -1.4992269277572632, -1.4509143829345703, -1.4026018381118774, -1.3542892932891846, -1.3059766292572021, -1.2576640844345093, -1.2093515396118164, -1.161038875579834, -1.1127263307571411, -1.0644137859344482, -1.0161012411117554, -0.9677886366844177, -0.9194760322570801, -0.8711634874343872, -0.8228509426116943, -0.7745383381843567, -0.726225733757019, -0.6779131889343262, -0.6296006441116333, -0.5812880396842957, -0.532975435256958, -0.48466289043426514, -0.4363503158092499, -0.3880377411842346, -0.33972516655921936, -0.2914125919342041, -0.24310001730918884, -0.19478744268417358, -0.14647486805915833, -0.09816241264343262, -0.04984983801841736, -0.0015372633934020996, 0.04677531123161316, 0.09508788585662842, 0.14340046048164368, 0.19171303510665894, 0.2400256097316742, 0.28833818435668945, 0.3366507589817047, 0.38496333360671997, 0.43327590823173523, 0.4815884828567505, 0.5299010276794434, 0.578213632106781, 0.6265262365341187, 0.6748387813568115, 0.7231513261795044, 0.771463930606842, 0.8197765350341797, 0.8680890798568726, 0.9164016246795654, 0.9647142291069031, 1.0130268335342407, 1.0613393783569336, 1.1096519231796265, 1.1579644680023193, 1.2062771320343018, 1.2545896768569946, 1.3029022216796875, 1.35121488571167, 1.3995274305343628, 1.4478399753570557]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 16.0, 31.0, 52.0, 80.0, 104.0, 179.0, 311.0, 472.0, 780.0, 1244.0, 2147.0, 3646.0, 6049.0, 10341.0, 17374.0, 29901.0, 51538.0, 86344.0, 140587.0, 222680.0, 327754.0, 445322.0, 538683.0, 567637.0, 519751.0, 415012.0, 299586.0, 199195.0, 124863.0, 75576.0, 44861.0, 26159.0, 15083.0, 8728.0, 5065.0, 2967.0, 1662.0, 995.0, 599.0, 335.0, 211.0, 132.0, 92.0, 46.0, 30.0, 17.0, 17.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003570556640625, -1.549346923828125, -1.4983367919921875, -1.44732666015625, -1.3963165283203125, -1.345306396484375, -1.2942962646484375, -1.2432861328125, -1.1922760009765625, -1.141265869140625, -1.0902557373046875, -1.03924560546875, -0.9882354736328125, -0.937225341796875, -0.8862152099609375, -0.835205078125, -0.7841949462890625, -0.733184814453125, -0.6821746826171875, -0.63116455078125, -0.5801544189453125, -0.529144287109375, -0.4781341552734375, -0.4271240234375, -0.3761138916015625, -0.325103759765625, -0.2740936279296875, -0.22308349609375, -0.1720733642578125, -0.121063232421875, -0.0700531005859375, -0.01904296875, 0.0319671630859375, 0.082977294921875, 0.1339874267578125, 0.18499755859375, 0.2360076904296875, 0.287017822265625, 0.3380279541015625, 0.3890380859375, 0.4400482177734375, 0.491058349609375, 0.5420684814453125, 0.59307861328125, 0.6440887451171875, 0.695098876953125, 0.7461090087890625, 0.797119140625, 0.8481292724609375, 0.899139404296875, 0.9501495361328125, 1.00115966796875, 1.0521697998046875, 1.103179931640625, 1.1541900634765625, 1.2052001953125, 1.2562103271484375, 1.307220458984375, 1.3582305908203125, 1.40924072265625, 1.4602508544921875, 1.511260986328125, 1.5622711181640625, 1.61328125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 9.0, 11.0, 6.0, 15.0, 13.0, 16.0, 15.0, 27.0, 22.0, 28.0, 35.0, 32.0, 37.0, 40.0, 41.0, 39.0, 31.0, 37.0, 44.0, 42.0, 40.0, 37.0, 38.0, 35.0, 44.0, 25.0, 24.0, 23.0, 26.0, 25.0, 13.0, 12.0, 17.0, 18.0, 14.0, 5.0, 7.0, 5.0, 4.0, 8.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3056640625, -1.2673187255859375, -1.228973388671875, -1.1906280517578125, -1.15228271484375, -1.1139373779296875, -1.075592041015625, -1.0372467041015625, -0.9989013671875, -0.9605560302734375, -0.922210693359375, -0.8838653564453125, -0.84552001953125, -0.8071746826171875, -0.768829345703125, -0.7304840087890625, -0.692138671875, -0.6537933349609375, -0.615447998046875, -0.5771026611328125, -0.53875732421875, -0.5004119873046875, -0.462066650390625, -0.4237213134765625, -0.3853759765625, -0.3470306396484375, -0.308685302734375, -0.2703399658203125, -0.23199462890625, -0.1936492919921875, -0.155303955078125, -0.1169586181640625, -0.07861328125, -0.0402679443359375, -0.001922607421875, 0.0364227294921875, 0.07476806640625, 0.1131134033203125, 0.151458740234375, 0.1898040771484375, 0.2281494140625, 0.2664947509765625, 0.304840087890625, 0.3431854248046875, 0.38153076171875, 0.4198760986328125, 0.458221435546875, 0.4965667724609375, 0.534912109375, 0.5732574462890625, 0.611602783203125, 0.6499481201171875, 0.68829345703125, 0.7266387939453125, 0.764984130859375, 0.8033294677734375, 0.8416748046875, 0.8800201416015625, 0.918365478515625, 0.9567108154296875, 0.99505615234375, 1.0334014892578125, 1.071746826171875, 1.1100921630859375, 1.1484375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 17.0, 29.0, 42.0, 73.0, 120.0, 215.0, 351.0, 556.0, 932.0, 1594.0, 2777.0, 4568.0, 8097.0, 13402.0, 22683.0, 38392.0, 62227.0, 100217.0, 154234.0, 226711.0, 314267.0, 402179.0, 472768.0, 500720.0, 478665.0, 410040.0, 321211.0, 232322.0, 158581.0, 103429.0, 64824.0, 39677.0, 24078.0, 14092.0, 8348.0, 4799.0, 2918.0, 1680.0, 1009.0, 549.0, 338.0, 224.0, 133.0, 85.0, 49.0, 17.0, 13.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6858062744140625, -1.632354736328125, -1.5789031982421875, -1.52545166015625, -1.4720001220703125, -1.418548583984375, -1.3650970458984375, -1.3116455078125, -1.2581939697265625, -1.204742431640625, -1.1512908935546875, -1.09783935546875, -1.0443878173828125, -0.990936279296875, -0.9374847412109375, -0.884033203125, -0.8305816650390625, -0.777130126953125, -0.7236785888671875, -0.67022705078125, -0.6167755126953125, -0.563323974609375, -0.5098724365234375, -0.4564208984375, -0.4029693603515625, -0.349517822265625, -0.2960662841796875, -0.24261474609375, -0.1891632080078125, -0.135711669921875, -0.0822601318359375, -0.02880859375, 0.0246429443359375, 0.078094482421875, 0.1315460205078125, 0.18499755859375, 0.2384490966796875, 0.291900634765625, 0.3453521728515625, 0.3988037109375, 0.4522552490234375, 0.505706787109375, 0.5591583251953125, 0.61260986328125, 0.6660614013671875, 0.719512939453125, 0.7729644775390625, 0.826416015625, 0.8798675537109375, 0.933319091796875, 0.9867706298828125, 1.04022216796875, 1.0936737060546875, 1.147125244140625, 1.2005767822265625, 1.2540283203125, 1.3074798583984375, 1.360931396484375, 1.4143829345703125, 1.46783447265625, 1.5212860107421875, 1.574737548828125, 1.6281890869140625, 1.681640625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 12.0, 10.0, 6.0, 27.0, 34.0, 30.0, 34.0, 60.0, 67.0, 84.0, 118.0, 136.0, 149.0, 142.0, 168.0, 206.0, 203.0, 215.0, 216.0, 240.0, 238.0, 212.0, 217.0, 170.0, 155.0, 151.0, 142.0, 147.0, 105.0, 80.0, 63.0, 57.0, 44.0, 42.0, 29.0, 12.0, 17.0, 5.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7265853881835938, -0.7026824951171875, -0.6787796020507812, -0.654876708984375, -0.6309738159179688, -0.6070709228515625, -0.5831680297851562, -0.55926513671875, -0.5353622436523438, -0.5114593505859375, -0.48755645751953125, -0.463653564453125, -0.43975067138671875, -0.4158477783203125, -0.39194488525390625, -0.3680419921875, -0.34413909912109375, -0.3202362060546875, -0.29633331298828125, -0.272430419921875, -0.24852752685546875, -0.2246246337890625, -0.20072174072265625, -0.17681884765625, -0.15291595458984375, -0.1290130615234375, -0.10511016845703125, -0.081207275390625, -0.05730438232421875, -0.0334014892578125, -0.00949859619140625, 0.014404296875, 0.03830718994140625, 0.0622100830078125, 0.08611297607421875, 0.110015869140625, 0.13391876220703125, 0.1578216552734375, 0.18172454833984375, 0.20562744140625, 0.22953033447265625, 0.2534332275390625, 0.27733612060546875, 0.301239013671875, 0.32514190673828125, 0.3490447998046875, 0.37294769287109375, 0.3968505859375, 0.42075347900390625, 0.4446563720703125, 0.46855926513671875, 0.492462158203125, 0.5163650512695312, 0.5402679443359375, 0.5641708374023438, 0.58807373046875, 0.6119766235351562, 0.6358795166015625, 0.6597824096679688, 0.683685302734375, 0.7075881958007812, 0.7314910888671875, 0.7553939819335938, 0.779296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 13.0, 17.0, 9.0, 28.0, 33.0, 22.0, 31.0, 34.0, 48.0, 62.0, 64.0, 61.0, 71.0, 49.0, 55.0, 50.0, 66.0, 49.0, 39.0, 40.0, 28.0, 27.0, 23.0, 13.0, 15.0, 13.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.804446220397949, -2.719447135925293, -2.6344478130340576, -2.5494487285614014, -2.464449644088745, -2.3794503211975098, -2.2944512367248535, -2.2094521522521973, -2.124453067779541, -2.0394539833068848, -1.954454779624939, -1.8694555759429932, -1.784456491470337, -1.6994572877883911, -1.6144580841064453, -1.529458999633789, -1.4444596767425537, -1.359460473060608, -1.2744613885879517, -1.1894621849060059, -1.1044631004333496, -1.0194638967514038, -0.934464693069458, -0.849465548992157, -0.764466404914856, -0.6794672608375549, -0.5944681167602539, -0.5094689130783081, -0.4244697690010071, -0.33947062492370605, -0.25447142124176025, -0.16947227716445923, -0.0844733715057373, 0.0005257874727249146, 0.08552494645118713, 0.17052412033081055, 0.2555232644081116, 0.3405224084854126, 0.4255216121673584, 0.5105207562446594, 0.5955199003219604, 0.6805190443992615, 0.7655181884765625, 0.8505173921585083, 0.9355165362358093, 1.0205156803131104, 1.1055148839950562, 1.190514087677002, 1.2755131721496582, 1.360512375831604, 1.4455114603042603, 1.530510663986206, 1.6155097484588623, 1.700508952140808, 1.785508155822754, 1.8705072402954102, 1.955506443977356, 2.0405056476593018, 2.125504732131958, 2.2105040550231934, 2.2955031394958496, 2.380502223968506, 2.465501308441162, 2.5505006313323975, 2.6354997158050537]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 12.0, 9.0, 10.0, 15.0, 18.0, 14.0, 23.0, 21.0, 30.0, 21.0, 36.0, 36.0, 27.0, 31.0, 42.0, 49.0, 43.0, 33.0, 42.0, 44.0, 42.0, 34.0, 46.0, 35.0, 35.0, 28.0, 24.0, 29.0, 25.0, 21.0, 18.0, 19.0, 14.0, 6.0, 8.0, 8.0, 3.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6612660884857178, -1.6119011640548706, -1.5625362396240234, -1.5131713151931763, -1.463806390762329, -1.414441466331482, -1.3650765419006348, -1.3157117366790771, -1.2663466930389404, -1.2169817686080933, -1.167616844177246, -1.118251919746399, -1.0688869953155518, -1.0195220708847046, -0.9701572060585022, -0.920792281627655, -0.8714274168014526, -0.8220624923706055, -0.7726975679397583, -0.7233326435089111, -0.673967719078064, -0.6246027946472168, -0.5752379298210144, -0.5258730053901672, -0.47650808095932007, -0.4271431565284729, -0.37777823209762573, -0.32841333746910095, -0.2790484130382538, -0.22968348860740662, -0.18031859397888184, -0.13095366954803467, -0.08158862590789795, -0.03222370892763138, 0.017141208052635193, 0.06650611758232117, 0.11587104201316833, 0.1652359664440155, 0.21460086107254028, 0.26396578550338745, 0.3133307099342346, 0.3626956343650818, 0.41206055879592896, 0.46142545342445374, 0.5107903480529785, 0.5601552724838257, 0.6095201969146729, 0.65888512134552, 0.7082500457763672, 0.7576149702072144, 0.8069798946380615, 0.8563448190689087, 0.9057097434997559, 0.955074667930603, 1.0044395923614502, 1.0538043975830078, 1.1031694412231445, 1.1525343656539917, 1.2018992900848389, 1.251264214515686, 1.3006291389465332, 1.3499940633773804, 1.3993589878082275, 1.4487237930297852, 1.4980887174606323]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 14.0, 12.0, 23.0, 38.0, 53.0, 72.0, 121.0, 181.0, 308.0, 468.0, 734.0, 1318.0, 2311.0, 4126.0, 7945.0, 15267.0, 29808.0, 56438.0, 105028.0, 179337.0, 231757.0, 182776.0, 108068.0, 57877.0, 30468.0, 15650.0, 8120.0, 4429.0, 2416.0, 1325.0, 769.0, 482.0, 291.0, 173.0, 97.0, 68.0, 58.0, 43.0, 17.0, 19.0, 15.0, 10.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5322265625, -0.5141983032226562, -0.4961700439453125, -0.47814178466796875, -0.460113525390625, -0.44208526611328125, -0.4240570068359375, -0.40602874755859375, -0.38800048828125, -0.36997222900390625, -0.3519439697265625, -0.33391571044921875, -0.315887451171875, -0.29785919189453125, -0.2798309326171875, -0.26180267333984375, -0.2437744140625, -0.22574615478515625, -0.2077178955078125, -0.18968963623046875, -0.171661376953125, -0.15363311767578125, -0.1356048583984375, -0.11757659912109375, -0.09954833984375, -0.08152008056640625, -0.0634918212890625, -0.04546356201171875, -0.027435302734375, -0.00940704345703125, 0.0086212158203125, 0.02664947509765625, 0.044677734375, 0.06270599365234375, 0.0807342529296875, 0.09876251220703125, 0.116790771484375, 0.13481903076171875, 0.1528472900390625, 0.17087554931640625, 0.18890380859375, 0.20693206787109375, 0.2249603271484375, 0.24298858642578125, 0.261016845703125, 0.27904510498046875, 0.2970733642578125, 0.31510162353515625, 0.3331298828125, 0.35115814208984375, 0.3691864013671875, 0.38721466064453125, 0.405242919921875, 0.42327117919921875, 0.4412994384765625, 0.45932769775390625, 0.47735595703125, 0.49538421630859375, 0.5134124755859375, 0.5314407348632812, 0.549468994140625, 0.5674972534179688, 0.5855255126953125, 0.6035537719726562, 0.62158203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 20.0, 15.0, 19.0, 23.0, 22.0, 34.0, 30.0, 34.0, 26.0, 32.0, 35.0, 37.0, 37.0, 40.0, 47.0, 39.0, 45.0, 38.0, 40.0, 30.0, 33.0, 33.0, 29.0, 26.0, 20.0, 30.0, 14.0, 19.0, 26.0, 14.0, 5.0, 12.0, 10.0, 7.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.587890625, -1.536163330078125, -1.48443603515625, -1.432708740234375, -1.3809814453125, -1.329254150390625, -1.27752685546875, -1.225799560546875, -1.174072265625, -1.122344970703125, -1.07061767578125, -1.018890380859375, -0.9671630859375, -0.915435791015625, -0.86370849609375, -0.811981201171875, -0.76025390625, -0.708526611328125, -0.65679931640625, -0.605072021484375, -0.5533447265625, -0.501617431640625, -0.44989013671875, -0.398162841796875, -0.346435546875, -0.294708251953125, -0.24298095703125, -0.191253662109375, -0.1395263671875, -0.087799072265625, -0.03607177734375, 0.015655517578125, 0.0673828125, 0.119110107421875, 0.17083740234375, 0.222564697265625, 0.2742919921875, 0.326019287109375, 0.37774658203125, 0.429473876953125, 0.481201171875, 0.532928466796875, 0.58465576171875, 0.636383056640625, 0.6881103515625, 0.739837646484375, 0.79156494140625, 0.843292236328125, 0.89501953125, 0.946746826171875, 0.99847412109375, 1.050201416015625, 1.1019287109375, 1.153656005859375, 1.20538330078125, 1.257110595703125, 1.308837890625, 1.360565185546875, 1.41229248046875, 1.464019775390625, 1.5157470703125, 1.567474365234375, 1.61920166015625, 1.670928955078125, 1.72265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 9.0, 11.0, 11.0, 25.0, 28.0, 34.0, 53.0, 74.0, 120.0, 184.0, 246.0, 363.0, 602.0, 935.0, 1483.0, 2676.0, 4663.0, 9102.0, 17957.0, 36978.0, 79615.0, 163223.0, 261603.0, 228074.0, 124296.0, 58646.0, 27684.0, 13572.0, 6828.0, 3792.0, 2123.0, 1329.0, 766.0, 462.0, 319.0, 200.0, 126.0, 87.0, 61.0, 55.0, 46.0, 34.0, 18.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5990371704101562, -0.5789337158203125, -0.5588302612304688, -0.538726806640625, -0.5186233520507812, -0.4985198974609375, -0.47841644287109375, -0.45831298828125, -0.43820953369140625, -0.4181060791015625, -0.39800262451171875, -0.377899169921875, -0.35779571533203125, -0.3376922607421875, -0.31758880615234375, -0.2974853515625, -0.27738189697265625, -0.2572784423828125, -0.23717498779296875, -0.217071533203125, -0.19696807861328125, -0.1768646240234375, -0.15676116943359375, -0.13665771484375, -0.11655426025390625, -0.0964508056640625, -0.07634735107421875, -0.056243896484375, -0.03614044189453125, -0.0160369873046875, 0.00406646728515625, 0.024169921875, 0.04427337646484375, 0.0643768310546875, 0.08448028564453125, 0.104583740234375, 0.12468719482421875, 0.1447906494140625, 0.16489410400390625, 0.18499755859375, 0.20510101318359375, 0.2252044677734375, 0.24530792236328125, 0.265411376953125, 0.28551483154296875, 0.3056182861328125, 0.32572174072265625, 0.3458251953125, 0.36592864990234375, 0.3860321044921875, 0.40613555908203125, 0.426239013671875, 0.44634246826171875, 0.4664459228515625, 0.48654937744140625, 0.50665283203125, 0.5267562866210938, 0.5468597412109375, 0.5669631958007812, 0.587066650390625, 0.6071701049804688, 0.6272735595703125, 0.6473770141601562, 0.66748046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 11.0, 8.0, 16.0, 14.0, 15.0, 22.0, 28.0, 22.0, 23.0, 30.0, 28.0, 35.0, 35.0, 62.0, 38.0, 39.0, 52.0, 42.0, 52.0, 42.0, 41.0, 39.0, 41.0, 34.0, 24.0, 33.0, 23.0, 21.0, 23.0, 14.0, 19.0, 16.0, 7.0, 14.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -0.99884033203125, -0.9635009765625, -0.92816162109375, -0.892822265625, -0.85748291015625, -0.8221435546875, -0.78680419921875, -0.75146484375, -0.71612548828125, -0.6807861328125, -0.64544677734375, -0.610107421875, -0.57476806640625, -0.5394287109375, -0.50408935546875, -0.46875, -0.43341064453125, -0.3980712890625, -0.36273193359375, -0.327392578125, -0.29205322265625, -0.2567138671875, -0.22137451171875, -0.18603515625, -0.15069580078125, -0.1153564453125, -0.08001708984375, -0.044677734375, -0.00933837890625, 0.0260009765625, 0.06134033203125, 0.0966796875, 0.13201904296875, 0.1673583984375, 0.20269775390625, 0.238037109375, 0.27337646484375, 0.3087158203125, 0.34405517578125, 0.37939453125, 0.41473388671875, 0.4500732421875, 0.48541259765625, 0.520751953125, 0.55609130859375, 0.5914306640625, 0.62677001953125, 0.662109375, 0.69744873046875, 0.7327880859375, 0.76812744140625, 0.803466796875, 0.83880615234375, 0.8741455078125, 0.90948486328125, 0.94482421875, 0.98016357421875, 1.0155029296875, 1.05084228515625, 1.086181640625, 1.12152099609375, 1.1568603515625, 1.19219970703125, 1.2275390625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 7.0, 7.0, 6.0, 6.0, 13.0, 16.0, 19.0, 22.0, 49.0, 57.0, 61.0, 68.0, 98.0, 142.0, 179.0, 253.0, 331.0, 470.0, 718.0, 1055.0, 1608.0, 2597.0, 4691.0, 8932.0, 19480.0, 54137.0, 201674.0, 482523.0, 181015.0, 49612.0, 18402.0, 8207.0, 4572.0, 2545.0, 1480.0, 1001.0, 698.0, 479.0, 363.0, 221.0, 176.0, 157.0, 118.0, 77.0, 53.0, 48.0, 22.0, 27.0, 17.0, 14.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.33349609375, -0.32254791259765625, -0.3115997314453125, -0.30065155029296875, -0.289703369140625, -0.27875518798828125, -0.2678070068359375, -0.25685882568359375, -0.24591064453125, -0.23496246337890625, -0.2240142822265625, -0.21306610107421875, -0.202117919921875, -0.19116973876953125, -0.1802215576171875, -0.16927337646484375, -0.1583251953125, -0.14737701416015625, -0.1364288330078125, -0.12548065185546875, -0.114532470703125, -0.10358428955078125, -0.0926361083984375, -0.08168792724609375, -0.07073974609375, -0.05979156494140625, -0.0488433837890625, -0.03789520263671875, -0.026947021484375, -0.01599884033203125, -0.0050506591796875, 0.00589752197265625, 0.016845703125, 0.02779388427734375, 0.0387420654296875, 0.04969024658203125, 0.060638427734375, 0.07158660888671875, 0.0825347900390625, 0.09348297119140625, 0.10443115234375, 0.11537933349609375, 0.1263275146484375, 0.13727569580078125, 0.148223876953125, 0.15917205810546875, 0.1701202392578125, 0.18106842041015625, 0.1920166015625, 0.20296478271484375, 0.2139129638671875, 0.22486114501953125, 0.235809326171875, 0.24675750732421875, 0.2577056884765625, 0.26865386962890625, 0.27960205078125, 0.29055023193359375, 0.3014984130859375, 0.31244659423828125, 0.323394775390625, 0.33434295654296875, 0.3452911376953125, 0.35623931884765625, 0.3671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 10.0, 6.0, 9.0, 11.0, 9.0, 14.0, 14.0, 15.0, 35.0, 35.0, 32.0, 35.0, 42.0, 36.0, 56.0, 34.0, 48.0, 43.0, 43.0, 57.0, 41.0, 41.0, 35.0, 42.0, 40.0, 37.0, 23.0, 23.0, 15.0, 21.0, 14.0, 11.0, 9.0, 10.0, 13.0, 7.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.049041748046875e-05, -1.0143034160137177e-05, -9.795650839805603e-06, -9.44826751947403e-06, -9.100884199142456e-06, -8.753500878810883e-06, -8.406117558479309e-06, -8.058734238147736e-06, -7.711350917816162e-06, -7.363967597484589e-06, -7.016584277153015e-06, -6.669200956821442e-06, -6.321817636489868e-06, -5.974434316158295e-06, -5.627050995826721e-06, -5.279667675495148e-06, -4.932284355163574e-06, -4.584901034832001e-06, -4.237517714500427e-06, -3.890134394168854e-06, -3.5427510738372803e-06, -3.1953677535057068e-06, -2.8479844331741333e-06, -2.50060111284256e-06, -2.1532177925109863e-06, -1.8058344721794128e-06, -1.4584511518478394e-06, -1.1110678315162659e-06, -7.636845111846924e-07, -4.163011908531189e-07, -6.891787052154541e-08, 2.784654498100281e-07, 6.258487701416016e-07, 9.73232090473175e-07, 1.3206154108047485e-06, 1.667998731136322e-06, 2.0153820514678955e-06, 2.362765371799469e-06, 2.7101486921310425e-06, 3.057532012462616e-06, 3.4049153327941895e-06, 3.752298653125763e-06, 4.0996819734573364e-06, 4.44706529378891e-06, 4.794448614120483e-06, 5.141831934452057e-06, 5.48921525478363e-06, 5.836598575115204e-06, 6.183981895446777e-06, 6.531365215778351e-06, 6.878748536109924e-06, 7.226131856441498e-06, 7.573515176773071e-06, 7.920898497104645e-06, 8.268281817436218e-06, 8.615665137767792e-06, 8.963048458099365e-06, 9.310431778430939e-06, 9.657815098762512e-06, 1.0005198419094086e-05, 1.035258173942566e-05, 1.0699965059757233e-05, 1.1047348380088806e-05, 1.139473170042038e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 27.0, 18.0, 42.0, 53.0, 85.0, 121.0, 199.0, 227.0, 386.0, 571.0, 860.0, 1284.0, 2241.0, 4135.0, 8937.0, 22001.0, 67106.0, 226908.0, 433895.0, 188161.0, 55375.0, 18818.0, 7780.0, 3694.0, 1961.0, 1204.0, 713.0, 552.0, 357.0, 253.0, 169.0, 126.0, 68.0, 61.0, 48.0, 24.0, 17.0, 11.0, 10.0, 10.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5, -0.48503875732421875, -0.4700775146484375, -0.45511627197265625, -0.440155029296875, -0.42519378662109375, -0.4102325439453125, -0.39527130126953125, -0.38031005859375, -0.36534881591796875, -0.3503875732421875, -0.33542633056640625, -0.320465087890625, -0.30550384521484375, -0.2905426025390625, -0.27558135986328125, -0.2606201171875, -0.24565887451171875, -0.2306976318359375, -0.21573638916015625, -0.200775146484375, -0.18581390380859375, -0.1708526611328125, -0.15589141845703125, -0.14093017578125, -0.12596893310546875, -0.1110076904296875, -0.09604644775390625, -0.081085205078125, -0.06612396240234375, -0.0511627197265625, -0.03620147705078125, -0.021240234375, -0.00627899169921875, 0.0086822509765625, 0.02364349365234375, 0.038604736328125, 0.05356597900390625, 0.0685272216796875, 0.08348846435546875, 0.09844970703125, 0.11341094970703125, 0.1283721923828125, 0.14333343505859375, 0.158294677734375, 0.17325592041015625, 0.1882171630859375, 0.20317840576171875, 0.2181396484375, 0.23310089111328125, 0.2480621337890625, 0.26302337646484375, 0.277984619140625, 0.29294586181640625, 0.3079071044921875, 0.32286834716796875, 0.33782958984375, 0.35279083251953125, 0.3677520751953125, 0.38271331787109375, 0.397674560546875, 0.41263580322265625, 0.4275970458984375, 0.44255828857421875, 0.45751953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 6.0, 13.0, 7.0, 19.0, 29.0, 37.0, 70.0, 85.0, 147.0, 130.0, 124.0, 95.0, 69.0, 41.0, 33.0, 21.0, 17.0, 21.0, 4.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.12743854522705078, -0.12365150451660156, -0.11986446380615234, -0.11607742309570312, -0.1122903823852539, -0.10850334167480469, -0.10471630096435547, -0.10092926025390625, -0.09714221954345703, -0.09335517883300781, -0.0895681381225586, -0.08578109741210938, -0.08199405670166016, -0.07820701599121094, -0.07441997528076172, -0.0706329345703125, -0.06684589385986328, -0.06305885314941406, -0.059271812438964844, -0.055484771728515625, -0.051697731018066406, -0.04791069030761719, -0.04412364959716797, -0.04033660888671875, -0.03654956817626953, -0.03276252746582031, -0.028975486755371094, -0.025188446044921875, -0.021401405334472656, -0.017614364624023438, -0.013827323913574219, -0.010040283203125, -0.006253242492675781, -0.0024662017822265625, 0.0013208389282226562, 0.005107879638671875, 0.008894920349121094, 0.012681961059570312, 0.01646900177001953, 0.02025604248046875, 0.02404308319091797, 0.027830123901367188, 0.031617164611816406, 0.035404205322265625, 0.039191246032714844, 0.04297828674316406, 0.04676532745361328, 0.0505523681640625, 0.05433940887451172, 0.05812644958496094, 0.061913490295410156, 0.06570053100585938, 0.0694875717163086, 0.07327461242675781, 0.07706165313720703, 0.08084869384765625, 0.08463573455810547, 0.08842277526855469, 0.0922098159790039, 0.09599685668945312, 0.09978389739990234, 0.10357093811035156, 0.10735797882080078, 0.11114501953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 15.0, 15.0, 26.0, 32.0, 17.0, 39.0, 36.0, 53.0, 71.0, 64.0, 69.0, 63.0, 46.0, 53.0, 58.0, 55.0, 50.0, 39.0, 35.0, 33.0, 21.0, 21.0, 11.0, 13.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8028035163879395, -2.7170827388763428, -2.631361961364746, -2.5456411838531494, -2.4599204063415527, -2.374199628829956, -2.2884788513183594, -2.202758312225342, -2.117037296295166, -2.0313165187835693, -1.9455957412719727, -1.859874963760376, -1.7741541862487793, -1.6884334087371826, -1.6027127504348755, -1.5169919729232788, -1.4312713146209717, -1.345550537109375, -1.2598297595977783, -1.1741089820861816, -1.088388204574585, -1.0026674270629883, -0.9169467687606812, -0.8312259912490845, -0.7455052137374878, -0.6597844362258911, -0.5740636587142944, -0.48834294080734253, -0.40262216329574585, -0.31690138578414917, -0.23118066787719727, -0.14545989036560059, -0.059739112854003906, 0.02598164975643158, 0.11170241236686707, 0.19742316007614136, 0.28314393758773804, 0.3688647150993347, 0.4545854330062866, 0.5403062105178833, 0.62602698802948, 0.7117477655410767, 0.7974685430526733, 0.8831892609596252, 0.9689100384712219, 1.0546307563781738, 1.1403515338897705, 1.2260723114013672, 1.3117930889129639, 1.3975138664245605, 1.4832346439361572, 1.568955421447754, 1.6546761989593506, 1.7403969764709473, 1.8261176347732544, 1.911838412284851, 1.9975591897964478, 2.083279848098755, 2.1690006256103516, 2.2547214031219482, 2.340442180633545, 2.4261629581451416, 2.5118837356567383, 2.597604513168335, 2.6833252906799316]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 21.0, 23.0, 23.0, 28.0, 29.0, 42.0, 27.0, 33.0, 39.0, 48.0, 47.0, 29.0, 47.0, 48.0, 28.0, 41.0, 49.0, 36.0, 32.0, 34.0, 17.0, 34.0, 21.0, 20.0, 21.0, 19.0, 10.0, 8.0, 9.0, 6.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6686097383499146, -1.6190205812454224, -1.5694313049316406, -1.5198421478271484, -1.4702529907226562, -1.4206637144088745, -1.3710745573043823, -1.3214852809906006, -1.2718961238861084, -1.2223069667816162, -1.1727176904678345, -1.1231285333633423, -1.0735392570495605, -1.0239500999450684, -0.9743609428405762, -0.9247717261314392, -0.8751825094223022, -0.8255932927131653, -0.7760040760040283, -0.7264149188995361, -0.6768257021903992, -0.6272364854812622, -0.57764732837677, -0.5280581116676331, -0.4784688949584961, -0.42887967824935913, -0.37929049134254456, -0.32970130443573, -0.280112087726593, -0.23052288591861725, -0.18093368411064148, -0.1313444972038269, -0.08175528049468994, -0.03216607868671417, 0.017423123121261597, 0.06701232492923737, 0.11660152673721313, 0.1661907285451889, 0.21577993035316467, 0.26536911725997925, 0.3149583339691162, 0.3645475506782532, 0.41413673758506775, 0.4637259244918823, 0.5133151412010193, 0.5629043579101562, 0.6124935150146484, 0.6620827317237854, 0.7116719484329224, 0.7612611651420593, 0.8108503818511963, 0.8604395389556885, 0.9100287556648254, 0.9596179723739624, 1.0092071294784546, 1.0587964057922363, 1.1083855628967285, 1.1579747200012207, 1.2075639963150024, 1.2571531534194946, 1.3067424297332764, 1.3563315868377686, 1.4059207439422607, 1.455509901046753, 1.5050991773605347]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 16.0, 25.0, 37.0, 70.0, 107.0, 142.0, 226.0, 396.0, 625.0, 1031.0, 1565.0, 2541.0, 3896.0, 6096.0, 9060.0, 13846.0, 20351.0, 29148.0, 39452.0, 52889.0, 66788.0, 80266.0, 91485.0, 98529.0, 98322.0, 92410.0, 82139.0, 68646.0, 54180.0, 40819.0, 29955.0, 21244.0, 14587.0, 9797.0, 6427.0, 4045.0, 2712.0, 1763.0, 1078.0, 691.0, 433.0, 243.0, 172.0, 116.0, 77.0, 39.0, 25.0, 22.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0188446044921875, -0.984954833984375, -0.9510650634765625, -0.91717529296875, -0.8832855224609375, -0.849395751953125, -0.8155059814453125, -0.7816162109375, -0.7477264404296875, -0.713836669921875, -0.6799468994140625, -0.64605712890625, -0.6121673583984375, -0.578277587890625, -0.5443878173828125, -0.510498046875, -0.4766082763671875, -0.442718505859375, -0.4088287353515625, -0.37493896484375, -0.3410491943359375, -0.307159423828125, -0.2732696533203125, -0.2393798828125, -0.2054901123046875, -0.171600341796875, -0.1377105712890625, -0.10382080078125, -0.0699310302734375, -0.036041259765625, -0.0021514892578125, 0.03173828125, 0.0656280517578125, 0.099517822265625, 0.1334075927734375, 0.16729736328125, 0.2011871337890625, 0.235076904296875, 0.2689666748046875, 0.3028564453125, 0.3367462158203125, 0.370635986328125, 0.4045257568359375, 0.43841552734375, 0.4723052978515625, 0.506195068359375, 0.5400848388671875, 0.573974609375, 0.6078643798828125, 0.641754150390625, 0.6756439208984375, 0.70953369140625, 0.7434234619140625, 0.777313232421875, 0.8112030029296875, 0.8450927734375, 0.8789825439453125, 0.912872314453125, 0.9467620849609375, 0.98065185546875, 1.0145416259765625, 1.048431396484375, 1.0823211669921875, 1.1162109375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 8.0, 10.0, 10.0, 14.0, 20.0, 23.0, 19.0, 22.0, 31.0, 34.0, 27.0, 40.0, 48.0, 38.0, 50.0, 43.0, 44.0, 55.0, 43.0, 44.0, 37.0, 42.0, 32.0, 31.0, 28.0, 34.0, 24.0, 24.0, 14.0, 15.0, 19.0, 17.0, 9.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9345703125, -1.8772125244140625, -1.819854736328125, -1.7624969482421875, -1.70513916015625, -1.6477813720703125, -1.590423583984375, -1.5330657958984375, -1.4757080078125, -1.4183502197265625, -1.360992431640625, -1.3036346435546875, -1.24627685546875, -1.1889190673828125, -1.131561279296875, -1.0742034912109375, -1.016845703125, -0.9594879150390625, -0.902130126953125, -0.8447723388671875, -0.78741455078125, -0.7300567626953125, -0.672698974609375, -0.6153411865234375, -0.5579833984375, -0.5006256103515625, -0.443267822265625, -0.3859100341796875, -0.32855224609375, -0.2711944580078125, -0.213836669921875, -0.1564788818359375, -0.09912109375, -0.0417633056640625, 0.015594482421875, 0.0729522705078125, 0.13031005859375, 0.1876678466796875, 0.245025634765625, 0.3023834228515625, 0.3597412109375, 0.4170989990234375, 0.474456787109375, 0.5318145751953125, 0.58917236328125, 0.6465301513671875, 0.703887939453125, 0.7612457275390625, 0.818603515625, 0.8759613037109375, 0.933319091796875, 0.9906768798828125, 1.04803466796875, 1.1053924560546875, 1.162750244140625, 1.2201080322265625, 1.2774658203125, 1.3348236083984375, 1.392181396484375, 1.4495391845703125, 1.50689697265625, 1.5642547607421875, 1.621612548828125, 1.6789703369140625, 1.736328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 26.0, 31.0, 64.0, 89.0, 140.0, 188.0, 310.0, 489.0, 766.0, 1134.0, 1903.0, 2869.0, 4493.0, 6856.0, 10342.0, 15388.0, 22428.0, 31941.0, 43266.0, 57743.0, 72693.0, 86664.0, 96855.0, 101445.0, 98873.0, 90408.0, 76969.0, 63033.0, 48504.0, 35833.0, 24916.0, 17667.0, 11958.0, 7671.0, 5072.0, 3315.0, 2268.0, 1367.0, 953.0, 630.0, 353.0, 239.0, 149.0, 86.0, 54.0, 32.0, 21.0, 20.0, 9.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-1.1435546875, -1.108551025390625, -1.07354736328125, -1.038543701171875, -1.0035400390625, -0.968536376953125, -0.93353271484375, -0.898529052734375, -0.863525390625, -0.828521728515625, -0.79351806640625, -0.758514404296875, -0.7235107421875, -0.688507080078125, -0.65350341796875, -0.618499755859375, -0.58349609375, -0.548492431640625, -0.51348876953125, -0.478485107421875, -0.4434814453125, -0.408477783203125, -0.37347412109375, -0.338470458984375, -0.303466796875, -0.268463134765625, -0.23345947265625, -0.198455810546875, -0.1634521484375, -0.128448486328125, -0.09344482421875, -0.058441162109375, -0.0234375, 0.011566162109375, 0.04656982421875, 0.081573486328125, 0.1165771484375, 0.151580810546875, 0.18658447265625, 0.221588134765625, 0.256591796875, 0.291595458984375, 0.32659912109375, 0.361602783203125, 0.3966064453125, 0.431610107421875, 0.46661376953125, 0.501617431640625, 0.53662109375, 0.571624755859375, 0.60662841796875, 0.641632080078125, 0.6766357421875, 0.711639404296875, 0.74664306640625, 0.781646728515625, 0.816650390625, 0.851654052734375, 0.88665771484375, 0.921661376953125, 0.9566650390625, 0.991668701171875, 1.02667236328125, 1.061676025390625, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 9.0, 15.0, 15.0, 14.0, 25.0, 24.0, 29.0, 30.0, 20.0, 26.0, 40.0, 48.0, 33.0, 40.0, 36.0, 39.0, 45.0, 58.0, 36.0, 41.0, 45.0, 37.0, 49.0, 46.0, 31.0, 30.0, 19.0, 20.0, 28.0, 13.0, 13.0, 9.0, 8.0, 6.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1130523681640625, -1.076690673828125, -1.0403289794921875, -1.00396728515625, -0.9676055908203125, -0.931243896484375, -0.8948822021484375, -0.8585205078125, -0.8221588134765625, -0.785797119140625, -0.7494354248046875, -0.71307373046875, -0.6767120361328125, -0.640350341796875, -0.6039886474609375, -0.567626953125, -0.5312652587890625, -0.494903564453125, -0.4585418701171875, -0.42218017578125, -0.3858184814453125, -0.349456787109375, -0.3130950927734375, -0.2767333984375, -0.2403717041015625, -0.204010009765625, -0.1676483154296875, -0.13128662109375, -0.0949249267578125, -0.058563232421875, -0.0222015380859375, 0.01416015625, 0.0505218505859375, 0.086883544921875, 0.1232452392578125, 0.15960693359375, 0.1959686279296875, 0.232330322265625, 0.2686920166015625, 0.3050537109375, 0.3414154052734375, 0.377777099609375, 0.4141387939453125, 0.45050048828125, 0.4868621826171875, 0.523223876953125, 0.5595855712890625, 0.595947265625, 0.6323089599609375, 0.668670654296875, 0.7050323486328125, 0.74139404296875, 0.7777557373046875, 0.814117431640625, 0.8504791259765625, 0.8868408203125, 0.9232025146484375, 0.959564208984375, 0.9959259033203125, 1.03228759765625, 1.0686492919921875, 1.105010986328125, 1.1413726806640625, 1.177734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 26.0, 14.0, 18.0, 29.0, 40.0, 55.0, 84.0, 155.0, 195.0, 365.0, 556.0, 951.0, 1644.0, 3090.0, 5693.0, 10394.0, 19512.0, 35968.0, 64015.0, 104060.0, 149177.0, 175861.0, 165834.0, 126548.0, 80438.0, 47252.0, 25694.0, 14114.0, 7355.0, 3912.0, 2306.0, 1224.0, 716.0, 423.0, 240.0, 181.0, 126.0, 75.0, 52.0, 35.0, 35.0, 16.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.91845703125, -0.8895111083984375, -0.860565185546875, -0.8316192626953125, -0.80267333984375, -0.7737274169921875, -0.744781494140625, -0.7158355712890625, -0.6868896484375, -0.6579437255859375, -0.628997802734375, -0.6000518798828125, -0.57110595703125, -0.5421600341796875, -0.513214111328125, -0.4842681884765625, -0.455322265625, -0.4263763427734375, -0.397430419921875, -0.3684844970703125, -0.33953857421875, -0.3105926513671875, -0.281646728515625, -0.2527008056640625, -0.2237548828125, -0.1948089599609375, -0.165863037109375, -0.1369171142578125, -0.10797119140625, -0.0790252685546875, -0.050079345703125, -0.0211334228515625, 0.0078125, 0.0367584228515625, 0.065704345703125, 0.0946502685546875, 0.12359619140625, 0.1525421142578125, 0.181488037109375, 0.2104339599609375, 0.2393798828125, 0.2683258056640625, 0.297271728515625, 0.3262176513671875, 0.35516357421875, 0.3841094970703125, 0.413055419921875, 0.4420013427734375, 0.470947265625, 0.4998931884765625, 0.528839111328125, 0.5577850341796875, 0.58673095703125, 0.6156768798828125, 0.644622802734375, 0.6735687255859375, 0.7025146484375, 0.7314605712890625, 0.760406494140625, 0.7893524169921875, 0.81829833984375, 0.8472442626953125, 0.876190185546875, 0.9051361083984375, 0.93408203125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 5.0, 3.0, 12.0, 16.0, 13.0, 24.0, 30.0, 39.0, 30.0, 42.0, 49.0, 52.0, 62.0, 66.0, 63.0, 75.0, 50.0, 67.0, 58.0, 51.0, 35.0, 39.0, 26.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.512901306152344e-05, -9.219907224178314e-05, -8.926913142204285e-05, -8.633919060230255e-05, -8.340924978256226e-05, -8.047930896282196e-05, -7.754936814308167e-05, -7.461942732334137e-05, -7.168948650360107e-05, -6.875954568386078e-05, -6.582960486412048e-05, -6.289966404438019e-05, -5.996972322463989e-05, -5.70397824048996e-05, -5.41098415851593e-05, -5.1179900765419006e-05, -4.824995994567871e-05, -4.5320019125938416e-05, -4.239007830619812e-05, -3.9460137486457825e-05, -3.653019666671753e-05, -3.3600255846977234e-05, -3.067031502723694e-05, -2.7740374207496643e-05, -2.4810433387756348e-05, -2.1880492568016052e-05, -1.8950551748275757e-05, -1.602061092853546e-05, -1.3090670108795166e-05, -1.016072928905487e-05, -7.230788469314575e-06, -4.30084764957428e-06, -1.3709068298339844e-06, 1.559033989906311e-06, 4.4889748096466064e-06, 7.418915629386902e-06, 1.0348856449127197e-05, 1.3278797268867493e-05, 1.6208738088607788e-05, 1.9138678908348083e-05, 2.206861972808838e-05, 2.4998560547828674e-05, 2.792850136756897e-05, 3.0858442187309265e-05, 3.378838300704956e-05, 3.6718323826789856e-05, 3.964826464653015e-05, 4.257820546627045e-05, 4.550814628601074e-05, 4.843808710575104e-05, 5.136802792549133e-05, 5.429796874523163e-05, 5.7227909564971924e-05, 6.015785038471222e-05, 6.308779120445251e-05, 6.601773202419281e-05, 6.89476728439331e-05, 7.18776136636734e-05, 7.48075544834137e-05, 7.773749530315399e-05, 8.066743612289429e-05, 8.359737694263458e-05, 8.652731776237488e-05, 8.945725858211517e-05, 9.238719940185547e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 5.0, 14.0, 18.0, 34.0, 54.0, 56.0, 102.0, 127.0, 160.0, 267.0, 471.0, 735.0, 1167.0, 2161.0, 3877.0, 7541.0, 14839.0, 29396.0, 56962.0, 103039.0, 159489.0, 196257.0, 182200.0, 129725.0, 76541.0, 40230.0, 20638.0, 10244.0, 5273.0, 2858.0, 1562.0, 887.0, 555.0, 350.0, 223.0, 157.0, 118.0, 71.0, 52.0, 35.0, 22.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1484375, -1.1143951416015625, -1.080352783203125, -1.0463104248046875, -1.01226806640625, -0.9782257080078125, -0.944183349609375, -0.9101409912109375, -0.8760986328125, -0.8420562744140625, -0.808013916015625, -0.7739715576171875, -0.73992919921875, -0.7058868408203125, -0.671844482421875, -0.6378021240234375, -0.603759765625, -0.5697174072265625, -0.535675048828125, -0.5016326904296875, -0.46759033203125, -0.4335479736328125, -0.399505615234375, -0.3654632568359375, -0.3314208984375, -0.2973785400390625, -0.263336181640625, -0.2292938232421875, -0.19525146484375, -0.1612091064453125, -0.127166748046875, -0.0931243896484375, -0.05908203125, -0.0250396728515625, 0.009002685546875, 0.0430450439453125, 0.07708740234375, 0.1111297607421875, 0.145172119140625, 0.1792144775390625, 0.2132568359375, 0.2472991943359375, 0.281341552734375, 0.3153839111328125, 0.34942626953125, 0.3834686279296875, 0.417510986328125, 0.4515533447265625, 0.485595703125, 0.5196380615234375, 0.553680419921875, 0.5877227783203125, 0.62176513671875, 0.6558074951171875, 0.689849853515625, 0.7238922119140625, 0.7579345703125, 0.7919769287109375, 0.826019287109375, 0.8600616455078125, 0.89410400390625, 0.9281463623046875, 0.962188720703125, 0.9962310791015625, 1.0302734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 11.0, 14.0, 15.0, 23.0, 31.0, 32.0, 42.0, 44.0, 64.0, 61.0, 85.0, 73.0, 75.0, 72.0, 47.0, 50.0, 39.0, 57.0, 35.0, 25.0, 20.0, 19.0, 19.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.344482421875, -0.3343162536621094, -0.32415008544921875, -0.3139839172363281, -0.3038177490234375, -0.2936515808105469, -0.28348541259765625, -0.2733192443847656, -0.263153076171875, -0.2529869079589844, -0.24282073974609375, -0.23265457153320312, -0.2224884033203125, -0.21232223510742188, -0.20215606689453125, -0.19198989868164062, -0.18182373046875, -0.17165756225585938, -0.16149139404296875, -0.15132522583007812, -0.1411590576171875, -0.13099288940429688, -0.12082672119140625, -0.11066055297851562, -0.100494384765625, -0.09032821655273438, -0.08016204833984375, -0.06999588012695312, -0.0598297119140625, -0.049663543701171875, -0.03949737548828125, -0.029331207275390625, -0.0191650390625, -0.008998870849609375, 0.00116729736328125, 0.011333465576171875, 0.0214996337890625, 0.031665802001953125, 0.04183197021484375, 0.051998138427734375, 0.062164306640625, 0.07233047485351562, 0.08249664306640625, 0.09266281127929688, 0.1028289794921875, 0.11299514770507812, 0.12316131591796875, 0.13332748413085938, 0.14349365234375, 0.15365982055664062, 0.16382598876953125, 0.17399215698242188, 0.1841583251953125, 0.19432449340820312, 0.20449066162109375, 0.21465682983398438, 0.224822998046875, 0.23498916625976562, 0.24515533447265625, 0.2553215026855469, 0.2654876708984375, 0.2756538391113281, 0.28582000732421875, 0.2959861755371094, 0.30615234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 9.0, 10.0, 6.0, 4.0, 27.0, 21.0, 21.0, 22.0, 32.0, 40.0, 40.0, 51.0, 54.0, 64.0, 65.0, 55.0, 51.0, 53.0, 50.0, 61.0, 34.0, 46.0, 37.0, 36.0, 23.0, 19.0, 19.0, 13.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6378824710845947, -2.55696964263916, -2.4760570526123047, -2.39514422416687, -2.3142313957214355, -2.233318567276001, -2.1524057388305664, -2.071493148803711, -1.9905803203582764, -1.9096674919128418, -1.8287547826766968, -1.7478420734405518, -1.6669292449951172, -1.5860164165496826, -1.5051037073135376, -1.4241909980773926, -1.343278169631958, -1.2623653411865234, -1.1814526319503784, -1.1005399227142334, -1.0196270942687988, -0.938714325428009, -0.8578015565872192, -0.7768887877464294, -0.6959760189056396, -0.6150632500648499, -0.5341504812240601, -0.45323771238327026, -0.37232494354248047, -0.2914121747016907, -0.21049940586090088, -0.12958663702011108, -0.04867410659790039, 0.032238662242889404, 0.1131514310836792, 0.194064199924469, 0.2749769687652588, 0.3558897376060486, 0.4368025064468384, 0.5177152752876282, 0.598628044128418, 0.6795408129692078, 0.7604535818099976, 0.8413663506507874, 0.9222791194915771, 1.0031919479370117, 1.0841046571731567, 1.1650173664093018, 1.2459301948547363, 1.326843023300171, 1.407755732536316, 1.488668441772461, 1.5695812702178955, 1.65049409866333, 1.731406807899475, 1.8123195171356201, 1.8932323455810547, 1.9741451740264893, 2.055058002471924, 2.1359705924987793, 2.216883420944214, 2.2977962493896484, 2.378708839416504, 2.4596216678619385, 2.540534496307373]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 9.0, 12.0, 15.0, 6.0, 17.0, 16.0, 8.0, 24.0, 22.0, 28.0, 30.0, 26.0, 32.0, 40.0, 32.0, 43.0, 37.0, 35.0, 43.0, 46.0, 31.0, 46.0, 38.0, 22.0, 40.0, 34.0, 42.0, 29.0, 30.0, 29.0, 23.0, 25.0, 15.0, 12.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7800862789154053, -1.7279075384140015, -1.6757287979125977, -1.6235501766204834, -1.5713714361190796, -1.5191926956176758, -1.4670140743255615, -1.4148353338241577, -1.362656593322754, -1.31047785282135, -1.2582991123199463, -1.206120491027832, -1.1539417505264282, -1.1017630100250244, -1.0495843887329102, -0.9974056482315063, -0.9452269077301025, -0.8930481672286987, -0.8408694863319397, -0.7886908054351807, -0.7365120649337769, -0.684333324432373, -0.632154643535614, -0.579975962638855, -0.5277972221374512, -0.47561851143836975, -0.42343980073928833, -0.3712610900402069, -0.3190823793411255, -0.26690366864204407, -0.21472495794296265, -0.16254624724388123, -0.11036765575408936, -0.058188945055007935, -0.006010234355926514, 0.04616847634315491, 0.09834718704223633, 0.15052589774131775, 0.20270460844039917, 0.2548833191394806, 0.307062029838562, 0.35924074053764343, 0.41141945123672485, 0.4635981619358063, 0.5157768726348877, 0.5679556131362915, 0.6201342940330505, 0.6723129749298096, 0.7244917154312134, 0.7766704559326172, 0.8288491368293762, 0.8810278177261353, 0.9332065582275391, 0.9853852987289429, 1.0375640392303467, 1.089742660522461, 1.1419214010238647, 1.1941001415252686, 1.2462787628173828, 1.2984575033187866, 1.3506362438201904, 1.4028149843215942, 1.454993724822998, 1.5071723461151123, 1.5593510866165161]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 9.0, 18.0, 27.0, 35.0, 54.0, 83.0, 121.0, 187.0, 340.0, 522.0, 886.0, 1481.0, 2412.0, 4237.0, 7285.0, 12654.0, 21566.0, 36922.0, 62354.0, 104771.0, 166104.0, 252475.0, 357782.0, 462754.0, 534085.0, 543572.0, 487063.0, 385959.0, 277514.0, 184558.0, 116806.0, 70856.0, 41709.0, 24144.0, 13981.0, 7839.0, 4576.0, 2691.0, 1488.0, 938.0, 586.0, 295.0, 212.0, 128.0, 87.0, 43.0, 35.0, 13.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8046875, -1.7467193603515625, -1.688751220703125, -1.6307830810546875, -1.57281494140625, -1.5148468017578125, -1.456878662109375, -1.3989105224609375, -1.3409423828125, -1.2829742431640625, -1.225006103515625, -1.1670379638671875, -1.10906982421875, -1.0511016845703125, -0.993133544921875, -0.9351654052734375, -0.877197265625, -0.8192291259765625, -0.761260986328125, -0.7032928466796875, -0.64532470703125, -0.5873565673828125, -0.529388427734375, -0.4714202880859375, -0.4134521484375, -0.3554840087890625, -0.297515869140625, -0.2395477294921875, -0.18157958984375, -0.1236114501953125, -0.065643310546875, -0.0076751708984375, 0.05029296875, 0.1082611083984375, 0.166229248046875, 0.2241973876953125, 0.28216552734375, 0.3401336669921875, 0.398101806640625, 0.4560699462890625, 0.5140380859375, 0.5720062255859375, 0.629974365234375, 0.6879425048828125, 0.74591064453125, 0.8038787841796875, 0.861846923828125, 0.9198150634765625, 0.977783203125, 1.0357513427734375, 1.093719482421875, 1.1516876220703125, 1.20965576171875, 1.2676239013671875, 1.325592041015625, 1.3835601806640625, 1.4415283203125, 1.4994964599609375, 1.557464599609375, 1.6154327392578125, 1.67340087890625, 1.7313690185546875, 1.789337158203125, 1.8473052978515625, 1.9052734375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 3.0, 5.0, 10.0, 11.0, 12.0, 12.0, 9.0, 17.0, 14.0, 12.0, 16.0, 20.0, 26.0, 27.0, 40.0, 33.0, 30.0, 39.0, 42.0, 31.0, 44.0, 48.0, 40.0, 35.0, 36.0, 47.0, 34.0, 32.0, 30.0, 34.0, 35.0, 29.0, 21.0, 26.0, 18.0, 10.0, 13.0, 10.0, 8.0, 5.0, 2.0, 4.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0], "bins": [-1.611328125, -1.5662841796875, -1.521240234375, -1.4761962890625, -1.43115234375, -1.3861083984375, -1.341064453125, -1.2960205078125, -1.2509765625, -1.2059326171875, -1.160888671875, -1.1158447265625, -1.07080078125, -1.0257568359375, -0.980712890625, -0.9356689453125, -0.890625, -0.8455810546875, -0.800537109375, -0.7554931640625, -0.71044921875, -0.6654052734375, -0.620361328125, -0.5753173828125, -0.5302734375, -0.4852294921875, -0.440185546875, -0.3951416015625, -0.35009765625, -0.3050537109375, -0.260009765625, -0.2149658203125, -0.169921875, -0.1248779296875, -0.079833984375, -0.0347900390625, 0.01025390625, 0.0552978515625, 0.100341796875, 0.1453857421875, 0.1904296875, 0.2354736328125, 0.280517578125, 0.3255615234375, 0.37060546875, 0.4156494140625, 0.460693359375, 0.5057373046875, 0.55078125, 0.5958251953125, 0.640869140625, 0.6859130859375, 0.73095703125, 0.7760009765625, 0.821044921875, 0.8660888671875, 0.9111328125, 0.9561767578125, 1.001220703125, 1.0462646484375, 1.09130859375, 1.1363525390625, 1.181396484375, 1.2264404296875, 1.271484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 13.0, 15.0, 37.0, 48.0, 85.0, 127.0, 245.0, 460.0, 784.0, 1379.0, 2343.0, 4176.0, 7597.0, 13104.0, 22841.0, 39031.0, 65387.0, 106857.0, 166479.0, 247792.0, 340674.0, 431886.0, 497237.0, 511027.0, 474096.0, 395133.0, 300736.0, 211483.0, 138844.0, 87820.0, 53205.0, 31266.0, 18204.0, 10393.0, 5901.0, 3267.0, 1893.0, 1020.0, 568.0, 372.0, 186.0, 103.0, 66.0, 39.0, 19.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.890533447265625, -1.82598876953125, -1.761444091796875, -1.6968994140625, -1.632354736328125, -1.56781005859375, -1.503265380859375, -1.438720703125, -1.374176025390625, -1.30963134765625, -1.245086669921875, -1.1805419921875, -1.115997314453125, -1.05145263671875, -0.986907958984375, -0.92236328125, -0.857818603515625, -0.79327392578125, -0.728729248046875, -0.6641845703125, -0.599639892578125, -0.53509521484375, -0.470550537109375, -0.406005859375, -0.341461181640625, -0.27691650390625, -0.212371826171875, -0.1478271484375, -0.083282470703125, -0.01873779296875, 0.045806884765625, 0.1103515625, 0.174896240234375, 0.23944091796875, 0.303985595703125, 0.3685302734375, 0.433074951171875, 0.49761962890625, 0.562164306640625, 0.626708984375, 0.691253662109375, 0.75579833984375, 0.820343017578125, 0.8848876953125, 0.949432373046875, 1.01397705078125, 1.078521728515625, 1.14306640625, 1.207611083984375, 1.27215576171875, 1.336700439453125, 1.4012451171875, 1.465789794921875, 1.53033447265625, 1.594879150390625, 1.659423828125, 1.723968505859375, 1.78851318359375, 1.853057861328125, 1.9176025390625, 1.982147216796875, 2.04669189453125, 2.111236572265625, 2.17578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 12.0, 24.0, 16.0, 20.0, 33.0, 40.0, 54.0, 63.0, 68.0, 90.0, 95.0, 98.0, 117.0, 140.0, 147.0, 162.0, 183.0, 193.0, 188.0, 219.0, 235.0, 223.0, 207.0, 172.0, 175.0, 147.0, 146.0, 110.0, 122.0, 111.0, 78.0, 80.0, 60.0, 51.0, 39.0, 21.0, 25.0, 28.0, 10.0, 12.0, 10.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83203125, -0.8075332641601562, -0.7830352783203125, -0.7585372924804688, -0.734039306640625, -0.7095413208007812, -0.6850433349609375, -0.6605453491210938, -0.63604736328125, -0.6115493774414062, -0.5870513916015625, -0.5625534057617188, -0.538055419921875, -0.5135574340820312, -0.4890594482421875, -0.46456146240234375, -0.4400634765625, -0.41556549072265625, -0.3910675048828125, -0.36656951904296875, -0.342071533203125, -0.31757354736328125, -0.2930755615234375, -0.26857757568359375, -0.24407958984375, -0.21958160400390625, -0.1950836181640625, -0.17058563232421875, -0.146087646484375, -0.12158966064453125, -0.0970916748046875, -0.07259368896484375, -0.048095703125, -0.02359771728515625, 0.0009002685546875, 0.02539825439453125, 0.049896240234375, 0.07439422607421875, 0.0988922119140625, 0.12339019775390625, 0.14788818359375, 0.17238616943359375, 0.1968841552734375, 0.22138214111328125, 0.245880126953125, 0.27037811279296875, 0.2948760986328125, 0.31937408447265625, 0.3438720703125, 0.36837005615234375, 0.3928680419921875, 0.41736602783203125, 0.441864013671875, 0.46636199951171875, 0.4908599853515625, 0.5153579711914062, 0.53985595703125, 0.5643539428710938, 0.5888519287109375, 0.6133499145507812, 0.637847900390625, 0.6623458862304688, 0.6868438720703125, 0.7113418579101562, 0.73583984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 7.0, 4.0, 13.0, 13.0, 21.0, 14.0, 28.0, 33.0, 40.0, 54.0, 44.0, 39.0, 58.0, 60.0, 70.0, 74.0, 50.0, 57.0, 55.0, 43.0, 45.0, 42.0, 34.0, 22.0, 22.0, 12.0, 17.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2938148975372314, -3.1929543018341064, -3.0920934677124023, -2.9912328720092773, -2.8903722763061523, -2.7895114421844482, -2.6886508464813232, -2.587790012359619, -2.486929416656494, -2.386068820953369, -2.285207986831665, -2.18434739112854, -2.083486557006836, -1.982625961303711, -1.881765365600586, -1.7809046506881714, -1.6800439357757568, -1.5791832208633423, -1.4783225059509277, -1.3774619102478027, -1.2766011953353882, -1.1757404804229736, -1.0748798847198486, -0.9740191698074341, -0.8731584548950195, -0.772297739982605, -0.6714370846748352, -0.5705764293670654, -0.4697157144546509, -0.36885499954223633, -0.26799434423446655, -0.16713368892669678, -0.06627321243286133, 0.034587472677230835, 0.135448157787323, 0.23630884289741516, 0.3371695280075073, 0.4380302429199219, 0.5388908982276917, 0.6397515535354614, 0.740612268447876, 0.8414729833602905, 0.9423336386680603, 1.04319429397583, 1.1440550088882446, 1.2449157238006592, 1.3457763195037842, 1.4466370344161987, 1.5474977493286133, 1.6483584642410278, 1.7492191791534424, 1.8500797748565674, 1.950940489768982, 2.0518012046813965, 2.1526618003845215, 2.2535223960876465, 2.3543832302093506, 2.4552438259124756, 2.5561046600341797, 2.6569652557373047, 2.7578258514404297, 2.858686685562134, 2.959547281265259, 3.060408115386963, 3.161268711090088]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 12.0, 4.0, 6.0, 9.0, 13.0, 13.0, 23.0, 17.0, 14.0, 13.0, 28.0, 24.0, 20.0, 27.0, 28.0, 34.0, 43.0, 36.0, 44.0, 32.0, 45.0, 36.0, 46.0, 39.0, 36.0, 37.0, 32.0, 23.0, 38.0, 35.0, 33.0, 29.0, 21.0, 22.0, 11.0, 15.0, 17.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8168824911117554, -1.7598389387130737, -1.7027955055236816, -1.645751953125, -1.5887084007263184, -1.5316649675369263, -1.4746214151382446, -1.4175779819488525, -1.360534429550171, -1.3034908771514893, -1.2464474439620972, -1.1894038915634155, -1.1323603391647339, -1.0753169059753418, -1.0182733535766602, -0.9612298607826233, -0.9041863083839417, -0.8471428155899048, -0.7900992631912231, -0.7330557703971863, -0.6760122776031494, -0.6189687252044678, -0.5619252324104309, -0.504881739616394, -0.4478382170200348, -0.39079469442367554, -0.33375120162963867, -0.2767076790332794, -0.21966417133808136, -0.1626206636428833, -0.10557714104652405, -0.04853364825248718, 0.00850987434387207, 0.06555338203907013, 0.12259689718484879, 0.17964041233062744, 0.2366839200258255, 0.29372742772102356, 0.3507709503173828, 0.4078144431114197, 0.46485796570777893, 0.5219014883041382, 0.578944981098175, 0.6359884738922119, 0.6930320262908936, 0.7500755190849304, 0.8071190118789673, 0.8641625642776489, 0.9212060570716858, 0.9782495498657227, 1.0352931022644043, 1.092336654663086, 1.149380087852478, 1.2064236402511597, 1.2634670734405518, 1.3205106258392334, 1.377554178237915, 1.4345977306365967, 1.4916411638259888, 1.5486847162246704, 1.605728268623352, 1.6627717018127441, 1.7198152542114258, 1.7768588066101074, 1.8339022397994995]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 12.0, 23.0, 24.0, 46.0, 58.0, 106.0, 145.0, 224.0, 279.0, 439.0, 660.0, 1019.0, 1419.0, 2146.0, 3322.0, 4931.0, 7488.0, 11555.0, 17962.0, 28246.0, 42907.0, 65004.0, 94734.0, 128331.0, 149902.0, 141480.0, 112387.0, 80042.0, 53264.0, 34856.0, 22861.0, 14528.0, 9563.0, 6222.0, 4150.0, 2714.0, 1820.0, 1166.0, 818.0, 557.0, 362.0, 244.0, 181.0, 119.0, 71.0, 55.0, 47.0, 21.0, 14.0, 8.0, 7.0, 3.0, 1.0, 5.0], "bins": [-0.473388671875, -0.45977020263671875, -0.4461517333984375, -0.43253326416015625, -0.418914794921875, -0.40529632568359375, -0.3916778564453125, -0.37805938720703125, -0.36444091796875, -0.35082244873046875, -0.3372039794921875, -0.32358551025390625, -0.309967041015625, -0.29634857177734375, -0.2827301025390625, -0.26911163330078125, -0.2554931640625, -0.24187469482421875, -0.2282562255859375, -0.21463775634765625, -0.201019287109375, -0.18740081787109375, -0.1737823486328125, -0.16016387939453125, -0.14654541015625, -0.13292694091796875, -0.1193084716796875, -0.10569000244140625, -0.092071533203125, -0.07845306396484375, -0.0648345947265625, -0.05121612548828125, -0.03759765625, -0.02397918701171875, -0.0103607177734375, 0.00325775146484375, 0.016876220703125, 0.03049468994140625, 0.0441131591796875, 0.05773162841796875, 0.07135009765625, 0.08496856689453125, 0.0985870361328125, 0.11220550537109375, 0.125823974609375, 0.13944244384765625, 0.1530609130859375, 0.16667938232421875, 0.1802978515625, 0.19391632080078125, 0.2075347900390625, 0.22115325927734375, 0.234771728515625, 0.24839019775390625, 0.2620086669921875, 0.27562713623046875, 0.28924560546875, 0.30286407470703125, 0.3164825439453125, 0.33010101318359375, 0.343719482421875, 0.35733795166015625, 0.3709564208984375, 0.38457489013671875, 0.398193359375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 13.0, 19.0, 17.0, 22.0, 18.0, 16.0, 21.0, 19.0, 27.0, 19.0, 29.0, 33.0, 41.0, 32.0, 43.0, 44.0, 52.0, 45.0, 28.0, 50.0, 42.0, 41.0, 26.0, 40.0, 28.0, 34.0, 30.0, 26.0, 19.0, 12.0, 10.0, 18.0, 14.0, 2.0, 7.0, 4.0, 5.0, 8.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8527374267578125, -1.790435791015625, -1.7281341552734375, -1.66583251953125, -1.6035308837890625, -1.541229248046875, -1.4789276123046875, -1.4166259765625, -1.3543243408203125, -1.292022705078125, -1.2297210693359375, -1.16741943359375, -1.1051177978515625, -1.042816162109375, -0.9805145263671875, -0.918212890625, -0.8559112548828125, -0.793609619140625, -0.7313079833984375, -0.66900634765625, -0.6067047119140625, -0.544403076171875, -0.4821014404296875, -0.4197998046875, -0.3574981689453125, -0.295196533203125, -0.2328948974609375, -0.17059326171875, -0.1082916259765625, -0.045989990234375, 0.0163116455078125, 0.07861328125, 0.1409149169921875, 0.203216552734375, 0.2655181884765625, 0.32781982421875, 0.3901214599609375, 0.452423095703125, 0.5147247314453125, 0.5770263671875, 0.6393280029296875, 0.701629638671875, 0.7639312744140625, 0.82623291015625, 0.8885345458984375, 0.950836181640625, 1.0131378173828125, 1.075439453125, 1.1377410888671875, 1.200042724609375, 1.2623443603515625, 1.32464599609375, 1.3869476318359375, 1.449249267578125, 1.5115509033203125, 1.5738525390625, 1.6361541748046875, 1.698455810546875, 1.7607574462890625, 1.82305908203125, 1.8853607177734375, 1.947662353515625, 2.0099639892578125, 2.072265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 10.0, 19.0, 26.0, 35.0, 45.0, 76.0, 117.0, 174.0, 238.0, 412.0, 608.0, 1016.0, 1660.0, 2632.0, 4724.0, 8713.0, 16049.0, 30628.0, 59733.0, 114975.0, 198380.0, 239234.0, 171293.0, 93696.0, 48393.0, 25064.0, 13174.0, 7166.0, 3990.0, 2397.0, 1403.0, 875.0, 563.0, 345.0, 227.0, 139.0, 105.0, 60.0, 52.0, 26.0, 26.0, 13.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0], "bins": [-0.669921875, -0.6492080688476562, -0.6284942626953125, -0.6077804565429688, -0.587066650390625, -0.5663528442382812, -0.5456390380859375, -0.5249252319335938, -0.50421142578125, -0.48349761962890625, -0.4627838134765625, -0.44207000732421875, -0.421356201171875, -0.40064239501953125, -0.3799285888671875, -0.35921478271484375, -0.3385009765625, -0.31778717041015625, -0.2970733642578125, -0.27635955810546875, -0.255645751953125, -0.23493194580078125, -0.2142181396484375, -0.19350433349609375, -0.17279052734375, -0.15207672119140625, -0.1313629150390625, -0.11064910888671875, -0.089935302734375, -0.06922149658203125, -0.0485076904296875, -0.02779388427734375, -0.007080078125, 0.01363372802734375, 0.0343475341796875, 0.05506134033203125, 0.075775146484375, 0.09648895263671875, 0.1172027587890625, 0.13791656494140625, 0.15863037109375, 0.17934417724609375, 0.2000579833984375, 0.22077178955078125, 0.241485595703125, 0.26219940185546875, 0.2829132080078125, 0.30362701416015625, 0.3243408203125, 0.34505462646484375, 0.3657684326171875, 0.38648223876953125, 0.407196044921875, 0.42790985107421875, 0.4486236572265625, 0.46933746337890625, 0.49005126953125, 0.5107650756835938, 0.5314788818359375, 0.5521926879882812, 0.572906494140625, 0.5936203002929688, 0.6143341064453125, 0.6350479125976562, 0.65576171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 10.0, 9.0, 7.0, 11.0, 9.0, 15.0, 14.0, 27.0, 26.0, 25.0, 31.0, 31.0, 43.0, 32.0, 32.0, 38.0, 51.0, 60.0, 45.0, 40.0, 37.0, 34.0, 56.0, 36.0, 31.0, 28.0, 50.0, 21.0, 33.0, 23.0, 14.0, 12.0, 13.0, 18.0, 12.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1537017822265625, -1.113067626953125, -1.0724334716796875, -1.03179931640625, -0.9911651611328125, -0.950531005859375, -0.9098968505859375, -0.8692626953125, -0.8286285400390625, -0.787994384765625, -0.7473602294921875, -0.70672607421875, -0.6660919189453125, -0.625457763671875, -0.5848236083984375, -0.544189453125, -0.5035552978515625, -0.462921142578125, -0.4222869873046875, -0.38165283203125, -0.3410186767578125, -0.300384521484375, -0.2597503662109375, -0.2191162109375, -0.1784820556640625, -0.137847900390625, -0.0972137451171875, -0.05657958984375, -0.0159454345703125, 0.024688720703125, 0.0653228759765625, 0.10595703125, 0.1465911865234375, 0.187225341796875, 0.2278594970703125, 0.26849365234375, 0.3091278076171875, 0.349761962890625, 0.3903961181640625, 0.4310302734375, 0.4716644287109375, 0.512298583984375, 0.5529327392578125, 0.59356689453125, 0.6342010498046875, 0.674835205078125, 0.7154693603515625, 0.756103515625, 0.7967376708984375, 0.837371826171875, 0.8780059814453125, 0.91864013671875, 0.9592742919921875, 0.999908447265625, 1.0405426025390625, 1.0811767578125, 1.1218109130859375, 1.162445068359375, 1.2030792236328125, 1.24371337890625, 1.2843475341796875, 1.324981689453125, 1.3656158447265625, 1.40625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 14.0, 7.0, 28.0, 31.0, 29.0, 44.0, 53.0, 65.0, 86.0, 141.0, 183.0, 244.0, 351.0, 505.0, 727.0, 1222.0, 1885.0, 3160.0, 5712.0, 11583.0, 27475.0, 88541.0, 393989.0, 375300.0, 84834.0, 26569.0, 11473.0, 5771.0, 3045.0, 1827.0, 1134.0, 736.0, 498.0, 344.0, 238.0, 162.0, 130.0, 118.0, 88.0, 63.0, 39.0, 30.0, 18.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4084968566894531, -0.39389801025390625, -0.3792991638183594, -0.3647003173828125, -0.3501014709472656, -0.33550262451171875, -0.3209037780761719, -0.306304931640625, -0.2917060852050781, -0.27710723876953125, -0.2625083923339844, -0.2479095458984375, -0.23331069946289062, -0.21871185302734375, -0.20411300659179688, -0.18951416015625, -0.17491531372070312, -0.16031646728515625, -0.14571762084960938, -0.1311187744140625, -0.11651992797851562, -0.10192108154296875, -0.08732223510742188, -0.072723388671875, -0.058124542236328125, -0.04352569580078125, -0.028926849365234375, -0.0143280029296875, 0.000270843505859375, 0.01486968994140625, 0.029468536376953125, 0.0440673828125, 0.058666229248046875, 0.07326507568359375, 0.08786392211914062, 0.1024627685546875, 0.11706161499023438, 0.13166046142578125, 0.14625930786132812, 0.160858154296875, 0.17545700073242188, 0.19005584716796875, 0.20465469360351562, 0.2192535400390625, 0.23385238647460938, 0.24845123291015625, 0.2630500793457031, 0.27764892578125, 0.2922477722167969, 0.30684661865234375, 0.3214454650878906, 0.3360443115234375, 0.3506431579589844, 0.36524200439453125, 0.3798408508300781, 0.394439697265625, 0.4090385437011719, 0.42363739013671875, 0.4382362365722656, 0.4528350830078125, 0.4674339294433594, 0.48203277587890625, 0.4966316223144531, 0.51123046875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 6.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 4.0, 5.0, 7.0, 9.0, 12.0, 16.0, 12.0, 27.0, 15.0, 44.0, 45.0, 35.0, 40.0, 53.0, 57.0, 57.0, 62.0, 59.0, 51.0, 50.0, 36.0, 44.0, 36.0, 37.0, 22.0, 25.0, 23.0, 13.0, 20.0, 9.0, 7.0, 5.0, 9.0, 16.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.328345388174057e-05, -1.2798234820365906e-05, -1.2313015758991241e-05, -1.1827796697616577e-05, -1.1342577636241913e-05, -1.0857358574867249e-05, -1.0372139513492584e-05, -9.88692045211792e-06, -9.401701390743256e-06, -8.916482329368591e-06, -8.431263267993927e-06, -7.946044206619263e-06, -7.460825145244598e-06, -6.975606083869934e-06, -6.49038702249527e-06, -6.0051679611206055e-06, -5.519948899745941e-06, -5.034729838371277e-06, -4.5495107769966125e-06, -4.064291715621948e-06, -3.579072654247284e-06, -3.0938535928726196e-06, -2.6086345314979553e-06, -2.123415470123291e-06, -1.6381964087486267e-06, -1.1529773473739624e-06, -6.677582859992981e-07, -1.825392246246338e-07, 3.026798367500305e-07, 7.878988981246948e-07, 1.2731179594993591e-06, 1.7583370208740234e-06, 2.2435560822486877e-06, 2.728775143623352e-06, 3.2139942049980164e-06, 3.6992132663726807e-06, 4.184432327747345e-06, 4.669651389122009e-06, 5.154870450496674e-06, 5.640089511871338e-06, 6.125308573246002e-06, 6.6105276346206665e-06, 7.095746695995331e-06, 7.580965757369995e-06, 8.06618481874466e-06, 8.551403880119324e-06, 9.036622941493988e-06, 9.521842002868652e-06, 1.0007061064243317e-05, 1.0492280125617981e-05, 1.0977499186992645e-05, 1.146271824836731e-05, 1.1947937309741974e-05, 1.2433156371116638e-05, 1.2918375432491302e-05, 1.3403594493865967e-05, 1.3888813555240631e-05, 1.4374032616615295e-05, 1.485925167798996e-05, 1.5344470739364624e-05, 1.582968980073929e-05, 1.6314908862113953e-05, 1.6800127923488617e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 19.0, 18.0, 40.0, 34.0, 47.0, 96.0, 113.0, 158.0, 223.0, 314.0, 446.0, 686.0, 974.0, 1476.0, 2254.0, 3524.0, 5962.0, 10912.0, 23249.0, 58464.0, 172586.0, 384852.0, 238732.0, 80543.0, 30208.0, 13690.0, 7018.0, 4096.0, 2522.0, 1621.0, 1121.0, 772.0, 552.0, 369.0, 269.0, 181.0, 131.0, 95.0, 59.0, 37.0, 24.0, 15.0, 19.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5106124877929688, -0.4933929443359375, -0.47617340087890625, -0.458953857421875, -0.44173431396484375, -0.4245147705078125, -0.40729522705078125, -0.39007568359375, -0.37285614013671875, -0.3556365966796875, -0.33841705322265625, -0.321197509765625, -0.30397796630859375, -0.2867584228515625, -0.26953887939453125, -0.2523193359375, -0.23509979248046875, -0.2178802490234375, -0.20066070556640625, -0.183441162109375, -0.16622161865234375, -0.1490020751953125, -0.13178253173828125, -0.11456298828125, -0.09734344482421875, -0.0801239013671875, -0.06290435791015625, -0.045684814453125, -0.02846527099609375, -0.0112457275390625, 0.00597381591796875, 0.023193359375, 0.04041290283203125, 0.0576324462890625, 0.07485198974609375, 0.092071533203125, 0.10929107666015625, 0.1265106201171875, 0.14373016357421875, 0.16094970703125, 0.17816925048828125, 0.1953887939453125, 0.21260833740234375, 0.229827880859375, 0.24704742431640625, 0.2642669677734375, 0.28148651123046875, 0.2987060546875, 0.31592559814453125, 0.3331451416015625, 0.35036468505859375, 0.367584228515625, 0.38480377197265625, 0.4020233154296875, 0.41924285888671875, 0.43646240234375, 0.45368194580078125, 0.4709014892578125, 0.48812103271484375, 0.505340576171875, 0.5225601196289062, 0.5397796630859375, 0.5569992065429688, 0.57421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 16.0, 11.0, 19.0, 23.0, 31.0, 40.0, 44.0, 71.0, 73.0, 73.0, 90.0, 70.0, 86.0, 59.0, 45.0, 40.0, 23.0, 27.0, 18.0, 22.0, 8.0, 9.0, 9.0, 14.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.11407470703125, -0.11100006103515625, -0.1079254150390625, -0.10485076904296875, -0.101776123046875, -0.09870147705078125, -0.0956268310546875, -0.09255218505859375, -0.0894775390625, -0.08640289306640625, -0.0833282470703125, -0.08025360107421875, -0.077178955078125, -0.07410430908203125, -0.0710296630859375, -0.06795501708984375, -0.06488037109375, -0.06180572509765625, -0.0587310791015625, -0.05565643310546875, -0.052581787109375, -0.04950714111328125, -0.0464324951171875, -0.04335784912109375, -0.040283203125, -0.03720855712890625, -0.0341339111328125, -0.03105926513671875, -0.027984619140625, -0.02490997314453125, -0.0218353271484375, -0.01876068115234375, -0.01568603515625, -0.01261138916015625, -0.0095367431640625, -0.00646209716796875, -0.003387451171875, -0.00031280517578125, 0.0027618408203125, 0.00583648681640625, 0.0089111328125, 0.01198577880859375, 0.0150604248046875, 0.01813507080078125, 0.021209716796875, 0.02428436279296875, 0.0273590087890625, 0.03043365478515625, 0.03350830078125, 0.03658294677734375, 0.0396575927734375, 0.04273223876953125, 0.045806884765625, 0.04888153076171875, 0.0519561767578125, 0.05503082275390625, 0.05810546875, 0.06118011474609375, 0.0642547607421875, 0.06732940673828125, 0.070404052734375, 0.07347869873046875, 0.0765533447265625, 0.07962799072265625, 0.08270263671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 6.0, 5.0, 6.0, 8.0, 10.0, 16.0, 17.0, 15.0, 29.0, 36.0, 37.0, 45.0, 46.0, 47.0, 52.0, 63.0, 68.0, 78.0, 50.0, 57.0, 51.0, 43.0, 48.0, 36.0, 35.0, 28.0, 20.0, 18.0, 10.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2994351387023926, -3.1985461711883545, -3.0976574420928955, -2.9967684745788574, -2.8958797454833984, -2.7949907779693604, -2.6941020488739014, -2.5932130813598633, -2.4923243522644043, -2.391435384750366, -2.2905466556549072, -2.189657688140869, -2.08876895904541, -1.987879991531372, -1.886991262435913, -1.786102294921875, -1.6852134466171265, -1.584324598312378, -1.4834357500076294, -1.3825469017028809, -1.2816580533981323, -1.1807692050933838, -1.0798802375793457, -0.9789914488792419, -0.8781026005744934, -0.7772137522697449, -0.6763249039649963, -0.575435996055603, -0.4745471775531769, -0.37365829944610596, -0.2727694511413574, -0.1718806028366089, -0.07099175453186035, 0.02989710122346878, 0.1307859569787979, 0.23167482018470764, 0.3325636684894562, 0.4334525465965271, 0.5343413949012756, 0.6352302432060242, 0.7361190915107727, 0.8370079398155212, 0.9378967881202698, 1.038785696029663, 1.1396745443344116, 1.2405633926391602, 1.3414522409439087, 1.4423410892486572, 1.5432299375534058, 1.6441187858581543, 1.7450076341629028, 1.8458964824676514, 1.9467853307724, 2.0476741790771484, 2.1485631465911865, 2.2494518756866455, 2.3503408432006836, 2.4512298107147217, 2.5521185398101807, 2.6530075073242188, 2.7538962364196777, 2.854785203933716, 2.955673933029175, 3.056562900543213, 3.157451629638672]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 4.0, 7.0, 10.0, 10.0, 18.0, 18.0, 21.0, 13.0, 16.0, 35.0, 17.0, 23.0, 29.0, 31.0, 37.0, 37.0, 41.0, 34.0, 41.0, 45.0, 40.0, 40.0, 39.0, 34.0, 42.0, 29.0, 26.0, 39.0, 36.0, 27.0, 24.0, 20.0, 17.0, 16.0, 15.0, 15.0, 6.0, 6.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7987110614776611, -1.7415999174118042, -1.6844886541366577, -1.6273775100708008, -1.5702662467956543, -1.5131551027297974, -1.4560439586639404, -1.398932695388794, -1.3418214321136475, -1.2847102880477905, -1.227599024772644, -1.170487880706787, -1.1133766174316406, -1.0562654733657837, -0.999154269695282, -0.9420430660247803, -0.8849319219589233, -0.8278207182884216, -0.7707095146179199, -0.713598370552063, -0.6564871072769165, -0.5993759632110596, -0.5422647595405579, -0.48515355587005615, -0.42804235219955444, -0.37093114852905273, -0.313819944858551, -0.2567087709903717, -0.19959756731987, -0.1424863636493683, -0.08537518978118896, -0.028263986110687256, 0.028847098350524902, 0.08595829457044601, 0.14306949079036713, 0.20018067955970764, 0.25729188323020935, 0.31440308690071106, 0.3715142607688904, 0.4286254644393921, 0.4857366681098938, 0.5428478717803955, 0.5999590754508972, 0.6570702791213989, 0.7141814231872559, 0.7712926864624023, 0.8284038305282593, 0.885515034198761, 0.9426262378692627, 0.9997374415397644, 1.0568486452102661, 1.113959789276123, 1.1710710525512695, 1.2281821966171265, 1.2852933406829834, 1.3424046039581299, 1.3995158672332764, 1.4566270112991333, 1.5137382745742798, 1.5708494186401367, 1.6279606819152832, 1.6850718259811401, 1.742182970046997, 1.7992942333221436, 1.8564053773880005]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 12.0, 11.0, 15.0, 33.0, 44.0, 73.0, 122.0, 205.0, 321.0, 533.0, 811.0, 1353.0, 2180.0, 3316.0, 5119.0, 7668.0, 11589.0, 16934.0, 24338.0, 34025.0, 45224.0, 58397.0, 72075.0, 83815.0, 92661.0, 96235.0, 94346.0, 87113.0, 76141.0, 62501.0, 49458.0, 37534.0, 27068.0, 18914.0, 13310.0, 8831.0, 5919.0, 3782.0, 2428.0, 1487.0, 963.0, 614.0, 393.0, 233.0, 172.0, 97.0, 64.0, 32.0, 26.0, 10.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0713043212890625, -1.035186767578125, -0.9990692138671875, -0.96295166015625, -0.9268341064453125, -0.890716552734375, -0.8545989990234375, -0.8184814453125, -0.7823638916015625, -0.746246337890625, -0.7101287841796875, -0.67401123046875, -0.6378936767578125, -0.601776123046875, -0.5656585693359375, -0.529541015625, -0.4934234619140625, -0.457305908203125, -0.4211883544921875, -0.38507080078125, -0.3489532470703125, -0.312835693359375, -0.2767181396484375, -0.2406005859375, -0.2044830322265625, -0.168365478515625, -0.1322479248046875, -0.09613037109375, -0.0600128173828125, -0.023895263671875, 0.0122222900390625, 0.04833984375, 0.0844573974609375, 0.120574951171875, 0.1566925048828125, 0.19281005859375, 0.2289276123046875, 0.265045166015625, 0.3011627197265625, 0.3372802734375, 0.3733978271484375, 0.409515380859375, 0.4456329345703125, 0.48175048828125, 0.5178680419921875, 0.553985595703125, 0.5901031494140625, 0.626220703125, 0.6623382568359375, 0.698455810546875, 0.7345733642578125, 0.77069091796875, 0.8068084716796875, 0.842926025390625, 0.8790435791015625, 0.9151611328125, 0.9512786865234375, 0.987396240234375, 1.0235137939453125, 1.05963134765625, 1.0957489013671875, 1.131866455078125, 1.1679840087890625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 7.0, 15.0, 20.0, 14.0, 21.0, 19.0, 14.0, 30.0, 24.0, 32.0, 19.0, 38.0, 39.0, 38.0, 41.0, 38.0, 45.0, 49.0, 42.0, 47.0, 36.0, 43.0, 34.0, 31.0, 40.0, 32.0, 22.0, 19.0, 23.0, 15.0, 12.0, 19.0, 17.0, 10.0, 11.0, 5.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7926788330078125, -1.728912353515625, -1.6651458740234375, -1.60137939453125, -1.5376129150390625, -1.473846435546875, -1.4100799560546875, -1.3463134765625, -1.2825469970703125, -1.218780517578125, -1.1550140380859375, -1.09124755859375, -1.0274810791015625, -0.963714599609375, -0.8999481201171875, -0.836181640625, -0.7724151611328125, -0.708648681640625, -0.6448822021484375, -0.58111572265625, -0.5173492431640625, -0.453582763671875, -0.3898162841796875, -0.3260498046875, -0.2622833251953125, -0.198516845703125, -0.1347503662109375, -0.07098388671875, -0.0072174072265625, 0.056549072265625, 0.1203155517578125, 0.18408203125, 0.2478485107421875, 0.311614990234375, 0.3753814697265625, 0.43914794921875, 0.5029144287109375, 0.566680908203125, 0.6304473876953125, 0.6942138671875, 0.7579803466796875, 0.821746826171875, 0.8855133056640625, 0.94927978515625, 1.0130462646484375, 1.076812744140625, 1.1405792236328125, 1.204345703125, 1.2681121826171875, 1.331878662109375, 1.3956451416015625, 1.45941162109375, 1.5231781005859375, 1.586944580078125, 1.6507110595703125, 1.7144775390625, 1.7782440185546875, 1.842010498046875, 1.9057769775390625, 1.96954345703125, 2.0333099365234375, 2.097076416015625, 2.1608428955078125, 2.224609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 21.0, 33.0, 60.0, 73.0, 135.0, 171.0, 295.0, 467.0, 771.0, 1237.0, 1877.0, 2916.0, 4384.0, 6577.0, 10310.0, 14945.0, 21212.0, 30042.0, 40877.0, 53925.0, 67250.0, 80181.0, 90402.0, 95305.0, 95868.0, 90125.0, 79853.0, 67319.0, 53853.0, 41463.0, 30134.0, 21714.0, 15144.0, 10312.0, 6724.0, 4518.0, 2883.0, 1893.0, 1218.0, 728.0, 460.0, 314.0, 203.0, 144.0, 80.0, 35.0, 37.0, 29.0, 10.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0953369140625, -1.058837890625, -1.0223388671875, -0.98583984375, -0.9493408203125, -0.912841796875, -0.8763427734375, -0.83984375, -0.8033447265625, -0.766845703125, -0.7303466796875, -0.69384765625, -0.6573486328125, -0.620849609375, -0.5843505859375, -0.5478515625, -0.5113525390625, -0.474853515625, -0.4383544921875, -0.40185546875, -0.3653564453125, -0.328857421875, -0.2923583984375, -0.255859375, -0.2193603515625, -0.182861328125, -0.1463623046875, -0.10986328125, -0.0733642578125, -0.036865234375, -0.0003662109375, 0.0361328125, 0.0726318359375, 0.109130859375, 0.1456298828125, 0.18212890625, 0.2186279296875, 0.255126953125, 0.2916259765625, 0.328125, 0.3646240234375, 0.401123046875, 0.4376220703125, 0.47412109375, 0.5106201171875, 0.547119140625, 0.5836181640625, 0.6201171875, 0.6566162109375, 0.693115234375, 0.7296142578125, 0.76611328125, 0.8026123046875, 0.839111328125, 0.8756103515625, 0.912109375, 0.9486083984375, 0.985107421875, 1.0216064453125, 1.05810546875, 1.0946044921875, 1.131103515625, 1.1676025390625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 14.0, 14.0, 17.0, 17.0, 20.0, 23.0, 16.0, 32.0, 27.0, 33.0, 44.0, 26.0, 59.0, 38.0, 42.0, 43.0, 43.0, 44.0, 42.0, 38.0, 44.0, 40.0, 40.0, 26.0, 27.0, 21.0, 34.0, 18.0, 16.0, 16.0, 15.0, 9.0, 9.0, 5.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3603515625, -1.3197479248046875, -1.279144287109375, -1.2385406494140625, -1.19793701171875, -1.1573333740234375, -1.116729736328125, -1.0761260986328125, -1.0355224609375, -0.9949188232421875, -0.954315185546875, -0.9137115478515625, -0.87310791015625, -0.8325042724609375, -0.791900634765625, -0.7512969970703125, -0.710693359375, -0.6700897216796875, -0.629486083984375, -0.5888824462890625, -0.54827880859375, -0.5076751708984375, -0.467071533203125, -0.4264678955078125, -0.3858642578125, -0.3452606201171875, -0.304656982421875, -0.2640533447265625, -0.22344970703125, -0.1828460693359375, -0.142242431640625, -0.1016387939453125, -0.06103515625, -0.0204315185546875, 0.020172119140625, 0.0607757568359375, 0.10137939453125, 0.1419830322265625, 0.182586669921875, 0.2231903076171875, 0.2637939453125, 0.3043975830078125, 0.345001220703125, 0.3856048583984375, 0.42620849609375, 0.4668121337890625, 0.507415771484375, 0.5480194091796875, 0.588623046875, 0.6292266845703125, 0.669830322265625, 0.7104339599609375, 0.75103759765625, 0.7916412353515625, 0.832244873046875, 0.8728485107421875, 0.9134521484375, 0.9540557861328125, 0.994659423828125, 1.0352630615234375, 1.07586669921875, 1.1164703369140625, 1.157073974609375, 1.1976776123046875, 1.23828125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 19.0, 32.0, 61.0, 77.0, 131.0, 188.0, 313.0, 555.0, 697.0, 1216.0, 1949.0, 2962.0, 4571.0, 7234.0, 11177.0, 17053.0, 25180.0, 37040.0, 51644.0, 68870.0, 85769.0, 101227.0, 109306.0, 109602.0, 100557.0, 85509.0, 67554.0, 50302.0, 35657.0, 24786.0, 16555.0, 11197.0, 7003.0, 4657.0, 2830.0, 1828.0, 1165.0, 746.0, 481.0, 308.0, 197.0, 124.0, 76.0, 59.0, 28.0, 19.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.57110595703125, -0.5513916015625, -0.53167724609375, -0.511962890625, -0.49224853515625, -0.4725341796875, -0.45281982421875, -0.43310546875, -0.41339111328125, -0.3936767578125, -0.37396240234375, -0.354248046875, -0.33453369140625, -0.3148193359375, -0.29510498046875, -0.275390625, -0.25567626953125, -0.2359619140625, -0.21624755859375, -0.196533203125, -0.17681884765625, -0.1571044921875, -0.13739013671875, -0.11767578125, -0.09796142578125, -0.0782470703125, -0.05853271484375, -0.038818359375, -0.01910400390625, 0.0006103515625, 0.02032470703125, 0.0400390625, 0.05975341796875, 0.0794677734375, 0.09918212890625, 0.118896484375, 0.13861083984375, 0.1583251953125, 0.17803955078125, 0.19775390625, 0.21746826171875, 0.2371826171875, 0.25689697265625, 0.276611328125, 0.29632568359375, 0.3160400390625, 0.33575439453125, 0.35546875, 0.37518310546875, 0.3948974609375, 0.41461181640625, 0.434326171875, 0.45404052734375, 0.4737548828125, 0.49346923828125, 0.51318359375, 0.53289794921875, 0.5526123046875, 0.57232666015625, 0.592041015625, 0.61175537109375, 0.6314697265625, 0.65118408203125, 0.6708984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 16.0, 9.0, 19.0, 24.0, 21.0, 31.0, 32.0, 34.0, 43.0, 43.0, 37.0, 52.0, 66.0, 58.0, 51.0, 47.0, 58.0, 44.0, 42.0, 43.0, 35.0, 38.0, 24.0, 21.0, 20.0, 18.0, 11.0, 10.0, 11.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.399652481079102e-05, -9.12155956029892e-05, -8.843466639518738e-05, -8.565373718738556e-05, -8.287280797958374e-05, -8.009187877178192e-05, -7.73109495639801e-05, -7.453002035617828e-05, -7.174909114837646e-05, -6.896816194057465e-05, -6.618723273277283e-05, -6.340630352497101e-05, -6.062537431716919e-05, -5.784444510936737e-05, -5.506351590156555e-05, -5.228258669376373e-05, -4.9501657485961914e-05, -4.6720728278160095e-05, -4.3939799070358276e-05, -4.115886986255646e-05, -3.837794065475464e-05, -3.559701144695282e-05, -3.2816082239151e-05, -3.0035153031349182e-05, -2.7254223823547363e-05, -2.4473294615745544e-05, -2.1692365407943726e-05, -1.8911436200141907e-05, -1.6130506992340088e-05, -1.3349577784538269e-05, -1.056864857673645e-05, -7.787719368934631e-06, -5.0067901611328125e-06, -2.2258609533309937e-06, 5.550682544708252e-07, 3.335997462272644e-06, 6.116926670074463e-06, 8.897855877876282e-06, 1.16787850856781e-05, 1.445971429347992e-05, 1.7240643501281738e-05, 2.0021572709083557e-05, 2.2802501916885376e-05, 2.5583431124687195e-05, 2.8364360332489014e-05, 3.114528954029083e-05, 3.392621874809265e-05, 3.670714795589447e-05, 3.948807716369629e-05, 4.226900637149811e-05, 4.504993557929993e-05, 4.7830864787101746e-05, 5.0611793994903564e-05, 5.339272320270538e-05, 5.61736524105072e-05, 5.895458161830902e-05, 6.173551082611084e-05, 6.451644003391266e-05, 6.729736924171448e-05, 7.00782984495163e-05, 7.285922765731812e-05, 7.564015686511993e-05, 7.842108607292175e-05, 8.120201528072357e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 5.0, 7.0, 15.0, 24.0, 34.0, 70.0, 86.0, 129.0, 211.0, 299.0, 504.0, 748.0, 1220.0, 1941.0, 3099.0, 4886.0, 7731.0, 11867.0, 18267.0, 27525.0, 40138.0, 56625.0, 75412.0, 94927.0, 109401.0, 115207.0, 111321.0, 97903.0, 79672.0, 60504.0, 43184.0, 29808.0, 19820.0, 12948.0, 8397.0, 5274.0, 3350.0, 2224.0, 1393.0, 888.0, 555.0, 367.0, 214.0, 122.0, 88.0, 45.0, 41.0, 23.0, 19.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.59466552734375, -0.5731201171875, -0.55157470703125, -0.530029296875, -0.50848388671875, -0.4869384765625, -0.46539306640625, -0.44384765625, -0.42230224609375, -0.4007568359375, -0.37921142578125, -0.357666015625, -0.33612060546875, -0.3145751953125, -0.29302978515625, -0.271484375, -0.24993896484375, -0.2283935546875, -0.20684814453125, -0.185302734375, -0.16375732421875, -0.1422119140625, -0.12066650390625, -0.09912109375, -0.07757568359375, -0.0560302734375, -0.03448486328125, -0.012939453125, 0.00860595703125, 0.0301513671875, 0.05169677734375, 0.0732421875, 0.09478759765625, 0.1163330078125, 0.13787841796875, 0.159423828125, 0.18096923828125, 0.2025146484375, 0.22406005859375, 0.24560546875, 0.26715087890625, 0.2886962890625, 0.31024169921875, 0.331787109375, 0.35333251953125, 0.3748779296875, 0.39642333984375, 0.41796875, 0.43951416015625, 0.4610595703125, 0.48260498046875, 0.504150390625, 0.52569580078125, 0.5472412109375, 0.56878662109375, 0.59033203125, 0.61187744140625, 0.6334228515625, 0.65496826171875, 0.676513671875, 0.69805908203125, 0.7196044921875, 0.74114990234375, 0.7626953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 7.0, 6.0, 11.0, 14.0, 11.0, 17.0, 17.0, 20.0, 29.0, 31.0, 41.0, 42.0, 31.0, 46.0, 41.0, 57.0, 38.0, 51.0, 53.0, 54.0, 38.0, 30.0, 35.0, 36.0, 32.0, 31.0, 24.0, 23.0, 19.0, 27.0, 14.0, 14.0, 11.0, 9.0, 4.0, 7.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2149658203125, -0.20800018310546875, -0.2010345458984375, -0.19406890869140625, -0.187103271484375, -0.18013763427734375, -0.1731719970703125, -0.16620635986328125, -0.15924072265625, -0.15227508544921875, -0.1453094482421875, -0.13834381103515625, -0.131378173828125, -0.12441253662109375, -0.1174468994140625, -0.11048126220703125, -0.103515625, -0.09654998779296875, -0.0895843505859375, -0.08261871337890625, -0.075653076171875, -0.06868743896484375, -0.0617218017578125, -0.05475616455078125, -0.04779052734375, -0.04082489013671875, -0.0338592529296875, -0.02689361572265625, -0.019927978515625, -0.01296234130859375, -0.0059967041015625, 0.00096893310546875, 0.0079345703125, 0.01490020751953125, 0.0218658447265625, 0.02883148193359375, 0.035797119140625, 0.04276275634765625, 0.0497283935546875, 0.05669403076171875, 0.06365966796875, 0.07062530517578125, 0.0775909423828125, 0.08455657958984375, 0.091522216796875, 0.09848785400390625, 0.1054534912109375, 0.11241912841796875, 0.119384765625, 0.12635040283203125, 0.1333160400390625, 0.14028167724609375, 0.147247314453125, 0.15421295166015625, 0.1611785888671875, 0.16814422607421875, 0.17510986328125, 0.18207550048828125, 0.1890411376953125, 0.19600677490234375, 0.202972412109375, 0.20993804931640625, 0.2169036865234375, 0.22386932373046875, 0.2308349609375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 4.0, 7.0, 6.0, 5.0, 14.0, 16.0, 14.0, 17.0, 24.0, 28.0, 29.0, 51.0, 41.0, 52.0, 48.0, 78.0, 62.0, 54.0, 57.0, 50.0, 53.0, 43.0, 48.0, 37.0, 43.0, 25.0, 23.0, 13.0, 21.0, 13.0, 15.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.274965286254883, -3.179086208343506, -3.083207130432129, -2.987328052520752, -2.891448974609375, -2.795569896697998, -2.699690818786621, -2.603811740875244, -2.507932662963867, -2.4120535850524902, -2.3161745071411133, -2.2202954292297363, -2.1244163513183594, -2.0285372734069824, -1.932658076286316, -1.836778998374939, -1.7408998012542725, -1.6450207233428955, -1.5491416454315186, -1.4532625675201416, -1.3573834896087646, -1.2615044116973877, -1.1656252145767212, -1.0697461366653442, -0.9738670587539673, -0.8779879808425903, -0.7821089029312134, -0.6862297654151917, -0.5903506875038147, -0.49447160959243774, -0.398592472076416, -0.30271339416503906, -0.2068345546722412, -0.11095546185970306, -0.015076369047164917, 0.08080273866653442, 0.17668181657791138, 0.27256089448928833, 0.36844003200531006, 0.464319109916687, 0.560198187828064, 0.6560772657394409, 0.7519563436508179, 0.8478354811668396, 0.9437145590782166, 1.0395936965942383, 1.1354727745056152, 1.2313518524169922, 1.3272309303283691, 1.423110008239746, 1.518989086151123, 1.6148681640625, 1.710747241973877, 1.806626319885254, 1.9025055170059204, 1.9983845949172974, 2.0942635536193848, 2.1901426315307617, 2.2860217094421387, 2.3819007873535156, 2.4777798652648926, 2.5736589431762695, 2.6695380210876465, 2.7654170989990234, 2.8612964153289795]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 8.0, 11.0, 7.0, 16.0, 7.0, 14.0, 12.0, 28.0, 19.0, 25.0, 27.0, 28.0, 32.0, 26.0, 32.0, 35.0, 42.0, 38.0, 34.0, 36.0, 49.0, 29.0, 36.0, 43.0, 41.0, 34.0, 34.0, 31.0, 35.0, 31.0, 28.0, 22.0, 16.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.041332721710205, -1.9815632104873657, -1.921793818473816, -1.8620243072509766, -1.8022549152374268, -1.7424854040145874, -1.682715892791748, -1.6229465007781982, -1.5631769895553589, -1.5034074783325195, -1.4436380863189697, -1.3838685750961304, -1.324099063873291, -1.2643296718597412, -1.2045601606369019, -1.1447906494140625, -1.0850212574005127, -1.0252517461776733, -0.9654823541641235, -0.9057128429412842, -0.8459433913230896, -0.786173939704895, -0.7264044284820557, -0.6666349768638611, -0.6068655252456665, -0.5470960736274719, -0.48732659220695496, -0.427557110786438, -0.3677876591682434, -0.30801820755004883, -0.24824872612953186, -0.1884792447090149, -0.12870991230010986, -0.06894044578075409, -0.009170979261398315, 0.05059848725795746, 0.11036795377731323, 0.1701374053955078, 0.22990688681602478, 0.28967636823654175, 0.34944581985473633, 0.4092152714729309, 0.4689847528934479, 0.5287542343139648, 0.5885236859321594, 0.648293137550354, 0.7080626487731934, 0.7678321003913879, 0.8276015520095825, 0.8873710036277771, 0.9471404552459717, 1.006909966468811, 1.0666794776916504, 1.1264488697052002, 1.1862183809280396, 1.245987892150879, 1.3057572841644287, 1.365526795387268, 1.4252961874008179, 1.4850656986236572, 1.544835090637207, 1.6046046018600464, 1.6643741130828857, 1.7241435050964355, 1.783913016319275]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 9.0, 17.0, 17.0, 25.0, 35.0, 63.0, 113.0, 176.0, 273.0, 428.0, 660.0, 1147.0, 1776.0, 2867.0, 4608.0, 7447.0, 12084.0, 19588.0, 31849.0, 50790.0, 79422.0, 121833.0, 179768.0, 252160.0, 335220.0, 414206.0, 465715.0, 478873.0, 443079.0, 374101.0, 291771.0, 212306.0, 146118.0, 97448.0, 62956.0, 40249.0, 24850.0, 15443.0, 9426.0, 5844.0, 3558.0, 2225.0, 1409.0, 835.0, 548.0, 340.0, 230.0, 139.0, 96.0, 62.0, 30.0, 24.0, 17.0, 8.0, 2.0, 2.0, 1.0], "bins": [-2.076171875, -2.015533447265625, -1.95489501953125, -1.894256591796875, -1.8336181640625, -1.772979736328125, -1.71234130859375, -1.651702880859375, -1.591064453125, -1.530426025390625, -1.46978759765625, -1.409149169921875, -1.3485107421875, -1.287872314453125, -1.22723388671875, -1.166595458984375, -1.10595703125, -1.045318603515625, -0.98468017578125, -0.924041748046875, -0.8634033203125, -0.802764892578125, -0.74212646484375, -0.681488037109375, -0.620849609375, -0.560211181640625, -0.49957275390625, -0.438934326171875, -0.3782958984375, -0.317657470703125, -0.25701904296875, -0.196380615234375, -0.1357421875, -0.075103759765625, -0.01446533203125, 0.046173095703125, 0.1068115234375, 0.167449951171875, 0.22808837890625, 0.288726806640625, 0.349365234375, 0.410003662109375, 0.47064208984375, 0.531280517578125, 0.5919189453125, 0.652557373046875, 0.71319580078125, 0.773834228515625, 0.83447265625, 0.895111083984375, 0.95574951171875, 1.016387939453125, 1.0770263671875, 1.137664794921875, 1.19830322265625, 1.258941650390625, 1.319580078125, 1.380218505859375, 1.44085693359375, 1.501495361328125, 1.5621337890625, 1.622772216796875, 1.68341064453125, 1.744049072265625, 1.8046875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 12.0, 16.0, 17.0, 18.0, 25.0, 12.0, 25.0, 41.0, 23.0, 24.0, 31.0, 39.0, 53.0, 31.0, 47.0, 40.0, 43.0, 41.0, 45.0, 36.0, 35.0, 29.0, 41.0, 33.0, 27.0, 25.0, 21.0, 28.0, 28.0, 15.0, 10.0, 16.0, 10.0, 5.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0, -1.9428863525390625, -1.885772705078125, -1.8286590576171875, -1.77154541015625, -1.7144317626953125, -1.657318115234375, -1.6002044677734375, -1.5430908203125, -1.4859771728515625, -1.428863525390625, -1.3717498779296875, -1.31463623046875, -1.2575225830078125, -1.200408935546875, -1.1432952880859375, -1.086181640625, -1.0290679931640625, -0.971954345703125, -0.9148406982421875, -0.85772705078125, -0.8006134033203125, -0.743499755859375, -0.6863861083984375, -0.6292724609375, -0.5721588134765625, -0.515045166015625, -0.4579315185546875, -0.40081787109375, -0.3437042236328125, -0.286590576171875, -0.2294769287109375, -0.17236328125, -0.1152496337890625, -0.058135986328125, -0.0010223388671875, 0.05609130859375, 0.1132049560546875, 0.170318603515625, 0.2274322509765625, 0.2845458984375, 0.3416595458984375, 0.398773193359375, 0.4558868408203125, 0.51300048828125, 0.5701141357421875, 0.627227783203125, 0.6843414306640625, 0.741455078125, 0.7985687255859375, 0.855682373046875, 0.9127960205078125, 0.96990966796875, 1.0270233154296875, 1.084136962890625, 1.1412506103515625, 1.1983642578125, 1.2554779052734375, 1.312591552734375, 1.3697052001953125, 1.42681884765625, 1.4839324951171875, 1.541046142578125, 1.5981597900390625, 1.6552734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 6.0, 7.0, 13.0, 23.0, 25.0, 53.0, 66.0, 131.0, 243.0, 362.0, 605.0, 910.0, 1679.0, 2669.0, 4494.0, 7434.0, 12098.0, 19061.0, 31376.0, 49142.0, 75290.0, 113694.0, 164516.0, 227795.0, 299132.0, 368460.0, 422066.0, 445540.0, 434341.0, 388886.0, 322999.0, 250898.0, 183483.0, 128823.0, 86431.0, 56921.0, 36118.0, 22885.0, 13929.0, 8472.0, 5158.0, 3149.0, 1984.0, 1168.0, 644.0, 447.0, 231.0, 168.0, 106.0, 58.0, 41.0, 23.0, 18.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9755859375, -1.9066619873046875, -1.837738037109375, -1.7688140869140625, -1.69989013671875, -1.6309661865234375, -1.562042236328125, -1.4931182861328125, -1.4241943359375, -1.3552703857421875, -1.286346435546875, -1.2174224853515625, -1.14849853515625, -1.0795745849609375, -1.010650634765625, -0.9417266845703125, -0.872802734375, -0.8038787841796875, -0.734954833984375, -0.6660308837890625, -0.59710693359375, -0.5281829833984375, -0.459259033203125, -0.3903350830078125, -0.3214111328125, -0.2524871826171875, -0.183563232421875, -0.1146392822265625, -0.04571533203125, 0.0232086181640625, 0.092132568359375, 0.1610565185546875, 0.22998046875, 0.2989044189453125, 0.367828369140625, 0.4367523193359375, 0.50567626953125, 0.5746002197265625, 0.643524169921875, 0.7124481201171875, 0.7813720703125, 0.8502960205078125, 0.919219970703125, 0.9881439208984375, 1.05706787109375, 1.1259918212890625, 1.194915771484375, 1.2638397216796875, 1.332763671875, 1.4016876220703125, 1.470611572265625, 1.5395355224609375, 1.60845947265625, 1.6773834228515625, 1.746307373046875, 1.8152313232421875, 1.8841552734375, 1.9530792236328125, 2.022003173828125, 2.0909271240234375, 2.15985107421875, 2.2287750244140625, 2.297698974609375, 2.3666229248046875, 2.435546875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 3.0, 8.0, 7.0, 12.0, 17.0, 16.0, 24.0, 29.0, 37.0, 38.0, 56.0, 64.0, 80.0, 90.0, 107.0, 155.0, 161.0, 179.0, 207.0, 213.0, 211.0, 219.0, 251.0, 214.0, 212.0, 178.0, 201.0, 193.0, 167.0, 140.0, 129.0, 105.0, 65.0, 68.0, 40.0, 37.0, 38.0, 26.0, 14.0, 17.0, 10.0, 11.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.197265625, -1.16339111328125, -1.1295166015625, -1.09564208984375, -1.061767578125, -1.02789306640625, -0.9940185546875, -0.96014404296875, -0.92626953125, -0.89239501953125, -0.8585205078125, -0.82464599609375, -0.790771484375, -0.75689697265625, -0.7230224609375, -0.68914794921875, -0.6552734375, -0.62139892578125, -0.5875244140625, -0.55364990234375, -0.519775390625, -0.48590087890625, -0.4520263671875, -0.41815185546875, -0.38427734375, -0.35040283203125, -0.3165283203125, -0.28265380859375, -0.248779296875, -0.21490478515625, -0.1810302734375, -0.14715576171875, -0.11328125, -0.07940673828125, -0.0455322265625, -0.01165771484375, 0.022216796875, 0.05609130859375, 0.0899658203125, 0.12384033203125, 0.15771484375, 0.19158935546875, 0.2254638671875, 0.25933837890625, 0.293212890625, 0.32708740234375, 0.3609619140625, 0.39483642578125, 0.4287109375, 0.46258544921875, 0.4964599609375, 0.53033447265625, 0.564208984375, 0.59808349609375, 0.6319580078125, 0.66583251953125, 0.69970703125, 0.73358154296875, 0.7674560546875, 0.80133056640625, 0.835205078125, 0.86907958984375, 0.9029541015625, 0.93682861328125, 0.970703125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 12.0, 12.0, 9.0, 16.0, 18.0, 23.0, 17.0, 18.0, 34.0, 30.0, 27.0, 36.0, 52.0, 61.0, 46.0, 39.0, 48.0, 54.0, 46.0, 45.0, 55.0, 43.0, 36.0, 37.0, 35.0, 25.0, 18.0, 22.0, 18.0, 11.0, 10.0, 11.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.551114559173584, -3.4483602046966553, -3.3456058502197266, -3.242851495742798, -3.140097141265869, -3.0373425483703613, -2.9345881938934326, -2.831833839416504, -2.729079484939575, -2.6263251304626465, -2.5235707759857178, -2.420816421508789, -2.3180618286132812, -2.2153077125549316, -2.112553119659424, -2.009798765182495, -1.9070444107055664, -1.8042900562286377, -1.701535701751709, -1.5987812280654907, -1.496026873588562, -1.3932725191116333, -1.290518045425415, -1.1877636909484863, -1.0850093364715576, -0.9822549819946289, -0.8795005679130554, -0.7767461538314819, -0.6739917993545532, -0.5712374448776245, -0.468483030796051, -0.36572861671447754, -0.26297426223754883, -0.16021987795829773, -0.05746549367904663, 0.04528889060020447, 0.14804327487945557, 0.2507976293563843, 0.35355204343795776, 0.45630645751953125, 0.55906081199646, 0.6618151664733887, 0.7645695805549622, 0.8673239946365356, 0.9700783491134644, 1.072832703590393, 1.1755871772766113, 1.27834153175354, 1.3810958862304688, 1.4838502407073975, 1.5866045951843262, 1.6893590688705444, 1.7921134233474731, 1.8948677778244019, 1.9976222515106201, 2.100376605987549, 2.2031309604644775, 2.3058853149414062, 2.408639669418335, 2.5113940238952637, 2.6141486167907715, 2.716902732849121, 2.819657325744629, 2.9224116802215576, 3.0251660346984863]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 13.0, 9.0, 14.0, 18.0, 25.0, 16.0, 21.0, 27.0, 22.0, 29.0, 23.0, 33.0, 31.0, 36.0, 45.0, 43.0, 35.0, 45.0, 33.0, 56.0, 37.0, 30.0, 45.0, 37.0, 31.0, 30.0, 31.0, 18.0, 23.0, 22.0, 15.0, 17.0, 12.0, 21.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2918717861175537, -2.2207958698272705, -2.149719715118408, -2.078643798828125, -2.007567882537842, -1.936491847038269, -1.8654158115386963, -1.794339895248413, -1.7232638597488403, -1.6521878242492676, -1.5811119079589844, -1.5100358724594116, -1.4389598369598389, -1.3678839206695557, -1.296807885169983, -1.2257318496704102, -1.154655933380127, -1.0835798978805542, -1.012503981590271, -0.9414279460906982, -0.8703519701957703, -0.7992759943008423, -0.7281999588012695, -0.6571239829063416, -0.5860480070114136, -0.5149720311164856, -0.44389602541923523, -0.37282001972198486, -0.3017440438270569, -0.2306680679321289, -0.15959206223487854, -0.08851605653762817, -0.017440319061279297, 0.053635671734809875, 0.12471166253089905, 0.19578765332698822, 0.2668636441230774, 0.33793962001800537, 0.40901562571525574, 0.4800916314125061, 0.5511676073074341, 0.6222435832023621, 0.69331955909729, 0.7643955945968628, 0.8354715704917908, 0.9065475463867188, 0.9776235818862915, 1.0486996173858643, 1.1197755336761475, 1.1908515691757202, 1.2619274854660034, 1.3330035209655762, 1.4040794372558594, 1.4751554727554321, 1.5462315082550049, 1.617307424545288, 1.6883834600448608, 1.7594594955444336, 1.8305354118347168, 1.9016114473342896, 1.9726874828338623, 2.0437633991241455, 2.1148393154144287, 2.185915470123291, 2.256991386413574]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 12.0, 16.0, 18.0, 46.0, 68.0, 113.0, 166.0, 259.0, 476.0, 764.0, 1189.0, 2090.0, 3248.0, 5497.0, 9269.0, 15074.0, 25590.0, 41840.0, 68155.0, 105195.0, 150384.0, 176266.0, 152980.0, 108877.0, 70472.0, 43816.0, 26700.0, 16060.0, 9500.0, 5573.0, 3500.0, 2055.0, 1265.0, 785.0, 473.0, 300.0, 158.0, 94.0, 79.0, 42.0, 27.0, 10.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5694046020507812, -0.5494537353515625, -0.5295028686523438, -0.509552001953125, -0.48960113525390625, -0.4696502685546875, -0.44969940185546875, -0.42974853515625, -0.40979766845703125, -0.3898468017578125, -0.36989593505859375, -0.349945068359375, -0.32999420166015625, -0.3100433349609375, -0.29009246826171875, -0.2701416015625, -0.25019073486328125, -0.2302398681640625, -0.21028900146484375, -0.190338134765625, -0.17038726806640625, -0.1504364013671875, -0.13048553466796875, -0.11053466796875, -0.09058380126953125, -0.0706329345703125, -0.05068206787109375, -0.030731201171875, -0.01078033447265625, 0.0091705322265625, 0.02912139892578125, 0.049072265625, 0.06902313232421875, 0.0889739990234375, 0.10892486572265625, 0.128875732421875, 0.14882659912109375, 0.1687774658203125, 0.18872833251953125, 0.20867919921875, 0.22863006591796875, 0.2485809326171875, 0.26853179931640625, 0.288482666015625, 0.30843353271484375, 0.3283843994140625, 0.34833526611328125, 0.3682861328125, 0.38823699951171875, 0.4081878662109375, 0.42813873291015625, 0.448089599609375, 0.46804046630859375, 0.4879913330078125, 0.5079421997070312, 0.52789306640625, 0.5478439331054688, 0.5677947998046875, 0.5877456665039062, 0.607696533203125, 0.6276473999023438, 0.6475982666015625, 0.6675491333007812, 0.6875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 12.0, 21.0, 18.0, 13.0, 14.0, 31.0, 22.0, 33.0, 27.0, 31.0, 24.0, 35.0, 32.0, 38.0, 38.0, 40.0, 37.0, 41.0, 33.0, 28.0, 39.0, 25.0, 32.0, 32.0, 28.0, 27.0, 18.0, 22.0, 32.0, 23.0, 24.0, 14.0, 10.0, 12.0, 8.0, 9.0, 5.0, 8.0, 9.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.263671875, -2.193115234375, -2.12255859375, -2.052001953125, -1.9814453125, -1.910888671875, -1.84033203125, -1.769775390625, -1.69921875, -1.628662109375, -1.55810546875, -1.487548828125, -1.4169921875, -1.346435546875, -1.27587890625, -1.205322265625, -1.134765625, -1.064208984375, -0.99365234375, -0.923095703125, -0.8525390625, -0.781982421875, -0.71142578125, -0.640869140625, -0.5703125, -0.499755859375, -0.42919921875, -0.358642578125, -0.2880859375, -0.217529296875, -0.14697265625, -0.076416015625, -0.005859375, 0.064697265625, 0.13525390625, 0.205810546875, 0.2763671875, 0.346923828125, 0.41748046875, 0.488037109375, 0.55859375, 0.629150390625, 0.69970703125, 0.770263671875, 0.8408203125, 0.911376953125, 0.98193359375, 1.052490234375, 1.123046875, 1.193603515625, 1.26416015625, 1.334716796875, 1.4052734375, 1.475830078125, 1.54638671875, 1.616943359375, 1.6875, 1.758056640625, 1.82861328125, 1.899169921875, 1.9697265625, 2.040283203125, 2.11083984375, 2.181396484375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 12.0, 13.0, 22.0, 28.0, 32.0, 43.0, 98.0, 127.0, 193.0, 317.0, 504.0, 742.0, 1140.0, 1819.0, 3116.0, 4966.0, 8508.0, 14459.0, 25566.0, 46035.0, 82897.0, 142215.0, 204576.0, 198779.0, 134398.0, 77006.0, 42954.0, 23990.0, 13607.0, 7939.0, 4697.0, 2896.0, 1741.0, 1103.0, 678.0, 459.0, 293.0, 180.0, 123.0, 76.0, 63.0, 34.0, 37.0, 19.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.75146484375, -0.7286529541015625, -0.705841064453125, -0.6830291748046875, -0.66021728515625, -0.6374053955078125, -0.614593505859375, -0.5917816162109375, -0.5689697265625, -0.5461578369140625, -0.523345947265625, -0.5005340576171875, -0.47772216796875, -0.4549102783203125, -0.432098388671875, -0.4092864990234375, -0.386474609375, -0.3636627197265625, -0.340850830078125, -0.3180389404296875, -0.29522705078125, -0.2724151611328125, -0.249603271484375, -0.2267913818359375, -0.2039794921875, -0.1811676025390625, -0.158355712890625, -0.1355438232421875, -0.11273193359375, -0.0899200439453125, -0.067108154296875, -0.0442962646484375, -0.021484375, 0.0013275146484375, 0.024139404296875, 0.0469512939453125, 0.06976318359375, 0.0925750732421875, 0.115386962890625, 0.1381988525390625, 0.1610107421875, 0.1838226318359375, 0.206634521484375, 0.2294464111328125, 0.25225830078125, 0.2750701904296875, 0.297882080078125, 0.3206939697265625, 0.343505859375, 0.3663177490234375, 0.389129638671875, 0.4119415283203125, 0.43475341796875, 0.4575653076171875, 0.480377197265625, 0.5031890869140625, 0.5260009765625, 0.5488128662109375, 0.571624755859375, 0.5944366455078125, 0.61724853515625, 0.6400604248046875, 0.662872314453125, 0.6856842041015625, 0.70849609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 5.0, 10.0, 8.0, 12.0, 16.0, 22.0, 21.0, 13.0, 30.0, 25.0, 33.0, 21.0, 19.0, 26.0, 26.0, 37.0, 31.0, 33.0, 37.0, 42.0, 26.0, 36.0, 21.0, 41.0, 37.0, 40.0, 35.0, 38.0, 30.0, 32.0, 25.0, 17.0, 18.0, 20.0, 15.0, 15.0, 12.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.267578125, -1.2251129150390625, -1.182647705078125, -1.1401824951171875, -1.09771728515625, -1.0552520751953125, -1.012786865234375, -0.9703216552734375, -0.9278564453125, -0.8853912353515625, -0.842926025390625, -0.8004608154296875, -0.75799560546875, -0.7155303955078125, -0.673065185546875, -0.6305999755859375, -0.588134765625, -0.5456695556640625, -0.503204345703125, -0.4607391357421875, -0.41827392578125, -0.3758087158203125, -0.333343505859375, -0.2908782958984375, -0.2484130859375, -0.2059478759765625, -0.163482666015625, -0.1210174560546875, -0.07855224609375, -0.0360870361328125, 0.006378173828125, 0.0488433837890625, 0.09130859375, 0.1337738037109375, 0.176239013671875, 0.2187042236328125, 0.26116943359375, 0.3036346435546875, 0.346099853515625, 0.3885650634765625, 0.4310302734375, 0.4734954833984375, 0.515960693359375, 0.5584259033203125, 0.60089111328125, 0.6433563232421875, 0.685821533203125, 0.7282867431640625, 0.770751953125, 0.8132171630859375, 0.855682373046875, 0.8981475830078125, 0.94061279296875, 0.9830780029296875, 1.025543212890625, 1.0680084228515625, 1.1104736328125, 1.1529388427734375, 1.195404052734375, 1.2378692626953125, 1.28033447265625, 1.3227996826171875, 1.365264892578125, 1.4077301025390625, 1.4501953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 9.0, 14.0, 24.0, 21.0, 33.0, 46.0, 57.0, 95.0, 125.0, 195.0, 272.0, 426.0, 648.0, 985.0, 1684.0, 2921.0, 5313.0, 10752.0, 24373.0, 73210.0, 327167.0, 440721.0, 101124.0, 30718.0, 12651.0, 6329.0, 3391.0, 1953.0, 1110.0, 659.0, 499.0, 304.0, 218.0, 152.0, 96.0, 61.0, 47.0, 40.0, 28.0, 16.0, 19.0, 16.0, 5.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5685272216796875, -0.549652099609375, -0.5307769775390625, -0.51190185546875, -0.4930267333984375, -0.474151611328125, -0.4552764892578125, -0.4364013671875, -0.4175262451171875, -0.398651123046875, -0.3797760009765625, -0.36090087890625, -0.3420257568359375, -0.323150634765625, -0.3042755126953125, -0.285400390625, -0.2665252685546875, -0.247650146484375, -0.2287750244140625, -0.20989990234375, -0.1910247802734375, -0.172149658203125, -0.1532745361328125, -0.1343994140625, -0.1155242919921875, -0.096649169921875, -0.0777740478515625, -0.05889892578125, -0.0400238037109375, -0.021148681640625, -0.0022735595703125, 0.0166015625, 0.0354766845703125, 0.054351806640625, 0.0732269287109375, 0.09210205078125, 0.1109771728515625, 0.129852294921875, 0.1487274169921875, 0.1676025390625, 0.1864776611328125, 0.205352783203125, 0.2242279052734375, 0.24310302734375, 0.2619781494140625, 0.280853271484375, 0.2997283935546875, 0.318603515625, 0.3374786376953125, 0.356353759765625, 0.3752288818359375, 0.39410400390625, 0.4129791259765625, 0.431854248046875, 0.4507293701171875, 0.4696044921875, 0.4884796142578125, 0.507354736328125, 0.5262298583984375, 0.54510498046875, 0.5639801025390625, 0.582855224609375, 0.6017303466796875, 0.62060546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 20.0, 14.0, 19.0, 32.0, 34.0, 47.0, 43.0, 50.0, 54.0, 69.0, 72.0, 66.0, 67.0, 67.0, 56.0, 56.0, 41.0, 37.0, 27.0, 24.0, 18.0, 13.0, 10.0, 4.0, 8.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.7286278307437897e-05, -1.6571953892707825e-05, -1.5857629477977753e-05, -1.514330506324768e-05, -1.4428980648517609e-05, -1.3714656233787537e-05, -1.3000331819057465e-05, -1.2286007404327393e-05, -1.157168298959732e-05, -1.0857358574867249e-05, -1.0143034160137177e-05, -9.428709745407104e-06, -8.714385330677032e-06, -8.00006091594696e-06, -7.2857365012168884e-06, -6.571412086486816e-06, -5.857087671756744e-06, -5.142763257026672e-06, -4.4284388422966e-06, -3.7141144275665283e-06, -2.9997900128364563e-06, -2.2854655981063843e-06, -1.5711411833763123e-06, -8.568167686462402e-07, -1.424923539161682e-07, 5.718320608139038e-07, 1.2861564755439758e-06, 2.000480890274048e-06, 2.71480530500412e-06, 3.429129719734192e-06, 4.143454134464264e-06, 4.857778549194336e-06, 5.572102963924408e-06, 6.28642737865448e-06, 7.000751793384552e-06, 7.715076208114624e-06, 8.429400622844696e-06, 9.143725037574768e-06, 9.85804945230484e-06, 1.0572373867034912e-05, 1.1286698281764984e-05, 1.2001022696495056e-05, 1.2715347111225128e-05, 1.34296715259552e-05, 1.4143995940685272e-05, 1.4858320355415344e-05, 1.5572644770145416e-05, 1.6286969184875488e-05, 1.700129359960556e-05, 1.7715618014335632e-05, 1.8429942429065704e-05, 1.9144266843795776e-05, 1.985859125852585e-05, 2.057291567325592e-05, 2.1287240087985992e-05, 2.2001564502716064e-05, 2.2715888917446136e-05, 2.343021333217621e-05, 2.414453774690628e-05, 2.4858862161636353e-05, 2.5573186576366425e-05, 2.6287510991096497e-05, 2.700183540582657e-05, 2.771615982055664e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 18.0, 28.0, 55.0, 53.0, 79.0, 120.0, 173.0, 246.0, 332.0, 539.0, 810.0, 1210.0, 1789.0, 2973.0, 5186.0, 8758.0, 16601.0, 34334.0, 81535.0, 206398.0, 341909.0, 196609.0, 77668.0, 33355.0, 15950.0, 8483.0, 4859.0, 3007.0, 1874.0, 1177.0, 754.0, 537.0, 358.0, 219.0, 168.0, 106.0, 72.0, 57.0, 48.0, 26.0, 17.0, 12.0, 6.0, 13.0, 3.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.73046875, -0.7098770141601562, -0.6892852783203125, -0.6686935424804688, -0.648101806640625, -0.6275100708007812, -0.6069183349609375, -0.5863265991210938, -0.56573486328125, -0.5451431274414062, -0.5245513916015625, -0.5039596557617188, -0.483367919921875, -0.46277618408203125, -0.4421844482421875, -0.42159271240234375, -0.4010009765625, -0.38040924072265625, -0.3598175048828125, -0.33922576904296875, -0.318634033203125, -0.29804229736328125, -0.2774505615234375, -0.25685882568359375, -0.23626708984375, -0.21567535400390625, -0.1950836181640625, -0.17449188232421875, -0.153900146484375, -0.13330841064453125, -0.1127166748046875, -0.09212493896484375, -0.071533203125, -0.05094146728515625, -0.0303497314453125, -0.00975799560546875, 0.010833740234375, 0.03142547607421875, 0.0520172119140625, 0.07260894775390625, 0.09320068359375, 0.11379241943359375, 0.1343841552734375, 0.15497589111328125, 0.175567626953125, 0.19615936279296875, 0.2167510986328125, 0.23734283447265625, 0.2579345703125, 0.27852630615234375, 0.2991180419921875, 0.31970977783203125, 0.340301513671875, 0.36089324951171875, 0.3814849853515625, 0.40207672119140625, 0.42266845703125, 0.44326019287109375, 0.4638519287109375, 0.48444366455078125, 0.505035400390625, 0.5256271362304688, 0.5462188720703125, 0.5668106079101562, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 6.0, 10.0, 12.0, 17.0, 13.0, 17.0, 34.0, 39.0, 71.0, 65.0, 88.0, 110.0, 108.0, 99.0, 68.0, 54.0, 23.0, 25.0, 23.0, 22.0, 15.0, 15.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.14951324462890625, -0.1443634033203125, -0.13921356201171875, -0.134063720703125, -0.12891387939453125, -0.1237640380859375, -0.11861419677734375, -0.11346435546875, -0.10831451416015625, -0.1031646728515625, -0.09801483154296875, -0.092864990234375, -0.08771514892578125, -0.0825653076171875, -0.07741546630859375, -0.072265625, -0.06711578369140625, -0.0619659423828125, -0.05681610107421875, -0.051666259765625, -0.04651641845703125, -0.0413665771484375, -0.03621673583984375, -0.03106689453125, -0.02591705322265625, -0.0207672119140625, -0.01561737060546875, -0.010467529296875, -0.00531768798828125, -0.0001678466796875, 0.00498199462890625, 0.0101318359375, 0.01528167724609375, 0.0204315185546875, 0.02558135986328125, 0.030731201171875, 0.03588104248046875, 0.0410308837890625, 0.04618072509765625, 0.05133056640625, 0.05648040771484375, 0.0616302490234375, 0.06678009033203125, 0.071929931640625, 0.07707977294921875, 0.0822296142578125, 0.08737945556640625, 0.092529296875, 0.09767913818359375, 0.1028289794921875, 0.10797882080078125, 0.113128662109375, 0.11827850341796875, 0.1234283447265625, 0.12857818603515625, 0.13372802734375, 0.13887786865234375, 0.1440277099609375, 0.14917755126953125, 0.154327392578125, 0.15947723388671875, 0.1646270751953125, 0.16977691650390625, 0.1749267578125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 6.0, 4.0, 8.0, 11.0, 15.0, 17.0, 20.0, 17.0, 14.0, 30.0, 26.0, 34.0, 31.0, 35.0, 52.0, 56.0, 44.0, 46.0, 52.0, 46.0, 49.0, 51.0, 46.0, 45.0, 38.0, 36.0, 33.0, 16.0, 31.0, 16.0, 16.0, 11.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.535590648651123, -3.4327683448791504, -3.3299460411071777, -3.227123737335205, -3.1243014335632324, -3.0214791297912598, -2.918656826019287, -2.8158345222473145, -2.713012218475342, -2.610189914703369, -2.5073676109313965, -2.404545307159424, -2.301723003387451, -2.1989006996154785, -2.096078395843506, -1.9932562112808228, -1.8904340267181396, -1.787611722946167, -1.6847894191741943, -1.5819671154022217, -1.479144811630249, -1.3763225078582764, -1.2735003232955933, -1.1706780195236206, -1.067855715751648, -0.9650334119796753, -0.8622111082077026, -0.7593888640403748, -0.6565665602684021, -0.5537442564964294, -0.45092201232910156, -0.3480997085571289, -0.24527764320373535, -0.1424553543329239, -0.03963306546211243, 0.06318920850753784, 0.1660115122795105, 0.26883381605148315, 0.37165606021881104, 0.4744783639907837, 0.5773006677627563, 0.680122971534729, 0.7829452753067017, 0.8857675194740295, 0.9885898232460022, 1.09141206741333, 1.1942343711853027, 1.2970566749572754, 1.399878978729248, 1.5027012825012207, 1.6055235862731934, 1.708345890045166, 1.8111681938171387, 1.9139904975891113, 2.016812801361084, 2.1196351051330566, 2.2224574089050293, 2.325279712677002, 2.4281020164489746, 2.5309243202209473, 2.63374662399292, 2.7365689277648926, 2.8393912315368652, 2.942213535308838, 3.0450356006622314]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 14.0, 13.0, 20.0, 21.0, 17.0, 21.0, 27.0, 16.0, 35.0, 21.0, 36.0, 26.0, 38.0, 46.0, 46.0, 31.0, 47.0, 35.0, 48.0, 41.0, 34.0, 39.0, 42.0, 32.0, 27.0, 26.0, 24.0, 20.0, 23.0, 13.0, 20.0, 10.0, 17.0, 12.0, 8.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2628321647644043, -2.1919450759887695, -2.1210579872131348, -2.0501708984375, -1.9792838096618652, -1.9083967208862305, -1.8375095129013062, -1.7666224241256714, -1.6957353353500366, -1.6248482465744019, -1.553961157798767, -1.4830740690231323, -1.412186861038208, -1.3412997722625732, -1.2704126834869385, -1.1995255947113037, -1.128638505935669, -1.0577514171600342, -0.9868643283843994, -0.9159771800041199, -0.8450900912284851, -0.7742030024528503, -0.7033158540725708, -0.632428765296936, -0.5615416765213013, -0.4906545877456665, -0.41976746916770935, -0.3488803505897522, -0.27799326181411743, -0.20710617303848267, -0.1362190544605255, -0.06533193588256836, 0.005554914474487305, 0.07644201815128326, 0.14732912182807922, 0.21821622550487518, 0.28910332918167114, 0.3599904179573059, 0.43087753653526306, 0.5017646551132202, 0.572651743888855, 0.6435388326644897, 0.7144259214401245, 0.785313069820404, 0.8562001585960388, 0.9270872473716736, 0.9979743957519531, 1.068861484527588, 1.1397485733032227, 1.2106356620788574, 1.2815227508544922, 1.352409839630127, 1.4232969284057617, 1.4941840171813965, 1.5650712251663208, 1.6359583139419556, 1.7068454027175903, 1.777732491493225, 1.8486195802688599, 1.9195066690444946, 1.990393877029419, 2.0612809658050537, 2.1321680545806885, 2.2030551433563232, 2.273942232131958]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 9.0, 5.0, 24.0, 28.0, 58.0, 67.0, 137.0, 199.0, 332.0, 472.0, 767.0, 1159.0, 1739.0, 2823.0, 4318.0, 6322.0, 9443.0, 13741.0, 19412.0, 27325.0, 36716.0, 47635.0, 59910.0, 71428.0, 81431.0, 89062.0, 91416.0, 89418.0, 82300.0, 72935.0, 60789.0, 48772.0, 37208.0, 28021.0, 19952.0, 14287.0, 9767.0, 6516.0, 4361.0, 2902.0, 1954.0, 1210.0, 819.0, 497.0, 319.0, 208.0, 138.0, 73.0, 47.0, 36.0, 17.0, 13.0, 9.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1797943115234375, -1.139862060546875, -1.0999298095703125, -1.05999755859375, -1.0200653076171875, -0.980133056640625, -0.9402008056640625, -0.9002685546875, -0.8603363037109375, -0.820404052734375, -0.7804718017578125, -0.74053955078125, -0.7006072998046875, -0.660675048828125, -0.6207427978515625, -0.580810546875, -0.5408782958984375, -0.500946044921875, -0.4610137939453125, -0.42108154296875, -0.3811492919921875, -0.341217041015625, -0.3012847900390625, -0.2613525390625, -0.2214202880859375, -0.181488037109375, -0.1415557861328125, -0.10162353515625, -0.0616912841796875, -0.021759033203125, 0.0181732177734375, 0.05810546875, 0.0980377197265625, 0.137969970703125, 0.1779022216796875, 0.21783447265625, 0.2577667236328125, 0.297698974609375, 0.3376312255859375, 0.3775634765625, 0.4174957275390625, 0.457427978515625, 0.4973602294921875, 0.53729248046875, 0.5772247314453125, 0.617156982421875, 0.6570892333984375, 0.697021484375, 0.7369537353515625, 0.776885986328125, 0.8168182373046875, 0.85675048828125, 0.8966827392578125, 0.936614990234375, 0.9765472412109375, 1.0164794921875, 1.0564117431640625, 1.096343994140625, 1.1362762451171875, 1.17620849609375, 1.2161407470703125, 1.256072998046875, 1.2960052490234375, 1.3359375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 13.0, 11.0, 10.0, 21.0, 14.0, 13.0, 15.0, 21.0, 26.0, 29.0, 33.0, 35.0, 43.0, 31.0, 41.0, 30.0, 38.0, 45.0, 37.0, 45.0, 38.0, 40.0, 45.0, 39.0, 36.0, 24.0, 30.0, 29.0, 15.0, 24.0, 23.0, 13.0, 15.0, 11.0, 13.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.541015625, -2.4637451171875, -2.386474609375, -2.3092041015625, -2.23193359375, -2.1546630859375, -2.077392578125, -2.0001220703125, -1.9228515625, -1.8455810546875, -1.768310546875, -1.6910400390625, -1.61376953125, -1.5364990234375, -1.459228515625, -1.3819580078125, -1.3046875, -1.2274169921875, -1.150146484375, -1.0728759765625, -0.99560546875, -0.9183349609375, -0.841064453125, -0.7637939453125, -0.6865234375, -0.6092529296875, -0.531982421875, -0.4547119140625, -0.37744140625, -0.3001708984375, -0.222900390625, -0.1456298828125, -0.068359375, 0.0089111328125, 0.086181640625, 0.1634521484375, 0.24072265625, 0.3179931640625, 0.395263671875, 0.4725341796875, 0.5498046875, 0.6270751953125, 0.704345703125, 0.7816162109375, 0.85888671875, 0.9361572265625, 1.013427734375, 1.0906982421875, 1.16796875, 1.2452392578125, 1.322509765625, 1.3997802734375, 1.47705078125, 1.5543212890625, 1.631591796875, 1.7088623046875, 1.7861328125, 1.8634033203125, 1.940673828125, 2.0179443359375, 2.09521484375, 2.1724853515625, 2.249755859375, 2.3270263671875, 2.404296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 8.0, 9.0, 23.0, 24.0, 46.0, 82.0, 127.0, 164.0, 326.0, 501.0, 723.0, 1202.0, 1879.0, 2946.0, 4518.0, 6836.0, 10184.0, 15255.0, 21617.0, 29999.0, 41417.0, 53773.0, 66959.0, 79651.0, 89229.0, 95397.0, 94963.0, 89799.0, 79778.0, 67221.0, 54069.0, 41362.0, 30831.0, 22153.0, 15329.0, 10471.0, 6819.0, 4752.0, 2926.0, 1920.0, 1243.0, 717.0, 512.0, 298.0, 200.0, 114.0, 66.0, 49.0, 37.0, 12.0, 14.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-1.4267578125, -1.383544921875, -1.34033203125, -1.297119140625, -1.25390625, -1.210693359375, -1.16748046875, -1.124267578125, -1.0810546875, -1.037841796875, -0.99462890625, -0.951416015625, -0.908203125, -0.864990234375, -0.82177734375, -0.778564453125, -0.7353515625, -0.692138671875, -0.64892578125, -0.605712890625, -0.5625, -0.519287109375, -0.47607421875, -0.432861328125, -0.3896484375, -0.346435546875, -0.30322265625, -0.260009765625, -0.216796875, -0.173583984375, -0.13037109375, -0.087158203125, -0.0439453125, -0.000732421875, 0.04248046875, 0.085693359375, 0.12890625, 0.172119140625, 0.21533203125, 0.258544921875, 0.3017578125, 0.344970703125, 0.38818359375, 0.431396484375, 0.474609375, 0.517822265625, 0.56103515625, 0.604248046875, 0.6474609375, 0.690673828125, 0.73388671875, 0.777099609375, 0.8203125, 0.863525390625, 0.90673828125, 0.949951171875, 0.9931640625, 1.036376953125, 1.07958984375, 1.122802734375, 1.166015625, 1.209228515625, 1.25244140625, 1.295654296875, 1.3388671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 4.0, 16.0, 16.0, 24.0, 31.0, 23.0, 21.0, 35.0, 23.0, 31.0, 36.0, 24.0, 30.0, 45.0, 36.0, 36.0, 43.0, 41.0, 42.0, 40.0, 42.0, 38.0, 46.0, 30.0, 25.0, 30.0, 22.0, 17.0, 20.0, 19.0, 14.0, 17.0, 10.0, 15.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.6552734375, -1.6083831787109375, -1.561492919921875, -1.5146026611328125, -1.46771240234375, -1.4208221435546875, -1.373931884765625, -1.3270416259765625, -1.2801513671875, -1.2332611083984375, -1.186370849609375, -1.1394805908203125, -1.09259033203125, -1.0457000732421875, -0.998809814453125, -0.9519195556640625, -0.905029296875, -0.8581390380859375, -0.811248779296875, -0.7643585205078125, -0.71746826171875, -0.6705780029296875, -0.623687744140625, -0.5767974853515625, -0.5299072265625, -0.4830169677734375, -0.436126708984375, -0.3892364501953125, -0.34234619140625, -0.2954559326171875, -0.248565673828125, -0.2016754150390625, -0.15478515625, -0.1078948974609375, -0.061004638671875, -0.0141143798828125, 0.03277587890625, 0.0796661376953125, 0.126556396484375, 0.1734466552734375, 0.2203369140625, 0.2672271728515625, 0.314117431640625, 0.3610076904296875, 0.40789794921875, 0.4547882080078125, 0.501678466796875, 0.5485687255859375, 0.595458984375, 0.6423492431640625, 0.689239501953125, 0.7361297607421875, 0.78302001953125, 0.8299102783203125, 0.876800537109375, 0.9236907958984375, 0.9705810546875, 1.0174713134765625, 1.064361572265625, 1.1112518310546875, 1.15814208984375, 1.2050323486328125, 1.251922607421875, 1.2988128662109375, 1.345703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 16.0, 18.0, 35.0, 56.0, 67.0, 136.0, 195.0, 277.0, 441.0, 752.0, 1171.0, 1809.0, 3073.0, 4911.0, 7819.0, 12768.0, 20684.0, 31294.0, 46198.0, 65024.0, 85707.0, 104289.0, 116774.0, 117972.0, 109350.0, 92306.0, 72120.0, 53091.0, 36384.0, 23633.0, 15138.0, 9616.0, 5870.0, 3600.0, 2229.0, 1348.0, 852.0, 524.0, 344.0, 220.0, 153.0, 95.0, 65.0, 45.0, 24.0, 18.0, 13.0, 9.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.76220703125, -0.7392349243164062, -0.7162628173828125, -0.6932907104492188, -0.670318603515625, -0.6473464965820312, -0.6243743896484375, -0.6014022827148438, -0.57843017578125, -0.5554580688476562, -0.5324859619140625, -0.5095138549804688, -0.486541748046875, -0.46356964111328125, -0.4405975341796875, -0.41762542724609375, -0.3946533203125, -0.37168121337890625, -0.3487091064453125, -0.32573699951171875, -0.302764892578125, -0.27979278564453125, -0.2568206787109375, -0.23384857177734375, -0.21087646484375, -0.18790435791015625, -0.1649322509765625, -0.14196014404296875, -0.118988037109375, -0.09601593017578125, -0.0730438232421875, -0.05007171630859375, -0.027099609375, -0.00412750244140625, 0.0188446044921875, 0.04181671142578125, 0.064788818359375, 0.08776092529296875, 0.1107330322265625, 0.13370513916015625, 0.15667724609375, 0.17964935302734375, 0.2026214599609375, 0.22559356689453125, 0.248565673828125, 0.27153778076171875, 0.2945098876953125, 0.31748199462890625, 0.3404541015625, 0.36342620849609375, 0.3863983154296875, 0.40937042236328125, 0.432342529296875, 0.45531463623046875, 0.4782867431640625, 0.5012588500976562, 0.52423095703125, 0.5472030639648438, 0.5701751708984375, 0.5931472778320312, 0.616119384765625, 0.6390914916992188, 0.6620635986328125, 0.6850357055664062, 0.7080078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 10.0, 14.0, 12.0, 15.0, 14.0, 19.0, 23.0, 19.0, 27.0, 31.0, 31.0, 47.0, 36.0, 35.0, 40.0, 39.0, 47.0, 57.0, 54.0, 39.0, 42.0, 50.0, 49.0, 30.0, 29.0, 29.0, 24.0, 22.0, 19.0, 18.0, 16.0, 8.0, 13.0, 5.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.502920925617218e-05, -7.22743570804596e-05, -6.951950490474701e-05, -6.676465272903442e-05, -6.400980055332184e-05, -6.125494837760925e-05, -5.850009620189667e-05, -5.574524402618408e-05, -5.2990391850471497e-05, -5.023553967475891e-05, -4.7480687499046326e-05, -4.472583532333374e-05, -4.1970983147621155e-05, -3.921613097190857e-05, -3.6461278796195984e-05, -3.37064266204834e-05, -3.095157444477081e-05, -2.8196722269058228e-05, -2.5441870093345642e-05, -2.2687017917633057e-05, -1.993216574192047e-05, -1.7177313566207886e-05, -1.44224613904953e-05, -1.1667609214782715e-05, -8.91275703907013e-06, -6.157904863357544e-06, -3.4030526876449585e-06, -6.48200511932373e-07, 2.1066516637802124e-06, 4.861503839492798e-06, 7.616356015205383e-06, 1.0371208190917969e-05, 1.3126060366630554e-05, 1.588091254234314e-05, 1.8635764718055725e-05, 2.139061689376831e-05, 2.4145469069480896e-05, 2.690032124519348e-05, 2.9655173420906067e-05, 3.241002559661865e-05, 3.516487777233124e-05, 3.791972994804382e-05, 4.067458212375641e-05, 4.3429434299468994e-05, 4.618428647518158e-05, 4.8939138650894165e-05, 5.169399082660675e-05, 5.4448843002319336e-05, 5.720369517803192e-05, 5.995854735374451e-05, 6.271339952945709e-05, 6.546825170516968e-05, 6.822310388088226e-05, 7.097795605659485e-05, 7.373280823230743e-05, 7.648766040802002e-05, 7.92425125837326e-05, 8.199736475944519e-05, 8.475221693515778e-05, 8.750706911087036e-05, 9.026192128658295e-05, 9.301677346229553e-05, 9.577162563800812e-05, 9.85264778137207e-05]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 21.0, 30.0, 37.0, 61.0, 100.0, 138.0, 212.0, 378.0, 548.0, 957.0, 1466.0, 2512.0, 4045.0, 7152.0, 12209.0, 21844.0, 36953.0, 59736.0, 89391.0, 119891.0, 142460.0, 145242.0, 129061.0, 99974.0, 68303.0, 43575.0, 26191.0, 15054.0, 8518.0, 4930.0, 2922.0, 1726.0, 1023.0, 686.0, 409.0, 280.0, 151.0, 139.0, 85.0, 39.0, 30.0, 22.0, 17.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9258499145507812, -0.8951568603515625, -0.8644638061523438, -0.833770751953125, -0.8030776977539062, -0.7723846435546875, -0.7416915893554688, -0.71099853515625, -0.6803054809570312, -0.6496124267578125, -0.6189193725585938, -0.588226318359375, -0.5575332641601562, -0.5268402099609375, -0.49614715576171875, -0.4654541015625, -0.43476104736328125, -0.4040679931640625, -0.37337493896484375, -0.342681884765625, -0.31198883056640625, -0.2812957763671875, -0.25060272216796875, -0.21990966796875, -0.18921661376953125, -0.1585235595703125, -0.12783050537109375, -0.097137451171875, -0.06644439697265625, -0.0357513427734375, -0.00505828857421875, 0.025634765625, 0.05632781982421875, 0.0870208740234375, 0.11771392822265625, 0.148406982421875, 0.17910003662109375, 0.2097930908203125, 0.24048614501953125, 0.27117919921875, 0.30187225341796875, 0.3325653076171875, 0.36325836181640625, 0.393951416015625, 0.42464447021484375, 0.4553375244140625, 0.48603057861328125, 0.5167236328125, 0.5474166870117188, 0.5781097412109375, 0.6088027954101562, 0.639495849609375, 0.6701889038085938, 0.7008819580078125, 0.7315750122070312, 0.76226806640625, 0.7929611206054688, 0.8236541748046875, 0.8543472290039062, 0.885040283203125, 0.9157333374023438, 0.9464263916015625, 0.9771194458007812, 1.0078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 9.0, 5.0, 11.0, 6.0, 15.0, 14.0, 13.0, 24.0, 20.0, 33.0, 21.0, 31.0, 47.0, 48.0, 45.0, 39.0, 50.0, 38.0, 40.0, 41.0, 56.0, 27.0, 27.0, 41.0, 29.0, 32.0, 30.0, 23.0, 30.0, 19.0, 23.0, 13.0, 14.0, 10.0, 14.0, 3.0, 12.0, 10.0, 2.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2605476379394531, -0.25205230712890625, -0.24355697631835938, -0.2350616455078125, -0.22656631469726562, -0.21807098388671875, -0.20957565307617188, -0.201080322265625, -0.19258499145507812, -0.18408966064453125, -0.17559432983398438, -0.1670989990234375, -0.15860366821289062, -0.15010833740234375, -0.14161300659179688, -0.13311767578125, -0.12462234497070312, -0.11612701416015625, -0.10763168334960938, -0.0991363525390625, -0.09064102172851562, -0.08214569091796875, -0.07365036010742188, -0.065155029296875, -0.056659698486328125, -0.04816436767578125, -0.039669036865234375, -0.0311737060546875, -0.022678375244140625, -0.01418304443359375, -0.005687713623046875, 0.0028076171875, 0.011302947998046875, 0.01979827880859375, 0.028293609619140625, 0.0367889404296875, 0.045284271240234375, 0.05377960205078125, 0.062274932861328125, 0.070770263671875, 0.07926559448242188, 0.08776092529296875, 0.09625625610351562, 0.1047515869140625, 0.11324691772460938, 0.12174224853515625, 0.13023757934570312, 0.13873291015625, 0.14722824096679688, 0.15572357177734375, 0.16421890258789062, 0.1727142333984375, 0.18120956420898438, 0.18970489501953125, 0.19820022583007812, 0.206695556640625, 0.21519088745117188, 0.22368621826171875, 0.23218154907226562, 0.2406768798828125, 0.24917221069335938, 0.25766754150390625, 0.2661628723144531, 0.274658203125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 9.0, 9.0, 9.0, 10.0, 11.0, 14.0, 18.0, 20.0, 23.0, 29.0, 27.0, 40.0, 44.0, 37.0, 40.0, 45.0, 58.0, 58.0, 43.0, 41.0, 37.0, 58.0, 36.0, 41.0, 35.0, 38.0, 29.0, 30.0, 19.0, 20.0, 8.0, 11.0, 10.0, 5.0, 9.0, 6.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.380751848220825, -3.2809531688690186, -3.181154727935791, -3.0813560485839844, -2.981557607650757, -2.88175892829895, -2.7819604873657227, -2.682161808013916, -2.5823631286621094, -2.4825644493103027, -2.382766008377075, -2.2829673290252686, -2.183168888092041, -2.0833702087402344, -1.9835716485977173, -1.8837730884552002, -1.7839746475219727, -1.6841760873794556, -1.5843775272369385, -1.4845788478851318, -1.3847804069519043, -1.2849817276000977, -1.1851831674575806, -1.0853846073150635, -0.9855860471725464, -0.8857874870300293, -0.7859889268875122, -0.6861903071403503, -0.5863917469978333, -0.48659318685531616, -0.3867945671081543, -0.2869960069656372, -0.18719744682312012, -0.08739887177944183, 0.01239970326423645, 0.11219829320907593, 0.21199685335159302, 0.3117954134941101, 0.411594033241272, 0.5113925933837891, 0.6111911535263062, 0.7109897136688232, 0.8107882738113403, 0.9105868935585022, 1.010385513305664, 1.1101839542388916, 1.2099826335906982, 1.3097811937332153, 1.4095797538757324, 1.5093783140182495, 1.6091768741607666, 1.7089755535125732, 1.8087739944458008, 1.9085726737976074, 2.008371353149414, 2.1081697940826416, 2.207968235015869, 2.307766914367676, 2.4075653553009033, 2.50736403465271, 2.6071624755859375, 2.706961154937744, 2.806759834289551, 2.9065582752227783, 3.006356954574585]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 14.0, 9.0, 15.0, 18.0, 31.0, 28.0, 22.0, 22.0, 38.0, 47.0, 47.0, 39.0, 44.0, 48.0, 46.0, 47.0, 44.0, 50.0, 53.0, 43.0, 31.0, 37.0, 26.0, 35.0, 28.0, 23.0, 22.0, 13.0, 11.0, 12.0, 8.0, 12.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2223832607269287, -3.131322145462036, -3.0402612686157227, -2.94920015335083, -2.8581392765045166, -2.767078161239624, -2.6760172843933105, -2.584956169128418, -2.4938952922821045, -2.402834177017212, -2.3117733001708984, -2.220712184906006, -2.1296513080596924, -2.0385901927948, -1.9475293159484863, -1.8564682006835938, -1.7654072046279907, -1.6743462085723877, -1.5832852125167847, -1.4922242164611816, -1.4011632204055786, -1.3101022243499756, -1.219041109085083, -1.1279802322387695, -1.036919116973877, -0.9458581209182739, -0.8547971248626709, -0.7637361288070679, -0.6726751327514648, -0.5816141366958618, -0.490553081035614, -0.399492084980011, -0.30843114852905273, -0.2173701524734497, -0.12630914151668549, -0.035248130559921265, 0.05581286549568176, 0.1468738615512848, 0.2379348874092102, 0.32899588346481323, 0.42005687952041626, 0.5111178755760193, 0.6021788716316223, 0.6932399272918701, 0.7843009233474731, 0.8753619194030762, 0.9664229154586792, 1.0574839115142822, 1.1485449075698853, 1.2396059036254883, 1.3306668996810913, 1.4217278957366943, 1.5127888917922974, 1.6038498878479004, 1.694911003112793, 1.7859718799591064, 1.877032995223999, 1.968093991279602, 2.059154987335205, 2.1502161026000977, 2.241276979446411, 2.3323380947113037, 2.423398971557617, 2.5144600868225098, 2.6055209636688232]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 18.0, 30.0, 33.0, 53.0, 96.0, 139.0, 209.0, 383.0, 551.0, 872.0, 1520.0, 2234.0, 3653.0, 5774.0, 9396.0, 14681.0, 23514.0, 37424.0, 58179.0, 89889.0, 135010.0, 196010.0, 273121.0, 357394.0, 433796.0, 477430.0, 476084.0, 427041.0, 348518.0, 263653.0, 188259.0, 129091.0, 86045.0, 56027.0, 35856.0, 23139.0, 14330.0, 9097.0, 5802.0, 3781.0, 2313.0, 1376.0, 912.0, 588.0, 392.0, 203.0, 140.0, 85.0, 56.0, 37.0, 23.0, 10.0, 10.0, 4.0, 0.0, 1.0], "bins": [-2.603515625, -2.526824951171875, -2.45013427734375, -2.373443603515625, -2.2967529296875, -2.220062255859375, -2.14337158203125, -2.066680908203125, -1.989990234375, -1.913299560546875, -1.83660888671875, -1.759918212890625, -1.6832275390625, -1.606536865234375, -1.52984619140625, -1.453155517578125, -1.37646484375, -1.299774169921875, -1.22308349609375, -1.146392822265625, -1.0697021484375, -0.993011474609375, -0.91632080078125, -0.839630126953125, -0.762939453125, -0.686248779296875, -0.60955810546875, -0.532867431640625, -0.4561767578125, -0.379486083984375, -0.30279541015625, -0.226104736328125, -0.1494140625, -0.072723388671875, 0.00396728515625, 0.080657958984375, 0.1573486328125, 0.234039306640625, 0.31072998046875, 0.387420654296875, 0.464111328125, 0.540802001953125, 0.61749267578125, 0.694183349609375, 0.7708740234375, 0.847564697265625, 0.92425537109375, 1.000946044921875, 1.07763671875, 1.154327392578125, 1.23101806640625, 1.307708740234375, 1.3843994140625, 1.461090087890625, 1.53778076171875, 1.614471435546875, 1.691162109375, 1.767852783203125, 1.84454345703125, 1.921234130859375, 1.9979248046875, 2.074615478515625, 2.15130615234375, 2.227996826171875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 20.0, 21.0, 21.0, 28.0, 31.0, 21.0, 38.0, 36.0, 35.0, 28.0, 43.0, 44.0, 42.0, 36.0, 41.0, 36.0, 35.0, 40.0, 39.0, 43.0, 34.0, 27.0, 29.0, 27.0, 21.0, 15.0, 16.0, 20.0, 13.0, 8.0, 12.0, 9.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.51953125, -2.44488525390625, -2.3702392578125, -2.29559326171875, -2.220947265625, -2.14630126953125, -2.0716552734375, -1.99700927734375, -1.92236328125, -1.84771728515625, -1.7730712890625, -1.69842529296875, -1.623779296875, -1.54913330078125, -1.4744873046875, -1.39984130859375, -1.3251953125, -1.25054931640625, -1.1759033203125, -1.10125732421875, -1.026611328125, -0.95196533203125, -0.8773193359375, -0.80267333984375, -0.72802734375, -0.65338134765625, -0.5787353515625, -0.50408935546875, -0.429443359375, -0.35479736328125, -0.2801513671875, -0.20550537109375, -0.130859375, -0.05621337890625, 0.0184326171875, 0.09307861328125, 0.167724609375, 0.24237060546875, 0.3170166015625, 0.39166259765625, 0.46630859375, 0.54095458984375, 0.6156005859375, 0.69024658203125, 0.764892578125, 0.83953857421875, 0.9141845703125, 0.98883056640625, 1.0634765625, 1.13812255859375, 1.2127685546875, 1.28741455078125, 1.362060546875, 1.43670654296875, 1.5113525390625, 1.58599853515625, 1.66064453125, 1.73529052734375, 1.8099365234375, 1.88458251953125, 1.959228515625, 2.03387451171875, 2.1085205078125, 2.18316650390625, 2.2578125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 17.0, 30.0, 37.0, 60.0, 150.0, 199.0, 343.0, 516.0, 971.0, 1584.0, 2661.0, 4390.0, 7488.0, 12211.0, 20286.0, 33354.0, 52782.0, 83153.0, 126253.0, 185615.0, 256432.0, 337553.0, 411129.0, 460870.0, 470288.0, 436930.0, 369702.0, 290521.0, 213802.0, 148934.0, 98340.0, 64092.0, 40372.0, 25074.0, 15222.0, 9164.0, 5486.0, 3356.0, 1996.0, 1157.0, 684.0, 459.0, 232.0, 145.0, 95.0, 57.0, 30.0, 19.0, 7.0, 10.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.923828125, -2.83013916015625, -2.7364501953125, -2.64276123046875, -2.549072265625, -2.45538330078125, -2.3616943359375, -2.26800537109375, -2.17431640625, -2.08062744140625, -1.9869384765625, -1.89324951171875, -1.799560546875, -1.70587158203125, -1.6121826171875, -1.51849365234375, -1.4248046875, -1.33111572265625, -1.2374267578125, -1.14373779296875, -1.050048828125, -0.95635986328125, -0.8626708984375, -0.76898193359375, -0.67529296875, -0.58160400390625, -0.4879150390625, -0.39422607421875, -0.300537109375, -0.20684814453125, -0.1131591796875, -0.01947021484375, 0.07421875, 0.16790771484375, 0.2615966796875, 0.35528564453125, 0.448974609375, 0.54266357421875, 0.6363525390625, 0.73004150390625, 0.82373046875, 0.91741943359375, 1.0111083984375, 1.10479736328125, 1.198486328125, 1.29217529296875, 1.3858642578125, 1.47955322265625, 1.5732421875, 1.66693115234375, 1.7606201171875, 1.85430908203125, 1.947998046875, 2.04168701171875, 2.1353759765625, 2.22906494140625, 2.32275390625, 2.41644287109375, 2.5101318359375, 2.60382080078125, 2.697509765625, 2.79119873046875, 2.8848876953125, 2.97857666015625, 3.072265625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 11.0, 10.0, 21.0, 25.0, 37.0, 37.0, 46.0, 67.0, 77.0, 105.0, 140.0, 169.0, 193.0, 221.0, 237.0, 236.0, 261.0, 271.0, 256.0, 265.0, 249.0, 212.0, 187.0, 153.0, 144.0, 109.0, 77.0, 70.0, 56.0, 37.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.857818603515625, -1.80548095703125, -1.753143310546875, -1.7008056640625, -1.648468017578125, -1.59613037109375, -1.543792724609375, -1.491455078125, -1.439117431640625, -1.38677978515625, -1.334442138671875, -1.2821044921875, -1.229766845703125, -1.17742919921875, -1.125091552734375, -1.07275390625, -1.020416259765625, -0.96807861328125, -0.915740966796875, -0.8634033203125, -0.811065673828125, -0.75872802734375, -0.706390380859375, -0.654052734375, -0.601715087890625, -0.54937744140625, -0.497039794921875, -0.4447021484375, -0.392364501953125, -0.34002685546875, -0.287689208984375, -0.2353515625, -0.183013916015625, -0.13067626953125, -0.078338623046875, -0.0260009765625, 0.026336669921875, 0.07867431640625, 0.131011962890625, 0.183349609375, 0.235687255859375, 0.28802490234375, 0.340362548828125, 0.3927001953125, 0.445037841796875, 0.49737548828125, 0.549713134765625, 0.60205078125, 0.654388427734375, 0.70672607421875, 0.759063720703125, 0.8114013671875, 0.863739013671875, 0.91607666015625, 0.968414306640625, 1.020751953125, 1.073089599609375, 1.12542724609375, 1.177764892578125, 1.2301025390625, 1.282440185546875, 1.33477783203125, 1.387115478515625, 1.439453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 0.0, 4.0, 7.0, 11.0, 13.0, 9.0, 26.0, 19.0, 23.0, 32.0, 36.0, 46.0, 33.0, 49.0, 54.0, 52.0, 53.0, 45.0, 43.0, 52.0, 35.0, 39.0, 44.0, 41.0, 38.0, 30.0, 21.0, 29.0, 27.0, 13.0, 17.0, 11.0, 14.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.072996139526367, -3.9328458309173584, -3.7926955223083496, -3.6525449752807617, -3.512394666671753, -3.372244358062744, -3.2320938110351562, -3.0919435024261475, -2.9517931938171387, -2.81164288520813, -2.671492576599121, -2.531342029571533, -2.3911917209625244, -2.2510414123535156, -2.1108908653259277, -1.970740556716919, -1.8305902481079102, -1.6904399394989014, -1.550289511680603, -1.4101390838623047, -1.269988775253296, -1.129838466644287, -0.9896880388259888, -0.8495376706123352, -0.7093873023986816, -0.5692369341850281, -0.4290865659713745, -0.28893619775772095, -0.14878582954406738, -0.008635461330413818, 0.13151490688323975, 0.2716652750968933, 0.4118156433105469, 0.5519660115242004, 0.692116379737854, 0.8322667479515076, 0.9724171161651611, 1.11256742477417, 1.2527178525924683, 1.3928682804107666, 1.5330185890197754, 1.6731688976287842, 1.8133193254470825, 1.9534697532653809, 2.0936200618743896, 2.2337703704833984, 2.3739209175109863, 2.514071226119995, 2.654221534729004, 2.7943718433380127, 2.9345221519470215, 3.0746726989746094, 3.214823007583618, 3.354973316192627, 3.495123863220215, 3.6352741718292236, 3.7754244804382324, 3.915574789047241, 4.05572509765625, 4.195875644683838, 4.336026191711426, 4.4761762619018555, 4.616326808929443, 4.756476879119873, 4.896627426147461]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 8.0, 6.0, 10.0, 7.0, 17.0, 19.0, 21.0, 27.0, 21.0, 23.0, 25.0, 35.0, 27.0, 33.0, 43.0, 38.0, 49.0, 49.0, 43.0, 33.0, 44.0, 41.0, 27.0, 42.0, 35.0, 33.0, 37.0, 23.0, 22.0, 23.0, 18.0, 16.0, 15.0, 16.0, 12.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5045316219329834, -3.404284715652466, -3.3040378093719482, -3.2037906646728516, -3.103543758392334, -3.0032968521118164, -2.903049945831299, -2.8028030395507812, -2.7025561332702637, -2.602309226989746, -2.5020623207092285, -2.401815414428711, -2.3015682697296143, -2.2013213634490967, -2.101074457168579, -2.0008275508880615, -1.9005804061889648, -1.8003334999084473, -1.7000864744186401, -1.5998395681381226, -1.4995925426483154, -1.3993456363677979, -1.2990987300872803, -1.1988518238067627, -1.0986047983169556, -0.9983578324317932, -0.8981108665466309, -0.7978639602661133, -0.6976169943809509, -0.5973700284957886, -0.497123122215271, -0.39687615633010864, -0.2966291904449463, -0.19638223946094513, -0.09613528847694397, 0.004111647605895996, 0.10435861349105835, 0.2046055793762207, 0.3048524856567383, 0.40509945154190063, 0.505346417427063, 0.6055933833122253, 0.7058403491973877, 0.8060872554779053, 0.9063342213630676, 1.00658118724823, 1.1068280935287476, 1.2070751190185547, 1.3073220252990723, 1.4075689315795898, 1.507815957069397, 1.6080628633499146, 1.7083098888397217, 1.8085567951202393, 1.9088037014007568, 2.0090506076812744, 2.109297752380371, 2.2095446586608887, 2.3097915649414062, 2.410038471221924, 2.5102856159210205, 2.610532522201538, 2.7107794284820557, 2.8110263347625732, 2.911273241043091]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 13.0, 9.0, 23.0, 22.0, 34.0, 55.0, 73.0, 90.0, 147.0, 235.0, 343.0, 439.0, 689.0, 1109.0, 1684.0, 2623.0, 3833.0, 6033.0, 9165.0, 13924.0, 21680.0, 33252.0, 50761.0, 75719.0, 108031.0, 142434.0, 154598.0, 132006.0, 96595.0, 65967.0, 44188.0, 28847.0, 18870.0, 12162.0, 7925.0, 5136.0, 3365.0, 2198.0, 1416.0, 935.0, 663.0, 417.0, 282.0, 195.0, 108.0, 90.0, 68.0, 36.0, 19.0, 17.0, 12.0, 7.0, 10.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.71826171875, -0.696044921875, -0.673828125, -0.651611328125, -0.62939453125, -0.607177734375, -0.5849609375, -0.562744140625, -0.54052734375, -0.518310546875, -0.49609375, -0.473876953125, -0.45166015625, -0.429443359375, -0.4072265625, -0.385009765625, -0.36279296875, -0.340576171875, -0.318359375, -0.296142578125, -0.27392578125, -0.251708984375, -0.2294921875, -0.207275390625, -0.18505859375, -0.162841796875, -0.140625, -0.118408203125, -0.09619140625, -0.073974609375, -0.0517578125, -0.029541015625, -0.00732421875, 0.014892578125, 0.037109375, 0.059326171875, 0.08154296875, 0.103759765625, 0.1259765625, 0.148193359375, 0.17041015625, 0.192626953125, 0.21484375, 0.237060546875, 0.25927734375, 0.281494140625, 0.3037109375, 0.325927734375, 0.34814453125, 0.370361328125, 0.392578125, 0.414794921875, 0.43701171875, 0.459228515625, 0.4814453125, 0.503662109375, 0.52587890625, 0.548095703125, 0.5703125, 0.592529296875, 0.61474609375, 0.636962890625, 0.6591796875, 0.681396484375, 0.70361328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 11.0, 22.0, 18.0, 22.0, 27.0, 30.0, 30.0, 42.0, 39.0, 37.0, 29.0, 45.0, 74.0, 59.0, 51.0, 57.0, 44.0, 53.0, 34.0, 33.0, 26.0, 34.0, 30.0, 24.0, 20.0, 13.0, 12.0, 14.0, 11.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.96075439453125, -3.8316650390625, -3.70257568359375, -3.573486328125, -3.44439697265625, -3.3153076171875, -3.18621826171875, -3.05712890625, -2.92803955078125, -2.7989501953125, -2.66986083984375, -2.540771484375, -2.41168212890625, -2.2825927734375, -2.15350341796875, -2.0244140625, -1.89532470703125, -1.7662353515625, -1.63714599609375, -1.508056640625, -1.37896728515625, -1.2498779296875, -1.12078857421875, -0.99169921875, -0.86260986328125, -0.7335205078125, -0.60443115234375, -0.475341796875, -0.34625244140625, -0.2171630859375, -0.08807373046875, 0.041015625, 0.17010498046875, 0.2991943359375, 0.42828369140625, 0.557373046875, 0.68646240234375, 0.8155517578125, 0.94464111328125, 1.07373046875, 1.20281982421875, 1.3319091796875, 1.46099853515625, 1.590087890625, 1.71917724609375, 1.8482666015625, 1.97735595703125, 2.1064453125, 2.23553466796875, 2.3646240234375, 2.49371337890625, 2.622802734375, 2.75189208984375, 2.8809814453125, 3.01007080078125, 3.13916015625, 3.26824951171875, 3.3973388671875, 3.52642822265625, 3.655517578125, 3.78460693359375, 3.9136962890625, 4.04278564453125, 4.171875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 9.0, 4.0, 6.0, 5.0, 15.0, 20.0, 28.0, 26.0, 55.0, 47.0, 87.0, 128.0, 216.0, 266.0, 465.0, 709.0, 990.0, 1555.0, 2407.0, 3710.0, 6013.0, 9889.0, 16661.0, 28912.0, 50259.0, 86383.0, 141128.0, 196176.0, 187269.0, 128610.0, 77118.0, 44587.0, 25592.0, 15111.0, 8983.0, 5521.0, 3291.0, 2174.0, 1369.0, 935.0, 576.0, 389.0, 267.0, 177.0, 139.0, 87.0, 50.0, 45.0, 41.0, 18.0, 15.0, 10.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.87841796875, -0.8499832153320312, -0.8215484619140625, -0.7931137084960938, -0.764678955078125, -0.7362442016601562, -0.7078094482421875, -0.6793746948242188, -0.65093994140625, -0.6225051879882812, -0.5940704345703125, -0.5656356811523438, -0.537200927734375, -0.5087661743164062, -0.4803314208984375, -0.45189666748046875, -0.4234619140625, -0.39502716064453125, -0.3665924072265625, -0.33815765380859375, -0.309722900390625, -0.28128814697265625, -0.2528533935546875, -0.22441864013671875, -0.19598388671875, -0.16754913330078125, -0.1391143798828125, -0.11067962646484375, -0.082244873046875, -0.05381011962890625, -0.0253753662109375, 0.00305938720703125, 0.031494140625, 0.05992889404296875, 0.0883636474609375, 0.11679840087890625, 0.145233154296875, 0.17366790771484375, 0.2021026611328125, 0.23053741455078125, 0.25897216796875, 0.28740692138671875, 0.3158416748046875, 0.34427642822265625, 0.372711181640625, 0.40114593505859375, 0.4295806884765625, 0.45801544189453125, 0.4864501953125, 0.5148849487304688, 0.5433197021484375, 0.5717544555664062, 0.600189208984375, 0.6286239624023438, 0.6570587158203125, 0.6854934692382812, 0.71392822265625, 0.7423629760742188, 0.7707977294921875, 0.7992324829101562, 0.827667236328125, 0.8561019897460938, 0.8845367431640625, 0.9129714965820312, 0.94140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 11.0, 3.0, 9.0, 16.0, 14.0, 18.0, 23.0, 35.0, 20.0, 29.0, 43.0, 28.0, 37.0, 34.0, 44.0, 48.0, 46.0, 46.0, 43.0, 39.0, 39.0, 46.0, 35.0, 40.0, 39.0, 22.0, 31.0, 20.0, 18.0, 22.0, 15.0, 20.0, 10.0, 12.0, 8.0, 5.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19921875, -2.129913330078125, -2.06060791015625, -1.991302490234375, -1.9219970703125, -1.852691650390625, -1.78338623046875, -1.714080810546875, -1.644775390625, -1.575469970703125, -1.50616455078125, -1.436859130859375, -1.3675537109375, -1.298248291015625, -1.22894287109375, -1.159637451171875, -1.09033203125, -1.021026611328125, -0.95172119140625, -0.882415771484375, -0.8131103515625, -0.743804931640625, -0.67449951171875, -0.605194091796875, -0.535888671875, -0.466583251953125, -0.39727783203125, -0.327972412109375, -0.2586669921875, -0.189361572265625, -0.12005615234375, -0.050750732421875, 0.0185546875, 0.087860107421875, 0.15716552734375, 0.226470947265625, 0.2957763671875, 0.365081787109375, 0.43438720703125, 0.503692626953125, 0.572998046875, 0.642303466796875, 0.71160888671875, 0.780914306640625, 0.8502197265625, 0.919525146484375, 0.98883056640625, 1.058135986328125, 1.12744140625, 1.196746826171875, 1.26605224609375, 1.335357666015625, 1.4046630859375, 1.473968505859375, 1.54327392578125, 1.612579345703125, 1.681884765625, 1.751190185546875, 1.82049560546875, 1.889801025390625, 1.9591064453125, 2.028411865234375, 2.09771728515625, 2.167022705078125, 2.236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 19.0, 30.0, 27.0, 53.0, 68.0, 86.0, 121.0, 183.0, 231.0, 312.0, 435.0, 664.0, 998.0, 1571.0, 2386.0, 3781.0, 6264.0, 10953.0, 20913.0, 45324.0, 118264.0, 341696.0, 305237.0, 103039.0, 40309.0, 19148.0, 10149.0, 5838.0, 3511.0, 2320.0, 1453.0, 948.0, 661.0, 456.0, 292.0, 191.0, 162.0, 121.0, 73.0, 59.0, 48.0, 36.0, 28.0, 23.0, 10.0, 11.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.517578125, -0.5008468627929688, -0.4841156005859375, -0.46738433837890625, -0.450653076171875, -0.43392181396484375, -0.4171905517578125, -0.40045928955078125, -0.38372802734375, -0.36699676513671875, -0.3502655029296875, -0.33353424072265625, -0.316802978515625, -0.30007171630859375, -0.2833404541015625, -0.26660919189453125, -0.2498779296875, -0.23314666748046875, -0.2164154052734375, -0.19968414306640625, -0.182952880859375, -0.16622161865234375, -0.1494903564453125, -0.13275909423828125, -0.11602783203125, -0.09929656982421875, -0.0825653076171875, -0.06583404541015625, -0.049102783203125, -0.03237152099609375, -0.0156402587890625, 0.00109100341796875, 0.017822265625, 0.03455352783203125, 0.0512847900390625, 0.06801605224609375, 0.084747314453125, 0.10147857666015625, 0.1182098388671875, 0.13494110107421875, 0.15167236328125, 0.16840362548828125, 0.1851348876953125, 0.20186614990234375, 0.218597412109375, 0.23532867431640625, 0.2520599365234375, 0.26879119873046875, 0.2855224609375, 0.30225372314453125, 0.3189849853515625, 0.33571624755859375, 0.352447509765625, 0.36917877197265625, 0.3859100341796875, 0.40264129638671875, 0.41937255859375, 0.43610382080078125, 0.4528350830078125, 0.46956634521484375, 0.486297607421875, 0.5030288696289062, 0.5197601318359375, 0.5364913940429688, 0.55322265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 8.0, 4.0, 4.0, 12.0, 14.0, 17.0, 29.0, 24.0, 34.0, 47.0, 42.0, 55.0, 57.0, 58.0, 49.0, 61.0, 48.0, 52.0, 54.0, 41.0, 52.0, 43.0, 25.0, 29.0, 21.0, 28.0, 13.0, 22.0, 13.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4259090423583984e-05, -2.3513101041316986e-05, -2.2767111659049988e-05, -2.202112227678299e-05, -2.127513289451599e-05, -2.0529143512248993e-05, -1.9783154129981995e-05, -1.9037164747714996e-05, -1.8291175365447998e-05, -1.7545185983181e-05, -1.6799196600914e-05, -1.6053207218647003e-05, -1.5307217836380005e-05, -1.4561228454113007e-05, -1.3815239071846008e-05, -1.306924968957901e-05, -1.2323260307312012e-05, -1.1577270925045013e-05, -1.0831281542778015e-05, -1.0085292160511017e-05, -9.339302778244019e-06, -8.59331339597702e-06, -7.847324013710022e-06, -7.101334631443024e-06, -6.355345249176025e-06, -5.609355866909027e-06, -4.863366484642029e-06, -4.1173771023750305e-06, -3.3713877201080322e-06, -2.625398337841034e-06, -1.8794089555740356e-06, -1.1334195733070374e-06, -3.8743019104003906e-07, 3.5855919122695923e-07, 1.1045485734939575e-06, 1.8505379557609558e-06, 2.596527338027954e-06, 3.3425167202949524e-06, 4.088506102561951e-06, 4.834495484828949e-06, 5.580484867095947e-06, 6.3264742493629456e-06, 7.072463631629944e-06, 7.818453013896942e-06, 8.56444239616394e-06, 9.310431778430939e-06, 1.0056421160697937e-05, 1.0802410542964935e-05, 1.1548399925231934e-05, 1.2294389307498932e-05, 1.304037868976593e-05, 1.3786368072032928e-05, 1.4532357454299927e-05, 1.5278346836566925e-05, 1.6024336218833923e-05, 1.677032560110092e-05, 1.751631498336792e-05, 1.8262304365634918e-05, 1.9008293747901917e-05, 1.9754283130168915e-05, 2.0500272512435913e-05, 2.124626189470291e-05, 2.199225127696991e-05, 2.2738240659236908e-05, 2.3484230041503906e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 15.0, 21.0, 32.0, 38.0, 64.0, 67.0, 123.0, 146.0, 231.0, 309.0, 460.0, 692.0, 952.0, 1537.0, 2281.0, 3514.0, 5741.0, 9430.0, 16148.0, 29452.0, 55141.0, 109463.0, 207699.0, 257993.0, 164112.0, 83079.0, 42523.0, 22740.0, 13112.0, 7630.0, 4728.0, 3020.0, 1964.0, 1295.0, 843.0, 580.0, 406.0, 292.0, 217.0, 135.0, 97.0, 60.0, 47.0, 40.0, 23.0, 19.0, 8.0, 3.0, 11.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5765151977539062, -0.5568389892578125, -0.5371627807617188, -0.517486572265625, -0.49781036376953125, -0.4781341552734375, -0.45845794677734375, -0.43878173828125, -0.41910552978515625, -0.3994293212890625, -0.37975311279296875, -0.360076904296875, -0.34040069580078125, -0.3207244873046875, -0.30104827880859375, -0.2813720703125, -0.26169586181640625, -0.2420196533203125, -0.22234344482421875, -0.202667236328125, -0.18299102783203125, -0.1633148193359375, -0.14363861083984375, -0.12396240234375, -0.10428619384765625, -0.0846099853515625, -0.06493377685546875, -0.045257568359375, -0.02558135986328125, -0.0059051513671875, 0.01377105712890625, 0.033447265625, 0.05312347412109375, 0.0727996826171875, 0.09247589111328125, 0.112152099609375, 0.13182830810546875, 0.1515045166015625, 0.17118072509765625, 0.19085693359375, 0.21053314208984375, 0.2302093505859375, 0.24988555908203125, 0.269561767578125, 0.28923797607421875, 0.3089141845703125, 0.32859039306640625, 0.3482666015625, 0.36794281005859375, 0.3876190185546875, 0.40729522705078125, 0.426971435546875, 0.44664764404296875, 0.4663238525390625, 0.48600006103515625, 0.50567626953125, 0.5253524780273438, 0.5450286865234375, 0.5647048950195312, 0.584381103515625, 0.6040573120117188, 0.6237335205078125, 0.6434097290039062, 0.6630859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 13.0, 19.0, 23.0, 29.0, 40.0, 41.0, 58.0, 89.0, 102.0, 103.0, 93.0, 94.0, 63.0, 39.0, 35.0, 25.0, 29.0, 19.0, 17.0, 10.0, 10.0, 7.0, 6.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2238025665283203, -0.21750259399414062, -0.21120262145996094, -0.20490264892578125, -0.19860267639160156, -0.19230270385742188, -0.1860027313232422, -0.1797027587890625, -0.1734027862548828, -0.16710281372070312, -0.16080284118652344, -0.15450286865234375, -0.14820289611816406, -0.14190292358398438, -0.1356029510498047, -0.129302978515625, -0.12300300598144531, -0.11670303344726562, -0.11040306091308594, -0.10410308837890625, -0.09780311584472656, -0.09150314331054688, -0.08520317077636719, -0.0789031982421875, -0.07260322570800781, -0.06630325317382812, -0.06000328063964844, -0.05370330810546875, -0.04740333557128906, -0.041103363037109375, -0.03480339050292969, -0.02850341796875, -0.022203445434570312, -0.015903472900390625, -0.009603500366210938, -0.00330352783203125, 0.0029964447021484375, 0.009296417236328125, 0.015596389770507812, 0.0218963623046875, 0.028196334838867188, 0.034496307373046875, 0.04079627990722656, 0.04709625244140625, 0.05339622497558594, 0.059696197509765625, 0.06599617004394531, 0.072296142578125, 0.07859611511230469, 0.08489608764648438, 0.09119606018066406, 0.09749603271484375, 0.10379600524902344, 0.11009597778320312, 0.11639595031738281, 0.1226959228515625, 0.1289958953857422, 0.13529586791992188, 0.14159584045410156, 0.14789581298828125, 0.15419578552246094, 0.16049575805664062, 0.1667957305908203, 0.173095703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 11.0, 14.0, 12.0, 23.0, 20.0, 20.0, 35.0, 42.0, 41.0, 43.0, 44.0, 53.0, 52.0, 54.0, 45.0, 53.0, 39.0, 37.0, 36.0, 49.0, 39.0, 34.0, 29.0, 26.0, 27.0, 24.0, 11.0, 15.0, 17.0, 12.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.080476760864258, -3.939161539077759, -3.797846555709839, -3.65653133392334, -3.51521635055542, -3.373901128768921, -3.232585906982422, -3.091270923614502, -2.949955940246582, -2.808640718460083, -2.667325735092163, -2.526010513305664, -2.384695529937744, -2.243380308151245, -2.102065086364746, -1.9607501029968262, -1.8194348812103271, -1.6781197786331177, -1.5368046760559082, -1.3954894542694092, -1.2541744709014893, -1.1128592491149902, -0.9715441465377808, -0.8302290439605713, -0.6889139413833618, -0.5475988388061523, -0.4062837064266205, -0.2649685740470886, -0.12365347146987915, 0.017661631107330322, 0.15897679328918457, 0.30029189586639404, 0.4416069984436035, 0.582922101020813, 0.7242372035980225, 0.8655523657798767, 1.0068674087524414, 1.1481826305389404, 1.28949773311615, 1.4308128356933594, 1.5721279382705688, 1.7134430408477783, 1.8547581434249878, 1.9960732460021973, 2.1373884677886963, 2.278703451156616, 2.4200186729431152, 2.561333656311035, 2.702648878097534, 2.843964099884033, 2.985279083251953, 3.126594305038452, 3.267909288406372, 3.409224510192871, 3.550539493560791, 3.69185471534729, 3.833169937133789, 3.974485158920288, 4.115800380706787, 4.257115364074707, 4.398430347442627, 4.539745330810547, 4.681060791015625, 4.822375774383545, 4.963690757751465]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 8.0, 10.0, 9.0, 14.0, 19.0, 25.0, 23.0, 21.0, 21.0, 28.0, 26.0, 33.0, 34.0, 37.0, 44.0, 53.0, 46.0, 44.0, 35.0, 39.0, 46.0, 31.0, 36.0, 36.0, 32.0, 39.0, 21.0, 23.0, 25.0, 16.0, 16.0, 17.0, 17.0, 8.0, 15.0, 8.0, 7.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.544121503829956, -3.4429636001586914, -3.341805934906006, -3.240648031234741, -3.1394901275634766, -3.038332223892212, -2.9371743202209473, -2.8360166549682617, -2.734858751296997, -2.6337008476257324, -2.532543182373047, -2.4313852787017822, -2.3302273750305176, -2.229069471359253, -2.1279115676879883, -2.0267539024353027, -1.925595998764038, -1.8244380950927734, -1.7232803106307983, -1.6221225261688232, -1.5209646224975586, -1.419806718826294, -1.3186489343643188, -1.2174911499023438, -1.116333246231079, -1.0151753425598145, -0.9140175580978394, -0.8128597140312195, -0.7117018699645996, -0.6105440258979797, -0.5093861818313599, -0.40822833776474, -0.3070704936981201, -0.20591264963150024, -0.10475480556488037, -0.003596961498260498, 0.09756088256835938, 0.19871872663497925, 0.2998765707015991, 0.401034414768219, 0.5021922588348389, 0.6033501029014587, 0.7045079469680786, 0.8056657910346985, 0.9068236351013184, 1.007981538772583, 1.109139323234558, 1.2102971076965332, 1.3114550113677979, 1.4126129150390625, 1.5137706995010376, 1.6149284839630127, 1.7160863876342773, 1.817244291305542, 1.918402075767517, 2.019559860229492, 2.120717763900757, 2.2218756675720215, 2.323033332824707, 2.4241912364959717, 2.5253491401672363, 2.626507043838501, 2.7276649475097656, 2.828822612762451, 2.929980516433716]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 8.0, 18.0, 31.0, 49.0, 64.0, 105.0, 193.0, 297.0, 452.0, 777.0, 1245.0, 1996.0, 3214.0, 5219.0, 8187.0, 13202.0, 20357.0, 30115.0, 43785.0, 60437.0, 78977.0, 97139.0, 110044.0, 114605.0, 108107.0, 94781.0, 75695.0, 57701.0, 41740.0, 28295.0, 18724.0, 12187.0, 7927.0, 4833.0, 3035.0, 1904.0, 1158.0, 761.0, 446.0, 248.0, 180.0, 114.0, 69.0, 46.0, 35.0, 15.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-2.095703125, -2.03106689453125, -1.9664306640625, -1.90179443359375, -1.837158203125, -1.77252197265625, -1.7078857421875, -1.64324951171875, -1.57861328125, -1.51397705078125, -1.4493408203125, -1.38470458984375, -1.320068359375, -1.25543212890625, -1.1907958984375, -1.12615966796875, -1.0615234375, -0.99688720703125, -0.9322509765625, -0.86761474609375, -0.802978515625, -0.73834228515625, -0.6737060546875, -0.60906982421875, -0.54443359375, -0.47979736328125, -0.4151611328125, -0.35052490234375, -0.285888671875, -0.22125244140625, -0.1566162109375, -0.09197998046875, -0.02734375, 0.03729248046875, 0.1019287109375, 0.16656494140625, 0.231201171875, 0.29583740234375, 0.3604736328125, 0.42510986328125, 0.48974609375, 0.55438232421875, 0.6190185546875, 0.68365478515625, 0.748291015625, 0.81292724609375, 0.8775634765625, 0.94219970703125, 1.0068359375, 1.07147216796875, 1.1361083984375, 1.20074462890625, 1.265380859375, 1.33001708984375, 1.3946533203125, 1.45928955078125, 1.52392578125, 1.58856201171875, 1.6531982421875, 1.71783447265625, 1.782470703125, 1.84710693359375, 1.9117431640625, 1.97637939453125, 2.041015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 13.0, 14.0, 22.0, 31.0, 28.0, 22.0, 29.0, 33.0, 33.0, 42.0, 33.0, 40.0, 40.0, 52.0, 35.0, 34.0, 40.0, 32.0, 31.0, 41.0, 26.0, 30.0, 20.0, 28.0, 22.0, 30.0, 16.0, 20.0, 12.0, 15.0, 9.0, 8.0, 11.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.916015625, -2.81646728515625, -2.7169189453125, -2.61737060546875, -2.517822265625, -2.41827392578125, -2.3187255859375, -2.21917724609375, -2.11962890625, -2.02008056640625, -1.9205322265625, -1.82098388671875, -1.721435546875, -1.62188720703125, -1.5223388671875, -1.42279052734375, -1.3232421875, -1.22369384765625, -1.1241455078125, -1.02459716796875, -0.925048828125, -0.82550048828125, -0.7259521484375, -0.62640380859375, -0.52685546875, -0.42730712890625, -0.3277587890625, -0.22821044921875, -0.128662109375, -0.02911376953125, 0.0704345703125, 0.16998291015625, 0.26953125, 0.36907958984375, 0.4686279296875, 0.56817626953125, 0.667724609375, 0.76727294921875, 0.8668212890625, 0.96636962890625, 1.06591796875, 1.16546630859375, 1.2650146484375, 1.36456298828125, 1.464111328125, 1.56365966796875, 1.6632080078125, 1.76275634765625, 1.8623046875, 1.96185302734375, 2.0614013671875, 2.16094970703125, 2.260498046875, 2.36004638671875, 2.4595947265625, 2.55914306640625, 2.65869140625, 2.75823974609375, 2.8577880859375, 2.95733642578125, 3.056884765625, 3.15643310546875, 3.2559814453125, 3.35552978515625, 3.455078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 13.0, 20.0, 28.0, 34.0, 52.0, 76.0, 122.0, 169.0, 260.0, 371.0, 561.0, 795.0, 1264.0, 1997.0, 2851.0, 4440.0, 6644.0, 10105.0, 15290.0, 22611.0, 32520.0, 46036.0, 61666.0, 78470.0, 94495.0, 105444.0, 108590.0, 102895.0, 90152.0, 73564.0, 56844.0, 41166.0, 29131.0, 19815.0, 13519.0, 9128.0, 6006.0, 3930.0, 2503.0, 1688.0, 1076.0, 753.0, 487.0, 291.0, 232.0, 140.0, 96.0, 81.0, 41.0, 30.0, 17.0, 18.0, 11.0, 8.0, 2.0, 4.0, 2.0], "bins": [-2.224609375, -2.15789794921875, -2.0911865234375, -2.02447509765625, -1.957763671875, -1.89105224609375, -1.8243408203125, -1.75762939453125, -1.69091796875, -1.62420654296875, -1.5574951171875, -1.49078369140625, -1.424072265625, -1.35736083984375, -1.2906494140625, -1.22393798828125, -1.1572265625, -1.09051513671875, -1.0238037109375, -0.95709228515625, -0.890380859375, -0.82366943359375, -0.7569580078125, -0.69024658203125, -0.62353515625, -0.55682373046875, -0.4901123046875, -0.42340087890625, -0.356689453125, -0.28997802734375, -0.2232666015625, -0.15655517578125, -0.08984375, -0.02313232421875, 0.0435791015625, 0.11029052734375, 0.177001953125, 0.24371337890625, 0.3104248046875, 0.37713623046875, 0.44384765625, 0.51055908203125, 0.5772705078125, 0.64398193359375, 0.710693359375, 0.77740478515625, 0.8441162109375, 0.91082763671875, 0.9775390625, 1.04425048828125, 1.1109619140625, 1.17767333984375, 1.244384765625, 1.31109619140625, 1.3778076171875, 1.44451904296875, 1.51123046875, 1.57794189453125, 1.6446533203125, 1.71136474609375, 1.778076171875, 1.84478759765625, 1.9114990234375, 1.97821044921875, 2.044921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 14.0, 10.0, 17.0, 9.0, 18.0, 23.0, 27.0, 21.0, 22.0, 24.0, 25.0, 35.0, 39.0, 38.0, 37.0, 34.0, 48.0, 25.0, 31.0, 50.0, 42.0, 35.0, 27.0, 42.0, 29.0, 34.0, 28.0, 17.0, 32.0, 19.0, 25.0, 19.0, 13.0, 12.0, 14.0, 4.0, 8.0, 3.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7529296875, -1.6934661865234375, -1.634002685546875, -1.5745391845703125, -1.51507568359375, -1.4556121826171875, -1.396148681640625, -1.3366851806640625, -1.2772216796875, -1.2177581787109375, -1.158294677734375, -1.0988311767578125, -1.03936767578125, -0.9799041748046875, -0.920440673828125, -0.8609771728515625, -0.801513671875, -0.7420501708984375, -0.682586669921875, -0.6231231689453125, -0.56365966796875, -0.5041961669921875, -0.444732666015625, -0.3852691650390625, -0.3258056640625, -0.2663421630859375, -0.206878662109375, -0.1474151611328125, -0.08795166015625, -0.0284881591796875, 0.030975341796875, 0.0904388427734375, 0.14990234375, 0.2093658447265625, 0.268829345703125, 0.3282928466796875, 0.38775634765625, 0.4472198486328125, 0.506683349609375, 0.5661468505859375, 0.6256103515625, 0.6850738525390625, 0.744537353515625, 0.8040008544921875, 0.86346435546875, 0.9229278564453125, 0.982391357421875, 1.0418548583984375, 1.101318359375, 1.1607818603515625, 1.220245361328125, 1.2797088623046875, 1.33917236328125, 1.3986358642578125, 1.458099365234375, 1.5175628662109375, 1.5770263671875, 1.6364898681640625, 1.695953369140625, 1.7554168701171875, 1.81488037109375, 1.8743438720703125, 1.933807373046875, 1.9932708740234375, 2.052734375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 16.0, 22.0, 30.0, 46.0, 76.0, 79.0, 131.0, 193.0, 255.0, 378.0, 536.0, 785.0, 1254.0, 1834.0, 2872.0, 4855.0, 8611.0, 16627.0, 33492.0, 67499.0, 124095.0, 183565.0, 206651.0, 170396.0, 107148.0, 56342.0, 27984.0, 13730.0, 7178.0, 4145.0, 2610.0, 1604.0, 1100.0, 774.0, 491.0, 324.0, 245.0, 167.0, 120.0, 82.0, 72.0, 46.0, 33.0, 13.0, 13.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7421875, -1.6866455078125, -1.631103515625, -1.5755615234375, -1.52001953125, -1.4644775390625, -1.408935546875, -1.3533935546875, -1.2978515625, -1.2423095703125, -1.186767578125, -1.1312255859375, -1.07568359375, -1.0201416015625, -0.964599609375, -0.9090576171875, -0.853515625, -0.7979736328125, -0.742431640625, -0.6868896484375, -0.63134765625, -0.5758056640625, -0.520263671875, -0.4647216796875, -0.4091796875, -0.3536376953125, -0.298095703125, -0.2425537109375, -0.18701171875, -0.1314697265625, -0.075927734375, -0.0203857421875, 0.03515625, 0.0906982421875, 0.146240234375, 0.2017822265625, 0.25732421875, 0.3128662109375, 0.368408203125, 0.4239501953125, 0.4794921875, 0.5350341796875, 0.590576171875, 0.6461181640625, 0.70166015625, 0.7572021484375, 0.812744140625, 0.8682861328125, 0.923828125, 0.9793701171875, 1.034912109375, 1.0904541015625, 1.14599609375, 1.2015380859375, 1.257080078125, 1.3126220703125, 1.3681640625, 1.4237060546875, 1.479248046875, 1.5347900390625, 1.59033203125, 1.6458740234375, 1.701416015625, 1.7569580078125, 1.8125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 4.0, 12.0, 10.0, 29.0, 29.0, 43.0, 40.0, 56.0, 83.0, 86.0, 82.0, 88.0, 71.0, 68.0, 81.0, 56.0, 31.0, 26.0, 28.0, 13.0, 10.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002448558807373047, -0.00023787468671798706, -0.00023089349269866943, -0.0002239122986793518, -0.00021693110466003418, -0.00020994991064071655, -0.00020296871662139893, -0.0001959875226020813, -0.00018900632858276367, -0.00018202513456344604, -0.00017504394054412842, -0.0001680627465248108, -0.00016108155250549316, -0.00015410035848617554, -0.0001471191644668579, -0.00014013797044754028, -0.00013315677642822266, -0.00012617558240890503, -0.0001191943883895874, -0.00011221319437026978, -0.00010523200035095215, -9.825080633163452e-05, -9.12696123123169e-05, -8.428841829299927e-05, -7.730722427368164e-05, -7.032603025436401e-05, -6.334483623504639e-05, -5.636364221572876e-05, -4.938244819641113e-05, -4.2401254177093506e-05, -3.542006015777588e-05, -2.8438866138458252e-05, -2.1457672119140625e-05, -1.4476478099822998e-05, -7.495284080505371e-06, -5.140900611877441e-07, 6.467103958129883e-06, 1.344829797744751e-05, 2.0429491996765137e-05, 2.7410686016082764e-05, 3.439188003540039e-05, 4.137307405471802e-05, 4.8354268074035645e-05, 5.533546209335327e-05, 6.23166561126709e-05, 6.929785013198853e-05, 7.627904415130615e-05, 8.326023817062378e-05, 9.02414321899414e-05, 9.722262620925903e-05, 0.00010420382022857666, 0.00011118501424789429, 0.00011816620826721191, 0.00012514740228652954, 0.00013212859630584717, 0.0001391097903251648, 0.00014609098434448242, 0.00015307217836380005, 0.00016005337238311768, 0.0001670345664024353, 0.00017401576042175293, 0.00018099695444107056, 0.00018797814846038818, 0.0001949593424797058, 0.00020194053649902344]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 7.0, 14.0, 21.0, 30.0, 44.0, 72.0, 112.0, 151.0, 262.0, 368.0, 567.0, 883.0, 1384.0, 2350.0, 3866.0, 6887.0, 14517.0, 32230.0, 74050.0, 150913.0, 229577.0, 231993.0, 155453.0, 76619.0, 33579.0, 14847.0, 7327.0, 4049.0, 2236.0, 1453.0, 928.0, 612.0, 389.0, 279.0, 164.0, 96.0, 76.0, 40.0, 43.0, 17.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.205078125, -2.1383056640625, -2.071533203125, -2.0047607421875, -1.93798828125, -1.8712158203125, -1.804443359375, -1.7376708984375, -1.6708984375, -1.6041259765625, -1.537353515625, -1.4705810546875, -1.40380859375, -1.3370361328125, -1.270263671875, -1.2034912109375, -1.13671875, -1.0699462890625, -1.003173828125, -0.9364013671875, -0.86962890625, -0.8028564453125, -0.736083984375, -0.6693115234375, -0.6025390625, -0.5357666015625, -0.468994140625, -0.4022216796875, -0.33544921875, -0.2686767578125, -0.201904296875, -0.1351318359375, -0.068359375, -0.0015869140625, 0.065185546875, 0.1319580078125, 0.19873046875, 0.2655029296875, 0.332275390625, 0.3990478515625, 0.4658203125, 0.5325927734375, 0.599365234375, 0.6661376953125, 0.73291015625, 0.7996826171875, 0.866455078125, 0.9332275390625, 1.0, 1.0667724609375, 1.133544921875, 1.2003173828125, 1.26708984375, 1.3338623046875, 1.400634765625, 1.4674072265625, 1.5341796875, 1.6009521484375, 1.667724609375, 1.7344970703125, 1.80126953125, 1.8680419921875, 1.934814453125, 2.0015869140625, 2.068359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 14.0, 16.0, 25.0, 45.0, 51.0, 45.0, 62.0, 68.0, 67.0, 81.0, 90.0, 81.0, 70.0, 52.0, 44.0, 40.0, 39.0, 22.0, 22.0, 11.0, 10.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5912933349609375, -0.572235107421875, -0.5531768798828125, -0.53411865234375, -0.5150604248046875, -0.496002197265625, -0.4769439697265625, -0.4578857421875, -0.4388275146484375, -0.419769287109375, -0.4007110595703125, -0.38165283203125, -0.3625946044921875, -0.343536376953125, -0.3244781494140625, -0.305419921875, -0.2863616943359375, -0.267303466796875, -0.2482452392578125, -0.22918701171875, -0.2101287841796875, -0.191070556640625, -0.1720123291015625, -0.1529541015625, -0.1338958740234375, -0.114837646484375, -0.0957794189453125, -0.07672119140625, -0.0576629638671875, -0.038604736328125, -0.0195465087890625, -0.00048828125, 0.0185699462890625, 0.037628173828125, 0.0566864013671875, 0.07574462890625, 0.0948028564453125, 0.113861083984375, 0.1329193115234375, 0.1519775390625, 0.1710357666015625, 0.190093994140625, 0.2091522216796875, 0.22821044921875, 0.2472686767578125, 0.266326904296875, 0.2853851318359375, 0.304443359375, 0.3235015869140625, 0.342559814453125, 0.3616180419921875, 0.38067626953125, 0.3997344970703125, 0.418792724609375, 0.4378509521484375, 0.4569091796875, 0.4759674072265625, 0.495025634765625, 0.5140838623046875, 0.53314208984375, 0.5522003173828125, 0.571258544921875, 0.5903167724609375, 0.609375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 12.0, 11.0, 18.0, 23.0, 26.0, 28.0, 24.0, 38.0, 46.0, 50.0, 55.0, 48.0, 52.0, 54.0, 43.0, 38.0, 47.0, 36.0, 43.0, 43.0, 36.0, 25.0, 23.0, 23.0, 21.0, 21.0, 21.0, 12.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.149673938751221, -4.006742000579834, -3.8638100624084473, -3.7208781242370605, -3.577946186065674, -3.435014247894287, -3.2920825481414795, -3.1491506099700928, -3.006218671798706, -2.8632867336273193, -2.7203547954559326, -2.577422857284546, -2.4344911575317383, -2.2915592193603516, -2.148627281188965, -2.005695343017578, -1.8627634048461914, -1.7198314666748047, -1.576899528503418, -1.4339677095413208, -1.291035771369934, -1.1481038331985474, -1.0051720142364502, -0.8622400760650635, -0.7193081378936768, -0.57637619972229, -0.4334443211555481, -0.29051241278648376, -0.14758050441741943, -0.004648566246032715, 0.13828331232070923, 0.28121519088745117, 0.4241471290588379, 0.5670790672302246, 0.7100109457969666, 0.8529428243637085, 0.9958747625350952, 1.138806700706482, 1.281738519668579, 1.4246704578399658, 1.5676023960113525, 1.7105343341827393, 1.853466272354126, 1.9963980913162231, 2.1393299102783203, 2.282261848449707, 2.4251937866210938, 2.5681257247924805, 2.711057662963867, 2.853989601135254, 2.9969215393066406, 3.1398534774780273, 3.282785415649414, 3.425717353820801, 3.5686490535736084, 3.711580991744995, 3.854512929916382, 3.9974448680877686, 4.140376567840576, 4.283308506011963, 4.42624044418335, 4.569172382354736, 4.712104320526123, 4.85503625869751, 4.9979681968688965]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 4.0, 10.0, 11.0, 10.0, 11.0, 13.0, 18.0, 24.0, 18.0, 25.0, 27.0, 28.0, 26.0, 48.0, 37.0, 31.0, 48.0, 44.0, 43.0, 49.0, 37.0, 53.0, 33.0, 47.0, 47.0, 26.0, 26.0, 17.0, 23.0, 25.0, 17.0, 22.0, 20.0, 16.0, 8.0, 10.0, 10.0, 7.0, 5.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0], "bins": [-4.125625133514404, -4.008246421813965, -3.890867233276367, -3.7734885215759277, -3.656109571456909, -3.5387306213378906, -3.421351671218872, -3.3039727210998535, -3.186594009399414, -3.0692150592803955, -2.951836109161377, -2.8344573974609375, -2.717078447341919, -2.5996994972229004, -2.482320547103882, -2.3649415969848633, -2.2475626468658447, -2.130183696746826, -2.0128047466278076, -1.8954259157180786, -1.7780470848083496, -1.660668134689331, -1.5432891845703125, -1.425910234451294, -1.308531403541565, -1.1911524534225464, -1.0737736225128174, -0.9563946723937988, -0.839015781879425, -0.7216368913650513, -0.6042579412460327, -0.48687905073165894, -0.36950016021728516, -0.2521212697029114, -0.1347423493862152, -0.017363429069519043, 0.10001546144485474, 0.21739435195922852, 0.33477330207824707, 0.45215219259262085, 0.5695310831069946, 0.6869099736213684, 0.8042888641357422, 0.9216678142547607, 1.0390467643737793, 1.1564255952835083, 1.2738045454025269, 1.3911833763122559, 1.5085623264312744, 1.625941276550293, 1.743320107460022, 1.8606990575790405, 1.9780778884887695, 2.095456838607788, 2.2128357887268066, 2.330214738845825, 2.4475936889648438, 2.5649726390838623, 2.682351589202881, 2.7997303009033203, 2.917109251022339, 3.0344882011413574, 3.151867151260376, 3.2692461013793945, 3.386624813079834]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 12.0, 28.0, 34.0, 47.0, 92.0, 123.0, 166.0, 233.0, 398.0, 595.0, 981.0, 1544.0, 2363.0, 3999.0, 6436.0, 10950.0, 18336.0, 31499.0, 55303.0, 95817.0, 166694.0, 284017.0, 452038.0, 634462.0, 716733.0, 624006.0, 437497.0, 271210.0, 160114.0, 91545.0, 52437.0, 30475.0, 17779.0, 10376.0, 6279.0, 3676.0, 2255.0, 1442.0, 898.0, 526.0, 327.0, 211.0, 130.0, 71.0, 44.0, 24.0, 19.0, 13.0, 15.0, 3.0, 0.0, 2.0], "bins": [-5.26953125, -5.125030517578125, -4.98052978515625, -4.836029052734375, -4.6915283203125, -4.547027587890625, -4.40252685546875, -4.258026123046875, -4.113525390625, -3.969024658203125, -3.82452392578125, -3.680023193359375, -3.5355224609375, -3.391021728515625, -3.24652099609375, -3.102020263671875, -2.95751953125, -2.813018798828125, -2.66851806640625, -2.524017333984375, -2.3795166015625, -2.235015869140625, -2.09051513671875, -1.946014404296875, -1.801513671875, -1.657012939453125, -1.51251220703125, -1.368011474609375, -1.2235107421875, -1.079010009765625, -0.93450927734375, -0.790008544921875, -0.6455078125, -0.501007080078125, -0.35650634765625, -0.212005615234375, -0.0675048828125, 0.076995849609375, 0.22149658203125, 0.365997314453125, 0.510498046875, 0.654998779296875, 0.79949951171875, 0.944000244140625, 1.0885009765625, 1.233001708984375, 1.37750244140625, 1.522003173828125, 1.66650390625, 1.811004638671875, 1.95550537109375, 2.100006103515625, 2.2445068359375, 2.389007568359375, 2.53350830078125, 2.678009033203125, 2.822509765625, 2.967010498046875, 3.11151123046875, 3.256011962890625, 3.4005126953125, 3.545013427734375, 3.68951416015625, 3.834014892578125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 4.0, 6.0, 13.0, 12.0, 15.0, 17.0, 20.0, 17.0, 23.0, 28.0, 30.0, 35.0, 42.0, 32.0, 35.0, 38.0, 38.0, 47.0, 50.0, 37.0, 42.0, 37.0, 38.0, 45.0, 39.0, 32.0, 26.0, 29.0, 14.0, 18.0, 20.0, 12.0, 13.0, 17.0, 17.0, 9.0, 7.0, 7.0, 12.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.61822509765625, -3.5001220703125, -3.38201904296875, -3.263916015625, -3.14581298828125, -3.0277099609375, -2.90960693359375, -2.79150390625, -2.67340087890625, -2.5552978515625, -2.43719482421875, -2.319091796875, -2.20098876953125, -2.0828857421875, -1.96478271484375, -1.8466796875, -1.72857666015625, -1.6104736328125, -1.49237060546875, -1.374267578125, -1.25616455078125, -1.1380615234375, -1.01995849609375, -0.90185546875, -0.78375244140625, -0.6656494140625, -0.54754638671875, -0.429443359375, -0.31134033203125, -0.1932373046875, -0.07513427734375, 0.04296875, 0.16107177734375, 0.2791748046875, 0.39727783203125, 0.515380859375, 0.63348388671875, 0.7515869140625, 0.86968994140625, 0.98779296875, 1.10589599609375, 1.2239990234375, 1.34210205078125, 1.460205078125, 1.57830810546875, 1.6964111328125, 1.81451416015625, 1.9326171875, 2.05072021484375, 2.1688232421875, 2.28692626953125, 2.405029296875, 2.52313232421875, 2.6412353515625, 2.75933837890625, 2.87744140625, 2.99554443359375, 3.1136474609375, 3.23175048828125, 3.349853515625, 3.46795654296875, 3.5860595703125, 3.70416259765625, 3.822265625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 12.0, 19.0, 23.0, 37.0, 65.0, 124.0, 204.0, 294.0, 531.0, 924.0, 1563.0, 2805.0, 4727.0, 8332.0, 14990.0, 27004.0, 48049.0, 86296.0, 150623.0, 250802.0, 395535.0, 558656.0, 673454.0, 642958.0, 499298.0, 337153.0, 208527.0, 123051.0, 69896.0, 38982.0, 21476.0, 11957.0, 6731.0, 3894.0, 2114.0, 1284.0, 774.0, 410.0, 256.0, 169.0, 112.0, 68.0, 48.0, 19.0, 7.0, 8.0, 11.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.4991455078125, -5.314697265625, -5.1302490234375, -4.94580078125, -4.7613525390625, -4.576904296875, -4.3924560546875, -4.2080078125, -4.0235595703125, -3.839111328125, -3.6546630859375, -3.47021484375, -3.2857666015625, -3.101318359375, -2.9168701171875, -2.732421875, -2.5479736328125, -2.363525390625, -2.1790771484375, -1.99462890625, -1.8101806640625, -1.625732421875, -1.4412841796875, -1.2568359375, -1.0723876953125, -0.887939453125, -0.7034912109375, -0.51904296875, -0.3345947265625, -0.150146484375, 0.0343017578125, 0.21875, 0.4031982421875, 0.587646484375, 0.7720947265625, 0.95654296875, 1.1409912109375, 1.325439453125, 1.5098876953125, 1.6943359375, 1.8787841796875, 2.063232421875, 2.2476806640625, 2.43212890625, 2.6165771484375, 2.801025390625, 2.9854736328125, 3.169921875, 3.3543701171875, 3.538818359375, 3.7232666015625, 3.90771484375, 4.0921630859375, 4.276611328125, 4.4610595703125, 4.6455078125, 4.8299560546875, 5.014404296875, 5.1988525390625, 5.38330078125, 5.5677490234375, 5.752197265625, 5.9366455078125, 6.12109375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 10.0, 3.0, 7.0, 9.0, 11.0, 11.0, 28.0, 32.0, 53.0, 57.0, 67.0, 74.0, 97.0, 110.0, 132.0, 141.0, 198.0, 189.0, 231.0, 230.0, 266.0, 244.0, 272.0, 229.0, 228.0, 191.0, 170.0, 145.0, 125.0, 83.0, 94.0, 79.0, 73.0, 48.0, 25.0, 35.0, 25.0, 12.0, 12.0, 4.0, 6.0, 11.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.406463623046875, -2.33441162109375, -2.262359619140625, -2.1903076171875, -2.118255615234375, -2.04620361328125, -1.974151611328125, -1.902099609375, -1.830047607421875, -1.75799560546875, -1.685943603515625, -1.6138916015625, -1.541839599609375, -1.46978759765625, -1.397735595703125, -1.32568359375, -1.253631591796875, -1.18157958984375, -1.109527587890625, -1.0374755859375, -0.965423583984375, -0.89337158203125, -0.821319580078125, -0.749267578125, -0.677215576171875, -0.60516357421875, -0.533111572265625, -0.4610595703125, -0.389007568359375, -0.31695556640625, -0.244903564453125, -0.1728515625, -0.100799560546875, -0.02874755859375, 0.043304443359375, 0.1153564453125, 0.187408447265625, 0.25946044921875, 0.331512451171875, 0.403564453125, 0.475616455078125, 0.54766845703125, 0.619720458984375, 0.6917724609375, 0.763824462890625, 0.83587646484375, 0.907928466796875, 0.97998046875, 1.052032470703125, 1.12408447265625, 1.196136474609375, 1.2681884765625, 1.340240478515625, 1.41229248046875, 1.484344482421875, 1.556396484375, 1.628448486328125, 1.70050048828125, 1.772552490234375, 1.8446044921875, 1.916656494140625, 1.98870849609375, 2.060760498046875, 2.1328125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 7.0, 25.0, 11.0, 23.0, 32.0, 38.0, 38.0, 55.0, 56.0, 63.0, 85.0, 72.0, 57.0, 58.0, 45.0, 53.0, 67.0, 34.0, 32.0, 28.0, 21.0, 25.0, 17.0, 9.0, 8.0, 5.0, 10.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.030409812927246, -10.74123764038086, -10.452064514160156, -10.16289234161377, -9.873720169067383, -9.58454704284668, -9.295374870300293, -9.006202697753906, -8.717029571533203, -8.427857398986816, -8.138684272766113, -7.849512100219727, -7.560339450836182, -7.271166801452637, -6.98199462890625, -6.692821979522705, -6.403649806976318, -6.114477157592773, -5.825304985046387, -5.536132335662842, -5.246959686279297, -4.95778751373291, -4.668614864349365, -4.37944221496582, -4.090270042419434, -3.8010976314544678, -3.511924982070923, -3.222752571105957, -2.933579921722412, -2.6444075107574463, -2.3552350997924805, -2.0660624504089355, -1.7768893241882324, -1.487716794013977, -1.1985442638397217, -0.9093718528747559, -0.6201993227005005, -0.3310267925262451, -0.0418543815612793, 0.24731826782226562, 0.5364906787872314, 0.8256632089614868, 1.1148357391357422, 1.404008150100708, 1.6931806802749634, 1.9823532104492188, 2.2715256214141846, 2.5606982707977295, 2.8498706817626953, 3.139043092727661, 3.428215742111206, 3.717388153076172, 4.006560802459717, 4.295733451843262, 4.584905624389648, 4.874078273773193, 5.163250923156738, 5.452423572540283, 5.74159574508667, 6.030768394470215, 6.31994104385376, 6.609113693237305, 6.898285865783691, 7.187458515167236, 7.476630687713623]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 12.0, 20.0, 14.0, 20.0, 22.0, 30.0, 25.0, 25.0, 31.0, 39.0, 46.0, 37.0, 47.0, 54.0, 44.0, 36.0, 49.0, 37.0, 38.0, 39.0, 40.0, 33.0, 36.0, 31.0, 22.0, 14.0, 22.0, 13.0, 16.0, 10.0, 11.0, 10.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.184546947479248, -5.999026775360107, -5.813506603240967, -5.627986907958984, -5.442466735839844, -5.256946563720703, -5.0714263916015625, -4.885906219482422, -4.700386047363281, -4.514865875244141, -4.329345703125, -4.143825531005859, -3.958305835723877, -3.7727856636047363, -3.5872654914855957, -3.401745319366455, -3.2162256240844727, -3.030705451965332, -2.8451855182647705, -2.65966534614563, -2.4741454124450684, -2.2886252403259277, -2.103105068206787, -1.917585015296936, -1.732064962387085, -1.5465449094772339, -1.3610248565673828, -1.1755046844482422, -0.9899846315383911, -0.80446457862854, -0.6189444065093994, -0.43342435359954834, -0.24790382385253906, -0.0623837411403656, 0.12313634157180786, 0.3086564540863037, 0.4941765069961548, 0.6796965599060059, 0.8652167320251465, 1.0507367849349976, 1.2362568378448486, 1.4217768907546997, 1.6072969436645508, 1.7928171157836914, 1.9783371686935425, 2.1638572216033936, 2.349377393722534, 2.5348973274230957, 2.7204174995422363, 2.905937671661377, 3.0914576053619385, 3.276977777481079, 3.4624977111816406, 3.6480178833007812, 3.833538055419922, 4.0190582275390625, 4.204578399658203, 4.390098571777344, 4.575618743896484, 4.761138916015625, 4.946658611297607, 5.132178783416748, 5.317698955535889, 5.503219127655029, 5.688738822937012]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 4.0, 7.0, 13.0, 23.0, 30.0, 39.0, 59.0, 62.0, 120.0, 171.0, 259.0, 464.0, 696.0, 1098.0, 1675.0, 2780.0, 4663.0, 8072.0, 14588.0, 26524.0, 50066.0, 96183.0, 182020.0, 256498.0, 187294.0, 99854.0, 51825.0, 27559.0, 15058.0, 8389.0, 4847.0, 2877.0, 1716.0, 1052.0, 639.0, 432.0, 290.0, 185.0, 137.0, 93.0, 52.0, 33.0, 30.0, 25.0, 15.0, 11.0, 11.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.62890625, -1.577239990234375, -1.52557373046875, -1.473907470703125, -1.4222412109375, -1.370574951171875, -1.31890869140625, -1.267242431640625, -1.215576171875, -1.163909912109375, -1.11224365234375, -1.060577392578125, -1.0089111328125, -0.957244873046875, -0.90557861328125, -0.853912353515625, -0.80224609375, -0.750579833984375, -0.69891357421875, -0.647247314453125, -0.5955810546875, -0.543914794921875, -0.49224853515625, -0.440582275390625, -0.388916015625, -0.337249755859375, -0.28558349609375, -0.233917236328125, -0.1822509765625, -0.130584716796875, -0.07891845703125, -0.027252197265625, 0.0244140625, 0.076080322265625, 0.12774658203125, 0.179412841796875, 0.2310791015625, 0.282745361328125, 0.33441162109375, 0.386077880859375, 0.437744140625, 0.489410400390625, 0.54107666015625, 0.592742919921875, 0.6444091796875, 0.696075439453125, 0.74774169921875, 0.799407958984375, 0.85107421875, 0.902740478515625, 0.95440673828125, 1.006072998046875, 1.0577392578125, 1.109405517578125, 1.16107177734375, 1.212738037109375, 1.264404296875, 1.316070556640625, 1.36773681640625, 1.419403076171875, 1.4710693359375, 1.522735595703125, 1.57440185546875, 1.626068115234375, 1.677734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 7.0, 7.0, 5.0, 11.0, 9.0, 10.0, 17.0, 21.0, 29.0, 22.0, 26.0, 39.0, 27.0, 43.0, 49.0, 43.0, 47.0, 56.0, 33.0, 39.0, 51.0, 44.0, 45.0, 52.0, 32.0, 29.0, 35.0, 24.0, 18.0, 21.0, 21.0, 14.0, 11.0, 12.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.75, -6.53973388671875, -6.3294677734375, -6.11920166015625, -5.908935546875, -5.69866943359375, -5.4884033203125, -5.27813720703125, -5.06787109375, -4.85760498046875, -4.6473388671875, -4.43707275390625, -4.226806640625, -4.01654052734375, -3.8062744140625, -3.59600830078125, -3.3857421875, -3.17547607421875, -2.9652099609375, -2.75494384765625, -2.544677734375, -2.33441162109375, -2.1241455078125, -1.91387939453125, -1.70361328125, -1.49334716796875, -1.2830810546875, -1.07281494140625, -0.862548828125, -0.65228271484375, -0.4420166015625, -0.23175048828125, -0.021484375, 0.18878173828125, 0.3990478515625, 0.60931396484375, 0.819580078125, 1.02984619140625, 1.2401123046875, 1.45037841796875, 1.66064453125, 1.87091064453125, 2.0811767578125, 2.29144287109375, 2.501708984375, 2.71197509765625, 2.9222412109375, 3.13250732421875, 3.3427734375, 3.55303955078125, 3.7633056640625, 3.97357177734375, 4.183837890625, 4.39410400390625, 4.6043701171875, 4.81463623046875, 5.02490234375, 5.23516845703125, 5.4454345703125, 5.65570068359375, 5.865966796875, 6.07623291015625, 6.2864990234375, 6.49676513671875, 6.70703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 6.0, 8.0, 15.0, 27.0, 32.0, 60.0, 94.0, 137.0, 233.0, 357.0, 613.0, 1019.0, 1786.0, 3201.0, 6113.0, 11718.0, 23069.0, 46548.0, 95184.0, 186824.0, 272834.0, 196394.0, 101465.0, 49612.0, 24454.0, 12362.0, 6398.0, 3390.0, 1891.0, 1091.0, 624.0, 394.0, 209.0, 135.0, 93.0, 47.0, 45.0, 22.0, 22.0, 10.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5841522216796875, -1.528656005859375, -1.4731597900390625, -1.41766357421875, -1.3621673583984375, -1.306671142578125, -1.2511749267578125, -1.1956787109375, -1.1401824951171875, -1.084686279296875, -1.0291900634765625, -0.97369384765625, -0.9181976318359375, -0.862701416015625, -0.8072052001953125, -0.751708984375, -0.6962127685546875, -0.640716552734375, -0.5852203369140625, -0.52972412109375, -0.4742279052734375, -0.418731689453125, -0.3632354736328125, -0.3077392578125, -0.2522430419921875, -0.196746826171875, -0.1412506103515625, -0.08575439453125, -0.0302581787109375, 0.025238037109375, 0.0807342529296875, 0.13623046875, 0.1917266845703125, 0.247222900390625, 0.3027191162109375, 0.35821533203125, 0.4137115478515625, 0.469207763671875, 0.5247039794921875, 0.5802001953125, 0.6356964111328125, 0.691192626953125, 0.7466888427734375, 0.80218505859375, 0.8576812744140625, 0.913177490234375, 0.9686737060546875, 1.024169921875, 1.0796661376953125, 1.135162353515625, 1.1906585693359375, 1.24615478515625, 1.3016510009765625, 1.357147216796875, 1.4126434326171875, 1.4681396484375, 1.5236358642578125, 1.579132080078125, 1.6346282958984375, 1.69012451171875, 1.7456207275390625, 1.801116943359375, 1.8566131591796875, 1.912109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 3.0, 10.0, 15.0, 14.0, 11.0, 13.0, 16.0, 20.0, 23.0, 18.0, 22.0, 31.0, 35.0, 36.0, 49.0, 46.0, 42.0, 67.0, 41.0, 39.0, 45.0, 47.0, 50.0, 42.0, 41.0, 41.0, 23.0, 22.0, 24.0, 20.0, 16.0, 10.0, 11.0, 10.0, 14.0, 6.0, 4.0, 1.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.1484375, -4.0252685546875, -3.902099609375, -3.7789306640625, -3.65576171875, -3.5325927734375, -3.409423828125, -3.2862548828125, -3.1630859375, -3.0399169921875, -2.916748046875, -2.7935791015625, -2.67041015625, -2.5472412109375, -2.424072265625, -2.3009033203125, -2.177734375, -2.0545654296875, -1.931396484375, -1.8082275390625, -1.68505859375, -1.5618896484375, -1.438720703125, -1.3155517578125, -1.1923828125, -1.0692138671875, -0.946044921875, -0.8228759765625, -0.69970703125, -0.5765380859375, -0.453369140625, -0.3302001953125, -0.20703125, -0.0838623046875, 0.039306640625, 0.1624755859375, 0.28564453125, 0.4088134765625, 0.531982421875, 0.6551513671875, 0.7783203125, 0.9014892578125, 1.024658203125, 1.1478271484375, 1.27099609375, 1.3941650390625, 1.517333984375, 1.6405029296875, 1.763671875, 1.8868408203125, 2.010009765625, 2.1331787109375, 2.25634765625, 2.3795166015625, 2.502685546875, 2.6258544921875, 2.7490234375, 2.8721923828125, 2.995361328125, 3.1185302734375, 3.24169921875, 3.3648681640625, 3.488037109375, 3.6112060546875, 3.734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 13.0, 11.0, 20.0, 26.0, 52.0, 56.0, 79.0, 140.0, 209.0, 273.0, 449.0, 654.0, 1029.0, 1695.0, 2896.0, 5786.0, 14046.0, 44699.0, 204230.0, 546031.0, 163951.0, 37355.0, 12350.0, 5326.0, 2665.0, 1592.0, 1002.0, 644.0, 405.0, 274.0, 196.0, 134.0, 74.0, 72.0, 30.0, 24.0, 16.0, 13.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8901824951171875, -0.860931396484375, -0.8316802978515625, -0.80242919921875, -0.7731781005859375, -0.743927001953125, -0.7146759033203125, -0.6854248046875, -0.6561737060546875, -0.626922607421875, -0.5976715087890625, -0.56842041015625, -0.5391693115234375, -0.509918212890625, -0.4806671142578125, -0.451416015625, -0.4221649169921875, -0.392913818359375, -0.3636627197265625, -0.33441162109375, -0.3051605224609375, -0.275909423828125, -0.2466583251953125, -0.2174072265625, -0.1881561279296875, -0.158905029296875, -0.1296539306640625, -0.10040283203125, -0.0711517333984375, -0.041900634765625, -0.0126495361328125, 0.0166015625, 0.0458526611328125, 0.075103759765625, 0.1043548583984375, 0.13360595703125, 0.1628570556640625, 0.192108154296875, 0.2213592529296875, 0.2506103515625, 0.2798614501953125, 0.309112548828125, 0.3383636474609375, 0.36761474609375, 0.3968658447265625, 0.426116943359375, 0.4553680419921875, 0.484619140625, 0.5138702392578125, 0.543121337890625, 0.5723724365234375, 0.60162353515625, 0.6308746337890625, 0.660125732421875, 0.6893768310546875, 0.7186279296875, 0.7478790283203125, 0.777130126953125, 0.8063812255859375, 0.83563232421875, 0.8648834228515625, 0.894134521484375, 0.9233856201171875, 0.95263671875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 0.0, 6.0, 4.0, 6.0, 10.0, 8.0, 17.0, 28.0, 24.0, 28.0, 40.0, 39.0, 50.0, 64.0, 63.0, 66.0, 83.0, 91.0, 71.0, 60.0, 45.0, 41.0, 28.0, 27.0, 21.0, 24.0, 14.0, 20.0, 11.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8014183044433594e-05, -2.690032124519348e-05, -2.578645944595337e-05, -2.4672597646713257e-05, -2.3558735847473145e-05, -2.2444874048233032e-05, -2.133101224899292e-05, -2.0217150449752808e-05, -1.9103288650512695e-05, -1.7989426851272583e-05, -1.687556505203247e-05, -1.576170325279236e-05, -1.4647841453552246e-05, -1.3533979654312134e-05, -1.2420117855072021e-05, -1.130625605583191e-05, -1.0192394256591797e-05, -9.078532457351685e-06, -7.964670658111572e-06, -6.85080885887146e-06, -5.736947059631348e-06, -4.623085260391235e-06, -3.509223461151123e-06, -2.3953616619110107e-06, -1.2814998626708984e-06, -1.6763806343078613e-07, 9.462237358093262e-07, 2.0600855350494385e-06, 3.1739473342895508e-06, 4.287809133529663e-06, 5.401670932769775e-06, 6.515532732009888e-06, 7.62939453125e-06, 8.743256330490112e-06, 9.857118129730225e-06, 1.0970979928970337e-05, 1.208484172821045e-05, 1.3198703527450562e-05, 1.4312565326690674e-05, 1.5426427125930786e-05, 1.65402889251709e-05, 1.765415072441101e-05, 1.8768012523651123e-05, 1.9881874322891235e-05, 2.0995736122131348e-05, 2.210959792137146e-05, 2.3223459720611572e-05, 2.4337321519851685e-05, 2.5451183319091797e-05, 2.656504511833191e-05, 2.767890691757202e-05, 2.8792768716812134e-05, 2.9906630516052246e-05, 3.102049231529236e-05, 3.213435411453247e-05, 3.324821591377258e-05, 3.4362077713012695e-05, 3.547593951225281e-05, 3.658980131149292e-05, 3.770366311073303e-05, 3.8817524909973145e-05, 3.993138670921326e-05, 4.104524850845337e-05, 4.215911030769348e-05, 4.3272972106933594e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 16.0, 26.0, 41.0, 45.0, 46.0, 88.0, 136.0, 192.0, 253.0, 363.0, 502.0, 707.0, 1031.0, 1625.0, 2540.0, 4288.0, 7792.0, 15232.0, 34280.0, 84491.0, 220237.0, 360009.0, 184037.0, 70444.0, 28963.0, 13379.0, 6794.0, 3890.0, 2383.0, 1496.0, 940.0, 709.0, 418.0, 313.0, 233.0, 164.0, 126.0, 83.0, 69.0, 53.0, 26.0, 20.0, 20.0, 4.0, 13.0, 8.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.87030029296875, -0.8416748046875, -0.81304931640625, -0.784423828125, -0.75579833984375, -0.7271728515625, -0.69854736328125, -0.669921875, -0.64129638671875, -0.6126708984375, -0.58404541015625, -0.555419921875, -0.52679443359375, -0.4981689453125, -0.46954345703125, -0.44091796875, -0.41229248046875, -0.3836669921875, -0.35504150390625, -0.326416015625, -0.29779052734375, -0.2691650390625, -0.24053955078125, -0.2119140625, -0.18328857421875, -0.1546630859375, -0.12603759765625, -0.097412109375, -0.06878662109375, -0.0401611328125, -0.01153564453125, 0.01708984375, 0.04571533203125, 0.0743408203125, 0.10296630859375, 0.131591796875, 0.16021728515625, 0.1888427734375, 0.21746826171875, 0.24609375, 0.27471923828125, 0.3033447265625, 0.33197021484375, 0.360595703125, 0.38922119140625, 0.4178466796875, 0.44647216796875, 0.47509765625, 0.50372314453125, 0.5323486328125, 0.56097412109375, 0.589599609375, 0.61822509765625, 0.6468505859375, 0.67547607421875, 0.7041015625, 0.73272705078125, 0.7613525390625, 0.78997802734375, 0.818603515625, 0.84722900390625, 0.8758544921875, 0.90447998046875, 0.93310546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 15.0, 18.0, 24.0, 26.0, 47.0, 91.0, 99.0, 127.0, 137.0, 110.0, 83.0, 62.0, 61.0, 19.0, 19.0, 16.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4033203125, -0.3915367126464844, -0.37975311279296875, -0.3679695129394531, -0.3561859130859375, -0.3444023132324219, -0.33261871337890625, -0.3208351135253906, -0.309051513671875, -0.2972679138183594, -0.28548431396484375, -0.2737007141113281, -0.2619171142578125, -0.2501335144042969, -0.23834991455078125, -0.22656631469726562, -0.21478271484375, -0.20299911499023438, -0.19121551513671875, -0.17943191528320312, -0.1676483154296875, -0.15586471557617188, -0.14408111572265625, -0.13229751586914062, -0.120513916015625, -0.10873031616210938, -0.09694671630859375, -0.08516311645507812, -0.0733795166015625, -0.061595916748046875, -0.04981231689453125, -0.038028717041015625, -0.0262451171875, -0.014461517333984375, -0.00267791748046875, 0.009105682373046875, 0.0208892822265625, 0.032672882080078125, 0.04445648193359375, 0.056240081787109375, 0.068023681640625, 0.07980728149414062, 0.09159088134765625, 0.10337448120117188, 0.1151580810546875, 0.12694168090820312, 0.13872528076171875, 0.15050888061523438, 0.16229248046875, 0.17407608032226562, 0.18585968017578125, 0.19764328002929688, 0.2094268798828125, 0.22121047973632812, 0.23299407958984375, 0.24477767944335938, 0.256561279296875, 0.2683448791503906, 0.28012847900390625, 0.2919120788574219, 0.3036956787109375, 0.3154792785644531, 0.32726287841796875, 0.3390464782714844, 0.350830078125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 5.0, 24.0, 10.0, 21.0, 32.0, 37.0, 38.0, 50.0, 58.0, 60.0, 72.0, 78.0, 65.0, 54.0, 52.0, 49.0, 63.0, 39.0, 36.0, 26.0, 21.0, 28.0, 21.0, 9.0, 5.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.094508171081543, -10.80483341217041, -10.515158653259277, -10.225483894348145, -9.935808181762695, -9.646133422851562, -9.35645866394043, -9.066783905029297, -8.777109146118164, -8.487434387207031, -8.197759628295898, -7.908084392547607, -7.618409633636475, -7.328734874725342, -7.039059638977051, -6.749384880065918, -6.459710121154785, -6.170035362243652, -5.8803606033325195, -5.5906853675842285, -5.301010608673096, -5.011335849761963, -4.721660614013672, -4.431985855102539, -4.142311096191406, -3.8526363372802734, -3.5629613399505615, -3.2732863426208496, -2.983611583709717, -2.693936824798584, -2.404261827468872, -2.11458683013916, -1.8249125480651855, -1.5352376699447632, -1.2455627918243408, -0.9558879137039185, -0.6662130355834961, -0.37653815746307373, -0.08686327934265137, 0.20281171798706055, 0.49248647689819336, 0.7821613550186157, 1.071836233139038, 1.3615111112594604, 1.6511859893798828, 1.9408608675003052, 2.2305357456207275, 2.5202107429504395, 2.8098855018615723, 3.099560260772705, 3.389235258102417, 3.678910255432129, 3.9685850143432617, 4.2582597732543945, 4.547934532165527, 4.837609767913818, 5.127284526824951, 5.416959285736084, 5.706634521484375, 5.996309280395508, 6.285984039306641, 6.575658798217773, 6.865333557128906, 7.155008792877197, 7.44468355178833]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 11.0, 8.0, 13.0, 8.0, 14.0, 19.0, 16.0, 16.0, 26.0, 30.0, 27.0, 23.0, 31.0, 37.0, 37.0, 47.0, 43.0, 58.0, 40.0, 46.0, 41.0, 37.0, 42.0, 41.0, 40.0, 36.0, 37.0, 26.0, 19.0, 16.0, 19.0, 13.0, 17.0, 12.0, 9.0, 9.0, 5.0, 3.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.316371440887451, -6.126894950866699, -5.937417984008789, -5.747941017150879, -5.558464527130127, -5.368988037109375, -5.179511070251465, -4.990034103393555, -4.800557613372803, -4.611081123352051, -4.421604156494141, -4.2321271896362305, -4.0426506996154785, -3.8531739711761475, -3.6636972427368164, -3.4742205142974854, -3.2847437858581543, -3.0952670574188232, -2.905790328979492, -2.716313600540161, -2.52683687210083, -2.337360143661499, -2.147883415222168, -1.958406686782837, -1.7689299583435059, -1.5794532299041748, -1.3899765014648438, -1.2004997730255127, -1.0110230445861816, -0.8215463161468506, -0.6320695877075195, -0.4425928592681885, -0.2531156539916992, -0.06363892555236816, 0.1258378028869629, 0.31531453132629395, 0.504791259765625, 0.694267988204956, 0.8837447166442871, 1.0732214450836182, 1.2626981735229492, 1.4521749019622803, 1.6416516304016113, 1.8311283588409424, 2.0206050872802734, 2.2100818157196045, 2.3995585441589355, 2.5890352725982666, 2.7785120010375977, 2.9679887294769287, 3.1574654579162598, 3.346942186355591, 3.536418914794922, 3.725895643234253, 3.915372371673584, 4.104848861694336, 4.294325828552246, 4.483802795410156, 4.673279285430908, 4.86275577545166, 5.05223274230957, 5.2417097091674805, 5.431186199188232, 5.620662689208984, 5.8101396560668945]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 27.0, 21.0, 49.0, 54.0, 114.0, 163.0, 171.0, 290.0, 458.0, 666.0, 975.0, 1629.0, 2531.0, 4060.0, 6616.0, 11381.0, 19757.0, 35304.0, 62042.0, 104007.0, 152196.0, 179576.0, 166154.0, 121463.0, 75861.0, 43701.0, 24282.0, 13994.0, 7868.0, 4834.0, 2899.0, 1894.0, 1222.0, 747.0, 511.0, 304.0, 257.0, 141.0, 102.0, 65.0, 57.0, 32.0, 22.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3359375, -5.17266845703125, -5.0093994140625, -4.84613037109375, -4.682861328125, -4.51959228515625, -4.3563232421875, -4.19305419921875, -4.02978515625, -3.86651611328125, -3.7032470703125, -3.53997802734375, -3.376708984375, -3.21343994140625, -3.0501708984375, -2.88690185546875, -2.7236328125, -2.56036376953125, -2.3970947265625, -2.23382568359375, -2.070556640625, -1.90728759765625, -1.7440185546875, -1.58074951171875, -1.41748046875, -1.25421142578125, -1.0909423828125, -0.92767333984375, -0.764404296875, -0.60113525390625, -0.4378662109375, -0.27459716796875, -0.111328125, 0.05194091796875, 0.2152099609375, 0.37847900390625, 0.541748046875, 0.70501708984375, 0.8682861328125, 1.03155517578125, 1.19482421875, 1.35809326171875, 1.5213623046875, 1.68463134765625, 1.847900390625, 2.01116943359375, 2.1744384765625, 2.33770751953125, 2.5009765625, 2.66424560546875, 2.8275146484375, 2.99078369140625, 3.154052734375, 3.31732177734375, 3.4805908203125, 3.64385986328125, 3.80712890625, 3.97039794921875, 4.1336669921875, 4.29693603515625, 4.460205078125, 4.62347412109375, 4.7867431640625, 4.95001220703125, 5.11328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 8.0, 13.0, 12.0, 12.0, 22.0, 19.0, 24.0, 21.0, 24.0, 28.0, 35.0, 29.0, 33.0, 34.0, 40.0, 45.0, 50.0, 45.0, 50.0, 37.0, 43.0, 46.0, 38.0, 31.0, 36.0, 36.0, 22.0, 20.0, 22.0, 24.0, 15.0, 8.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.59765625, -6.400146484375, -6.20263671875, -6.005126953125, -5.8076171875, -5.610107421875, -5.41259765625, -5.215087890625, -5.017578125, -4.820068359375, -4.62255859375, -4.425048828125, -4.2275390625, -4.030029296875, -3.83251953125, -3.635009765625, -3.4375, -3.239990234375, -3.04248046875, -2.844970703125, -2.6474609375, -2.449951171875, -2.25244140625, -2.054931640625, -1.857421875, -1.659912109375, -1.46240234375, -1.264892578125, -1.0673828125, -0.869873046875, -0.67236328125, -0.474853515625, -0.27734375, -0.079833984375, 0.11767578125, 0.315185546875, 0.5126953125, 0.710205078125, 0.90771484375, 1.105224609375, 1.302734375, 1.500244140625, 1.69775390625, 1.895263671875, 2.0927734375, 2.290283203125, 2.48779296875, 2.685302734375, 2.8828125, 3.080322265625, 3.27783203125, 3.475341796875, 3.6728515625, 3.870361328125, 4.06787109375, 4.265380859375, 4.462890625, 4.660400390625, 4.85791015625, 5.055419921875, 5.2529296875, 5.450439453125, 5.64794921875, 5.845458984375, 6.04296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 8.0, 18.0, 32.0, 32.0, 51.0, 70.0, 120.0, 132.0, 213.0, 335.0, 539.0, 752.0, 1185.0, 1851.0, 3014.0, 4721.0, 7716.0, 12466.0, 20804.0, 35708.0, 62572.0, 111614.0, 176604.0, 206782.0, 164834.0, 99424.0, 55959.0, 32040.0, 18758.0, 11333.0, 6772.0, 4347.0, 2789.0, 1727.0, 1056.0, 699.0, 473.0, 298.0, 229.0, 134.0, 101.0, 62.0, 63.0, 34.0, 15.0, 12.0, 13.0, 5.0, 7.0, 1.0, 8.0, 1.0, 2.0, 4.0, 3.0, 2.0], "bins": [-7.9921875, -7.7376708984375, -7.483154296875, -7.2286376953125, -6.97412109375, -6.7196044921875, -6.465087890625, -6.2105712890625, -5.9560546875, -5.7015380859375, -5.447021484375, -5.1925048828125, -4.93798828125, -4.6834716796875, -4.428955078125, -4.1744384765625, -3.919921875, -3.6654052734375, -3.410888671875, -3.1563720703125, -2.90185546875, -2.6473388671875, -2.392822265625, -2.1383056640625, -1.8837890625, -1.6292724609375, -1.374755859375, -1.1202392578125, -0.86572265625, -0.6112060546875, -0.356689453125, -0.1021728515625, 0.15234375, 0.4068603515625, 0.661376953125, 0.9158935546875, 1.17041015625, 1.4249267578125, 1.679443359375, 1.9339599609375, 2.1884765625, 2.4429931640625, 2.697509765625, 2.9520263671875, 3.20654296875, 3.4610595703125, 3.715576171875, 3.9700927734375, 4.224609375, 4.4791259765625, 4.733642578125, 4.9881591796875, 5.24267578125, 5.4971923828125, 5.751708984375, 6.0062255859375, 6.2607421875, 6.5152587890625, 6.769775390625, 7.0242919921875, 7.27880859375, 7.5333251953125, 7.787841796875, 8.0423583984375, 8.296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 18.0, 18.0, 21.0, 31.0, 34.0, 28.0, 27.0, 27.0, 33.0, 33.0, 34.0, 40.0, 47.0, 43.0, 31.0, 40.0, 47.0, 46.0, 29.0, 35.0, 32.0, 28.0, 30.0, 33.0, 38.0, 31.0, 19.0, 15.0, 14.0, 9.0, 15.0, 6.0, 9.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.05987548828125, -3.9400634765625, -3.82025146484375, -3.700439453125, -3.58062744140625, -3.4608154296875, -3.34100341796875, -3.22119140625, -3.10137939453125, -2.9815673828125, -2.86175537109375, -2.741943359375, -2.62213134765625, -2.5023193359375, -2.38250732421875, -2.2626953125, -2.14288330078125, -2.0230712890625, -1.90325927734375, -1.783447265625, -1.66363525390625, -1.5438232421875, -1.42401123046875, -1.30419921875, -1.18438720703125, -1.0645751953125, -0.94476318359375, -0.824951171875, -0.70513916015625, -0.5853271484375, -0.46551513671875, -0.345703125, -0.22589111328125, -0.1060791015625, 0.01373291015625, 0.133544921875, 0.25335693359375, 0.3731689453125, 0.49298095703125, 0.61279296875, 0.73260498046875, 0.8524169921875, 0.97222900390625, 1.092041015625, 1.21185302734375, 1.3316650390625, 1.45147705078125, 1.5712890625, 1.69110107421875, 1.8109130859375, 1.93072509765625, 2.050537109375, 2.17034912109375, 2.2901611328125, 2.40997314453125, 2.52978515625, 2.64959716796875, 2.7694091796875, 2.88922119140625, 3.009033203125, 3.12884521484375, 3.2486572265625, 3.36846923828125, 3.48828125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 16.0, 42.0, 42.0, 93.0, 86.0, 176.0, 254.0, 354.0, 596.0, 946.0, 1402.0, 2262.0, 3653.0, 5933.0, 9872.0, 16166.0, 26282.0, 41607.0, 63102.0, 89169.0, 114388.0, 132332.0, 133759.0, 119219.0, 95489.0, 68855.0, 46245.0, 29492.0, 18039.0, 10982.0, 6656.0, 4097.0, 2533.0, 1492.0, 1055.0, 594.0, 403.0, 286.0, 166.0, 140.0, 77.0, 64.0, 46.0, 22.0, 15.0, 7.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.4638671875, -1.4196624755859375, -1.375457763671875, -1.3312530517578125, -1.28704833984375, -1.2428436279296875, -1.198638916015625, -1.1544342041015625, -1.1102294921875, -1.0660247802734375, -1.021820068359375, -0.9776153564453125, -0.93341064453125, -0.8892059326171875, -0.845001220703125, -0.8007965087890625, -0.756591796875, -0.7123870849609375, -0.668182373046875, -0.6239776611328125, -0.57977294921875, -0.5355682373046875, -0.491363525390625, -0.4471588134765625, -0.4029541015625, -0.3587493896484375, -0.314544677734375, -0.2703399658203125, -0.22613525390625, -0.1819305419921875, -0.137725830078125, -0.0935211181640625, -0.04931640625, -0.0051116943359375, 0.039093017578125, 0.0832977294921875, 0.12750244140625, 0.1717071533203125, 0.215911865234375, 0.2601165771484375, 0.3043212890625, 0.3485260009765625, 0.392730712890625, 0.4369354248046875, 0.48114013671875, 0.5253448486328125, 0.569549560546875, 0.6137542724609375, 0.657958984375, 0.7021636962890625, 0.746368408203125, 0.7905731201171875, 0.83477783203125, 0.8789825439453125, 0.923187255859375, 0.9673919677734375, 1.0115966796875, 1.0558013916015625, 1.100006103515625, 1.1442108154296875, 1.18841552734375, 1.2326202392578125, 1.276824951171875, 1.3210296630859375, 1.365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 12.0, 20.0, 21.0, 21.0, 34.0, 47.0, 36.0, 42.0, 55.0, 45.0, 62.0, 65.0, 57.0, 47.0, 59.0, 66.0, 50.0, 47.0, 38.0, 26.0, 25.0, 17.0, 26.0, 14.0, 10.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001915767788887024, -0.0001852661371231079, -0.00017895549535751343, -0.00017264485359191895, -0.00016633421182632446, -0.00016002357006072998, -0.0001537129282951355, -0.00014740228652954102, -0.00014109164476394653, -0.00013478100299835205, -0.00012847036123275757, -0.00012215971946716309, -0.0001158490777015686, -0.00010953843593597412, -0.00010322779417037964, -9.691715240478516e-05, -9.060651063919067e-05, -8.429586887359619e-05, -7.798522710800171e-05, -7.167458534240723e-05, -6.536394357681274e-05, -5.905330181121826e-05, -5.274266004562378e-05, -4.64320182800293e-05, -4.0121376514434814e-05, -3.381073474884033e-05, -2.750009298324585e-05, -2.1189451217651367e-05, -1.4878809452056885e-05, -8.568167686462402e-06, -2.25752592086792e-06, 4.0531158447265625e-06, 1.0363757610321045e-05, 1.6674399375915527e-05, 2.298504114151001e-05, 2.9295682907104492e-05, 3.5606324672698975e-05, 4.191696643829346e-05, 4.822760820388794e-05, 5.453824996948242e-05, 6.0848891735076904e-05, 6.715953350067139e-05, 7.347017526626587e-05, 7.978081703186035e-05, 8.609145879745483e-05, 9.240210056304932e-05, 9.87127423286438e-05, 0.00010502338409423828, 0.00011133402585983276, 0.00011764466762542725, 0.00012395530939102173, 0.0001302659511566162, 0.0001365765929222107, 0.00014288723468780518, 0.00014919787645339966, 0.00015550851821899414, 0.00016181915998458862, 0.0001681298017501831, 0.0001744404435157776, 0.00018075108528137207, 0.00018706172704696655, 0.00019337236881256104, 0.00019968301057815552, 0.00020599365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 9.0, 7.0, 18.0, 23.0, 48.0, 58.0, 90.0, 139.0, 252.0, 383.0, 573.0, 999.0, 1628.0, 2790.0, 4603.0, 8160.0, 13796.0, 23291.0, 38158.0, 59980.0, 87228.0, 115249.0, 135668.0, 139778.0, 125858.0, 99780.0, 71202.0, 47053.0, 29118.0, 17613.0, 10173.0, 6042.0, 3546.0, 2042.0, 1280.0, 736.0, 458.0, 286.0, 181.0, 99.0, 53.0, 54.0, 26.0, 13.0, 9.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3470306396484375, -1.302459716796875, -1.2578887939453125, -1.21331787109375, -1.1687469482421875, -1.124176025390625, -1.0796051025390625, -1.0350341796875, -0.9904632568359375, -0.945892333984375, -0.9013214111328125, -0.85675048828125, -0.8121795654296875, -0.767608642578125, -0.7230377197265625, -0.678466796875, -0.6338958740234375, -0.589324951171875, -0.5447540283203125, -0.50018310546875, -0.4556121826171875, -0.411041259765625, -0.3664703369140625, -0.3218994140625, -0.2773284912109375, -0.232757568359375, -0.1881866455078125, -0.14361572265625, -0.0990447998046875, -0.054473876953125, -0.0099029541015625, 0.03466796875, 0.0792388916015625, 0.123809814453125, 0.1683807373046875, 0.21295166015625, 0.2575225830078125, 0.302093505859375, 0.3466644287109375, 0.3912353515625, 0.4358062744140625, 0.480377197265625, 0.5249481201171875, 0.56951904296875, 0.6140899658203125, 0.658660888671875, 0.7032318115234375, 0.747802734375, 0.7923736572265625, 0.836944580078125, 0.8815155029296875, 0.92608642578125, 0.9706573486328125, 1.015228271484375, 1.0597991943359375, 1.1043701171875, 1.1489410400390625, 1.193511962890625, 1.2380828857421875, 1.28265380859375, 1.3272247314453125, 1.371795654296875, 1.4163665771484375, 1.4609375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 7.0, 10.0, 8.0, 7.0, 14.0, 18.0, 17.0, 31.0, 28.0, 25.0, 31.0, 40.0, 30.0, 48.0, 46.0, 37.0, 50.0, 44.0, 48.0, 43.0, 43.0, 43.0, 42.0, 32.0, 37.0, 27.0, 24.0, 24.0, 22.0, 14.0, 25.0, 12.0, 9.0, 9.0, 4.0, 8.0, 3.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.42792510986328125, -0.4134674072265625, -0.39900970458984375, -0.384552001953125, -0.37009429931640625, -0.3556365966796875, -0.34117889404296875, -0.32672119140625, -0.31226348876953125, -0.2978057861328125, -0.28334808349609375, -0.268890380859375, -0.25443267822265625, -0.2399749755859375, -0.22551727294921875, -0.2110595703125, -0.19660186767578125, -0.1821441650390625, -0.16768646240234375, -0.153228759765625, -0.13877105712890625, -0.1243133544921875, -0.10985565185546875, -0.09539794921875, -0.08094024658203125, -0.0664825439453125, -0.05202484130859375, -0.037567138671875, -0.02310943603515625, -0.0086517333984375, 0.00580596923828125, 0.020263671875, 0.03472137451171875, 0.0491790771484375, 0.06363677978515625, 0.078094482421875, 0.09255218505859375, 0.1070098876953125, 0.12146759033203125, 0.13592529296875, 0.15038299560546875, 0.1648406982421875, 0.17929840087890625, 0.193756103515625, 0.20821380615234375, 0.2226715087890625, 0.23712921142578125, 0.2515869140625, 0.26604461669921875, 0.2805023193359375, 0.29496002197265625, 0.309417724609375, 0.32387542724609375, 0.3383331298828125, 0.35279083251953125, 0.36724853515625, 0.38170623779296875, 0.3961639404296875, 0.41062164306640625, 0.425079345703125, 0.43953704833984375, 0.4539947509765625, 0.46845245361328125, 0.48291015625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 16.0, 16.0, 30.0, 32.0, 34.0, 37.0, 40.0, 51.0, 38.0, 63.0, 57.0, 72.0, 60.0, 55.0, 54.0, 47.0, 42.0, 29.0, 29.0, 29.0, 23.0, 15.0, 24.0, 16.0, 14.0, 11.0, 2.0, 3.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.497963905334473, -9.224068641662598, -8.950172424316406, -8.676277160644531, -8.40238094329834, -8.128485679626465, -7.854589939117432, -7.580694198608398, -7.306798934936523, -7.03290319442749, -6.759007453918457, -6.485112190246582, -6.211216449737549, -5.937320709228516, -5.663424968719482, -5.389529228210449, -5.115633487701416, -4.841737747192383, -4.56784200668335, -4.293946266174316, -4.020051002502441, -3.746155261993408, -3.472259521484375, -3.198363780975342, -2.9244682788848877, -2.6505725383758545, -2.3766770362854004, -2.102781295776367, -1.8288856744766235, -1.5549900531768799, -1.2810943126678467, -1.007198691368103, -0.7333030700683594, -0.45940741896629333, -0.1855117678642273, 0.08838391304016113, 0.3622795343399048, 0.6361751556396484, 0.9100708961486816, 1.1839665174484253, 1.457862138748169, 1.7317577600479126, 2.0056533813476562, 2.2795491218566895, 2.5534448623657227, 2.8273403644561768, 3.10123610496521, 3.375131607055664, 3.6490273475646973, 3.9229230880737305, 4.196818828582764, 4.470714569091797, 4.744609832763672, 5.018505573272705, 5.292401313781738, 5.5662970542907715, 5.840192794799805, 6.114088535308838, 6.387984275817871, 6.661879539489746, 6.935775279998779, 7.2096710205078125, 7.483566761016846, 7.757462501525879, 8.031357765197754]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 14.0, 10.0, 17.0, 20.0, 30.0, 18.0, 24.0, 29.0, 38.0, 30.0, 47.0, 41.0, 43.0, 63.0, 58.0, 38.0, 44.0, 44.0, 51.0, 38.0, 26.0, 35.0, 36.0, 37.0, 25.0, 28.0, 15.0, 19.0, 14.0, 11.0, 7.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.619253158569336, -8.35822868347168, -8.097204208374023, -7.836179733276367, -7.575155258178711, -7.314130783081055, -7.053106307983398, -6.792081832885742, -6.531057357788086, -6.27003288269043, -6.009008407592773, -5.747983932495117, -5.486959457397461, -5.225934982299805, -4.964910507202148, -4.703886032104492, -4.442862033843994, -4.181837558746338, -3.9208130836486816, -3.6597886085510254, -3.398764133453369, -3.137739658355713, -2.8767154216766357, -2.6156909465789795, -2.3546664714813232, -2.093641996383667, -1.8326175212860107, -1.571593165397644, -1.3105686902999878, -1.0495442152023315, -0.7885198593139648, -0.5274953842163086, -0.26647090911865234, -0.0054464638233184814, 0.2555779814720154, 0.5166023969650269, 0.7776268720626831, 1.0386513471603394, 1.299675703048706, 1.5607001781463623, 1.8217246532440186, 2.082749128341675, 2.343773603439331, 2.604797840118408, 2.8658223152160645, 3.1268467903137207, 3.387871265411377, 3.648895740509033, 3.9099202156066895, 4.170944690704346, 4.431969165802002, 4.692993640899658, 4.9540181159973145, 5.215042591094971, 5.476066589355469, 5.737091064453125, 5.998115539550781, 6.2591400146484375, 6.520164489746094, 6.78118896484375, 7.042213439941406, 7.3032379150390625, 7.564262390136719, 7.825286865234375, 8.086311340332031]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 5.0, 16.0, 18.0, 21.0, 31.0, 42.0, 48.0, 65.0, 81.0, 119.0, 137.0, 225.0, 301.0, 390.0, 566.0, 793.0, 1131.0, 1655.0, 2295.0, 3183.0, 4330.0, 488572.0, 5585.0, 4059.0, 3035.0, 2148.0, 1544.0, 1086.0, 749.0, 554.0, 396.0, 265.0, 222.0, 142.0, 96.0, 83.0, 60.0, 46.0, 33.0, 28.0, 26.0, 14.0, 22.0, 7.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-71.41798400878906, -69.10797119140625, -66.79795837402344, -64.48794555664062, -62.17793273925781, -59.867919921875, -57.55790328979492, -55.24789047241211, -52.9378776550293, -50.627864837646484, -48.31785202026367, -46.00783920288086, -43.69782257080078, -41.38780975341797, -39.077796936035156, -36.767784118652344, -34.45777130126953, -32.14775848388672, -29.837745666503906, -27.52773094177246, -25.21771812438965, -22.907705307006836, -20.59769058227539, -18.287677764892578, -15.977664947509766, -13.667652130126953, -11.357638359069824, -9.047624588012695, -6.737611770629883, -4.42759895324707, -2.1175851821899414, 0.1924285888671875, 2.50244140625, 4.812454700469971, 7.122467994689941, 9.43248176574707, 11.742494583129883, 14.052507400512695, 16.36252212524414, 18.672534942626953, 20.982547760009766, 23.292560577392578, 25.60257339477539, 27.912588119506836, 30.22260093688965, 32.532615661621094, 34.842628479003906, 37.15264129638672, 39.46265411376953, 41.772666931152344, 44.082679748535156, 46.39269256591797, 48.70270538330078, 51.012718200683594, 53.32273483276367, 55.632747650146484, 57.9427604675293, 60.25277328491211, 62.56278610229492, 64.872802734375, 67.18281555175781, 69.49282836914062, 71.80284118652344, 74.11285400390625, 76.42286682128906]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 12.0, 11.0, 12.0, 15.0, 22.0, 30.0, 16.0, 24.0, 29.0, 41.0, 28.0, 45.0, 43.0, 46.0, 64.0, 1080.0, 43.0, 42.0, 46.0, 50.0, 34.0, 28.0, 40.0, 36.0, 33.0, 27.0, 27.0, 12.0, 18.0, 14.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-265.3472595214844, -257.3047790527344, -249.26229858398438, -241.21981811523438, -233.17733764648438, -225.13485717773438, -217.09237670898438, -209.04989624023438, -201.00741577148438, -192.96493530273438, -184.92245483398438, -176.87997436523438, -168.83749389648438, -160.79501342773438, -152.75253295898438, -144.71005249023438, -136.66758728027344, -128.62510681152344, -120.58262634277344, -112.54014587402344, -104.49766540527344, -96.45518493652344, -88.41271209716797, -80.37023162841797, -72.32775115966797, -64.28527069091797, -56.24279022216797, -48.200313568115234, -40.157833099365234, -32.115352630615234, -24.0728759765625, -16.0303955078125, -7.9879150390625, 0.054564476013183594, 8.097043991088867, 16.139522552490234, 24.182003021240234, 32.224483489990234, 40.26696014404297, 48.30944061279297, 56.35192108154297, 64.39440155029297, 72.43688201904297, 80.47935485839844, 88.52183532714844, 96.56431579589844, 104.60679626464844, 112.64927673339844, 120.69175720214844, 128.73423767089844, 136.77671813964844, 144.81919860839844, 152.86167907714844, 160.90415954589844, 168.94662475585938, 176.98910522460938, 185.03158569335938, 193.07406616210938, 201.11654663085938, 209.15902709960938, 217.20150756835938, 225.24398803710938, 233.28646850585938, 241.32894897460938, 249.37142944335938]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 13.0, 6.0, 13.0, 21.0, 21.0, 26.0, 39.0, 51.0, 80.0, 67.0, 123.0, 156.0, 178.0, 264.0, 373.0, 523.0, 687.0, 1038.0, 1566.0, 2346.0, 3328.0, 4723.0, 6289.0, 8418.0, 10499.0, 13807.0, 20183.0, 390907.0, 30684016.0, 34277.0, 31096.0, 16687.0, 8575.0, 5095.0, 3060.0, 1958.0, 1258.0, 808.0, 584.0, 378.0, 297.0, 229.0, 168.0, 119.0, 75.0, 36.0, 22.0, 12.0, 9.0, 5.0, 5.0, 2.0], "bins": [-91.87071228027344, -89.57714080810547, -87.2835693359375, -84.989990234375, -82.69641876220703, -80.40284729003906, -78.1092758178711, -75.81570434570312, -73.52213287353516, -71.22856140136719, -68.93498992919922, -66.64141845703125, -64.34783935546875, -62.05426788330078, -59.76069641113281, -57.467124938964844, -55.17354965209961, -52.87997817993164, -50.586402893066406, -48.29283142089844, -45.99925994873047, -43.7056884765625, -41.412113189697266, -39.1185417175293, -36.82496643066406, -34.531394958496094, -32.23781967163086, -29.94424819946289, -27.650676727294922, -25.35710334777832, -23.06352996826172, -20.76995849609375, -18.47638702392578, -16.18281364440918, -13.889242172241211, -11.59566879272461, -9.302096366882324, -7.008523941040039, -4.7149505615234375, -2.4213790893554688, -0.1278057098388672, 2.165766954421997, 4.459339618682861, 6.752912521362305, 9.04648494720459, 11.340057373046875, 13.633630752563477, 15.927202224731445, 18.220775604248047, 20.51434898376465, 22.807920455932617, 25.10149383544922, 27.395065307617188, 29.68863868713379, 31.98221206665039, 34.27578353881836, 36.569358825683594, 38.86293029785156, 41.1565055847168, 43.450077056884766, 45.743648529052734, 48.03722381591797, 50.33079528808594, 52.624366760253906, 54.917938232421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 7.0, 15.0, 35.0, 47.0, 60.0, 73.0, 116.0, 167.0, 315.0, 509.0, 803.0, 1318.0, 2134.0, 3665.0, 6640.0, 12180.0, 24035.0, 51122.0, 117466.0, 302918.0, 946099.0, 3192008.0, 1063741.0, 330040.0, 126212.0, 54654.0, 25465.0, 12773.0, 6922.0, 3912.0, 2294.0, 1376.0, 862.0, 532.0, 323.0, 204.0, 118.0, 89.0, 55.0, 45.0, 26.0, 19.0, 13.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.6171875, -5.44970703125, -5.2822265625, -5.11474609375, -4.947265625, -4.77978515625, -4.6123046875, -4.44482421875, -4.27734375, -4.10986328125, -3.9423828125, -3.77490234375, -3.607421875, -3.43994140625, -3.2724609375, -3.10498046875, -2.9375, -2.77001953125, -2.6025390625, -2.43505859375, -2.267578125, -2.10009765625, -1.9326171875, -1.76513671875, -1.59765625, -1.43017578125, -1.2626953125, -1.09521484375, -0.927734375, -0.76025390625, -0.5927734375, -0.42529296875, -0.2578125, -0.09033203125, 0.0771484375, 0.24462890625, 0.412109375, 0.57958984375, 0.7470703125, 0.91455078125, 1.08203125, 1.24951171875, 1.4169921875, 1.58447265625, 1.751953125, 1.91943359375, 2.0869140625, 2.25439453125, 2.421875, 2.58935546875, 2.7568359375, 2.92431640625, 3.091796875, 3.25927734375, 3.4267578125, 3.59423828125, 3.76171875, 3.92919921875, 4.0966796875, 4.26416015625, 4.431640625, 4.59912109375, 4.7666015625, 4.93408203125, 5.1015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 3.0, 9.0, 6.0, 7.0, 9.0, 14.0, 14.0, 20.0, 21.0, 20.0, 27.0, 28.0, 34.0, 36.0, 38.0, 41.0, 44.0, 77.0, 149.0, 205.0, 258.0, 241.0, 146.0, 112.0, 74.0, 56.0, 44.0, 36.0, 35.0, 32.0, 27.0, 21.0, 24.0, 21.0, 14.0, 8.0, 17.0, 8.0, 9.0, 5.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.91796875, -3.79302978515625, -3.6680908203125, -3.54315185546875, -3.418212890625, -3.29327392578125, -3.1683349609375, -3.04339599609375, -2.91845703125, -2.79351806640625, -2.6685791015625, -2.54364013671875, -2.418701171875, -2.29376220703125, -2.1688232421875, -2.04388427734375, -1.9189453125, -1.79400634765625, -1.6690673828125, -1.54412841796875, -1.419189453125, -1.29425048828125, -1.1693115234375, -1.04437255859375, -0.91943359375, -0.79449462890625, -0.6695556640625, -0.54461669921875, -0.419677734375, -0.29473876953125, -0.1697998046875, -0.04486083984375, 0.080078125, 0.20501708984375, 0.3299560546875, 0.45489501953125, 0.579833984375, 0.70477294921875, 0.8297119140625, 0.95465087890625, 1.07958984375, 1.20452880859375, 1.3294677734375, 1.45440673828125, 1.579345703125, 1.70428466796875, 1.8292236328125, 1.95416259765625, 2.0791015625, 2.20404052734375, 2.3289794921875, 2.45391845703125, 2.578857421875, 2.70379638671875, 2.8287353515625, 2.95367431640625, 3.07861328125, 3.20355224609375, 3.3284912109375, 3.45343017578125, 3.578369140625, 3.70330810546875, 3.8282470703125, 3.95318603515625, 4.078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 5.0, 4.0, 14.0, 15.0, 16.0, 32.0, 56.0, 73.0, 81.0, 111.0, 158.0, 181.0, 267.0, 364.0, 510.0, 795.0, 1273.0, 1989.0, 3325.0, 5704.0, 9669.0, 17815.0, 33305.0, 64494.0, 130528.0, 279611.0, 702793.0, 3070359.0, 1223262.0, 388281.0, 175235.0, 85214.0, 43114.0, 22472.0, 12227.0, 6925.0, 3987.0, 2479.0, 1454.0, 1012.0, 668.0, 478.0, 318.0, 241.0, 164.0, 89.0, 60.0, 43.0, 42.0, 20.0, 20.0, 13.0, 18.0, 11.0, 10.0, 6.0, 8.0, 7.0, 7.0, 4.0, 3.0], "bins": [-3.26171875, -3.15545654296875, -3.0491943359375, -2.94293212890625, -2.836669921875, -2.73040771484375, -2.6241455078125, -2.51788330078125, -2.41162109375, -2.30535888671875, -2.1990966796875, -2.09283447265625, -1.986572265625, -1.88031005859375, -1.7740478515625, -1.66778564453125, -1.5615234375, -1.45526123046875, -1.3489990234375, -1.24273681640625, -1.136474609375, -1.03021240234375, -0.9239501953125, -0.81768798828125, -0.71142578125, -0.60516357421875, -0.4989013671875, -0.39263916015625, -0.286376953125, -0.18011474609375, -0.0738525390625, 0.03240966796875, 0.138671875, 0.24493408203125, 0.3511962890625, 0.45745849609375, 0.563720703125, 0.66998291015625, 0.7762451171875, 0.88250732421875, 0.98876953125, 1.09503173828125, 1.2012939453125, 1.30755615234375, 1.413818359375, 1.52008056640625, 1.6263427734375, 1.73260498046875, 1.8388671875, 1.94512939453125, 2.0513916015625, 2.15765380859375, 2.263916015625, 2.37017822265625, 2.4764404296875, 2.58270263671875, 2.68896484375, 2.79522705078125, 2.9014892578125, 3.00775146484375, 3.114013671875, 3.22027587890625, 3.3265380859375, 3.43280029296875, 3.5390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 16.0, 12.0, 16.0, 23.0, 26.0, 58.0, 45.0, 69.0, 88.0, 201.0, 454.0, 409.0, 172.0, 108.0, 76.0, 51.0, 40.0, 38.0, 28.0, 27.0, 11.0, 4.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.078125, -7.8463134765625, -7.614501953125, -7.3826904296875, -7.15087890625, -6.9190673828125, -6.687255859375, -6.4554443359375, -6.2236328125, -5.9918212890625, -5.760009765625, -5.5281982421875, -5.29638671875, -5.0645751953125, -4.832763671875, -4.6009521484375, -4.369140625, -4.1373291015625, -3.905517578125, -3.6737060546875, -3.44189453125, -3.2100830078125, -2.978271484375, -2.7464599609375, -2.5146484375, -2.2828369140625, -2.051025390625, -1.8192138671875, -1.58740234375, -1.3555908203125, -1.123779296875, -0.8919677734375, -0.66015625, -0.4283447265625, -0.196533203125, 0.0352783203125, 0.26708984375, 0.4989013671875, 0.730712890625, 0.9625244140625, 1.1943359375, 1.4261474609375, 1.657958984375, 1.8897705078125, 2.12158203125, 2.3533935546875, 2.585205078125, 2.8170166015625, 3.048828125, 3.2806396484375, 3.512451171875, 3.7442626953125, 3.97607421875, 4.2078857421875, 4.439697265625, 4.6715087890625, 4.9033203125, 5.1351318359375, 5.366943359375, 5.5987548828125, 5.83056640625, 6.0623779296875, 6.294189453125, 6.5260009765625, 6.7578125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 6.0, 7.0, 13.0, 10.0, 21.0, 16.0, 24.0, 37.0, 41.0, 27.0, 38.0, 54.0, 96.0, 120.0, 154.0, 214.0, 303.0, 524.0, 736.0, 1145.0, 1915.0, 3715.0, 8078.0, 21912.0, 94092.0, 5988706.0, 124753.0, 25506.0, 9146.0, 4035.0, 2220.0, 1231.0, 813.0, 519.0, 313.0, 269.0, 139.0, 135.0, 91.0, 57.0, 46.0, 29.0, 32.0, 25.0, 21.0, 17.0, 15.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-25.90625, -25.085693359375, -24.26513671875, -23.444580078125, -22.6240234375, -21.803466796875, -20.98291015625, -20.162353515625, -19.341796875, -18.521240234375, -17.70068359375, -16.880126953125, -16.0595703125, -15.239013671875, -14.41845703125, -13.597900390625, -12.77734375, -11.956787109375, -11.13623046875, -10.315673828125, -9.4951171875, -8.674560546875, -7.85400390625, -7.033447265625, -6.212890625, -5.392333984375, -4.57177734375, -3.751220703125, -2.9306640625, -2.110107421875, -1.28955078125, -0.468994140625, 0.3515625, 1.172119140625, 1.99267578125, 2.813232421875, 3.6337890625, 4.454345703125, 5.27490234375, 6.095458984375, 6.916015625, 7.736572265625, 8.55712890625, 9.377685546875, 10.1982421875, 11.018798828125, 11.83935546875, 12.659912109375, 13.48046875, 14.301025390625, 15.12158203125, 15.942138671875, 16.7626953125, 17.583251953125, 18.40380859375, 19.224365234375, 20.044921875, 20.865478515625, 21.68603515625, 22.506591796875, 23.3271484375, 24.147705078125, 24.96826171875, 25.788818359375, 26.609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 32.0, 37.0, 47.0, 49.0, 72.0, 102.0, 328.0, 542.0, 242.0, 136.0, 70.0, 52.0, 38.0, 32.0, 26.0, 22.0, 17.0, 13.0, 16.0, 8.0, 10.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3609619140625, -8.042236328125, -7.7235107421875, -7.40478515625, -7.0860595703125, -6.767333984375, -6.4486083984375, -6.1298828125, -5.8111572265625, -5.492431640625, -5.1737060546875, -4.85498046875, -4.5362548828125, -4.217529296875, -3.8988037109375, -3.580078125, -3.2613525390625, -2.942626953125, -2.6239013671875, -2.30517578125, -1.9864501953125, -1.667724609375, -1.3489990234375, -1.0302734375, -0.7115478515625, -0.392822265625, -0.0740966796875, 0.24462890625, 0.5633544921875, 0.882080078125, 1.2008056640625, 1.51953125, 1.8382568359375, 2.156982421875, 2.4757080078125, 2.79443359375, 3.1131591796875, 3.431884765625, 3.7506103515625, 4.0693359375, 4.3880615234375, 4.706787109375, 5.0255126953125, 5.34423828125, 5.6629638671875, 5.981689453125, 6.3004150390625, 6.619140625, 6.9378662109375, 7.256591796875, 7.5753173828125, 7.89404296875, 8.2127685546875, 8.531494140625, 8.8502197265625, 9.1689453125, 9.4876708984375, 9.806396484375, 10.1251220703125, 10.44384765625, 10.7625732421875, 11.081298828125, 11.4000244140625, 11.71875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 19.0, 94.0, 839.0, 33.0, 12.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-727.3897705078125, -708.3659057617188, -689.342041015625, -670.3181762695312, -651.2943115234375, -632.2704467773438, -613.24658203125, -594.2227172851562, -575.1988525390625, -556.1749877929688, -537.151123046875, -518.1272583007812, -499.1033935546875, -480.07952880859375, -461.0556640625, -442.03179931640625, -423.0079650878906, -403.9841003417969, -384.9602355957031, -365.9363708496094, -346.9125061035156, -327.8886413574219, -308.86480712890625, -289.8409423828125, -270.81707763671875, -251.793212890625, -232.76934814453125, -213.7454833984375, -194.72161865234375, -175.69775390625, -156.6739044189453, -137.65003967285156, -118.62615966796875, -99.602294921875, -80.57843017578125, -61.55457305908203, -42.53070831298828, -23.50684356689453, -4.4829864501953125, 14.540878295898438, 33.56474304199219, 52.58860778808594, 71.61247253417969, 90.6363296508789, 109.66019439697266, 128.68405151367188, 147.70791625976562, 166.73178100585938, 185.75564575195312, 204.77951049804688, 223.80337524414062, 242.82723999023438, 261.8511047363281, 280.8749694824219, 299.8988037109375, 318.92266845703125, 337.946533203125, 356.97039794921875, 375.9942626953125, 395.01812744140625, 414.0419921875, 433.06585693359375, 452.0897216796875, 471.11358642578125, 490.137451171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 17.0, 45.0, 533.0, 282.0, 38.0, 15.0, 19.0, 3.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-514.69970703125, -501.1358337402344, -487.57196044921875, -474.00811767578125, -460.4442443847656, -446.88037109375, -433.3164978027344, -419.75262451171875, -406.1887512207031, -392.6248779296875, -379.0610046386719, -365.49713134765625, -351.93328857421875, -338.3694152832031, -324.8055419921875, -311.2416687011719, -297.67779541015625, -284.1139221191406, -270.550048828125, -256.9862060546875, -243.4223175048828, -229.85845947265625, -216.29458618164062, -202.730712890625, -189.1668701171875, -175.60299682617188, -162.0391387939453, -148.4752655029297, -134.91139221191406, -121.34752655029297, -107.78366088867188, -94.21978759765625, -80.65591430664062, -67.09204864501953, -53.528175354003906, -39.96430969238281, -26.400440216064453, -12.836570739746094, 0.727294921875, 14.291168212890625, 27.85503387451172, 41.41890335083008, 54.98277282714844, 68.54663848876953, 82.11050415039062, 95.67437744140625, 109.23824310302734, 122.80211639404297, 136.36598205566406, 149.9298553466797, 163.49371337890625, 177.05758666992188, 190.6214599609375, 204.18533325195312, 217.7491912841797, 231.3130645751953, 244.87692260742188, 258.4407958984375, 272.0046691894531, 285.56854248046875, 299.13238525390625, 312.6962585449219, 326.2601318359375, 339.8240051269531, 353.38787841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 15.0, 18.0, 27.0, 30.0, 49.0, 80.0, 122.0, 171.0, 248.0, 430.0, 646.0, 976.0, 1678.0, 2917.0, 5915.0, 13237.0, 33525.0, 111659.0, 3505025.0, 419214.0, 56362.0, 22007.0, 9832.0, 4626.0, 2323.0, 1223.0, 714.0, 410.0, 249.0, 157.0, 91.0, 86.0, 53.0, 29.0, 28.0, 25.0, 22.0, 8.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3037109375, -1.2613372802734375, -1.218963623046875, -1.1765899658203125, -1.13421630859375, -1.0918426513671875, -1.049468994140625, -1.0070953369140625, -0.9647216796875, -0.9223480224609375, -0.879974365234375, -0.8376007080078125, -0.79522705078125, -0.7528533935546875, -0.710479736328125, -0.6681060791015625, -0.625732421875, -0.5833587646484375, -0.540985107421875, -0.4986114501953125, -0.45623779296875, -0.4138641357421875, -0.371490478515625, -0.3291168212890625, -0.2867431640625, -0.2443695068359375, -0.201995849609375, -0.1596221923828125, -0.11724853515625, -0.0748748779296875, -0.032501220703125, 0.0098724365234375, 0.05224609375, 0.0946197509765625, 0.136993408203125, 0.1793670654296875, 0.22174072265625, 0.2641143798828125, 0.306488037109375, 0.3488616943359375, 0.3912353515625, 0.4336090087890625, 0.475982666015625, 0.5183563232421875, 0.56072998046875, 0.6031036376953125, 0.645477294921875, 0.6878509521484375, 0.730224609375, 0.7725982666015625, 0.814971923828125, 0.8573455810546875, 0.89971923828125, 0.9420928955078125, 0.984466552734375, 1.0268402099609375, 1.0692138671875, 1.1115875244140625, 1.153961181640625, 1.1963348388671875, 1.23870849609375, 1.2810821533203125, 1.323455810546875, 1.3658294677734375, 1.408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 13.0, 13.0, 12.0, 26.0, 113.0, 277.0, 306.0, 133.0, 33.0, 16.0, 11.0, 11.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12723207473754883, -0.12433719635009766, -0.12144231796264648, -0.11854743957519531, -0.11565256118774414, -0.11275768280029297, -0.1098628044128418, -0.10696792602539062, -0.10407304763793945, -0.10117816925048828, -0.09828329086303711, -0.09538841247558594, -0.09249353408813477, -0.0895986557006836, -0.08670377731323242, -0.08380889892578125, -0.08091402053833008, -0.0780191421508789, -0.07512426376342773, -0.07222938537597656, -0.06933450698852539, -0.06643962860107422, -0.06354475021362305, -0.060649871826171875, -0.0577549934387207, -0.05486011505126953, -0.05196523666381836, -0.04907035827636719, -0.046175479888916016, -0.043280601501464844, -0.04038572311401367, -0.0374908447265625, -0.03459596633911133, -0.031701087951660156, -0.028806209564208984, -0.025911331176757812, -0.02301645278930664, -0.02012157440185547, -0.017226696014404297, -0.014331817626953125, -0.011436939239501953, -0.008542060852050781, -0.005647182464599609, -0.0027523040771484375, 0.00014257431030273438, 0.0030374526977539062, 0.005932331085205078, 0.00882720947265625, 0.011722087860107422, 0.014616966247558594, 0.017511844635009766, 0.020406723022460938, 0.02330160140991211, 0.02619647979736328, 0.029091358184814453, 0.031986236572265625, 0.0348811149597168, 0.03777599334716797, 0.04067087173461914, 0.04356575012207031, 0.046460628509521484, 0.049355506896972656, 0.05225038528442383, 0.055145263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 8.0, 8.0, 10.0, 21.0, 24.0, 34.0, 38.0, 57.0, 90.0, 110.0, 179.0, 334.0, 629.0, 1480.0, 3641.0, 10836.0, 44320.0, 290256.0, 2905048.0, 810971.0, 96440.0, 19518.0, 5926.0, 2181.0, 955.0, 463.0, 233.0, 134.0, 86.0, 59.0, 54.0, 27.0, 26.0, 9.0, 14.0, 8.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3857421875, -1.3433837890625, -1.301025390625, -1.2586669921875, -1.21630859375, -1.1739501953125, -1.131591796875, -1.0892333984375, -1.046875, -1.0045166015625, -0.962158203125, -0.9197998046875, -0.87744140625, -0.8350830078125, -0.792724609375, -0.7503662109375, -0.7080078125, -0.6656494140625, -0.623291015625, -0.5809326171875, -0.53857421875, -0.4962158203125, -0.453857421875, -0.4114990234375, -0.369140625, -0.3267822265625, -0.284423828125, -0.2420654296875, -0.19970703125, -0.1573486328125, -0.114990234375, -0.0726318359375, -0.0302734375, 0.0120849609375, 0.054443359375, 0.0968017578125, 0.13916015625, 0.1815185546875, 0.223876953125, 0.2662353515625, 0.30859375, 0.3509521484375, 0.393310546875, 0.4356689453125, 0.47802734375, 0.5203857421875, 0.562744140625, 0.6051025390625, 0.6474609375, 0.6898193359375, 0.732177734375, 0.7745361328125, 0.81689453125, 0.8592529296875, 0.901611328125, 0.9439697265625, 0.986328125, 1.0286865234375, 1.071044921875, 1.1134033203125, 1.15576171875, 1.1981201171875, 1.240478515625, 1.2828369140625, 1.3251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 10.0, 10.0, 12.0, 19.0, 21.0, 29.0, 37.0, 55.0, 66.0, 95.0, 107.0, 149.0, 193.0, 258.0, 266.0, 341.0, 451.0, 400.0, 297.0, 261.0, 196.0, 167.0, 131.0, 99.0, 100.0, 69.0, 51.0, 35.0, 33.0, 27.0, 23.0, 19.0, 11.0, 12.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17529296875, -0.16959571838378906, -0.16389846801757812, -0.1582012176513672, -0.15250396728515625, -0.1468067169189453, -0.14110946655273438, -0.13541221618652344, -0.1297149658203125, -0.12401771545410156, -0.11832046508789062, -0.11262321472167969, -0.10692596435546875, -0.10122871398925781, -0.09553146362304688, -0.08983421325683594, -0.084136962890625, -0.07843971252441406, -0.07274246215820312, -0.06704521179199219, -0.06134796142578125, -0.05565071105957031, -0.049953460693359375, -0.04425621032714844, -0.0385589599609375, -0.03286170959472656, -0.027164459228515625, -0.021467208862304688, -0.01576995849609375, -0.010072708129882812, -0.004375457763671875, 0.0013217926025390625, 0.00701904296875, 0.012716293334960938, 0.018413543701171875, 0.024110794067382812, 0.02980804443359375, 0.03550529479980469, 0.041202545166015625, 0.04689979553222656, 0.0525970458984375, 0.05829429626464844, 0.06399154663085938, 0.06968879699707031, 0.07538604736328125, 0.08108329772949219, 0.08678054809570312, 0.09247779846191406, 0.098175048828125, 0.10387229919433594, 0.10956954956054688, 0.11526679992675781, 0.12096405029296875, 0.1266613006591797, 0.13235855102539062, 0.13805580139160156, 0.1437530517578125, 0.14945030212402344, 0.15514755249023438, 0.1608448028564453, 0.16654205322265625, 0.1722393035888672, 0.17793655395507812, 0.18363380432128906, 0.1893310546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 15.0, 59.0, 160.0, 326.0, 254.0, 104.0, 50.0, 24.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.431906223297119, -4.1932783126831055, -3.954650640487671, -3.7160229682922363, -3.4773950576782227, -3.238767385482788, -3.0001397132873535, -2.76151180267334, -2.5228841304779053, -2.2842564582824707, -2.045628547668457, -1.8070008754730225, -1.5683730840682983, -1.3297452926635742, -1.0911176204681396, -0.8524898290634155, -0.6138620376586914, -0.3752342760562897, -0.13660651445388794, 0.1020212173461914, 0.3406490087509155, 0.5792768001556396, 0.8179044723510742, 1.0565322637557983, 1.2951600551605225, 1.5337878465652466, 1.7724156379699707, 2.0110433101654053, 2.24967098236084, 2.4882988929748535, 2.726926565170288, 2.9655542373657227, 3.204181671142578, 3.4428093433380127, 3.6814372539520264, 3.920064926147461, 4.158692836761475, 4.397320747375488, 4.635948181152344, 4.874576091766357, 5.113204002380371, 5.351831912994385, 5.59045934677124, 5.829087257385254, 6.067715167999268, 6.306343078613281, 6.544970512390137, 6.78359842300415, 7.022225856781006, 7.2608537673950195, 7.499481201171875, 7.738109111785889, 7.976737022399902, 8.215364456176758, 8.45399284362793, 8.692620277404785, 8.93124771118164, 9.169875144958496, 9.408503532409668, 9.647130966186523, 9.885758399963379, 10.12438678741455, 10.363014221191406, 10.601641654968262, 10.840270042419434]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 16.0, 9.0, 11.0, 12.0, 24.0, 31.0, 43.0, 57.0, 46.0, 54.0, 67.0, 67.0, 55.0, 60.0, 48.0, 55.0, 47.0, 42.0, 57.0, 37.0, 26.0, 26.0, 17.0, 19.0, 14.0, 11.0, 11.0, 7.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5127581357955933, -1.460258960723877, -1.4077597856521606, -1.3552606105804443, -1.302761435508728, -1.2502622604370117, -1.197763204574585, -1.145263910293579, -1.0927648544311523, -1.040265679359436, -0.9877665042877197, -0.9352673292160034, -0.8827681541442871, -0.8302689790725708, -0.7777698636054993, -0.725270688533783, -0.6727714538574219, -0.6202722787857056, -0.5677731037139893, -0.515273928642273, -0.46277478337287903, -0.4102756083011627, -0.3577764630317688, -0.3052772879600525, -0.2527781128883362, -0.20027893781661987, -0.14777977764606476, -0.09528061747550964, -0.042781442403793335, 0.009717732667922974, 0.062216877937316895, 0.1147160530090332, 0.16721510887145996, 0.21971428394317627, 0.2722134590148926, 0.3247126042842865, 0.3772117793560028, 0.4297109544277191, 0.48221009969711304, 0.5347092747688293, 0.5872084498405457, 0.639707624912262, 0.6922067999839783, 0.7447059154510498, 0.7972050905227661, 0.8497042655944824, 0.9022034406661987, 0.954702615737915, 1.0072017908096313, 1.0597009658813477, 1.112200140953064, 1.1646993160247803, 1.2171984910964966, 1.269697666168213, 1.3221967220306396, 1.3746960163116455, 1.4271950721740723, 1.4796942472457886, 1.5321934223175049, 1.5846925973892212, 1.6371917724609375, 1.6896909475326538, 1.7421901226043701, 1.7946891784667969, 1.8471884727478027]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 6.0, 15.0, 13.0, 22.0, 24.0, 54.0, 70.0, 79.0, 121.0, 193.0, 275.0, 441.0, 710.0, 1224.0, 2177.0, 4329.0, 9928.0, 29971.0, 170070.0, 680147.0, 108899.0, 23101.0, 8164.0, 3674.0, 1913.0, 1071.0, 648.0, 357.0, 241.0, 197.0, 112.0, 82.0, 55.0, 31.0, 28.0, 28.0, 23.0, 13.0, 11.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.802734375, -0.7806777954101562, -0.7586212158203125, -0.7365646362304688, -0.714508056640625, -0.6924514770507812, -0.6703948974609375, -0.6483383178710938, -0.62628173828125, -0.6042251586914062, -0.5821685791015625, -0.5601119995117188, -0.538055419921875, -0.5159988403320312, -0.4939422607421875, -0.47188568115234375, -0.4498291015625, -0.42777252197265625, -0.4057159423828125, -0.38365936279296875, -0.361602783203125, -0.33954620361328125, -0.3174896240234375, -0.29543304443359375, -0.27337646484375, -0.25131988525390625, -0.2292633056640625, -0.20720672607421875, -0.185150146484375, -0.16309356689453125, -0.1410369873046875, -0.11898040771484375, -0.096923828125, -0.07486724853515625, -0.0528106689453125, -0.03075408935546875, -0.008697509765625, 0.01335906982421875, 0.0354156494140625, 0.05747222900390625, 0.07952880859375, 0.10158538818359375, 0.1236419677734375, 0.14569854736328125, 0.167755126953125, 0.18981170654296875, 0.2118682861328125, 0.23392486572265625, 0.2559814453125, 0.27803802490234375, 0.3000946044921875, 0.32215118408203125, 0.344207763671875, 0.36626434326171875, 0.3883209228515625, 0.41037750244140625, 0.43243408203125, 0.45449066162109375, 0.4765472412109375, 0.49860382080078125, 0.520660400390625, 0.5427169799804688, 0.5647735595703125, 0.5868301391601562, 0.60888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 20.0, 20.0, 21.0, 44.0, 50.0, 66.0, 79.0, 86.0, 95.0, 107.0, 88.0, 78.0, 68.0, 44.0, 26.0, 19.0, 21.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06875371932983398, -0.06682872772216797, -0.06490373611450195, -0.06297874450683594, -0.06105375289916992, -0.059128761291503906, -0.05720376968383789, -0.055278778076171875, -0.05335378646850586, -0.051428794860839844, -0.04950380325317383, -0.04757881164550781, -0.0456538200378418, -0.04372882843017578, -0.041803836822509766, -0.03987884521484375, -0.037953853607177734, -0.03602886199951172, -0.0341038703918457, -0.03217887878417969, -0.030253887176513672, -0.028328895568847656, -0.02640390396118164, -0.024478912353515625, -0.02255392074584961, -0.020628929138183594, -0.018703937530517578, -0.016778945922851562, -0.014853954315185547, -0.012928962707519531, -0.011003971099853516, -0.0090789794921875, -0.007153987884521484, -0.005228996276855469, -0.003304004669189453, -0.0013790130615234375, 0.0005459785461425781, 0.0024709701538085938, 0.004395961761474609, 0.006320953369140625, 0.00824594497680664, 0.010170936584472656, 0.012095928192138672, 0.014020919799804688, 0.015945911407470703, 0.01787090301513672, 0.019795894622802734, 0.02172088623046875, 0.023645877838134766, 0.02557086944580078, 0.027495861053466797, 0.029420852661132812, 0.03134584426879883, 0.033270835876464844, 0.03519582748413086, 0.037120819091796875, 0.03904581069946289, 0.040970802307128906, 0.04289579391479492, 0.04482078552246094, 0.04674577713012695, 0.04867076873779297, 0.050595760345458984, 0.052520751953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 0.0, 8.0, 10.0, 6.0, 10.0, 15.0, 21.0, 34.0, 48.0, 47.0, 85.0, 117.0, 185.0, 338.0, 537.0, 971.0, 2105.0, 5476.0, 20586.0, 167761.0, 739844.0, 88627.0, 13708.0, 4220.0, 1683.0, 875.0, 455.0, 264.0, 175.0, 81.0, 83.0, 51.0, 33.0, 28.0, 20.0, 12.0, 12.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0087890625, -0.9744415283203125, -0.940093994140625, -0.9057464599609375, -0.87139892578125, -0.8370513916015625, -0.802703857421875, -0.7683563232421875, -0.7340087890625, -0.6996612548828125, -0.665313720703125, -0.6309661865234375, -0.59661865234375, -0.5622711181640625, -0.527923583984375, -0.4935760498046875, -0.459228515625, -0.4248809814453125, -0.390533447265625, -0.3561859130859375, -0.32183837890625, -0.2874908447265625, -0.253143310546875, -0.2187957763671875, -0.1844482421875, -0.1501007080078125, -0.115753173828125, -0.0814056396484375, -0.04705810546875, -0.0127105712890625, 0.021636962890625, 0.0559844970703125, 0.09033203125, 0.1246795654296875, 0.159027099609375, 0.1933746337890625, 0.22772216796875, 0.2620697021484375, 0.296417236328125, 0.3307647705078125, 0.3651123046875, 0.3994598388671875, 0.433807373046875, 0.4681549072265625, 0.50250244140625, 0.5368499755859375, 0.571197509765625, 0.6055450439453125, 0.639892578125, 0.6742401123046875, 0.708587646484375, 0.7429351806640625, 0.77728271484375, 0.8116302490234375, 0.845977783203125, 0.8803253173828125, 0.9146728515625, 0.9490203857421875, 0.983367919921875, 1.0177154541015625, 1.05206298828125, 1.0864105224609375, 1.120758056640625, 1.1551055908203125, 1.189453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 9.0, 5.0, 15.0, 8.0, 11.0, 13.0, 21.0, 21.0, 23.0, 35.0, 25.0, 30.0, 19.0, 34.0, 42.0, 28.0, 43.0, 49.0, 42.0, 40.0, 41.0, 41.0, 33.0, 37.0, 26.0, 35.0, 32.0, 25.0, 31.0, 14.0, 22.0, 18.0, 13.0, 18.0, 15.0, 9.0, 10.0, 6.0, 11.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.2391357421875, -0.23168373107910156, -0.22423171997070312, -0.2167797088623047, -0.20932769775390625, -0.2018756866455078, -0.19442367553710938, -0.18697166442871094, -0.1795196533203125, -0.17206764221191406, -0.16461563110351562, -0.1571636199951172, -0.14971160888671875, -0.1422595977783203, -0.13480758666992188, -0.12735557556152344, -0.119903564453125, -0.11245155334472656, -0.10499954223632812, -0.09754753112792969, -0.09009552001953125, -0.08264350891113281, -0.07519149780273438, -0.06773948669433594, -0.0602874755859375, -0.05283546447753906, -0.045383453369140625, -0.03793144226074219, -0.03047943115234375, -0.023027420043945312, -0.015575408935546875, -0.008123397827148438, -0.00067138671875, 0.0067806243896484375, 0.014232635498046875, 0.021684646606445312, 0.02913665771484375, 0.03658866882324219, 0.044040679931640625, 0.05149269104003906, 0.0589447021484375, 0.06639671325683594, 0.07384872436523438, 0.08130073547363281, 0.08875274658203125, 0.09620475769042969, 0.10365676879882812, 0.11110877990722656, 0.118560791015625, 0.12601280212402344, 0.13346481323242188, 0.1409168243408203, 0.14836883544921875, 0.1558208465576172, 0.16327285766601562, 0.17072486877441406, 0.1781768798828125, 0.18562889099121094, 0.19308090209960938, 0.2005329132080078, 0.20798492431640625, 0.2154369354248047, 0.22288894653320312, 0.23034095764160156, 0.23779296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 23.0, 14.0, 27.0, 56.0, 81.0, 180.0, 394.0, 952.0, 3808.0, 63288.0, 968521.0, 8546.0, 1610.0, 527.0, 234.0, 115.0, 61.0, 29.0, 28.0, 15.0, 10.0, 8.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2777099609375, -6.082763671875, -5.8878173828125, -5.69287109375, -5.4979248046875, -5.302978515625, -5.1080322265625, -4.9130859375, -4.7181396484375, -4.523193359375, -4.3282470703125, -4.13330078125, -3.9383544921875, -3.743408203125, -3.5484619140625, -3.353515625, -3.1585693359375, -2.963623046875, -2.7686767578125, -2.57373046875, -2.3787841796875, -2.183837890625, -1.9888916015625, -1.7939453125, -1.5989990234375, -1.404052734375, -1.2091064453125, -1.01416015625, -0.8192138671875, -0.624267578125, -0.4293212890625, -0.234375, -0.0394287109375, 0.155517578125, 0.3504638671875, 0.54541015625, 0.7403564453125, 0.935302734375, 1.1302490234375, 1.3251953125, 1.5201416015625, 1.715087890625, 1.9100341796875, 2.10498046875, 2.2999267578125, 2.494873046875, 2.6898193359375, 2.884765625, 3.0797119140625, 3.274658203125, 3.4696044921875, 3.66455078125, 3.8594970703125, 4.054443359375, 4.2493896484375, 4.4443359375, 4.6392822265625, 4.834228515625, 5.0291748046875, 5.22412109375, 5.4190673828125, 5.614013671875, 5.8089599609375, 6.00390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 2.0, 12.0, 6.0, 4.0, 16.0, 12.0, 15.0, 17.0, 24.0, 42.0, 48.0, 73.0, 139.0, 190.0, 115.0, 58.0, 41.0, 30.0, 30.0, 27.0, 16.0, 15.0, 11.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.000701904296875, -0.0006814450025558472, -0.0006609857082366943, -0.0006405264139175415, -0.0006200671195983887, -0.0005996078252792358, -0.000579148530960083, -0.0005586892366409302, -0.0005382299423217773, -0.0005177706480026245, -0.0004973113536834717, -0.00047685205936431885, -0.000456392765045166, -0.0004359334707260132, -0.00041547417640686035, -0.0003950148820877075, -0.0003745555877685547, -0.00035409629344940186, -0.000333636999130249, -0.0003131777048110962, -0.00029271841049194336, -0.00027225911617279053, -0.0002517998218536377, -0.00023134052753448486, -0.00021088123321533203, -0.0001904219388961792, -0.00016996264457702637, -0.00014950335025787354, -0.0001290440559387207, -0.00010858476161956787, -8.812546730041504e-05, -6.766617298126221e-05, -4.7206878662109375e-05, -2.6747584342956543e-05, -6.288290023803711e-06, 1.4171004295349121e-05, 3.463029861450195e-05, 5.5089592933654785e-05, 7.554888725280762e-05, 9.600818157196045e-05, 0.00011646747589111328, 0.0001369267702102661, 0.00015738606452941895, 0.00017784535884857178, 0.0001983046531677246, 0.00021876394748687744, 0.00023922324180603027, 0.0002596825361251831, 0.00028014183044433594, 0.00030060112476348877, 0.0003210604190826416, 0.00034151971340179443, 0.00036197900772094727, 0.0003824383020401001, 0.00040289759635925293, 0.00042335689067840576, 0.0004438161849975586, 0.0004642754793167114, 0.00048473477363586426, 0.0005051940679550171, 0.0005256533622741699, 0.0005461126565933228, 0.0005665719509124756, 0.0005870312452316284, 0.0006074905395507812]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 11.0, 15.0, 13.0, 17.0, 32.0, 31.0, 49.0, 53.0, 78.0, 125.0, 182.0, 282.0, 445.0, 804.0, 1377.0, 3028.0, 8091.0, 34165.0, 791428.0, 178050.0, 19378.0, 5666.0, 2339.0, 1143.0, 582.0, 356.0, 233.0, 165.0, 113.0, 80.0, 62.0, 32.0, 25.0, 22.0, 12.0, 14.0, 10.0, 16.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.048828125, -2.953033447265625, -2.85723876953125, -2.761444091796875, -2.6656494140625, -2.569854736328125, -2.47406005859375, -2.378265380859375, -2.282470703125, -2.186676025390625, -2.09088134765625, -1.995086669921875, -1.8992919921875, -1.803497314453125, -1.70770263671875, -1.611907958984375, -1.51611328125, -1.420318603515625, -1.32452392578125, -1.228729248046875, -1.1329345703125, -1.037139892578125, -0.94134521484375, -0.845550537109375, -0.749755859375, -0.653961181640625, -0.55816650390625, -0.462371826171875, -0.3665771484375, -0.270782470703125, -0.17498779296875, -0.079193115234375, 0.0166015625, 0.112396240234375, 0.20819091796875, 0.303985595703125, 0.3997802734375, 0.495574951171875, 0.59136962890625, 0.687164306640625, 0.782958984375, 0.878753662109375, 0.97454833984375, 1.070343017578125, 1.1661376953125, 1.261932373046875, 1.35772705078125, 1.453521728515625, 1.54931640625, 1.645111083984375, 1.74090576171875, 1.836700439453125, 1.9324951171875, 2.028289794921875, 2.12408447265625, 2.219879150390625, 2.315673828125, 2.411468505859375, 2.50726318359375, 2.603057861328125, 2.6988525390625, 2.794647216796875, 2.89044189453125, 2.986236572265625, 3.08203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 2.0, 14.0, 7.0, 15.0, 13.0, 25.0, 24.0, 42.0, 54.0, 85.0, 189.0, 177.0, 97.0, 67.0, 35.0, 24.0, 29.0, 18.0, 10.0, 12.0, 11.0, 3.0, 9.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0160903930664062, -0.9862823486328125, -0.9564743041992188, -0.926666259765625, -0.8968582153320312, -0.8670501708984375, -0.8372421264648438, -0.80743408203125, -0.7776260375976562, -0.7478179931640625, -0.7180099487304688, -0.688201904296875, -0.6583938598632812, -0.6285858154296875, -0.5987777709960938, -0.5689697265625, -0.5391616821289062, -0.5093536376953125, -0.47954559326171875, -0.449737548828125, -0.41992950439453125, -0.3901214599609375, -0.36031341552734375, -0.33050537109375, -0.30069732666015625, -0.2708892822265625, -0.24108123779296875, -0.211273193359375, -0.18146514892578125, -0.1516571044921875, -0.12184906005859375, -0.092041015625, -0.06223297119140625, -0.0324249267578125, -0.00261688232421875, 0.027191162109375, 0.05699920654296875, 0.0868072509765625, 0.11661529541015625, 0.14642333984375, 0.17623138427734375, 0.2060394287109375, 0.23584747314453125, 0.265655517578125, 0.29546356201171875, 0.3252716064453125, 0.35507965087890625, 0.3848876953125, 0.41469573974609375, 0.4445037841796875, 0.47431182861328125, 0.504119873046875, 0.5339279174804688, 0.5637359619140625, 0.5935440063476562, 0.62335205078125, 0.6531600952148438, 0.6829681396484375, 0.7127761840820312, 0.742584228515625, 0.7723922729492188, 0.8022003173828125, 0.8320083618164062, 0.86181640625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 14.0, 21.0, 49.0, 116.0, 256.0, 320.0, 127.0, 61.0, 25.0, 10.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.086206436157227, -9.68289852142334, -9.27959156036377, -8.876283645629883, -8.472975730895996, -8.069668769836426, -7.666360855102539, -7.2630534172058105, -6.859745979309082, -6.4564385414123535, -6.053130626678467, -5.649823188781738, -5.24651575088501, -4.843208312988281, -4.4399003982543945, -4.036592960357666, -3.6332850456237793, -3.2299773693084717, -2.826669931411743, -2.4233622550964355, -2.020054817199707, -1.6167471408843994, -1.2134394645690918, -0.8101320266723633, -0.40682435035705566, -0.00351676344871521, 0.39979082345962524, 0.8030984401702881, 1.2064059972763062, 1.6097135543823242, 2.013021230697632, 2.4163286685943604, 2.819636344909668, 3.2229440212249756, 3.626251459121704, 4.029559135437012, 4.43286657333374, 4.836174011230469, 5.2394819259643555, 5.642789363861084, 6.0460968017578125, 6.449404239654541, 6.852712154388428, 7.256019592285156, 7.659327030181885, 8.062634468078613, 8.4659423828125, 8.86924934387207, 9.272558212280273, 9.67586612701416, 10.07917308807373, 10.482481002807617, 10.885788917541504, 11.289095878601074, 11.692403793334961, 12.095710754394531, 12.499018669128418, 12.902326583862305, 13.305633544921875, 13.708941459655762, 14.112249374389648, 14.515556335449219, 14.918864250183105, 15.322172164916992, 15.725479125976562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 9.0, 28.0, 36.0, 49.0, 89.0, 93.0, 118.0, 123.0, 97.0, 106.0, 71.0, 43.0, 22.0, 29.0, 15.0, 10.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.885300636291504, -4.714145660400391, -4.5429911613464355, -4.371836185455322, -4.200681209564209, -4.029526233673096, -3.8583717346191406, -3.6872167587280273, -3.516061782836914, -3.34490704536438, -3.1737520694732666, -3.0025973320007324, -2.831442356109619, -2.660287618637085, -2.489132881164551, -2.3179779052734375, -2.1468231678009033, -1.9756683111190796, -1.8045134544372559, -1.6333587169647217, -1.4622037410736084, -1.2910490036010742, -1.1198941469192505, -0.9487392902374268, -0.777584433555603, -0.6064295768737793, -0.43527474999427795, -0.2641199231147766, -0.09296506643295288, 0.07818979024887085, 0.2493445873260498, 0.42049944400787354, 0.5916543006896973, 0.762809157371521, 0.9339640140533447, 1.105118751525879, 1.2762737274169922, 1.4474284648895264, 1.61858332157135, 1.7897381782531738, 1.9608930349349976, 2.1320478916168213, 2.3032026290893555, 2.4743576049804688, 2.645512342453003, 2.816667318344116, 2.9878220558166504, 3.1589770317077637, 3.330131769180298, 3.501286506652832, 3.6724414825439453, 3.8435962200164795, 4.014750957489014, 4.185905933380127, 4.35706090927124, 4.528215408325195, 4.699370384216309, 4.870525360107422, 5.041679859161377, 5.21283483505249, 5.3839898109436035, 5.555144786834717, 5.726299285888672, 5.897454261779785, 6.068609237670898]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 18.0, 27.0, 36.0, 122.0, 493.0, 8569.0, 4177163.0, 7429.0, 281.0, 57.0, 26.0, 13.0, 14.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.734375, -23.234619140625, -22.73486328125, -22.235107421875, -21.7353515625, -21.235595703125, -20.73583984375, -20.236083984375, -19.736328125, -19.236572265625, -18.73681640625, -18.237060546875, -17.7373046875, -17.237548828125, -16.73779296875, -16.238037109375, -15.73828125, -15.238525390625, -14.73876953125, -14.239013671875, -13.7392578125, -13.239501953125, -12.73974609375, -12.239990234375, -11.740234375, -11.240478515625, -10.74072265625, -10.240966796875, -9.7412109375, -9.241455078125, -8.74169921875, -8.241943359375, -7.7421875, -7.242431640625, -6.74267578125, -6.242919921875, -5.7431640625, -5.243408203125, -4.74365234375, -4.243896484375, -3.744140625, -3.244384765625, -2.74462890625, -2.244873046875, -1.7451171875, -1.245361328125, -0.74560546875, -0.245849609375, 0.25390625, 0.753662109375, 1.25341796875, 1.753173828125, 2.2529296875, 2.752685546875, 3.25244140625, 3.752197265625, 4.251953125, 4.751708984375, 5.25146484375, 5.751220703125, 6.2509765625, 6.750732421875, 7.25048828125, 7.750244140625, 8.25]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 8.0, 6.0, 20.0, 26.0, 31.0, 39.0, 59.0, 59.0, 75.0, 84.0, 94.0, 90.0, 92.0, 69.0, 59.0, 51.0, 32.0, 27.0, 15.0, 17.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06982421875, -0.06776952743530273, -0.06571483612060547, -0.0636601448059082, -0.06160545349121094, -0.05955076217651367, -0.057496070861816406, -0.05544137954711914, -0.053386688232421875, -0.05133199691772461, -0.049277305603027344, -0.04722261428833008, -0.04516792297363281, -0.04311323165893555, -0.04105854034423828, -0.039003849029541016, -0.03694915771484375, -0.034894466400146484, -0.03283977508544922, -0.030785083770751953, -0.028730392456054688, -0.026675701141357422, -0.024621009826660156, -0.02256631851196289, -0.020511627197265625, -0.01845693588256836, -0.016402244567871094, -0.014347553253173828, -0.012292861938476562, -0.010238170623779297, -0.008183479309082031, -0.006128787994384766, -0.0040740966796875, -0.0020194053649902344, 3.528594970703125e-05, 0.002089977264404297, 0.0041446685791015625, 0.006199359893798828, 0.008254051208496094, 0.01030874252319336, 0.012363433837890625, 0.01441812515258789, 0.016472816467285156, 0.018527507781982422, 0.020582199096679688, 0.022636890411376953, 0.02469158172607422, 0.026746273040771484, 0.02880096435546875, 0.030855655670166016, 0.03291034698486328, 0.03496503829956055, 0.03701972961425781, 0.03907442092895508, 0.041129112243652344, 0.04318380355834961, 0.045238494873046875, 0.04729318618774414, 0.049347877502441406, 0.05140256881713867, 0.05345726013183594, 0.0555119514465332, 0.05756664276123047, 0.059621334075927734, 0.061676025390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 16.0, 24.0, 37.0, 92.0, 139.0, 327.0, 739.0, 2096.0, 7842.0, 40602.0, 474716.0, 3550703.0, 96640.0, 14585.0, 3471.0, 1137.0, 488.0, 230.0, 137.0, 97.0, 42.0, 32.0, 16.0, 15.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.142578125, -3.05072021484375, -2.9588623046875, -2.86700439453125, -2.775146484375, -2.68328857421875, -2.5914306640625, -2.49957275390625, -2.40771484375, -2.31585693359375, -2.2239990234375, -2.13214111328125, -2.040283203125, -1.94842529296875, -1.8565673828125, -1.76470947265625, -1.6728515625, -1.58099365234375, -1.4891357421875, -1.39727783203125, -1.305419921875, -1.21356201171875, -1.1217041015625, -1.02984619140625, -0.93798828125, -0.84613037109375, -0.7542724609375, -0.66241455078125, -0.570556640625, -0.47869873046875, -0.3868408203125, -0.29498291015625, -0.203125, -0.11126708984375, -0.0194091796875, 0.07244873046875, 0.164306640625, 0.25616455078125, 0.3480224609375, 0.43988037109375, 0.53173828125, 0.62359619140625, 0.7154541015625, 0.80731201171875, 0.899169921875, 0.99102783203125, 1.0828857421875, 1.17474365234375, 1.2666015625, 1.35845947265625, 1.4503173828125, 1.54217529296875, 1.634033203125, 1.72589111328125, 1.8177490234375, 1.90960693359375, 2.00146484375, 2.09332275390625, 2.1851806640625, 2.27703857421875, 2.368896484375, 2.46075439453125, 2.5526123046875, 2.64447021484375, 2.736328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 6.0, 1.0, 8.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 22.0, 35.0, 37.0, 57.0, 80.0, 121.0, 161.0, 428.0, 1493.0, 716.0, 272.0, 171.0, 110.0, 72.0, 66.0, 28.0, 39.0, 17.0, 13.0, 17.0, 14.0, 6.0, 8.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2154541015625, -0.20940017700195312, -0.20334625244140625, -0.19729232788085938, -0.1912384033203125, -0.18518447875976562, -0.17913055419921875, -0.17307662963867188, -0.167022705078125, -0.16096878051757812, -0.15491485595703125, -0.14886093139648438, -0.1428070068359375, -0.13675308227539062, -0.13069915771484375, -0.12464523315429688, -0.11859130859375, -0.11253738403320312, -0.10648345947265625, -0.10042953491210938, -0.0943756103515625, -0.08832168579101562, -0.08226776123046875, -0.07621383666992188, -0.070159912109375, -0.06410598754882812, -0.05805206298828125, -0.051998138427734375, -0.0459442138671875, -0.039890289306640625, -0.03383636474609375, -0.027782440185546875, -0.021728515625, -0.015674591064453125, -0.00962066650390625, -0.003566741943359375, 0.0024871826171875, 0.008541107177734375, 0.01459503173828125, 0.020648956298828125, 0.026702880859375, 0.032756805419921875, 0.03881072998046875, 0.044864654541015625, 0.0509185791015625, 0.056972503662109375, 0.06302642822265625, 0.06908035278320312, 0.07513427734375, 0.08118820190429688, 0.08724212646484375, 0.09329605102539062, 0.0993499755859375, 0.10540390014648438, 0.11145782470703125, 0.11751174926757812, 0.123565673828125, 0.12961959838867188, 0.13567352294921875, 0.14172744750976562, 0.1477813720703125, 0.15383529663085938, 0.15988922119140625, 0.16594314575195312, 0.1719970703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 11.0, 42.0, 276.0, 547.0, 111.0, 15.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.924245834350586, -6.611834526062012, -6.2994232177734375, -5.9870123863220215, -5.674601078033447, -5.362189769744873, -5.049778938293457, -4.737367630004883, -4.424956321716309, -4.112545013427734, -3.8001339435577393, -3.487722873687744, -3.17531156539917, -2.8629002571105957, -2.5504891872406006, -2.2380781173706055, -1.9256668090820312, -1.6132556200027466, -1.300844430923462, -0.9884332418441772, -0.6760220527648926, -0.3636108636856079, -0.05119967460632324, 0.2612113952636719, 0.5736227035522461, 0.8860338926315308, 1.1984450817108154, 1.5108562707901, 1.8232674598693848, 2.135678768157959, 2.448089838027954, 2.760500907897949, 3.0729122161865234, 3.3853235244750977, 3.6977345943450928, 4.010145664215088, 4.322556972503662, 4.634968280792236, 4.947379112243652, 5.259790420532227, 5.572201728820801, 5.884613037109375, 6.197024345397949, 6.509435176849365, 6.8218464851379395, 7.134257793426514, 7.44666862487793, 7.759079933166504, 8.071491241455078, 8.383902549743652, 8.696313858032227, 9.0087251663208, 9.321136474609375, 9.633546829223633, 9.945958137512207, 10.258369445800781, 10.570780754089355, 10.88319206237793, 11.195603370666504, 11.508014678955078, 11.820425033569336, 12.13283634185791, 12.445247650146484, 12.757658958435059, 13.070070266723633]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 29.0, 45.0, 69.0, 87.0, 97.0, 95.0, 116.0, 104.0, 90.0, 66.0, 62.0, 30.0, 29.0, 11.0, 15.0, 3.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.533045768737793, -1.4771573543548584, -1.4212690591812134, -1.3653806447982788, -1.3094923496246338, -1.2536039352416992, -1.1977155208587646, -1.14182710647583, -1.085938811302185, -1.0300503969192505, -0.9741621017456055, -0.9182736873626709, -0.8623853325843811, -0.8064969778060913, -0.7506085634231567, -0.6947202086448669, -0.6388318538665771, -0.5829434990882874, -0.5270551443099976, -0.471166729927063, -0.4152783751487732, -0.3593900203704834, -0.3035016357898712, -0.24761325120925903, -0.19172489643096924, -0.13583652675151825, -0.07994815707206726, -0.024059787392616272, 0.03182858228683472, 0.08771693706512451, 0.1436053216457367, 0.19949370622634888, 0.25538206100463867, 0.31127041578292847, 0.36715880036354065, 0.42304718494415283, 0.4789355397224426, 0.5348238945007324, 0.590712308883667, 0.6466006636619568, 0.7024890184402466, 0.7583773732185364, 0.8142657279968262, 0.8701541423797607, 0.9260424971580505, 0.9819308519363403, 1.037819266319275, 1.09370756149292, 1.1495959758758545, 1.205484390258789, 1.261372685432434, 1.3172610998153687, 1.3731493949890137, 1.4290378093719482, 1.4849262237548828, 1.5408146381378174, 1.5967029333114624, 1.652591347694397, 1.708479642868042, 1.7643680572509766, 1.8202564716339111, 1.8761447668075562, 1.9320331811904907, 1.9879214763641357, 2.0438098907470703]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 4.0, 5.0, 5.0, 11.0, 10.0, 25.0, 25.0, 52.0, 69.0, 150.0, 299.0, 907.0, 3223.0, 17463.0, 344660.0, 650381.0, 25542.0, 3887.0, 1085.0, 367.0, 158.0, 82.0, 36.0, 33.0, 16.0, 11.0, 14.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.35546875, -3.25701904296875, -3.1585693359375, -3.06011962890625, -2.961669921875, -2.86322021484375, -2.7647705078125, -2.66632080078125, -2.56787109375, -2.46942138671875, -2.3709716796875, -2.27252197265625, -2.174072265625, -2.07562255859375, -1.9771728515625, -1.87872314453125, -1.7802734375, -1.68182373046875, -1.5833740234375, -1.48492431640625, -1.386474609375, -1.28802490234375, -1.1895751953125, -1.09112548828125, -0.99267578125, -0.89422607421875, -0.7957763671875, -0.69732666015625, -0.598876953125, -0.50042724609375, -0.4019775390625, -0.30352783203125, -0.205078125, -0.10662841796875, -0.0081787109375, 0.09027099609375, 0.188720703125, 0.28717041015625, 0.3856201171875, 0.48406982421875, 0.58251953125, 0.68096923828125, 0.7794189453125, 0.87786865234375, 0.976318359375, 1.07476806640625, 1.1732177734375, 1.27166748046875, 1.3701171875, 1.46856689453125, 1.5670166015625, 1.66546630859375, 1.763916015625, 1.86236572265625, 1.9608154296875, 2.05926513671875, 2.15771484375, 2.25616455078125, 2.3546142578125, 2.45306396484375, 2.551513671875, 2.64996337890625, 2.7484130859375, 2.84686279296875, 2.9453125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 6.0, 14.0, 35.0, 67.0, 103.0, 153.0, 171.0, 157.0, 135.0, 68.0, 36.0, 27.0, 12.0, 5.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06515979766845703, -0.06043434143066406, -0.055708885192871094, -0.050983428955078125, -0.046257972717285156, -0.04153251647949219, -0.03680706024169922, -0.03208160400390625, -0.02735614776611328, -0.022630691528320312, -0.017905235290527344, -0.013179779052734375, -0.008454322814941406, -0.0037288665771484375, 0.0009965896606445312, 0.0057220458984375, 0.010447502136230469, 0.015172958374023438, 0.019898414611816406, 0.024623870849609375, 0.029349327087402344, 0.03407478332519531, 0.03880023956298828, 0.04352569580078125, 0.04825115203857422, 0.05297660827636719, 0.057702064514160156, 0.062427520751953125, 0.0671529769897461, 0.07187843322753906, 0.07660388946533203, 0.081329345703125, 0.08605480194091797, 0.09078025817871094, 0.0955057144165039, 0.10023117065429688, 0.10495662689208984, 0.10968208312988281, 0.11440753936767578, 0.11913299560546875, 0.12385845184326172, 0.1285839080810547, 0.13330936431884766, 0.13803482055664062, 0.1427602767944336, 0.14748573303222656, 0.15221118927001953, 0.1569366455078125, 0.16166210174560547, 0.16638755798339844, 0.1711130142211914, 0.17583847045898438, 0.18056392669677734, 0.1852893829345703, 0.19001483917236328, 0.19474029541015625, 0.19946575164794922, 0.2041912078857422, 0.20891666412353516, 0.21364212036132812, 0.2183675765991211, 0.22309303283691406, 0.22781848907470703, 0.2325439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 2.0, 4.0, 7.0, 2.0, 4.0, 8.0, 12.0, 8.0, 11.0, 17.0, 24.0, 18.0, 25.0, 39.0, 109.0, 505.0, 5170.0, 628767.0, 408917.0, 4182.0, 456.0, 66.0, 38.0, 29.0, 20.0, 15.0, 9.0, 13.0, 12.0, 11.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-4.66015625, -4.53057861328125, -4.4010009765625, -4.27142333984375, -4.141845703125, -4.01226806640625, -3.8826904296875, -3.75311279296875, -3.62353515625, -3.49395751953125, -3.3643798828125, -3.23480224609375, -3.105224609375, -2.97564697265625, -2.8460693359375, -2.71649169921875, -2.5869140625, -2.45733642578125, -2.3277587890625, -2.19818115234375, -2.068603515625, -1.93902587890625, -1.8094482421875, -1.67987060546875, -1.55029296875, -1.42071533203125, -1.2911376953125, -1.16156005859375, -1.031982421875, -0.90240478515625, -0.7728271484375, -0.64324951171875, -0.513671875, -0.38409423828125, -0.2545166015625, -0.12493896484375, 0.004638671875, 0.13421630859375, 0.2637939453125, 0.39337158203125, 0.52294921875, 0.65252685546875, 0.7821044921875, 0.91168212890625, 1.041259765625, 1.17083740234375, 1.3004150390625, 1.42999267578125, 1.5595703125, 1.68914794921875, 1.8187255859375, 1.94830322265625, 2.077880859375, 2.20745849609375, 2.3370361328125, 2.46661376953125, 2.59619140625, 2.72576904296875, 2.8553466796875, 2.98492431640625, 3.114501953125, 3.24407958984375, 3.3736572265625, 3.50323486328125, 3.6328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 12.0, 17.0, 7.0, 14.0, 22.0, 22.0, 28.0, 38.0, 36.0, 39.0, 51.0, 66.0, 43.0, 54.0, 51.0, 52.0, 50.0, 60.0, 44.0, 45.0, 38.0, 31.0, 35.0, 26.0, 11.0, 22.0, 19.0, 9.0, 12.0, 5.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.3027229309082031, -0.29172515869140625, -0.2807273864746094, -0.2697296142578125, -0.2587318420410156, -0.24773406982421875, -0.23673629760742188, -0.225738525390625, -0.21474075317382812, -0.20374298095703125, -0.19274520874023438, -0.1817474365234375, -0.17074966430664062, -0.15975189208984375, -0.14875411987304688, -0.13775634765625, -0.12675857543945312, -0.11576080322265625, -0.10476303100585938, -0.0937652587890625, -0.08276748657226562, -0.07176971435546875, -0.060771942138671875, -0.049774169921875, -0.038776397705078125, -0.02777862548828125, -0.016780853271484375, -0.0057830810546875, 0.005214691162109375, 0.01621246337890625, 0.027210235595703125, 0.0382080078125, 0.049205780029296875, 0.06020355224609375, 0.07120132446289062, 0.0821990966796875, 0.09319686889648438, 0.10419464111328125, 0.11519241333007812, 0.126190185546875, 0.13718795776367188, 0.14818572998046875, 0.15918350219726562, 0.1701812744140625, 0.18117904663085938, 0.19217681884765625, 0.20317459106445312, 0.21417236328125, 0.22517013549804688, 0.23616790771484375, 0.24716567993164062, 0.2581634521484375, 0.2691612243652344, 0.28015899658203125, 0.2911567687988281, 0.302154541015625, 0.3131523132324219, 0.32415008544921875, 0.3351478576660156, 0.3461456298828125, 0.3571434020996094, 0.36814117431640625, 0.3791389465332031, 0.39013671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 31.0, 79.0, 346.0, 3258.0, 1012672.0, 30883.0, 907.0, 139.0, 40.0, 26.0, 12.0, 18.0, 11.0, 7.0, 6.0, 11.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.09375, -12.6044921875, -12.115234375, -11.6259765625, -11.13671875, -10.6474609375, -10.158203125, -9.6689453125, -9.1796875, -8.6904296875, -8.201171875, -7.7119140625, -7.22265625, -6.7333984375, -6.244140625, -5.7548828125, -5.265625, -4.7763671875, -4.287109375, -3.7978515625, -3.30859375, -2.8193359375, -2.330078125, -1.8408203125, -1.3515625, -0.8623046875, -0.373046875, 0.1162109375, 0.60546875, 1.0947265625, 1.583984375, 2.0732421875, 2.5625, 3.0517578125, 3.541015625, 4.0302734375, 4.51953125, 5.0087890625, 5.498046875, 5.9873046875, 6.4765625, 6.9658203125, 7.455078125, 7.9443359375, 8.43359375, 8.9228515625, 9.412109375, 9.9013671875, 10.390625, 10.8798828125, 11.369140625, 11.8583984375, 12.34765625, 12.8369140625, 13.326171875, 13.8154296875, 14.3046875, 14.7939453125, 15.283203125, 15.7724609375, 16.26171875, 16.7509765625, 17.240234375, 17.7294921875, 18.21875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 46.0, 275.0, 439.0, 82.0, 22.0, 9.0, 4.0, 3.0, 11.0, 7.0, 9.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022125244140625, -0.0021167993545532227, -0.0020210742950439453, -0.001925349235534668, -0.0018296241760253906, -0.0017338991165161133, -0.001638174057006836, -0.0015424489974975586, -0.0014467239379882812, -0.001350998878479004, -0.0012552738189697266, -0.0011595487594604492, -0.0010638236999511719, -0.0009680986404418945, -0.0008723735809326172, -0.0007766485214233398, -0.0006809234619140625, -0.0005851984024047852, -0.0004894733428955078, -0.00039374828338623047, -0.0002980232238769531, -0.00020229816436767578, -0.00010657310485839844, -1.0848045349121094e-05, 8.487701416015625e-05, 0.0001806020736694336, 0.00027632713317871094, 0.0003720521926879883, 0.0004677772521972656, 0.000563502311706543, 0.0006592273712158203, 0.0007549524307250977, 0.000850677490234375, 0.0009464025497436523, 0.0010421276092529297, 0.001137852668762207, 0.0012335777282714844, 0.0013293027877807617, 0.001425027847290039, 0.0015207529067993164, 0.0016164779663085938, 0.001712203025817871, 0.0018079280853271484, 0.0019036531448364258, 0.001999378204345703, 0.0020951032638549805, 0.002190828323364258, 0.002286553382873535, 0.0023822784423828125, 0.00247800350189209, 0.002573728561401367, 0.0026694536209106445, 0.002765178680419922, 0.0028609037399291992, 0.0029566287994384766, 0.003052353858947754, 0.0031480789184570312, 0.0032438039779663086, 0.003339529037475586, 0.0034352540969848633, 0.0035309791564941406, 0.003626704216003418, 0.0037224292755126953, 0.0038181543350219727, 0.00391387939453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 9.0, 9.0, 5.0, 13.0, 22.0, 21.0, 54.0, 52.0, 75.0, 126.0, 201.0, 266.0, 410.0, 733.0, 1268.0, 2222.0, 4205.0, 8595.0, 21763.0, 95944.0, 795824.0, 78667.0, 20337.0, 8253.0, 3928.0, 2159.0, 1159.0, 722.0, 480.0, 301.0, 219.0, 154.0, 105.0, 63.0, 48.0, 37.0, 25.0, 26.0, 14.0, 6.0, 11.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.499481201171875, -3.37200927734375, -3.244537353515625, -3.1170654296875, -2.989593505859375, -2.86212158203125, -2.734649658203125, -2.607177734375, -2.479705810546875, -2.35223388671875, -2.224761962890625, -2.0972900390625, -1.969818115234375, -1.84234619140625, -1.714874267578125, -1.58740234375, -1.459930419921875, -1.33245849609375, -1.204986572265625, -1.0775146484375, -0.950042724609375, -0.82257080078125, -0.695098876953125, -0.567626953125, -0.440155029296875, -0.31268310546875, -0.185211181640625, -0.0577392578125, 0.069732666015625, 0.19720458984375, 0.324676513671875, 0.4521484375, 0.579620361328125, 0.70709228515625, 0.834564208984375, 0.9620361328125, 1.089508056640625, 1.21697998046875, 1.344451904296875, 1.471923828125, 1.599395751953125, 1.72686767578125, 1.854339599609375, 1.9818115234375, 2.109283447265625, 2.23675537109375, 2.364227294921875, 2.49169921875, 2.619171142578125, 2.74664306640625, 2.874114990234375, 3.0015869140625, 3.129058837890625, 3.25653076171875, 3.384002685546875, 3.511474609375, 3.638946533203125, 3.76641845703125, 3.893890380859375, 4.0213623046875, 4.148834228515625, 4.27630615234375, 4.403778076171875, 4.53125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 16.0, 28.0, 30.0, 103.0, 190.0, 263.0, 158.0, 44.0, 32.0, 20.0, 18.0, 13.0, 9.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.640625, -1.57037353515625, -1.5001220703125, -1.42987060546875, -1.359619140625, -1.28936767578125, -1.2191162109375, -1.14886474609375, -1.07861328125, -1.00836181640625, -0.9381103515625, -0.86785888671875, -0.797607421875, -0.72735595703125, -0.6571044921875, -0.58685302734375, -0.5166015625, -0.44635009765625, -0.3760986328125, -0.30584716796875, -0.235595703125, -0.16534423828125, -0.0950927734375, -0.02484130859375, 0.04541015625, 0.11566162109375, 0.1859130859375, 0.25616455078125, 0.326416015625, 0.39666748046875, 0.4669189453125, 0.53717041015625, 0.607421875, 0.67767333984375, 0.7479248046875, 0.81817626953125, 0.888427734375, 0.95867919921875, 1.0289306640625, 1.09918212890625, 1.16943359375, 1.23968505859375, 1.3099365234375, 1.38018798828125, 1.450439453125, 1.52069091796875, 1.5909423828125, 1.66119384765625, 1.7314453125, 1.80169677734375, 1.8719482421875, 1.94219970703125, 2.012451171875, 2.08270263671875, 2.1529541015625, 2.22320556640625, 2.29345703125, 2.36370849609375, 2.4339599609375, 2.50421142578125, 2.574462890625, 2.64471435546875, 2.7149658203125, 2.78521728515625, 2.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 18.0, 30.0, 61.0, 109.0, 160.0, 235.0, 160.0, 104.0, 54.0, 22.0, 12.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40109634399414, -13.04529094696045, -12.689485549926758, -12.333680152893066, -11.977874755859375, -11.6220703125, -11.266263961791992, -10.910459518432617, -10.554654121398926, -10.198848724365234, -9.843043327331543, -9.487237930297852, -9.13143253326416, -8.775627136230469, -8.419822692871094, -8.064017295837402, -7.708211421966553, -7.352406024932861, -6.99660062789917, -6.640795707702637, -6.284990310668945, -5.929184913635254, -5.5733795166015625, -5.217574119567871, -4.86176872253418, -4.505963325500488, -4.150157928466797, -3.7943527698516846, -3.4385476112365723, -3.082742214202881, -2.7269368171691895, -2.371131658554077, -2.015326499938965, -1.659521222114563, -1.3037159442901611, -0.9479105472564697, -0.5921052694320679, -0.23629999160766602, 0.11950540542602539, 0.4753105640411377, 0.8311159610748291, 1.186921238899231, 1.5427265167236328, 1.8985319137573242, 2.2543373107910156, 2.610142469406128, 2.9659478664398193, 3.3217530250549316, 3.677558422088623, 4.0333638191223145, 4.389169216156006, 4.744974136352539, 5.1007795333862305, 5.456584930419922, 5.812390327453613, 6.168195724487305, 6.524001121520996, 6.8798065185546875, 7.235611915588379, 7.59141731262207, 7.9472222328186035, 8.303028106689453, 8.658832550048828, 9.01463794708252, 9.370443344116211]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 9.0, 13.0, 12.0, 16.0, 17.0, 19.0, 23.0, 30.0, 39.0, 26.0, 46.0, 46.0, 44.0, 47.0, 40.0, 50.0, 48.0, 44.0, 45.0, 48.0, 39.0, 35.0, 34.0, 27.0, 29.0, 34.0, 19.0, 16.0, 17.0, 8.0, 21.0, 11.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.948370933532715, -2.8556225299835205, -2.7628743648529053, -2.670125961303711, -2.5773775577545166, -2.4846293926239014, -2.391880989074707, -2.299132823944092, -2.2063844203948975, -2.113636016845703, -2.020887851715088, -1.9281394481658936, -1.8353911638259888, -1.742642879486084, -1.6498944759368896, -1.5571461915969849, -1.4643977880477905, -1.3716495037078857, -1.2789011001586914, -1.1861528158187866, -1.0934045314788818, -1.0006561279296875, -0.9079078435897827, -0.8151595592498779, -0.7224112153053284, -0.6296628713607788, -0.536914587020874, -0.44416624307632446, -0.3514179289340973, -0.2586696147918701, -0.16592127084732056, -0.07317298650741577, 0.01957535743713379, 0.11232367902994156, 0.20507200062274933, 0.2978203296661377, 0.39056864380836487, 0.48331695795059204, 0.5760653018951416, 0.6688135862350464, 0.761561930179596, 0.8543102741241455, 0.9470585584640503, 1.039806842803955, 1.1325552463531494, 1.2253035306930542, 1.318051815032959, 1.4108002185821533, 1.503548502922058, 1.596296787261963, 1.6890451908111572, 1.781793475151062, 1.8745417594909668, 1.9672901630401611, 2.0600385665893555, 2.1527867317199707, 2.245535135269165, 2.3382835388183594, 2.4310317039489746, 2.523780107498169, 2.6165285110473633, 2.7092766761779785, 2.802025079727173, 2.894773483276367, 2.9875216484069824]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 7.0, 7.0, 8.0, 17.0, 33.0, 35.0, 37.0, 69.0, 129.0, 295.0, 982.0, 5318.0, 68001.0, 4050005.0, 62216.0, 5372.0, 1001.0, 294.0, 149.0, 71.0, 59.0, 37.0, 33.0, 29.0, 15.0, 16.0, 13.0, 8.0, 8.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.19451904296875, -4.9984130859375, -4.80230712890625, -4.606201171875, -4.41009521484375, -4.2139892578125, -4.01788330078125, -3.82177734375, -3.62567138671875, -3.4295654296875, -3.23345947265625, -3.037353515625, -2.84124755859375, -2.6451416015625, -2.44903564453125, -2.2529296875, -2.05682373046875, -1.8607177734375, -1.66461181640625, -1.468505859375, -1.27239990234375, -1.0762939453125, -0.88018798828125, -0.68408203125, -0.48797607421875, -0.2918701171875, -0.09576416015625, 0.100341796875, 0.29644775390625, 0.4925537109375, 0.68865966796875, 0.884765625, 1.08087158203125, 1.2769775390625, 1.47308349609375, 1.669189453125, 1.86529541015625, 2.0614013671875, 2.25750732421875, 2.45361328125, 2.64971923828125, 2.8458251953125, 3.04193115234375, 3.238037109375, 3.43414306640625, 3.6302490234375, 3.82635498046875, 4.0224609375, 4.21856689453125, 4.4146728515625, 4.61077880859375, 4.806884765625, 5.00299072265625, 5.1990966796875, 5.39520263671875, 5.59130859375, 5.78741455078125, 5.9835205078125, 6.17962646484375, 6.375732421875, 6.57183837890625, 6.7679443359375, 6.96405029296875, 7.16015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 20.0, 15.0, 19.0, 36.0, 42.0, 58.0, 57.0, 53.0, 55.0, 55.0, 70.0, 57.0, 58.0, 55.0, 42.0, 53.0, 41.0, 36.0, 32.0, 23.0, 27.0, 21.0, 8.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06856441497802734, -0.06626701354980469, -0.06396961212158203, -0.061672210693359375, -0.05937480926513672, -0.05707740783691406, -0.054780006408691406, -0.05248260498046875, -0.050185203552246094, -0.04788780212402344, -0.04559040069580078, -0.043292999267578125, -0.04099559783935547, -0.03869819641113281, -0.036400794982910156, -0.0341033935546875, -0.031805992126464844, -0.029508590698242188, -0.02721118927001953, -0.024913787841796875, -0.02261638641357422, -0.020318984985351562, -0.018021583557128906, -0.01572418212890625, -0.013426780700683594, -0.011129379272460938, -0.008831977844238281, -0.006534576416015625, -0.004237174987792969, -0.0019397735595703125, 0.00035762786865234375, 0.002655029296875, 0.004952430725097656, 0.0072498321533203125, 0.009547233581542969, 0.011844635009765625, 0.014142036437988281, 0.016439437866210938, 0.018736839294433594, 0.02103424072265625, 0.023331642150878906, 0.025629043579101562, 0.02792644500732422, 0.030223846435546875, 0.03252124786376953, 0.03481864929199219, 0.037116050720214844, 0.0394134521484375, 0.041710853576660156, 0.04400825500488281, 0.04630565643310547, 0.048603057861328125, 0.05090045928955078, 0.05319786071777344, 0.055495262145996094, 0.05779266357421875, 0.060090065002441406, 0.06238746643066406, 0.06468486785888672, 0.06698226928710938, 0.06927967071533203, 0.07157707214355469, 0.07387447357177734, 0.076171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 12.0, 25.0, 27.0, 46.0, 100.0, 256.0, 1112.0, 41931.0, 4140417.0, 9423.0, 553.0, 161.0, 81.0, 44.0, 29.0, 10.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.433349609375, -8.99169921875, -8.550048828125, -8.1083984375, -7.666748046875, -7.22509765625, -6.783447265625, -6.341796875, -5.900146484375, -5.45849609375, -5.016845703125, -4.5751953125, -4.133544921875, -3.69189453125, -3.250244140625, -2.80859375, -2.366943359375, -1.92529296875, -1.483642578125, -1.0419921875, -0.600341796875, -0.15869140625, 0.282958984375, 0.724609375, 1.166259765625, 1.60791015625, 2.049560546875, 2.4912109375, 2.932861328125, 3.37451171875, 3.816162109375, 4.2578125, 4.699462890625, 5.14111328125, 5.582763671875, 6.0244140625, 6.466064453125, 6.90771484375, 7.349365234375, 7.791015625, 8.232666015625, 8.67431640625, 9.115966796875, 9.5576171875, 9.999267578125, 10.44091796875, 10.882568359375, 11.32421875, 11.765869140625, 12.20751953125, 12.649169921875, 13.0908203125, 13.532470703125, 13.97412109375, 14.415771484375, 14.857421875, 15.299072265625, 15.74072265625, 16.182373046875, 16.6240234375, 17.065673828125, 17.50732421875, 17.948974609375, 18.390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 9.0, 8.0, 19.0, 33.0, 35.0, 59.0, 71.0, 118.0, 195.0, 400.0, 1504.0, 775.0, 299.0, 201.0, 115.0, 59.0, 46.0, 41.0, 15.0, 21.0, 13.0, 8.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35433197021484375, -0.3441619873046875, -0.33399200439453125, -0.323822021484375, -0.31365203857421875, -0.3034820556640625, -0.29331207275390625, -0.28314208984375, -0.27297210693359375, -0.2628021240234375, -0.25263214111328125, -0.242462158203125, -0.23229217529296875, -0.2221221923828125, -0.21195220947265625, -0.2017822265625, -0.19161224365234375, -0.1814422607421875, -0.17127227783203125, -0.161102294921875, -0.15093231201171875, -0.1407623291015625, -0.13059234619140625, -0.12042236328125, -0.11025238037109375, -0.1000823974609375, -0.08991241455078125, -0.079742431640625, -0.06957244873046875, -0.0594024658203125, -0.04923248291015625, -0.0390625, -0.02889251708984375, -0.0187225341796875, -0.00855255126953125, 0.001617431640625, 0.01178741455078125, 0.0219573974609375, 0.03212738037109375, 0.04229736328125, 0.05246734619140625, 0.0626373291015625, 0.07280731201171875, 0.082977294921875, 0.09314727783203125, 0.1033172607421875, 0.11348724365234375, 0.1236572265625, 0.13382720947265625, 0.1439971923828125, 0.15416717529296875, 0.164337158203125, 0.17450714111328125, 0.1846771240234375, 0.19484710693359375, 0.20501708984375, 0.21518707275390625, 0.2253570556640625, 0.23552703857421875, 0.245697021484375, 0.25586700439453125, 0.2660369873046875, 0.27620697021484375, 0.286376953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 27.0, 189.0, 477.0, 269.0, 36.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.40032196044922, -20.019495010375977, -19.638669967651367, -19.257843017578125, -18.877017974853516, -18.496191024780273, -18.115365982055664, -17.734539031982422, -17.353713989257812, -16.97288703918457, -16.59206199645996, -16.21123504638672, -15.83041000366211, -15.449584007263184, -15.068758010864258, -14.687931060791016, -14.30710506439209, -13.926279067993164, -13.545453071594238, -13.164627075195312, -12.783801078796387, -12.402975082397461, -12.022148132324219, -11.64132308959961, -11.260496139526367, -10.879670143127441, -10.498844146728516, -10.11801815032959, -9.737192153930664, -9.356366157531738, -8.975540161132812, -8.59471321105957, -8.213887214660645, -7.833061218261719, -7.452235221862793, -7.071409225463867, -6.690583229064941, -6.309757232666016, -5.928930759429932, -5.548104763031006, -5.167279243469238, -4.7864532470703125, -4.405627250671387, -4.024801254272461, -3.643975019454956, -3.2631490230560303, -2.8823227882385254, -2.5014967918395996, -2.1206705570220947, -1.739844560623169, -1.3590184450149536, -0.9781923294067383, -0.5973663330078125, -0.21654033660888672, 0.16428589820861816, 0.545111894607544, 0.9259378910064697, 1.3067638874053955, 1.6875900030136108, 2.068416118621826, 2.449242115020752, 2.8300681114196777, 3.2108943462371826, 3.5917203426361084, 3.972546339035034]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 7.0, 14.0, 4.0, 9.0, 9.0, 14.0, 14.0, 22.0, 18.0, 28.0, 38.0, 27.0, 30.0, 31.0, 31.0, 32.0, 55.0, 51.0, 42.0, 57.0, 48.0, 44.0, 48.0, 43.0, 33.0, 28.0, 23.0, 30.0, 31.0, 23.0, 24.0, 11.0, 16.0, 11.0, 6.0, 11.0, 4.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.947307825088501, -0.9157190918922424, -0.8841303586959839, -0.8525416254997253, -0.8209528923034668, -0.7893641591072083, -0.7577754259109497, -0.7261867523193359, -0.6945979595184326, -0.6630092263221741, -0.6314204931259155, -0.599831759929657, -0.5682430267333984, -0.5366542935371399, -0.5050655603408813, -0.4734768569469452, -0.44188815355300903, -0.4102994203567505, -0.37871068716049194, -0.3471219539642334, -0.31553322076797485, -0.2839444875717163, -0.25235578417778015, -0.2207670509815216, -0.18917831778526306, -0.15758958458900452, -0.12600085139274597, -0.09441213309764862, -0.06282339990139008, -0.03123466670513153, 0.0003540515899658203, 0.031942784786224365, 0.06353151798248291, 0.09512025117874146, 0.126708984375, 0.15829770267009735, 0.1898864358663559, 0.22147516906261444, 0.2530638873577118, 0.28465262055397034, 0.3162413537502289, 0.3478300869464874, 0.37941882014274597, 0.41100752353668213, 0.4425962567329407, 0.4741849899291992, 0.5057737231254578, 0.5373624563217163, 0.5689511895179749, 0.6005399227142334, 0.6321286559104919, 0.6637173891067505, 0.695306122303009, 0.7268948554992676, 0.7584835290908813, 0.7900723218917847, 0.8216609954833984, 0.853249728679657, 0.8848384618759155, 0.9164271950721741, 0.9480159282684326, 0.9796046614646912, 1.0111933946609497, 1.0427820682525635, 1.0743708610534668]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 10.0, 15.0, 12.0, 20.0, 21.0, 27.0, 38.0, 38.0, 59.0, 108.0, 1651.0, 195599.0, 839217.0, 11018.0, 349.0, 81.0, 62.0, 50.0, 39.0, 25.0, 20.0, 24.0, 15.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.48046875, -5.304931640625, -5.12939453125, -4.953857421875, -4.7783203125, -4.602783203125, -4.42724609375, -4.251708984375, -4.076171875, -3.900634765625, -3.72509765625, -3.549560546875, -3.3740234375, -3.198486328125, -3.02294921875, -2.847412109375, -2.671875, -2.496337890625, -2.32080078125, -2.145263671875, -1.9697265625, -1.794189453125, -1.61865234375, -1.443115234375, -1.267578125, -1.092041015625, -0.91650390625, -0.740966796875, -0.5654296875, -0.389892578125, -0.21435546875, -0.038818359375, 0.13671875, 0.312255859375, 0.48779296875, 0.663330078125, 0.8388671875, 1.014404296875, 1.18994140625, 1.365478515625, 1.541015625, 1.716552734375, 1.89208984375, 2.067626953125, 2.2431640625, 2.418701171875, 2.59423828125, 2.769775390625, 2.9453125, 3.120849609375, 3.29638671875, 3.471923828125, 3.6474609375, 3.822998046875, 3.99853515625, 4.174072265625, 4.349609375, 4.525146484375, 4.70068359375, 4.876220703125, 5.0517578125, 5.227294921875, 5.40283203125, 5.578369140625, 5.75390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 21.0, 16.0, 18.0, 24.0, 26.0, 27.0, 46.0, 24.0, 37.0, 49.0, 53.0, 52.0, 46.0, 43.0, 62.0, 41.0, 44.0, 55.0, 44.0, 37.0, 43.0, 27.0, 28.0, 21.0, 21.0, 14.0, 16.0, 1.0, 14.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0753173828125, -0.07300186157226562, -0.07068634033203125, -0.06837081909179688, -0.0660552978515625, -0.06373977661132812, -0.06142425537109375, -0.059108734130859375, -0.056793212890625, -0.054477691650390625, -0.05216217041015625, -0.049846649169921875, -0.0475311279296875, -0.045215606689453125, -0.04290008544921875, -0.040584564208984375, -0.03826904296875, -0.035953521728515625, -0.03363800048828125, -0.031322479248046875, -0.0290069580078125, -0.026691436767578125, -0.02437591552734375, -0.022060394287109375, -0.019744873046875, -0.017429351806640625, -0.01511383056640625, -0.012798309326171875, -0.0104827880859375, -0.008167266845703125, -0.00585174560546875, -0.003536224365234375, -0.001220703125, 0.001094818115234375, 0.00341033935546875, 0.005725860595703125, 0.0080413818359375, 0.010356903076171875, 0.01267242431640625, 0.014987945556640625, 0.017303466796875, 0.019618988037109375, 0.02193450927734375, 0.024250030517578125, 0.0265655517578125, 0.028881072998046875, 0.03119659423828125, 0.033512115478515625, 0.03582763671875, 0.038143157958984375, 0.04045867919921875, 0.042774200439453125, 0.0450897216796875, 0.047405242919921875, 0.04972076416015625, 0.052036285400390625, 0.054351806640625, 0.056667327880859375, 0.05898284912109375, 0.061298370361328125, 0.0636138916015625, 0.06592941284179688, 0.06824493408203125, 0.07056045532226562, 0.0728759765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 13.0, 15.0, 15.0, 21.0, 42.0, 59.0, 84.0, 96.0, 159.0, 231.0, 289.0, 499.0, 764.0, 1314.0, 2464.0, 5284.0, 13613.0, 40183.0, 121345.0, 295639.0, 331863.0, 152119.0, 51497.0, 17388.0, 6508.0, 3009.0, 1473.0, 862.0, 572.0, 342.0, 208.0, 154.0, 103.0, 80.0, 60.0, 36.0, 37.0, 22.0, 22.0, 17.0, 10.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.3984375, -1.354888916015625, -1.31134033203125, -1.267791748046875, -1.2242431640625, -1.180694580078125, -1.13714599609375, -1.093597412109375, -1.050048828125, -1.006500244140625, -0.96295166015625, -0.919403076171875, -0.8758544921875, -0.832305908203125, -0.78875732421875, -0.745208740234375, -0.70166015625, -0.658111572265625, -0.61456298828125, -0.571014404296875, -0.5274658203125, -0.483917236328125, -0.44036865234375, -0.396820068359375, -0.353271484375, -0.309722900390625, -0.26617431640625, -0.222625732421875, -0.1790771484375, -0.135528564453125, -0.09197998046875, -0.048431396484375, -0.0048828125, 0.038665771484375, 0.08221435546875, 0.125762939453125, 0.1693115234375, 0.212860107421875, 0.25640869140625, 0.299957275390625, 0.343505859375, 0.387054443359375, 0.43060302734375, 0.474151611328125, 0.5177001953125, 0.561248779296875, 0.60479736328125, 0.648345947265625, 0.69189453125, 0.735443115234375, 0.77899169921875, 0.822540283203125, 0.8660888671875, 0.909637451171875, 0.95318603515625, 0.996734619140625, 1.040283203125, 1.083831787109375, 1.12738037109375, 1.170928955078125, 1.2144775390625, 1.258026123046875, 1.30157470703125, 1.345123291015625, 1.388671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 9.0, 15.0, 11.0, 17.0, 18.0, 22.0, 33.0, 44.0, 41.0, 49.0, 62.0, 57.0, 55.0, 70.0, 72.0, 48.0, 50.0, 53.0, 37.0, 36.0, 36.0, 30.0, 23.0, 21.0, 21.0, 11.0, 13.0, 15.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.640625, -0.621734619140625, -0.60284423828125, -0.583953857421875, -0.5650634765625, -0.546173095703125, -0.52728271484375, -0.508392333984375, -0.489501953125, -0.470611572265625, -0.45172119140625, -0.432830810546875, -0.4139404296875, -0.395050048828125, -0.37615966796875, -0.357269287109375, -0.33837890625, -0.319488525390625, -0.30059814453125, -0.281707763671875, -0.2628173828125, -0.243927001953125, -0.22503662109375, -0.206146240234375, -0.187255859375, -0.168365478515625, -0.14947509765625, -0.130584716796875, -0.1116943359375, -0.092803955078125, -0.07391357421875, -0.055023193359375, -0.0361328125, -0.017242431640625, 0.00164794921875, 0.020538330078125, 0.0394287109375, 0.058319091796875, 0.07720947265625, 0.096099853515625, 0.114990234375, 0.133880615234375, 0.15277099609375, 0.171661376953125, 0.1905517578125, 0.209442138671875, 0.22833251953125, 0.247222900390625, 0.26611328125, 0.285003662109375, 0.30389404296875, 0.322784423828125, 0.3416748046875, 0.360565185546875, 0.37945556640625, 0.398345947265625, 0.417236328125, 0.436126708984375, 0.45501708984375, 0.473907470703125, 0.4927978515625, 0.511688232421875, 0.53057861328125, 0.549468994140625, 0.568359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 14.0, 24.0, 22.0, 45.0, 56.0, 78.0, 116.0, 184.0, 322.0, 597.0, 1214.0, 2652.0, 7086.0, 21608.0, 83277.0, 322944.0, 424135.0, 134427.0, 33028.0, 9830.0, 3593.0, 1574.0, 710.0, 347.0, 205.0, 150.0, 96.0, 59.0, 36.0, 26.0, 29.0, 16.0, 14.0, 10.0, 8.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.666259765625, -1.61279296875, -1.559326171875, -1.505859375, -1.452392578125, -1.39892578125, -1.345458984375, -1.2919921875, -1.238525390625, -1.18505859375, -1.131591796875, -1.078125, -1.024658203125, -0.97119140625, -0.917724609375, -0.8642578125, -0.810791015625, -0.75732421875, -0.703857421875, -0.650390625, -0.596923828125, -0.54345703125, -0.489990234375, -0.4365234375, -0.383056640625, -0.32958984375, -0.276123046875, -0.22265625, -0.169189453125, -0.11572265625, -0.062255859375, -0.0087890625, 0.044677734375, 0.09814453125, 0.151611328125, 0.205078125, 0.258544921875, 0.31201171875, 0.365478515625, 0.4189453125, 0.472412109375, 0.52587890625, 0.579345703125, 0.6328125, 0.686279296875, 0.73974609375, 0.793212890625, 0.8466796875, 0.900146484375, 0.95361328125, 1.007080078125, 1.060546875, 1.114013671875, 1.16748046875, 1.220947265625, 1.2744140625, 1.327880859375, 1.38134765625, 1.434814453125, 1.48828125, 1.541748046875, 1.59521484375, 1.648681640625, 1.7021484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 1.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 20.0, 28.0, 28.0, 42.0, 47.0, 67.0, 79.0, 85.0, 91.0, 88.0, 72.0, 72.0, 37.0, 36.0, 22.0, 22.0, 16.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00026607513427734375, -0.0002579018473625183, -0.00024972856044769287, -0.00024155527353286743, -0.000233381986618042, -0.00022520869970321655, -0.0002170354127883911, -0.00020886212587356567, -0.00020068883895874023, -0.0001925155520439148, -0.00018434226512908936, -0.00017616897821426392, -0.00016799569129943848, -0.00015982240438461304, -0.0001516491174697876, -0.00014347583055496216, -0.00013530254364013672, -0.00012712925672531128, -0.00011895596981048584, -0.0001107826828956604, -0.00010260939598083496, -9.443610906600952e-05, -8.626282215118408e-05, -7.808953523635864e-05, -6.99162483215332e-05, -6.174296140670776e-05, -5.3569674491882324e-05, -4.5396387577056885e-05, -3.7223100662231445e-05, -2.9049813747406006e-05, -2.0876526832580566e-05, -1.2703239917755127e-05, -4.5299530029296875e-06, 3.643333911895752e-06, 1.1816620826721191e-05, 1.998990774154663e-05, 2.816319465637207e-05, 3.633648157119751e-05, 4.450976848602295e-05, 5.268305540084839e-05, 6.085634231567383e-05, 6.902962923049927e-05, 7.720291614532471e-05, 8.537620306015015e-05, 9.354948997497559e-05, 0.00010172277688980103, 0.00010989606380462646, 0.0001180693507194519, 0.00012624263763427734, 0.00013441592454910278, 0.00014258921146392822, 0.00015076249837875366, 0.0001589357852935791, 0.00016710907220840454, 0.00017528235912322998, 0.00018345564603805542, 0.00019162893295288086, 0.0001998022198677063, 0.00020797550678253174, 0.00021614879369735718, 0.00022432208061218262, 0.00023249536752700806, 0.0002406686544418335, 0.00024884194135665894, 0.0002570152282714844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 12.0, 15.0, 35.0, 39.0, 69.0, 117.0, 223.0, 454.0, 954.0, 2575.0, 8851.0, 50048.0, 398278.0, 500715.0, 69774.0, 11145.0, 3046.0, 1148.0, 472.0, 263.0, 125.0, 73.0, 25.0, 28.0, 19.0, 9.0, 7.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.80078125, -2.725250244140625, -2.64971923828125, -2.574188232421875, -2.4986572265625, -2.423126220703125, -2.34759521484375, -2.272064208984375, -2.196533203125, -2.121002197265625, -2.04547119140625, -1.969940185546875, -1.8944091796875, -1.818878173828125, -1.74334716796875, -1.667816162109375, -1.59228515625, -1.516754150390625, -1.44122314453125, -1.365692138671875, -1.2901611328125, -1.214630126953125, -1.13909912109375, -1.063568115234375, -0.988037109375, -0.912506103515625, -0.83697509765625, -0.761444091796875, -0.6859130859375, -0.610382080078125, -0.53485107421875, -0.459320068359375, -0.3837890625, -0.308258056640625, -0.23272705078125, -0.157196044921875, -0.0816650390625, -0.006134033203125, 0.06939697265625, 0.144927978515625, 0.220458984375, 0.295989990234375, 0.37152099609375, 0.447052001953125, 0.5225830078125, 0.598114013671875, 0.67364501953125, 0.749176025390625, 0.82470703125, 0.900238037109375, 0.97576904296875, 1.051300048828125, 1.1268310546875, 1.202362060546875, 1.27789306640625, 1.353424072265625, 1.428955078125, 1.504486083984375, 1.58001708984375, 1.655548095703125, 1.7310791015625, 1.806610107421875, 1.88214111328125, 1.957672119140625, 2.033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 8.0, 18.0, 16.0, 14.0, 22.0, 31.0, 29.0, 40.0, 38.0, 50.0, 66.0, 65.0, 49.0, 45.0, 44.0, 62.0, 55.0, 51.0, 47.0, 46.0, 35.0, 27.0, 28.0, 20.0, 13.0, 10.0, 9.0, 7.0, 9.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59765625, -0.5804367065429688, -0.5632171630859375, -0.5459976196289062, -0.528778076171875, -0.5115585327148438, -0.4943389892578125, -0.47711944580078125, -0.45989990234375, -0.44268035888671875, -0.4254608154296875, -0.40824127197265625, -0.391021728515625, -0.37380218505859375, -0.3565826416015625, -0.33936309814453125, -0.3221435546875, -0.30492401123046875, -0.2877044677734375, -0.27048492431640625, -0.253265380859375, -0.23604583740234375, -0.2188262939453125, -0.20160675048828125, -0.18438720703125, -0.16716766357421875, -0.1499481201171875, -0.13272857666015625, -0.115509033203125, -0.09828948974609375, -0.0810699462890625, -0.06385040283203125, -0.046630859375, -0.02941131591796875, -0.0121917724609375, 0.00502777099609375, 0.022247314453125, 0.03946685791015625, 0.0566864013671875, 0.07390594482421875, 0.09112548828125, 0.10834503173828125, 0.1255645751953125, 0.14278411865234375, 0.160003662109375, 0.17722320556640625, 0.1944427490234375, 0.21166229248046875, 0.2288818359375, 0.24610137939453125, 0.2633209228515625, 0.28054046630859375, 0.297760009765625, 0.31497955322265625, 0.3321990966796875, 0.34941864013671875, 0.36663818359375, 0.38385772705078125, 0.4010772705078125, 0.41829681396484375, 0.435516357421875, 0.45273590087890625, 0.4699554443359375, 0.48717498779296875, 0.50439453125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 19.0, 86.0, 249.0, 376.0, 191.0, 56.0, 23.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.846235752105713, -4.9172163009643555, -3.9881973266601562, -3.059178113937378, -2.1301589012145996, -1.2011399269104004, -0.27212047576904297, 0.6568989753723145, 1.5859179496765137, 2.514937162399292, 3.4439563751220703, 4.3729753494262695, 5.301994800567627, 6.231013774871826, 7.160033226013184, 8.089052200317383, 9.018072128295898, 9.947091102600098, 10.876110076904297, 11.805130004882812, 12.734148979187012, 13.663167953491211, 14.592187881469727, 15.521206855773926, 16.450225830078125, 17.37924575805664, 18.308263778686523, 19.23728370666504, 20.166301727294922, 21.095321655273438, 22.024341583251953, 22.95336151123047, 23.88237762451172, 24.811397552490234, 25.740415573120117, 26.669435501098633, 27.598453521728516, 28.52747344970703, 29.456493377685547, 30.385513305664062, 31.314531326293945, 32.24354934692383, 33.172569274902344, 34.10158920288086, 35.030609130859375, 35.959625244140625, 36.88864517211914, 37.817665100097656, 38.74668502807617, 39.67570495605469, 40.6047248840332, 41.53374099731445, 42.46276092529297, 43.391780853271484, 44.32080078125, 45.249820709228516, 46.17884063720703, 47.10786056518555, 48.03688049316406, 48.96589660644531, 49.89491653442383, 50.823936462402344, 51.75295639038086, 52.681976318359375, 53.610992431640625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 4.0, 15.0, 20.0, 14.0, 28.0, 36.0, 39.0, 38.0, 44.0, 46.0, 53.0, 53.0, 58.0, 48.0, 55.0, 67.0, 46.0, 46.0, 45.0, 42.0, 31.0, 29.0, 33.0, 20.0, 19.0, 11.0, 9.0, 12.0, 7.0, 4.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.695977210998535, -4.55609130859375, -4.416205883026123, -4.276319980621338, -4.136434078216553, -3.9965484142303467, -3.8566627502441406, -3.7167768478393555, -3.5768909454345703, -3.4370052814483643, -3.297119379043579, -3.157233715057373, -3.017347812652588, -2.877462148666382, -2.737576484680176, -2.5976905822753906, -2.4578049182891846, -2.3179192543029785, -2.1780333518981934, -2.0381476879119873, -1.8982617855072021, -1.758376121520996, -1.6184903383255005, -1.4786045551300049, -1.3387187719345093, -1.1988329887390137, -1.058947205543518, -0.9190614819526672, -0.7791756987571716, -0.639289915561676, -0.4994041919708252, -0.3595184087753296, -0.21963262557983398, -0.07974685728549957, 0.06013891100883484, 0.20002466440200806, 0.33991044759750366, 0.47979623079299927, 0.6196819543838501, 0.7595677375793457, 0.8994535207748413, 1.039339303970337, 1.1792250871658325, 1.3191108703613281, 1.4589965343475342, 1.5988824367523193, 1.7387681007385254, 1.878653883934021, 2.0185396671295166, 2.1584253311157227, 2.298311233520508, 2.438196897506714, 2.578082799911499, 2.717968463897705, 2.8578543663024902, 2.9977400302886963, 3.1376256942749023, 3.2775113582611084, 3.4173972606658936, 3.5572829246520996, 3.6971688270568848, 3.837054491043091, 3.976940155029297, 4.116826057434082, 4.256711959838867]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 13.0, 13.0, 17.0, 35.0, 33.0, 65.0, 88.0, 146.0, 355.0, 1182.0, 8371.0, 210532.0, 3937903.0, 31464.0, 2849.0, 615.0, 222.0, 102.0, 76.0, 40.0, 24.0, 25.0, 15.0, 17.0, 10.0, 11.0, 8.0, 6.0, 3.0, 3.0, 10.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.2734375, -8.0386962890625, -7.803955078125, -7.5692138671875, -7.33447265625, -7.0997314453125, -6.864990234375, -6.6302490234375, -6.3955078125, -6.1607666015625, -5.926025390625, -5.6912841796875, -5.45654296875, -5.2218017578125, -4.987060546875, -4.7523193359375, -4.517578125, -4.2828369140625, -4.048095703125, -3.8133544921875, -3.57861328125, -3.3438720703125, -3.109130859375, -2.8743896484375, -2.6396484375, -2.4049072265625, -2.170166015625, -1.9354248046875, -1.70068359375, -1.4659423828125, -1.231201171875, -0.9964599609375, -0.76171875, -0.5269775390625, -0.292236328125, -0.0574951171875, 0.17724609375, 0.4119873046875, 0.646728515625, 0.8814697265625, 1.1162109375, 1.3509521484375, 1.585693359375, 1.8204345703125, 2.05517578125, 2.2899169921875, 2.524658203125, 2.7593994140625, 2.994140625, 3.2288818359375, 3.463623046875, 3.6983642578125, 3.93310546875, 4.1678466796875, 4.402587890625, 4.6373291015625, 4.8720703125, 5.1068115234375, 5.341552734375, 5.5762939453125, 5.81103515625, 6.0457763671875, 6.280517578125, 6.5152587890625, 6.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 9.0, 19.0, 22.0, 33.0, 33.0, 50.0, 54.0, 73.0, 63.0, 84.0, 88.0, 80.0, 80.0, 74.0, 53.0, 34.0, 31.0, 26.0, 24.0, 20.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1724853515625, -0.1677417755126953, -0.16299819946289062, -0.15825462341308594, -0.15351104736328125, -0.14876747131347656, -0.14402389526367188, -0.1392803192138672, -0.1345367431640625, -0.1297931671142578, -0.12504959106445312, -0.12030601501464844, -0.11556243896484375, -0.11081886291503906, -0.10607528686523438, -0.10133171081542969, -0.096588134765625, -0.09184455871582031, -0.08710098266601562, -0.08235740661621094, -0.07761383056640625, -0.07287025451660156, -0.06812667846679688, -0.06338310241699219, -0.0586395263671875, -0.05389595031738281, -0.049152374267578125, -0.04440879821777344, -0.03966522216796875, -0.03492164611816406, -0.030178070068359375, -0.025434494018554688, -0.02069091796875, -0.015947341918945312, -0.011203765869140625, -0.0064601898193359375, -0.00171661376953125, 0.0030269622802734375, 0.007770538330078125, 0.012514114379882812, 0.0172576904296875, 0.022001266479492188, 0.026744842529296875, 0.03148841857910156, 0.03623199462890625, 0.04097557067871094, 0.045719146728515625, 0.05046272277832031, 0.055206298828125, 0.05994987487792969, 0.06469345092773438, 0.06943702697753906, 0.07418060302734375, 0.07892417907714844, 0.08366775512695312, 0.08841133117675781, 0.0931549072265625, 0.09789848327636719, 0.10264205932617188, 0.10738563537597656, 0.11212921142578125, 0.11687278747558594, 0.12161636352539062, 0.1263599395751953, 0.131103515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 23.0, 28.0, 60.0, 116.0, 144.0, 256.0, 388.0, 1713.0, 4179879.0, 10853.0, 363.0, 202.0, 113.0, 80.0, 35.0, 17.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.90625, -30.06298828125, -29.2197265625, -28.37646484375, -27.533203125, -26.68994140625, -25.8466796875, -25.00341796875, -24.16015625, -23.31689453125, -22.4736328125, -21.63037109375, -20.787109375, -19.94384765625, -19.1005859375, -18.25732421875, -17.4140625, -16.57080078125, -15.7275390625, -14.88427734375, -14.041015625, -13.19775390625, -12.3544921875, -11.51123046875, -10.66796875, -9.82470703125, -8.9814453125, -8.13818359375, -7.294921875, -6.45166015625, -5.6083984375, -4.76513671875, -3.921875, -3.07861328125, -2.2353515625, -1.39208984375, -0.548828125, 0.29443359375, 1.1376953125, 1.98095703125, 2.82421875, 3.66748046875, 4.5107421875, 5.35400390625, 6.197265625, 7.04052734375, 7.8837890625, 8.72705078125, 9.5703125, 10.41357421875, 11.2568359375, 12.10009765625, 12.943359375, 13.78662109375, 14.6298828125, 15.47314453125, 16.31640625, 17.15966796875, 18.0029296875, 18.84619140625, 19.689453125, 20.53271484375, 21.3759765625, 22.21923828125, 23.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 21.0, 95.0, 790.0, 2891.0, 246.0, 32.0, 10.0], "bins": [-4.74609375, -4.667285919189453, -4.588478088378906, -4.509670257568359, -4.4308624267578125, -4.352054595947266, -4.273246765136719, -4.194438934326172, -4.115631103515625, -4.036823272705078, -3.9580154418945312, -3.8792076110839844, -3.8003997802734375, -3.7215919494628906, -3.6427841186523438, -3.563976287841797, -3.48516845703125, -3.406360626220703, -3.3275527954101562, -3.2487449645996094, -3.1699371337890625, -3.0911293029785156, -3.0123214721679688, -2.933513641357422, -2.854705810546875, -2.775897979736328, -2.6970901489257812, -2.6182823181152344, -2.5394744873046875, -2.4606666564941406, -2.3818588256835938, -2.303050994873047, -2.2242431640625, -2.145435333251953, -2.0666275024414062, -1.9878196716308594, -1.9090118408203125, -1.8302040100097656, -1.7513961791992188, -1.6725883483886719, -1.593780517578125, -1.5149726867675781, -1.4361648559570312, -1.3573570251464844, -1.2785491943359375, -1.1997413635253906, -1.1209335327148438, -1.0421257019042969, -0.96331787109375, -0.8845100402832031, -0.8057022094726562, -0.7268943786621094, -0.6480865478515625, -0.5692787170410156, -0.49047088623046875, -0.4116630554199219, -0.332855224609375, -0.2540473937988281, -0.17523956298828125, -0.09643173217773438, -0.0176239013671875, 0.061183929443359375, 0.13999176025390625, 0.21879959106445312, 0.297607421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 33.0, 143.0, 544.0, 230.0, 36.0, 12.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.44783020019531, -42.63691711425781, -41.82600402832031, -41.01509094238281, -40.20417785644531, -39.39326858520508, -38.58235549926758, -37.77144241333008, -36.96052932739258, -36.14961624145508, -35.33870315551758, -34.52779006958008, -33.716880798339844, -32.905967712402344, -32.095054626464844, -31.284141540527344, -30.473228454589844, -29.662315368652344, -28.851402282714844, -28.040491104125977, -27.229578018188477, -26.418664932250977, -25.60775375366211, -24.79684066772461, -23.98592758178711, -23.17501449584961, -22.36410140991211, -21.553190231323242, -20.742277145385742, -19.931364059448242, -19.120452880859375, -18.309539794921875, -17.498624801635742, -16.687711715698242, -15.876799583435059, -15.065887451171875, -14.254974365234375, -13.444061279296875, -12.633149147033691, -11.822237014770508, -11.011323928833008, -10.200410842895508, -9.389498710632324, -8.57858657836914, -7.767673492431641, -6.956760883331299, -6.145848274230957, -5.334935665130615, -4.524023056030273, -3.7131104469299316, -2.90219783782959, -2.091285228729248, -1.2803726196289062, -0.46946001052856445, 0.34145259857177734, 1.1523652076721191, 1.963277816772461, 2.7741904258728027, 3.5851030349731445, 4.396015644073486, 5.206928253173828, 6.01784086227417, 6.828753471374512, 7.6396660804748535, 8.450578689575195]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 18.0, 37.0, 44.0, 76.0, 109.0, 135.0, 160.0, 130.0, 87.0, 82.0, 63.0, 35.0, 10.0, 10.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.518835067749023, -12.085025787353516, -11.651217460632324, -11.217408180236816, -10.783599853515625, -10.349790573120117, -9.91598129272461, -9.482172012329102, -9.04836368560791, -8.614554405212402, -8.180746078491211, -7.746936798095703, -7.3131279945373535, -6.879319190979004, -6.445509910583496, -6.0117011070251465, -5.577892303466797, -5.144083499908447, -4.710274696350098, -4.27646541595459, -3.8426566123962402, -3.4088478088378906, -2.975038766860962, -2.541229724884033, -2.1074209213256836, -1.6736119985580444, -1.2398030757904053, -0.8059941530227661, -0.37218523025512695, 0.061623573303222656, 0.49543261528015137, 0.9292416572570801, 1.363051414489746, 1.7968603372573853, 2.2306692600250244, 2.664478302001953, 3.0982871055603027, 3.5320959091186523, 3.965904951095581, 4.39971399307251, 4.833522796630859, 5.267331600189209, 5.701140403747559, 6.134949684143066, 6.568758487701416, 7.002567291259766, 7.436376571655273, 7.870185375213623, 8.303994178771973, 8.73780345916748, 9.171611785888672, 9.60542106628418, 10.039230346679688, 10.473038673400879, 10.906847953796387, 11.340656280517578, 11.774465560913086, 12.208274841308594, 12.642083168029785, 13.075892448425293, 13.509700775146484, 13.943510055541992, 14.3773193359375, 14.811128616333008, 15.2449369430542]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 9.0, 5.0, 2.0, 9.0, 15.0, 16.0, 17.0, 27.0, 40.0, 53.0, 62.0, 120.0, 233.0, 555.0, 1343.0, 5495.0, 52407.0, 611332.0, 347556.0, 23936.0, 3339.0, 1019.0, 448.0, 178.0, 103.0, 57.0, 46.0, 29.0, 17.0, 20.0, 9.0, 8.0, 7.0, 8.0, 8.0, 3.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.53424072265625, -4.3653564453125, -4.19647216796875, -4.027587890625, -3.85870361328125, -3.6898193359375, -3.52093505859375, -3.35205078125, -3.18316650390625, -3.0142822265625, -2.84539794921875, -2.676513671875, -2.50762939453125, -2.3387451171875, -2.16986083984375, -2.0009765625, -1.83209228515625, -1.6632080078125, -1.49432373046875, -1.325439453125, -1.15655517578125, -0.9876708984375, -0.81878662109375, -0.64990234375, -0.48101806640625, -0.3121337890625, -0.14324951171875, 0.025634765625, 0.19451904296875, 0.3634033203125, 0.53228759765625, 0.701171875, 0.87005615234375, 1.0389404296875, 1.20782470703125, 1.376708984375, 1.54559326171875, 1.7144775390625, 1.88336181640625, 2.05224609375, 2.22113037109375, 2.3900146484375, 2.55889892578125, 2.727783203125, 2.89666748046875, 3.0655517578125, 3.23443603515625, 3.4033203125, 3.57220458984375, 3.7410888671875, 3.90997314453125, 4.078857421875, 4.24774169921875, 4.4166259765625, 4.58551025390625, 4.75439453125, 4.92327880859375, 5.0921630859375, 5.26104736328125, 5.429931640625, 5.59881591796875, 5.7677001953125, 5.93658447265625, 6.10546875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 16.0, 24.0, 30.0, 33.0, 45.0, 45.0, 68.0, 71.0, 81.0, 86.0, 81.0, 79.0, 61.0, 51.0, 48.0, 48.0, 33.0, 25.0, 14.0, 16.0, 11.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41552734375, -0.404205322265625, -0.39288330078125, -0.381561279296875, -0.3702392578125, -0.358917236328125, -0.34759521484375, -0.336273193359375, -0.324951171875, -0.313629150390625, -0.30230712890625, -0.290985107421875, -0.2796630859375, -0.268341064453125, -0.25701904296875, -0.245697021484375, -0.234375, -0.223052978515625, -0.21173095703125, -0.200408935546875, -0.1890869140625, -0.177764892578125, -0.16644287109375, -0.155120849609375, -0.143798828125, -0.132476806640625, -0.12115478515625, -0.109832763671875, -0.0985107421875, -0.087188720703125, -0.07586669921875, -0.064544677734375, -0.05322265625, -0.041900634765625, -0.03057861328125, -0.019256591796875, -0.0079345703125, 0.003387451171875, 0.01470947265625, 0.026031494140625, 0.037353515625, 0.048675537109375, 0.05999755859375, 0.071319580078125, 0.0826416015625, 0.093963623046875, 0.10528564453125, 0.116607666015625, 0.1279296875, 0.139251708984375, 0.15057373046875, 0.161895751953125, 0.1732177734375, 0.184539794921875, 0.19586181640625, 0.207183837890625, 0.218505859375, 0.229827880859375, 0.24114990234375, 0.252471923828125, 0.2637939453125, 0.275115966796875, 0.28643798828125, 0.297760009765625, 0.30908203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 15.0, 18.0, 25.0, 35.0, 46.0, 73.0, 82.0, 166.0, 201.0, 313.0, 523.0, 822.0, 1582.0, 3747.0, 11602.0, 47103.0, 195655.0, 440874.0, 256103.0, 64525.0, 15642.0, 4794.0, 1868.0, 1015.0, 600.0, 366.0, 227.0, 174.0, 97.0, 84.0, 42.0, 28.0, 25.0, 18.0, 12.0, 10.0, 6.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7978515625, -1.7303009033203125, -1.662750244140625, -1.5951995849609375, -1.52764892578125, -1.4600982666015625, -1.392547607421875, -1.3249969482421875, -1.2574462890625, -1.1898956298828125, -1.122344970703125, -1.0547943115234375, -0.98724365234375, -0.9196929931640625, -0.852142333984375, -0.7845916748046875, -0.717041015625, -0.6494903564453125, -0.581939697265625, -0.5143890380859375, -0.44683837890625, -0.3792877197265625, -0.311737060546875, -0.2441864013671875, -0.1766357421875, -0.1090850830078125, -0.041534423828125, 0.0260162353515625, 0.09356689453125, 0.1611175537109375, 0.228668212890625, 0.2962188720703125, 0.36376953125, 0.4313201904296875, 0.498870849609375, 0.5664215087890625, 0.63397216796875, 0.7015228271484375, 0.769073486328125, 0.8366241455078125, 0.9041748046875, 0.9717254638671875, 1.039276123046875, 1.1068267822265625, 1.17437744140625, 1.2419281005859375, 1.309478759765625, 1.3770294189453125, 1.444580078125, 1.5121307373046875, 1.579681396484375, 1.6472320556640625, 1.71478271484375, 1.7823333740234375, 1.849884033203125, 1.9174346923828125, 1.9849853515625, 2.0525360107421875, 2.120086669921875, 2.1876373291015625, 2.25518798828125, 2.3227386474609375, 2.390289306640625, 2.4578399658203125, 2.525390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 7.0, 7.0, 10.0, 12.0, 17.0, 18.0, 24.0, 30.0, 31.0, 27.0, 33.0, 34.0, 39.0, 39.0, 44.0, 45.0, 50.0, 45.0, 35.0, 44.0, 52.0, 41.0, 40.0, 33.0, 46.0, 30.0, 23.0, 24.0, 23.0, 12.0, 11.0, 12.0, 10.0, 4.0, 5.0, 4.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0032958984375, -0.970458984375, -0.9376220703125, -0.90478515625, -0.8719482421875, -0.839111328125, -0.8062744140625, -0.7734375, -0.7406005859375, -0.707763671875, -0.6749267578125, -0.64208984375, -0.6092529296875, -0.576416015625, -0.5435791015625, -0.5107421875, -0.4779052734375, -0.445068359375, -0.4122314453125, -0.37939453125, -0.3465576171875, -0.313720703125, -0.2808837890625, -0.248046875, -0.2152099609375, -0.182373046875, -0.1495361328125, -0.11669921875, -0.0838623046875, -0.051025390625, -0.0181884765625, 0.0146484375, 0.0474853515625, 0.080322265625, 0.1131591796875, 0.14599609375, 0.1788330078125, 0.211669921875, 0.2445068359375, 0.27734375, 0.3101806640625, 0.343017578125, 0.3758544921875, 0.40869140625, 0.4415283203125, 0.474365234375, 0.5072021484375, 0.5400390625, 0.5728759765625, 0.605712890625, 0.6385498046875, 0.67138671875, 0.7042236328125, 0.737060546875, 0.7698974609375, 0.802734375, 0.8355712890625, 0.868408203125, 0.9012451171875, 0.93408203125, 0.9669189453125, 0.999755859375, 1.0325927734375, 1.0654296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 15.0, 21.0, 29.0, 52.0, 82.0, 107.0, 160.0, 309.0, 576.0, 1321.0, 3083.0, 9398.0, 36609.0, 220565.0, 582758.0, 153678.0, 27491.0, 7217.0, 2544.0, 1142.0, 528.0, 311.0, 164.0, 109.0, 85.0, 54.0, 36.0, 27.0, 16.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7534027099609375, -1.689422607421875, -1.6254425048828125, -1.56146240234375, -1.4974822998046875, -1.433502197265625, -1.3695220947265625, -1.3055419921875, -1.2415618896484375, -1.177581787109375, -1.1136016845703125, -1.04962158203125, -0.9856414794921875, -0.921661376953125, -0.8576812744140625, -0.793701171875, -0.7297210693359375, -0.665740966796875, -0.6017608642578125, -0.53778076171875, -0.4738006591796875, -0.409820556640625, -0.3458404541015625, -0.2818603515625, -0.2178802490234375, -0.153900146484375, -0.0899200439453125, -0.02593994140625, 0.0380401611328125, 0.102020263671875, 0.1660003662109375, 0.22998046875, 0.2939605712890625, 0.357940673828125, 0.4219207763671875, 0.48590087890625, 0.5498809814453125, 0.613861083984375, 0.6778411865234375, 0.7418212890625, 0.8058013916015625, 0.869781494140625, 0.9337615966796875, 0.99774169921875, 1.0617218017578125, 1.125701904296875, 1.1896820068359375, 1.253662109375, 1.3176422119140625, 1.381622314453125, 1.4456024169921875, 1.50958251953125, 1.5735626220703125, 1.637542724609375, 1.7015228271484375, 1.7655029296875, 1.8294830322265625, 1.893463134765625, 1.9574432373046875, 2.02142333984375, 2.0854034423828125, 2.149383544921875, 2.2133636474609375, 2.27734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 11.0, 9.0, 10.0, 18.0, 17.0, 19.0, 27.0, 32.0, 35.0, 48.0, 55.0, 76.0, 61.0, 69.0, 68.0, 74.0, 53.0, 56.0, 50.0, 44.0, 33.0, 27.0, 27.0, 14.0, 17.0, 17.0, 5.0, 9.0, 4.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019943714141845703, -0.00019270740449428558, -0.00018597766757011414, -0.0001792479306459427, -0.00017251819372177124, -0.0001657884567975998, -0.00015905871987342834, -0.0001523289829492569, -0.00014559924602508545, -0.000138869509100914, -0.00013213977217674255, -0.0001254100352525711, -0.00011868029832839966, -0.00011195056140422821, -0.00010522082448005676, -9.849108755588531e-05, -9.176135063171387e-05, -8.503161370754242e-05, -7.830187678337097e-05, -7.157213985919952e-05, -6.484240293502808e-05, -5.811266601085663e-05, -5.138292908668518e-05, -4.465319216251373e-05, -3.7923455238342285e-05, -3.119371831417084e-05, -2.446398138999939e-05, -1.7734244465827942e-05, -1.1004507541656494e-05, -4.274770617485046e-06, 2.4549663066864014e-06, 9.184703230857849e-06, 1.5914440155029297e-05, 2.2644177079200745e-05, 2.9373914003372192e-05, 3.610365092754364e-05, 4.283338785171509e-05, 4.9563124775886536e-05, 5.6292861700057983e-05, 6.302259862422943e-05, 6.975233554840088e-05, 7.648207247257233e-05, 8.321180939674377e-05, 8.994154632091522e-05, 9.667128324508667e-05, 0.00010340102016925812, 0.00011013075709342957, 0.00011686049401760101, 0.00012359023094177246, 0.0001303199678659439, 0.00013704970479011536, 0.0001437794417142868, 0.00015050917863845825, 0.0001572389155626297, 0.00016396865248680115, 0.0001706983894109726, 0.00017742812633514404, 0.0001841578632593155, 0.00019088760018348694, 0.00019761733710765839, 0.00020434707403182983, 0.00021107681095600128, 0.00021780654788017273, 0.00022453628480434418, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 16.0, 24.0, 38.0, 73.0, 135.0, 218.0, 478.0, 1184.0, 3787.0, 20397.0, 240860.0, 688856.0, 78732.0, 9704.0, 2340.0, 850.0, 397.0, 192.0, 109.0, 44.0, 37.0, 21.0, 16.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.806793212890625, -2.71710205078125, -2.627410888671875, -2.5377197265625, -2.448028564453125, -2.35833740234375, -2.268646240234375, -2.178955078125, -2.089263916015625, -1.99957275390625, -1.909881591796875, -1.8201904296875, -1.730499267578125, -1.64080810546875, -1.551116943359375, -1.46142578125, -1.371734619140625, -1.28204345703125, -1.192352294921875, -1.1026611328125, -1.012969970703125, -0.92327880859375, -0.833587646484375, -0.743896484375, -0.654205322265625, -0.56451416015625, -0.474822998046875, -0.3851318359375, -0.295440673828125, -0.20574951171875, -0.116058349609375, -0.0263671875, 0.063323974609375, 0.15301513671875, 0.242706298828125, 0.3323974609375, 0.422088623046875, 0.51177978515625, 0.601470947265625, 0.691162109375, 0.780853271484375, 0.87054443359375, 0.960235595703125, 1.0499267578125, 1.139617919921875, 1.22930908203125, 1.319000244140625, 1.40869140625, 1.498382568359375, 1.58807373046875, 1.677764892578125, 1.7674560546875, 1.857147216796875, 1.94683837890625, 2.036529541015625, 2.126220703125, 2.215911865234375, 2.30560302734375, 2.395294189453125, 2.4849853515625, 2.574676513671875, 2.66436767578125, 2.754058837890625, 2.84375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 11.0, 15.0, 22.0, 18.0, 33.0, 45.0, 58.0, 71.0, 77.0, 78.0, 87.0, 87.0, 80.0, 70.0, 61.0, 43.0, 39.0, 14.0, 21.0, 20.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.7998809814453125, -0.768707275390625, -0.7375335693359375, -0.70635986328125, -0.6751861572265625, -0.644012451171875, -0.6128387451171875, -0.5816650390625, -0.5504913330078125, -0.519317626953125, -0.4881439208984375, -0.45697021484375, -0.4257965087890625, -0.394622802734375, -0.3634490966796875, -0.332275390625, -0.3011016845703125, -0.269927978515625, -0.2387542724609375, -0.20758056640625, -0.1764068603515625, -0.145233154296875, -0.1140594482421875, -0.0828857421875, -0.0517120361328125, -0.020538330078125, 0.0106353759765625, 0.04180908203125, 0.0729827880859375, 0.104156494140625, 0.1353302001953125, 0.16650390625, 0.1976776123046875, 0.228851318359375, 0.2600250244140625, 0.29119873046875, 0.3223724365234375, 0.353546142578125, 0.3847198486328125, 0.4158935546875, 0.4470672607421875, 0.478240966796875, 0.5094146728515625, 0.54058837890625, 0.5717620849609375, 0.602935791015625, 0.6341094970703125, 0.665283203125, 0.6964569091796875, 0.727630615234375, 0.7588043212890625, 0.78997802734375, 0.8211517333984375, 0.852325439453125, 0.8834991455078125, 0.9146728515625, 0.9458465576171875, 0.977020263671875, 1.0081939697265625, 1.03936767578125, 1.0705413818359375, 1.101715087890625, 1.1328887939453125, 1.1640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 10.0, 24.0, 107.0, 218.0, 318.0, 208.0, 79.0, 26.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.307259559631348, -11.382889747619629, -10.458520889282227, -9.534151077270508, -8.609781265258789, -7.68541145324707, -6.76104211807251, -5.836672782897949, -4.9123029708862305, -3.987933397293091, -3.063563823699951, -2.1391942501068115, -1.2148246765136719, -0.2904548645019531, 0.6339144706726074, 1.558283805847168, 2.4826536178588867, 3.4070231914520264, 4.331392765045166, 5.255762100219727, 6.180131912231445, 7.104501724243164, 8.028871536254883, 8.953240394592285, 9.877610206604004, 10.801980018615723, 11.726348876953125, 12.650718688964844, 13.575088500976562, 14.499458312988281, 15.423828125, 16.34819793701172, 17.272567749023438, 18.196937561035156, 19.121307373046875, 20.045677185058594, 20.970046997070312, 21.89441680908203, 22.818784713745117, 23.743154525756836, 24.667524337768555, 25.591894149780273, 26.516263961791992, 27.44063377380371, 28.365001678466797, 29.289371490478516, 30.213741302490234, 31.138111114501953, 32.06248092651367, 32.98685073852539, 33.91122055053711, 34.83559036254883, 35.75996017456055, 36.684329986572266, 37.608699798583984, 38.53306579589844, 39.457435607910156, 40.381805419921875, 41.306175231933594, 42.23054504394531, 43.15491485595703, 44.07928466796875, 45.00365447998047, 45.92802429199219, 46.852394104003906]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 6.0, 11.0, 16.0, 19.0, 19.0, 19.0, 37.0, 34.0, 42.0, 38.0, 38.0, 44.0, 46.0, 52.0, 48.0, 38.0, 54.0, 41.0, 42.0, 35.0, 46.0, 36.0, 31.0, 22.0, 29.0, 30.0, 26.0, 10.0, 8.0, 9.0, 8.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.671116352081299, -7.450446128845215, -7.229775905609131, -7.009105682373047, -6.788434982299805, -6.567764759063721, -6.347094535827637, -6.126424312591553, -5.905754089355469, -5.685083866119385, -5.464413642883301, -5.243742942810059, -5.023072719573975, -4.802402496337891, -4.581732273101807, -4.361062049865723, -4.1403913497924805, -3.9197211265563965, -3.6990506649017334, -3.4783804416656494, -3.2577099800109863, -3.0370397567749023, -2.8163695335388184, -2.5956993103027344, -2.3750288486480713, -2.1543586254119873, -1.9336881637573242, -1.7130179405212402, -1.4923475980758667, -1.2716772556304932, -1.0510070323944092, -0.8303366899490356, -0.6096658706665039, -0.38899555802345276, -0.1683252453804016, 0.05234503746032715, 0.2730153799057007, 0.4936857223510742, 0.7143559455871582, 0.9350262880325317, 1.1556966304779053, 1.3763669729232788, 1.5970373153686523, 1.8177075386047363, 2.0383777618408203, 2.2590482234954834, 2.4797184467315674, 2.7003889083862305, 2.9210591316223145, 3.1417293548583984, 3.3623998165130615, 3.5830700397491455, 3.8037405014038086, 4.024410724639893, 4.245080947875977, 4.4657511711120605, 4.6864213943481445, 4.9070916175842285, 5.1277618408203125, 5.348432540893555, 5.569102764129639, 5.789772987365723, 6.010443210601807, 6.231113433837891, 6.451784133911133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 10.0, 3.0, 8.0, 15.0, 15.0, 13.0, 25.0, 28.0, 39.0, 49.0, 94.0, 127.0, 242.0, 510.0, 1122.0, 3793.0, 19237.0, 296440.0, 3790170.0, 70435.0, 8806.0, 1928.0, 637.0, 253.0, 101.0, 52.0, 34.0, 16.0, 12.0, 7.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.06597900390625, -5.8780517578125, -5.69012451171875, -5.502197265625, -5.31427001953125, -5.1263427734375, -4.93841552734375, -4.75048828125, -4.56256103515625, -4.3746337890625, -4.18670654296875, -3.998779296875, -3.81085205078125, -3.6229248046875, -3.43499755859375, -3.2470703125, -3.05914306640625, -2.8712158203125, -2.68328857421875, -2.495361328125, -2.30743408203125, -2.1195068359375, -1.93157958984375, -1.74365234375, -1.55572509765625, -1.3677978515625, -1.17987060546875, -0.991943359375, -0.80401611328125, -0.6160888671875, -0.42816162109375, -0.240234375, -0.05230712890625, 0.1356201171875, 0.32354736328125, 0.511474609375, 0.69940185546875, 0.8873291015625, 1.07525634765625, 1.26318359375, 1.45111083984375, 1.6390380859375, 1.82696533203125, 2.014892578125, 2.20281982421875, 2.3907470703125, 2.57867431640625, 2.7666015625, 2.95452880859375, 3.1424560546875, 3.33038330078125, 3.518310546875, 3.70623779296875, 3.8941650390625, 4.08209228515625, 4.27001953125, 4.45794677734375, 4.6458740234375, 4.83380126953125, 5.021728515625, 5.20965576171875, 5.3975830078125, 5.58551025390625, 5.7734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 19.0, 16.0, 18.0, 47.0, 23.0, 41.0, 49.0, 81.0, 79.0, 75.0, 98.0, 76.0, 83.0, 51.0, 51.0, 34.0, 29.0, 25.0, 28.0, 19.0, 13.0, 11.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4599609375, -0.44878387451171875, -0.4376068115234375, -0.42642974853515625, -0.415252685546875, -0.40407562255859375, -0.3928985595703125, -0.38172149658203125, -0.37054443359375, -0.35936737060546875, -0.3481903076171875, -0.33701324462890625, -0.325836181640625, -0.31465911865234375, -0.3034820556640625, -0.29230499267578125, -0.2811279296875, -0.26995086669921875, -0.2587738037109375, -0.24759674072265625, -0.236419677734375, -0.22524261474609375, -0.2140655517578125, -0.20288848876953125, -0.19171142578125, -0.18053436279296875, -0.1693572998046875, -0.15818023681640625, -0.147003173828125, -0.13582611083984375, -0.1246490478515625, -0.11347198486328125, -0.102294921875, -0.09111785888671875, -0.0799407958984375, -0.06876373291015625, -0.057586669921875, -0.04640960693359375, -0.0352325439453125, -0.02405548095703125, -0.01287841796875, -0.00170135498046875, 0.0094757080078125, 0.02065277099609375, 0.031829833984375, 0.04300689697265625, 0.0541839599609375, 0.06536102294921875, 0.0765380859375, 0.08771514892578125, 0.0988922119140625, 0.11006927490234375, 0.121246337890625, 0.13242340087890625, 0.1436004638671875, 0.15477752685546875, 0.16595458984375, 0.17713165283203125, 0.1883087158203125, 0.19948577880859375, 0.210662841796875, 0.22183990478515625, 0.2330169677734375, 0.24419403076171875, 0.25537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 12.0, 14.0, 31.0, 53.0, 112.0, 229.0, 876.0, 28119.0, 4160066.0, 4183.0, 365.0, 102.0, 59.0, 35.0, 12.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.2078857421875, -27.525146484375, -26.8424072265625, -26.15966796875, -25.4769287109375, -24.794189453125, -24.1114501953125, -23.4287109375, -22.7459716796875, -22.063232421875, -21.3804931640625, -20.69775390625, -20.0150146484375, -19.332275390625, -18.6495361328125, -17.966796875, -17.2840576171875, -16.601318359375, -15.9185791015625, -15.23583984375, -14.5531005859375, -13.870361328125, -13.1876220703125, -12.5048828125, -11.8221435546875, -11.139404296875, -10.4566650390625, -9.77392578125, -9.0911865234375, -8.408447265625, -7.7257080078125, -7.04296875, -6.3602294921875, -5.677490234375, -4.9947509765625, -4.31201171875, -3.6292724609375, -2.946533203125, -2.2637939453125, -1.5810546875, -0.8983154296875, -0.215576171875, 0.4671630859375, 1.14990234375, 1.8326416015625, 2.515380859375, 3.1981201171875, 3.880859375, 4.5635986328125, 5.246337890625, 5.9290771484375, 6.61181640625, 7.2945556640625, 7.977294921875, 8.6600341796875, 9.3427734375, 10.0255126953125, 10.708251953125, 11.3909912109375, 12.07373046875, 12.7564697265625, 13.439208984375, 14.1219482421875, 14.8046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 24.0, 63.0, 183.0, 856.0, 2329.0, 412.0, 116.0, 39.0, 20.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.0078125, -2.9491729736328125, -2.890533447265625, -2.8318939208984375, -2.77325439453125, -2.7146148681640625, -2.655975341796875, -2.5973358154296875, -2.5386962890625, -2.4800567626953125, -2.421417236328125, -2.3627777099609375, -2.30413818359375, -2.2454986572265625, -2.186859130859375, -2.1282196044921875, -2.069580078125, -2.0109405517578125, -1.952301025390625, -1.8936614990234375, -1.83502197265625, -1.7763824462890625, -1.717742919921875, -1.6591033935546875, -1.6004638671875, -1.5418243408203125, -1.483184814453125, -1.4245452880859375, -1.36590576171875, -1.3072662353515625, -1.248626708984375, -1.1899871826171875, -1.13134765625, -1.0727081298828125, -1.014068603515625, -0.9554290771484375, -0.89678955078125, -0.8381500244140625, -0.779510498046875, -0.7208709716796875, -0.6622314453125, -0.6035919189453125, -0.544952392578125, -0.4863128662109375, -0.42767333984375, -0.3690338134765625, -0.310394287109375, -0.2517547607421875, -0.193115234375, -0.1344757080078125, -0.075836181640625, -0.0171966552734375, 0.04144287109375, 0.1000823974609375, 0.158721923828125, 0.2173614501953125, 0.2760009765625, 0.3346405029296875, 0.393280029296875, 0.4519195556640625, 0.51055908203125, 0.5691986083984375, 0.627838134765625, 0.6864776611328125, 0.7451171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 23.0, 64.0, 568.0, 318.0, 32.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.848087310791016, -42.86951446533203, -41.89094543457031, -40.91237258911133, -39.93380355834961, -38.955230712890625, -37.976661682128906, -36.99808883666992, -36.01951599121094, -35.04094314575195, -34.062374114990234, -33.08380126953125, -32.10523223876953, -31.126659393310547, -30.148088455200195, -29.169517517089844, -28.190948486328125, -27.212377548217773, -26.233806610107422, -25.255233764648438, -24.276662826538086, -23.298091888427734, -22.319520950317383, -21.34095001220703, -20.362377166748047, -19.383806228637695, -18.405235290527344, -17.42666244506836, -16.448091506958008, -15.469520568847656, -14.490949630737305, -13.512378692626953, -12.533807754516602, -11.55523681640625, -10.576664924621582, -9.59809398651123, -8.619523048400879, -7.640951633453369, -6.662380218505859, -5.683809280395508, -4.705237865447998, -3.7266666889190674, -2.7480955123901367, -1.769524097442627, -0.7909529209136963, 0.18761825561523438, 1.1661896705627441, 2.1447606086730957, 3.1233320236206055, 4.101903438568115, 5.080474376678467, 6.059045791625977, 7.037616729736328, 8.01618766784668, 8.994759559631348, 9.9733304977417, 10.951902389526367, 11.930473327636719, 12.909045219421387, 13.887616157531738, 14.86618709564209, 15.844758987426758, 16.82332992553711, 17.80190086364746, 18.780471801757812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 10.0, 5.0, 8.0, 18.0, 17.0, 34.0, 34.0, 62.0, 77.0, 63.0, 74.0, 86.0, 81.0, 73.0, 81.0, 68.0, 56.0, 57.0, 47.0, 21.0, 10.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.372196197509766, -6.1926469802856445, -6.013097286224365, -5.833547592163086, -5.653998374938965, -5.474449157714844, -5.2948994636535645, -5.115349769592285, -4.935800552368164, -4.756251335144043, -4.576701641082764, -4.397151947021484, -4.217602729797363, -4.038053512573242, -3.858503818511963, -3.6789543628692627, -3.4994049072265625, -3.3198554515838623, -3.140305995941162, -2.960756540298462, -2.7812070846557617, -2.6016576290130615, -2.4221081733703613, -2.242558717727661, -2.063009262084961, -1.8834598064422607, -1.7039103507995605, -1.5243608951568604, -1.3448114395141602, -1.16526198387146, -0.9857125282287598, -0.8061630725860596, -0.6266131401062012, -0.447063684463501, -0.2675142288208008, -0.08796477317810059, 0.09158468246459961, 0.2711341381072998, 0.45068359375, 0.6302330493927002, 0.8097825050354004, 0.9893319606781006, 1.1688814163208008, 1.348430871963501, 1.5279803276062012, 1.7075297832489014, 1.8870792388916016, 2.0666286945343018, 2.246178150177002, 2.425727605819702, 2.6052770614624023, 2.7848265171051025, 2.9643759727478027, 3.143925428390503, 3.323474884033203, 3.5030243396759033, 3.6825737953186035, 3.8621232509613037, 4.041672706604004, 4.221221923828125, 4.400771617889404, 4.580321311950684, 4.759870529174805, 4.939419746398926, 5.118969440460205]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 9.0, 18.0, 18.0, 25.0, 33.0, 41.0, 59.0, 115.0, 182.0, 364.0, 856.0, 2969.0, 17148.0, 203980.0, 708904.0, 100276.0, 10002.0, 2069.0, 706.0, 299.0, 164.0, 103.0, 62.0, 39.0, 19.0, 19.0, 11.0, 10.0, 5.0, 8.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.63671875, -5.4935302734375, -5.350341796875, -5.2071533203125, -5.06396484375, -4.9207763671875, -4.777587890625, -4.6343994140625, -4.4912109375, -4.3480224609375, -4.204833984375, -4.0616455078125, -3.91845703125, -3.7752685546875, -3.632080078125, -3.4888916015625, -3.345703125, -3.2025146484375, -3.059326171875, -2.9161376953125, -2.77294921875, -2.6297607421875, -2.486572265625, -2.3433837890625, -2.2001953125, -2.0570068359375, -1.913818359375, -1.7706298828125, -1.62744140625, -1.4842529296875, -1.341064453125, -1.1978759765625, -1.0546875, -0.9114990234375, -0.768310546875, -0.6251220703125, -0.48193359375, -0.3387451171875, -0.195556640625, -0.0523681640625, 0.0908203125, 0.2340087890625, 0.377197265625, 0.5203857421875, 0.66357421875, 0.8067626953125, 0.949951171875, 1.0931396484375, 1.236328125, 1.3795166015625, 1.522705078125, 1.6658935546875, 1.80908203125, 1.9522705078125, 2.095458984375, 2.2386474609375, 2.3818359375, 2.5250244140625, 2.668212890625, 2.8114013671875, 2.95458984375, 3.0977783203125, 3.240966796875, 3.3841552734375, 3.52734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 10.0, 9.0, 13.0, 19.0, 23.0, 36.0, 34.0, 60.0, 63.0, 90.0, 69.0, 85.0, 89.0, 68.0, 77.0, 64.0, 37.0, 40.0, 38.0, 31.0, 10.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.53955078125, -0.5252456665039062, -0.5109405517578125, -0.49663543701171875, -0.482330322265625, -0.46802520751953125, -0.4537200927734375, -0.43941497802734375, -0.42510986328125, -0.41080474853515625, -0.3964996337890625, -0.38219451904296875, -0.367889404296875, -0.35358428955078125, -0.3392791748046875, -0.32497406005859375, -0.3106689453125, -0.29636383056640625, -0.2820587158203125, -0.26775360107421875, -0.253448486328125, -0.23914337158203125, -0.2248382568359375, -0.21053314208984375, -0.19622802734375, -0.18192291259765625, -0.1676177978515625, -0.15331268310546875, -0.139007568359375, -0.12470245361328125, -0.1103973388671875, -0.09609222412109375, -0.081787109375, -0.06748199462890625, -0.0531768798828125, -0.03887176513671875, -0.024566650390625, -0.01026153564453125, 0.0040435791015625, 0.01834869384765625, 0.03265380859375, 0.04695892333984375, 0.0612640380859375, 0.07556915283203125, 0.089874267578125, 0.10417938232421875, 0.1184844970703125, 0.13278961181640625, 0.1470947265625, 0.16139984130859375, 0.1757049560546875, 0.19001007080078125, 0.204315185546875, 0.21862030029296875, 0.2329254150390625, 0.24723052978515625, 0.26153564453125, 0.27584075927734375, 0.2901458740234375, 0.30445098876953125, 0.318756103515625, 0.33306121826171875, 0.3473663330078125, 0.36167144775390625, 0.3759765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 10.0, 21.0, 20.0, 28.0, 37.0, 56.0, 74.0, 113.0, 145.0, 179.0, 305.0, 434.0, 730.0, 1274.0, 2426.0, 5536.0, 15307.0, 52112.0, 186801.0, 403862.0, 262675.0, 79392.0, 22339.0, 7479.0, 3124.0, 1549.0, 857.0, 491.0, 347.0, 236.0, 139.0, 132.0, 72.0, 64.0, 47.0, 30.0, 22.0, 17.0, 15.0, 10.0, 15.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.828948974609375, -1.77117919921875, -1.713409423828125, -1.6556396484375, -1.597869873046875, -1.54010009765625, -1.482330322265625, -1.424560546875, -1.366790771484375, -1.30902099609375, -1.251251220703125, -1.1934814453125, -1.135711669921875, -1.07794189453125, -1.020172119140625, -0.96240234375, -0.904632568359375, -0.84686279296875, -0.789093017578125, -0.7313232421875, -0.673553466796875, -0.61578369140625, -0.558013916015625, -0.500244140625, -0.442474365234375, -0.38470458984375, -0.326934814453125, -0.2691650390625, -0.211395263671875, -0.15362548828125, -0.095855712890625, -0.0380859375, 0.019683837890625, 0.07745361328125, 0.135223388671875, 0.1929931640625, 0.250762939453125, 0.30853271484375, 0.366302490234375, 0.424072265625, 0.481842041015625, 0.53961181640625, 0.597381591796875, 0.6551513671875, 0.712921142578125, 0.77069091796875, 0.828460693359375, 0.88623046875, 0.944000244140625, 1.00177001953125, 1.059539794921875, 1.1173095703125, 1.175079345703125, 1.23284912109375, 1.290618896484375, 1.348388671875, 1.406158447265625, 1.46392822265625, 1.521697998046875, 1.5794677734375, 1.637237548828125, 1.69500732421875, 1.752777099609375, 1.810546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 16.0, 9.0, 10.0, 13.0, 12.0, 18.0, 18.0, 24.0, 13.0, 25.0, 37.0, 33.0, 31.0, 42.0, 39.0, 39.0, 44.0, 30.0, 50.0, 36.0, 39.0, 33.0, 40.0, 44.0, 30.0, 34.0, 31.0, 23.0, 21.0, 26.0, 19.0, 14.0, 13.0, 13.0, 11.0, 8.0, 5.0, 8.0, 10.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.984375, -0.949249267578125, -0.91412353515625, -0.878997802734375, -0.8438720703125, -0.808746337890625, -0.77362060546875, -0.738494873046875, -0.703369140625, -0.668243408203125, -0.63311767578125, -0.597991943359375, -0.5628662109375, -0.527740478515625, -0.49261474609375, -0.457489013671875, -0.42236328125, -0.387237548828125, -0.35211181640625, -0.316986083984375, -0.2818603515625, -0.246734619140625, -0.21160888671875, -0.176483154296875, -0.141357421875, -0.106231689453125, -0.07110595703125, -0.035980224609375, -0.0008544921875, 0.034271240234375, 0.06939697265625, 0.104522705078125, 0.1396484375, 0.174774169921875, 0.20989990234375, 0.245025634765625, 0.2801513671875, 0.315277099609375, 0.35040283203125, 0.385528564453125, 0.420654296875, 0.455780029296875, 0.49090576171875, 0.526031494140625, 0.5611572265625, 0.596282958984375, 0.63140869140625, 0.666534423828125, 0.70166015625, 0.736785888671875, 0.77191162109375, 0.807037353515625, 0.8421630859375, 0.877288818359375, 0.91241455078125, 0.947540283203125, 0.982666015625, 1.017791748046875, 1.05291748046875, 1.088043212890625, 1.1231689453125, 1.158294677734375, 1.19342041015625, 1.228546142578125, 1.263671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 12.0, 16.0, 23.0, 43.0, 61.0, 99.0, 168.0, 319.0, 644.0, 1464.0, 3880.0, 13165.0, 64097.0, 358201.0, 477047.0, 101658.0, 19122.0, 5088.0, 1745.0, 778.0, 381.0, 219.0, 103.0, 88.0, 42.0, 23.0, 21.0, 15.0, 13.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2764892578125, -1.232666015625, -1.1888427734375, -1.14501953125, -1.1011962890625, -1.057373046875, -1.0135498046875, -0.9697265625, -0.9259033203125, -0.882080078125, -0.8382568359375, -0.79443359375, -0.7506103515625, -0.706787109375, -0.6629638671875, -0.619140625, -0.5753173828125, -0.531494140625, -0.4876708984375, -0.44384765625, -0.4000244140625, -0.356201171875, -0.3123779296875, -0.2685546875, -0.2247314453125, -0.180908203125, -0.1370849609375, -0.09326171875, -0.0494384765625, -0.005615234375, 0.0382080078125, 0.08203125, 0.1258544921875, 0.169677734375, 0.2135009765625, 0.25732421875, 0.3011474609375, 0.344970703125, 0.3887939453125, 0.4326171875, 0.4764404296875, 0.520263671875, 0.5640869140625, 0.60791015625, 0.6517333984375, 0.695556640625, 0.7393798828125, 0.783203125, 0.8270263671875, 0.870849609375, 0.9146728515625, 0.95849609375, 1.0023193359375, 1.046142578125, 1.0899658203125, 1.1337890625, 1.1776123046875, 1.221435546875, 1.2652587890625, 1.30908203125, 1.3529052734375, 1.396728515625, 1.4405517578125, 1.484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 13.0, 7.0, 23.0, 20.0, 21.0, 27.0, 37.0, 37.0, 56.0, 53.0, 60.0, 66.0, 83.0, 69.0, 54.0, 52.0, 47.0, 46.0, 37.0, 27.0, 18.0, 18.0, 18.0, 18.0, 11.0, 12.0, 4.0, 10.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013363361358642578, -0.0001293141394853592, -0.0001249946653842926, -0.00012067519128322601, -0.00011635571718215942, -0.00011203624308109283, -0.00010771676898002625, -0.00010339729487895966, -9.907782077789307e-05, -9.475834667682648e-05, -9.043887257575989e-05, -8.61193984746933e-05, -8.179992437362671e-05, -7.748045027256012e-05, -7.316097617149353e-05, -6.884150207042694e-05, -6.452202796936035e-05, -6.020255386829376e-05, -5.588307976722717e-05, -5.1563605666160583e-05, -4.7244131565093994e-05, -4.2924657464027405e-05, -3.8605183362960815e-05, -3.4285709261894226e-05, -2.9966235160827637e-05, -2.5646761059761047e-05, -2.1327286958694458e-05, -1.700781285762787e-05, -1.268833875656128e-05, -8.36886465549469e-06, -4.049390554428101e-06, 2.7008354663848877e-07, 4.589557647705078e-06, 8.909031748771667e-06, 1.3228505849838257e-05, 1.7547979950904846e-05, 2.1867454051971436e-05, 2.6186928153038025e-05, 3.0506402254104614e-05, 3.4825876355171204e-05, 3.914535045623779e-05, 4.346482455730438e-05, 4.778429865837097e-05, 5.210377275943756e-05, 5.642324686050415e-05, 6.074272096157074e-05, 6.506219506263733e-05, 6.938166916370392e-05, 7.370114326477051e-05, 7.80206173658371e-05, 8.234009146690369e-05, 8.665956556797028e-05, 9.097903966903687e-05, 9.529851377010345e-05, 9.961798787117004e-05, 0.00010393746197223663, 0.00010825693607330322, 0.00011257641017436981, 0.0001168958842754364, 0.00012121535837650299, 0.00012553483247756958, 0.00012985430657863617, 0.00013417378067970276, 0.00013849325478076935, 0.00014281272888183594]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 10.0, 4.0, 16.0, 23.0, 21.0, 30.0, 41.0, 56.0, 88.0, 130.0, 198.0, 317.0, 571.0, 1016.0, 1921.0, 3949.0, 9542.0, 27774.0, 103135.0, 346768.0, 380272.0, 120629.0, 31951.0, 10848.0, 4475.0, 2038.0, 1099.0, 617.0, 315.0, 184.0, 167.0, 77.0, 82.0, 39.0, 29.0, 35.0, 17.0, 12.0, 13.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0274658203125, -0.994384765625, -0.9613037109375, -0.92822265625, -0.8951416015625, -0.862060546875, -0.8289794921875, -0.7958984375, -0.7628173828125, -0.729736328125, -0.6966552734375, -0.66357421875, -0.6304931640625, -0.597412109375, -0.5643310546875, -0.53125, -0.4981689453125, -0.465087890625, -0.4320068359375, -0.39892578125, -0.3658447265625, -0.332763671875, -0.2996826171875, -0.2666015625, -0.2335205078125, -0.200439453125, -0.1673583984375, -0.13427734375, -0.1011962890625, -0.068115234375, -0.0350341796875, -0.001953125, 0.0311279296875, 0.064208984375, 0.0972900390625, 0.13037109375, 0.1634521484375, 0.196533203125, 0.2296142578125, 0.2626953125, 0.2957763671875, 0.328857421875, 0.3619384765625, 0.39501953125, 0.4281005859375, 0.461181640625, 0.4942626953125, 0.52734375, 0.5604248046875, 0.593505859375, 0.6265869140625, 0.65966796875, 0.6927490234375, 0.725830078125, 0.7589111328125, 0.7919921875, 0.8250732421875, 0.858154296875, 0.8912353515625, 0.92431640625, 0.9573974609375, 0.990478515625, 1.0235595703125, 1.056640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 10.0, 21.0, 20.0, 20.0, 32.0, 24.0, 57.0, 51.0, 54.0, 53.0, 75.0, 76.0, 81.0, 70.0, 71.0, 63.0, 32.0, 36.0, 31.0, 29.0, 17.0, 12.0, 11.0, 5.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69287109375, -0.667724609375, -0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 21.0, 67.0, 157.0, 245.0, 231.0, 144.0, 70.0, 32.0, 14.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53908348083496, -22.84380531311035, -22.148527145385742, -21.453248977661133, -20.75796890258789, -20.06269073486328, -19.367412567138672, -18.672134399414062, -17.976856231689453, -17.281578063964844, -16.586299896240234, -15.891020774841309, -15.1957426071167, -14.50046443939209, -13.805185317993164, -13.109907150268555, -12.414628982543945, -11.719350814819336, -11.024072647094727, -10.3287935256958, -9.633515357971191, -8.938237190246582, -8.242958068847656, -7.547679901123047, -6.8524017333984375, -6.157123565673828, -5.4618449211120605, -4.766566276550293, -4.071288108825684, -3.376009702682495, -2.6807312965393066, -1.985452651977539, -1.2901725769042969, -0.5948941707611084, 0.10038423538208008, 0.7956626415252686, 1.490941047668457, 2.1862194538116455, 2.881497859954834, 3.5767765045166016, 4.272054672241211, 4.96733283996582, 5.662611484527588, 6.3578901290893555, 7.053168296813965, 7.748446464538574, 8.4437255859375, 9.13900375366211, 9.834281921386719, 10.529560089111328, 11.224838256835938, 11.920117378234863, 12.615395545959473, 13.310673713684082, 14.005952835083008, 14.701231002807617, 15.396509170532227, 16.091787338256836, 16.787065505981445, 17.482343673706055, 18.177623748779297, 18.872901916503906, 19.568180084228516, 20.263458251953125, 20.958736419677734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 12.0, 12.0, 12.0, 11.0, 17.0, 11.0, 25.0, 27.0, 23.0, 32.0, 34.0, 36.0, 58.0, 38.0, 45.0, 59.0, 63.0, 49.0, 51.0, 40.0, 34.0, 40.0, 31.0, 34.0, 41.0, 26.0, 26.0, 12.0, 11.0, 21.0, 12.0, 10.0, 9.0, 6.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.7847723960876465, -6.530965805053711, -6.277159214019775, -6.02335262298584, -5.7695465087890625, -5.515739440917969, -5.261933326721191, -5.008126735687256, -4.75432014465332, -4.500513553619385, -4.246706962585449, -3.9929006099700928, -3.7390940189361572, -3.4852874279022217, -3.2314810752868652, -2.9776744842529297, -2.723867893218994, -2.4700613021850586, -2.216254711151123, -1.9624483585357666, -1.708641767501831, -1.4548351764678955, -1.2010287046432495, -0.9472222328186035, -0.693415641784668, -0.4396091103553772, -0.18580257892608643, 0.06800395250320435, 0.3218104839324951, 0.5756170749664307, 0.8294235467910767, 1.0832300186157227, 1.3370361328125, 1.5908427238464355, 1.8446491956710815, 2.0984556674957275, 2.352262258529663, 2.6060688495635986, 2.859875202178955, 3.1136817932128906, 3.367488384246826, 3.6212949752807617, 3.8751015663146973, 4.128908157348633, 4.38271427154541, 4.636521339416504, 4.890327453613281, 5.144134044647217, 5.397940635681152, 5.651747226715088, 5.905553817749023, 6.159360408782959, 6.4131669998168945, 6.666973114013672, 6.920779705047607, 7.174586296081543, 7.4283928871154785, 7.682199478149414, 7.93600606918335, 8.189812660217285, 8.443618774414062, 8.697425842285156, 8.951231956481934, 9.205038070678711, 9.458845138549805]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 14.0, 5.0, 10.0, 10.0, 21.0, 25.0, 30.0, 43.0, 65.0, 78.0, 109.0, 155.0, 248.0, 484.0, 1247.0, 3750.0, 16202.0, 177915.0, 3886101.0, 91308.0, 11649.0, 2917.0, 993.0, 415.0, 181.0, 111.0, 66.0, 27.0, 26.0, 18.0, 6.0, 5.0, 14.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.90234375, -4.75555419921875, -4.6087646484375, -4.46197509765625, -4.315185546875, -4.16839599609375, -4.0216064453125, -3.87481689453125, -3.72802734375, -3.58123779296875, -3.4344482421875, -3.28765869140625, -3.140869140625, -2.99407958984375, -2.8472900390625, -2.70050048828125, -2.5537109375, -2.40692138671875, -2.2601318359375, -2.11334228515625, -1.966552734375, -1.81976318359375, -1.6729736328125, -1.52618408203125, -1.37939453125, -1.23260498046875, -1.0858154296875, -0.93902587890625, -0.792236328125, -0.64544677734375, -0.4986572265625, -0.35186767578125, -0.205078125, -0.05828857421875, 0.0885009765625, 0.23529052734375, 0.382080078125, 0.52886962890625, 0.6756591796875, 0.82244873046875, 0.96923828125, 1.11602783203125, 1.2628173828125, 1.40960693359375, 1.556396484375, 1.70318603515625, 1.8499755859375, 1.99676513671875, 2.1435546875, 2.29034423828125, 2.4371337890625, 2.58392333984375, 2.730712890625, 2.87750244140625, 3.0242919921875, 3.17108154296875, 3.31787109375, 3.46466064453125, 3.6114501953125, 3.75823974609375, 3.905029296875, 4.05181884765625, 4.1986083984375, 4.34539794921875, 4.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 3.0, 8.0, 19.0, 18.0, 25.0, 44.0, 51.0, 59.0, 58.0, 69.0, 81.0, 79.0, 82.0, 59.0, 70.0, 53.0, 49.0, 39.0, 32.0, 27.0, 15.0, 14.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.54248046875, -0.5287551879882812, -0.5150299072265625, -0.5013046264648438, -0.487579345703125, -0.47385406494140625, -0.4601287841796875, -0.44640350341796875, -0.43267822265625, -0.41895294189453125, -0.4052276611328125, -0.39150238037109375, -0.377777099609375, -0.36405181884765625, -0.3503265380859375, -0.33660125732421875, -0.3228759765625, -0.30915069580078125, -0.2954254150390625, -0.28170013427734375, -0.267974853515625, -0.25424957275390625, -0.2405242919921875, -0.22679901123046875, -0.21307373046875, -0.19934844970703125, -0.1856231689453125, -0.17189788818359375, -0.158172607421875, -0.14444732666015625, -0.1307220458984375, -0.11699676513671875, -0.103271484375, -0.08954620361328125, -0.0758209228515625, -0.06209564208984375, -0.048370361328125, -0.03464508056640625, -0.0209197998046875, -0.00719451904296875, 0.00653076171875, 0.02025604248046875, 0.0339813232421875, 0.04770660400390625, 0.061431884765625, 0.07515716552734375, 0.0888824462890625, 0.10260772705078125, 0.1163330078125, 0.13005828857421875, 0.1437835693359375, 0.15750885009765625, 0.171234130859375, 0.18495941162109375, 0.1986846923828125, 0.21240997314453125, 0.22613525390625, 0.23986053466796875, 0.2535858154296875, 0.26731109619140625, 0.281036376953125, 0.29476165771484375, 0.3084869384765625, 0.32221221923828125, 0.3359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 10.0, 15.0, 19.0, 23.0, 48.0, 65.0, 93.0, 125.0, 175.0, 507.0, 5117.0, 3762717.0, 421604.0, 2862.0, 345.0, 153.0, 108.0, 70.0, 60.0, 33.0, 37.0, 37.0, 22.0, 12.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.25, -7.8896484375, -7.529296875, -7.1689453125, -6.80859375, -6.4482421875, -6.087890625, -5.7275390625, -5.3671875, -5.0068359375, -4.646484375, -4.2861328125, -3.92578125, -3.5654296875, -3.205078125, -2.8447265625, -2.484375, -2.1240234375, -1.763671875, -1.4033203125, -1.04296875, -0.6826171875, -0.322265625, 0.0380859375, 0.3984375, 0.7587890625, 1.119140625, 1.4794921875, 1.83984375, 2.2001953125, 2.560546875, 2.9208984375, 3.28125, 3.6416015625, 4.001953125, 4.3623046875, 4.72265625, 5.0830078125, 5.443359375, 5.8037109375, 6.1640625, 6.5244140625, 6.884765625, 7.2451171875, 7.60546875, 7.9658203125, 8.326171875, 8.6865234375, 9.046875, 9.4072265625, 9.767578125, 10.1279296875, 10.48828125, 10.8486328125, 11.208984375, 11.5693359375, 11.9296875, 12.2900390625, 12.650390625, 13.0107421875, 13.37109375, 13.7314453125, 14.091796875, 14.4521484375, 14.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 16.0, 41.0, 315.0, 3052.0, 544.0, 84.0, 19.0, 12.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.483154296875, -2.38623046875, -2.289306640625, -2.1923828125, -2.095458984375, -1.99853515625, -1.901611328125, -1.8046875, -1.707763671875, -1.61083984375, -1.513916015625, -1.4169921875, -1.320068359375, -1.22314453125, -1.126220703125, -1.029296875, -0.932373046875, -0.83544921875, -0.738525390625, -0.6416015625, -0.544677734375, -0.44775390625, -0.350830078125, -0.25390625, -0.156982421875, -0.06005859375, 0.036865234375, 0.1337890625, 0.230712890625, 0.32763671875, 0.424560546875, 0.521484375, 0.618408203125, 0.71533203125, 0.812255859375, 0.9091796875, 1.006103515625, 1.10302734375, 1.199951171875, 1.296875, 1.393798828125, 1.49072265625, 1.587646484375, 1.6845703125, 1.781494140625, 1.87841796875, 1.975341796875, 2.072265625, 2.169189453125, 2.26611328125, 2.363037109375, 2.4599609375, 2.556884765625, 2.65380859375, 2.750732421875, 2.84765625, 2.944580078125, 3.04150390625, 3.138427734375, 3.2353515625, 3.332275390625, 3.42919921875, 3.526123046875, 3.623046875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 13.0, 148.0, 590.0, 212.0, 33.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.634317874908447, -5.9419779777526855, -5.249637603759766, -4.557297706604004, -3.864957809448242, -3.1726179122924805, -2.4802775382995605, -1.7879376411437988, -1.095597743988037, -0.40325772762298584, 0.28908228874206543, 0.9814224243164062, 1.673762321472168, 2.3661022186279297, 3.0584425926208496, 3.7507824897766113, 4.443122386932373, 5.135462284088135, 5.827802658081055, 6.520142555236816, 7.212482452392578, 7.90482234954834, 8.597162246704102, 9.28950309753418, 9.981842041015625, 10.674181938171387, 11.366521835327148, 12.058862686157227, 12.751201629638672, 13.44354248046875, 14.135882377624512, 14.828222274780273, 15.520561218261719, 16.212902069091797, 16.905241012573242, 17.59758186340332, 18.289920806884766, 18.982261657714844, 19.674602508544922, 20.366941452026367, 21.059280395507812, 21.75162124633789, 22.443960189819336, 23.136301040649414, 23.82863998413086, 24.520980834960938, 25.213321685791016, 25.90566062927246, 26.59800148010254, 27.290342330932617, 27.982681274414062, 28.67502212524414, 29.367361068725586, 30.059701919555664, 30.75204086303711, 31.444381713867188, 32.136722564697266, 32.829063415527344, 33.52140426635742, 34.213741302490234, 34.90608215332031, 35.59842300415039, 36.29076385498047, 36.98310089111328, 37.67544174194336]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 10.0, 17.0, 23.0, 45.0, 68.0, 98.0, 112.0, 124.0, 118.0, 96.0, 110.0, 66.0, 46.0, 34.0, 14.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.434198379516602, -8.22624397277832, -8.018289566040039, -7.810335159301758, -7.602380752563477, -7.394426345825195, -7.186471939086914, -6.978517532348633, -6.770563125610352, -6.56260871887207, -6.354654312133789, -6.146699905395508, -5.938745498657227, -5.730791091918945, -5.522836685180664, -5.314882278442383, -5.106927871704102, -4.89897346496582, -4.691019058227539, -4.483064651489258, -4.275110244750977, -4.067155838012695, -3.859201431274414, -3.651247024536133, -3.4432926177978516, -3.2353382110595703, -3.027383804321289, -2.819429397583008, -2.6114749908447266, -2.4035205841064453, -2.195566177368164, -1.9876117706298828, -1.7796573638916016, -1.5717029571533203, -1.363748550415039, -1.1557941436767578, -0.9478397369384766, -0.7398853302001953, -0.5319309234619141, -0.3239765167236328, -0.11602210998535156, 0.09193229675292969, 0.29988670349121094, 0.5078411102294922, 0.7157955169677734, 0.9237499237060547, 1.131704330444336, 1.3396587371826172, 1.5476131439208984, 1.7555675506591797, 1.963521957397461, 2.171476364135742, 2.3794307708740234, 2.5873851776123047, 2.795339584350586, 3.003293991088867, 3.2112483978271484, 3.4192028045654297, 3.627157211303711, 3.835111618041992, 4.043066024780273, 4.251020431518555, 4.458974838256836, 4.666929244995117, 4.874883651733398]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 18.0, 26.0, 49.0, 91.0, 171.0, 412.0, 1472.0, 9789.0, 267981.0, 734818.0, 29902.0, 2654.0, 669.0, 243.0, 103.0, 52.0, 30.0, 25.0, 13.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.5302734375, -4.326171875, -4.1220703125, -3.91796875, -3.7138671875, -3.509765625, -3.3056640625, -3.1015625, -2.8974609375, -2.693359375, -2.4892578125, -2.28515625, -2.0810546875, -1.876953125, -1.6728515625, -1.46875, -1.2646484375, -1.060546875, -0.8564453125, -0.65234375, -0.4482421875, -0.244140625, -0.0400390625, 0.1640625, 0.3681640625, 0.572265625, 0.7763671875, 0.98046875, 1.1845703125, 1.388671875, 1.5927734375, 1.796875, 2.0009765625, 2.205078125, 2.4091796875, 2.61328125, 2.8173828125, 3.021484375, 3.2255859375, 3.4296875, 3.6337890625, 3.837890625, 4.0419921875, 4.24609375, 4.4501953125, 4.654296875, 4.8583984375, 5.0625, 5.2666015625, 5.470703125, 5.6748046875, 5.87890625, 6.0830078125, 6.287109375, 6.4912109375, 6.6953125, 6.8994140625, 7.103515625, 7.3076171875, 7.51171875, 7.7158203125, 7.919921875, 8.1240234375, 8.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 10.0, 16.0, 31.0, 30.0, 39.0, 31.0, 53.0, 64.0, 50.0, 60.0, 70.0, 68.0, 52.0, 56.0, 53.0, 57.0, 39.0, 39.0, 30.0, 19.0, 17.0, 18.0, 12.0, 12.0, 0.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.372314453125, -0.36093902587890625, -0.3495635986328125, -0.33818817138671875, -0.326812744140625, -0.31543731689453125, -0.3040618896484375, -0.29268646240234375, -0.28131103515625, -0.26993560791015625, -0.2585601806640625, -0.24718475341796875, -0.235809326171875, -0.22443389892578125, -0.2130584716796875, -0.20168304443359375, -0.1903076171875, -0.17893218994140625, -0.1675567626953125, -0.15618133544921875, -0.144805908203125, -0.13343048095703125, -0.1220550537109375, -0.11067962646484375, -0.09930419921875, -0.08792877197265625, -0.0765533447265625, -0.06517791748046875, -0.053802490234375, -0.04242706298828125, -0.0310516357421875, -0.01967620849609375, -0.00830078125, 0.00307464599609375, 0.0144500732421875, 0.02582550048828125, 0.037200927734375, 0.04857635498046875, 0.0599517822265625, 0.07132720947265625, 0.08270263671875, 0.09407806396484375, 0.1054534912109375, 0.11682891845703125, 0.128204345703125, 0.13957977294921875, 0.1509552001953125, 0.16233062744140625, 0.1737060546875, 0.18508148193359375, 0.1964569091796875, 0.20783233642578125, 0.219207763671875, 0.23058319091796875, 0.2419586181640625, 0.25333404541015625, 0.26470947265625, 0.27608489990234375, 0.2874603271484375, 0.29883575439453125, 0.310211181640625, 0.32158660888671875, 0.3329620361328125, 0.34433746337890625, 0.355712890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 18.0, 27.0, 25.0, 33.0, 50.0, 76.0, 109.0, 126.0, 212.0, 295.0, 451.0, 724.0, 1302.0, 2612.0, 5857.0, 16768.0, 62589.0, 240845.0, 440559.0, 200452.0, 50634.0, 14204.0, 4969.0, 2334.0, 1216.0, 672.0, 421.0, 266.0, 217.0, 110.0, 85.0, 74.0, 48.0, 52.0, 31.0, 20.0, 16.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.087890625, -2.02349853515625, -1.9591064453125, -1.89471435546875, -1.830322265625, -1.76593017578125, -1.7015380859375, -1.63714599609375, -1.57275390625, -1.50836181640625, -1.4439697265625, -1.37957763671875, -1.315185546875, -1.25079345703125, -1.1864013671875, -1.12200927734375, -1.0576171875, -0.99322509765625, -0.9288330078125, -0.86444091796875, -0.800048828125, -0.73565673828125, -0.6712646484375, -0.60687255859375, -0.54248046875, -0.47808837890625, -0.4136962890625, -0.34930419921875, -0.284912109375, -0.22052001953125, -0.1561279296875, -0.09173583984375, -0.02734375, 0.03704833984375, 0.1014404296875, 0.16583251953125, 0.230224609375, 0.29461669921875, 0.3590087890625, 0.42340087890625, 0.48779296875, 0.55218505859375, 0.6165771484375, 0.68096923828125, 0.745361328125, 0.80975341796875, 0.8741455078125, 0.93853759765625, 1.0029296875, 1.06732177734375, 1.1317138671875, 1.19610595703125, 1.260498046875, 1.32489013671875, 1.3892822265625, 1.45367431640625, 1.51806640625, 1.58245849609375, 1.6468505859375, 1.71124267578125, 1.775634765625, 1.84002685546875, 1.9044189453125, 1.96881103515625, 2.033203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 13.0, 5.0, 8.0, 14.0, 7.0, 19.0, 21.0, 30.0, 21.0, 22.0, 35.0, 35.0, 40.0, 48.0, 45.0, 64.0, 55.0, 54.0, 60.0, 53.0, 40.0, 44.0, 54.0, 35.0, 22.0, 30.0, 22.0, 19.0, 15.0, 22.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.9658203125, -1.914215087890625, -1.86260986328125, -1.811004638671875, -1.7593994140625, -1.707794189453125, -1.65618896484375, -1.604583740234375, -1.552978515625, -1.501373291015625, -1.44976806640625, -1.398162841796875, -1.3465576171875, -1.294952392578125, -1.24334716796875, -1.191741943359375, -1.14013671875, -1.088531494140625, -1.03692626953125, -0.985321044921875, -0.9337158203125, -0.882110595703125, -0.83050537109375, -0.778900146484375, -0.727294921875, -0.675689697265625, -0.62408447265625, -0.572479248046875, -0.5208740234375, -0.469268798828125, -0.41766357421875, -0.366058349609375, -0.314453125, -0.262847900390625, -0.21124267578125, -0.159637451171875, -0.1080322265625, -0.056427001953125, -0.00482177734375, 0.046783447265625, 0.098388671875, 0.149993896484375, 0.20159912109375, 0.253204345703125, 0.3048095703125, 0.356414794921875, 0.40802001953125, 0.459625244140625, 0.51123046875, 0.562835693359375, 0.61444091796875, 0.666046142578125, 0.7176513671875, 0.769256591796875, 0.82086181640625, 0.872467041015625, 0.924072265625, 0.975677490234375, 1.02728271484375, 1.078887939453125, 1.1304931640625, 1.182098388671875, 1.23370361328125, 1.285308837890625, 1.3369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 7.0, 23.0, 36.0, 42.0, 63.0, 84.0, 169.0, 279.0, 459.0, 1057.0, 2330.0, 6425.0, 23757.0, 109620.0, 451595.0, 351656.0, 74982.0, 17107.0, 5041.0, 1870.0, 856.0, 452.0, 238.0, 132.0, 88.0, 55.0, 37.0, 30.0, 8.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.2896270751953125, -1.249176025390625, -1.2087249755859375, -1.16827392578125, -1.1278228759765625, -1.087371826171875, -1.0469207763671875, -1.0064697265625, -0.9660186767578125, -0.925567626953125, -0.8851165771484375, -0.84466552734375, -0.8042144775390625, -0.763763427734375, -0.7233123779296875, -0.682861328125, -0.6424102783203125, -0.601959228515625, -0.5615081787109375, -0.52105712890625, -0.4806060791015625, -0.440155029296875, -0.3997039794921875, -0.3592529296875, -0.3188018798828125, -0.278350830078125, -0.2378997802734375, -0.19744873046875, -0.1569976806640625, -0.116546630859375, -0.0760955810546875, -0.03564453125, 0.0048065185546875, 0.045257568359375, 0.0857086181640625, 0.12615966796875, 0.1666107177734375, 0.207061767578125, 0.2475128173828125, 0.2879638671875, 0.3284149169921875, 0.368865966796875, 0.4093170166015625, 0.44976806640625, 0.4902191162109375, 0.530670166015625, 0.5711212158203125, 0.611572265625, 0.6520233154296875, 0.692474365234375, 0.7329254150390625, 0.77337646484375, 0.8138275146484375, 0.854278564453125, 0.8947296142578125, 0.9351806640625, 0.9756317138671875, 1.016082763671875, 1.0565338134765625, 1.09698486328125, 1.1374359130859375, 1.177886962890625, 1.2183380126953125, 1.2587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 15.0, 9.0, 12.0, 16.0, 21.0, 34.0, 33.0, 46.0, 54.0, 75.0, 87.0, 106.0, 88.0, 74.0, 67.0, 47.0, 40.0, 45.0, 40.0, 21.0, 14.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025582313537597656, -0.0002496875822544098, -0.00024355202913284302, -0.00023741647601127625, -0.00023128092288970947, -0.0002251453697681427, -0.00021900981664657593, -0.00021287426352500916, -0.00020673871040344238, -0.0002006031572818756, -0.00019446760416030884, -0.00018833205103874207, -0.0001821964979171753, -0.00017606094479560852, -0.00016992539167404175, -0.00016378983855247498, -0.0001576542854309082, -0.00015151873230934143, -0.00014538317918777466, -0.00013924762606620789, -0.0001331120729446411, -0.00012697651982307434, -0.00012084096670150757, -0.0001147054135799408, -0.00010856986045837402, -0.00010243430733680725, -9.629875421524048e-05, -9.01632010936737e-05, -8.402764797210693e-05, -7.789209485054016e-05, -7.175654172897339e-05, -6.562098860740662e-05, -5.9485435485839844e-05, -5.334988236427307e-05, -4.72143292427063e-05, -4.1078776121139526e-05, -3.4943222999572754e-05, -2.880766987800598e-05, -2.267211675643921e-05, -1.6536563634872437e-05, -1.0401010513305664e-05, -4.265457391738892e-06, 1.8700957298278809e-06, 8.005648851394653e-06, 1.4141201972961426e-05, 2.0276755094528198e-05, 2.641230821609497e-05, 3.254786133766174e-05, 3.8683414459228516e-05, 4.481896758079529e-05, 5.095452070236206e-05, 5.709007382392883e-05, 6.32256269454956e-05, 6.936118006706238e-05, 7.549673318862915e-05, 8.163228631019592e-05, 8.77678394317627e-05, 9.390339255332947e-05, 0.00010003894567489624, 0.00010617449879646301, 0.00011231005191802979, 0.00011844560503959656, 0.00012458115816116333, 0.0001307167112827301, 0.00013685226440429688]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 21.0, 23.0, 29.0, 51.0, 94.0, 140.0, 222.0, 347.0, 625.0, 1236.0, 2533.0, 6153.0, 18152.0, 68614.0, 294202.0, 466605.0, 138793.0, 33151.0, 10028.0, 3792.0, 1668.0, 852.0, 423.0, 293.0, 169.0, 92.0, 68.0, 49.0, 33.0, 13.0, 12.0, 13.0, 12.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.12109375, -1.085205078125, -1.04931640625, -1.013427734375, -0.9775390625, -0.941650390625, -0.90576171875, -0.869873046875, -0.833984375, -0.798095703125, -0.76220703125, -0.726318359375, -0.6904296875, -0.654541015625, -0.61865234375, -0.582763671875, -0.546875, -0.510986328125, -0.47509765625, -0.439208984375, -0.4033203125, -0.367431640625, -0.33154296875, -0.295654296875, -0.259765625, -0.223876953125, -0.18798828125, -0.152099609375, -0.1162109375, -0.080322265625, -0.04443359375, -0.008544921875, 0.02734375, 0.063232421875, 0.09912109375, 0.135009765625, 0.1708984375, 0.206787109375, 0.24267578125, 0.278564453125, 0.314453125, 0.350341796875, 0.38623046875, 0.422119140625, 0.4580078125, 0.493896484375, 0.52978515625, 0.565673828125, 0.6015625, 0.637451171875, 0.67333984375, 0.709228515625, 0.7451171875, 0.781005859375, 0.81689453125, 0.852783203125, 0.888671875, 0.924560546875, 0.96044921875, 0.996337890625, 1.0322265625, 1.068115234375, 1.10400390625, 1.139892578125, 1.17578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 6.0, 16.0, 14.0, 35.0, 35.0, 48.0, 47.0, 52.0, 74.0, 93.0, 97.0, 92.0, 83.0, 70.0, 50.0, 42.0, 25.0, 25.0, 24.0, 17.0, 11.0, 6.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9664154052734375, -0.934783935546875, -0.9031524658203125, -0.87152099609375, -0.8398895263671875, -0.808258056640625, -0.7766265869140625, -0.7449951171875, -0.7133636474609375, -0.681732177734375, -0.6501007080078125, -0.61846923828125, -0.5868377685546875, -0.555206298828125, -0.5235748291015625, -0.491943359375, -0.4603118896484375, -0.428680419921875, -0.3970489501953125, -0.36541748046875, -0.3337860107421875, -0.302154541015625, -0.2705230712890625, -0.2388916015625, -0.2072601318359375, -0.175628662109375, -0.1439971923828125, -0.11236572265625, -0.0807342529296875, -0.049102783203125, -0.0174713134765625, 0.01416015625, 0.0457916259765625, 0.077423095703125, 0.1090545654296875, 0.14068603515625, 0.1723175048828125, 0.203948974609375, 0.2355804443359375, 0.2672119140625, 0.2988433837890625, 0.330474853515625, 0.3621063232421875, 0.39373779296875, 0.4253692626953125, 0.457000732421875, 0.4886322021484375, 0.520263671875, 0.5518951416015625, 0.583526611328125, 0.6151580810546875, 0.64678955078125, 0.6784210205078125, 0.710052490234375, 0.7416839599609375, 0.7733154296875, 0.8049468994140625, 0.836578369140625, 0.8682098388671875, 0.89984130859375, 0.9314727783203125, 0.963104248046875, 0.9947357177734375, 1.0263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 25.0, 27.0, 60.0, 108.0, 137.0, 176.0, 148.0, 102.0, 93.0, 45.0, 27.0, 21.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.19582748413086, -17.657377243041992, -17.118927001953125, -16.580474853515625, -16.042024612426758, -15.50357437133789, -14.965124130249023, -14.426673889160156, -13.888222694396973, -13.349772453308105, -12.811321258544922, -12.272871017456055, -11.734420776367188, -11.195969581604004, -10.657519340515137, -10.119068145751953, -9.580617904663086, -9.042167663574219, -8.503716468811035, -7.965266227722168, -7.426815509796143, -6.888364791870117, -6.34991455078125, -5.811463832855225, -5.273013114929199, -4.734562397003174, -4.196111679077148, -3.6576614379882812, -3.119210720062256, -2.5807600021362305, -2.042309522628784, -1.503859043121338, -0.9654083251953125, -0.42695772647857666, 0.11149287223815918, 0.649943470954895, 1.1883940696716309, 1.7268447875976562, 2.2652952671051025, 2.803745746612549, 3.342196464538574, 3.8806471824645996, 4.419097900390625, 4.957548141479492, 5.495998859405518, 6.034449577331543, 6.57289981842041, 7.1113505363464355, 7.649801254272461, 8.188251495361328, 8.726702690124512, 9.265152931213379, 9.803604125976562, 10.34205436706543, 10.880504608154297, 11.418954849243164, 11.957406044006348, 12.495856285095215, 13.034307479858398, 13.572757720947266, 14.111207962036133, 14.649659156799316, 15.188109397888184, 15.726560592651367, 16.265010833740234]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 1.0, 7.0, 6.0, 9.0, 20.0, 20.0, 27.0, 21.0, 28.0, 29.0, 18.0, 38.0, 34.0, 40.0, 45.0, 38.0, 45.0, 53.0, 50.0, 46.0, 53.0, 49.0, 43.0, 43.0, 33.0, 35.0, 26.0, 15.0, 23.0, 15.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.792655944824219, -8.506147384643555, -8.219637870788574, -7.93312931060791, -7.646620750427246, -7.360111713409424, -7.073602676391602, -6.7870941162109375, -6.500585556030273, -6.214076519012451, -5.927567958831787, -5.641058921813965, -5.354550361633301, -5.0680413246154785, -4.781532287597656, -4.495023727416992, -4.20851469039917, -3.9220058917999268, -3.6354970932006836, -3.3489880561828613, -3.0624794960021973, -2.775970458984375, -2.489461660385132, -2.2029528617858887, -1.9164440631866455, -1.6299352645874023, -1.3434264659881592, -1.0569175481796265, -0.7704087495803833, -0.48389995098114014, -0.19739103317260742, 0.08911776542663574, 0.3756265640258789, 0.6621353626251221, 0.94864422082901, 1.235153079032898, 1.5216618776321411, 1.8081706762313843, 2.094679594039917, 2.38118839263916, 2.6676971912384033, 2.9542059898376465, 3.2407147884368896, 3.527223587036133, 3.813732624053955, 4.100241184234619, 4.386750221252441, 4.6732587814331055, 4.959767818450928, 5.24627685546875, 5.532785415649414, 5.819294452667236, 6.1058030128479, 6.392312049865723, 6.678820610046387, 6.965329647064209, 7.251838684082031, 7.5383477210998535, 7.824856281280518, 8.11136531829834, 8.397873878479004, 8.684382438659668, 8.970891952514648, 9.257400512695312, 9.543909072875977]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 12.0, 10.0, 24.0, 29.0, 48.0, 53.0, 77.0, 119.0, 169.0, 274.0, 521.0, 1055.0, 2608.0, 7992.0, 35873.0, 350709.0, 3607440.0, 154926.0, 22482.0, 6071.0, 2073.0, 849.0, 400.0, 189.0, 96.0, 54.0, 29.0, 18.0, 18.0, 7.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.261688232421875, -4.14447021484375, -4.027252197265625, -3.9100341796875, -3.792816162109375, -3.67559814453125, -3.558380126953125, -3.441162109375, -3.323944091796875, -3.20672607421875, -3.089508056640625, -2.9722900390625, -2.855072021484375, -2.73785400390625, -2.620635986328125, -2.50341796875, -2.386199951171875, -2.26898193359375, -2.151763916015625, -2.0345458984375, -1.917327880859375, -1.80010986328125, -1.682891845703125, -1.565673828125, -1.448455810546875, -1.33123779296875, -1.214019775390625, -1.0968017578125, -0.979583740234375, -0.86236572265625, -0.745147705078125, -0.6279296875, -0.510711669921875, -0.39349365234375, -0.276275634765625, -0.1590576171875, -0.041839599609375, 0.07537841796875, 0.192596435546875, 0.309814453125, 0.427032470703125, 0.54425048828125, 0.661468505859375, 0.7786865234375, 0.895904541015625, 1.01312255859375, 1.130340576171875, 1.24755859375, 1.364776611328125, 1.48199462890625, 1.599212646484375, 1.7164306640625, 1.833648681640625, 1.95086669921875, 2.068084716796875, 2.185302734375, 2.302520751953125, 2.41973876953125, 2.536956787109375, 2.6541748046875, 2.771392822265625, 2.88861083984375, 3.005828857421875, 3.123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 9.0, 11.0, 8.0, 10.0, 15.0, 21.0, 22.0, 38.0, 37.0, 40.0, 44.0, 55.0, 59.0, 52.0, 63.0, 59.0, 63.0, 59.0, 62.0, 42.0, 35.0, 41.0, 26.0, 38.0, 27.0, 20.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396728515625, -0.3847236633300781, -0.37271881103515625, -0.3607139587402344, -0.3487091064453125, -0.3367042541503906, -0.32469940185546875, -0.3126945495605469, -0.300689697265625, -0.2886848449707031, -0.27667999267578125, -0.2646751403808594, -0.2526702880859375, -0.24066543579101562, -0.22866058349609375, -0.21665573120117188, -0.20465087890625, -0.19264602661132812, -0.18064117431640625, -0.16863632202148438, -0.1566314697265625, -0.14462661743164062, -0.13262176513671875, -0.12061691284179688, -0.108612060546875, -0.09660720825195312, -0.08460235595703125, -0.07259750366210938, -0.0605926513671875, -0.048587799072265625, -0.03658294677734375, -0.024578094482421875, -0.0125732421875, -0.000568389892578125, 0.01143646240234375, 0.023441314697265625, 0.0354461669921875, 0.047451019287109375, 0.05945587158203125, 0.07146072387695312, 0.083465576171875, 0.09547042846679688, 0.10747528076171875, 0.11948013305664062, 0.1314849853515625, 0.14348983764648438, 0.15549468994140625, 0.16749954223632812, 0.17950439453125, 0.19150924682617188, 0.20351409912109375, 0.21551895141601562, 0.2275238037109375, 0.23952865600585938, 0.25153350830078125, 0.2635383605957031, 0.275543212890625, 0.2875480651855469, 0.29955291748046875, 0.3115577697753906, 0.3235626220703125, 0.3355674743652344, 0.34757232666015625, 0.3595771789550781, 0.37158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 11.0, 9.0, 16.0, 25.0, 30.0, 50.0, 55.0, 76.0, 132.0, 204.0, 331.0, 672.0, 1892.0, 8303.0, 325949.0, 3835483.0, 16371.0, 2611.0, 849.0, 406.0, 239.0, 142.0, 132.0, 84.0, 50.0, 55.0, 29.0, 20.0, 10.0, 16.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.899658203125, -10.58056640625, -10.261474609375, -9.9423828125, -9.623291015625, -9.30419921875, -8.985107421875, -8.666015625, -8.346923828125, -8.02783203125, -7.708740234375, -7.3896484375, -7.070556640625, -6.75146484375, -6.432373046875, -6.11328125, -5.794189453125, -5.47509765625, -5.156005859375, -4.8369140625, -4.517822265625, -4.19873046875, -3.879638671875, -3.560546875, -3.241455078125, -2.92236328125, -2.603271484375, -2.2841796875, -1.965087890625, -1.64599609375, -1.326904296875, -1.0078125, -0.688720703125, -0.36962890625, -0.050537109375, 0.2685546875, 0.587646484375, 0.90673828125, 1.225830078125, 1.544921875, 1.864013671875, 2.18310546875, 2.502197265625, 2.8212890625, 3.140380859375, 3.45947265625, 3.778564453125, 4.09765625, 4.416748046875, 4.73583984375, 5.054931640625, 5.3740234375, 5.693115234375, 6.01220703125, 6.331298828125, 6.650390625, 6.969482421875, 7.28857421875, 7.607666015625, 7.9267578125, 8.245849609375, 8.56494140625, 8.884033203125, 9.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 24.0, 32.0, 108.0, 486.0, 2227.0, 881.0, 194.0, 49.0, 20.0, 13.0, 12.0, 7.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.5149383544921875, -1.429290771484375, -1.3436431884765625, -1.25799560546875, -1.1723480224609375, -1.086700439453125, -1.0010528564453125, -0.9154052734375, -0.8297576904296875, -0.744110107421875, -0.6584625244140625, -0.57281494140625, -0.4871673583984375, -0.401519775390625, -0.3158721923828125, -0.230224609375, -0.1445770263671875, -0.058929443359375, 0.0267181396484375, 0.11236572265625, 0.1980133056640625, 0.283660888671875, 0.3693084716796875, 0.4549560546875, 0.5406036376953125, 0.626251220703125, 0.7118988037109375, 0.79754638671875, 0.8831939697265625, 0.968841552734375, 1.0544891357421875, 1.14013671875, 1.2257843017578125, 1.311431884765625, 1.3970794677734375, 1.48272705078125, 1.5683746337890625, 1.654022216796875, 1.7396697998046875, 1.8253173828125, 1.9109649658203125, 1.996612548828125, 2.0822601318359375, 2.16790771484375, 2.2535552978515625, 2.339202880859375, 2.4248504638671875, 2.510498046875, 2.5961456298828125, 2.681793212890625, 2.7674407958984375, 2.85308837890625, 2.9387359619140625, 3.024383544921875, 3.1100311279296875, 3.1956787109375, 3.2813262939453125, 3.366973876953125, 3.4526214599609375, 3.53826904296875, 3.6239166259765625, 3.709564208984375, 3.7952117919921875, 3.880859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 11.0, 32.0, 101.0, 272.0, 309.0, 171.0, 62.0, 21.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.170495986938477, -28.445274353027344, -27.72005271911621, -26.994831085205078, -26.269609451293945, -25.544387817382812, -24.81916618347168, -24.093944549560547, -23.368722915649414, -22.64350128173828, -21.91827964782715, -21.193058013916016, -20.467836380004883, -19.74261474609375, -19.017393112182617, -18.292171478271484, -17.56694984436035, -16.84172821044922, -16.116506576538086, -15.391284942626953, -14.66606330871582, -13.940841674804688, -13.215620040893555, -12.490398406982422, -11.765176773071289, -11.039955139160156, -10.314733505249023, -9.58951187133789, -8.864290237426758, -8.139068603515625, -7.413846969604492, -6.688625335693359, -5.963405609130859, -5.238183975219727, -4.512962341308594, -3.787740707397461, -3.062519073486328, -2.3372974395751953, -1.6120758056640625, -0.8868541717529297, -0.16163253784179688, 0.5635890960693359, 1.2888107299804688, 2.0140323638916016, 2.7392539978027344, 3.464475631713867, 4.189697265625, 4.914918899536133, 5.640140533447266, 6.365362167358398, 7.090583801269531, 7.815805435180664, 8.541027069091797, 9.26624870300293, 9.991470336914062, 10.716691970825195, 11.441913604736328, 12.167135238647461, 12.892356872558594, 13.617578506469727, 14.34280014038086, 15.068021774291992, 15.793243408203125, 16.518465042114258, 17.24368667602539]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 4.0, 11.0, 14.0, 10.0, 18.0, 38.0, 31.0, 26.0, 38.0, 70.0, 58.0, 67.0, 77.0, 65.0, 61.0, 60.0, 49.0, 44.0, 49.0, 34.0, 37.0, 19.0, 29.0, 20.0, 11.0, 19.0, 5.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.304987907409668, -6.130555152893066, -5.956122398376465, -5.781689643859863, -5.607256889343262, -5.43282413482666, -5.258391380310059, -5.083958625793457, -4.9095258712768555, -4.735093116760254, -4.560660362243652, -4.386227607727051, -4.211794853210449, -4.037362098693848, -3.862929105758667, -3.6884963512420654, -3.5140633583068848, -3.339630603790283, -3.1651978492736816, -2.99076509475708, -2.8163323402404785, -2.641899585723877, -2.4674665927886963, -2.2930338382720947, -2.118601083755493, -1.9441683292388916, -1.76973557472229, -1.595302700996399, -1.4208699464797974, -1.2464371919631958, -1.0720043182373047, -0.8975715637207031, -0.7231383323669434, -0.5487055778503418, -0.37427276372909546, -0.19983994960784912, -0.02540719509124756, 0.149025559425354, 0.3234584331512451, 0.4978911876678467, 0.6723239421844482, 0.8467566967010498, 1.0211894512176514, 1.1956223249435425, 1.370055079460144, 1.5444878339767456, 1.7189207077026367, 1.8933534622192383, 2.06778621673584, 2.2422189712524414, 2.416651725769043, 2.5910844802856445, 2.765517234802246, 2.9399499893188477, 3.1143829822540283, 3.28881573677063, 3.4632484912872314, 3.637681245803833, 3.8121140003204346, 3.9865469932556152, 4.160979747772217, 4.335412502288818, 4.50984525680542, 4.6842780113220215, 4.858710765838623]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 10.0, 4.0, 17.0, 19.0, 27.0, 34.0, 60.0, 67.0, 89.0, 170.0, 306.0, 488.0, 885.0, 1800.0, 4098.0, 11437.0, 41076.0, 169566.0, 478468.0, 252309.0, 61066.0, 16148.0, 5419.0, 2297.0, 1100.0, 582.0, 341.0, 219.0, 143.0, 84.0, 72.0, 40.0, 33.0, 16.0, 19.0, 11.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.553436279296875, -2.46429443359375, -2.375152587890625, -2.2860107421875, -2.196868896484375, -2.10772705078125, -2.018585205078125, -1.929443359375, -1.840301513671875, -1.75115966796875, -1.662017822265625, -1.5728759765625, -1.483734130859375, -1.39459228515625, -1.305450439453125, -1.21630859375, -1.127166748046875, -1.03802490234375, -0.948883056640625, -0.8597412109375, -0.770599365234375, -0.68145751953125, -0.592315673828125, -0.503173828125, -0.414031982421875, -0.32489013671875, -0.235748291015625, -0.1466064453125, -0.057464599609375, 0.03167724609375, 0.120819091796875, 0.2099609375, 0.299102783203125, 0.38824462890625, 0.477386474609375, 0.5665283203125, 0.655670166015625, 0.74481201171875, 0.833953857421875, 0.923095703125, 1.012237548828125, 1.10137939453125, 1.190521240234375, 1.2796630859375, 1.368804931640625, 1.45794677734375, 1.547088623046875, 1.63623046875, 1.725372314453125, 1.81451416015625, 1.903656005859375, 1.9927978515625, 2.081939697265625, 2.17108154296875, 2.260223388671875, 2.349365234375, 2.438507080078125, 2.52764892578125, 2.616790771484375, 2.7059326171875, 2.795074462890625, 2.88421630859375, 2.973358154296875, 3.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 15.0, 24.0, 24.0, 40.0, 39.0, 54.0, 56.0, 62.0, 70.0, 75.0, 70.0, 67.0, 68.0, 60.0, 58.0, 50.0, 42.0, 32.0, 16.0, 19.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49755859375, -0.4821281433105469, -0.46669769287109375, -0.4512672424316406, -0.4358367919921875, -0.4204063415527344, -0.40497589111328125, -0.3895454406738281, -0.374114990234375, -0.3586845397949219, -0.34325408935546875, -0.3278236389160156, -0.3123931884765625, -0.2969627380371094, -0.28153228759765625, -0.2661018371582031, -0.25067138671875, -0.23524093627929688, -0.21981048583984375, -0.20438003540039062, -0.1889495849609375, -0.17351913452148438, -0.15808868408203125, -0.14265823364257812, -0.127227783203125, -0.11179733276367188, -0.09636688232421875, -0.08093643188476562, -0.0655059814453125, -0.050075531005859375, -0.03464508056640625, -0.019214630126953125, -0.0037841796875, 0.011646270751953125, 0.02707672119140625, 0.042507171630859375, 0.0579376220703125, 0.07336807250976562, 0.08879852294921875, 0.10422897338867188, 0.119659423828125, 0.13508987426757812, 0.15052032470703125, 0.16595077514648438, 0.1813812255859375, 0.19681167602539062, 0.21224212646484375, 0.22767257690429688, 0.24310302734375, 0.2585334777832031, 0.27396392822265625, 0.2893943786621094, 0.3048248291015625, 0.3202552795410156, 0.33568572998046875, 0.3511161804199219, 0.366546630859375, 0.3819770812988281, 0.39740753173828125, 0.4128379821777344, 0.4282684326171875, 0.4436988830566406, 0.45912933349609375, 0.4745597839355469, 0.489990234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 22.0, 14.0, 32.0, 45.0, 55.0, 95.0, 127.0, 210.0, 345.0, 481.0, 922.0, 1856.0, 4280.0, 11506.0, 38635.0, 135895.0, 369441.0, 326233.0, 109876.0, 31288.0, 9632.0, 3754.0, 1607.0, 871.0, 419.0, 289.0, 201.0, 134.0, 89.0, 49.0, 52.0, 19.0, 23.0, 16.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.549835205078125, -1.49224853515625, -1.434661865234375, -1.3770751953125, -1.319488525390625, -1.26190185546875, -1.204315185546875, -1.146728515625, -1.089141845703125, -1.03155517578125, -0.973968505859375, -0.9163818359375, -0.858795166015625, -0.80120849609375, -0.743621826171875, -0.68603515625, -0.628448486328125, -0.57086181640625, -0.513275146484375, -0.4556884765625, -0.398101806640625, -0.34051513671875, -0.282928466796875, -0.225341796875, -0.167755126953125, -0.11016845703125, -0.052581787109375, 0.0050048828125, 0.062591552734375, 0.12017822265625, 0.177764892578125, 0.2353515625, 0.292938232421875, 0.35052490234375, 0.408111572265625, 0.4656982421875, 0.523284912109375, 0.58087158203125, 0.638458251953125, 0.696044921875, 0.753631591796875, 0.81121826171875, 0.868804931640625, 0.9263916015625, 0.983978271484375, 1.04156494140625, 1.099151611328125, 1.15673828125, 1.214324951171875, 1.27191162109375, 1.329498291015625, 1.3870849609375, 1.444671630859375, 1.50225830078125, 1.559844970703125, 1.617431640625, 1.675018310546875, 1.73260498046875, 1.790191650390625, 1.8477783203125, 1.905364990234375, 1.96295166015625, 2.020538330078125, 2.078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 2.0, 6.0, 11.0, 14.0, 9.0, 17.0, 28.0, 23.0, 24.0, 36.0, 38.0, 40.0, 32.0, 41.0, 42.0, 56.0, 48.0, 42.0, 61.0, 52.0, 42.0, 42.0, 41.0, 36.0, 29.0, 37.0, 30.0, 19.0, 20.0, 16.0, 17.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.88671875, -1.8379058837890625, -1.789093017578125, -1.7402801513671875, -1.69146728515625, -1.6426544189453125, -1.593841552734375, -1.5450286865234375, -1.4962158203125, -1.4474029541015625, -1.398590087890625, -1.3497772216796875, -1.30096435546875, -1.2521514892578125, -1.203338623046875, -1.1545257568359375, -1.105712890625, -1.0569000244140625, -1.008087158203125, -0.9592742919921875, -0.91046142578125, -0.8616485595703125, -0.812835693359375, -0.7640228271484375, -0.7152099609375, -0.6663970947265625, -0.617584228515625, -0.5687713623046875, -0.51995849609375, -0.4711456298828125, -0.422332763671875, -0.3735198974609375, -0.32470703125, -0.2758941650390625, -0.227081298828125, -0.1782684326171875, -0.12945556640625, -0.0806427001953125, -0.031829833984375, 0.0169830322265625, 0.0657958984375, 0.1146087646484375, 0.163421630859375, 0.2122344970703125, 0.26104736328125, 0.3098602294921875, 0.358673095703125, 0.4074859619140625, 0.456298828125, 0.5051116943359375, 0.553924560546875, 0.6027374267578125, 0.65155029296875, 0.7003631591796875, 0.749176025390625, 0.7979888916015625, 0.8468017578125, 0.8956146240234375, 0.944427490234375, 0.9932403564453125, 1.04205322265625, 1.0908660888671875, 1.139678955078125, 1.1884918212890625, 1.2373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 2.0, 8.0, 10.0, 11.0, 15.0, 32.0, 49.0, 73.0, 135.0, 201.0, 449.0, 920.0, 2404.0, 7916.0, 45350.0, 729111.0, 236670.0, 17795.0, 4504.0, 1520.0, 643.0, 312.0, 149.0, 89.0, 56.0, 29.0, 18.0, 20.0, 15.0, 5.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.857421875, -2.761444091796875, -2.66546630859375, -2.569488525390625, -2.4735107421875, -2.377532958984375, -2.28155517578125, -2.185577392578125, -2.089599609375, -1.993621826171875, -1.89764404296875, -1.801666259765625, -1.7056884765625, -1.609710693359375, -1.51373291015625, -1.417755126953125, -1.32177734375, -1.225799560546875, -1.12982177734375, -1.033843994140625, -0.9378662109375, -0.841888427734375, -0.74591064453125, -0.649932861328125, -0.553955078125, -0.457977294921875, -0.36199951171875, -0.266021728515625, -0.1700439453125, -0.074066162109375, 0.02191162109375, 0.117889404296875, 0.2138671875, 0.309844970703125, 0.40582275390625, 0.501800537109375, 0.5977783203125, 0.693756103515625, 0.78973388671875, 0.885711669921875, 0.981689453125, 1.077667236328125, 1.17364501953125, 1.269622802734375, 1.3656005859375, 1.461578369140625, 1.55755615234375, 1.653533935546875, 1.74951171875, 1.845489501953125, 1.94146728515625, 2.037445068359375, 2.1334228515625, 2.229400634765625, 2.32537841796875, 2.421356201171875, 2.517333984375, 2.613311767578125, 2.70928955078125, 2.805267333984375, 2.9012451171875, 2.997222900390625, 3.09320068359375, 3.189178466796875, 3.28515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 18.0, 20.0, 26.0, 34.0, 41.0, 56.0, 62.0, 80.0, 83.0, 106.0, 87.0, 61.0, 63.0, 34.0, 29.0, 29.0, 34.0, 20.0, 15.0, 15.0, 8.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015825405716896057, -0.00015319138765335083, -0.0001481287181377411, -0.00014306604862213135, -0.0001380033791065216, -0.00013294070959091187, -0.00012787804007530212, -0.00012281537055969238, -0.00011775270104408264, -0.0001126900315284729, -0.00010762736201286316, -0.00010256469249725342, -9.750202298164368e-05, -9.243935346603394e-05, -8.73766839504242e-05, -8.231401443481445e-05, -7.725134491920471e-05, -7.218867540359497e-05, -6.712600588798523e-05, -6.206333637237549e-05, -5.700066685676575e-05, -5.1937997341156006e-05, -4.6875327825546265e-05, -4.1812658309936523e-05, -3.674998879432678e-05, -3.168731927871704e-05, -2.66246497631073e-05, -2.156198024749756e-05, -1.6499310731887817e-05, -1.1436641216278076e-05, -6.373971700668335e-06, -1.3113021850585938e-06, 3.7513673305511475e-06, 8.814036846160889e-06, 1.387670636177063e-05, 1.893937587738037e-05, 2.4002045392990112e-05, 2.9064714908599854e-05, 3.4127384424209595e-05, 3.9190053939819336e-05, 4.425272345542908e-05, 4.931539297103882e-05, 5.437806248664856e-05, 5.94407320022583e-05, 6.450340151786804e-05, 6.956607103347778e-05, 7.462874054908752e-05, 7.969141006469727e-05, 8.475407958030701e-05, 8.981674909591675e-05, 9.487941861152649e-05, 9.994208812713623e-05, 0.00010500475764274597, 0.00011006742715835571, 0.00011513009667396545, 0.0001201927661895752, 0.00012525543570518494, 0.00013031810522079468, 0.00013538077473640442, 0.00014044344425201416, 0.0001455061137676239, 0.00015056878328323364, 0.00015563145279884338, 0.00016069412231445312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 10.0, 20.0, 21.0, 37.0, 58.0, 89.0, 131.0, 226.0, 350.0, 670.0, 1182.0, 2261.0, 4989.0, 16840.0, 255302.0, 713861.0, 38289.0, 7497.0, 3127.0, 1513.0, 760.0, 494.0, 280.0, 186.0, 101.0, 64.0, 54.0, 34.0, 22.0, 12.0, 9.0, 8.0, 5.0, 1.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.500274658203125, -2.40484619140625, -2.309417724609375, -2.2139892578125, -2.118560791015625, -2.02313232421875, -1.927703857421875, -1.832275390625, -1.736846923828125, -1.64141845703125, -1.545989990234375, -1.4505615234375, -1.355133056640625, -1.25970458984375, -1.164276123046875, -1.06884765625, -0.973419189453125, -0.87799072265625, -0.782562255859375, -0.6871337890625, -0.591705322265625, -0.49627685546875, -0.400848388671875, -0.305419921875, -0.209991455078125, -0.11456298828125, -0.019134521484375, 0.0762939453125, 0.171722412109375, 0.26715087890625, 0.362579345703125, 0.4580078125, 0.553436279296875, 0.64886474609375, 0.744293212890625, 0.8397216796875, 0.935150146484375, 1.03057861328125, 1.126007080078125, 1.221435546875, 1.316864013671875, 1.41229248046875, 1.507720947265625, 1.6031494140625, 1.698577880859375, 1.79400634765625, 1.889434814453125, 1.98486328125, 2.080291748046875, 2.17572021484375, 2.271148681640625, 2.3665771484375, 2.462005615234375, 2.55743408203125, 2.652862548828125, 2.748291015625, 2.843719482421875, 2.93914794921875, 3.034576416015625, 3.1300048828125, 3.225433349609375, 3.32086181640625, 3.416290283203125, 3.51171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 9.0, 15.0, 51.0, 137.0, 267.0, 247.0, 134.0, 61.0, 24.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.341094970703125, -3.24273681640625, -3.144378662109375, -3.0460205078125, -2.947662353515625, -2.84930419921875, -2.750946044921875, -2.652587890625, -2.554229736328125, -2.45587158203125, -2.357513427734375, -2.2591552734375, -2.160797119140625, -2.06243896484375, -1.964080810546875, -1.86572265625, -1.767364501953125, -1.66900634765625, -1.570648193359375, -1.4722900390625, -1.373931884765625, -1.27557373046875, -1.177215576171875, -1.078857421875, -0.980499267578125, -0.88214111328125, -0.783782958984375, -0.6854248046875, -0.587066650390625, -0.48870849609375, -0.390350341796875, -0.2919921875, -0.193634033203125, -0.09527587890625, 0.003082275390625, 0.1014404296875, 0.199798583984375, 0.29815673828125, 0.396514892578125, 0.494873046875, 0.593231201171875, 0.69158935546875, 0.789947509765625, 0.8883056640625, 0.986663818359375, 1.08502197265625, 1.183380126953125, 1.28173828125, 1.380096435546875, 1.47845458984375, 1.576812744140625, 1.6751708984375, 1.773529052734375, 1.87188720703125, 1.970245361328125, 2.068603515625, 2.166961669921875, 2.26531982421875, 2.363677978515625, 2.4620361328125, 2.560394287109375, 2.65875244140625, 2.757110595703125, 2.85546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 12.0, 15.0, 17.0, 23.0, 49.0, 78.0, 127.0, 157.0, 167.0, 135.0, 93.0, 57.0, 28.0, 15.0, 9.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375171661376953, -18.81422233581543, -18.253273010253906, -17.692323684692383, -17.13137435913086, -16.570425033569336, -16.009475708007812, -15.448526382446289, -14.887577056884766, -14.326627731323242, -13.765678405761719, -13.204729080200195, -12.643779754638672, -12.082830429077148, -11.521881103515625, -10.960931777954102, -10.399982452392578, -9.839033126831055, -9.278083801269531, -8.717134475708008, -8.156185150146484, -7.595235824584961, -7.0342864990234375, -6.473337173461914, -5.912387847900391, -5.351438522338867, -4.790489196777344, -4.22953987121582, -3.668590545654297, -3.1076412200927734, -2.54669189453125, -1.9857425689697266, -1.4247913360595703, -0.8638420104980469, -0.30289268493652344, 0.258056640625, 0.8190059661865234, 1.3799552917480469, 1.9409046173095703, 2.5018539428710938, 3.062803268432617, 3.6237525939941406, 4.184701919555664, 4.7456512451171875, 5.306600570678711, 5.867549896240234, 6.428499221801758, 6.989448547363281, 7.550397872924805, 8.111347198486328, 8.672296524047852, 9.233245849609375, 9.794195175170898, 10.355144500732422, 10.916093826293945, 11.477043151855469, 12.037992477416992, 12.598941802978516, 13.159891128540039, 13.720840454101562, 14.281789779663086, 14.84273910522461, 15.403688430786133, 15.964637756347656, 16.52558708190918]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 30.0, 21.0, 27.0, 26.0, 42.0, 47.0, 68.0, 45.0, 52.0, 54.0, 59.0, 56.0, 53.0, 57.0, 39.0, 55.0, 34.0, 43.0, 32.0, 19.0, 19.0, 14.0, 12.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.465709686279297, -9.090006828308105, -8.714303970336914, -8.338601112365723, -7.962898254394531, -7.58719539642334, -7.211493015289307, -6.835790157318115, -6.460087299346924, -6.084384441375732, -5.708681583404541, -5.332979202270508, -4.957276344299316, -4.581573486328125, -4.205870628356934, -3.830167770385742, -3.454464912414551, -3.0787620544433594, -2.703059196472168, -2.3273565769195557, -1.9516537189483643, -1.5759508609771729, -1.2002482414245605, -0.8245453834533691, -0.44884252548217773, -0.0731397271156311, 0.3025630712509155, 0.6782658100128174, 1.0539686679840088, 1.4296715259552002, 1.8053741455078125, 2.181077003479004, 2.556778907775879, 2.9324817657470703, 3.3081846237182617, 3.683887243270874, 4.0595903396606445, 4.435293197631836, 4.810995578765869, 5.1866984367370605, 5.562401294708252, 5.938104152679443, 6.313807010650635, 6.689509391784668, 7.065212249755859, 7.440915107727051, 7.816617965698242, 8.192320823669434, 8.568023681640625, 8.943726539611816, 9.319429397583008, 9.6951322555542, 10.07083511352539, 10.446537971496582, 10.822240829467773, 11.197942733764648, 11.573646545410156, 11.949349403381348, 12.325052261352539, 12.70075511932373, 13.076457977294922, 13.452160835266113, 13.827863693237305, 14.20356559753418, 14.579268455505371]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 16.0, 35.0, 65.0, 88.0, 183.0, 338.0, 772.0, 2481.0, 14309.0, 988862.0, 3164369.0, 17926.0, 3165.0, 911.0, 356.0, 179.0, 85.0, 41.0, 32.0, 12.0, 15.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6796875, -7.46051025390625, -7.2413330078125, -7.02215576171875, -6.802978515625, -6.58380126953125, -6.3646240234375, -6.14544677734375, -5.92626953125, -5.70709228515625, -5.4879150390625, -5.26873779296875, -5.049560546875, -4.83038330078125, -4.6112060546875, -4.39202880859375, -4.1728515625, -3.95367431640625, -3.7344970703125, -3.51531982421875, -3.296142578125, -3.07696533203125, -2.8577880859375, -2.63861083984375, -2.41943359375, -2.20025634765625, -1.9810791015625, -1.76190185546875, -1.542724609375, -1.32354736328125, -1.1043701171875, -0.88519287109375, -0.666015625, -0.44683837890625, -0.2276611328125, -0.00848388671875, 0.210693359375, 0.42987060546875, 0.6490478515625, 0.86822509765625, 1.08740234375, 1.30657958984375, 1.5257568359375, 1.74493408203125, 1.964111328125, 2.18328857421875, 2.4024658203125, 2.62164306640625, 2.8408203125, 3.05999755859375, 3.2791748046875, 3.49835205078125, 3.717529296875, 3.93670654296875, 4.1558837890625, 4.37506103515625, 4.59423828125, 4.81341552734375, 5.0325927734375, 5.25177001953125, 5.470947265625, 5.69012451171875, 5.9093017578125, 6.12847900390625, 6.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 4.0, 8.0, 8.0, 13.0, 15.0, 9.0, 26.0, 30.0, 30.0, 44.0, 63.0, 51.0, 53.0, 53.0, 61.0, 71.0, 73.0, 54.0, 60.0, 37.0, 41.0, 44.0, 41.0, 22.0, 27.0, 8.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.484619140625, -0.47092437744140625, -0.4572296142578125, -0.44353485107421875, -0.429840087890625, -0.41614532470703125, -0.4024505615234375, -0.38875579833984375, -0.37506103515625, -0.36136627197265625, -0.3476715087890625, -0.33397674560546875, -0.320281982421875, -0.30658721923828125, -0.2928924560546875, -0.27919769287109375, -0.2655029296875, -0.25180816650390625, -0.2381134033203125, -0.22441864013671875, -0.210723876953125, -0.19702911376953125, -0.1833343505859375, -0.16963958740234375, -0.15594482421875, -0.14225006103515625, -0.1285552978515625, -0.11486053466796875, -0.101165771484375, -0.08747100830078125, -0.0737762451171875, -0.06008148193359375, -0.04638671875, -0.03269195556640625, -0.0189971923828125, -0.00530242919921875, 0.008392333984375, 0.02208709716796875, 0.0357818603515625, 0.04947662353515625, 0.06317138671875, 0.07686614990234375, 0.0905609130859375, 0.10425567626953125, 0.117950439453125, 0.13164520263671875, 0.1453399658203125, 0.15903472900390625, 0.1727294921875, 0.18642425537109375, 0.2001190185546875, 0.21381378173828125, 0.227508544921875, 0.24120330810546875, 0.2548980712890625, 0.26859283447265625, 0.28228759765625, 0.29598236083984375, 0.3096771240234375, 0.32337188720703125, 0.337066650390625, 0.35076141357421875, 0.3644561767578125, 0.37815093994140625, 0.391845703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 7.0, 5.0, 6.0, 14.0, 20.0, 8.0, 36.0, 29.0, 31.0, 57.0, 87.0, 143.0, 261.0, 560.0, 1596.0, 6263.0, 44340.0, 3544291.0, 568293.0, 22310.0, 3836.0, 1019.0, 427.0, 216.0, 118.0, 49.0, 61.0, 43.0, 36.0, 25.0, 23.0, 8.0, 18.0, 4.0, 7.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2685546875, -4.115234375, -3.9619140625, -3.80859375, -3.6552734375, -3.501953125, -3.3486328125, -3.1953125, -3.0419921875, -2.888671875, -2.7353515625, -2.58203125, -2.4287109375, -2.275390625, -2.1220703125, -1.96875, -1.8154296875, -1.662109375, -1.5087890625, -1.35546875, -1.2021484375, -1.048828125, -0.8955078125, -0.7421875, -0.5888671875, -0.435546875, -0.2822265625, -0.12890625, 0.0244140625, 0.177734375, 0.3310546875, 0.484375, 0.6376953125, 0.791015625, 0.9443359375, 1.09765625, 1.2509765625, 1.404296875, 1.5576171875, 1.7109375, 1.8642578125, 2.017578125, 2.1708984375, 2.32421875, 2.4775390625, 2.630859375, 2.7841796875, 2.9375, 3.0908203125, 3.244140625, 3.3974609375, 3.55078125, 3.7041015625, 3.857421875, 4.0107421875, 4.1640625, 4.3173828125, 4.470703125, 4.6240234375, 4.77734375, 4.9306640625, 5.083984375, 5.2373046875, 5.390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 10.0, 14.0, 8.0, 37.0, 42.0, 106.0, 241.0, 668.0, 1865.0, 611.0, 201.0, 98.0, 52.0, 37.0, 26.0, 18.0, 8.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1163482666015625, -1.078399658203125, -1.0404510498046875, -1.00250244140625, -0.9645538330078125, -0.926605224609375, -0.8886566162109375, -0.8507080078125, -0.8127593994140625, -0.774810791015625, -0.7368621826171875, -0.69891357421875, -0.6609649658203125, -0.623016357421875, -0.5850677490234375, -0.547119140625, -0.5091705322265625, -0.471221923828125, -0.4332733154296875, -0.39532470703125, -0.3573760986328125, -0.319427490234375, -0.2814788818359375, -0.2435302734375, -0.2055816650390625, -0.167633056640625, -0.1296844482421875, -0.09173583984375, -0.0537872314453125, -0.015838623046875, 0.0221099853515625, 0.06005859375, 0.0980072021484375, 0.135955810546875, 0.1739044189453125, 0.21185302734375, 0.2498016357421875, 0.287750244140625, 0.3256988525390625, 0.3636474609375, 0.4015960693359375, 0.439544677734375, 0.4774932861328125, 0.51544189453125, 0.5533905029296875, 0.591339111328125, 0.6292877197265625, 0.667236328125, 0.7051849365234375, 0.743133544921875, 0.7810821533203125, 0.81903076171875, 0.8569793701171875, 0.894927978515625, 0.9328765869140625, 0.9708251953125, 1.0087738037109375, 1.046722412109375, 1.0846710205078125, 1.12261962890625, 1.1605682373046875, 1.198516845703125, 1.2364654541015625, 1.2744140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 19.0, 57.0, 167.0, 270.0, 258.0, 135.0, 59.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.97625160217285, -17.565088272094727, -17.1539249420166, -16.742759704589844, -16.33159637451172, -15.920433044433594, -15.509268760681152, -15.098105430603027, -14.686941146850586, -14.275777816772461, -13.86461353302002, -13.453450202941895, -13.042285919189453, -12.631122589111328, -12.219958305358887, -11.808794975280762, -11.39763069152832, -10.986467361450195, -10.575303077697754, -10.164139747619629, -9.752975463867188, -9.341812133789062, -8.930647850036621, -8.519484519958496, -8.108321189880371, -7.697157382965088, -7.285993576049805, -6.8748297691345215, -6.463665962219238, -6.052502632141113, -5.641338348388672, -5.230175018310547, -4.8190107345581055, -4.407846927642822, -3.996683120727539, -3.585519313812256, -3.1743555068969727, -2.7631919384002686, -2.3520281314849854, -1.9408643245697021, -1.529700517654419, -1.1185367107391357, -0.7073729634284973, -0.2962092161178589, 0.11495459079742432, 0.526118278503418, 0.9372820854187012, 1.3484458923339844, 1.7596096992492676, 2.170773506164551, 2.581937313079834, 2.993101119995117, 3.4042649269104004, 3.8154284954071045, 4.226592063903809, 4.63775634765625, 5.048919677734375, 5.460083484649658, 5.871247291564941, 6.282411098480225, 6.693574905395508, 7.104738235473633, 7.515902519226074, 7.927065849304199, 8.33823013305664]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 10.0, 22.0, 18.0, 23.0, 31.0, 41.0, 52.0, 41.0, 65.0, 63.0, 56.0, 72.0, 73.0, 57.0, 51.0, 58.0, 48.0, 44.0, 47.0, 33.0, 28.0, 13.0, 19.0, 8.0, 8.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.697535037994385, -4.567294597625732, -4.43705415725708, -4.306813716888428, -4.176573753356934, -4.046333312988281, -3.916092872619629, -3.7858524322509766, -3.655611991882324, -3.525371551513672, -3.3951311111450195, -3.2648909091949463, -3.134650468826294, -3.0044100284576416, -2.8741698265075684, -2.743929386138916, -2.6136889457702637, -2.4834485054016113, -2.353208065032959, -2.2229678630828857, -2.0927274227142334, -1.962486982345581, -1.8322466611862183, -1.7020063400268555, -1.5717658996582031, -1.4415254592895508, -1.311285138130188, -1.1810448169708252, -1.0508043766021729, -0.9205639958381653, -0.7903236150741577, -0.6600832343101501, -0.5298428535461426, -0.399602472782135, -0.26936209201812744, -0.13912171125411987, -0.008881330490112305, 0.12135905027389526, 0.25159943103790283, 0.3818398118019104, 0.512080192565918, 0.6423205733299255, 0.7725609540939331, 0.9028013348579407, 1.0330417156219482, 1.1632821559906006, 1.2935224771499634, 1.4237627983093262, 1.5540032386779785, 1.6842436790466309, 1.8144840002059937, 1.9447243213653564, 2.074964761734009, 2.205205202102661, 2.3354454040527344, 2.4656858444213867, 2.595926284790039, 2.7261667251586914, 2.8564071655273438, 2.986647367477417, 3.1168878078460693, 3.2471282482147217, 3.377368450164795, 3.5076088905334473, 3.6378493309020996]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 7.0, 26.0, 18.0, 32.0, 29.0, 42.0, 59.0, 89.0, 128.0, 184.0, 281.0, 525.0, 817.0, 1504.0, 2934.0, 6530.0, 16793.0, 52565.0, 188764.0, 438792.0, 237120.0, 65571.0, 20448.0, 7675.0, 3486.0, 1691.0, 920.0, 490.0, 305.0, 232.0, 153.0, 95.0, 67.0, 41.0, 31.0, 22.0, 16.0, 4.0, 11.0, 11.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.44921875, -2.363555908203125, -2.27789306640625, -2.192230224609375, -2.1065673828125, -2.020904541015625, -1.93524169921875, -1.849578857421875, -1.763916015625, -1.678253173828125, -1.59259033203125, -1.506927490234375, -1.4212646484375, -1.335601806640625, -1.24993896484375, -1.164276123046875, -1.07861328125, -0.992950439453125, -0.90728759765625, -0.821624755859375, -0.7359619140625, -0.650299072265625, -0.56463623046875, -0.478973388671875, -0.393310546875, -0.307647705078125, -0.22198486328125, -0.136322021484375, -0.0506591796875, 0.035003662109375, 0.12066650390625, 0.206329345703125, 0.2919921875, 0.377655029296875, 0.46331787109375, 0.548980712890625, 0.6346435546875, 0.720306396484375, 0.80596923828125, 0.891632080078125, 0.977294921875, 1.062957763671875, 1.14862060546875, 1.234283447265625, 1.3199462890625, 1.405609130859375, 1.49127197265625, 1.576934814453125, 1.66259765625, 1.748260498046875, 1.83392333984375, 1.919586181640625, 2.0052490234375, 2.090911865234375, 2.17657470703125, 2.262237548828125, 2.347900390625, 2.433563232421875, 2.51922607421875, 2.604888916015625, 2.6905517578125, 2.776214599609375, 2.86187744140625, 2.947540283203125, 3.033203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 17.0, 19.0, 21.0, 25.0, 32.0, 51.0, 37.0, 46.0, 44.0, 73.0, 62.0, 70.0, 64.0, 53.0, 57.0, 48.0, 39.0, 42.0, 39.0, 19.0, 24.0, 22.0, 18.0, 13.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4853515625, -0.471771240234375, -0.45819091796875, -0.444610595703125, -0.4310302734375, -0.417449951171875, -0.40386962890625, -0.390289306640625, -0.376708984375, -0.363128662109375, -0.34954833984375, -0.335968017578125, -0.3223876953125, -0.308807373046875, -0.29522705078125, -0.281646728515625, -0.26806640625, -0.254486083984375, -0.24090576171875, -0.227325439453125, -0.2137451171875, -0.200164794921875, -0.18658447265625, -0.173004150390625, -0.159423828125, -0.145843505859375, -0.13226318359375, -0.118682861328125, -0.1051025390625, -0.091522216796875, -0.07794189453125, -0.064361572265625, -0.05078125, -0.037200927734375, -0.02362060546875, -0.010040283203125, 0.0035400390625, 0.017120361328125, 0.03070068359375, 0.044281005859375, 0.057861328125, 0.071441650390625, 0.08502197265625, 0.098602294921875, 0.1121826171875, 0.125762939453125, 0.13934326171875, 0.152923583984375, 0.16650390625, 0.180084228515625, 0.19366455078125, 0.207244873046875, 0.2208251953125, 0.234405517578125, 0.24798583984375, 0.261566162109375, 0.275146484375, 0.288726806640625, 0.30230712890625, 0.315887451171875, 0.3294677734375, 0.343048095703125, 0.35662841796875, 0.370208740234375, 0.3837890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 0.0, 10.0, 13.0, 13.0, 16.0, 18.0, 35.0, 41.0, 85.0, 108.0, 137.0, 208.0, 314.0, 478.0, 810.0, 1683.0, 4631.0, 17033.0, 76282.0, 304845.0, 444864.0, 149870.0, 33519.0, 8167.0, 2556.0, 1111.0, 624.0, 327.0, 241.0, 155.0, 88.0, 70.0, 51.0, 39.0, 44.0, 17.0, 13.0, 11.0, 9.0, 8.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.115234375, -2.045257568359375, -1.97528076171875, -1.905303955078125, -1.8353271484375, -1.765350341796875, -1.69537353515625, -1.625396728515625, -1.555419921875, -1.485443115234375, -1.41546630859375, -1.345489501953125, -1.2755126953125, -1.205535888671875, -1.13555908203125, -1.065582275390625, -0.99560546875, -0.925628662109375, -0.85565185546875, -0.785675048828125, -0.7156982421875, -0.645721435546875, -0.57574462890625, -0.505767822265625, -0.435791015625, -0.365814208984375, -0.29583740234375, -0.225860595703125, -0.1558837890625, -0.085906982421875, -0.01593017578125, 0.054046630859375, 0.1240234375, 0.194000244140625, 0.26397705078125, 0.333953857421875, 0.4039306640625, 0.473907470703125, 0.54388427734375, 0.613861083984375, 0.683837890625, 0.753814697265625, 0.82379150390625, 0.893768310546875, 0.9637451171875, 1.033721923828125, 1.10369873046875, 1.173675537109375, 1.24365234375, 1.313629150390625, 1.38360595703125, 1.453582763671875, 1.5235595703125, 1.593536376953125, 1.66351318359375, 1.733489990234375, 1.803466796875, 1.873443603515625, 1.94342041015625, 2.013397216796875, 2.0833740234375, 2.153350830078125, 2.22332763671875, 2.293304443359375, 2.36328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 18.0, 13.0, 17.0, 11.0, 21.0, 35.0, 19.0, 25.0, 31.0, 36.0, 31.0, 34.0, 45.0, 40.0, 37.0, 43.0, 41.0, 38.0, 37.0, 47.0, 42.0, 36.0, 35.0, 32.0, 25.0, 26.0, 23.0, 28.0, 25.0, 23.0, 18.0, 13.0, 10.0, 8.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3828125, -1.3404998779296875, -1.298187255859375, -1.2558746337890625, -1.21356201171875, -1.1712493896484375, -1.128936767578125, -1.0866241455078125, -1.0443115234375, -1.0019989013671875, -0.959686279296875, -0.9173736572265625, -0.87506103515625, -0.8327484130859375, -0.790435791015625, -0.7481231689453125, -0.705810546875, -0.6634979248046875, -0.621185302734375, -0.5788726806640625, -0.53656005859375, -0.4942474365234375, -0.451934814453125, -0.4096221923828125, -0.3673095703125, -0.3249969482421875, -0.282684326171875, -0.2403717041015625, -0.19805908203125, -0.1557464599609375, -0.113433837890625, -0.0711212158203125, -0.02880859375, 0.0135040283203125, 0.055816650390625, 0.0981292724609375, 0.14044189453125, 0.1827545166015625, 0.225067138671875, 0.2673797607421875, 0.3096923828125, 0.3520050048828125, 0.394317626953125, 0.4366302490234375, 0.47894287109375, 0.5212554931640625, 0.563568115234375, 0.6058807373046875, 0.648193359375, 0.6905059814453125, 0.732818603515625, 0.7751312255859375, 0.81744384765625, 0.8597564697265625, 0.902069091796875, 0.9443817138671875, 0.9866943359375, 1.0290069580078125, 1.071319580078125, 1.1136322021484375, 1.15594482421875, 1.1982574462890625, 1.240570068359375, 1.2828826904296875, 1.3251953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 14.0, 30.0, 46.0, 75.0, 131.0, 205.0, 379.0, 853.0, 1882.0, 5329.0, 20163.0, 145867.0, 720438.0, 126114.0, 18413.0, 5112.0, 1811.0, 811.0, 403.0, 181.0, 107.0, 63.0, 39.0, 25.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37890625, -2.307830810546875, -2.23675537109375, -2.165679931640625, -2.0946044921875, -2.023529052734375, -1.95245361328125, -1.881378173828125, -1.810302734375, -1.739227294921875, -1.66815185546875, -1.597076416015625, -1.5260009765625, -1.454925537109375, -1.38385009765625, -1.312774658203125, -1.24169921875, -1.170623779296875, -1.09954833984375, -1.028472900390625, -0.9573974609375, -0.886322021484375, -0.81524658203125, -0.744171142578125, -0.673095703125, -0.602020263671875, -0.53094482421875, -0.459869384765625, -0.3887939453125, -0.317718505859375, -0.24664306640625, -0.175567626953125, -0.1044921875, -0.033416748046875, 0.03765869140625, 0.108734130859375, 0.1798095703125, 0.250885009765625, 0.32196044921875, 0.393035888671875, 0.464111328125, 0.535186767578125, 0.60626220703125, 0.677337646484375, 0.7484130859375, 0.819488525390625, 0.89056396484375, 0.961639404296875, 1.03271484375, 1.103790283203125, 1.17486572265625, 1.245941162109375, 1.3170166015625, 1.388092041015625, 1.45916748046875, 1.530242919921875, 1.601318359375, 1.672393798828125, 1.74346923828125, 1.814544677734375, 1.8856201171875, 1.956695556640625, 2.02777099609375, 2.098846435546875, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 16.0, 18.0, 22.0, 37.0, 32.0, 55.0, 93.0, 115.0, 126.0, 97.0, 66.0, 61.0, 57.0, 41.0, 20.0, 22.0, 11.0, 8.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002562999725341797, -0.00024925172328948975, -0.0002422034740447998, -0.00023515522480010986, -0.00022810697555541992, -0.00022105872631072998, -0.00021401047706604004, -0.0002069622278213501, -0.00019991397857666016, -0.00019286572933197021, -0.00018581748008728027, -0.00017876923084259033, -0.0001717209815979004, -0.00016467273235321045, -0.0001576244831085205, -0.00015057623386383057, -0.00014352798461914062, -0.00013647973537445068, -0.00012943148612976074, -0.0001223832368850708, -0.00011533498764038086, -0.00010828673839569092, -0.00010123848915100098, -9.419023990631104e-05, -8.71419906616211e-05, -8.009374141693115e-05, -7.304549217224121e-05, -6.599724292755127e-05, -5.894899368286133e-05, -5.190074443817139e-05, -4.4852495193481445e-05, -3.7804245948791504e-05, -3.075599670410156e-05, -2.370774745941162e-05, -1.665949821472168e-05, -9.611248970031738e-06, -2.562999725341797e-06, 4.4852495193481445e-06, 1.1533498764038086e-05, 1.8581748008728027e-05, 2.562999725341797e-05, 3.267824649810791e-05, 3.972649574279785e-05, 4.677474498748779e-05, 5.3822994232177734e-05, 6.0871243476867676e-05, 6.791949272155762e-05, 7.496774196624756e-05, 8.20159912109375e-05, 8.906424045562744e-05, 9.611248970031738e-05, 0.00010316073894500732, 0.00011020898818969727, 0.00011725723743438721, 0.00012430548667907715, 0.0001313537359237671, 0.00013840198516845703, 0.00014545023441314697, 0.00015249848365783691, 0.00015954673290252686, 0.0001665949821472168, 0.00017364323139190674, 0.00018069148063659668, 0.00018773972988128662, 0.00019478797912597656]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 16.0, 29.0, 37.0, 53.0, 109.0, 212.0, 383.0, 890.0, 2919.0, 14384.0, 223354.0, 766518.0, 32189.0, 5015.0, 1365.0, 504.0, 235.0, 128.0, 73.0, 46.0, 29.0, 12.0, 14.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.53515625, -3.418060302734375, -3.30096435546875, -3.183868408203125, -3.0667724609375, -2.949676513671875, -2.83258056640625, -2.715484619140625, -2.598388671875, -2.481292724609375, -2.36419677734375, -2.247100830078125, -2.1300048828125, -2.012908935546875, -1.89581298828125, -1.778717041015625, -1.66162109375, -1.544525146484375, -1.42742919921875, -1.310333251953125, -1.1932373046875, -1.076141357421875, -0.95904541015625, -0.841949462890625, -0.724853515625, -0.607757568359375, -0.49066162109375, -0.373565673828125, -0.2564697265625, -0.139373779296875, -0.02227783203125, 0.094818115234375, 0.2119140625, 0.329010009765625, 0.44610595703125, 0.563201904296875, 0.6802978515625, 0.797393798828125, 0.91448974609375, 1.031585693359375, 1.148681640625, 1.265777587890625, 1.38287353515625, 1.499969482421875, 1.6170654296875, 1.734161376953125, 1.85125732421875, 1.968353271484375, 2.08544921875, 2.202545166015625, 2.31964111328125, 2.436737060546875, 2.5538330078125, 2.670928955078125, 2.78802490234375, 2.905120849609375, 3.022216796875, 3.139312744140625, 3.25640869140625, 3.373504638671875, 3.4906005859375, 3.607696533203125, 3.72479248046875, 3.841888427734375, 3.958984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 12.0, 14.0, 29.0, 48.0, 60.0, 108.0, 163.0, 186.0, 128.0, 80.0, 51.0, 26.0, 15.0, 17.0, 13.0, 7.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8647308349609375, -1.808563232421875, -1.7523956298828125, -1.69622802734375, -1.6400604248046875, -1.583892822265625, -1.5277252197265625, -1.4715576171875, -1.4153900146484375, -1.359222412109375, -1.3030548095703125, -1.24688720703125, -1.1907196044921875, -1.134552001953125, -1.0783843994140625, -1.022216796875, -0.9660491943359375, -0.909881591796875, -0.8537139892578125, -0.79754638671875, -0.7413787841796875, -0.685211181640625, -0.6290435791015625, -0.5728759765625, -0.5167083740234375, -0.460540771484375, -0.4043731689453125, -0.34820556640625, -0.2920379638671875, -0.235870361328125, -0.1797027587890625, -0.12353515625, -0.0673675537109375, -0.011199951171875, 0.0449676513671875, 0.10113525390625, 0.1573028564453125, 0.213470458984375, 0.2696380615234375, 0.3258056640625, 0.3819732666015625, 0.438140869140625, 0.4943084716796875, 0.55047607421875, 0.6066436767578125, 0.662811279296875, 0.7189788818359375, 0.775146484375, 0.8313140869140625, 0.887481689453125, 0.9436492919921875, 0.99981689453125, 1.0559844970703125, 1.112152099609375, 1.1683197021484375, 1.2244873046875, 1.2806549072265625, 1.336822509765625, 1.3929901123046875, 1.44915771484375, 1.5053253173828125, 1.561492919921875, 1.6176605224609375, 1.673828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 11.0, 63.0, 151.0, 295.0, 276.0, 148.0, 33.0, 19.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.460739135742188, -25.25513458251953, -24.049531936645508, -22.84392738342285, -21.638324737548828, -20.432720184326172, -19.227115631103516, -18.021512985229492, -16.81591033935547, -15.610306739807129, -14.404703140258789, -13.199098587036133, -11.99349594116211, -10.787891387939453, -9.582287788391113, -8.376684188842773, -7.171079635620117, -5.965476036071777, -4.7598724365234375, -3.5542683601379395, -2.3486647605895996, -1.1430611610412598, 0.06254291534423828, 1.2681465148925781, 2.473750114440918, 3.679353713989258, 4.884957313537598, 6.090561389923096, 7.2961649894714355, 8.501768112182617, 9.707372665405273, 10.912976264953613, 12.118579864501953, 13.324183464050293, 14.529787063598633, 15.735391616821289, 16.940994262695312, 18.14659881591797, 19.352203369140625, 20.55780601501465, 21.763408660888672, 22.969013214111328, 24.17461585998535, 25.380220413208008, 26.58582305908203, 27.791427612304688, 28.997032165527344, 30.202634811401367, 31.408239364624023, 32.61384201049805, 33.8194465637207, 35.02505111694336, 36.230655670166016, 37.436256408691406, 38.64186096191406, 39.84746551513672, 41.053070068359375, 42.25867462158203, 43.46427917480469, 44.66987991333008, 45.875484466552734, 47.08108901977539, 48.28669357299805, 49.49229431152344, 50.697898864746094]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 11.0, 11.0, 24.0, 15.0, 24.0, 25.0, 18.0, 33.0, 38.0, 25.0, 37.0, 35.0, 42.0, 39.0, 40.0, 38.0, 52.0, 34.0, 41.0, 27.0, 31.0, 40.0, 50.0, 34.0, 27.0, 44.0, 21.0, 16.0, 13.0, 16.0, 12.0, 15.0, 9.0, 8.0, 6.0, 6.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-9.608081817626953, -9.353487014770508, -9.098893165588379, -8.844298362731934, -8.589704513549805, -8.33510971069336, -8.08051586151123, -7.825921058654785, -7.571327209472656, -7.316732883453369, -7.062138557434082, -6.807544231414795, -6.552949905395508, -6.298355579376221, -6.043761253356934, -5.789166450500488, -5.534572124481201, -5.279977798461914, -5.025383472442627, -4.77078914642334, -4.516194820404053, -4.261600494384766, -4.00700569152832, -3.7524116039276123, -3.497817277908325, -3.243222951889038, -2.988628625869751, -2.7340340614318848, -2.4794397354125977, -2.2248454093933105, -1.9702510833740234, -1.7156567573547363, -1.4610624313354492, -1.206468105316162, -0.9518737196922302, -0.6972793340682983, -0.44268500804901123, -0.18809068202972412, 0.06650376319885254, 0.32109808921813965, 0.5756924152374268, 0.8302867412567139, 1.084881067276001, 1.3394755125045776, 1.5940698385238647, 1.8486641645431519, 2.1032586097717285, 2.3578529357910156, 2.6124472618103027, 2.86704158782959, 3.121635913848877, 3.376230239868164, 3.630824565887451, 3.8854188919067383, 4.140013694763184, 4.3946075439453125, 4.649202346801758, 4.903796672821045, 5.158390998840332, 5.412985324859619, 5.667579650878906, 5.922173976898193, 6.1767683029174805, 6.431363105773926, 6.685956954956055]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 12.0, 17.0, 20.0, 22.0, 42.0, 49.0, 68.0, 85.0, 124.0, 177.0, 273.0, 443.0, 720.0, 1403.0, 3060.0, 6505.0, 18102.0, 76773.0, 2534349.0, 1454108.0, 67883.0, 17055.0, 6383.0, 2983.0, 1478.0, 868.0, 469.0, 271.0, 173.0, 122.0, 59.0, 47.0, 28.0, 31.0, 12.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71875, -3.612396240234375, -3.50604248046875, -3.399688720703125, -3.2933349609375, -3.186981201171875, -3.08062744140625, -2.974273681640625, -2.867919921875, -2.761566162109375, -2.65521240234375, -2.548858642578125, -2.4425048828125, -2.336151123046875, -2.22979736328125, -2.123443603515625, -2.01708984375, -1.910736083984375, -1.80438232421875, -1.698028564453125, -1.5916748046875, -1.485321044921875, -1.37896728515625, -1.272613525390625, -1.166259765625, -1.059906005859375, -0.95355224609375, -0.847198486328125, -0.7408447265625, -0.634490966796875, -0.52813720703125, -0.421783447265625, -0.3154296875, -0.209075927734375, -0.10272216796875, 0.003631591796875, 0.1099853515625, 0.216339111328125, 0.32269287109375, 0.429046630859375, 0.535400390625, 0.641754150390625, 0.74810791015625, 0.854461669921875, 0.9608154296875, 1.067169189453125, 1.17352294921875, 1.279876708984375, 1.38623046875, 1.492584228515625, 1.59893798828125, 1.705291748046875, 1.8116455078125, 1.917999267578125, 2.02435302734375, 2.130706787109375, 2.237060546875, 2.343414306640625, 2.44976806640625, 2.556121826171875, 2.6624755859375, 2.768829345703125, 2.87518310546875, 2.981536865234375, 3.087890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 6.0, 10.0, 18.0, 21.0, 28.0, 31.0, 35.0, 47.0, 37.0, 57.0, 50.0, 58.0, 73.0, 56.0, 63.0, 51.0, 64.0, 53.0, 36.0, 36.0, 24.0, 35.0, 21.0, 10.0, 13.0, 6.0, 15.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.509765625, -0.4956817626953125, -0.481597900390625, -0.4675140380859375, -0.45343017578125, -0.4393463134765625, -0.425262451171875, -0.4111785888671875, -0.3970947265625, -0.3830108642578125, -0.368927001953125, -0.3548431396484375, -0.34075927734375, -0.3266754150390625, -0.312591552734375, -0.2985076904296875, -0.284423828125, -0.2703399658203125, -0.256256103515625, -0.2421722412109375, -0.22808837890625, -0.2140045166015625, -0.199920654296875, -0.1858367919921875, -0.1717529296875, -0.1576690673828125, -0.143585205078125, -0.1295013427734375, -0.11541748046875, -0.1013336181640625, -0.087249755859375, -0.0731658935546875, -0.05908203125, -0.0449981689453125, -0.030914306640625, -0.0168304443359375, -0.00274658203125, 0.0113372802734375, 0.025421142578125, 0.0395050048828125, 0.0535888671875, 0.0676727294921875, 0.081756591796875, 0.0958404541015625, 0.10992431640625, 0.1240081787109375, 0.138092041015625, 0.1521759033203125, 0.166259765625, 0.1803436279296875, 0.194427490234375, 0.2085113525390625, 0.22259521484375, 0.2366790771484375, 0.250762939453125, 0.2648468017578125, 0.2789306640625, 0.2930145263671875, 0.307098388671875, 0.3211822509765625, 0.33526611328125, 0.3493499755859375, 0.363433837890625, 0.3775177001953125, 0.3916015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 15.0, 15.0, 29.0, 24.0, 33.0, 62.0, 103.0, 162.0, 265.0, 621.0, 1471.0, 4492.0, 24172.0, 493295.0, 3589376.0, 67082.0, 8791.0, 2367.0, 921.0, 365.0, 222.0, 96.0, 60.0, 52.0, 27.0, 26.0, 26.0, 19.0, 8.0, 11.0, 13.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.76666259765625, -4.6231689453125, -4.47967529296875, -4.336181640625, -4.19268798828125, -4.0491943359375, -3.90570068359375, -3.76220703125, -3.61871337890625, -3.4752197265625, -3.33172607421875, -3.188232421875, -3.04473876953125, -2.9012451171875, -2.75775146484375, -2.6142578125, -2.47076416015625, -2.3272705078125, -2.18377685546875, -2.040283203125, -1.89678955078125, -1.7532958984375, -1.60980224609375, -1.46630859375, -1.32281494140625, -1.1793212890625, -1.03582763671875, -0.892333984375, -0.74884033203125, -0.6053466796875, -0.46185302734375, -0.318359375, -0.17486572265625, -0.0313720703125, 0.11212158203125, 0.255615234375, 0.39910888671875, 0.5426025390625, 0.68609619140625, 0.82958984375, 0.97308349609375, 1.1165771484375, 1.26007080078125, 1.403564453125, 1.54705810546875, 1.6905517578125, 1.83404541015625, 1.9775390625, 2.12103271484375, 2.2645263671875, 2.40802001953125, 2.551513671875, 2.69500732421875, 2.8385009765625, 2.98199462890625, 3.12548828125, 3.26898193359375, 3.4124755859375, 3.55596923828125, 3.699462890625, 3.84295654296875, 3.9864501953125, 4.12994384765625, 4.2734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 8.0, 11.0, 23.0, 35.0, 60.0, 125.0, 298.0, 784.0, 1721.0, 580.0, 217.0, 101.0, 41.0, 15.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5857696533203125, -1.536773681640625, -1.4877777099609375, -1.43878173828125, -1.3897857666015625, -1.340789794921875, -1.2917938232421875, -1.2427978515625, -1.1938018798828125, -1.144805908203125, -1.0958099365234375, -1.04681396484375, -0.9978179931640625, -0.948822021484375, -0.8998260498046875, -0.850830078125, -0.8018341064453125, -0.752838134765625, -0.7038421630859375, -0.65484619140625, -0.6058502197265625, -0.556854248046875, -0.5078582763671875, -0.4588623046875, -0.4098663330078125, -0.360870361328125, -0.3118743896484375, -0.26287841796875, -0.2138824462890625, -0.164886474609375, -0.1158905029296875, -0.06689453125, -0.0178985595703125, 0.031097412109375, 0.0800933837890625, 0.12908935546875, 0.1780853271484375, 0.227081298828125, 0.2760772705078125, 0.3250732421875, 0.3740692138671875, 0.423065185546875, 0.4720611572265625, 0.52105712890625, 0.5700531005859375, 0.619049072265625, 0.6680450439453125, 0.717041015625, 0.7660369873046875, 0.815032958984375, 0.8640289306640625, 0.91302490234375, 0.9620208740234375, 1.011016845703125, 1.0600128173828125, 1.1090087890625, 1.1580047607421875, 1.207000732421875, 1.2559967041015625, 1.30499267578125, 1.3539886474609375, 1.402984619140625, 1.4519805908203125, 1.5009765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 6.0, 16.0, 18.0, 27.0, 55.0, 79.0, 93.0, 147.0, 116.0, 143.0, 113.0, 55.0, 47.0, 34.0, 18.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21065616607666, -5.977004051208496, -5.743351936340332, -5.509699821472168, -5.276047706604004, -5.04239559173584, -4.808743476867676, -4.575091361999512, -4.341439247131348, -4.107787132263184, -3.8741350173950195, -3.6404829025268555, -3.4068307876586914, -3.1731786727905273, -2.9395267963409424, -2.7058746814727783, -2.4722228050231934, -2.2385706901550293, -2.0049185752868652, -1.7712665796279907, -1.5376144647598267, -1.3039623498916626, -1.070310354232788, -0.836658239364624, -0.60300612449646, -0.3693540394306183, -0.1357019543647766, 0.09795010089874268, 0.33160221576690674, 0.5652543306350708, 0.7989063262939453, 1.0325584411621094, 1.2662105560302734, 1.4998626708984375, 1.7335147857666016, 1.967166781425476, 2.2008190155029297, 2.4344711303710938, 2.6681230068206787, 2.9017751216888428, 3.135427236557007, 3.369079351425171, 3.602731466293335, 3.83638334274292, 4.070035457611084, 4.303687572479248, 4.537339687347412, 4.770991802215576, 5.00464391708374, 5.238296031951904, 5.471948146820068, 5.705600261688232, 5.9392523765563965, 6.1729044914245605, 6.406556129455566, 6.6402082443237305, 6.8738603591918945, 7.107512474060059, 7.341164588928223, 7.574816703796387, 7.808468818664551, 8.042120933532715, 8.275773048400879, 8.509425163269043, 8.743077278137207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 13.0, 11.0, 12.0, 17.0, 21.0, 22.0, 27.0, 35.0, 47.0, 47.0, 46.0, 50.0, 45.0, 79.0, 53.0, 52.0, 52.0, 62.0, 52.0, 45.0, 38.0, 39.0, 24.0, 24.0, 24.0, 15.0, 12.0, 5.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4587721824645996, -3.318309783935547, -3.177847385406494, -3.0373847484588623, -2.8969223499298096, -2.756459951400757, -2.615997314453125, -2.4755349159240723, -2.3350725173950195, -2.194610118865967, -2.054147720336914, -1.9136850833892822, -1.7732226848602295, -1.6327602863311768, -1.4922977685928345, -1.3518352508544922, -1.2113728523254395, -1.0709104537963867, -0.9304479360580444, -0.7899854779243469, -0.6495230197906494, -0.5090605616569519, -0.3685981035232544, -0.22813564538955688, -0.08767318725585938, 0.052789270877838135, 0.19325172901153564, 0.33371418714523315, 0.47417664527893066, 0.6146391034126282, 0.7551015615463257, 0.8955640196800232, 1.0360264778137207, 1.1764888763427734, 1.3169513940811157, 1.457413911819458, 1.5978763103485107, 1.7383387088775635, 1.8788012266159058, 2.019263744354248, 2.159726142883301, 2.3001885414123535, 2.4406509399414062, 2.581113576889038, 2.721575975418091, 2.8620383739471436, 3.0025010108947754, 3.142963409423828, 3.283425807952881, 3.4238882064819336, 3.5643506050109863, 3.704813241958618, 3.845275640487671, 3.9857380390167236, 4.1262006759643555, 4.266663074493408, 4.407125473022461, 4.547587871551514, 4.688050270080566, 4.828512668609619, 4.968975067138672, 5.109437942504883, 5.2499003410339355, 5.390362739562988, 5.530825138092041]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 7.0, 5.0, 18.0, 30.0, 47.0, 69.0, 151.0, 278.0, 631.0, 1575.0, 4364.0, 18520.0, 119148.0, 705327.0, 165860.0, 23880.0, 5434.0, 1788.0, 748.0, 319.0, 159.0, 85.0, 38.0, 28.0, 17.0, 18.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.0987548828125, -3.955322265625, -3.8118896484375, -3.66845703125, -3.5250244140625, -3.381591796875, -3.2381591796875, -3.0947265625, -2.9512939453125, -2.807861328125, -2.6644287109375, -2.52099609375, -2.3775634765625, -2.234130859375, -2.0906982421875, -1.947265625, -1.8038330078125, -1.660400390625, -1.5169677734375, -1.37353515625, -1.2301025390625, -1.086669921875, -0.9432373046875, -0.7998046875, -0.6563720703125, -0.512939453125, -0.3695068359375, -0.22607421875, -0.0826416015625, 0.060791015625, 0.2042236328125, 0.34765625, 0.4910888671875, 0.634521484375, 0.7779541015625, 0.92138671875, 1.0648193359375, 1.208251953125, 1.3516845703125, 1.4951171875, 1.6385498046875, 1.781982421875, 1.9254150390625, 2.06884765625, 2.2122802734375, 2.355712890625, 2.4991455078125, 2.642578125, 2.7860107421875, 2.929443359375, 3.0728759765625, 3.21630859375, 3.3597412109375, 3.503173828125, 3.6466064453125, 3.7900390625, 3.9334716796875, 4.076904296875, 4.2203369140625, 4.36376953125, 4.5072021484375, 4.650634765625, 4.7940673828125, 4.9375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 10.0, 10.0, 19.0, 10.0, 33.0, 33.0, 24.0, 37.0, 58.0, 57.0, 54.0, 62.0, 59.0, 65.0, 65.0, 57.0, 58.0, 49.0, 48.0, 37.0, 34.0, 27.0, 11.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5498046875, -0.5346870422363281, -0.5195693969726562, -0.5044517517089844, -0.4893341064453125, -0.4742164611816406, -0.45909881591796875, -0.4439811706542969, -0.428863525390625, -0.4137458801269531, -0.39862823486328125, -0.3835105895996094, -0.3683929443359375, -0.3532752990722656, -0.33815765380859375, -0.3230400085449219, -0.30792236328125, -0.2928047180175781, -0.27768707275390625, -0.2625694274902344, -0.2474517822265625, -0.23233413696289062, -0.21721649169921875, -0.20209884643554688, -0.186981201171875, -0.17186355590820312, -0.15674591064453125, -0.14162826538085938, -0.1265106201171875, -0.11139297485351562, -0.09627532958984375, -0.08115768432617188, -0.0660400390625, -0.050922393798828125, -0.03580474853515625, -0.020687103271484375, -0.0055694580078125, 0.009548187255859375, 0.02466583251953125, 0.039783477783203125, 0.054901123046875, 0.07001876831054688, 0.08513641357421875, 0.10025405883789062, 0.1153717041015625, 0.13048934936523438, 0.14560699462890625, 0.16072463989257812, 0.17584228515625, 0.19095993041992188, 0.20607757568359375, 0.22119522094726562, 0.2363128662109375, 0.2514305114746094, 0.26654815673828125, 0.2816658020019531, 0.296783447265625, 0.3119010925292969, 0.32701873779296875, 0.3421363830566406, 0.3572540283203125, 0.3723716735839844, 0.38748931884765625, 0.4026069641113281, 0.417724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 6.0, 8.0, 13.0, 8.0, 25.0, 37.0, 32.0, 52.0, 82.0, 109.0, 136.0, 222.0, 340.0, 628.0, 1072.0, 2268.0, 6080.0, 19562.0, 74596.0, 340462.0, 458312.0, 103999.0, 26340.0, 8087.0, 2872.0, 1313.0, 654.0, 360.0, 256.0, 163.0, 117.0, 87.0, 61.0, 44.0, 28.0, 21.0, 22.0, 23.0, 11.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.408203125, -2.333221435546875, -2.25823974609375, -2.183258056640625, -2.1082763671875, -2.033294677734375, -1.95831298828125, -1.883331298828125, -1.808349609375, -1.733367919921875, -1.65838623046875, -1.583404541015625, -1.5084228515625, -1.433441162109375, -1.35845947265625, -1.283477783203125, -1.20849609375, -1.133514404296875, -1.05853271484375, -0.983551025390625, -0.9085693359375, -0.833587646484375, -0.75860595703125, -0.683624267578125, -0.608642578125, -0.533660888671875, -0.45867919921875, -0.383697509765625, -0.3087158203125, -0.233734130859375, -0.15875244140625, -0.083770751953125, -0.0087890625, 0.066192626953125, 0.14117431640625, 0.216156005859375, 0.2911376953125, 0.366119384765625, 0.44110107421875, 0.516082763671875, 0.591064453125, 0.666046142578125, 0.74102783203125, 0.816009521484375, 0.8909912109375, 0.965972900390625, 1.04095458984375, 1.115936279296875, 1.19091796875, 1.265899658203125, 1.34088134765625, 1.415863037109375, 1.4908447265625, 1.565826416015625, 1.64080810546875, 1.715789794921875, 1.790771484375, 1.865753173828125, 1.94073486328125, 2.015716552734375, 2.0906982421875, 2.165679931640625, 2.24066162109375, 2.315643310546875, 2.390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 4.0, 12.0, 14.0, 25.0, 16.0, 28.0, 23.0, 53.0, 52.0, 50.0, 51.0, 39.0, 55.0, 52.0, 72.0, 55.0, 47.0, 55.0, 54.0, 37.0, 42.0, 32.0, 20.0, 28.0, 19.0, 13.0, 11.0, 7.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.02734375, -1.96722412109375, -1.9071044921875, -1.84698486328125, -1.786865234375, -1.72674560546875, -1.6666259765625, -1.60650634765625, -1.54638671875, -1.48626708984375, -1.4261474609375, -1.36602783203125, -1.305908203125, -1.24578857421875, -1.1856689453125, -1.12554931640625, -1.0654296875, -1.00531005859375, -0.9451904296875, -0.88507080078125, -0.824951171875, -0.76483154296875, -0.7047119140625, -0.64459228515625, -0.58447265625, -0.52435302734375, -0.4642333984375, -0.40411376953125, -0.343994140625, -0.28387451171875, -0.2237548828125, -0.16363525390625, -0.103515625, -0.04339599609375, 0.0167236328125, 0.07684326171875, 0.136962890625, 0.19708251953125, 0.2572021484375, 0.31732177734375, 0.37744140625, 0.43756103515625, 0.4976806640625, 0.55780029296875, 0.617919921875, 0.67803955078125, 0.7381591796875, 0.79827880859375, 0.8583984375, 0.91851806640625, 0.9786376953125, 1.03875732421875, 1.098876953125, 1.15899658203125, 1.2191162109375, 1.27923583984375, 1.33935546875, 1.39947509765625, 1.4595947265625, 1.51971435546875, 1.579833984375, 1.63995361328125, 1.7000732421875, 1.76019287109375, 1.8203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 11.0, 9.0, 20.0, 40.0, 48.0, 100.0, 149.0, 286.0, 645.0, 1539.0, 4888.0, 20452.0, 143080.0, 761612.0, 93661.0, 15606.0, 3972.0, 1281.0, 521.0, 263.0, 140.0, 83.0, 55.0, 36.0, 19.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.175079345703125, -2.10797119140625, -2.040863037109375, -1.9737548828125, -1.906646728515625, -1.83953857421875, -1.772430419921875, -1.705322265625, -1.638214111328125, -1.57110595703125, -1.503997802734375, -1.4368896484375, -1.369781494140625, -1.30267333984375, -1.235565185546875, -1.16845703125, -1.101348876953125, -1.03424072265625, -0.967132568359375, -0.9000244140625, -0.832916259765625, -0.76580810546875, -0.698699951171875, -0.631591796875, -0.564483642578125, -0.49737548828125, -0.430267333984375, -0.3631591796875, -0.296051025390625, -0.22894287109375, -0.161834716796875, -0.0947265625, -0.027618408203125, 0.03948974609375, 0.106597900390625, 0.1737060546875, 0.240814208984375, 0.30792236328125, 0.375030517578125, 0.442138671875, 0.509246826171875, 0.57635498046875, 0.643463134765625, 0.7105712890625, 0.777679443359375, 0.84478759765625, 0.911895751953125, 0.97900390625, 1.046112060546875, 1.11322021484375, 1.180328369140625, 1.2474365234375, 1.314544677734375, 1.38165283203125, 1.448760986328125, 1.515869140625, 1.582977294921875, 1.65008544921875, 1.717193603515625, 1.7843017578125, 1.851409912109375, 1.91851806640625, 1.985626220703125, 2.052734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 17.0, 14.0, 32.0, 37.0, 71.0, 237.0, 346.0, 102.0, 53.0, 23.0, 23.0, 12.0, 8.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006055831909179688, -0.0005901232361793518, -0.0005746632814407349, -0.0005592033267021179, -0.000543743371963501, -0.000528283417224884, -0.0005128234624862671, -0.0004973635077476501, -0.0004819035530090332, -0.00046644359827041626, -0.0004509836435317993, -0.0004355236887931824, -0.00042006373405456543, -0.0004046037793159485, -0.00038914382457733154, -0.0003736838698387146, -0.00035822391510009766, -0.0003427639603614807, -0.00032730400562286377, -0.0003118440508842468, -0.0002963840961456299, -0.00028092414140701294, -0.000265464186668396, -0.00025000423192977905, -0.0002345442771911621, -0.00021908432245254517, -0.00020362436771392822, -0.00018816441297531128, -0.00017270445823669434, -0.0001572445034980774, -0.00014178454875946045, -0.0001263245940208435, -0.00011086463928222656, -9.540468454360962e-05, -7.994472980499268e-05, -6.448477506637573e-05, -4.902482032775879e-05, -3.3564865589141846e-05, -1.8104910850524902e-05, -2.644956111907959e-06, 1.2814998626708984e-05, 2.8274953365325928e-05, 4.373490810394287e-05, 5.9194862842559814e-05, 7.465481758117676e-05, 9.01147723197937e-05, 0.00010557472705841064, 0.00012103468179702759, 0.00013649463653564453, 0.00015195459127426147, 0.00016741454601287842, 0.00018287450075149536, 0.0001983344554901123, 0.00021379441022872925, 0.0002292543649673462, 0.00024471431970596313, 0.0002601742744445801, 0.000275634229183197, 0.00029109418392181396, 0.0003065541386604309, 0.00032201409339904785, 0.0003374740481376648, 0.00035293400287628174, 0.0003683939576148987, 0.0003838539123535156]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 12.0, 13.0, 16.0, 15.0, 22.0, 35.0, 26.0, 42.0, 76.0, 100.0, 131.0, 271.0, 495.0, 996.0, 2381.0, 6156.0, 18936.0, 73313.0, 687874.0, 205020.0, 35272.0, 10403.0, 3780.0, 1463.0, 696.0, 412.0, 185.0, 121.0, 78.0, 57.0, 44.0, 30.0, 24.0, 19.0, 16.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.674041748046875, -1.61370849609375, -1.553375244140625, -1.4930419921875, -1.432708740234375, -1.37237548828125, -1.312042236328125, -1.251708984375, -1.191375732421875, -1.13104248046875, -1.070709228515625, -1.0103759765625, -0.950042724609375, -0.88970947265625, -0.829376220703125, -0.76904296875, -0.708709716796875, -0.64837646484375, -0.588043212890625, -0.5277099609375, -0.467376708984375, -0.40704345703125, -0.346710205078125, -0.286376953125, -0.226043701171875, -0.16571044921875, -0.105377197265625, -0.0450439453125, 0.015289306640625, 0.07562255859375, 0.135955810546875, 0.1962890625, 0.256622314453125, 0.31695556640625, 0.377288818359375, 0.4376220703125, 0.497955322265625, 0.55828857421875, 0.618621826171875, 0.678955078125, 0.739288330078125, 0.79962158203125, 0.859954833984375, 0.9202880859375, 0.980621337890625, 1.04095458984375, 1.101287841796875, 1.16162109375, 1.221954345703125, 1.28228759765625, 1.342620849609375, 1.4029541015625, 1.463287353515625, 1.52362060546875, 1.583953857421875, 1.644287109375, 1.704620361328125, 1.76495361328125, 1.825286865234375, 1.8856201171875, 1.945953369140625, 2.00628662109375, 2.066619873046875, 2.126953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 9.0, 4.0, 12.0, 12.0, 12.0, 21.0, 21.0, 25.0, 45.0, 68.0, 100.0, 151.0, 160.0, 110.0, 69.0, 34.0, 28.0, 20.0, 18.0, 15.0, 19.0, 18.0, 8.0, 2.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9423751831054688, -0.9018402099609375, -0.8613052368164062, -0.820770263671875, -0.7802352905273438, -0.7397003173828125, -0.6991653442382812, -0.65863037109375, -0.6180953979492188, -0.5775604248046875, -0.5370254516601562, -0.496490478515625, -0.45595550537109375, -0.4154205322265625, -0.37488555908203125, -0.3343505859375, -0.29381561279296875, -0.2532806396484375, -0.21274566650390625, -0.172210693359375, -0.13167572021484375, -0.0911407470703125, -0.05060577392578125, -0.01007080078125, 0.03046417236328125, 0.0709991455078125, 0.11153411865234375, 0.152069091796875, 0.19260406494140625, 0.2331390380859375, 0.27367401123046875, 0.314208984375, 0.35474395751953125, 0.3952789306640625, 0.43581390380859375, 0.476348876953125, 0.5168838500976562, 0.5574188232421875, 0.5979537963867188, 0.63848876953125, 0.6790237426757812, 0.7195587158203125, 0.7600936889648438, 0.800628662109375, 0.8411636352539062, 0.8816986083984375, 0.9222335815429688, 0.9627685546875, 1.0033035278320312, 1.0438385009765625, 1.0843734741210938, 1.124908447265625, 1.1654434204101562, 1.2059783935546875, 1.2465133666992188, 1.28704833984375, 1.3275833129882812, 1.3681182861328125, 1.4086532592773438, 1.449188232421875, 1.4897232055664062, 1.5302581787109375, 1.5707931518554688, 1.611328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 14.0, 31.0, 68.0, 127.0, 176.0, 186.0, 165.0, 115.0, 52.0, 31.0, 14.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.84744644165039, -24.052867889404297, -23.25828742980957, -22.463708877563477, -21.66912841796875, -20.874549865722656, -20.079971313476562, -19.285390853881836, -18.49081039428711, -17.696231842041016, -16.90165138244629, -16.107072830200195, -15.312492370605469, -14.517913818359375, -13.723334312438965, -12.928754806518555, -12.134176254272461, -11.33959674835205, -10.54501724243164, -9.750438690185547, -8.95585823059082, -8.161279678344727, -7.366700172424316, -6.572120666503906, -5.777541160583496, -4.982961654663086, -4.188382148742676, -3.393803119659424, -2.5992236137390137, -1.8046441078186035, -1.0100650787353516, -0.2154855728149414, 0.5790958404541016, 1.3736752271652222, 2.1682546138763428, 2.962833881378174, 3.757413387298584, 4.551992893218994, 5.346571922302246, 6.141151428222656, 6.935730934143066, 7.730310440063477, 8.524889945983887, 9.319469451904297, 10.11404800415039, 10.908628463745117, 11.703207015991211, 12.497786521911621, 13.292366027832031, 14.086945533752441, 14.881525039672852, 15.676103591918945, 16.470684051513672, 17.265262603759766, 18.05984115600586, 18.854421615600586, 19.649002075195312, 20.443580627441406, 21.238161087036133, 22.032739639282227, 22.827320098876953, 23.621898651123047, 24.41647720336914, 25.211057662963867, 26.00563621520996]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 4.0, 8.0, 9.0, 4.0, 12.0, 14.0, 9.0, 15.0, 12.0, 23.0, 23.0, 26.0, 21.0, 23.0, 35.0, 33.0, 28.0, 39.0, 36.0, 37.0, 31.0, 39.0, 34.0, 38.0, 41.0, 44.0, 40.0, 35.0, 27.0, 32.0, 29.0, 17.0, 23.0, 23.0, 27.0, 8.0, 14.0, 13.0, 12.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.466588497161865, -7.238072395324707, -7.009555816650391, -6.781039714813232, -6.552523136138916, -6.324007034301758, -6.095490455627441, -5.866974353790283, -5.638458251953125, -5.409942150115967, -5.18142557144165, -4.952909469604492, -4.724392890930176, -4.495876789093018, -4.267360687255859, -4.038844108581543, -3.8103275299072266, -3.5818111896514893, -3.353294849395752, -3.1247787475585938, -2.8962621688842773, -2.667746067047119, -2.439229726791382, -2.2107133865356445, -1.9821970462799072, -1.75368070602417, -1.5251643657684326, -1.2966481447219849, -1.0681318044662476, -0.8396154642105103, -0.6110992431640625, -0.3825829029083252, -0.1540665626525879, 0.07444974780082703, 0.30296605825424194, 0.5314823389053345, 0.7599986791610718, 0.9885150194168091, 1.2170312404632568, 1.4455475807189941, 1.6740639209747314, 1.9025802612304688, 2.131096601486206, 2.3596129417419434, 2.5881290435791016, 2.816645622253418, 3.045161724090576, 3.2736780643463135, 3.502194404602051, 3.730710744857788, 3.9592270851135254, 4.187743186950684, 4.416259765625, 4.644775867462158, 4.873291969299316, 5.101808547973633, 5.330325126647949, 5.558841228485107, 5.787357807159424, 6.015873908996582, 6.244390487670898, 6.472906589508057, 6.701422691345215, 6.929939270019531, 7.1584553718566895]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 16.0, 22.0, 27.0, 25.0, 44.0, 48.0, 71.0, 92.0, 138.0, 205.0, 284.0, 489.0, 928.0, 1726.0, 3564.0, 8578.0, 25818.0, 124598.0, 3425362.0, 521178.0, 54047.0, 14892.0, 5939.0, 2662.0, 1412.0, 810.0, 461.0, 269.0, 187.0, 107.0, 75.0, 60.0, 32.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-4.1796875, -4.071868896484375, -3.96405029296875, -3.856231689453125, -3.7484130859375, -3.640594482421875, -3.53277587890625, -3.424957275390625, -3.317138671875, -3.209320068359375, -3.10150146484375, -2.993682861328125, -2.8858642578125, -2.778045654296875, -2.67022705078125, -2.562408447265625, -2.45458984375, -2.346771240234375, -2.23895263671875, -2.131134033203125, -2.0233154296875, -1.915496826171875, -1.80767822265625, -1.699859619140625, -1.592041015625, -1.484222412109375, -1.37640380859375, -1.268585205078125, -1.1607666015625, -1.052947998046875, -0.94512939453125, -0.837310791015625, -0.7294921875, -0.621673583984375, -0.51385498046875, -0.406036376953125, -0.2982177734375, -0.190399169921875, -0.08258056640625, 0.025238037109375, 0.133056640625, 0.240875244140625, 0.34869384765625, 0.456512451171875, 0.5643310546875, 0.672149658203125, 0.77996826171875, 0.887786865234375, 0.99560546875, 1.103424072265625, 1.21124267578125, 1.319061279296875, 1.4268798828125, 1.534698486328125, 1.64251708984375, 1.750335693359375, 1.858154296875, 1.965972900390625, 2.07379150390625, 2.181610107421875, 2.2894287109375, 2.397247314453125, 2.50506591796875, 2.612884521484375, 2.720703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 3.0, 9.0, 8.0, 17.0, 24.0, 24.0, 32.0, 35.0, 33.0, 43.0, 43.0, 56.0, 51.0, 64.0, 72.0, 57.0, 57.0, 50.0, 54.0, 39.0, 40.0, 34.0, 36.0, 28.0, 20.0, 14.0, 14.0, 9.0, 5.0, 10.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.51220703125, -0.4975318908691406, -0.48285675048828125, -0.4681816101074219, -0.4535064697265625, -0.4388313293457031, -0.42415618896484375, -0.4094810485839844, -0.394805908203125, -0.3801307678222656, -0.36545562744140625, -0.3507804870605469, -0.3361053466796875, -0.3214302062988281, -0.30675506591796875, -0.2920799255371094, -0.27740478515625, -0.2627296447753906, -0.24805450439453125, -0.23337936401367188, -0.2187042236328125, -0.20402908325195312, -0.18935394287109375, -0.17467880249023438, -0.160003662109375, -0.14532852172851562, -0.13065338134765625, -0.11597824096679688, -0.1013031005859375, -0.08662796020507812, -0.07195281982421875, -0.057277679443359375, -0.0426025390625, -0.027927398681640625, -0.01325225830078125, 0.001422882080078125, 0.0160980224609375, 0.030773162841796875, 0.04544830322265625, 0.060123443603515625, 0.074798583984375, 0.08947372436523438, 0.10414886474609375, 0.11882400512695312, 0.1334991455078125, 0.14817428588867188, 0.16284942626953125, 0.17752456665039062, 0.19219970703125, 0.20687484741210938, 0.22154998779296875, 0.23622512817382812, 0.2509002685546875, 0.2655754089355469, 0.28025054931640625, 0.2949256896972656, 0.309600830078125, 0.3242759704589844, 0.33895111083984375, 0.3536262512207031, 0.3683013916015625, 0.3829765319824219, 0.39765167236328125, 0.4123268127441406, 0.427001953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 7.0, 15.0, 17.0, 15.0, 29.0, 19.0, 39.0, 50.0, 71.0, 102.0, 130.0, 222.0, 307.0, 708.0, 2132.0, 12830.0, 424871.0, 3719186.0, 27894.0, 3510.0, 935.0, 406.0, 221.0, 155.0, 81.0, 72.0, 65.0, 39.0, 38.0, 34.0, 17.0, 13.0, 10.0, 12.0, 8.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.5859375, -8.3609619140625, -8.135986328125, -7.9110107421875, -7.68603515625, -7.4610595703125, -7.236083984375, -7.0111083984375, -6.7861328125, -6.5611572265625, -6.336181640625, -6.1112060546875, -5.88623046875, -5.6612548828125, -5.436279296875, -5.2113037109375, -4.986328125, -4.7613525390625, -4.536376953125, -4.3114013671875, -4.08642578125, -3.8614501953125, -3.636474609375, -3.4114990234375, -3.1865234375, -2.9615478515625, -2.736572265625, -2.5115966796875, -2.28662109375, -2.0616455078125, -1.836669921875, -1.6116943359375, -1.38671875, -1.1617431640625, -0.936767578125, -0.7117919921875, -0.48681640625, -0.2618408203125, -0.036865234375, 0.1881103515625, 0.4130859375, 0.6380615234375, 0.863037109375, 1.0880126953125, 1.31298828125, 1.5379638671875, 1.762939453125, 1.9879150390625, 2.212890625, 2.4378662109375, 2.662841796875, 2.8878173828125, 3.11279296875, 3.3377685546875, 3.562744140625, 3.7877197265625, 4.0126953125, 4.2376708984375, 4.462646484375, 4.6876220703125, 4.91259765625, 5.1375732421875, 5.362548828125, 5.5875244140625, 5.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 26.0, 48.0, 116.0, 610.0, 2649.0, 459.0, 94.0, 38.0, 14.0, 10.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.9769287109375, -3.887451171875, -3.7979736328125, -3.70849609375, -3.6190185546875, -3.529541015625, -3.4400634765625, -3.3505859375, -3.2611083984375, -3.171630859375, -3.0821533203125, -2.99267578125, -2.9031982421875, -2.813720703125, -2.7242431640625, -2.634765625, -2.5452880859375, -2.455810546875, -2.3663330078125, -2.27685546875, -2.1873779296875, -2.097900390625, -2.0084228515625, -1.9189453125, -1.8294677734375, -1.739990234375, -1.6505126953125, -1.56103515625, -1.4715576171875, -1.382080078125, -1.2926025390625, -1.203125, -1.1136474609375, -1.024169921875, -0.9346923828125, -0.84521484375, -0.7557373046875, -0.666259765625, -0.5767822265625, -0.4873046875, -0.3978271484375, -0.308349609375, -0.2188720703125, -0.12939453125, -0.0399169921875, 0.049560546875, 0.1390380859375, 0.228515625, 0.3179931640625, 0.407470703125, 0.4969482421875, 0.58642578125, 0.6759033203125, 0.765380859375, 0.8548583984375, 0.9443359375, 1.0338134765625, 1.123291015625, 1.2127685546875, 1.30224609375, 1.3917236328125, 1.481201171875, 1.5706787109375, 1.66015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 42.0, 58.0, 90.0, 129.0, 169.0, 170.0, 123.0, 62.0, 50.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-10.343038558959961, -10.069808959960938, -9.796579360961914, -9.52334976196289, -9.25011920928955, -8.976889610290527, -8.703660011291504, -8.43043041229248, -8.157200813293457, -7.883971214294434, -7.610741138458252, -7.3375115394592285, -7.064281940460205, -6.791051864624023, -6.517822265625, -6.244592666625977, -5.971362590789795, -5.6981329917907715, -5.42490291595459, -5.151673316955566, -4.878443717956543, -4.6052141189575195, -4.331984043121338, -4.0587544441223145, -3.785524606704712, -3.5122947692871094, -3.239065170288086, -2.9658353328704834, -2.692605495452881, -2.4193758964538574, -2.146146059036255, -1.872916340827942, -1.5996861457824707, -1.3264564275741577, -1.0532267093658447, -0.7799968719482422, -0.5067671537399292, -0.2335374355316162, 0.03969240188598633, 0.3129221200942993, 0.5861518383026123, 0.8593815565109253, 1.1326112747192383, 1.4058411121368408, 1.6790708303451538, 1.9523005485534668, 2.2255303859710693, 2.498760223388672, 2.7719898223876953, 3.045219659805298, 3.3184492588043213, 3.591679096221924, 3.8649086952209473, 4.138138771057129, 4.411368370056152, 4.684597969055176, 4.957827568054199, 5.231057167053223, 5.504287242889404, 5.777516841888428, 6.050746440887451, 6.323976516723633, 6.597206115722656, 6.87043571472168, 7.143665790557861]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 11.0, 12.0, 22.0, 26.0, 58.0, 74.0, 65.0, 95.0, 96.0, 92.0, 76.0, 80.0, 72.0, 62.0, 44.0, 31.0, 17.0, 20.0, 14.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.705615043640137, -8.498294830322266, -8.290974617004395, -8.083654403686523, -7.876333713531494, -7.669013500213623, -7.461693286895752, -7.254373073577881, -7.047052383422852, -6.8397321701049805, -6.632411956787109, -6.425091743469238, -6.217771053314209, -6.010450839996338, -5.803130626678467, -5.595810413360596, -5.388490200042725, -5.1811699867248535, -4.973849773406982, -4.766529083251953, -4.559208869934082, -4.351888656616211, -4.14456844329834, -3.9372482299804688, -3.7299277782440186, -3.5226075649261475, -3.3152871131896973, -3.107966899871826, -2.900646686553955, -2.693326234817505, -2.486006021499634, -2.2786855697631836, -2.0713658332824707, -1.86404550075531, -1.6567251682281494, -1.4494049549102783, -1.2420846223831177, -1.034764289855957, -0.8274440765380859, -0.6201237440109253, -0.41280341148376465, -0.2054831087589264, 0.0018371939659118652, 0.20915746688842773, 0.4164777994155884, 0.623798131942749, 0.8311183452606201, 1.0384386777877808, 1.2457590103149414, 1.453079342842102, 1.6603996753692627, 1.8677198886871338, 2.075040340423584, 2.282360553741455, 2.489680767059326, 2.6970009803771973, 2.9043214321136475, 3.1116416454315186, 3.3189620971679688, 3.52628231048584, 3.733602523803711, 3.940922975540161, 4.148242950439453, 4.355563640594482, 4.5628838539123535]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 6.0, 8.0, 15.0, 38.0, 55.0, 78.0, 108.0, 156.0, 277.0, 415.0, 878.0, 1891.0, 4824.0, 16099.0, 67042.0, 416978.0, 442629.0, 71200.0, 16810.0, 4984.0, 1952.0, 887.0, 443.0, 247.0, 196.0, 103.0, 69.0, 50.0, 38.0, 23.0, 15.0, 14.0, 10.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.400146484375, -3.29052734375, -3.180908203125, -3.0712890625, -2.961669921875, -2.85205078125, -2.742431640625, -2.6328125, -2.523193359375, -2.41357421875, -2.303955078125, -2.1943359375, -2.084716796875, -1.97509765625, -1.865478515625, -1.755859375, -1.646240234375, -1.53662109375, -1.427001953125, -1.3173828125, -1.207763671875, -1.09814453125, -0.988525390625, -0.87890625, -0.769287109375, -0.65966796875, -0.550048828125, -0.4404296875, -0.330810546875, -0.22119140625, -0.111572265625, -0.001953125, 0.107666015625, 0.21728515625, 0.326904296875, 0.4365234375, 0.546142578125, 0.65576171875, 0.765380859375, 0.875, 0.984619140625, 1.09423828125, 1.203857421875, 1.3134765625, 1.423095703125, 1.53271484375, 1.642333984375, 1.751953125, 1.861572265625, 1.97119140625, 2.080810546875, 2.1904296875, 2.300048828125, 2.40966796875, 2.519287109375, 2.62890625, 2.738525390625, 2.84814453125, 2.957763671875, 3.0673828125, 3.177001953125, 3.28662109375, 3.396240234375, 3.505859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 14.0, 13.0, 30.0, 33.0, 38.0, 37.0, 68.0, 66.0, 65.0, 72.0, 87.0, 72.0, 72.0, 68.0, 54.0, 45.0, 42.0, 34.0, 17.0, 16.0, 14.0, 16.0, 6.0, 3.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7314453125, -0.712005615234375, -0.69256591796875, -0.673126220703125, -0.6536865234375, -0.634246826171875, -0.61480712890625, -0.595367431640625, -0.575927734375, -0.556488037109375, -0.53704833984375, -0.517608642578125, -0.4981689453125, -0.478729248046875, -0.45928955078125, -0.439849853515625, -0.42041015625, -0.400970458984375, -0.38153076171875, -0.362091064453125, -0.3426513671875, -0.323211669921875, -0.30377197265625, -0.284332275390625, -0.264892578125, -0.245452880859375, -0.22601318359375, -0.206573486328125, -0.1871337890625, -0.167694091796875, -0.14825439453125, -0.128814697265625, -0.109375, -0.089935302734375, -0.07049560546875, -0.051055908203125, -0.0316162109375, -0.012176513671875, 0.00726318359375, 0.026702880859375, 0.046142578125, 0.065582275390625, 0.08502197265625, 0.104461669921875, 0.1239013671875, 0.143341064453125, 0.16278076171875, 0.182220458984375, 0.20166015625, 0.221099853515625, 0.24053955078125, 0.259979248046875, 0.2794189453125, 0.298858642578125, 0.31829833984375, 0.337738037109375, 0.357177734375, 0.376617431640625, 0.39605712890625, 0.415496826171875, 0.4349365234375, 0.454376220703125, 0.47381591796875, 0.493255615234375, 0.5126953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 10.0, 22.0, 25.0, 39.0, 51.0, 76.0, 87.0, 150.0, 220.0, 343.0, 600.0, 1108.0, 2296.0, 4958.0, 10947.0, 26471.0, 68342.0, 208686.0, 425368.0, 190796.0, 63717.0, 24539.0, 10376.0, 4540.0, 2085.0, 1027.0, 587.0, 315.0, 236.0, 144.0, 106.0, 71.0, 61.0, 29.0, 22.0, 21.0, 12.0, 10.0, 8.0, 4.0, 4.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.48919677734375, -1.4403076171875, -1.39141845703125, -1.342529296875, -1.29364013671875, -1.2447509765625, -1.19586181640625, -1.14697265625, -1.09808349609375, -1.0491943359375, -1.00030517578125, -0.951416015625, -0.90252685546875, -0.8536376953125, -0.80474853515625, -0.755859375, -0.70697021484375, -0.6580810546875, -0.60919189453125, -0.560302734375, -0.51141357421875, -0.4625244140625, -0.41363525390625, -0.36474609375, -0.31585693359375, -0.2669677734375, -0.21807861328125, -0.169189453125, -0.12030029296875, -0.0714111328125, -0.02252197265625, 0.0263671875, 0.07525634765625, 0.1241455078125, 0.17303466796875, 0.221923828125, 0.27081298828125, 0.3197021484375, 0.36859130859375, 0.41748046875, 0.46636962890625, 0.5152587890625, 0.56414794921875, 0.613037109375, 0.66192626953125, 0.7108154296875, 0.75970458984375, 0.80859375, 0.85748291015625, 0.9063720703125, 0.95526123046875, 1.004150390625, 1.05303955078125, 1.1019287109375, 1.15081787109375, 1.19970703125, 1.24859619140625, 1.2974853515625, 1.34637451171875, 1.395263671875, 1.44415283203125, 1.4930419921875, 1.54193115234375, 1.5908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 11.0, 13.0, 17.0, 16.0, 14.0, 24.0, 13.0, 29.0, 26.0, 31.0, 36.0, 28.0, 39.0, 47.0, 27.0, 34.0, 51.0, 32.0, 55.0, 36.0, 39.0, 43.0, 44.0, 28.0, 28.0, 16.0, 20.0, 34.0, 23.0, 21.0, 10.0, 14.0, 18.0, 8.0, 5.0, 6.0, 11.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.4296875, -1.388214111328125, -1.34674072265625, -1.305267333984375, -1.2637939453125, -1.222320556640625, -1.18084716796875, -1.139373779296875, -1.097900390625, -1.056427001953125, -1.01495361328125, -0.973480224609375, -0.9320068359375, -0.890533447265625, -0.84906005859375, -0.807586669921875, -0.76611328125, -0.724639892578125, -0.68316650390625, -0.641693115234375, -0.6002197265625, -0.558746337890625, -0.51727294921875, -0.475799560546875, -0.434326171875, -0.392852783203125, -0.35137939453125, -0.309906005859375, -0.2684326171875, -0.226959228515625, -0.18548583984375, -0.144012451171875, -0.1025390625, -0.061065673828125, -0.01959228515625, 0.021881103515625, 0.0633544921875, 0.104827880859375, 0.14630126953125, 0.187774658203125, 0.229248046875, 0.270721435546875, 0.31219482421875, 0.353668212890625, 0.3951416015625, 0.436614990234375, 0.47808837890625, 0.519561767578125, 0.56103515625, 0.602508544921875, 0.64398193359375, 0.685455322265625, 0.7269287109375, 0.768402099609375, 0.80987548828125, 0.851348876953125, 0.892822265625, 0.934295654296875, 0.97576904296875, 1.017242431640625, 1.0587158203125, 1.100189208984375, 1.14166259765625, 1.183135986328125, 1.224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 27.0, 39.0, 52.0, 83.0, 118.0, 170.0, 294.0, 506.0, 1049.0, 2315.0, 5887.0, 20013.0, 98126.0, 737430.0, 144588.0, 25357.0, 7203.0, 2544.0, 1225.0, 635.0, 298.0, 193.0, 108.0, 74.0, 51.0, 37.0, 29.0, 12.0, 15.0, 10.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.1905670166015625, -1.145782470703125, -1.1009979248046875, -1.05621337890625, -1.0114288330078125, -0.966644287109375, -0.9218597412109375, -0.8770751953125, -0.8322906494140625, -0.787506103515625, -0.7427215576171875, -0.69793701171875, -0.6531524658203125, -0.608367919921875, -0.5635833740234375, -0.518798828125, -0.4740142822265625, -0.429229736328125, -0.3844451904296875, -0.33966064453125, -0.2948760986328125, -0.250091552734375, -0.2053070068359375, -0.1605224609375, -0.1157379150390625, -0.070953369140625, -0.0261688232421875, 0.01861572265625, 0.0634002685546875, 0.108184814453125, 0.1529693603515625, 0.19775390625, 0.2425384521484375, 0.287322998046875, 0.3321075439453125, 0.37689208984375, 0.4216766357421875, 0.466461181640625, 0.5112457275390625, 0.5560302734375, 0.6008148193359375, 0.645599365234375, 0.6903839111328125, 0.73516845703125, 0.7799530029296875, 0.824737548828125, 0.8695220947265625, 0.914306640625, 0.9590911865234375, 1.003875732421875, 1.0486602783203125, 1.09344482421875, 1.1382293701171875, 1.183013916015625, 1.2277984619140625, 1.2725830078125, 1.3173675537109375, 1.362152099609375, 1.4069366455078125, 1.45172119140625, 1.4965057373046875, 1.541290283203125, 1.5860748291015625, 1.630859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 7.0, 10.0, 18.0, 10.0, 11.0, 26.0, 19.0, 49.0, 139.0, 353.0, 186.0, 70.0, 41.0, 16.0, 16.0, 9.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025177001953125, -0.00024109333753585815, -0.0002304166555404663, -0.00021973997354507446, -0.00020906329154968262, -0.00019838660955429077, -0.00018770992755889893, -0.00017703324556350708, -0.00016635656356811523, -0.0001556798815727234, -0.00014500319957733154, -0.0001343265175819397, -0.00012364983558654785, -0.000112973153591156, -0.00010229647159576416, -9.161978960037231e-05, -8.094310760498047e-05, -7.026642560958862e-05, -5.958974361419678e-05, -4.891306161880493e-05, -3.8236379623413086e-05, -2.755969762802124e-05, -1.6883015632629395e-05, -6.206333637237549e-06, 4.470348358154297e-06, 1.5147030353546143e-05, 2.5823712348937988e-05, 3.6500394344329834e-05, 4.717707633972168e-05, 5.7853758335113525e-05, 6.853044033050537e-05, 7.920712232589722e-05, 8.988380432128906e-05, 0.00010056048631668091, 0.00011123716831207275, 0.0001219138503074646, 0.00013259053230285645, 0.0001432672142982483, 0.00015394389629364014, 0.00016462057828903198, 0.00017529726028442383, 0.00018597394227981567, 0.00019665062427520752, 0.00020732730627059937, 0.0002180039882659912, 0.00022868067026138306, 0.0002393573522567749, 0.00025003403425216675, 0.0002607107162475586, 0.00027138739824295044, 0.0002820640802383423, 0.00029274076223373413, 0.000303417444229126, 0.0003140941262245178, 0.00032477080821990967, 0.0003354474902153015, 0.00034612417221069336, 0.0003568008542060852, 0.00036747753620147705, 0.0003781542181968689, 0.00038883090019226074, 0.0003995075821876526, 0.00041018426418304443, 0.0004208609461784363, 0.0004315376281738281]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 8.0, 17.0, 21.0, 21.0, 44.0, 53.0, 123.0, 172.0, 304.0, 604.0, 1279.0, 3312.0, 9837.0, 38258.0, 388444.0, 542189.0, 45728.0, 11570.0, 3696.0, 1382.0, 661.0, 324.0, 216.0, 108.0, 67.0, 43.0, 24.0, 18.0, 12.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.729949951171875, -1.68060302734375, -1.631256103515625, -1.5819091796875, -1.532562255859375, -1.48321533203125, -1.433868408203125, -1.384521484375, -1.335174560546875, -1.28582763671875, -1.236480712890625, -1.1871337890625, -1.137786865234375, -1.08843994140625, -1.039093017578125, -0.98974609375, -0.940399169921875, -0.89105224609375, -0.841705322265625, -0.7923583984375, -0.743011474609375, -0.69366455078125, -0.644317626953125, -0.594970703125, -0.545623779296875, -0.49627685546875, -0.446929931640625, -0.3975830078125, -0.348236083984375, -0.29888916015625, -0.249542236328125, -0.2001953125, -0.150848388671875, -0.10150146484375, -0.052154541015625, -0.0028076171875, 0.046539306640625, 0.09588623046875, 0.145233154296875, 0.194580078125, 0.243927001953125, 0.29327392578125, 0.342620849609375, 0.3919677734375, 0.441314697265625, 0.49066162109375, 0.540008544921875, 0.58935546875, 0.638702392578125, 0.68804931640625, 0.737396240234375, 0.7867431640625, 0.836090087890625, 0.88543701171875, 0.934783935546875, 0.984130859375, 1.033477783203125, 1.08282470703125, 1.132171630859375, 1.1815185546875, 1.230865478515625, 1.28021240234375, 1.329559326171875, 1.37890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 11.0, 11.0, 15.0, 32.0, 35.0, 57.0, 101.0, 161.0, 164.0, 140.0, 93.0, 37.0, 17.0, 17.0, 18.0, 10.0, 11.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.4873046875, -1.4513168334960938, -1.4153289794921875, -1.3793411254882812, -1.343353271484375, -1.3073654174804688, -1.2713775634765625, -1.2353897094726562, -1.19940185546875, -1.1634140014648438, -1.1274261474609375, -1.0914382934570312, -1.055450439453125, -1.0194625854492188, -0.9834747314453125, -0.9474868774414062, -0.9114990234375, -0.8755111694335938, -0.8395233154296875, -0.8035354614257812, -0.767547607421875, -0.7315597534179688, -0.6955718994140625, -0.6595840454101562, -0.62359619140625, -0.5876083374023438, -0.5516204833984375, -0.5156326293945312, -0.479644775390625, -0.44365692138671875, -0.4076690673828125, -0.37168121337890625, -0.335693359375, -0.29970550537109375, -0.2637176513671875, -0.22772979736328125, -0.191741943359375, -0.15575408935546875, -0.1197662353515625, -0.08377838134765625, -0.04779052734375, -0.01180267333984375, 0.0241851806640625, 0.06017303466796875, 0.096160888671875, 0.13214874267578125, 0.1681365966796875, 0.20412445068359375, 0.2401123046875, 0.27610015869140625, 0.3120880126953125, 0.34807586669921875, 0.384063720703125, 0.42005157470703125, 0.4560394287109375, 0.49202728271484375, 0.52801513671875, 0.5640029907226562, 0.5999908447265625, 0.6359786987304688, 0.671966552734375, 0.7079544067382812, 0.7439422607421875, 0.7799301147460938, 0.81591796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 12.0, 24.0, 47.0, 86.0, 121.0, 149.0, 160.0, 142.0, 106.0, 72.0, 40.0, 25.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.285001754760742, -25.67831039428711, -25.07162094116211, -24.46493148803711, -23.858240127563477, -23.251548767089844, -22.644859313964844, -22.038169860839844, -21.43147850036621, -20.824787139892578, -20.218097686767578, -19.611408233642578, -19.004716873168945, -18.398025512695312, -17.791336059570312, -17.184646606445312, -16.57795524597168, -15.971264839172363, -15.364574432373047, -14.75788402557373, -14.151193618774414, -13.544503211975098, -12.937812805175781, -12.331122398376465, -11.724431991577148, -11.117741584777832, -10.511051177978516, -9.9043607711792, -9.297670364379883, -8.690979957580566, -8.08428955078125, -7.477599143981934, -6.87091064453125, -6.264220237731934, -5.657529830932617, -5.050839424133301, -4.444149017333984, -3.837458610534668, -3.2307682037353516, -2.624077796936035, -2.0173873901367188, -1.4106969833374023, -0.8040065765380859, -0.19731616973876953, 0.4093742370605469, 1.0160646438598633, 1.6227550506591797, 2.229445457458496, 2.8361358642578125, 3.442826271057129, 4.049516677856445, 4.656207084655762, 5.262897491455078, 5.8695878982543945, 6.476278305053711, 7.082968711853027, 7.689659118652344, 8.29634952545166, 8.903039932250977, 9.509730339050293, 10.11642074584961, 10.723111152648926, 11.329801559448242, 11.936491966247559, 12.543182373046875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 7.0, 4.0, 8.0, 14.0, 20.0, 18.0, 19.0, 34.0, 27.0, 27.0, 23.0, 40.0, 19.0, 44.0, 38.0, 41.0, 45.0, 45.0, 36.0, 36.0, 35.0, 37.0, 36.0, 42.0, 23.0, 34.0, 28.0, 29.0, 25.0, 24.0, 11.0, 15.0, 17.0, 9.0, 15.0, 9.0, 8.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.608931064605713, -6.402459621429443, -6.195988178253174, -5.989516735076904, -5.783045291900635, -5.576573848724365, -5.370102405548096, -5.163630962371826, -4.957159519195557, -4.750688076019287, -4.544216632843018, -4.337745189666748, -4.1312737464904785, -3.924802303314209, -3.7183308601379395, -3.51185941696167, -3.3053879737854004, -3.098916530609131, -2.8924450874328613, -2.685973644256592, -2.4795022010803223, -2.2730307579040527, -2.066559314727783, -1.8600878715515137, -1.6536164283752441, -1.4471449851989746, -1.240673542022705, -1.0342020988464355, -0.827730655670166, -0.6212592124938965, -0.41478776931762695, -0.20831632614135742, -0.0018453598022460938, 0.20462608337402344, 0.41109752655029297, 0.6175689697265625, 0.824040412902832, 1.0305118560791016, 1.236983299255371, 1.4434547424316406, 1.6499261856079102, 1.8563976287841797, 2.062869071960449, 2.2693405151367188, 2.4758119583129883, 2.682283401489258, 2.8887548446655273, 3.095226287841797, 3.3016977310180664, 3.508169174194336, 3.7146406173706055, 3.921112060546875, 4.1275835037231445, 4.334054946899414, 4.540526390075684, 4.746997833251953, 4.953469276428223, 5.159940719604492, 5.366412162780762, 5.572883605957031, 5.779355049133301, 5.98582649230957, 6.19229793548584, 6.398769378662109, 6.605240821838379]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 17.0, 18.0, 21.0, 39.0, 64.0, 73.0, 121.0, 164.0, 270.0, 423.0, 697.0, 1373.0, 2965.0, 7949.0, 28749.0, 277955.0, 3763264.0, 84298.0, 15932.0, 5110.0, 2139.0, 1099.0, 580.0, 336.0, 193.0, 115.0, 98.0, 56.0, 38.0, 16.0, 18.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3125, -6.1385498046875, -5.964599609375, -5.7906494140625, -5.61669921875, -5.4427490234375, -5.268798828125, -5.0948486328125, -4.9208984375, -4.7469482421875, -4.572998046875, -4.3990478515625, -4.22509765625, -4.0511474609375, -3.877197265625, -3.7032470703125, -3.529296875, -3.3553466796875, -3.181396484375, -3.0074462890625, -2.83349609375, -2.6595458984375, -2.485595703125, -2.3116455078125, -2.1376953125, -1.9637451171875, -1.789794921875, -1.6158447265625, -1.44189453125, -1.2679443359375, -1.093994140625, -0.9200439453125, -0.74609375, -0.5721435546875, -0.398193359375, -0.2242431640625, -0.05029296875, 0.1236572265625, 0.297607421875, 0.4715576171875, 0.6455078125, 0.8194580078125, 0.993408203125, 1.1673583984375, 1.34130859375, 1.5152587890625, 1.689208984375, 1.8631591796875, 2.037109375, 2.2110595703125, 2.385009765625, 2.5589599609375, 2.73291015625, 2.9068603515625, 3.080810546875, 3.2547607421875, 3.4287109375, 3.6026611328125, 3.776611328125, 3.9505615234375, 4.12451171875, 4.2984619140625, 4.472412109375, 4.6463623046875, 4.8203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 18.0, 32.0, 31.0, 32.0, 42.0, 57.0, 61.0, 68.0, 80.0, 83.0, 76.0, 70.0, 58.0, 64.0, 50.0, 41.0, 31.0, 27.0, 21.0, 15.0, 5.0, 13.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79345703125, -0.7735137939453125, -0.753570556640625, -0.7336273193359375, -0.71368408203125, -0.6937408447265625, -0.673797607421875, -0.6538543701171875, -0.6339111328125, -0.6139678955078125, -0.594024658203125, -0.5740814208984375, -0.55413818359375, -0.5341949462890625, -0.514251708984375, -0.4943084716796875, -0.474365234375, -0.4544219970703125, -0.434478759765625, -0.4145355224609375, -0.39459228515625, -0.3746490478515625, -0.354705810546875, -0.3347625732421875, -0.3148193359375, -0.2948760986328125, -0.274932861328125, -0.2549896240234375, -0.23504638671875, -0.2151031494140625, -0.195159912109375, -0.1752166748046875, -0.1552734375, -0.1353302001953125, -0.115386962890625, -0.0954437255859375, -0.07550048828125, -0.0555572509765625, -0.035614013671875, -0.0156707763671875, 0.0042724609375, 0.0242156982421875, 0.044158935546875, 0.0641021728515625, 0.08404541015625, 0.1039886474609375, 0.123931884765625, 0.1438751220703125, 0.163818359375, 0.1837615966796875, 0.203704833984375, 0.2236480712890625, 0.24359130859375, 0.2635345458984375, 0.283477783203125, 0.3034210205078125, 0.3233642578125, 0.3433074951171875, 0.363250732421875, 0.3831939697265625, 0.40313720703125, 0.4230804443359375, 0.443023681640625, 0.4629669189453125, 0.48291015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 10.0, 6.0, 13.0, 13.0, 12.0, 26.0, 27.0, 55.0, 61.0, 71.0, 115.0, 186.0, 236.0, 489.0, 957.0, 2785.0, 10662.0, 73824.0, 3807163.0, 268394.0, 21614.0, 4557.0, 1399.0, 612.0, 344.0, 198.0, 111.0, 92.0, 68.0, 39.0, 33.0, 35.0, 14.0, 17.0, 9.0, 6.0, 12.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.11004638671875, -5.9232177734375, -5.73638916015625, -5.549560546875, -5.36273193359375, -5.1759033203125, -4.98907470703125, -4.80224609375, -4.61541748046875, -4.4285888671875, -4.24176025390625, -4.054931640625, -3.86810302734375, -3.6812744140625, -3.49444580078125, -3.3076171875, -3.12078857421875, -2.9339599609375, -2.74713134765625, -2.560302734375, -2.37347412109375, -2.1866455078125, -1.99981689453125, -1.81298828125, -1.62615966796875, -1.4393310546875, -1.25250244140625, -1.065673828125, -0.87884521484375, -0.6920166015625, -0.50518798828125, -0.318359375, -0.13153076171875, 0.0552978515625, 0.24212646484375, 0.428955078125, 0.61578369140625, 0.8026123046875, 0.98944091796875, 1.17626953125, 1.36309814453125, 1.5499267578125, 1.73675537109375, 1.923583984375, 2.11041259765625, 2.2972412109375, 2.48406982421875, 2.6708984375, 2.85772705078125, 3.0445556640625, 3.23138427734375, 3.418212890625, 3.60504150390625, 3.7918701171875, 3.97869873046875, 4.16552734375, 4.35235595703125, 4.5391845703125, 4.72601318359375, 4.912841796875, 5.09967041015625, 5.2864990234375, 5.47332763671875, 5.66015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 7.0, 5.0, 11.0, 17.0, 24.0, 32.0, 49.0, 135.0, 271.0, 903.0, 1891.0, 350.0, 158.0, 74.0, 41.0, 26.0, 27.0, 18.0, 11.0, 10.0, 6.0, 5.0, 1.0, 4.0, 2.0], "bins": [-2.365234375, -2.3171463012695312, -2.2690582275390625, -2.2209701538085938, -2.172882080078125, -2.1247940063476562, -2.0767059326171875, -2.0286178588867188, -1.98052978515625, -1.9324417114257812, -1.8843536376953125, -1.8362655639648438, -1.788177490234375, -1.7400894165039062, -1.6920013427734375, -1.6439132690429688, -1.5958251953125, -1.5477371215820312, -1.4996490478515625, -1.4515609741210938, -1.403472900390625, -1.3553848266601562, -1.3072967529296875, -1.2592086791992188, -1.21112060546875, -1.1630325317382812, -1.1149444580078125, -1.0668563842773438, -1.018768310546875, -0.9706802368164062, -0.9225921630859375, -0.8745040893554688, -0.826416015625, -0.7783279418945312, -0.7302398681640625, -0.6821517944335938, -0.634063720703125, -0.5859756469726562, -0.5378875732421875, -0.48979949951171875, -0.44171142578125, -0.39362335205078125, -0.3455352783203125, -0.29744720458984375, -0.249359130859375, -0.20127105712890625, -0.1531829833984375, -0.10509490966796875, -0.0570068359375, -0.00891876220703125, 0.0391693115234375, 0.08725738525390625, 0.135345458984375, 0.18343353271484375, 0.2315216064453125, 0.27960968017578125, 0.32769775390625, 0.37578582763671875, 0.4238739013671875, 0.47196197509765625, 0.520050048828125, 0.5681381225585938, 0.6162261962890625, 0.6643142700195312, 0.71240234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 16.0, 23.0, 69.0, 83.0, 164.0, 194.0, 168.0, 119.0, 63.0, 30.0, 25.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.199235916137695, -9.905003547668457, -9.610770225524902, -9.316537857055664, -9.022305488586426, -8.728072166442871, -8.433839797973633, -8.139606475830078, -7.84537410736084, -7.551141262054443, -7.256908893585205, -6.962676048278809, -6.668443202972412, -6.374210357666016, -6.079977989196777, -5.785745143890381, -5.491512775421143, -5.197279930114746, -4.903047561645508, -4.608814716339111, -4.314581871032715, -4.020349502563477, -3.72611665725708, -3.4318838119506836, -3.137651205062866, -2.843418598175049, -2.5491857528686523, -2.254953145980835, -1.960720419883728, -1.666487693786621, -1.3722550868988037, -1.0780222415924072, -0.7837896347045898, -0.4895569384098053, -0.19532424211502075, 0.0989084243774414, 0.39314115047454834, 0.6873738765716553, 0.9816064834594727, 1.2758393287658691, 1.5700719356536865, 1.8643046617507935, 2.1585373878479004, 2.4527699947357178, 2.747002601623535, 3.0412354469299316, 3.335468053817749, 3.6297008991241455, 3.923933506011963, 4.218166351318359, 4.512398719787598, 4.806631565093994, 5.100864410400391, 5.395096778869629, 5.689329624176025, 5.983562469482422, 6.27779483795166, 6.572027683258057, 6.866260051727295, 7.160492897033691, 7.454725742340088, 7.748958587646484, 8.043190956115723, 8.337423324584961, 8.631656646728516]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 21.0, 22.0, 32.0, 32.0, 43.0, 53.0, 54.0, 57.0, 58.0, 65.0, 73.0, 67.0, 65.0, 82.0, 73.0, 38.0, 34.0, 25.0, 24.0, 24.0, 16.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.457943916320801, -5.303596019744873, -5.149248123168945, -4.994900226593018, -4.84055233001709, -4.68620491027832, -4.531857013702393, -4.377509117126465, -4.223161220550537, -4.068813323974609, -3.9144654273986816, -3.760117769241333, -3.6057698726654053, -3.4514219760894775, -3.297074317932129, -3.142726421356201, -2.9883785247802734, -2.8340306282043457, -2.679682731628418, -2.5253350734710693, -2.3709871768951416, -2.216639280319214, -2.0622916221618652, -1.9079437255859375, -1.7535958290100098, -1.599247932434082, -1.4449001550674438, -1.2905523777008057, -1.136204481124878, -0.981856644153595, -0.827508807182312, -0.6731610298156738, -0.5188136100769043, -0.36446577310562134, -0.21011793613433838, -0.05577009916305542, 0.09857773780822754, 0.2529255747795105, 0.40727341175079346, 0.5616211891174316, 0.7159690856933594, 0.8703169226646423, 1.0246647596359253, 1.1790125370025635, 1.3333604335784912, 1.487708330154419, 1.6420561075210571, 1.7964038848876953, 1.950751781463623, 2.105099678039551, 2.2594475746154785, 2.413795232772827, 2.568143129348755, 2.7224910259246826, 2.8768386840820312, 3.031186580657959, 3.1855344772338867, 3.3398823738098145, 3.494230270385742, 3.648577928543091, 3.8029258251190186, 3.9572737216949463, 4.111621379852295, 4.265969276428223, 4.42031717300415]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 20.0, 30.0, 52.0, 65.0, 84.0, 112.0, 177.0, 290.0, 420.0, 764.0, 1410.0, 2683.0, 5984.0, 16258.0, 50038.0, 174750.0, 453084.0, 237980.0, 68496.0, 20990.0, 7628.0, 3247.0, 1637.0, 872.0, 462.0, 305.0, 206.0, 122.0, 86.0, 63.0, 62.0, 30.0, 25.0, 19.0, 13.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.490447998046875, -2.39691162109375, -2.303375244140625, -2.2098388671875, -2.116302490234375, -2.02276611328125, -1.929229736328125, -1.835693359375, -1.742156982421875, -1.64862060546875, -1.555084228515625, -1.4615478515625, -1.368011474609375, -1.27447509765625, -1.180938720703125, -1.08740234375, -0.993865966796875, -0.90032958984375, -0.806793212890625, -0.7132568359375, -0.619720458984375, -0.52618408203125, -0.432647705078125, -0.339111328125, -0.245574951171875, -0.15203857421875, -0.058502197265625, 0.0350341796875, 0.128570556640625, 0.22210693359375, 0.315643310546875, 0.4091796875, 0.502716064453125, 0.59625244140625, 0.689788818359375, 0.7833251953125, 0.876861572265625, 0.97039794921875, 1.063934326171875, 1.157470703125, 1.251007080078125, 1.34454345703125, 1.438079833984375, 1.5316162109375, 1.625152587890625, 1.71868896484375, 1.812225341796875, 1.90576171875, 1.999298095703125, 2.09283447265625, 2.186370849609375, 2.2799072265625, 2.373443603515625, 2.46697998046875, 2.560516357421875, 2.654052734375, 2.747589111328125, 2.84112548828125, 2.934661865234375, 3.0281982421875, 3.121734619140625, 3.21527099609375, 3.308807373046875, 3.40234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 13.0, 23.0, 15.0, 43.0, 38.0, 59.0, 74.0, 73.0, 72.0, 63.0, 74.0, 72.0, 67.0, 55.0, 58.0, 35.0, 47.0, 24.0, 27.0, 14.0, 10.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7669601440429688, -0.7463226318359375, -0.7256851196289062, -0.705047607421875, -0.6844100952148438, -0.6637725830078125, -0.6431350708007812, -0.62249755859375, -0.6018600463867188, -0.5812225341796875, -0.5605850219726562, -0.539947509765625, -0.5193099975585938, -0.4986724853515625, -0.47803497314453125, -0.4573974609375, -0.43675994873046875, -0.4161224365234375, -0.39548492431640625, -0.374847412109375, -0.35420989990234375, -0.3335723876953125, -0.31293487548828125, -0.29229736328125, -0.27165985107421875, -0.2510223388671875, -0.23038482666015625, -0.209747314453125, -0.18910980224609375, -0.1684722900390625, -0.14783477783203125, -0.127197265625, -0.10655975341796875, -0.0859222412109375, -0.06528472900390625, -0.044647216796875, -0.02400970458984375, -0.0033721923828125, 0.01726531982421875, 0.03790283203125, 0.05854034423828125, 0.0791778564453125, 0.09981536865234375, 0.120452880859375, 0.14109039306640625, 0.1617279052734375, 0.18236541748046875, 0.2030029296875, 0.22364044189453125, 0.2442779541015625, 0.26491546630859375, 0.285552978515625, 0.30619049072265625, 0.3268280029296875, 0.34746551513671875, 0.36810302734375, 0.38874053955078125, 0.4093780517578125, 0.43001556396484375, 0.450653076171875, 0.47129058837890625, 0.4919281005859375, 0.5125656127929688, 0.533203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 13.0, 14.0, 22.0, 21.0, 40.0, 64.0, 62.0, 98.0, 150.0, 217.0, 359.0, 665.0, 1403.0, 4481.0, 19836.0, 118342.0, 555544.0, 285341.0, 48058.0, 9083.0, 2390.0, 968.0, 472.0, 240.0, 201.0, 110.0, 84.0, 66.0, 41.0, 36.0, 25.0, 16.0, 13.0, 9.0, 7.0, 11.0, 5.0, 7.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.20703125, -3.109100341796875, -3.01116943359375, -2.913238525390625, -2.8153076171875, -2.717376708984375, -2.61944580078125, -2.521514892578125, -2.423583984375, -2.325653076171875, -2.22772216796875, -2.129791259765625, -2.0318603515625, -1.933929443359375, -1.83599853515625, -1.738067626953125, -1.64013671875, -1.542205810546875, -1.44427490234375, -1.346343994140625, -1.2484130859375, -1.150482177734375, -1.05255126953125, -0.954620361328125, -0.856689453125, -0.758758544921875, -0.66082763671875, -0.562896728515625, -0.4649658203125, -0.367034912109375, -0.26910400390625, -0.171173095703125, -0.0732421875, 0.024688720703125, 0.12261962890625, 0.220550537109375, 0.3184814453125, 0.416412353515625, 0.51434326171875, 0.612274169921875, 0.710205078125, 0.808135986328125, 0.90606689453125, 1.003997802734375, 1.1019287109375, 1.199859619140625, 1.29779052734375, 1.395721435546875, 1.49365234375, 1.591583251953125, 1.68951416015625, 1.787445068359375, 1.8853759765625, 1.983306884765625, 2.08123779296875, 2.179168701171875, 2.277099609375, 2.375030517578125, 2.47296142578125, 2.570892333984375, 2.6688232421875, 2.766754150390625, 2.86468505859375, 2.962615966796875, 3.060546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 7.0, 11.0, 21.0, 26.0, 26.0, 40.0, 38.0, 42.0, 28.0, 55.0, 42.0, 50.0, 43.0, 46.0, 39.0, 39.0, 55.0, 50.0, 43.0, 53.0, 36.0, 27.0, 36.0, 21.0, 29.0, 12.0, 10.0, 8.0, 9.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7843475341796875, -1.723968505859375, -1.6635894775390625, -1.60321044921875, -1.5428314208984375, -1.482452392578125, -1.4220733642578125, -1.3616943359375, -1.3013153076171875, -1.240936279296875, -1.1805572509765625, -1.12017822265625, -1.0597991943359375, -0.999420166015625, -0.9390411376953125, -0.878662109375, -0.8182830810546875, -0.757904052734375, -0.6975250244140625, -0.63714599609375, -0.5767669677734375, -0.516387939453125, -0.4560089111328125, -0.3956298828125, -0.3352508544921875, -0.274871826171875, -0.2144927978515625, -0.15411376953125, -0.0937347412109375, -0.033355712890625, 0.0270233154296875, 0.08740234375, 0.1477813720703125, 0.208160400390625, 0.2685394287109375, 0.32891845703125, 0.3892974853515625, 0.449676513671875, 0.5100555419921875, 0.5704345703125, 0.6308135986328125, 0.691192626953125, 0.7515716552734375, 0.81195068359375, 0.8723297119140625, 0.932708740234375, 0.9930877685546875, 1.053466796875, 1.1138458251953125, 1.174224853515625, 1.2346038818359375, 1.29498291015625, 1.3553619384765625, 1.415740966796875, 1.4761199951171875, 1.5364990234375, 1.5968780517578125, 1.657257080078125, 1.7176361083984375, 1.77801513671875, 1.8383941650390625, 1.898773193359375, 1.9591522216796875, 2.01953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 10.0, 9.0, 18.0, 16.0, 22.0, 42.0, 55.0, 85.0, 159.0, 223.0, 392.0, 749.0, 1358.0, 2904.0, 6411.0, 16392.0, 49720.0, 189400.0, 582903.0, 136117.0, 37934.0, 13161.0, 5344.0, 2342.0, 1248.0, 623.0, 349.0, 202.0, 129.0, 70.0, 48.0, 35.0, 23.0, 12.0, 14.0, 9.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.599609375, -1.5556488037109375, -1.511688232421875, -1.4677276611328125, -1.42376708984375, -1.3798065185546875, -1.335845947265625, -1.2918853759765625, -1.2479248046875, -1.2039642333984375, -1.160003662109375, -1.1160430908203125, -1.07208251953125, -1.0281219482421875, -0.984161376953125, -0.9402008056640625, -0.896240234375, -0.8522796630859375, -0.808319091796875, -0.7643585205078125, -0.72039794921875, -0.6764373779296875, -0.632476806640625, -0.5885162353515625, -0.5445556640625, -0.5005950927734375, -0.456634521484375, -0.4126739501953125, -0.36871337890625, -0.3247528076171875, -0.280792236328125, -0.2368316650390625, -0.19287109375, -0.1489105224609375, -0.104949951171875, -0.0609893798828125, -0.01702880859375, 0.0269317626953125, 0.070892333984375, 0.1148529052734375, 0.1588134765625, 0.2027740478515625, 0.246734619140625, 0.2906951904296875, 0.33465576171875, 0.3786163330078125, 0.422576904296875, 0.4665374755859375, 0.510498046875, 0.5544586181640625, 0.598419189453125, 0.6423797607421875, 0.68634033203125, 0.7303009033203125, 0.774261474609375, 0.8182220458984375, 0.8621826171875, 0.9061431884765625, 0.950103759765625, 0.9940643310546875, 1.03802490234375, 1.0819854736328125, 1.125946044921875, 1.1699066162109375, 1.2138671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 1.0, 4.0, 7.0, 7.0, 8.0, 6.0, 21.0, 10.0, 32.0, 21.0, 27.0, 31.0, 43.0, 45.0, 85.0, 119.0, 141.0, 74.0, 80.0, 40.0, 34.0, 38.0, 24.0, 26.0, 20.0, 14.0, 13.0, 4.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021791458129882812, -0.00021151266992092133, -0.00020511075854301453, -0.00019870884716510773, -0.00019230693578720093, -0.00018590502440929413, -0.00017950311303138733, -0.00017310120165348053, -0.00016669929027557373, -0.00016029737889766693, -0.00015389546751976013, -0.00014749355614185333, -0.00014109164476394653, -0.00013468973338603973, -0.00012828782200813293, -0.00012188591063022614, -0.00011548399925231934, -0.00010908208787441254, -0.00010268017649650574, -9.627826511859894e-05, -8.987635374069214e-05, -8.347444236278534e-05, -7.707253098487854e-05, -7.067061960697174e-05, -6.426870822906494e-05, -5.786679685115814e-05, -5.146488547325134e-05, -4.5062974095344543e-05, -3.8661062717437744e-05, -3.2259151339530945e-05, -2.5857239961624146e-05, -1.9455328583717346e-05, -1.3053417205810547e-05, -6.6515058279037476e-06, -2.4959444999694824e-07, 6.152316927909851e-06, 1.255422830581665e-05, 1.895613968372345e-05, 2.535805106163025e-05, 3.175996243953705e-05, 3.816187381744385e-05, 4.456378519535065e-05, 5.0965696573257446e-05, 5.7367607951164246e-05, 6.376951932907104e-05, 7.017143070697784e-05, 7.657334208488464e-05, 8.297525346279144e-05, 8.937716484069824e-05, 9.577907621860504e-05, 0.00010218098759651184, 0.00010858289897441864, 0.00011498481035232544, 0.00012138672173023224, 0.00012778863310813904, 0.00013419054448604584, 0.00014059245586395264, 0.00014699436724185944, 0.00015339627861976624, 0.00015979818999767303, 0.00016620010137557983, 0.00017260201275348663, 0.00017900392413139343, 0.00018540583550930023, 0.00019180774688720703]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 15.0, 22.0, 51.0, 70.0, 124.0, 236.0, 376.0, 913.0, 2495.0, 10201.0, 82717.0, 820827.0, 113016.0, 12574.0, 2951.0, 935.0, 447.0, 225.0, 106.0, 67.0, 51.0, 36.0, 9.0, 16.0, 10.0, 8.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.182952880859375, -3.07879638671875, -2.974639892578125, -2.8704833984375, -2.766326904296875, -2.66217041015625, -2.558013916015625, -2.453857421875, -2.349700927734375, -2.24554443359375, -2.141387939453125, -2.0372314453125, -1.933074951171875, -1.82891845703125, -1.724761962890625, -1.62060546875, -1.516448974609375, -1.41229248046875, -1.308135986328125, -1.2039794921875, -1.099822998046875, -0.99566650390625, -0.891510009765625, -0.787353515625, -0.683197021484375, -0.57904052734375, -0.474884033203125, -0.3707275390625, -0.266571044921875, -0.16241455078125, -0.058258056640625, 0.0458984375, 0.150054931640625, 0.25421142578125, 0.358367919921875, 0.4625244140625, 0.566680908203125, 0.67083740234375, 0.774993896484375, 0.879150390625, 0.983306884765625, 1.08746337890625, 1.191619873046875, 1.2957763671875, 1.399932861328125, 1.50408935546875, 1.608245849609375, 1.71240234375, 1.816558837890625, 1.92071533203125, 2.024871826171875, 2.1290283203125, 2.233184814453125, 2.33734130859375, 2.441497802734375, 2.545654296875, 2.649810791015625, 2.75396728515625, 2.858123779296875, 2.9622802734375, 3.066436767578125, 3.17059326171875, 3.274749755859375, 3.37890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 9.0, 9.0, 12.0, 17.0, 17.0, 11.0, 39.0, 33.0, 57.0, 90.0, 168.0, 169.0, 107.0, 68.0, 51.0, 37.0, 18.0, 21.0, 15.0, 11.0, 9.0, 8.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.5775299072265625, -2.516387939453125, -2.4552459716796875, -2.39410400390625, -2.3329620361328125, -2.271820068359375, -2.2106781005859375, -2.1495361328125, -2.0883941650390625, -2.027252197265625, -1.9661102294921875, -1.90496826171875, -1.8438262939453125, -1.782684326171875, -1.7215423583984375, -1.660400390625, -1.5992584228515625, -1.538116455078125, -1.4769744873046875, -1.41583251953125, -1.3546905517578125, -1.293548583984375, -1.2324066162109375, -1.1712646484375, -1.1101226806640625, -1.048980712890625, -0.9878387451171875, -0.92669677734375, -0.8655548095703125, -0.804412841796875, -0.7432708740234375, -0.68212890625, -0.6209869384765625, -0.559844970703125, -0.4987030029296875, -0.43756103515625, -0.3764190673828125, -0.315277099609375, -0.2541351318359375, -0.1929931640625, -0.1318511962890625, -0.070709228515625, -0.0095672607421875, 0.05157470703125, 0.1127166748046875, 0.173858642578125, 0.2350006103515625, 0.296142578125, 0.3572845458984375, 0.418426513671875, 0.4795684814453125, 0.54071044921875, 0.6018524169921875, 0.662994384765625, 0.7241363525390625, 0.7852783203125, 0.8464202880859375, 0.907562255859375, 0.9687042236328125, 1.02984619140625, 1.0909881591796875, 1.152130126953125, 1.2132720947265625, 1.2744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 25.0, 43.0, 94.0, 203.0, 232.0, 180.0, 123.0, 59.0, 20.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.7812557220459, -15.626142501831055, -14.471028327941895, -13.315914154052734, -12.16080093383789, -11.005687713623047, -9.850573539733887, -8.695459365844727, -7.540346145629883, -6.385232448577881, -5.230118751525879, -4.075005054473877, -2.919891357421875, -1.764777660369873, -0.6096639633178711, 0.5454502105712891, 1.7005634307861328, 2.8556771278381348, 4.010790824890137, 5.165904521942139, 6.321018218994141, 7.476131916046143, 8.631245613098145, 9.786359786987305, 10.941473007202148, 12.096586227416992, 13.251700401306152, 14.406814575195312, 15.561927795410156, 16.717041015625, 17.872154235839844, 19.02726936340332, 20.182384490966797, 21.33749771118164, 22.492610931396484, 23.64772605895996, 24.802839279174805, 25.95795249938965, 27.113067626953125, 28.26818084716797, 29.423294067382812, 30.578407287597656, 31.7335205078125, 32.888633728027344, 34.04374694824219, 35.1988639831543, 36.35397720336914, 37.509090423583984, 38.66420364379883, 39.81931686401367, 40.974430084228516, 42.12954330444336, 43.28466033935547, 44.43977355957031, 45.594886779785156, 46.75, 47.905113220214844, 49.06022644042969, 50.21533966064453, 51.370452880859375, 52.52556610107422, 53.68068313598633, 54.83579635620117, 55.990909576416016, 57.14602279663086]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 6.0, 12.0, 13.0, 15.0, 16.0, 19.0, 20.0, 20.0, 31.0, 30.0, 27.0, 31.0, 41.0, 34.0, 34.0, 47.0, 47.0, 46.0, 40.0, 38.0, 40.0, 49.0, 32.0, 28.0, 41.0, 36.0, 28.0, 30.0, 20.0, 18.0, 12.0, 19.0, 16.0, 12.0, 13.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.910199165344238, -7.616495609283447, -7.322792053222656, -7.029088973999023, -6.735385417938232, -6.441681861877441, -6.147978782653809, -5.854275226593018, -5.560571670532227, -5.2668681144714355, -4.9731645584106445, -4.679461479187012, -4.385757923126221, -4.09205436706543, -3.7983510494232178, -3.504647731781006, -3.210944175720215, -2.917240619659424, -2.623537302017212, -2.329833984375, -2.036130428314209, -1.7424269914627075, -1.448723554611206, -1.1550202369689941, -0.8613166809082031, -0.5676132440567017, -0.2739098072052002, 0.01979362964630127, 0.31349706649780273, 0.6072005033493042, 0.9009039402008057, 1.1946072578430176, 1.488311767578125, 1.7820152044296265, 2.075718641281128, 2.36942195892334, 2.663125514984131, 2.956829071044922, 3.250532388687134, 3.5442357063293457, 3.8379392623901367, 4.131642818450928, 4.425346374511719, 4.719049453735352, 5.012753009796143, 5.306456565856934, 5.600159645080566, 5.893863201141357, 6.187566757202148, 6.4812703132629395, 6.7749738693237305, 7.068676948547363, 7.362380504608154, 7.656084060668945, 7.949787139892578, 8.243490219116211, 8.53719425201416, 8.830897331237793, 9.124601364135742, 9.418304443359375, 9.712007522583008, 10.005711555480957, 10.29941463470459, 10.593118667602539, 10.886821746826172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 9.0, 4.0, 13.0, 7.0, 25.0, 15.0, 25.0, 50.0, 64.0, 86.0, 127.0, 199.0, 310.0, 558.0, 1049.0, 2350.0, 6409.0, 24992.0, 271522.0, 3765249.0, 97414.0, 15068.0, 4665.0, 1879.0, 880.0, 480.0, 287.0, 168.0, 127.0, 66.0, 40.0, 36.0, 21.0, 18.0, 18.0, 8.0, 7.0, 6.0, 0.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2147216796875, -6.038818359375, -5.8629150390625, -5.68701171875, -5.5111083984375, -5.335205078125, -5.1593017578125, -4.9833984375, -4.8074951171875, -4.631591796875, -4.4556884765625, -4.27978515625, -4.1038818359375, -3.927978515625, -3.7520751953125, -3.576171875, -3.4002685546875, -3.224365234375, -3.0484619140625, -2.87255859375, -2.6966552734375, -2.520751953125, -2.3448486328125, -2.1689453125, -1.9930419921875, -1.817138671875, -1.6412353515625, -1.46533203125, -1.2894287109375, -1.113525390625, -0.9376220703125, -0.76171875, -0.5858154296875, -0.409912109375, -0.2340087890625, -0.05810546875, 0.1177978515625, 0.293701171875, 0.4696044921875, 0.6455078125, 0.8214111328125, 0.997314453125, 1.1732177734375, 1.34912109375, 1.5250244140625, 1.700927734375, 1.8768310546875, 2.052734375, 2.2286376953125, 2.404541015625, 2.5804443359375, 2.75634765625, 2.9322509765625, 3.108154296875, 3.2840576171875, 3.4599609375, 3.6358642578125, 3.811767578125, 3.9876708984375, 4.16357421875, 4.3394775390625, 4.515380859375, 4.6912841796875, 4.8671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 17.0, 14.0, 20.0, 20.0, 39.0, 36.0, 53.0, 58.0, 62.0, 63.0, 69.0, 82.0, 64.0, 69.0, 65.0, 56.0, 51.0, 29.0, 31.0, 21.0, 26.0, 14.0, 10.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.798828125, -0.7780838012695312, -0.7573394775390625, -0.7365951538085938, -0.715850830078125, -0.6951065063476562, -0.6743621826171875, -0.6536178588867188, -0.63287353515625, -0.6121292114257812, -0.5913848876953125, -0.5706405639648438, -0.549896240234375, -0.5291519165039062, -0.5084075927734375, -0.48766326904296875, -0.4669189453125, -0.44617462158203125, -0.4254302978515625, -0.40468597412109375, -0.383941650390625, -0.36319732666015625, -0.3424530029296875, -0.32170867919921875, -0.30096435546875, -0.28022003173828125, -0.2594757080078125, -0.23873138427734375, -0.217987060546875, -0.19724273681640625, -0.1764984130859375, -0.15575408935546875, -0.135009765625, -0.11426544189453125, -0.0935211181640625, -0.07277679443359375, -0.052032470703125, -0.03128814697265625, -0.0105438232421875, 0.01020050048828125, 0.03094482421875, 0.05168914794921875, 0.0724334716796875, 0.09317779541015625, 0.113922119140625, 0.13466644287109375, 0.1554107666015625, 0.17615509033203125, 0.1968994140625, 0.21764373779296875, 0.2383880615234375, 0.25913238525390625, 0.279876708984375, 0.30062103271484375, 0.3213653564453125, 0.34210968017578125, 0.36285400390625, 0.38359832763671875, 0.4043426513671875, 0.42508697509765625, 0.445831298828125, 0.46657562255859375, 0.4873199462890625, 0.5080642700195312, 0.52880859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 15.0, 20.0, 26.0, 26.0, 53.0, 70.0, 99.0, 171.0, 285.0, 413.0, 813.0, 1656.0, 3428.0, 7868.0, 20878.0, 75520.0, 702115.0, 3166686.0, 159211.0, 33724.0, 11509.0, 4817.0, 2280.0, 1086.0, 597.0, 334.0, 213.0, 119.0, 91.0, 38.0, 37.0, 25.0, 11.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.142578125, -3.045013427734375, -2.94744873046875, -2.849884033203125, -2.7523193359375, -2.654754638671875, -2.55718994140625, -2.459625244140625, -2.362060546875, -2.264495849609375, -2.16693115234375, -2.069366455078125, -1.9718017578125, -1.874237060546875, -1.77667236328125, -1.679107666015625, -1.58154296875, -1.483978271484375, -1.38641357421875, -1.288848876953125, -1.1912841796875, -1.093719482421875, -0.99615478515625, -0.898590087890625, -0.801025390625, -0.703460693359375, -0.60589599609375, -0.508331298828125, -0.4107666015625, -0.313201904296875, -0.21563720703125, -0.118072509765625, -0.0205078125, 0.077056884765625, 0.17462158203125, 0.272186279296875, 0.3697509765625, 0.467315673828125, 0.56488037109375, 0.662445068359375, 0.760009765625, 0.857574462890625, 0.95513916015625, 1.052703857421875, 1.1502685546875, 1.247833251953125, 1.34539794921875, 1.442962646484375, 1.54052734375, 1.638092041015625, 1.73565673828125, 1.833221435546875, 1.9307861328125, 2.028350830078125, 2.12591552734375, 2.223480224609375, 2.321044921875, 2.418609619140625, 2.51617431640625, 2.613739013671875, 2.7113037109375, 2.808868408203125, 2.90643310546875, 3.003997802734375, 3.1015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 13.0, 9.0, 18.0, 19.0, 44.0, 43.0, 107.0, 175.0, 414.0, 1100.0, 1316.0, 350.0, 177.0, 83.0, 59.0, 38.0, 27.0, 16.0, 14.0, 5.0, 10.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.2677459716796875, -1.217132568359375, -1.1665191650390625, -1.11590576171875, -1.0652923583984375, -1.014678955078125, -0.9640655517578125, -0.9134521484375, -0.8628387451171875, -0.812225341796875, -0.7616119384765625, -0.71099853515625, -0.6603851318359375, -0.609771728515625, -0.5591583251953125, -0.508544921875, -0.4579315185546875, -0.407318115234375, -0.3567047119140625, -0.30609130859375, -0.2554779052734375, -0.204864501953125, -0.1542510986328125, -0.1036376953125, -0.0530242919921875, -0.002410888671875, 0.0482025146484375, 0.09881591796875, 0.1494293212890625, 0.200042724609375, 0.2506561279296875, 0.30126953125, 0.3518829345703125, 0.402496337890625, 0.4531097412109375, 0.50372314453125, 0.5543365478515625, 0.604949951171875, 0.6555633544921875, 0.7061767578125, 0.7567901611328125, 0.807403564453125, 0.8580169677734375, 0.90863037109375, 0.9592437744140625, 1.009857177734375, 1.0604705810546875, 1.111083984375, 1.1616973876953125, 1.212310791015625, 1.2629241943359375, 1.31353759765625, 1.3641510009765625, 1.414764404296875, 1.4653778076171875, 1.5159912109375, 1.5666046142578125, 1.617218017578125, 1.6678314208984375, 1.71844482421875, 1.7690582275390625, 1.819671630859375, 1.8702850341796875, 1.9208984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 8.0, 18.0, 34.0, 50.0, 85.0, 147.0, 192.0, 179.0, 129.0, 75.0, 31.0, 21.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.364502906799316, -13.94583797454834, -13.527173042297363, -13.10850715637207, -12.689842224121094, -12.271177291870117, -11.85251235961914, -11.433847427368164, -11.015182495117188, -10.596517562866211, -10.177852630615234, -9.759187698364258, -9.340521812438965, -8.921856880187988, -8.503191947937012, -8.084527015686035, -7.6658616065979, -7.247196674346924, -6.828531265258789, -6.4098663330078125, -5.991201400756836, -5.572536468505859, -5.153871059417725, -4.735206127166748, -4.316540718078613, -3.8978755474090576, -3.479210615158081, -3.0605454444885254, -2.641880512237549, -2.223215341567993, -1.8045501708984375, -1.385885238647461, -0.9672203063964844, -0.5485552549362183, -0.12989014387130737, 0.2887749671936035, 0.7074400186538696, 1.1261050701141357, 1.5447702407836914, 1.963435173034668, 2.3821003437042236, 2.8007655143737793, 3.219430446624756, 3.6380956172943115, 4.056760787963867, 4.475425720214844, 4.89409065246582, 5.312755584716797, 5.731420993804932, 6.150085926055908, 6.568751335144043, 6.9874162673950195, 7.406081199645996, 7.824746131896973, 8.243412017822266, 8.662076950073242, 9.080741882324219, 9.499406814575195, 9.918071746826172, 10.336736679077148, 10.755402565002441, 11.174067497253418, 11.592732429504395, 12.011397361755371, 12.430062294006348]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 16.0, 13.0, 11.0, 20.0, 19.0, 35.0, 26.0, 26.0, 46.0, 43.0, 45.0, 40.0, 44.0, 57.0, 43.0, 48.0, 55.0, 47.0, 50.0, 35.0, 40.0, 27.0, 28.0, 34.0, 23.0, 20.0, 14.0, 18.0, 11.0, 10.0, 6.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.550609588623047, -4.380953311920166, -4.211296558380127, -4.041640281677246, -3.8719840049743652, -3.7023274898529053, -3.5326709747314453, -3.3630146980285645, -3.1933581829071045, -3.0237016677856445, -2.8540453910827637, -2.6843888759613037, -2.5147323608398438, -2.345076084136963, -2.175419569015503, -2.005763053894043, -1.836106777191162, -1.6664503812789917, -1.4967939853668213, -1.3271374702453613, -1.157481074333191, -0.9878246784210205, -0.8181681632995605, -0.6485117673873901, -0.4788553714752197, -0.30919894576072693, -0.13954252004623413, 0.030113935470581055, 0.19977033138275146, 0.3694267272949219, 0.5390832424163818, 0.7087396383285522, 0.8783965110778809, 1.0480529069900513, 1.2177093029022217, 1.3873658180236816, 1.557022213935852, 1.7266786098480225, 1.8963351249694824, 2.0659914016723633, 2.2356479167938232, 2.405304431915283, 2.574960708618164, 2.744617223739624, 2.914273738861084, 3.083930015563965, 3.253586530685425, 3.4232430458068848, 3.5928993225097656, 3.7625558376312256, 3.9322121143341064, 4.101868629455566, 4.271524906158447, 4.441181182861328, 4.610837936401367, 4.780494213104248, 4.950150489807129, 5.11980676651001, 5.289463520050049, 5.45911979675293, 5.6287760734558105, 5.798432350158691, 5.9680891036987305, 6.137745380401611, 6.30740213394165]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 13.0, 19.0, 25.0, 36.0, 61.0, 113.0, 145.0, 257.0, 427.0, 633.0, 1318.0, 2589.0, 6035.0, 15409.0, 44064.0, 134306.0, 314559.0, 318191.0, 137023.0, 45836.0, 15618.0, 6142.0, 2633.0, 1283.0, 716.0, 392.0, 236.0, 147.0, 86.0, 61.0, 46.0, 40.0, 22.0, 16.0, 11.0, 5.0, 6.0, 4.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.666015625, -2.582733154296875, -2.49945068359375, -2.416168212890625, -2.3328857421875, -2.249603271484375, -2.16632080078125, -2.083038330078125, -1.999755859375, -1.916473388671875, -1.83319091796875, -1.749908447265625, -1.6666259765625, -1.583343505859375, -1.50006103515625, -1.416778564453125, -1.33349609375, -1.250213623046875, -1.16693115234375, -1.083648681640625, -1.0003662109375, -0.917083740234375, -0.83380126953125, -0.750518798828125, -0.667236328125, -0.583953857421875, -0.50067138671875, -0.417388916015625, -0.3341064453125, -0.250823974609375, -0.16754150390625, -0.084259033203125, -0.0009765625, 0.082305908203125, 0.16558837890625, 0.248870849609375, 0.3321533203125, 0.415435791015625, 0.49871826171875, 0.582000732421875, 0.665283203125, 0.748565673828125, 0.83184814453125, 0.915130615234375, 0.9984130859375, 1.081695556640625, 1.16497802734375, 1.248260498046875, 1.33154296875, 1.414825439453125, 1.49810791015625, 1.581390380859375, 1.6646728515625, 1.747955322265625, 1.83123779296875, 1.914520263671875, 1.997802734375, 2.081085205078125, 2.16436767578125, 2.247650146484375, 2.3309326171875, 2.414215087890625, 2.49749755859375, 2.580780029296875, 2.6640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 17.0, 14.0, 15.0, 33.0, 42.0, 35.0, 43.0, 62.0, 66.0, 68.0, 76.0, 60.0, 67.0, 67.0, 56.0, 50.0, 48.0, 36.0, 34.0, 20.0, 16.0, 17.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.900390625, -0.8780746459960938, -0.8557586669921875, -0.8334426879882812, -0.811126708984375, -0.7888107299804688, -0.7664947509765625, -0.7441787719726562, -0.72186279296875, -0.6995468139648438, -0.6772308349609375, -0.6549148559570312, -0.632598876953125, -0.6102828979492188, -0.5879669189453125, -0.5656509399414062, -0.5433349609375, -0.5210189819335938, -0.4987030029296875, -0.47638702392578125, -0.454071044921875, -0.43175506591796875, -0.4094390869140625, -0.38712310791015625, -0.36480712890625, -0.34249114990234375, -0.3201751708984375, -0.29785919189453125, -0.275543212890625, -0.25322723388671875, -0.2309112548828125, -0.20859527587890625, -0.186279296875, -0.16396331787109375, -0.1416473388671875, -0.11933135986328125, -0.097015380859375, -0.07469940185546875, -0.0523834228515625, -0.03006744384765625, -0.00775146484375, 0.01456451416015625, 0.0368804931640625, 0.05919647216796875, 0.081512451171875, 0.10382843017578125, 0.1261444091796875, 0.14846038818359375, 0.1707763671875, 0.19309234619140625, 0.2154083251953125, 0.23772430419921875, 0.260040283203125, 0.28235626220703125, 0.3046722412109375, 0.32698822021484375, 0.34930419921875, 0.37162017822265625, 0.3939361572265625, 0.41625213623046875, 0.438568115234375, 0.46088409423828125, 0.4832000732421875, 0.5055160522460938, 0.52783203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 9.0, 7.0, 14.0, 10.0, 23.0, 34.0, 46.0, 79.0, 86.0, 111.0, 226.0, 318.0, 592.0, 1313.0, 4609.0, 29396.0, 286185.0, 621855.0, 88723.0, 10428.0, 2292.0, 865.0, 437.0, 277.0, 185.0, 122.0, 76.0, 59.0, 38.0, 27.0, 21.0, 19.0, 12.0, 11.0, 2.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.4437255859375, -4.301513671875, -4.1593017578125, -4.01708984375, -3.8748779296875, -3.732666015625, -3.5904541015625, -3.4482421875, -3.3060302734375, -3.163818359375, -3.0216064453125, -2.87939453125, -2.7371826171875, -2.594970703125, -2.4527587890625, -2.310546875, -2.1683349609375, -2.026123046875, -1.8839111328125, -1.74169921875, -1.5994873046875, -1.457275390625, -1.3150634765625, -1.1728515625, -1.0306396484375, -0.888427734375, -0.7462158203125, -0.60400390625, -0.4617919921875, -0.319580078125, -0.1773681640625, -0.03515625, 0.1070556640625, 0.249267578125, 0.3914794921875, 0.53369140625, 0.6759033203125, 0.818115234375, 0.9603271484375, 1.1025390625, 1.2447509765625, 1.386962890625, 1.5291748046875, 1.67138671875, 1.8135986328125, 1.955810546875, 2.0980224609375, 2.240234375, 2.3824462890625, 2.524658203125, 2.6668701171875, 2.80908203125, 2.9512939453125, 3.093505859375, 3.2357177734375, 3.3779296875, 3.5201416015625, 3.662353515625, 3.8045654296875, 3.94677734375, 4.0889892578125, 4.231201171875, 4.3734130859375, 4.515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 13.0, 22.0, 14.0, 18.0, 20.0, 31.0, 26.0, 26.0, 38.0, 37.0, 33.0, 32.0, 42.0, 37.0, 46.0, 49.0, 39.0, 46.0, 39.0, 36.0, 39.0, 35.0, 28.0, 29.0, 26.0, 21.0, 14.0, 20.0, 17.0, 19.0, 10.0, 15.0, 10.0, 14.0, 3.0, 5.0, 10.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.96875, -1.906036376953125, -1.84332275390625, -1.780609130859375, -1.7178955078125, -1.655181884765625, -1.59246826171875, -1.529754638671875, -1.467041015625, -1.404327392578125, -1.34161376953125, -1.278900146484375, -1.2161865234375, -1.153472900390625, -1.09075927734375, -1.028045654296875, -0.96533203125, -0.902618408203125, -0.83990478515625, -0.777191162109375, -0.7144775390625, -0.651763916015625, -0.58905029296875, -0.526336669921875, -0.463623046875, -0.400909423828125, -0.33819580078125, -0.275482177734375, -0.2127685546875, -0.150054931640625, -0.08734130859375, -0.024627685546875, 0.0380859375, 0.100799560546875, 0.16351318359375, 0.226226806640625, 0.2889404296875, 0.351654052734375, 0.41436767578125, 0.477081298828125, 0.539794921875, 0.602508544921875, 0.66522216796875, 0.727935791015625, 0.7906494140625, 0.853363037109375, 0.91607666015625, 0.978790283203125, 1.04150390625, 1.104217529296875, 1.16693115234375, 1.229644775390625, 1.2923583984375, 1.355072021484375, 1.41778564453125, 1.480499267578125, 1.543212890625, 1.605926513671875, 1.66864013671875, 1.731353759765625, 1.7940673828125, 1.856781005859375, 1.91949462890625, 1.982208251953125, 2.044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 6.0, 8.0, 12.0, 15.0, 12.0, 29.0, 26.0, 38.0, 59.0, 92.0, 138.0, 268.0, 475.0, 963.0, 2276.0, 6050.0, 18977.0, 81406.0, 404469.0, 418415.0, 84276.0, 19876.0, 6083.0, 2396.0, 975.0, 524.0, 272.0, 141.0, 86.0, 61.0, 40.0, 33.0, 17.0, 15.0, 12.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.3143157958984375, -1.254608154296875, -1.1949005126953125, -1.13519287109375, -1.0754852294921875, -1.015777587890625, -0.9560699462890625, -0.8963623046875, -0.8366546630859375, -0.776947021484375, -0.7172393798828125, -0.65753173828125, -0.5978240966796875, -0.538116455078125, -0.4784088134765625, -0.418701171875, -0.3589935302734375, -0.299285888671875, -0.2395782470703125, -0.17987060546875, -0.1201629638671875, -0.060455322265625, -0.0007476806640625, 0.0589599609375, 0.1186676025390625, 0.178375244140625, 0.2380828857421875, 0.29779052734375, 0.3574981689453125, 0.417205810546875, 0.4769134521484375, 0.53662109375, 0.5963287353515625, 0.656036376953125, 0.7157440185546875, 0.77545166015625, 0.8351593017578125, 0.894866943359375, 0.9545745849609375, 1.0142822265625, 1.0739898681640625, 1.133697509765625, 1.1934051513671875, 1.25311279296875, 1.3128204345703125, 1.372528076171875, 1.4322357177734375, 1.491943359375, 1.5516510009765625, 1.611358642578125, 1.6710662841796875, 1.73077392578125, 1.7904815673828125, 1.850189208984375, 1.9098968505859375, 1.9696044921875, 2.0293121337890625, 2.089019775390625, 2.1487274169921875, 2.20843505859375, 2.2681427001953125, 2.327850341796875, 2.3875579833984375, 2.447265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 15.0, 17.0, 23.0, 26.0, 20.0, 38.0, 36.0, 58.0, 58.0, 64.0, 68.0, 66.0, 70.0, 77.0, 66.0, 63.0, 50.0, 37.0, 17.0, 29.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001826845109462738, -0.00017630308866500854, -0.00016992166638374329, -0.00016354024410247803, -0.00015715882182121277, -0.0001507773995399475, -0.00014439597725868225, -0.000138014554977417, -0.00013163313269615173, -0.00012525171041488647, -0.00011887028813362122, -0.00011248886585235596, -0.0001061074435710907, -9.972602128982544e-05, -9.334459900856018e-05, -8.696317672729492e-05, -8.058175444602966e-05, -7.42003321647644e-05, -6.781890988349915e-05, -6.143748760223389e-05, -5.505606532096863e-05, -4.867464303970337e-05, -4.229322075843811e-05, -3.591179847717285e-05, -2.9530376195907593e-05, -2.3148953914642334e-05, -1.6767531633377075e-05, -1.0386109352111816e-05, -4.004687070846558e-06, 2.376735210418701e-06, 8.75815749168396e-06, 1.5139579772949219e-05, 2.1521002054214478e-05, 2.7902424335479736e-05, 3.4283846616744995e-05, 4.0665268898010254e-05, 4.704669117927551e-05, 5.342811346054077e-05, 5.980953574180603e-05, 6.619095802307129e-05, 7.257238030433655e-05, 7.89538025856018e-05, 8.533522486686707e-05, 9.171664714813232e-05, 9.809806942939758e-05, 0.00010447949171066284, 0.0001108609139919281, 0.00011724233627319336, 0.00012362375855445862, 0.00013000518083572388, 0.00013638660311698914, 0.0001427680253982544, 0.00014914944767951965, 0.0001555308699607849, 0.00016191229224205017, 0.00016829371452331543, 0.0001746751368045807, 0.00018105655908584595, 0.0001874379813671112, 0.00019381940364837646, 0.00020020082592964172, 0.00020658224821090698, 0.00021296367049217224, 0.0002193450927734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 16.0, 23.0, 58.0, 78.0, 111.0, 223.0, 434.0, 1060.0, 3227.0, 16296.0, 185588.0, 749278.0, 79085.0, 9173.0, 2298.0, 767.0, 377.0, 180.0, 108.0, 73.0, 27.0, 15.0, 14.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.960113525390625, -2.85186767578125, -2.743621826171875, -2.6353759765625, -2.527130126953125, -2.41888427734375, -2.310638427734375, -2.202392578125, -2.094146728515625, -1.98590087890625, -1.877655029296875, -1.7694091796875, -1.661163330078125, -1.55291748046875, -1.444671630859375, -1.33642578125, -1.228179931640625, -1.11993408203125, -1.011688232421875, -0.9034423828125, -0.795196533203125, -0.68695068359375, -0.578704833984375, -0.470458984375, -0.362213134765625, -0.25396728515625, -0.145721435546875, -0.0374755859375, 0.070770263671875, 0.17901611328125, 0.287261962890625, 0.3955078125, 0.503753662109375, 0.61199951171875, 0.720245361328125, 0.8284912109375, 0.936737060546875, 1.04498291015625, 1.153228759765625, 1.261474609375, 1.369720458984375, 1.47796630859375, 1.586212158203125, 1.6944580078125, 1.802703857421875, 1.91094970703125, 2.019195556640625, 2.12744140625, 2.235687255859375, 2.34393310546875, 2.452178955078125, 2.5604248046875, 2.668670654296875, 2.77691650390625, 2.885162353515625, 2.993408203125, 3.101654052734375, 3.20989990234375, 3.318145751953125, 3.4263916015625, 3.534637451171875, 3.64288330078125, 3.751129150390625, 3.859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 18.0, 19.0, 26.0, 25.0, 38.0, 46.0, 49.0, 79.0, 68.0, 90.0, 89.0, 84.0, 77.0, 50.0, 45.0, 28.0, 28.0, 18.0, 12.0, 18.0, 11.0, 12.0, 4.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8544921875, -1.801513671875, -1.74853515625, -1.695556640625, -1.642578125, -1.589599609375, -1.53662109375, -1.483642578125, -1.4306640625, -1.377685546875, -1.32470703125, -1.271728515625, -1.21875, -1.165771484375, -1.11279296875, -1.059814453125, -1.0068359375, -0.953857421875, -0.90087890625, -0.847900390625, -0.794921875, -0.741943359375, -0.68896484375, -0.635986328125, -0.5830078125, -0.530029296875, -0.47705078125, -0.424072265625, -0.37109375, -0.318115234375, -0.26513671875, -0.212158203125, -0.1591796875, -0.106201171875, -0.05322265625, -0.000244140625, 0.052734375, 0.105712890625, 0.15869140625, 0.211669921875, 0.2646484375, 0.317626953125, 0.37060546875, 0.423583984375, 0.4765625, 0.529541015625, 0.58251953125, 0.635498046875, 0.6884765625, 0.741455078125, 0.79443359375, 0.847412109375, 0.900390625, 0.953369140625, 1.00634765625, 1.059326171875, 1.1123046875, 1.165283203125, 1.21826171875, 1.271240234375, 1.32421875, 1.377197265625, 1.43017578125, 1.483154296875, 1.5361328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 12.0, 24.0, 50.0, 104.0, 155.0, 184.0, 172.0, 131.0, 82.0, 36.0, 25.0, 9.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.456741333007812, -21.41472053527832, -20.372697830200195, -19.330677032470703, -18.288654327392578, -17.246633529663086, -16.204612731933594, -15.162590980529785, -14.120569229125977, -13.078547477722168, -12.03652572631836, -10.994504928588867, -9.952483177185059, -8.91046142578125, -7.8684401512146, -6.826418876647949, -5.784397125244141, -4.742375373840332, -3.7003540992736816, -2.658332586288452, -1.6163110733032227, -0.5742893218994141, 0.46773195266723633, 1.5097532272338867, 2.5517749786376953, 3.593796491622925, 4.635818004608154, 5.677839279174805, 6.719861030578613, 7.761882781982422, 8.803903579711914, 9.845925331115723, 10.887947082519531, 11.92996883392334, 12.971990585327148, 14.01401138305664, 15.05603313446045, 16.098054885864258, 17.14007568359375, 18.182098388671875, 19.224119186401367, 20.26613998413086, 21.308162689208984, 22.350183486938477, 23.39220428466797, 24.434226989746094, 25.476247787475586, 26.518268585205078, 27.560291290283203, 28.602312088012695, 29.64433479309082, 30.686355590820312, 31.728378295898438, 32.77040100097656, 33.81241989135742, 34.85444259643555, 35.896461486816406, 36.93848419189453, 37.98050308227539, 39.022525787353516, 40.06454849243164, 41.1065673828125, 42.148590087890625, 43.19061279296875, 44.232635498046875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 6.0, 8.0, 9.0, 13.0, 10.0, 15.0, 20.0, 33.0, 22.0, 25.0, 39.0, 47.0, 49.0, 43.0, 56.0, 44.0, 43.0, 39.0, 54.0, 30.0, 31.0, 43.0, 44.0, 39.0, 34.0, 29.0, 27.0, 31.0, 20.0, 24.0, 9.0, 15.0, 10.0, 5.0, 8.0, 6.0, 3.0, 9.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.737166404724121, -11.365572929382324, -10.993978500366211, -10.622385025024414, -10.250791549682617, -9.87919807434082, -9.507604598999023, -9.13601016998291, -8.764416694641113, -8.392823219299316, -8.021228790283203, -7.649635314941406, -7.278041839599609, -6.9064483642578125, -6.534854412078857, -6.163260459899902, -5.7916669845581055, -5.420073509216309, -5.0484795570373535, -4.676885604858398, -4.305292129516602, -3.9336984157562256, -3.5621047019958496, -3.1905109882354736, -2.8189172744750977, -2.4473235607147217, -2.0757298469543457, -1.7041361331939697, -1.3325424194335938, -0.9609487056732178, -0.5893549919128418, -0.21776127815246582, 0.15383148193359375, 0.5254251956939697, 0.8970189094543457, 1.2686126232147217, 1.6402063369750977, 2.0118000507354736, 2.3833937644958496, 2.7549874782562256, 3.1265811920166016, 3.4981749057769775, 3.8697686195373535, 4.241362571716309, 4.6129560470581055, 4.984549522399902, 5.356143474578857, 5.7277374267578125, 6.099330902099609, 6.470924377441406, 6.842518329620361, 7.214112281799316, 7.585705757141113, 7.95729923248291, 8.328893661499023, 8.70048713684082, 9.072080612182617, 9.443674087524414, 9.815267562866211, 10.186861991882324, 10.558455467224121, 10.930048942565918, 11.301643371582031, 11.673236846923828, 12.044830322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 17.0, 29.0, 36.0, 65.0, 128.0, 199.0, 391.0, 776.0, 4127.0, 3936858.0, 246800.0, 3271.0, 713.0, 327.0, 174.0, 113.0, 75.0, 41.0, 27.0, 23.0, 7.0, 7.0, 15.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-19.3125, -18.8289794921875, -18.345458984375, -17.8619384765625, -17.37841796875, -16.8948974609375, -16.411376953125, -15.9278564453125, -15.4443359375, -14.9608154296875, -14.477294921875, -13.9937744140625, -13.51025390625, -13.0267333984375, -12.543212890625, -12.0596923828125, -11.576171875, -11.0926513671875, -10.609130859375, -10.1256103515625, -9.64208984375, -9.1585693359375, -8.675048828125, -8.1915283203125, -7.7080078125, -7.2244873046875, -6.740966796875, -6.2574462890625, -5.77392578125, -5.2904052734375, -4.806884765625, -4.3233642578125, -3.83984375, -3.3563232421875, -2.872802734375, -2.3892822265625, -1.90576171875, -1.4222412109375, -0.938720703125, -0.4552001953125, 0.0283203125, 0.5118408203125, 0.995361328125, 1.4788818359375, 1.96240234375, 2.4459228515625, 2.929443359375, 3.4129638671875, 3.896484375, 4.3800048828125, 4.863525390625, 5.3470458984375, 5.83056640625, 6.3140869140625, 6.797607421875, 7.2811279296875, 7.7646484375, 8.2481689453125, 8.731689453125, 9.2152099609375, 9.69873046875, 10.1822509765625, 10.665771484375, 11.1492919921875, 11.6328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 9.0, 13.0, 17.0, 22.0, 24.0, 34.0, 38.0, 46.0, 53.0, 53.0, 55.0, 52.0, 58.0, 57.0, 51.0, 56.0, 62.0, 61.0, 42.0, 44.0, 23.0, 40.0, 33.0, 12.0, 9.0, 6.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9130859375, -0.8897933959960938, -0.8665008544921875, -0.8432083129882812, -0.819915771484375, -0.7966232299804688, -0.7733306884765625, -0.7500381469726562, -0.72674560546875, -0.7034530639648438, -0.6801605224609375, -0.6568679809570312, -0.633575439453125, -0.6102828979492188, -0.5869903564453125, -0.5636978149414062, -0.5404052734375, -0.5171127319335938, -0.4938201904296875, -0.47052764892578125, -0.447235107421875, -0.42394256591796875, -0.4006500244140625, -0.37735748291015625, -0.35406494140625, -0.33077239990234375, -0.3074798583984375, -0.28418731689453125, -0.260894775390625, -0.23760223388671875, -0.2143096923828125, -0.19101715087890625, -0.167724609375, -0.14443206787109375, -0.1211395263671875, -0.09784698486328125, -0.074554443359375, -0.05126190185546875, -0.0279693603515625, -0.00467681884765625, 0.01861572265625, 0.04190826416015625, 0.0652008056640625, 0.08849334716796875, 0.111785888671875, 0.13507843017578125, 0.1583709716796875, 0.18166351318359375, 0.2049560546875, 0.22824859619140625, 0.2515411376953125, 0.27483367919921875, 0.298126220703125, 0.32141876220703125, 0.3447113037109375, 0.36800384521484375, 0.39129638671875, 0.41458892822265625, 0.4378814697265625, 0.46117401123046875, 0.484466552734375, 0.5077590942382812, 0.5310516357421875, 0.5543441772460938, 0.57763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 22.0, 20.0, 28.0, 38.0, 54.0, 56.0, 66.0, 96.0, 148.0, 176.0, 240.0, 324.0, 419.0, 602.0, 861.0, 1324.0, 2372.0, 4621.0, 11764.0, 48329.0, 1033662.0, 3014736.0, 50125.0, 12243.0, 4787.0, 2375.0, 1413.0, 902.0, 621.0, 463.0, 354.0, 230.0, 204.0, 123.0, 120.0, 61.0, 57.0, 55.0, 39.0, 24.0, 26.0, 15.0, 12.0, 10.0, 5.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.8359375, -2.747344970703125, -2.65875244140625, -2.570159912109375, -2.4815673828125, -2.392974853515625, -2.30438232421875, -2.215789794921875, -2.127197265625, -2.038604736328125, -1.95001220703125, -1.861419677734375, -1.7728271484375, -1.684234619140625, -1.59564208984375, -1.507049560546875, -1.41845703125, -1.329864501953125, -1.24127197265625, -1.152679443359375, -1.0640869140625, -0.975494384765625, -0.88690185546875, -0.798309326171875, -0.709716796875, -0.621124267578125, -0.53253173828125, -0.443939208984375, -0.3553466796875, -0.266754150390625, -0.17816162109375, -0.089569091796875, -0.0009765625, 0.087615966796875, 0.17620849609375, 0.264801025390625, 0.3533935546875, 0.441986083984375, 0.53057861328125, 0.619171142578125, 0.707763671875, 0.796356201171875, 0.88494873046875, 0.973541259765625, 1.0621337890625, 1.150726318359375, 1.23931884765625, 1.327911376953125, 1.41650390625, 1.505096435546875, 1.59368896484375, 1.682281494140625, 1.7708740234375, 1.859466552734375, 1.94805908203125, 2.036651611328125, 2.125244140625, 2.213836669921875, 2.30242919921875, 2.391021728515625, 2.4796142578125, 2.568206787109375, 2.65679931640625, 2.745391845703125, 2.833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 5.0, 5.0, 23.0, 26.0, 65.0, 130.0, 466.0, 2941.0, 202.0, 93.0, 44.0, 21.0, 11.0, 12.0, 7.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8349609375, -0.811920166015625, -0.78887939453125, -0.765838623046875, -0.7427978515625, -0.719757080078125, -0.69671630859375, -0.673675537109375, -0.650634765625, -0.627593994140625, -0.60455322265625, -0.581512451171875, -0.5584716796875, -0.535430908203125, -0.51239013671875, -0.489349365234375, -0.46630859375, -0.443267822265625, -0.42022705078125, -0.397186279296875, -0.3741455078125, -0.351104736328125, -0.32806396484375, -0.305023193359375, -0.281982421875, -0.258941650390625, -0.23590087890625, -0.212860107421875, -0.1898193359375, -0.166778564453125, -0.14373779296875, -0.120697021484375, -0.09765625, -0.074615478515625, -0.05157470703125, -0.028533935546875, -0.0054931640625, 0.017547607421875, 0.04058837890625, 0.063629150390625, 0.086669921875, 0.109710693359375, 0.13275146484375, 0.155792236328125, 0.1788330078125, 0.201873779296875, 0.22491455078125, 0.247955322265625, 0.27099609375, 0.294036865234375, 0.31707763671875, 0.340118408203125, 0.3631591796875, 0.386199951171875, 0.40924072265625, 0.432281494140625, 0.455322265625, 0.478363037109375, 0.50140380859375, 0.524444580078125, 0.5474853515625, 0.570526123046875, 0.59356689453125, 0.616607666015625, 0.6396484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 17.0, 27.0, 54.0, 66.0, 95.0, 119.0, 123.0, 115.0, 110.0, 81.0, 55.0, 38.0, 31.0, 17.0, 7.0, 10.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1890366077423096, -2.0963294506073, -2.00362229347229, -1.9109150171279907, -1.8182077407836914, -1.7255005836486816, -1.6327934265136719, -1.540086269378662, -1.4473789930343628, -1.354671835899353, -1.2619645595550537, -1.169257402420044, -1.0765502452850342, -0.9838429689407349, -0.8911358118057251, -0.7984285950660706, -0.705721378326416, -0.6130141615867615, -0.5203069448471069, -0.42759978771209717, -0.3348925709724426, -0.24218535423278809, -0.14947819709777832, -0.05677098035812378, 0.03593623638153076, 0.1286434382200241, 0.22135064005851746, 0.3140578269958496, 0.40676504373550415, 0.4994722604751587, 0.5921794176101685, 0.684886634349823, 0.7775936126708984, 0.870300829410553, 0.9630080461502075, 1.0557152032852173, 1.1484224796295166, 1.2411296367645264, 1.3338367938995361, 1.426543951034546, 1.5192512273788452, 1.611958384513855, 1.7046656608581543, 1.797372817993164, 1.8900799751281738, 1.9827872514724731, 2.0754942893981934, 2.1682016849517822, 2.260908842086792, 2.3536159992218018, 2.4463231563568115, 2.5390305519104004, 2.63173770904541, 2.72444486618042, 2.8171520233154297, 2.9098591804504395, 3.002566337585449, 3.095273494720459, 3.1879806518554688, 3.2806878089904785, 3.3733952045440674, 3.466102361679077, 3.558809518814087, 3.6515166759490967, 3.7442240715026855]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 14.0, 6.0, 11.0, 8.0, 19.0, 18.0, 25.0, 24.0, 28.0, 26.0, 38.0, 42.0, 31.0, 38.0, 38.0, 41.0, 40.0, 35.0, 34.0, 45.0, 33.0, 35.0, 49.0, 40.0, 36.0, 36.0, 25.0, 27.0, 13.0, 25.0, 18.0, 18.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3123985528945923, -1.2752782106399536, -1.2381579875946045, -1.2010376453399658, -1.1639174222946167, -1.126797080039978, -1.089676856994629, -1.0525565147399902, -1.0154361724853516, -0.9783158898353577, -0.9411956071853638, -0.9040753245353699, -0.866955041885376, -0.8298346996307373, -0.7927144169807434, -0.7555941343307495, -0.7184739112854004, -0.6813536286354065, -0.6442333459854126, -0.6071130633354187, -0.5699927806854248, -0.5328724384307861, -0.49575215578079224, -0.45863187313079834, -0.42151159048080444, -0.38439130783081055, -0.34727102518081665, -0.31015071272850037, -0.27303043007850647, -0.23591014742851257, -0.19878984987735748, -0.1616695523262024, -0.12454915046691895, -0.08742886036634445, -0.05030857026576996, -0.013188280165195465, 0.02393200993537903, 0.061052292585372925, 0.09817259013652802, 0.1352928876876831, 0.172413170337677, 0.2095334529876709, 0.246653750538826, 0.2837740480899811, 0.320894330739975, 0.35801461338996887, 0.39513492584228516, 0.43225520849227905, 0.46937549114227295, 0.5064957737922668, 0.5436160564422607, 0.5807363390922546, 0.6178566217422485, 0.6549769639968872, 0.6920972466468811, 0.729217529296875, 0.7663378119468689, 0.8034580945968628, 0.8405783772468567, 0.8776986598968506, 0.9148190021514893, 0.9519392251968384, 0.989059567451477, 1.0261797904968262, 1.0633001327514648]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 17.0, 28.0, 35.0, 47.0, 63.0, 97.0, 173.0, 254.0, 404.0, 588.0, 1136.0, 2059.0, 4168.0, 8587.0, 19632.0, 45649.0, 104759.0, 208480.0, 275655.0, 199791.0, 98548.0, 43161.0, 18219.0, 8192.0, 3919.0, 2003.0, 1069.0, 616.0, 410.0, 247.0, 157.0, 116.0, 73.0, 60.0, 37.0, 20.0, 24.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8012237548828125, -1.742095947265625, -1.6829681396484375, -1.62384033203125, -1.5647125244140625, -1.505584716796875, -1.4464569091796875, -1.3873291015625, -1.3282012939453125, -1.269073486328125, -1.2099456787109375, -1.15081787109375, -1.0916900634765625, -1.032562255859375, -0.9734344482421875, -0.914306640625, -0.8551788330078125, -0.796051025390625, -0.7369232177734375, -0.67779541015625, -0.6186676025390625, -0.559539794921875, -0.5004119873046875, -0.4412841796875, -0.3821563720703125, -0.323028564453125, -0.2639007568359375, -0.20477294921875, -0.1456451416015625, -0.086517333984375, -0.0273895263671875, 0.03173828125, 0.0908660888671875, 0.149993896484375, 0.2091217041015625, 0.26824951171875, 0.3273773193359375, 0.386505126953125, 0.4456329345703125, 0.5047607421875, 0.5638885498046875, 0.623016357421875, 0.6821441650390625, 0.74127197265625, 0.8003997802734375, 0.859527587890625, 0.9186553955078125, 0.977783203125, 1.0369110107421875, 1.096038818359375, 1.1551666259765625, 1.21429443359375, 1.2734222412109375, 1.332550048828125, 1.3916778564453125, 1.4508056640625, 1.5099334716796875, 1.569061279296875, 1.6281890869140625, 1.68731689453125, 1.7464447021484375, 1.805572509765625, 1.8647003173828125, 1.923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 7.0, 4.0, 3.0, 4.0, 9.0, 7.0, 13.0, 15.0, 20.0, 21.0, 33.0, 43.0, 38.0, 48.0, 58.0, 51.0, 64.0, 55.0, 54.0, 63.0, 60.0, 49.0, 42.0, 42.0, 40.0, 39.0, 31.0, 25.0, 22.0, 14.0, 9.0, 10.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.9228515625, -0.8993453979492188, -0.8758392333984375, -0.8523330688476562, -0.828826904296875, -0.8053207397460938, -0.7818145751953125, -0.7583084106445312, -0.73480224609375, -0.7112960815429688, -0.6877899169921875, -0.6642837524414062, -0.640777587890625, -0.6172714233398438, -0.5937652587890625, -0.5702590942382812, -0.5467529296875, -0.5232467651367188, -0.4997406005859375, -0.47623443603515625, -0.452728271484375, -0.42922210693359375, -0.4057159423828125, -0.38220977783203125, -0.35870361328125, -0.33519744873046875, -0.3116912841796875, -0.28818511962890625, -0.264678955078125, -0.24117279052734375, -0.2176666259765625, -0.19416046142578125, -0.170654296875, -0.14714813232421875, -0.1236419677734375, -0.10013580322265625, -0.076629638671875, -0.05312347412109375, -0.0296173095703125, -0.00611114501953125, 0.01739501953125, 0.04090118408203125, 0.0644073486328125, 0.08791351318359375, 0.111419677734375, 0.13492584228515625, 0.1584320068359375, 0.18193817138671875, 0.2054443359375, 0.22895050048828125, 0.2524566650390625, 0.27596282958984375, 0.299468994140625, 0.32297515869140625, 0.3464813232421875, 0.36998748779296875, 0.39349365234375, 0.41699981689453125, 0.4405059814453125, 0.46401214599609375, 0.487518310546875, 0.5110244750976562, 0.5345306396484375, 0.5580368041992188, 0.58154296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 19.0, 25.0, 28.0, 29.0, 41.0, 61.0, 87.0, 107.0, 139.0, 223.0, 302.0, 471.0, 741.0, 1411.0, 4831.0, 39239.0, 533320.0, 428839.0, 30913.0, 4161.0, 1326.0, 692.0, 418.0, 296.0, 186.0, 177.0, 107.0, 84.0, 62.0, 38.0, 41.0, 26.0, 17.0, 14.0, 12.0, 12.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.50390625, -5.341796875, -5.1796875, -5.017578125, -4.85546875, -4.693359375, -4.53125, -4.369140625, -4.20703125, -4.044921875, -3.8828125, -3.720703125, -3.55859375, -3.396484375, -3.234375, -3.072265625, -2.91015625, -2.748046875, -2.5859375, -2.423828125, -2.26171875, -2.099609375, -1.9375, -1.775390625, -1.61328125, -1.451171875, -1.2890625, -1.126953125, -0.96484375, -0.802734375, -0.640625, -0.478515625, -0.31640625, -0.154296875, 0.0078125, 0.169921875, 0.33203125, 0.494140625, 0.65625, 0.818359375, 0.98046875, 1.142578125, 1.3046875, 1.466796875, 1.62890625, 1.791015625, 1.953125, 2.115234375, 2.27734375, 2.439453125, 2.6015625, 2.763671875, 2.92578125, 3.087890625, 3.25, 3.412109375, 3.57421875, 3.736328125, 3.8984375, 4.060546875, 4.22265625, 4.384765625, 4.546875, 4.708984375, 4.87109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 2.0, 8.0, 9.0, 5.0, 6.0, 8.0, 17.0, 19.0, 15.0, 19.0, 23.0, 26.0, 30.0, 33.0, 39.0, 40.0, 30.0, 44.0, 43.0, 48.0, 50.0, 40.0, 36.0, 34.0, 41.0, 31.0, 32.0, 29.0, 32.0, 29.0, 28.0, 29.0, 30.0, 21.0, 14.0, 10.0, 8.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.51544189453125, -2.4351806640625, -2.35491943359375, -2.274658203125, -2.19439697265625, -2.1141357421875, -2.03387451171875, -1.95361328125, -1.87335205078125, -1.7930908203125, -1.71282958984375, -1.632568359375, -1.55230712890625, -1.4720458984375, -1.39178466796875, -1.3115234375, -1.23126220703125, -1.1510009765625, -1.07073974609375, -0.990478515625, -0.91021728515625, -0.8299560546875, -0.74969482421875, -0.66943359375, -0.58917236328125, -0.5089111328125, -0.42864990234375, -0.348388671875, -0.26812744140625, -0.1878662109375, -0.10760498046875, -0.02734375, 0.05291748046875, 0.1331787109375, 0.21343994140625, 0.293701171875, 0.37396240234375, 0.4542236328125, 0.53448486328125, 0.61474609375, 0.69500732421875, 0.7752685546875, 0.85552978515625, 0.935791015625, 1.01605224609375, 1.0963134765625, 1.17657470703125, 1.2568359375, 1.33709716796875, 1.4173583984375, 1.49761962890625, 1.577880859375, 1.65814208984375, 1.7384033203125, 1.81866455078125, 1.89892578125, 1.97918701171875, 2.0594482421875, 2.13970947265625, 2.219970703125, 2.30023193359375, 2.3804931640625, 2.46075439453125, 2.541015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 4.0, 9.0, 8.0, 9.0, 15.0, 11.0, 18.0, 34.0, 48.0, 75.0, 142.0, 292.0, 694.0, 2113.0, 9651.0, 68241.0, 593680.0, 330633.0, 34692.0, 5623.0, 1476.0, 513.0, 249.0, 118.0, 76.0, 38.0, 26.0, 19.0, 14.0, 4.0, 9.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.029998779296875, -1.96624755859375, -1.902496337890625, -1.8387451171875, -1.774993896484375, -1.71124267578125, -1.647491455078125, -1.583740234375, -1.519989013671875, -1.45623779296875, -1.392486572265625, -1.3287353515625, -1.264984130859375, -1.20123291015625, -1.137481689453125, -1.07373046875, -1.009979248046875, -0.94622802734375, -0.882476806640625, -0.8187255859375, -0.754974365234375, -0.69122314453125, -0.627471923828125, -0.563720703125, -0.499969482421875, -0.43621826171875, -0.372467041015625, -0.3087158203125, -0.244964599609375, -0.18121337890625, -0.117462158203125, -0.0537109375, 0.010040283203125, 0.07379150390625, 0.137542724609375, 0.2012939453125, 0.265045166015625, 0.32879638671875, 0.392547607421875, 0.456298828125, 0.520050048828125, 0.58380126953125, 0.647552490234375, 0.7113037109375, 0.775054931640625, 0.83880615234375, 0.902557373046875, 0.96630859375, 1.030059814453125, 1.09381103515625, 1.157562255859375, 1.2213134765625, 1.285064697265625, 1.34881591796875, 1.412567138671875, 1.476318359375, 1.540069580078125, 1.60382080078125, 1.667572021484375, 1.7313232421875, 1.795074462890625, 1.85882568359375, 1.922576904296875, 1.986328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 5.0, 13.0, 10.0, 18.0, 21.0, 21.0, 33.0, 35.0, 48.0, 70.0, 64.0, 104.0, 87.0, 82.0, 85.0, 72.0, 62.0, 39.0, 26.0, 15.0, 21.0, 17.0, 9.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003135204315185547, -0.0003064200282096863, -0.00029931962490081787, -0.00029221922159194946, -0.00028511881828308105, -0.00027801841497421265, -0.00027091801166534424, -0.00026381760835647583, -0.0002567172050476074, -0.000249616801738739, -0.0002425163984298706, -0.0002354159951210022, -0.0002283155918121338, -0.00022121518850326538, -0.00021411478519439697, -0.00020701438188552856, -0.00019991397857666016, -0.00019281357526779175, -0.00018571317195892334, -0.00017861276865005493, -0.00017151236534118652, -0.00016441196203231812, -0.0001573115587234497, -0.0001502111554145813, -0.0001431107521057129, -0.00013601034879684448, -0.00012890994548797607, -0.00012180954217910767, -0.00011470913887023926, -0.00010760873556137085, -0.00010050833225250244, -9.340792894363403e-05, -8.630752563476562e-05, -7.920712232589722e-05, -7.210671901702881e-05, -6.50063157081604e-05, -5.790591239929199e-05, -5.0805509090423584e-05, -4.3705105781555176e-05, -3.660470247268677e-05, -2.950429916381836e-05, -2.240389585494995e-05, -1.5303492546081543e-05, -8.203089237213135e-06, -1.1026859283447266e-06, 5.997717380523682e-06, 1.309812068939209e-05, 2.0198523998260498e-05, 2.7298927307128906e-05, 3.4399330615997314e-05, 4.149973392486572e-05, 4.860013723373413e-05, 5.570054054260254e-05, 6.280094385147095e-05, 6.990134716033936e-05, 7.700175046920776e-05, 8.410215377807617e-05, 9.120255708694458e-05, 9.830296039581299e-05, 0.0001054033637046814, 0.0001125037670135498, 0.00011960417032241821, 0.00012670457363128662, 0.00013380497694015503, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 4.0, 12.0, 9.0, 19.0, 25.0, 42.0, 59.0, 76.0, 122.0, 209.0, 413.0, 744.0, 1646.0, 4505.0, 19403.0, 160432.0, 709395.0, 127736.0, 16459.0, 4159.0, 1473.0, 662.0, 357.0, 195.0, 131.0, 83.0, 54.0, 37.0, 24.0, 21.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4882965087890625, -1.424835205078125, -1.3613739013671875, -1.29791259765625, -1.2344512939453125, -1.170989990234375, -1.1075286865234375, -1.0440673828125, -0.9806060791015625, -0.917144775390625, -0.8536834716796875, -0.79022216796875, -0.7267608642578125, -0.663299560546875, -0.5998382568359375, -0.536376953125, -0.4729156494140625, -0.409454345703125, -0.3459930419921875, -0.28253173828125, -0.2190704345703125, -0.155609130859375, -0.0921478271484375, -0.0286865234375, 0.0347747802734375, 0.098236083984375, 0.1616973876953125, 0.22515869140625, 0.2886199951171875, 0.352081298828125, 0.4155426025390625, 0.47900390625, 0.5424652099609375, 0.605926513671875, 0.6693878173828125, 0.73284912109375, 0.7963104248046875, 0.859771728515625, 0.9232330322265625, 0.9866943359375, 1.0501556396484375, 1.113616943359375, 1.1770782470703125, 1.24053955078125, 1.3040008544921875, 1.367462158203125, 1.4309234619140625, 1.494384765625, 1.5578460693359375, 1.621307373046875, 1.6847686767578125, 1.74822998046875, 1.8116912841796875, 1.875152587890625, 1.9386138916015625, 2.0020751953125, 2.0655364990234375, 2.128997802734375, 2.1924591064453125, 2.25592041015625, 2.3193817138671875, 2.382843017578125, 2.4463043212890625, 2.509765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 15.0, 19.0, 40.0, 45.0, 50.0, 60.0, 90.0, 108.0, 90.0, 103.0, 68.0, 65.0, 44.0, 37.0, 25.0, 21.0, 22.0, 17.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6654205322265625, -1.611114501953125, -1.5568084716796875, -1.50250244140625, -1.4481964111328125, -1.393890380859375, -1.3395843505859375, -1.2852783203125, -1.2309722900390625, -1.176666259765625, -1.1223602294921875, -1.06805419921875, -1.0137481689453125, -0.959442138671875, -0.9051361083984375, -0.850830078125, -0.7965240478515625, -0.742218017578125, -0.6879119873046875, -0.63360595703125, -0.5792999267578125, -0.524993896484375, -0.4706878662109375, -0.4163818359375, -0.3620758056640625, -0.307769775390625, -0.2534637451171875, -0.19915771484375, -0.1448516845703125, -0.090545654296875, -0.0362396240234375, 0.01806640625, 0.0723724365234375, 0.126678466796875, 0.1809844970703125, 0.23529052734375, 0.2895965576171875, 0.343902587890625, 0.3982086181640625, 0.4525146484375, 0.5068206787109375, 0.561126708984375, 0.6154327392578125, 0.66973876953125, 0.7240447998046875, 0.778350830078125, 0.8326568603515625, 0.886962890625, 0.9412689208984375, 0.995574951171875, 1.0498809814453125, 1.10418701171875, 1.1584930419921875, 1.212799072265625, 1.2671051025390625, 1.3214111328125, 1.3757171630859375, 1.430023193359375, 1.4843292236328125, 1.53863525390625, 1.5929412841796875, 1.647247314453125, 1.7015533447265625, 1.755859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 23.0, 109.0, 185.0, 262.0, 243.0, 108.0, 40.0, 4.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03076934814453, -34.6136589050293, -33.19654846191406, -31.77943992614746, -30.36233139038086, -28.945220947265625, -27.52811050415039, -26.111000061035156, -24.693891525268555, -23.27678108215332, -21.85967254638672, -20.442562103271484, -19.02545166015625, -17.60834312438965, -16.191232681274414, -14.774123191833496, -13.357013702392578, -11.93990421295166, -10.522794723510742, -9.105684280395508, -7.68857479095459, -6.271465301513672, -4.8543548583984375, -3.4372453689575195, -2.0201358795166016, -0.6030261516571045, 0.8140835762023926, 2.2311935424804688, 3.6483030319213867, 5.065412521362305, 6.482522964477539, 7.899632453918457, 9.31673812866211, 10.733847618103027, 12.150957107543945, 13.56806755065918, 14.985177040100098, 16.402286529541016, 17.81939697265625, 19.236507415771484, 20.653615951538086, 22.07072639465332, 23.487834930419922, 24.904945373535156, 26.32205581665039, 27.739164352416992, 29.156274795532227, 30.573383331298828, 31.990493774414062, 33.4076042175293, 34.82471466064453, 36.2418212890625, 37.658931732177734, 39.07604217529297, 40.4931526184082, 41.91026306152344, 43.327369689941406, 44.74448013305664, 46.161590576171875, 47.578697204589844, 48.99580764770508, 50.41291809082031, 51.83002853393555, 53.24713897705078, 54.664249420166016]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 4.0, 3.0, 9.0, 9.0, 8.0, 19.0, 17.0, 19.0, 17.0, 27.0, 34.0, 23.0, 38.0, 25.0, 48.0, 36.0, 53.0, 56.0, 49.0, 56.0, 47.0, 42.0, 38.0, 43.0, 44.0, 28.0, 26.0, 25.0, 24.0, 27.0, 28.0, 13.0, 8.0, 10.0, 5.0, 5.0, 11.0, 5.0, 1.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.027986526489258, -12.592302322387695, -12.156618118286133, -11.720934867858887, -11.285250663757324, -10.849566459655762, -10.413883209228516, -9.978199005126953, -9.54251480102539, -9.106830596923828, -8.671146392822266, -8.23546314239502, -7.799778938293457, -7.3640947341918945, -6.92841100692749, -6.492727279663086, -6.057043075561523, -5.621358871459961, -5.185675144195557, -4.749991416931152, -4.31430721282959, -3.8786232471466064, -3.442939281463623, -3.0072553157806396, -2.5715713500976562, -2.135887384414673, -1.7002034187316895, -1.264519453048706, -0.8288354873657227, -0.39315152168273926, 0.04253244400024414, 0.47821640968322754, 0.9139003753662109, 1.3495843410491943, 1.7852683067321777, 2.220952272415161, 2.6566362380981445, 3.092320203781128, 3.5280041694641113, 3.9636881351470947, 4.399372100830078, 4.835056304931641, 5.270740032196045, 5.706423759460449, 6.142107963562012, 6.577792167663574, 7.0134758949279785, 7.449159622192383, 7.884843826293945, 8.320528030395508, 8.75621223449707, 9.191895484924316, 9.627579689025879, 10.063263893127441, 10.498947143554688, 10.93463134765625, 11.370315551757812, 11.805999755859375, 12.241683959960938, 12.677367210388184, 13.113051414489746, 13.548735618591309, 13.984418869018555, 14.420103073120117, 14.85578727722168]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 11.0, 29.0, 38.0, 64.0, 90.0, 169.0, 367.0, 943.0, 8059.0, 4164181.0, 18082.0, 1288.0, 432.0, 204.0, 101.0, 57.0, 45.0, 24.0, 26.0, 7.0, 9.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.90625, -16.4793701171875, -16.052490234375, -15.6256103515625, -15.19873046875, -14.7718505859375, -14.344970703125, -13.9180908203125, -13.4912109375, -13.0643310546875, -12.637451171875, -12.2105712890625, -11.78369140625, -11.3568115234375, -10.929931640625, -10.5030517578125, -10.076171875, -9.6492919921875, -9.222412109375, -8.7955322265625, -8.36865234375, -7.9417724609375, -7.514892578125, -7.0880126953125, -6.6611328125, -6.2342529296875, -5.807373046875, -5.3804931640625, -4.95361328125, -4.5267333984375, -4.099853515625, -3.6729736328125, -3.24609375, -2.8192138671875, -2.392333984375, -1.9654541015625, -1.53857421875, -1.1116943359375, -0.684814453125, -0.2579345703125, 0.1689453125, 0.5958251953125, 1.022705078125, 1.4495849609375, 1.87646484375, 2.3033447265625, 2.730224609375, 3.1571044921875, 3.583984375, 4.0108642578125, 4.437744140625, 4.8646240234375, 5.29150390625, 5.7183837890625, 6.145263671875, 6.5721435546875, 6.9990234375, 7.4259033203125, 7.852783203125, 8.2796630859375, 8.70654296875, 9.1334228515625, 9.560302734375, 9.9871826171875, 10.4140625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 12.0, 18.0, 10.0, 18.0, 24.0, 22.0, 45.0, 32.0, 56.0, 66.0, 53.0, 56.0, 75.0, 65.0, 42.0, 48.0, 50.0, 40.0, 49.0, 45.0, 37.0, 25.0, 29.0, 12.0, 12.0, 13.0, 2.0, 13.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8427810668945312, -0.8193511962890625, -0.7959213256835938, -0.772491455078125, -0.7490615844726562, -0.7256317138671875, -0.7022018432617188, -0.67877197265625, -0.6553421020507812, -0.6319122314453125, -0.6084823608398438, -0.585052490234375, -0.5616226196289062, -0.5381927490234375, -0.5147628784179688, -0.4913330078125, -0.46790313720703125, -0.4444732666015625, -0.42104339599609375, -0.397613525390625, -0.37418365478515625, -0.3507537841796875, -0.32732391357421875, -0.30389404296875, -0.28046417236328125, -0.2570343017578125, -0.23360443115234375, -0.210174560546875, -0.18674468994140625, -0.1633148193359375, -0.13988494873046875, -0.116455078125, -0.09302520751953125, -0.0695953369140625, -0.04616546630859375, -0.022735595703125, 0.00069427490234375, 0.0241241455078125, 0.04755401611328125, 0.07098388671875, 0.09441375732421875, 0.1178436279296875, 0.14127349853515625, 0.164703369140625, 0.18813323974609375, 0.2115631103515625, 0.23499298095703125, 0.2584228515625, 0.28185272216796875, 0.3052825927734375, 0.32871246337890625, 0.352142333984375, 0.37557220458984375, 0.3990020751953125, 0.42243194580078125, 0.44586181640625, 0.46929168701171875, 0.4927215576171875, 0.5161514282226562, 0.539581298828125, 0.5630111694335938, 0.5864410400390625, 0.6098709106445312, 0.63330078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 21.0, 11.0, 17.0, 42.0, 47.0, 60.0, 83.0, 104.0, 190.0, 243.0, 411.0, 574.0, 933.0, 1520.0, 2750.0, 5444.0, 12905.0, 42955.0, 367419.0, 3645889.0, 77727.0, 18850.0, 7278.0, 3588.0, 1938.0, 1134.0, 680.0, 453.0, 282.0, 191.0, 155.0, 98.0, 71.0, 56.0, 44.0, 30.0, 17.0, 16.0, 2.0, 10.0, 4.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.091796875, -2.022491455078125, -1.95318603515625, -1.883880615234375, -1.8145751953125, -1.745269775390625, -1.67596435546875, -1.606658935546875, -1.537353515625, -1.468048095703125, -1.39874267578125, -1.329437255859375, -1.2601318359375, -1.190826416015625, -1.12152099609375, -1.052215576171875, -0.98291015625, -0.913604736328125, -0.84429931640625, -0.774993896484375, -0.7056884765625, -0.636383056640625, -0.56707763671875, -0.497772216796875, -0.428466796875, -0.359161376953125, -0.28985595703125, -0.220550537109375, -0.1512451171875, -0.081939697265625, -0.01263427734375, 0.056671142578125, 0.1259765625, 0.195281982421875, 0.26458740234375, 0.333892822265625, 0.4031982421875, 0.472503662109375, 0.54180908203125, 0.611114501953125, 0.680419921875, 0.749725341796875, 0.81903076171875, 0.888336181640625, 0.9576416015625, 1.026947021484375, 1.09625244140625, 1.165557861328125, 1.23486328125, 1.304168701171875, 1.37347412109375, 1.442779541015625, 1.5120849609375, 1.581390380859375, 1.65069580078125, 1.720001220703125, 1.789306640625, 1.858612060546875, 1.92791748046875, 1.997222900390625, 2.0665283203125, 2.135833740234375, 2.20513916015625, 2.274444580078125, 2.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 9.0, 15.0, 15.0, 30.0, 73.0, 114.0, 399.0, 2989.0, 211.0, 93.0, 32.0, 24.0, 12.0, 10.0, 9.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.781951904296875, -0.75775146484375, -0.733551025390625, -0.7093505859375, -0.685150146484375, -0.66094970703125, -0.636749267578125, -0.612548828125, -0.588348388671875, -0.56414794921875, -0.539947509765625, -0.5157470703125, -0.491546630859375, -0.46734619140625, -0.443145751953125, -0.4189453125, -0.394744873046875, -0.37054443359375, -0.346343994140625, -0.3221435546875, -0.297943115234375, -0.27374267578125, -0.249542236328125, -0.225341796875, -0.201141357421875, -0.17694091796875, -0.152740478515625, -0.1285400390625, -0.104339599609375, -0.08013916015625, -0.055938720703125, -0.03173828125, -0.007537841796875, 0.01666259765625, 0.040863037109375, 0.0650634765625, 0.089263916015625, 0.11346435546875, 0.137664794921875, 0.161865234375, 0.186065673828125, 0.21026611328125, 0.234466552734375, 0.2586669921875, 0.282867431640625, 0.30706787109375, 0.331268310546875, 0.35546875, 0.379669189453125, 0.40386962890625, 0.428070068359375, 0.4522705078125, 0.476470947265625, 0.50067138671875, 0.524871826171875, 0.549072265625, 0.573272705078125, 0.59747314453125, 0.621673583984375, 0.6458740234375, 0.670074462890625, 0.69427490234375, 0.718475341796875, 0.74267578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 11.0, 16.0, 40.0, 71.0, 124.0, 184.0, 219.0, 166.0, 100.0, 41.0, 20.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.143086910247803, -5.97553014755249, -5.8079729080200195, -5.640416145324707, -5.4728593826293945, -5.305302619934082, -5.137745380401611, -4.970188617706299, -4.802631378173828, -4.635074615478516, -4.467517375946045, -4.299960613250732, -4.13240385055542, -3.9648468494415283, -3.7972898483276367, -3.629733085632324, -3.4621763229370117, -3.29461932182312, -3.1270625591278076, -2.959505558013916, -2.7919487953186035, -2.624391794204712, -2.4568347930908203, -2.289278030395508, -2.121721029281616, -1.9541641473770142, -1.786607265472412, -1.6190502643585205, -1.4514933824539185, -1.2839365005493164, -1.1163794994354248, -0.9488226175308228, -0.7812662124633789, -0.6137093305587769, -0.44615238904953003, -0.2785954475402832, -0.11103856563568115, 0.0565183162689209, 0.2240753173828125, 0.39163219928741455, 0.5591890811920166, 0.7267459630966187, 0.8943029046058655, 1.0618598461151123, 1.2294167280197144, 1.3969736099243164, 1.564530611038208, 1.73208749294281, 1.899644374847412, 2.0672013759613037, 2.234758138656616, 2.402315139770508, 2.5698719024658203, 2.737428903579712, 2.9049859046936035, 3.072542667388916, 3.2400996685028076, 3.407656669616699, 3.5752134323120117, 3.7427704334259033, 3.910327434539795, 4.077884197235107, 4.245441436767578, 4.412998199462891, 4.580554962158203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 6.0, 8.0, 13.0, 17.0, 19.0, 25.0, 20.0, 35.0, 16.0, 29.0, 22.0, 43.0, 42.0, 36.0, 44.0, 34.0, 47.0, 35.0, 38.0, 40.0, 44.0, 40.0, 37.0, 34.0, 36.0, 35.0, 25.0, 22.0, 25.0, 26.0, 17.0, 15.0, 6.0, 6.0, 15.0, 7.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7347486019134521, -1.6803596019744873, -1.625970482826233, -1.571581482887268, -1.5171924829483032, -1.4628033638000488, -1.408414363861084, -1.3540253639221191, -1.2996362447738647, -1.2452472448349, -1.1908581256866455, -1.1364691257476807, -1.0820801258087158, -1.0276910066604614, -0.9733020067214966, -0.918912947177887, -0.8645239472389221, -0.8101348876953125, -0.7557458877563477, -0.701356828212738, -0.6469677686691284, -0.5925787687301636, -0.538189709186554, -0.48380064964294434, -0.4294116199016571, -0.3750225901603699, -0.32063353061676025, -0.266244500875473, -0.2118554562330246, -0.15746641159057617, -0.10307738184928894, -0.04868832230567932, 0.00570070743560791, 0.06008974835276604, 0.11447878926992416, 0.168867826461792, 0.22325687110424042, 0.27764591574668884, 0.3320349454879761, 0.3864240050315857, 0.4408130347728729, 0.49520206451416016, 0.5495911240577698, 0.6039801836013794, 0.6583691835403442, 0.7127582430839539, 0.7671473026275635, 0.8215363025665283, 0.8759253621101379, 0.9303144216537476, 0.9847034215927124, 1.0390925407409668, 1.0934815406799316, 1.1478705406188965, 1.2022595405578613, 1.2566486597061157, 1.3110376596450806, 1.3654266595840454, 1.4198157787322998, 1.4742047786712646, 1.5285937786102295, 1.5829828977584839, 1.6373718976974487, 1.6917610168457031, 1.746150016784668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 11.0, 9.0, 9.0, 13.0, 15.0, 27.0, 24.0, 40.0, 54.0, 66.0, 97.0, 173.0, 251.0, 406.0, 632.0, 1002.0, 1812.0, 3397.0, 6663.0, 13731.0, 31133.0, 73371.0, 165301.0, 273988.0, 244627.0, 129512.0, 55642.0, 23677.0, 10920.0, 5296.0, 2744.0, 1458.0, 859.0, 528.0, 338.0, 225.0, 141.0, 95.0, 68.0, 58.0, 50.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6167144775390625, -1.562530517578125, -1.5083465576171875, -1.45416259765625, -1.3999786376953125, -1.345794677734375, -1.2916107177734375, -1.2374267578125, -1.1832427978515625, -1.129058837890625, -1.0748748779296875, -1.02069091796875, -0.9665069580078125, -0.912322998046875, -0.8581390380859375, -0.803955078125, -0.7497711181640625, -0.695587158203125, -0.6414031982421875, -0.58721923828125, -0.5330352783203125, -0.478851318359375, -0.4246673583984375, -0.3704833984375, -0.3162994384765625, -0.262115478515625, -0.2079315185546875, -0.15374755859375, -0.0995635986328125, -0.045379638671875, 0.0088043212890625, 0.06298828125, 0.1171722412109375, 0.171356201171875, 0.2255401611328125, 0.27972412109375, 0.3339080810546875, 0.388092041015625, 0.4422760009765625, 0.4964599609375, 0.5506439208984375, 0.604827880859375, 0.6590118408203125, 0.71319580078125, 0.7673797607421875, 0.821563720703125, 0.8757476806640625, 0.929931640625, 0.9841156005859375, 1.038299560546875, 1.0924835205078125, 1.14666748046875, 1.2008514404296875, 1.255035400390625, 1.3092193603515625, 1.3634033203125, 1.4175872802734375, 1.471771240234375, 1.5259552001953125, 1.58013916015625, 1.6343231201171875, 1.688507080078125, 1.7426910400390625, 1.796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 12.0, 22.0, 10.0, 24.0, 30.0, 30.0, 32.0, 43.0, 31.0, 50.0, 50.0, 60.0, 50.0, 55.0, 60.0, 42.0, 43.0, 45.0, 45.0, 45.0, 36.0, 35.0, 32.0, 19.0, 14.0, 12.0, 13.0, 11.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.8251953125, -0.8025283813476562, -0.7798614501953125, -0.7571945190429688, -0.734527587890625, -0.7118606567382812, -0.6891937255859375, -0.6665267944335938, -0.64385986328125, -0.6211929321289062, -0.5985260009765625, -0.5758590698242188, -0.553192138671875, -0.5305252075195312, -0.5078582763671875, -0.48519134521484375, -0.4625244140625, -0.43985748291015625, -0.4171905517578125, -0.39452362060546875, -0.371856689453125, -0.34918975830078125, -0.3265228271484375, -0.30385589599609375, -0.28118896484375, -0.25852203369140625, -0.2358551025390625, -0.21318817138671875, -0.190521240234375, -0.16785430908203125, -0.1451873779296875, -0.12252044677734375, -0.099853515625, -0.07718658447265625, -0.0545196533203125, -0.03185272216796875, -0.009185791015625, 0.01348114013671875, 0.0361480712890625, 0.05881500244140625, 0.08148193359375, 0.10414886474609375, 0.1268157958984375, 0.14948272705078125, 0.172149658203125, 0.19481658935546875, 0.2174835205078125, 0.24015045166015625, 0.2628173828125, 0.28548431396484375, 0.3081512451171875, 0.33081817626953125, 0.353485107421875, 0.37615203857421875, 0.3988189697265625, 0.42148590087890625, 0.44415283203125, 0.46681976318359375, 0.4894866943359375, 0.5121536254882812, 0.534820556640625, 0.5574874877929688, 0.5801544189453125, 0.6028213500976562, 0.62548828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 19.0, 23.0, 22.0, 38.0, 66.0, 100.0, 115.0, 172.0, 266.0, 365.0, 602.0, 1085.0, 3060.0, 22592.0, 625591.0, 375131.0, 14197.0, 2469.0, 1024.0, 523.0, 322.0, 207.0, 146.0, 112.0, 75.0, 54.0, 43.0, 31.0, 31.0, 16.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.46484375, -6.2796630859375, -6.094482421875, -5.9093017578125, -5.72412109375, -5.5389404296875, -5.353759765625, -5.1685791015625, -4.9833984375, -4.7982177734375, -4.613037109375, -4.4278564453125, -4.24267578125, -4.0574951171875, -3.872314453125, -3.6871337890625, -3.501953125, -3.3167724609375, -3.131591796875, -2.9464111328125, -2.76123046875, -2.5760498046875, -2.390869140625, -2.2056884765625, -2.0205078125, -1.8353271484375, -1.650146484375, -1.4649658203125, -1.27978515625, -1.0946044921875, -0.909423828125, -0.7242431640625, -0.5390625, -0.3538818359375, -0.168701171875, 0.0164794921875, 0.20166015625, 0.3868408203125, 0.572021484375, 0.7572021484375, 0.9423828125, 1.1275634765625, 1.312744140625, 1.4979248046875, 1.68310546875, 1.8682861328125, 2.053466796875, 2.2386474609375, 2.423828125, 2.6090087890625, 2.794189453125, 2.9793701171875, 3.16455078125, 3.3497314453125, 3.534912109375, 3.7200927734375, 3.9052734375, 4.0904541015625, 4.275634765625, 4.4608154296875, 4.64599609375, 4.8311767578125, 5.016357421875, 5.2015380859375, 5.38671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 15.0, 16.0, 24.0, 19.0, 20.0, 25.0, 31.0, 41.0, 37.0, 35.0, 44.0, 39.0, 30.0, 34.0, 50.0, 54.0, 44.0, 47.0, 41.0, 33.0, 41.0, 46.0, 31.0, 35.0, 20.0, 17.0, 15.0, 16.0, 14.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.30755615234375, -2.2225341796875, -2.13751220703125, -2.052490234375, -1.96746826171875, -1.8824462890625, -1.79742431640625, -1.71240234375, -1.62738037109375, -1.5423583984375, -1.45733642578125, -1.372314453125, -1.28729248046875, -1.2022705078125, -1.11724853515625, -1.0322265625, -0.94720458984375, -0.8621826171875, -0.77716064453125, -0.692138671875, -0.60711669921875, -0.5220947265625, -0.43707275390625, -0.35205078125, -0.26702880859375, -0.1820068359375, -0.09698486328125, -0.011962890625, 0.07305908203125, 0.1580810546875, 0.24310302734375, 0.328125, 0.41314697265625, 0.4981689453125, 0.58319091796875, 0.668212890625, 0.75323486328125, 0.8382568359375, 0.92327880859375, 1.00830078125, 1.09332275390625, 1.1783447265625, 1.26336669921875, 1.348388671875, 1.43341064453125, 1.5184326171875, 1.60345458984375, 1.6884765625, 1.77349853515625, 1.8585205078125, 1.94354248046875, 2.028564453125, 2.11358642578125, 2.1986083984375, 2.28363037109375, 2.36865234375, 2.45367431640625, 2.5386962890625, 2.62371826171875, 2.708740234375, 2.79376220703125, 2.8787841796875, 2.96380615234375, 3.048828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 25.0, 19.0, 36.0, 44.0, 74.0, 81.0, 122.0, 204.0, 365.0, 733.0, 1829.0, 6037.0, 34443.0, 402963.0, 544851.0, 45298.0, 7429.0, 2063.0, 787.0, 415.0, 204.0, 152.0, 81.0, 76.0, 53.0, 33.0, 19.0, 20.0, 10.0, 9.0, 5.0, 8.0, 9.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9306640625, -1.8685150146484375, -1.806365966796875, -1.7442169189453125, -1.68206787109375, -1.6199188232421875, -1.557769775390625, -1.4956207275390625, -1.4334716796875, -1.3713226318359375, -1.309173583984375, -1.2470245361328125, -1.18487548828125, -1.1227264404296875, -1.060577392578125, -0.9984283447265625, -0.936279296875, -0.8741302490234375, -0.811981201171875, -0.7498321533203125, -0.68768310546875, -0.6255340576171875, -0.563385009765625, -0.5012359619140625, -0.4390869140625, -0.3769378662109375, -0.314788818359375, -0.2526397705078125, -0.19049072265625, -0.1283416748046875, -0.066192626953125, -0.0040435791015625, 0.05810546875, 0.1202545166015625, 0.182403564453125, 0.2445526123046875, 0.30670166015625, 0.3688507080078125, 0.430999755859375, 0.4931488037109375, 0.5552978515625, 0.6174468994140625, 0.679595947265625, 0.7417449951171875, 0.80389404296875, 0.8660430908203125, 0.928192138671875, 0.9903411865234375, 1.052490234375, 1.1146392822265625, 1.176788330078125, 1.2389373779296875, 1.30108642578125, 1.3632354736328125, 1.425384521484375, 1.4875335693359375, 1.5496826171875, 1.6118316650390625, 1.673980712890625, 1.7361297607421875, 1.79827880859375, 1.8604278564453125, 1.922576904296875, 1.9847259521484375, 2.046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 11.0, 16.0, 33.0, 38.0, 47.0, 72.0, 94.0, 98.0, 120.0, 105.0, 86.0, 74.0, 64.0, 35.0, 22.0, 11.0, 13.0, 12.0, 6.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000186920166015625, -0.00017854943871498108, -0.00017017871141433716, -0.00016180798411369324, -0.00015343725681304932, -0.0001450665295124054, -0.00013669580221176147, -0.00012832507491111755, -0.00011995434761047363, -0.00011158362030982971, -0.00010321289300918579, -9.484216570854187e-05, -8.647143840789795e-05, -7.810071110725403e-05, -6.972998380661011e-05, -6.135925650596619e-05, -5.2988529205322266e-05, -4.4617801904678345e-05, -3.6247074604034424e-05, -2.7876347303390503e-05, -1.9505620002746582e-05, -1.1134892702102661e-05, -2.7641654014587402e-06, 5.606561899185181e-06, 1.3977289199829102e-05, 2.2348016500473022e-05, 3.071874380111694e-05, 3.9089471101760864e-05, 4.7460198402404785e-05, 5.5830925703048706e-05, 6.420165300369263e-05, 7.257238030433655e-05, 8.094310760498047e-05, 8.931383490562439e-05, 9.768456220626831e-05, 0.00010605528950691223, 0.00011442601680755615, 0.00012279674410820007, 0.000131167471408844, 0.00013953819870948792, 0.00014790892601013184, 0.00015627965331077576, 0.00016465038061141968, 0.0001730211079120636, 0.00018139183521270752, 0.00018976256251335144, 0.00019813328981399536, 0.00020650401711463928, 0.0002148747444152832, 0.00022324547171592712, 0.00023161619901657104, 0.00023998692631721497, 0.0002483576536178589, 0.0002567283809185028, 0.00026509910821914673, 0.00027346983551979065, 0.00028184056282043457, 0.0002902112901210785, 0.0002985820174217224, 0.00030695274472236633, 0.00031532347202301025, 0.0003236941993236542, 0.0003320649266242981, 0.000340435653924942, 0.00034880638122558594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 4.0, 8.0, 7.0, 16.0, 15.0, 14.0, 32.0, 47.0, 56.0, 97.0, 141.0, 240.0, 465.0, 849.0, 2152.0, 6704.0, 34801.0, 457532.0, 497345.0, 36684.0, 7046.0, 2205.0, 872.0, 485.0, 235.0, 157.0, 102.0, 60.0, 50.0, 33.0, 24.0, 18.0, 8.0, 7.0, 4.0, 7.0, 1.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.16796875, -2.100250244140625, -2.03253173828125, -1.964813232421875, -1.8970947265625, -1.829376220703125, -1.76165771484375, -1.693939208984375, -1.626220703125, -1.558502197265625, -1.49078369140625, -1.423065185546875, -1.3553466796875, -1.287628173828125, -1.21990966796875, -1.152191162109375, -1.08447265625, -1.016754150390625, -0.94903564453125, -0.881317138671875, -0.8135986328125, -0.745880126953125, -0.67816162109375, -0.610443115234375, -0.542724609375, -0.475006103515625, -0.40728759765625, -0.339569091796875, -0.2718505859375, -0.204132080078125, -0.13641357421875, -0.068695068359375, -0.0009765625, 0.066741943359375, 0.13446044921875, 0.202178955078125, 0.2698974609375, 0.337615966796875, 0.40533447265625, 0.473052978515625, 0.540771484375, 0.608489990234375, 0.67620849609375, 0.743927001953125, 0.8116455078125, 0.879364013671875, 0.94708251953125, 1.014801025390625, 1.08251953125, 1.150238037109375, 1.21795654296875, 1.285675048828125, 1.3533935546875, 1.421112060546875, 1.48883056640625, 1.556549072265625, 1.624267578125, 1.691986083984375, 1.75970458984375, 1.827423095703125, 1.8951416015625, 1.962860107421875, 2.03057861328125, 2.098297119140625, 2.166015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 1.0, 10.0, 16.0, 24.0, 45.0, 59.0, 105.0, 102.0, 125.0, 110.0, 103.0, 74.0, 51.0, 39.0, 34.0, 20.0, 13.0, 4.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.10009765625, -2.0361328125, -1.97216796875, -1.908203125, -1.84423828125, -1.7802734375, -1.71630859375, -1.65234375, -1.58837890625, -1.5244140625, -1.46044921875, -1.396484375, -1.33251953125, -1.2685546875, -1.20458984375, -1.140625, -1.07666015625, -1.0126953125, -0.94873046875, -0.884765625, -0.82080078125, -0.7568359375, -0.69287109375, -0.62890625, -0.56494140625, -0.5009765625, -0.43701171875, -0.373046875, -0.30908203125, -0.2451171875, -0.18115234375, -0.1171875, -0.05322265625, 0.0107421875, 0.07470703125, 0.138671875, 0.20263671875, 0.2666015625, 0.33056640625, 0.39453125, 0.45849609375, 0.5224609375, 0.58642578125, 0.650390625, 0.71435546875, 0.7783203125, 0.84228515625, 0.90625, 0.97021484375, 1.0341796875, 1.09814453125, 1.162109375, 1.22607421875, 1.2900390625, 1.35400390625, 1.41796875, 1.48193359375, 1.5458984375, 1.60986328125, 1.673828125, 1.73779296875, 1.8017578125, 1.86572265625, 1.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 14.0, 15.0, 22.0, 30.0, 38.0, 55.0, 73.0, 93.0, 117.0, 116.0, 103.0, 104.0, 58.0, 44.0, 32.0, 19.0, 18.0, 10.0, 4.0, 9.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.40669059753418, -15.849669456481934, -15.292649269104004, -14.735628128051758, -14.178607940673828, -13.621586799621582, -13.064565658569336, -12.507545471191406, -11.950525283813477, -11.39350414276123, -10.8364839553833, -10.279462814331055, -9.722442626953125, -9.165421485900879, -8.608400344848633, -8.051380157470703, -7.494359016418457, -6.937338352203369, -6.380317687988281, -5.823296546936035, -5.2662763595581055, -4.709255218505859, -4.1522345542907715, -3.5952138900756836, -3.0381932258605957, -2.481172561645508, -1.9241517782211304, -1.367130994796753, -0.810110330581665, -0.25308966636657715, 0.30393123626708984, 0.8609519004821777, 1.4179725646972656, 1.9749932289123535, 2.5320138931274414, 3.0890347957611084, 3.6460554599761963, 4.203076362609863, 4.760097026824951, 5.317117691040039, 5.874138355255127, 6.431159019470215, 6.988179683685303, 7.545200347900391, 8.102221488952637, 8.659241676330566, 9.216262817382812, 9.773283004760742, 10.330304145812988, 10.887325286865234, 11.444345474243164, 12.00136661529541, 12.55838680267334, 13.115407943725586, 13.672428131103516, 14.229449272155762, 14.786470413208008, 15.343491554260254, 15.900511741638184, 16.45753288269043, 17.01455307006836, 17.57157325744629, 18.12859535217285, 18.68561553955078, 19.24263572692871]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 11.0, 11.0, 15.0, 19.0, 19.0, 15.0, 31.0, 29.0, 40.0, 42.0, 39.0, 44.0, 45.0, 50.0, 45.0, 46.0, 47.0, 49.0, 44.0, 45.0, 36.0, 40.0, 47.0, 27.0, 18.0, 23.0, 27.0, 11.0, 16.0, 13.0, 13.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.54494857788086, -14.098066329956055, -13.65118408203125, -13.204301834106445, -12.75741958618164, -12.310537338256836, -11.863655090332031, -11.416772842407227, -10.969890594482422, -10.523008346557617, -10.076126098632812, -9.629243850708008, -9.182361602783203, -8.735479354858398, -8.288597106933594, -7.841714382171631, -7.394831657409668, -6.947949409484863, -6.501067161560059, -6.054184913635254, -5.607302665710449, -5.1604204177856445, -4.713537693023682, -4.266655445098877, -3.8197731971740723, -3.3728909492492676, -2.926008701324463, -2.479126214981079, -2.0322439670562744, -1.5853617191314697, -1.138479232788086, -0.6915969848632812, -0.24471378326416016, 0.2021685242652893, 0.6490508317947388, 1.095933198928833, 1.5428154468536377, 1.9896976947784424, 2.436580181121826, 2.883462429046631, 3.3303446769714355, 3.7772269248962402, 4.224109172821045, 4.670991897583008, 5.1178741455078125, 5.564756393432617, 6.011638641357422, 6.458520889282227, 6.905403137207031, 7.352285385131836, 7.799167633056641, 8.246049880981445, 8.69293212890625, 9.139814376831055, 9.58669662475586, 10.033578872680664, 10.480461120605469, 10.927343368530273, 11.374225616455078, 11.821107864379883, 12.267990112304688, 12.714872360229492, 13.161754608154297, 13.608636856079102, 14.055520057678223]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 17.0, 22.0, 43.0, 55.0, 88.0, 134.0, 247.0, 551.0, 2223.0, 41773.0, 4139690.0, 7361.0, 1144.0, 384.0, 229.0, 99.0, 54.0, 40.0, 30.0, 13.0, 11.0, 9.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.390625, -13.0496826171875, -12.708740234375, -12.3677978515625, -12.02685546875, -11.6859130859375, -11.344970703125, -11.0040283203125, -10.6630859375, -10.3221435546875, -9.981201171875, -9.6402587890625, -9.29931640625, -8.9583740234375, -8.617431640625, -8.2764892578125, -7.935546875, -7.5946044921875, -7.253662109375, -6.9127197265625, -6.57177734375, -6.2308349609375, -5.889892578125, -5.5489501953125, -5.2080078125, -4.8670654296875, -4.526123046875, -4.1851806640625, -3.84423828125, -3.5032958984375, -3.162353515625, -2.8214111328125, -2.48046875, -2.1395263671875, -1.798583984375, -1.4576416015625, -1.11669921875, -0.7757568359375, -0.434814453125, -0.0938720703125, 0.2470703125, 0.5880126953125, 0.928955078125, 1.2698974609375, 1.61083984375, 1.9517822265625, 2.292724609375, 2.6336669921875, 2.974609375, 3.3155517578125, 3.656494140625, 3.9974365234375, 4.33837890625, 4.6793212890625, 5.020263671875, 5.3612060546875, 5.7021484375, 6.0430908203125, 6.384033203125, 6.7249755859375, 7.06591796875, 7.4068603515625, 7.747802734375, 8.0887451171875, 8.4296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 8.0, 10.0, 15.0, 15.0, 30.0, 26.0, 23.0, 55.0, 42.0, 57.0, 46.0, 70.0, 62.0, 64.0, 63.0, 60.0, 50.0, 40.0, 41.0, 42.0, 34.0, 30.0, 26.0, 19.0, 14.0, 16.0, 7.0, 7.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8100433349609375, -0.782684326171875, -0.7553253173828125, -0.72796630859375, -0.7006072998046875, -0.673248291015625, -0.6458892822265625, -0.6185302734375, -0.5911712646484375, -0.563812255859375, -0.5364532470703125, -0.50909423828125, -0.4817352294921875, -0.454376220703125, -0.4270172119140625, -0.399658203125, -0.3722991943359375, -0.344940185546875, -0.3175811767578125, -0.29022216796875, -0.2628631591796875, -0.235504150390625, -0.2081451416015625, -0.1807861328125, -0.1534271240234375, -0.126068115234375, -0.0987091064453125, -0.07135009765625, -0.0439910888671875, -0.016632080078125, 0.0107269287109375, 0.0380859375, 0.0654449462890625, 0.092803955078125, 0.1201629638671875, 0.14752197265625, 0.1748809814453125, 0.202239990234375, 0.2295989990234375, 0.2569580078125, 0.2843170166015625, 0.311676025390625, 0.3390350341796875, 0.36639404296875, 0.3937530517578125, 0.421112060546875, 0.4484710693359375, 0.475830078125, 0.5031890869140625, 0.530548095703125, 0.5579071044921875, 0.58526611328125, 0.6126251220703125, 0.639984130859375, 0.6673431396484375, 0.6947021484375, 0.7220611572265625, 0.749420166015625, 0.7767791748046875, 0.80413818359375, 0.8314971923828125, 0.858856201171875, 0.8862152099609375, 0.91357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 3.0, 14.0, 18.0, 22.0, 31.0, 53.0, 66.0, 91.0, 115.0, 181.0, 346.0, 620.0, 1110.0, 2436.0, 6118.0, 21587.0, 257002.0, 3853134.0, 36748.0, 8336.0, 3110.0, 1360.0, 702.0, 372.0, 223.0, 161.0, 78.0, 60.0, 50.0, 40.0, 20.0, 20.0, 8.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.4915771484375, -2.403076171875, -2.3145751953125, -2.22607421875, -2.1375732421875, -2.049072265625, -1.9605712890625, -1.8720703125, -1.7835693359375, -1.695068359375, -1.6065673828125, -1.51806640625, -1.4295654296875, -1.341064453125, -1.2525634765625, -1.1640625, -1.0755615234375, -0.987060546875, -0.8985595703125, -0.81005859375, -0.7215576171875, -0.633056640625, -0.5445556640625, -0.4560546875, -0.3675537109375, -0.279052734375, -0.1905517578125, -0.10205078125, -0.0135498046875, 0.074951171875, 0.1634521484375, 0.251953125, 0.3404541015625, 0.428955078125, 0.5174560546875, 0.60595703125, 0.6944580078125, 0.782958984375, 0.8714599609375, 0.9599609375, 1.0484619140625, 1.136962890625, 1.2254638671875, 1.31396484375, 1.4024658203125, 1.490966796875, 1.5794677734375, 1.66796875, 1.7564697265625, 1.844970703125, 1.9334716796875, 2.02197265625, 2.1104736328125, 2.198974609375, 2.2874755859375, 2.3759765625, 2.4644775390625, 2.552978515625, 2.6414794921875, 2.72998046875, 2.8184814453125, 2.906982421875, 2.9954833984375, 3.083984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 25.0, 55.0, 146.0, 3173.0, 455.0, 102.0, 36.0, 14.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0783615112304688, -1.0532073974609375, -1.0280532836914062, -1.002899169921875, -0.9777450561523438, -0.9525909423828125, -0.9274368286132812, -0.90228271484375, -0.8771286010742188, -0.8519744873046875, -0.8268203735351562, -0.801666259765625, -0.7765121459960938, -0.7513580322265625, -0.7262039184570312, -0.7010498046875, -0.6758956909179688, -0.6507415771484375, -0.6255874633789062, -0.600433349609375, -0.5752792358398438, -0.5501251220703125, -0.5249710083007812, -0.49981689453125, -0.47466278076171875, -0.4495086669921875, -0.42435455322265625, -0.399200439453125, -0.37404632568359375, -0.3488922119140625, -0.32373809814453125, -0.298583984375, -0.27342987060546875, -0.2482757568359375, -0.22312164306640625, -0.197967529296875, -0.17281341552734375, -0.1476593017578125, -0.12250518798828125, -0.09735107421875, -0.07219696044921875, -0.0470428466796875, -0.02188873291015625, 0.003265380859375, 0.02841949462890625, 0.0535736083984375, 0.07872772216796875, 0.1038818359375, 0.12903594970703125, 0.1541900634765625, 0.17934417724609375, 0.204498291015625, 0.22965240478515625, 0.2548065185546875, 0.27996063232421875, 0.30511474609375, 0.33026885986328125, 0.3554229736328125, 0.38057708740234375, 0.405731201171875, 0.43088531494140625, 0.4560394287109375, 0.48119354248046875, 0.50634765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 10.0, 20.0, 26.0, 49.0, 84.0, 118.0, 163.0, 151.0, 137.0, 111.0, 45.0, 31.0, 18.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039318323135376, -2.9488184452056885, -2.85831880569458, -2.7678189277648926, -2.677319049835205, -2.5868191719055176, -2.496319532394409, -2.4058196544647217, -2.315319776535034, -2.2248198986053467, -2.1343202590942383, -2.043820381164551, -1.9533205032348633, -1.8628207445144653, -1.7723209857940674, -1.6818211078643799, -1.591321349143982, -1.500821590423584, -1.4103217124938965, -1.3198219537734985, -1.229322075843811, -1.138822317123413, -1.0483224391937256, -0.9578226804733276, -0.8673228621482849, -0.7768230438232422, -0.6863232254981995, -0.5958234071731567, -0.5053236484527588, -0.4148238003253937, -0.32432401180267334, -0.23382419347763062, -0.1433243751525879, -0.05282456427812576, 0.037675246596336365, 0.1281750500202179, 0.21867486834526062, 0.30917468667030334, 0.3996744751930237, 0.4901742935180664, 0.5806741118431091, 0.6711739301681519, 0.7616737484931946, 0.8521735668182373, 0.9426733255386353, 1.0331732034683228, 1.1236729621887207, 1.2141728401184082, 1.3046725988388062, 1.395172357559204, 1.4856722354888916, 1.5761719942092896, 1.666671872138977, 1.757171630859375, 1.8476715087890625, 1.9381712675094604, 2.0286710262298584, 2.119170904159546, 2.2096705436706543, 2.300170421600342, 2.3906702995300293, 2.481170177459717, 2.571669816970825, 2.6621696949005127, 2.7526695728302]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 11.0, 9.0, 14.0, 7.0, 24.0, 22.0, 32.0, 29.0, 32.0, 33.0, 40.0, 52.0, 51.0, 44.0, 64.0, 47.0, 44.0, 63.0, 46.0, 42.0, 31.0, 33.0, 28.0, 37.0, 36.0, 23.0, 32.0, 18.0, 12.0, 6.0, 4.0, 2.0, 5.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798314094543457, -1.747164011001587, -1.6960139274597168, -1.6448638439178467, -1.5937137603759766, -1.5425636768341064, -1.4914137125015259, -1.4402636289596558, -1.3891135454177856, -1.3379634618759155, -1.2868133783340454, -1.2356632947921753, -1.1845133304595947, -1.1333632469177246, -1.0822131633758545, -1.0310630798339844, -0.9799129962921143, -0.9287629127502441, -0.877612829208374, -0.8264628052711487, -0.7753127217292786, -0.7241626381874084, -0.6730126142501831, -0.621862530708313, -0.5707124471664429, -0.5195623636245728, -0.468412309885025, -0.4172622561454773, -0.3661121726036072, -0.31496208906173706, -0.26381203532218933, -0.2126619815826416, -0.16151189804077148, -0.11036182940006256, -0.05921176075935364, -0.008061692118644714, 0.04308837652206421, 0.09423846006393433, 0.14538851380348206, 0.19653856754302979, 0.2476886510848999, 0.29883873462677, 0.34998878836631775, 0.4011388421058655, 0.4522889256477356, 0.5034390091896057, 0.554589033126831, 0.6057391166687012, 0.6568892002105713, 0.7080392837524414, 0.7591893672943115, 0.8103393912315369, 0.861489474773407, 0.9126395583152771, 0.9637895822525024, 1.0149396657943726, 1.0660897493362427, 1.1172398328781128, 1.168389916419983, 1.219539999961853, 1.2706899642944336, 1.3218400478363037, 1.3729901313781738, 1.424140214920044, 1.475290298461914]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 5.0, 13.0, 19.0, 31.0, 55.0, 69.0, 139.0, 266.0, 561.0, 1141.0, 2871.0, 9184.0, 37109.0, 178648.0, 513278.0, 238060.0, 49100.0, 11849.0, 3618.0, 1334.0, 553.0, 269.0, 132.0, 91.0, 49.0, 30.0, 22.0, 10.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.498046875, -3.404998779296875, -3.31195068359375, -3.218902587890625, -3.1258544921875, -3.032806396484375, -2.93975830078125, -2.846710205078125, -2.753662109375, -2.660614013671875, -2.56756591796875, -2.474517822265625, -2.3814697265625, -2.288421630859375, -2.19537353515625, -2.102325439453125, -2.00927734375, -1.916229248046875, -1.82318115234375, -1.730133056640625, -1.6370849609375, -1.544036865234375, -1.45098876953125, -1.357940673828125, -1.264892578125, -1.171844482421875, -1.07879638671875, -0.985748291015625, -0.8927001953125, -0.799652099609375, -0.70660400390625, -0.613555908203125, -0.5205078125, -0.427459716796875, -0.33441162109375, -0.241363525390625, -0.1483154296875, -0.055267333984375, 0.03778076171875, 0.130828857421875, 0.223876953125, 0.316925048828125, 0.40997314453125, 0.503021240234375, 0.5960693359375, 0.689117431640625, 0.78216552734375, 0.875213623046875, 0.96826171875, 1.061309814453125, 1.15435791015625, 1.247406005859375, 1.3404541015625, 1.433502197265625, 1.52655029296875, 1.619598388671875, 1.712646484375, 1.805694580078125, 1.89874267578125, 1.991790771484375, 2.0848388671875, 2.177886962890625, 2.27093505859375, 2.363983154296875, 2.45703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 11.0, 12.0, 19.0, 19.0, 32.0, 36.0, 32.0, 56.0, 63.0, 56.0, 58.0, 65.0, 67.0, 73.0, 57.0, 51.0, 48.0, 43.0, 37.0, 37.0, 23.0, 21.0, 14.0, 16.0, 10.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.7950592041015625, -0.763946533203125, -0.7328338623046875, -0.70172119140625, -0.6706085205078125, -0.639495849609375, -0.6083831787109375, -0.5772705078125, -0.5461578369140625, -0.515045166015625, -0.4839324951171875, -0.45281982421875, -0.4217071533203125, -0.390594482421875, -0.3594818115234375, -0.328369140625, -0.2972564697265625, -0.266143798828125, -0.2350311279296875, -0.20391845703125, -0.1728057861328125, -0.141693115234375, -0.1105804443359375, -0.0794677734375, -0.0483551025390625, -0.017242431640625, 0.0138702392578125, 0.04498291015625, 0.0760955810546875, 0.107208251953125, 0.1383209228515625, 0.16943359375, 0.2005462646484375, 0.231658935546875, 0.2627716064453125, 0.29388427734375, 0.3249969482421875, 0.356109619140625, 0.3872222900390625, 0.4183349609375, 0.4494476318359375, 0.480560302734375, 0.5116729736328125, 0.54278564453125, 0.5738983154296875, 0.605010986328125, 0.6361236572265625, 0.667236328125, 0.6983489990234375, 0.729461669921875, 0.7605743408203125, 0.79168701171875, 0.8227996826171875, 0.853912353515625, 0.8850250244140625, 0.9161376953125, 0.9472503662109375, 0.978363037109375, 1.0094757080078125, 1.04058837890625, 1.0717010498046875, 1.102813720703125, 1.1339263916015625, 1.1650390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 11.0, 8.0, 9.0, 10.0, 30.0, 46.0, 81.0, 84.0, 114.0, 210.0, 328.0, 601.0, 1155.0, 2887.0, 25646.0, 858131.0, 149706.0, 6021.0, 1577.0, 766.0, 429.0, 257.0, 164.0, 93.0, 70.0, 49.0, 20.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.9705810546875, -6.757568359375, -6.5445556640625, -6.33154296875, -6.1185302734375, -5.905517578125, -5.6925048828125, -5.4794921875, -5.2664794921875, -5.053466796875, -4.8404541015625, -4.62744140625, -4.4144287109375, -4.201416015625, -3.9884033203125, -3.775390625, -3.5623779296875, -3.349365234375, -3.1363525390625, -2.92333984375, -2.7103271484375, -2.497314453125, -2.2843017578125, -2.0712890625, -1.8582763671875, -1.645263671875, -1.4322509765625, -1.21923828125, -1.0062255859375, -0.793212890625, -0.5802001953125, -0.3671875, -0.1541748046875, 0.058837890625, 0.2718505859375, 0.48486328125, 0.6978759765625, 0.910888671875, 1.1239013671875, 1.3369140625, 1.5499267578125, 1.762939453125, 1.9759521484375, 2.18896484375, 2.4019775390625, 2.614990234375, 2.8280029296875, 3.041015625, 3.2540283203125, 3.467041015625, 3.6800537109375, 3.89306640625, 4.1060791015625, 4.319091796875, 4.5321044921875, 4.7451171875, 4.9581298828125, 5.171142578125, 5.3841552734375, 5.59716796875, 5.8101806640625, 6.023193359375, 6.2362060546875, 6.44921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 0.0, 7.0, 7.0, 9.0, 10.0, 18.0, 25.0, 28.0, 23.0, 38.0, 46.0, 58.0, 53.0, 48.0, 89.0, 66.0, 58.0, 72.0, 60.0, 47.0, 46.0, 47.0, 38.0, 26.0, 21.0, 19.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.11285400390625, -3.9522705078125, -3.79168701171875, -3.631103515625, -3.47052001953125, -3.3099365234375, -3.14935302734375, -2.98876953125, -2.82818603515625, -2.6676025390625, -2.50701904296875, -2.346435546875, -2.18585205078125, -2.0252685546875, -1.86468505859375, -1.7041015625, -1.54351806640625, -1.3829345703125, -1.22235107421875, -1.061767578125, -0.90118408203125, -0.7406005859375, -0.58001708984375, -0.41943359375, -0.25885009765625, -0.0982666015625, 0.06231689453125, 0.222900390625, 0.38348388671875, 0.5440673828125, 0.70465087890625, 0.865234375, 1.02581787109375, 1.1864013671875, 1.34698486328125, 1.507568359375, 1.66815185546875, 1.8287353515625, 1.98931884765625, 2.14990234375, 2.31048583984375, 2.4710693359375, 2.63165283203125, 2.792236328125, 2.95281982421875, 3.1134033203125, 3.27398681640625, 3.4345703125, 3.59515380859375, 3.7557373046875, 3.91632080078125, 4.076904296875, 4.23748779296875, 4.3980712890625, 4.55865478515625, 4.71923828125, 4.87982177734375, 5.0404052734375, 5.20098876953125, 5.361572265625, 5.52215576171875, 5.6827392578125, 5.84332275390625, 6.00390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 19.0, 15.0, 35.0, 50.0, 57.0, 127.0, 182.0, 374.0, 1031.0, 10553.0, 974315.0, 58658.0, 1952.0, 545.0, 228.0, 130.0, 82.0, 59.0, 34.0, 22.0, 11.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.64227294921875, -5.4642333984375, -5.28619384765625, -5.108154296875, -4.93011474609375, -4.7520751953125, -4.57403564453125, -4.39599609375, -4.21795654296875, -4.0399169921875, -3.86187744140625, -3.683837890625, -3.50579833984375, -3.3277587890625, -3.14971923828125, -2.9716796875, -2.79364013671875, -2.6156005859375, -2.43756103515625, -2.259521484375, -2.08148193359375, -1.9034423828125, -1.72540283203125, -1.54736328125, -1.36932373046875, -1.1912841796875, -1.01324462890625, -0.835205078125, -0.65716552734375, -0.4791259765625, -0.30108642578125, -0.123046875, 0.05499267578125, 0.2330322265625, 0.41107177734375, 0.589111328125, 0.76715087890625, 0.9451904296875, 1.12322998046875, 1.30126953125, 1.47930908203125, 1.6573486328125, 1.83538818359375, 2.013427734375, 2.19146728515625, 2.3695068359375, 2.54754638671875, 2.7255859375, 2.90362548828125, 3.0816650390625, 3.25970458984375, 3.437744140625, 3.61578369140625, 3.7938232421875, 3.97186279296875, 4.14990234375, 4.32794189453125, 4.5059814453125, 4.68402099609375, 4.862060546875, 5.04010009765625, 5.2181396484375, 5.39617919921875, 5.57421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 6.0, 3.0, 11.0, 5.0, 11.0, 16.0, 20.0, 23.0, 36.0, 31.0, 58.0, 73.0, 98.0, 103.0, 115.0, 84.0, 59.0, 55.0, 39.0, 37.0, 25.0, 20.0, 10.0, 9.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022470951080322266, -0.0002178587019443512, -0.00021100789308547974, -0.00020415708422660828, -0.00019730627536773682, -0.00019045546650886536, -0.0001836046576499939, -0.00017675384879112244, -0.00016990303993225098, -0.00016305223107337952, -0.00015620142221450806, -0.0001493506133556366, -0.00014249980449676514, -0.00013564899563789368, -0.00012879818677902222, -0.00012194737792015076, -0.0001150965690612793, -0.00010824576020240784, -0.00010139495134353638, -9.454414248466492e-05, -8.769333362579346e-05, -8.0842524766922e-05, -7.399171590805054e-05, -6.714090704917908e-05, -6.029009819030762e-05, -5.343928933143616e-05, -4.65884804725647e-05, -3.973767161369324e-05, -3.288686275482178e-05, -2.6036053895950317e-05, -1.9185245037078857e-05, -1.2334436178207397e-05, -5.4836273193359375e-06, 1.3671815395355225e-06, 8.217990398406982e-06, 1.5068799257278442e-05, 2.1919608116149902e-05, 2.8770416975021362e-05, 3.562122583389282e-05, 4.247203469276428e-05, 4.932284355163574e-05, 5.61736524105072e-05, 6.302446126937866e-05, 6.987527012825012e-05, 7.672607898712158e-05, 8.357688784599304e-05, 9.04276967048645e-05, 9.727850556373596e-05, 0.00010412931442260742, 0.00011098012328147888, 0.00011783093214035034, 0.0001246817409992218, 0.00013153254985809326, 0.00013838335871696472, 0.00014523416757583618, 0.00015208497643470764, 0.0001589357852935791, 0.00016578659415245056, 0.00017263740301132202, 0.00017948821187019348, 0.00018633902072906494, 0.0001931898295879364, 0.00020004063844680786, 0.00020689144730567932, 0.00021374225616455078]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 12.0, 4.0, 11.0, 7.0, 20.0, 25.0, 40.0, 41.0, 72.0, 118.0, 180.0, 322.0, 794.0, 2212.0, 10675.0, 251798.0, 757432.0, 19608.0, 3113.0, 987.0, 449.0, 237.0, 140.0, 78.0, 48.0, 41.0, 25.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.442413330078125, -3.32818603515625, -3.213958740234375, -3.0997314453125, -2.985504150390625, -2.87127685546875, -2.757049560546875, -2.642822265625, -2.528594970703125, -2.41436767578125, -2.300140380859375, -2.1859130859375, -2.071685791015625, -1.95745849609375, -1.843231201171875, -1.72900390625, -1.614776611328125, -1.50054931640625, -1.386322021484375, -1.2720947265625, -1.157867431640625, -1.04364013671875, -0.929412841796875, -0.815185546875, -0.700958251953125, -0.58673095703125, -0.472503662109375, -0.3582763671875, -0.244049072265625, -0.12982177734375, -0.015594482421875, 0.0986328125, 0.212860107421875, 0.32708740234375, 0.441314697265625, 0.5555419921875, 0.669769287109375, 0.78399658203125, 0.898223876953125, 1.012451171875, 1.126678466796875, 1.24090576171875, 1.355133056640625, 1.4693603515625, 1.583587646484375, 1.69781494140625, 1.812042236328125, 1.92626953125, 2.040496826171875, 2.15472412109375, 2.268951416015625, 2.3831787109375, 2.497406005859375, 2.61163330078125, 2.725860595703125, 2.840087890625, 2.954315185546875, 3.06854248046875, 3.182769775390625, 3.2969970703125, 3.411224365234375, 3.52545166015625, 3.639678955078125, 3.75390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 8.0, 10.0, 28.0, 39.0, 51.0, 53.0, 94.0, 132.0, 134.0, 129.0, 71.0, 72.0, 59.0, 28.0, 20.0, 11.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.59381103515625, -2.5079345703125, -2.42205810546875, -2.336181640625, -2.25030517578125, -2.1644287109375, -2.07855224609375, -1.99267578125, -1.90679931640625, -1.8209228515625, -1.73504638671875, -1.649169921875, -1.56329345703125, -1.4774169921875, -1.39154052734375, -1.3056640625, -1.21978759765625, -1.1339111328125, -1.04803466796875, -0.962158203125, -0.87628173828125, -0.7904052734375, -0.70452880859375, -0.61865234375, -0.53277587890625, -0.4468994140625, -0.36102294921875, -0.275146484375, -0.18927001953125, -0.1033935546875, -0.01751708984375, 0.068359375, 0.15423583984375, 0.2401123046875, 0.32598876953125, 0.411865234375, 0.49774169921875, 0.5836181640625, 0.66949462890625, 0.75537109375, 0.84124755859375, 0.9271240234375, 1.01300048828125, 1.098876953125, 1.18475341796875, 1.2706298828125, 1.35650634765625, 1.4423828125, 1.52825927734375, 1.6141357421875, 1.70001220703125, 1.785888671875, 1.87176513671875, 1.9576416015625, 2.04351806640625, 2.12939453125, 2.21527099609375, 2.3011474609375, 2.38702392578125, 2.472900390625, 2.55877685546875, 2.6446533203125, 2.73052978515625, 2.81640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 28.0, 142.0, 433.0, 325.0, 60.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.46310424804688, -102.12818908691406, -99.79326629638672, -97.45834350585938, -95.12342834472656, -92.78851318359375, -90.4535903930664, -88.11866760253906, -85.78375244140625, -83.44883728027344, -81.1139144897461, -78.77899169921875, -76.44407653808594, -74.10916137695312, -71.77423858642578, -69.43931579589844, -67.10440063476562, -64.76948547363281, -62.43456268310547, -60.09964370727539, -57.76472473144531, -55.429805755615234, -53.094886779785156, -50.75996780395508, -48.425048828125, -46.09012985229492, -43.755210876464844, -41.420291900634766, -39.08537292480469, -36.75045394897461, -34.41553497314453, -32.08061599731445, -29.745704650878906, -27.410785675048828, -25.07586669921875, -22.740947723388672, -20.406028747558594, -18.071109771728516, -15.736190795898438, -13.40127182006836, -11.066352844238281, -8.731433868408203, -6.396514892578125, -4.061595916748047, -1.7266769409179688, 0.6082420349121094, 2.9431610107421875, 5.278079986572266, 7.612998962402344, 9.947917938232422, 12.2828369140625, 14.617755889892578, 16.952674865722656, 19.287593841552734, 21.622512817382812, 23.95743179321289, 26.29235076904297, 28.627269744873047, 30.962188720703125, 33.2971076965332, 35.63202667236328, 37.96694564819336, 40.30186462402344, 42.636783599853516, 44.971702575683594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 6.0, 4.0, 12.0, 7.0, 9.0, 11.0, 18.0, 17.0, 17.0, 21.0, 25.0, 30.0, 32.0, 35.0, 34.0, 34.0, 38.0, 43.0, 53.0, 34.0, 47.0, 45.0, 50.0, 41.0, 40.0, 38.0, 27.0, 28.0, 21.0, 25.0, 32.0, 24.0, 19.0, 9.0, 7.0, 5.0, 13.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.858171463012695, -15.4027681350708, -14.947365760803223, -14.491962432861328, -14.03656005859375, -13.581156730651855, -13.125754356384277, -12.670351028442383, -12.214948654174805, -11.75954532623291, -11.304142951965332, -10.848739624023438, -10.39333724975586, -9.937933921813965, -9.482531547546387, -9.027128219604492, -8.571725845336914, -8.11632251739502, -7.660920143127441, -7.205517292022705, -6.750114440917969, -6.294711112976074, -5.839308738708496, -5.383905410766602, -4.928502082824707, -4.473099231719971, -4.017696380615234, -3.562293529510498, -3.1068906784057617, -2.6514875888824463, -2.19608473777771, -1.7406818866729736, -1.2852792739868164, -0.8298764228820801, -0.374473512172699, 0.08092939853668213, 0.5363322496414185, 0.9917352199554443, 1.4471380710601807, 1.902540922164917, 2.3579437732696533, 2.8133466243743896, 3.268749475479126, 3.7241525650024414, 4.179555416107178, 4.634958267211914, 5.09036111831665, 5.545763969421387, 6.001166820526123, 6.456569671630859, 6.911972522735596, 7.367375373840332, 7.822778224945068, 8.278181076049805, 8.7335844039917, 9.188986778259277, 9.644390106201172, 10.099793434143066, 10.555195808410645, 11.010599136352539, 11.466001510620117, 11.921404838562012, 12.37680721282959, 12.832210540771484, 13.287612915039062]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 12.0, 16.0, 24.0, 42.0, 66.0, 113.0, 169.0, 261.0, 529.0, 1086.0, 3374.0, 24605.0, 4050376.0, 103531.0, 6759.0, 1683.0, 723.0, 373.0, 191.0, 123.0, 64.0, 43.0, 27.0, 15.0, 12.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0], "bins": [-6.80859375, -6.63714599609375, -6.4656982421875, -6.29425048828125, -6.122802734375, -5.95135498046875, -5.7799072265625, -5.60845947265625, -5.43701171875, -5.26556396484375, -5.0941162109375, -4.92266845703125, -4.751220703125, -4.57977294921875, -4.4083251953125, -4.23687744140625, -4.0654296875, -3.89398193359375, -3.7225341796875, -3.55108642578125, -3.379638671875, -3.20819091796875, -3.0367431640625, -2.86529541015625, -2.69384765625, -2.52239990234375, -2.3509521484375, -2.17950439453125, -2.008056640625, -1.83660888671875, -1.6651611328125, -1.49371337890625, -1.322265625, -1.15081787109375, -0.9793701171875, -0.80792236328125, -0.636474609375, -0.46502685546875, -0.2935791015625, -0.12213134765625, 0.04931640625, 0.22076416015625, 0.3922119140625, 0.56365966796875, 0.735107421875, 0.90655517578125, 1.0780029296875, 1.24945068359375, 1.4208984375, 1.59234619140625, 1.7637939453125, 1.93524169921875, 2.106689453125, 2.27813720703125, 2.4495849609375, 2.62103271484375, 2.79248046875, 2.96392822265625, 3.1353759765625, 3.30682373046875, 3.478271484375, 3.64971923828125, 3.8211669921875, 3.99261474609375, 4.1640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 6.0, 2.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 12.0, 26.0, 37.0, 36.0, 41.0, 46.0, 51.0, 62.0, 61.0, 52.0, 41.0, 51.0, 45.0, 47.0, 61.0, 35.0, 31.0, 34.0, 36.0, 21.0, 15.0, 14.0, 16.0, 13.0, 7.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.9150390625, -0.889007568359375, -0.86297607421875, -0.836944580078125, -0.8109130859375, -0.784881591796875, -0.75885009765625, -0.732818603515625, -0.706787109375, -0.680755615234375, -0.65472412109375, -0.628692626953125, -0.6026611328125, -0.576629638671875, -0.55059814453125, -0.524566650390625, -0.49853515625, -0.472503662109375, -0.44647216796875, -0.420440673828125, -0.3944091796875, -0.368377685546875, -0.34234619140625, -0.316314697265625, -0.290283203125, -0.264251708984375, -0.23822021484375, -0.212188720703125, -0.1861572265625, -0.160125732421875, -0.13409423828125, -0.108062744140625, -0.08203125, -0.055999755859375, -0.02996826171875, -0.003936767578125, 0.0220947265625, 0.048126220703125, 0.07415771484375, 0.100189208984375, 0.126220703125, 0.152252197265625, 0.17828369140625, 0.204315185546875, 0.2303466796875, 0.256378173828125, 0.28240966796875, 0.308441162109375, 0.33447265625, 0.360504150390625, 0.38653564453125, 0.412567138671875, 0.4385986328125, 0.464630126953125, 0.49066162109375, 0.516693115234375, 0.542724609375, 0.568756103515625, 0.59478759765625, 0.620819091796875, 0.6468505859375, 0.672882080078125, 0.69891357421875, 0.724945068359375, 0.7509765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 10.0, 7.0, 19.0, 11.0, 22.0, 28.0, 36.0, 41.0, 50.0, 79.0, 105.0, 172.0, 268.0, 416.0, 663.0, 1235.0, 2625.0, 6999.0, 27291.0, 336434.0, 3752924.0, 47351.0, 10187.0, 3471.0, 1607.0, 814.0, 456.0, 285.0, 209.0, 130.0, 88.0, 60.0, 60.0, 26.0, 18.0, 22.0, 16.0, 13.0, 7.0, 6.0, 8.0, 3.0, 6.0, 1.0, 6.0, 0.0, 1.0, 3.0], "bins": [-3.119140625, -3.032867431640625, -2.94659423828125, -2.860321044921875, -2.7740478515625, -2.687774658203125, -2.60150146484375, -2.515228271484375, -2.428955078125, -2.342681884765625, -2.25640869140625, -2.170135498046875, -2.0838623046875, -1.997589111328125, -1.91131591796875, -1.825042724609375, -1.73876953125, -1.652496337890625, -1.56622314453125, -1.479949951171875, -1.3936767578125, -1.307403564453125, -1.22113037109375, -1.134857177734375, -1.048583984375, -0.962310791015625, -0.87603759765625, -0.789764404296875, -0.7034912109375, -0.617218017578125, -0.53094482421875, -0.444671630859375, -0.3583984375, -0.272125244140625, -0.18585205078125, -0.099578857421875, -0.0133056640625, 0.072967529296875, 0.15924072265625, 0.245513916015625, 0.331787109375, 0.418060302734375, 0.50433349609375, 0.590606689453125, 0.6768798828125, 0.763153076171875, 0.84942626953125, 0.935699462890625, 1.02197265625, 1.108245849609375, 1.19451904296875, 1.280792236328125, 1.3670654296875, 1.453338623046875, 1.53961181640625, 1.625885009765625, 1.712158203125, 1.798431396484375, 1.88470458984375, 1.970977783203125, 2.0572509765625, 2.143524169921875, 2.22979736328125, 2.316070556640625, 2.40234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 19.0, 49.0, 83.0, 417.0, 3124.0, 209.0, 58.0, 31.0, 22.0, 15.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.26971435546875, -1.2152099609375, -1.16070556640625, -1.106201171875, -1.05169677734375, -0.9971923828125, -0.94268798828125, -0.88818359375, -0.83367919921875, -0.7791748046875, -0.72467041015625, -0.670166015625, -0.61566162109375, -0.5611572265625, -0.50665283203125, -0.4521484375, -0.39764404296875, -0.3431396484375, -0.28863525390625, -0.234130859375, -0.17962646484375, -0.1251220703125, -0.07061767578125, -0.01611328125, 0.03839111328125, 0.0928955078125, 0.14739990234375, 0.201904296875, 0.25640869140625, 0.3109130859375, 0.36541748046875, 0.419921875, 0.47442626953125, 0.5289306640625, 0.58343505859375, 0.637939453125, 0.69244384765625, 0.7469482421875, 0.80145263671875, 0.85595703125, 0.91046142578125, 0.9649658203125, 1.01947021484375, 1.073974609375, 1.12847900390625, 1.1829833984375, 1.23748779296875, 1.2919921875, 1.34649658203125, 1.4010009765625, 1.45550537109375, 1.510009765625, 1.56451416015625, 1.6190185546875, 1.67352294921875, 1.72802734375, 1.78253173828125, 1.8370361328125, 1.89154052734375, 1.946044921875, 2.00054931640625, 2.0550537109375, 2.10955810546875, 2.1640625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 14.0, 32.0, 64.0, 136.0, 208.0, 234.0, 148.0, 81.0, 39.0, 17.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1591782569885254, -2.898341178894043, -2.6375041007995605, -2.376666784286499, -2.1158297061920166, -1.8549926280975342, -1.5941554307937622, -1.3333182334899902, -1.0724811553955078, -0.8116440176963806, -0.5508068799972534, -0.2899697422981262, -0.029132604598999023, 0.2317044734954834, 0.49254167079925537, 0.7533788681030273, 1.0142159461975098, 1.2750530242919922, 1.5358902215957642, 1.7967274188995361, 2.0575644969940186, 2.318401575088501, 2.5792388916015625, 2.840075969696045, 3.1009130477905273, 3.3617501258850098, 3.622587203979492, 3.8834245204925537, 4.144261360168457, 4.405098915100098, 4.66593599319458, 4.9267730712890625, 5.187610626220703, 5.4484477043151855, 5.709284782409668, 5.97012186050415, 6.230958938598633, 6.491796493530273, 6.752633571624756, 7.013470649719238, 7.274307727813721, 7.535144805908203, 7.7959818840026855, 8.056818962097168, 8.317656517028809, 8.578493118286133, 8.839330673217773, 9.100168228149414, 9.361004829406738, 9.621842384338379, 9.882678985595703, 10.143516540527344, 10.404353141784668, 10.665190696716309, 10.926027297973633, 11.186864852905273, 11.447702407836914, 11.708539962768555, 11.969376564025879, 12.23021411895752, 12.491050720214844, 12.751888275146484, 13.012724876403809, 13.27356243133545, 13.534399032592773]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 14.0, 18.0, 20.0, 35.0, 36.0, 28.0, 41.0, 45.0, 53.0, 64.0, 59.0, 55.0, 67.0, 52.0, 58.0, 57.0, 46.0, 38.0, 35.0, 21.0, 28.0, 21.0, 18.0, 10.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.197094440460205, -4.079265117645264, -3.961435317993164, -3.8436059951782227, -3.725776433944702, -3.6079468727111816, -3.490117311477661, -3.3722877502441406, -3.254458427429199, -3.1366288661956787, -3.018799304962158, -2.900969982147217, -2.7831404209136963, -2.665310859680176, -2.5474812984466553, -2.4296517372131348, -2.3118221759796143, -2.1939926147460938, -2.0761630535125732, -1.9583336114883423, -1.8405041694641113, -1.7226746082305908, -1.6048450469970703, -1.4870154857635498, -1.3691860437393188, -1.2513564825057983, -1.1335270404815674, -1.0156974792480469, -0.8978679776191711, -0.7800384759902954, -0.6622089147567749, -0.5443794131278992, -0.42654991149902344, -0.3087204098701477, -0.19089087843894958, -0.07306134700775146, 0.04476815462112427, 0.16259765625, 0.2804272174835205, 0.39825671911239624, 0.516086220741272, 0.6339157223701477, 0.7517452239990234, 0.869574785232544, 0.9874042868614197, 1.1052337884902954, 1.223063349723816, 1.3408927917480469, 1.4587223529815674, 1.576551914215088, 1.6943813562393188, 1.8122109174728394, 1.9300403594970703, 2.047869920730591, 2.1656994819641113, 2.283529043197632, 2.4013586044311523, 2.519188165664673, 2.6370177268981934, 2.7548470497131348, 2.8726766109466553, 2.990506172180176, 3.1083357334136963, 3.226165294647217, 3.343994617462158]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 18.0, 36.0, 46.0, 62.0, 118.0, 201.0, 419.0, 857.0, 1965.0, 5700.0, 21539.0, 117615.0, 546344.0, 289656.0, 47702.0, 10467.0, 3337.0, 1241.0, 561.0, 265.0, 158.0, 72.0, 45.0, 39.0, 21.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.046875, -2.940887451171875, -2.83489990234375, -2.728912353515625, -2.6229248046875, -2.516937255859375, -2.41094970703125, -2.304962158203125, -2.198974609375, -2.092987060546875, -1.98699951171875, -1.881011962890625, -1.7750244140625, -1.669036865234375, -1.56304931640625, -1.457061767578125, -1.35107421875, -1.245086669921875, -1.13909912109375, -1.033111572265625, -0.9271240234375, -0.821136474609375, -0.71514892578125, -0.609161376953125, -0.503173828125, -0.397186279296875, -0.29119873046875, -0.185211181640625, -0.0792236328125, 0.026763916015625, 0.13275146484375, 0.238739013671875, 0.3447265625, 0.450714111328125, 0.55670166015625, 0.662689208984375, 0.7686767578125, 0.874664306640625, 0.98065185546875, 1.086639404296875, 1.192626953125, 1.298614501953125, 1.40460205078125, 1.510589599609375, 1.6165771484375, 1.722564697265625, 1.82855224609375, 1.934539794921875, 2.04052734375, 2.146514892578125, 2.25250244140625, 2.358489990234375, 2.4644775390625, 2.570465087890625, 2.67645263671875, 2.782440185546875, 2.888427734375, 2.994415283203125, 3.10040283203125, 3.206390380859375, 3.3123779296875, 3.418365478515625, 3.52435302734375, 3.630340576171875, 3.736328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 5.0, 7.0, 3.0, 12.0, 13.0, 24.0, 30.0, 37.0, 28.0, 41.0, 44.0, 42.0, 48.0, 51.0, 51.0, 48.0, 74.0, 54.0, 56.0, 39.0, 33.0, 43.0, 30.0, 35.0, 28.0, 20.0, 9.0, 12.0, 15.0, 10.0, 8.0, 7.0, 11.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8998947143554688, -0.8725433349609375, -0.8451919555664062, -0.817840576171875, -0.7904891967773438, -0.7631378173828125, -0.7357864379882812, -0.70843505859375, -0.6810836791992188, -0.6537322998046875, -0.6263809204101562, -0.599029541015625, -0.5716781616210938, -0.5443267822265625, -0.5169754028320312, -0.4896240234375, -0.46227264404296875, -0.4349212646484375, -0.40756988525390625, -0.380218505859375, -0.35286712646484375, -0.3255157470703125, -0.29816436767578125, -0.27081298828125, -0.24346160888671875, -0.2161102294921875, -0.18875885009765625, -0.161407470703125, -0.13405609130859375, -0.1067047119140625, -0.07935333251953125, -0.052001953125, -0.02465057373046875, 0.0027008056640625, 0.03005218505859375, 0.057403564453125, 0.08475494384765625, 0.1121063232421875, 0.13945770263671875, 0.16680908203125, 0.19416046142578125, 0.2215118408203125, 0.24886322021484375, 0.276214599609375, 0.30356597900390625, 0.3309173583984375, 0.35826873779296875, 0.3856201171875, 0.41297149658203125, 0.4403228759765625, 0.46767425537109375, 0.495025634765625, 0.5223770141601562, 0.5497283935546875, 0.5770797729492188, 0.60443115234375, 0.6317825317382812, 0.6591339111328125, 0.6864852905273438, 0.713836669921875, 0.7411880493164062, 0.7685394287109375, 0.7958908081054688, 0.8232421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 7.0, 10.0, 23.0, 27.0, 30.0, 45.0, 74.0, 91.0, 118.0, 193.0, 305.0, 489.0, 947.0, 2328.0, 8413.0, 90980.0, 856468.0, 75862.0, 7517.0, 2204.0, 987.0, 521.0, 318.0, 167.0, 125.0, 81.0, 52.0, 41.0, 37.0, 23.0, 16.0, 12.0, 7.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.59185791015625, -5.4141845703125, -5.23651123046875, -5.058837890625, -4.88116455078125, -4.7034912109375, -4.52581787109375, -4.34814453125, -4.17047119140625, -3.9927978515625, -3.81512451171875, -3.637451171875, -3.45977783203125, -3.2821044921875, -3.10443115234375, -2.9267578125, -2.74908447265625, -2.5714111328125, -2.39373779296875, -2.216064453125, -2.03839111328125, -1.8607177734375, -1.68304443359375, -1.50537109375, -1.32769775390625, -1.1500244140625, -0.97235107421875, -0.794677734375, -0.61700439453125, -0.4393310546875, -0.26165771484375, -0.083984375, 0.09368896484375, 0.2713623046875, 0.44903564453125, 0.626708984375, 0.80438232421875, 0.9820556640625, 1.15972900390625, 1.33740234375, 1.51507568359375, 1.6927490234375, 1.87042236328125, 2.048095703125, 2.22576904296875, 2.4034423828125, 2.58111572265625, 2.7587890625, 2.93646240234375, 3.1141357421875, 3.29180908203125, 3.469482421875, 3.64715576171875, 3.8248291015625, 4.00250244140625, 4.18017578125, 4.35784912109375, 4.5355224609375, 4.71319580078125, 4.890869140625, 5.06854248046875, 5.2462158203125, 5.42388916015625, 5.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 12.0, 8.0, 17.0, 28.0, 29.0, 41.0, 44.0, 60.0, 59.0, 61.0, 73.0, 84.0, 76.0, 77.0, 74.0, 46.0, 42.0, 31.0, 32.0, 29.0, 16.0, 15.0, 9.0, 9.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.109375, -5.93841552734375, -5.7674560546875, -5.59649658203125, -5.425537109375, -5.25457763671875, -5.0836181640625, -4.91265869140625, -4.74169921875, -4.57073974609375, -4.3997802734375, -4.22882080078125, -4.057861328125, -3.88690185546875, -3.7159423828125, -3.54498291015625, -3.3740234375, -3.20306396484375, -3.0321044921875, -2.86114501953125, -2.690185546875, -2.51922607421875, -2.3482666015625, -2.17730712890625, -2.00634765625, -1.83538818359375, -1.6644287109375, -1.49346923828125, -1.322509765625, -1.15155029296875, -0.9805908203125, -0.80963134765625, -0.638671875, -0.46771240234375, -0.2967529296875, -0.12579345703125, 0.045166015625, 0.21612548828125, 0.3870849609375, 0.55804443359375, 0.72900390625, 0.89996337890625, 1.0709228515625, 1.24188232421875, 1.412841796875, 1.58380126953125, 1.7547607421875, 1.92572021484375, 2.0966796875, 2.26763916015625, 2.4385986328125, 2.60955810546875, 2.780517578125, 2.95147705078125, 3.1224365234375, 3.29339599609375, 3.46435546875, 3.63531494140625, 3.8062744140625, 3.97723388671875, 4.148193359375, 4.31915283203125, 4.4901123046875, 4.66107177734375, 4.83203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 12.0, 8.0, 8.0, 18.0, 36.0, 30.0, 42.0, 71.0, 96.0, 120.0, 197.0, 317.0, 611.0, 1416.0, 4467.0, 21928.0, 183337.0, 717859.0, 98693.0, 13602.0, 3213.0, 1140.0, 522.0, 267.0, 170.0, 119.0, 66.0, 61.0, 47.0, 24.0, 30.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9580078125, -0.9202423095703125, -0.882476806640625, -0.8447113037109375, -0.80694580078125, -0.7691802978515625, -0.731414794921875, -0.6936492919921875, -0.6558837890625, -0.6181182861328125, -0.580352783203125, -0.5425872802734375, -0.50482177734375, -0.4670562744140625, -0.429290771484375, -0.3915252685546875, -0.353759765625, -0.3159942626953125, -0.278228759765625, -0.2404632568359375, -0.20269775390625, -0.1649322509765625, -0.127166748046875, -0.0894012451171875, -0.0516357421875, -0.0138702392578125, 0.023895263671875, 0.0616607666015625, 0.09942626953125, 0.1371917724609375, 0.174957275390625, 0.2127227783203125, 0.25048828125, 0.2882537841796875, 0.326019287109375, 0.3637847900390625, 0.40155029296875, 0.4393157958984375, 0.477081298828125, 0.5148468017578125, 0.5526123046875, 0.5903778076171875, 0.628143310546875, 0.6659088134765625, 0.70367431640625, 0.7414398193359375, 0.779205322265625, 0.8169708251953125, 0.854736328125, 0.8925018310546875, 0.930267333984375, 0.9680328369140625, 1.00579833984375, 1.0435638427734375, 1.081329345703125, 1.1190948486328125, 1.1568603515625, 1.1946258544921875, 1.232391357421875, 1.2701568603515625, 1.30792236328125, 1.3456878662109375, 1.383453369140625, 1.4212188720703125, 1.458984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 12.0, 28.0, 33.0, 37.0, 38.0, 75.0, 115.0, 150.0, 161.0, 104.0, 76.0, 44.0, 34.0, 21.0, 21.0, 13.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003228187561035156, -0.00031472742557525635, -0.00030663609504699707, -0.0002985447645187378, -0.0002904534339904785, -0.00028236210346221924, -0.00027427077293395996, -0.0002661794424057007, -0.0002580881118774414, -0.00024999678134918213, -0.00024190545082092285, -0.00023381412029266357, -0.0002257227897644043, -0.00021763145923614502, -0.00020954012870788574, -0.00020144879817962646, -0.0001933574676513672, -0.0001852661371231079, -0.00017717480659484863, -0.00016908347606658936, -0.00016099214553833008, -0.0001529008150100708, -0.00014480948448181152, -0.00013671815395355225, -0.00012862682342529297, -0.00012053549289703369, -0.00011244416236877441, -0.00010435283184051514, -9.626150131225586e-05, -8.817017078399658e-05, -8.00788402557373e-05, -7.198750972747803e-05, -6.389617919921875e-05, -5.580484867095947e-05, -4.7713518142700195e-05, -3.962218761444092e-05, -3.153085708618164e-05, -2.3439526557922363e-05, -1.5348196029663086e-05, -7.256865501403809e-06, 8.344650268554688e-07, 8.925795555114746e-06, 1.7017126083374023e-05, 2.51084566116333e-05, 3.319978713989258e-05, 4.1291117668151855e-05, 4.938244819641113e-05, 5.747377872467041e-05, 6.556510925292969e-05, 7.365643978118896e-05, 8.174777030944824e-05, 8.983910083770752e-05, 9.79304313659668e-05, 0.00010602176189422607, 0.00011411309242248535, 0.00012220442295074463, 0.0001302957534790039, 0.00013838708400726318, 0.00014647841453552246, 0.00015456974506378174, 0.00016266107559204102, 0.0001707524061203003, 0.00017884373664855957, 0.00018693506717681885, 0.00019502639770507812]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 15.0, 19.0, 22.0, 41.0, 65.0, 75.0, 106.0, 198.0, 324.0, 533.0, 1019.0, 2423.0, 8085.0, 44455.0, 525835.0, 416608.0, 37077.0, 7196.0, 2229.0, 948.0, 495.0, 278.0, 157.0, 111.0, 70.0, 57.0, 23.0, 18.0, 18.0, 13.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0693359375, -1.0296630859375, -0.989990234375, -0.9503173828125, -0.91064453125, -0.8709716796875, -0.831298828125, -0.7916259765625, -0.751953125, -0.7122802734375, -0.672607421875, -0.6329345703125, -0.59326171875, -0.5535888671875, -0.513916015625, -0.4742431640625, -0.4345703125, -0.3948974609375, -0.355224609375, -0.3155517578125, -0.27587890625, -0.2362060546875, -0.196533203125, -0.1568603515625, -0.1171875, -0.0775146484375, -0.037841796875, 0.0018310546875, 0.04150390625, 0.0811767578125, 0.120849609375, 0.1605224609375, 0.2001953125, 0.2398681640625, 0.279541015625, 0.3192138671875, 0.35888671875, 0.3985595703125, 0.438232421875, 0.4779052734375, 0.517578125, 0.5572509765625, 0.596923828125, 0.6365966796875, 0.67626953125, 0.7159423828125, 0.755615234375, 0.7952880859375, 0.8349609375, 0.8746337890625, 0.914306640625, 0.9539794921875, 0.99365234375, 1.0333251953125, 1.072998046875, 1.1126708984375, 1.15234375, 1.1920166015625, 1.231689453125, 1.2713623046875, 1.31103515625, 1.3507080078125, 1.390380859375, 1.4300537109375, 1.4697265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 6.0, 15.0, 15.0, 27.0, 32.0, 46.0, 58.0, 59.0, 89.0, 113.0, 101.0, 106.0, 69.0, 67.0, 56.0, 28.0, 20.0, 17.0, 13.0, 7.0, 7.0, 3.0, 7.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1303253173828125, -1.091705322265625, -1.0530853271484375, -1.01446533203125, -0.9758453369140625, -0.937225341796875, -0.8986053466796875, -0.8599853515625, -0.8213653564453125, -0.782745361328125, -0.7441253662109375, -0.70550537109375, -0.6668853759765625, -0.628265380859375, -0.5896453857421875, -0.551025390625, -0.5124053955078125, -0.473785400390625, -0.4351654052734375, -0.39654541015625, -0.3579254150390625, -0.319305419921875, -0.2806854248046875, -0.2420654296875, -0.2034454345703125, -0.164825439453125, -0.1262054443359375, -0.08758544921875, -0.0489654541015625, -0.010345458984375, 0.0282745361328125, 0.06689453125, 0.1055145263671875, 0.144134521484375, 0.1827545166015625, 0.22137451171875, 0.2599945068359375, 0.298614501953125, 0.3372344970703125, 0.3758544921875, 0.4144744873046875, 0.453094482421875, 0.4917144775390625, 0.53033447265625, 0.5689544677734375, 0.607574462890625, 0.6461944580078125, 0.684814453125, 0.7234344482421875, 0.762054443359375, 0.8006744384765625, 0.83929443359375, 0.8779144287109375, 0.916534423828125, 0.9551544189453125, 0.9937744140625, 1.0323944091796875, 1.071014404296875, 1.1096343994140625, 1.14825439453125, 1.1868743896484375, 1.225494384765625, 1.2641143798828125, 1.302734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 16.0, 24.0, 47.0, 86.0, 136.0, 174.0, 176.0, 154.0, 84.0, 46.0, 17.0, 13.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.5147705078125, -33.63487243652344, -32.754974365234375, -31.875076293945312, -30.99517822265625, -30.115280151367188, -29.235383987426758, -28.355485916137695, -27.475587844848633, -26.59568977355957, -25.715791702270508, -24.835893630981445, -23.955997467041016, -23.076099395751953, -22.19620132446289, -21.316303253173828, -20.436405181884766, -19.556507110595703, -18.67660903930664, -17.796710968017578, -16.916812896728516, -16.036914825439453, -15.157018661499023, -14.277120590209961, -13.397222518920898, -12.517324447631836, -11.637426376342773, -10.757529258728027, -9.877631187438965, -8.997733116149902, -8.117835998535156, -7.237937927246094, -6.358037948608398, -5.478139877319336, -4.598242282867432, -3.7183444499969482, -2.838446617126465, -1.9585485458374023, -1.078650951385498, -0.19875335693359375, 0.6811447143554688, 1.5610425472259521, 2.4409403800964355, 3.320838212966919, 4.200736045837402, 5.080634117126465, 5.960531711578369, 6.840429306030273, 7.720327377319336, 8.600225448608398, 9.480123519897461, 10.360020637512207, 11.23991870880127, 12.119816780090332, 12.999713897705078, 13.87961196899414, 14.759510040283203, 15.639408111572266, 16.519306182861328, 17.39920425415039, 18.279102325439453, 19.159000396728516, 20.038896560668945, 20.918794631958008, 21.79869270324707]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 16.0, 11.0, 19.0, 9.0, 32.0, 28.0, 32.0, 44.0, 25.0, 54.0, 37.0, 51.0, 46.0, 43.0, 57.0, 56.0, 39.0, 43.0, 34.0, 42.0, 25.0, 38.0, 28.0, 30.0, 22.0, 16.0, 19.0, 15.0, 10.0, 8.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-17.00653839111328, -16.527070999145508, -16.047605514526367, -15.568138122558594, -15.088671684265137, -14.60920524597168, -14.129738807678223, -13.650272369384766, -13.170804977416992, -12.691338539123535, -12.211872100830078, -11.732404708862305, -11.252938270568848, -10.77347183227539, -10.294005393981934, -9.814538955688477, -9.33507251739502, -8.855606079101562, -8.376139640808105, -7.89667272567749, -7.417205810546875, -6.937739372253418, -6.458272933959961, -5.978806495666504, -5.499339580535889, -5.019873142242432, -4.540406227111816, -4.060939788818359, -3.5814731121063232, -3.102006435394287, -2.62253999710083, -2.143073320388794, -1.6636066436767578, -1.1841399669647217, -0.7046734094619751, -0.22520685195922852, 0.2542598247528076, 0.7337265014648438, 1.2131929397583008, 1.692659616470337, 2.172126293182373, 2.651592969894409, 3.1310596466064453, 3.6105260848999023, 4.089992523193359, 4.569459438323975, 5.048925876617432, 5.528392791748047, 6.007859230041504, 6.487325668334961, 6.966792583465576, 7.446259021759033, 7.925725936889648, 8.405192375183105, 8.884658813476562, 9.36412525177002, 9.843591690063477, 10.323058128356934, 10.80252456665039, 11.281991958618164, 11.761458396911621, 12.240924835205078, 12.720391273498535, 13.199857711791992, 13.679325103759766]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 3.0, 6.0, 9.0, 11.0, 16.0, 16.0, 30.0, 32.0, 54.0, 86.0, 104.0, 153.0, 244.0, 331.0, 596.0, 1001.0, 1813.0, 3490.0, 7249.0, 16282.0, 45543.0, 235943.0, 3310723.0, 468714.0, 62339.0, 20470.0, 8891.0, 4293.0, 2345.0, 1376.0, 784.0, 456.0, 291.0, 199.0, 124.0, 75.0, 55.0, 43.0, 45.0, 17.0, 5.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.415130615234375, -1.36737060546875, -1.319610595703125, -1.2718505859375, -1.224090576171875, -1.17633056640625, -1.128570556640625, -1.080810546875, -1.033050537109375, -0.98529052734375, -0.937530517578125, -0.8897705078125, -0.842010498046875, -0.79425048828125, -0.746490478515625, -0.69873046875, -0.650970458984375, -0.60321044921875, -0.555450439453125, -0.5076904296875, -0.459930419921875, -0.41217041015625, -0.364410400390625, -0.316650390625, -0.268890380859375, -0.22113037109375, -0.173370361328125, -0.1256103515625, -0.077850341796875, -0.03009033203125, 0.017669677734375, 0.0654296875, 0.113189697265625, 0.16094970703125, 0.208709716796875, 0.2564697265625, 0.304229736328125, 0.35198974609375, 0.399749755859375, 0.447509765625, 0.495269775390625, 0.54302978515625, 0.590789794921875, 0.6385498046875, 0.686309814453125, 0.73406982421875, 0.781829833984375, 0.82958984375, 0.877349853515625, 0.92510986328125, 0.972869873046875, 1.0206298828125, 1.068389892578125, 1.11614990234375, 1.163909912109375, 1.211669921875, 1.259429931640625, 1.30718994140625, 1.354949951171875, 1.4027099609375, 1.450469970703125, 1.49822998046875, 1.545989990234375, 1.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 3.0, 10.0, 12.0, 18.0, 25.0, 22.0, 33.0, 42.0, 53.0, 52.0, 72.0, 83.0, 76.0, 81.0, 76.0, 59.0, 38.0, 44.0, 31.0, 36.0, 33.0, 18.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1289825439453125, -1.094879150390625, -1.0607757568359375, -1.02667236328125, -0.9925689697265625, -0.958465576171875, -0.9243621826171875, -0.8902587890625, -0.8561553955078125, -0.822052001953125, -0.7879486083984375, -0.75384521484375, -0.7197418212890625, -0.685638427734375, -0.6515350341796875, -0.617431640625, -0.5833282470703125, -0.549224853515625, -0.5151214599609375, -0.48101806640625, -0.4469146728515625, -0.412811279296875, -0.3787078857421875, -0.3446044921875, -0.3105010986328125, -0.276397705078125, -0.2422943115234375, -0.20819091796875, -0.1740875244140625, -0.139984130859375, -0.1058807373046875, -0.07177734375, -0.0376739501953125, -0.003570556640625, 0.0305328369140625, 0.06463623046875, 0.0987396240234375, 0.132843017578125, 0.1669464111328125, 0.2010498046875, 0.2351531982421875, 0.269256591796875, 0.3033599853515625, 0.33746337890625, 0.3715667724609375, 0.405670166015625, 0.4397735595703125, 0.473876953125, 0.5079803466796875, 0.542083740234375, 0.5761871337890625, 0.61029052734375, 0.6443939208984375, 0.678497314453125, 0.7126007080078125, 0.7467041015625, 0.7808074951171875, 0.814910888671875, 0.8490142822265625, 0.88311767578125, 0.9172210693359375, 0.951324462890625, 0.9854278564453125, 1.01953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 12.0, 16.0, 31.0, 30.0, 63.0, 88.0, 165.0, 444.0, 1306.0, 5923.0, 43659.0, 3505316.0, 606915.0, 24805.0, 3875.0, 911.0, 350.0, 157.0, 75.0, 43.0, 25.0, 18.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.03326416015625, -3.9141845703125, -3.79510498046875, -3.676025390625, -3.55694580078125, -3.4378662109375, -3.31878662109375, -3.19970703125, -3.08062744140625, -2.9615478515625, -2.84246826171875, -2.723388671875, -2.60430908203125, -2.4852294921875, -2.36614990234375, -2.2470703125, -2.12799072265625, -2.0089111328125, -1.88983154296875, -1.770751953125, -1.65167236328125, -1.5325927734375, -1.41351318359375, -1.29443359375, -1.17535400390625, -1.0562744140625, -0.93719482421875, -0.818115234375, -0.69903564453125, -0.5799560546875, -0.46087646484375, -0.341796875, -0.22271728515625, -0.1036376953125, 0.01544189453125, 0.134521484375, 0.25360107421875, 0.3726806640625, 0.49176025390625, 0.61083984375, 0.72991943359375, 0.8489990234375, 0.96807861328125, 1.087158203125, 1.20623779296875, 1.3253173828125, 1.44439697265625, 1.5634765625, 1.68255615234375, 1.8016357421875, 1.92071533203125, 2.039794921875, 2.15887451171875, 2.2779541015625, 2.39703369140625, 2.51611328125, 2.63519287109375, 2.7542724609375, 2.87335205078125, 2.992431640625, 3.11151123046875, 3.2305908203125, 3.34967041015625, 3.46875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 15.0, 16.0, 21.0, 30.0, 58.0, 112.0, 299.0, 1048.0, 1620.0, 470.0, 145.0, 86.0, 42.0, 31.0, 18.0, 11.0, 11.0, 15.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.2018585205078125, -4.106842041015625, -4.0118255615234375, -3.91680908203125, -3.8217926025390625, -3.726776123046875, -3.6317596435546875, -3.5367431640625, -3.4417266845703125, -3.346710205078125, -3.2516937255859375, -3.15667724609375, -3.0616607666015625, -2.966644287109375, -2.8716278076171875, -2.776611328125, -2.6815948486328125, -2.586578369140625, -2.4915618896484375, -2.39654541015625, -2.3015289306640625, -2.206512451171875, -2.1114959716796875, -2.0164794921875, -1.9214630126953125, -1.826446533203125, -1.7314300537109375, -1.63641357421875, -1.5413970947265625, -1.446380615234375, -1.3513641357421875, -1.25634765625, -1.1613311767578125, -1.066314697265625, -0.9712982177734375, -0.87628173828125, -0.7812652587890625, -0.686248779296875, -0.5912322998046875, -0.4962158203125, -0.4011993408203125, -0.306182861328125, -0.2111663818359375, -0.11614990234375, -0.0211334228515625, 0.073883056640625, 0.1688995361328125, 0.263916015625, 0.3589324951171875, 0.453948974609375, 0.5489654541015625, 0.64398193359375, 0.7389984130859375, 0.834014892578125, 0.9290313720703125, 1.0240478515625, 1.1190643310546875, 1.214080810546875, 1.3090972900390625, 1.40411376953125, 1.4991302490234375, 1.594146728515625, 1.6891632080078125, 1.7841796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 20.0, 22.0, 86.0, 161.0, 165.0, 178.0, 142.0, 86.0, 52.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77971076965332, -13.158794403076172, -12.537877082824707, -11.916959762573242, -11.296043395996094, -10.675127029418945, -10.05420970916748, -9.433292388916016, -8.812376022338867, -8.191459655761719, -7.570542335510254, -6.949625492095947, -6.328708648681641, -5.707791805267334, -5.086874961853027, -4.465958118438721, -3.845041275024414, -3.2241244316101074, -2.603207588195801, -1.9822907447814941, -1.3613739013671875, -0.7404570579528809, -0.11954021453857422, 0.5013766288757324, 1.122293472290039, 1.7432103157043457, 2.3641271591186523, 2.985044002532959, 3.6059608459472656, 4.226877689361572, 4.847794532775879, 5.4687113761901855, 6.089630126953125, 6.710546970367432, 7.331463813781738, 7.952380657196045, 8.573297500610352, 9.1942138671875, 9.815131187438965, 10.43604850769043, 11.056964874267578, 11.677881240844727, 12.298798561096191, 12.919715881347656, 13.540632247924805, 14.161548614501953, 14.782465934753418, 15.403383255004883, 16.02429962158203, 16.64521598815918, 17.266132354736328, 17.88705062866211, 18.507966995239258, 19.128883361816406, 19.749801635742188, 20.370718002319336, 20.991634368896484, 21.612550735473633, 22.23346710205078, 22.854385375976562, 23.47530174255371, 24.09621810913086, 24.71713638305664, 25.33805274963379, 25.958969116210938]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 14.0, 6.0, 8.0, 16.0, 15.0, 23.0, 23.0, 26.0, 32.0, 36.0, 34.0, 32.0, 34.0, 47.0, 43.0, 38.0, 38.0, 41.0, 44.0, 55.0, 48.0, 34.0, 39.0, 29.0, 30.0, 35.0, 37.0, 24.0, 23.0, 21.0, 18.0, 11.0, 6.0, 11.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.446706295013428, -7.216037750244141, -6.985368728637695, -6.754700183868408, -6.524031639099121, -6.293362617492676, -6.062694072723389, -5.832025527954102, -5.601356506347656, -5.370687961578369, -5.140018939971924, -4.909350395202637, -4.678681373596191, -4.448012828826904, -4.217344284057617, -3.986675500869751, -3.7560067176818848, -3.5253379344940186, -3.2946691513061523, -3.0640006065368652, -2.833331823348999, -2.602663040161133, -2.3719944953918457, -2.1413257122039795, -1.9106569290161133, -1.679988145828247, -1.4493194818496704, -1.2186508178710938, -0.9879820346832275, -0.7573132514953613, -0.5266445875167847, -0.295975923538208, -0.0653076171875, 0.16536110639572144, 0.39602982997894287, 0.6266985535621643, 0.8573672771453857, 1.088036060333252, 1.3187047243118286, 1.5493733882904053, 1.7800421714782715, 2.0107109546661377, 2.241379737854004, 2.472048282623291, 2.7027170658111572, 2.9333858489990234, 3.1640543937683105, 3.3947231769561768, 3.625391960144043, 3.856060743331909, 4.086729526519775, 4.3173980712890625, 4.548067092895508, 4.778735637664795, 5.009404182434082, 5.240073204040527, 5.4707417488098145, 5.701410293579102, 5.932079315185547, 6.162747859954834, 6.393416404724121, 6.624085426330566, 6.8547539710998535, 7.085422515869141, 7.316091537475586]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 20.0, 33.0, 25.0, 38.0, 73.0, 129.0, 206.0, 397.0, 738.0, 1296.0, 2970.0, 7433.0, 20242.0, 61442.0, 215915.0, 482460.0, 175197.0, 51256.0, 17022.0, 6286.0, 2611.0, 1301.0, 620.0, 317.0, 190.0, 94.0, 74.0, 46.0, 33.0, 23.0, 11.0, 9.0, 6.0, 4.0, 6.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.2578125, -2.18817138671875, -2.1185302734375, -2.04888916015625, -1.979248046875, -1.90960693359375, -1.8399658203125, -1.77032470703125, -1.70068359375, -1.63104248046875, -1.5614013671875, -1.49176025390625, -1.422119140625, -1.35247802734375, -1.2828369140625, -1.21319580078125, -1.1435546875, -1.07391357421875, -1.0042724609375, -0.93463134765625, -0.864990234375, -0.79534912109375, -0.7257080078125, -0.65606689453125, -0.58642578125, -0.51678466796875, -0.4471435546875, -0.37750244140625, -0.307861328125, -0.23822021484375, -0.1685791015625, -0.09893798828125, -0.029296875, 0.04034423828125, 0.1099853515625, 0.17962646484375, 0.249267578125, 0.31890869140625, 0.3885498046875, 0.45819091796875, 0.52783203125, 0.59747314453125, 0.6671142578125, 0.73675537109375, 0.806396484375, 0.87603759765625, 0.9456787109375, 1.01531982421875, 1.0849609375, 1.15460205078125, 1.2242431640625, 1.29388427734375, 1.363525390625, 1.43316650390625, 1.5028076171875, 1.57244873046875, 1.64208984375, 1.71173095703125, 1.7813720703125, 1.85101318359375, 1.920654296875, 1.99029541015625, 2.0599365234375, 2.12957763671875, 2.19921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 5.0, 5.0, 21.0, 15.0, 20.0, 36.0, 56.0, 46.0, 61.0, 66.0, 75.0, 69.0, 78.0, 69.0, 63.0, 44.0, 58.0, 27.0, 34.0, 21.0, 28.0, 19.0, 14.0, 13.0, 3.0, 13.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1727523803710938, -1.1404266357421875, -1.1081008911132812, -1.075775146484375, -1.0434494018554688, -1.0111236572265625, -0.9787979125976562, -0.94647216796875, -0.9141464233398438, -0.8818206787109375, -0.8494949340820312, -0.817169189453125, -0.7848434448242188, -0.7525177001953125, -0.7201919555664062, -0.6878662109375, -0.6555404663085938, -0.6232147216796875, -0.5908889770507812, -0.558563232421875, -0.5262374877929688, -0.4939117431640625, -0.46158599853515625, -0.42926025390625, -0.39693450927734375, -0.3646087646484375, -0.33228302001953125, -0.299957275390625, -0.26763153076171875, -0.2353057861328125, -0.20298004150390625, -0.170654296875, -0.13832855224609375, -0.1060028076171875, -0.07367706298828125, -0.041351318359375, -0.00902557373046875, 0.0233001708984375, 0.05562591552734375, 0.08795166015625, 0.12027740478515625, 0.1526031494140625, 0.18492889404296875, 0.217254638671875, 0.24958038330078125, 0.2819061279296875, 0.31423187255859375, 0.3465576171875, 0.37888336181640625, 0.4112091064453125, 0.44353485107421875, 0.475860595703125, 0.5081863403320312, 0.5405120849609375, 0.5728378295898438, 0.60516357421875, 0.6374893188476562, 0.6698150634765625, 0.7021408081054688, 0.734466552734375, 0.7667922973632812, 0.7991180419921875, 0.8314437866210938, 0.86376953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 20.0, 26.0, 30.0, 38.0, 56.0, 76.0, 90.0, 124.0, 192.0, 350.0, 566.0, 1187.0, 3115.0, 11280.0, 116772.0, 845896.0, 56048.0, 7760.0, 2451.0, 1008.0, 528.0, 295.0, 169.0, 146.0, 71.0, 54.0, 44.0, 35.0, 15.0, 20.0, 15.0, 6.0, 10.0, 4.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.876953125, -4.7109375, -4.544921875, -4.37890625, -4.212890625, -4.046875, -3.880859375, -3.71484375, -3.548828125, -3.3828125, -3.216796875, -3.05078125, -2.884765625, -2.71875, -2.552734375, -2.38671875, -2.220703125, -2.0546875, -1.888671875, -1.72265625, -1.556640625, -1.390625, -1.224609375, -1.05859375, -0.892578125, -0.7265625, -0.560546875, -0.39453125, -0.228515625, -0.0625, 0.103515625, 0.26953125, 0.435546875, 0.6015625, 0.767578125, 0.93359375, 1.099609375, 1.265625, 1.431640625, 1.59765625, 1.763671875, 1.9296875, 2.095703125, 2.26171875, 2.427734375, 2.59375, 2.759765625, 2.92578125, 3.091796875, 3.2578125, 3.423828125, 3.58984375, 3.755859375, 3.921875, 4.087890625, 4.25390625, 4.419921875, 4.5859375, 4.751953125, 4.91796875, 5.083984375, 5.25, 5.416015625, 5.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 11.0, 15.0, 17.0, 22.0, 33.0, 43.0, 40.0, 52.0, 55.0, 72.0, 72.0, 75.0, 80.0, 79.0, 50.0, 60.0, 48.0, 29.0, 31.0, 18.0, 17.0, 13.0, 9.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.78717041015625, -4.6251220703125, -4.46307373046875, -4.301025390625, -4.13897705078125, -3.9769287109375, -3.81488037109375, -3.65283203125, -3.49078369140625, -3.3287353515625, -3.16668701171875, -3.004638671875, -2.84259033203125, -2.6805419921875, -2.51849365234375, -2.3564453125, -2.19439697265625, -2.0323486328125, -1.87030029296875, -1.708251953125, -1.54620361328125, -1.3841552734375, -1.22210693359375, -1.06005859375, -0.89801025390625, -0.7359619140625, -0.57391357421875, -0.411865234375, -0.24981689453125, -0.0877685546875, 0.07427978515625, 0.236328125, 0.39837646484375, 0.5604248046875, 0.72247314453125, 0.884521484375, 1.04656982421875, 1.2086181640625, 1.37066650390625, 1.53271484375, 1.69476318359375, 1.8568115234375, 2.01885986328125, 2.180908203125, 2.34295654296875, 2.5050048828125, 2.66705322265625, 2.8291015625, 2.99114990234375, 3.1531982421875, 3.31524658203125, 3.477294921875, 3.63934326171875, 3.8013916015625, 3.96343994140625, 4.12548828125, 4.28753662109375, 4.4495849609375, 4.61163330078125, 4.773681640625, 4.93572998046875, 5.0977783203125, 5.25982666015625, 5.421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 12.0, 26.0, 20.0, 28.0, 35.0, 61.0, 84.0, 159.0, 290.0, 749.0, 2303.0, 12662.0, 347521.0, 663224.0, 16948.0, 2700.0, 848.0, 350.0, 171.0, 92.0, 76.0, 48.0, 29.0, 27.0, 21.0, 9.0, 8.0, 10.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.64453125, -2.571197509765625, -2.49786376953125, -2.424530029296875, -2.3511962890625, -2.277862548828125, -2.20452880859375, -2.131195068359375, -2.057861328125, -1.984527587890625, -1.91119384765625, -1.837860107421875, -1.7645263671875, -1.691192626953125, -1.61785888671875, -1.544525146484375, -1.47119140625, -1.397857666015625, -1.32452392578125, -1.251190185546875, -1.1778564453125, -1.104522705078125, -1.03118896484375, -0.957855224609375, -0.884521484375, -0.811187744140625, -0.73785400390625, -0.664520263671875, -0.5911865234375, -0.517852783203125, -0.44451904296875, -0.371185302734375, -0.2978515625, -0.224517822265625, -0.15118408203125, -0.077850341796875, -0.0045166015625, 0.068817138671875, 0.14215087890625, 0.215484619140625, 0.288818359375, 0.362152099609375, 0.43548583984375, 0.508819580078125, 0.5821533203125, 0.655487060546875, 0.72882080078125, 0.802154541015625, 0.87548828125, 0.948822021484375, 1.02215576171875, 1.095489501953125, 1.1688232421875, 1.242156982421875, 1.31549072265625, 1.388824462890625, 1.462158203125, 1.535491943359375, 1.60882568359375, 1.682159423828125, 1.7554931640625, 1.828826904296875, 1.90216064453125, 1.975494384765625, 2.048828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 11.0, 17.0, 27.0, 32.0, 51.0, 75.0, 114.0, 170.0, 180.0, 95.0, 62.0, 36.0, 35.0, 22.0, 15.0, 18.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003750324249267578, -0.0003658607602119446, -0.00035668909549713135, -0.0003475174307823181, -0.0003383457660675049, -0.00032917410135269165, -0.0003200024366378784, -0.0003108307719230652, -0.00030165910720825195, -0.0002924874424934387, -0.0002833157777786255, -0.00027414411306381226, -0.000264972448348999, -0.0002558007836341858, -0.00024662911891937256, -0.00023745745420455933, -0.0002282857894897461, -0.00021911412477493286, -0.00020994246006011963, -0.0002007707953453064, -0.00019159913063049316, -0.00018242746591567993, -0.0001732558012008667, -0.00016408413648605347, -0.00015491247177124023, -0.000145740807056427, -0.00013656914234161377, -0.00012739747762680054, -0.0001182258129119873, -0.00010905414819717407, -9.988248348236084e-05, -9.071081876754761e-05, -8.153915405273438e-05, -7.236748933792114e-05, -6.319582462310791e-05, -5.402415990829468e-05, -4.4852495193481445e-05, -3.568083047866821e-05, -2.650916576385498e-05, -1.7337501049041748e-05, -8.165836334228516e-06, 1.0058283805847168e-06, 1.017749309539795e-05, 1.934915781021118e-05, 2.8520822525024414e-05, 3.7692487239837646e-05, 4.686415195465088e-05, 5.603581666946411e-05, 6.520748138427734e-05, 7.437914609909058e-05, 8.355081081390381e-05, 9.272247552871704e-05, 0.00010189414024353027, 0.0001110658049583435, 0.00012023746967315674, 0.00012940913438796997, 0.0001385807991027832, 0.00014775246381759644, 0.00015692412853240967, 0.0001660957932472229, 0.00017526745796203613, 0.00018443912267684937, 0.0001936107873916626, 0.00020278245210647583, 0.00021195411682128906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 10.0, 21.0, 26.0, 33.0, 29.0, 42.0, 91.0, 138.0, 196.0, 347.0, 679.0, 1461.0, 4322.0, 20215.0, 296792.0, 679992.0, 34251.0, 6027.0, 1996.0, 849.0, 385.0, 239.0, 127.0, 76.0, 69.0, 34.0, 22.0, 21.0, 14.0, 9.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.7691497802734375, -1.714080810546875, -1.6590118408203125, -1.60394287109375, -1.5488739013671875, -1.493804931640625, -1.4387359619140625, -1.3836669921875, -1.3285980224609375, -1.273529052734375, -1.2184600830078125, -1.16339111328125, -1.1083221435546875, -1.053253173828125, -0.9981842041015625, -0.943115234375, -0.8880462646484375, -0.832977294921875, -0.7779083251953125, -0.72283935546875, -0.6677703857421875, -0.612701416015625, -0.5576324462890625, -0.5025634765625, -0.4474945068359375, -0.392425537109375, -0.3373565673828125, -0.28228759765625, -0.2272186279296875, -0.172149658203125, -0.1170806884765625, -0.06201171875, -0.0069427490234375, 0.048126220703125, 0.1031951904296875, 0.15826416015625, 0.2133331298828125, 0.268402099609375, 0.3234710693359375, 0.3785400390625, 0.4336090087890625, 0.488677978515625, 0.5437469482421875, 0.59881591796875, 0.6538848876953125, 0.708953857421875, 0.7640228271484375, 0.819091796875, 0.8741607666015625, 0.929229736328125, 0.9842987060546875, 1.03936767578125, 1.0944366455078125, 1.149505615234375, 1.2045745849609375, 1.2596435546875, 1.3147125244140625, 1.369781494140625, 1.4248504638671875, 1.47991943359375, 1.5349884033203125, 1.590057373046875, 1.6451263427734375, 1.7001953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 26.0, 16.0, 28.0, 28.0, 33.0, 55.0, 74.0, 82.0, 80.0, 101.0, 108.0, 74.0, 52.0, 41.0, 44.0, 27.0, 16.0, 25.0, 13.0, 7.0, 8.0, 8.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.2902984619140625, -1.252471923828125, -1.2146453857421875, -1.17681884765625, -1.1389923095703125, -1.101165771484375, -1.0633392333984375, -1.0255126953125, -0.9876861572265625, -0.949859619140625, -0.9120330810546875, -0.87420654296875, -0.8363800048828125, -0.798553466796875, -0.7607269287109375, -0.722900390625, -0.6850738525390625, -0.647247314453125, -0.6094207763671875, -0.57159423828125, -0.5337677001953125, -0.495941162109375, -0.4581146240234375, -0.4202880859375, -0.3824615478515625, -0.344635009765625, -0.3068084716796875, -0.26898193359375, -0.2311553955078125, -0.193328857421875, -0.1555023193359375, -0.11767578125, -0.0798492431640625, -0.042022705078125, -0.0041961669921875, 0.03363037109375, 0.0714569091796875, 0.109283447265625, 0.1471099853515625, 0.1849365234375, 0.2227630615234375, 0.260589599609375, 0.2984161376953125, 0.33624267578125, 0.3740692138671875, 0.411895751953125, 0.4497222900390625, 0.487548828125, 0.5253753662109375, 0.563201904296875, 0.6010284423828125, 0.63885498046875, 0.6766815185546875, 0.714508056640625, 0.7523345947265625, 0.7901611328125, 0.8279876708984375, 0.865814208984375, 0.9036407470703125, 0.94146728515625, 0.9792938232421875, 1.017120361328125, 1.0549468994140625, 1.0927734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 23.0, 41.0, 118.0, 207.0, 258.0, 213.0, 65.0, 28.0, 16.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.58578872680664, -46.51209259033203, -45.43840026855469, -44.36470413208008, -43.29100799560547, -42.217315673828125, -41.143619537353516, -40.069923400878906, -38.99623107910156, -37.92253494262695, -36.84884262084961, -35.775146484375, -34.70145034790039, -33.62775421142578, -32.55406188964844, -31.480365753173828, -30.40666961669922, -29.332975387573242, -28.259279251098633, -27.185585021972656, -26.111888885498047, -25.03819465637207, -23.964500427246094, -22.890804290771484, -21.817110061645508, -20.74341583251953, -19.669719696044922, -18.596025466918945, -17.52233123779297, -16.44863510131836, -15.374940872192383, -14.30124568939209, -13.227546691894531, -12.153851509094238, -11.080156326293945, -10.006462097167969, -8.932766914367676, -7.859071731567383, -6.785377025604248, -5.711682319641113, -4.63798713684082, -3.5642921924591064, -2.4905972480773926, -1.4169023036956787, -0.34320735931396484, 0.7304878234863281, 1.804182529449463, 2.8778772354125977, 3.9515724182128906, 5.025267601013184, 6.098962306976318, 7.172657012939453, 8.246352195739746, 9.320047378540039, 10.393741607666016, 11.467436790466309, 12.541131973266602, 13.614827156066895, 14.688522338867188, 15.762216567993164, 16.83591079711914, 17.90960693359375, 18.983301162719727, 20.056995391845703, 21.130691528320312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 8.0, 9.0, 13.0, 12.0, 21.0, 19.0, 19.0, 19.0, 24.0, 36.0, 43.0, 41.0, 46.0, 56.0, 55.0, 58.0, 55.0, 44.0, 53.0, 43.0, 43.0, 26.0, 26.0, 25.0, 34.0, 26.0, 26.0, 23.0, 6.0, 9.0, 4.0, 6.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-12.86214828491211, -12.477662086486816, -12.093174934387207, -11.708688735961914, -11.324201583862305, -10.939715385437012, -10.555229187011719, -10.17074203491211, -9.7862548828125, -9.401768684387207, -9.017281532287598, -8.632795333862305, -8.248308181762695, -7.863821983337402, -7.479335308074951, -7.0948486328125, -6.710362434387207, -6.325875759124756, -5.941389083862305, -5.556902885437012, -5.172415733337402, -4.787929534912109, -4.403442859649658, -4.018956184387207, -3.634469509124756, -3.2499828338623047, -2.8654961585998535, -2.4810097217559814, -2.0965230464935303, -1.712036371231079, -1.327549934387207, -0.9430632591247559, -0.5585775375366211, -0.1740909218788147, 0.2103956937789917, 0.5948822498321533, 0.9793689250946045, 1.3638556003570557, 1.7483420372009277, 2.132828712463379, 2.51731538772583, 2.9018020629882812, 3.2862887382507324, 3.6707751750946045, 4.055261611938477, 4.439748764038086, 4.824234962463379, 5.20872163772583, 5.593208312988281, 5.977694988250732, 6.362181663513184, 6.746667861938477, 7.131155014038086, 7.515641212463379, 7.90012788772583, 8.284614562988281, 8.66910171508789, 9.053587913513184, 9.438075065612793, 9.822561264038086, 10.207048416137695, 10.591534614562988, 10.976020812988281, 11.36050796508789, 11.744994163513184]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 7.0, 14.0, 16.0, 28.0, 36.0, 46.0, 55.0, 87.0, 163.0, 220.0, 381.0, 782.0, 1599.0, 3453.0, 8557.0, 27591.0, 179509.0, 3462499.0, 445291.0, 42894.0, 11866.0, 4681.0, 2134.0, 1068.0, 550.0, 289.0, 177.0, 101.0, 62.0, 35.0, 21.0, 18.0, 12.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.076171875, -2.0162506103515625, -1.956329345703125, -1.8964080810546875, -1.83648681640625, -1.7765655517578125, -1.716644287109375, -1.6567230224609375, -1.5968017578125, -1.5368804931640625, -1.476959228515625, -1.4170379638671875, -1.35711669921875, -1.2971954345703125, -1.237274169921875, -1.1773529052734375, -1.117431640625, -1.0575103759765625, -0.997589111328125, -0.9376678466796875, -0.87774658203125, -0.8178253173828125, -0.757904052734375, -0.6979827880859375, -0.6380615234375, -0.5781402587890625, -0.518218994140625, -0.4582977294921875, -0.39837646484375, -0.3384552001953125, -0.278533935546875, -0.2186126708984375, -0.15869140625, -0.0987701416015625, -0.038848876953125, 0.0210723876953125, 0.08099365234375, 0.1409149169921875, 0.200836181640625, 0.2607574462890625, 0.3206787109375, 0.3805999755859375, 0.440521240234375, 0.5004425048828125, 0.56036376953125, 0.6202850341796875, 0.680206298828125, 0.7401275634765625, 0.800048828125, 0.8599700927734375, 0.919891357421875, 0.9798126220703125, 1.03973388671875, 1.0996551513671875, 1.159576416015625, 1.2194976806640625, 1.2794189453125, 1.3393402099609375, 1.399261474609375, 1.4591827392578125, 1.51910400390625, 1.5790252685546875, 1.638946533203125, 1.6988677978515625, 1.7587890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 15.0, 15.0, 25.0, 21.0, 35.0, 33.0, 50.0, 58.0, 62.0, 52.0, 49.0, 65.0, 62.0, 45.0, 61.0, 51.0, 41.0, 51.0, 32.0, 28.0, 18.0, 21.0, 16.0, 18.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.107421875, -1.0788955688476562, -1.0503692626953125, -1.0218429565429688, -0.993316650390625, -0.9647903442382812, -0.9362640380859375, -0.9077377319335938, -0.87921142578125, -0.8506851196289062, -0.8221588134765625, -0.7936325073242188, -0.765106201171875, -0.7365798950195312, -0.7080535888671875, -0.6795272827148438, -0.6510009765625, -0.6224746704101562, -0.5939483642578125, -0.5654220581054688, -0.536895751953125, -0.5083694458007812, -0.4798431396484375, -0.45131683349609375, -0.42279052734375, -0.39426422119140625, -0.3657379150390625, -0.33721160888671875, -0.308685302734375, -0.28015899658203125, -0.2516326904296875, -0.22310638427734375, -0.194580078125, -0.16605377197265625, -0.1375274658203125, -0.10900115966796875, -0.080474853515625, -0.05194854736328125, -0.0234222412109375, 0.00510406494140625, 0.03363037109375, 0.06215667724609375, 0.0906829833984375, 0.11920928955078125, 0.147735595703125, 0.17626190185546875, 0.2047882080078125, 0.23331451416015625, 0.2618408203125, 0.29036712646484375, 0.3188934326171875, 0.34741973876953125, 0.375946044921875, 0.40447235107421875, 0.4329986572265625, 0.46152496337890625, 0.49005126953125, 0.5185775756835938, 0.5471038818359375, 0.5756301879882812, 0.604156494140625, 0.6326828002929688, 0.6612091064453125, 0.6897354125976562, 0.71826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 22.0, 50.0, 69.0, 172.0, 254.0, 489.0, 1170.0, 3757.0, 16002.0, 142813.0, 3830704.0, 176338.0, 16954.0, 3523.0, 1105.0, 451.0, 204.0, 100.0, 40.0, 25.0, 12.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.132232666015625, -3.03594970703125, -2.939666748046875, -2.8433837890625, -2.747100830078125, -2.65081787109375, -2.554534912109375, -2.458251953125, -2.361968994140625, -2.26568603515625, -2.169403076171875, -2.0731201171875, -1.976837158203125, -1.88055419921875, -1.784271240234375, -1.68798828125, -1.591705322265625, -1.49542236328125, -1.399139404296875, -1.3028564453125, -1.206573486328125, -1.11029052734375, -1.014007568359375, -0.917724609375, -0.821441650390625, -0.72515869140625, -0.628875732421875, -0.5325927734375, -0.436309814453125, -0.34002685546875, -0.243743896484375, -0.1474609375, -0.051177978515625, 0.04510498046875, 0.141387939453125, 0.2376708984375, 0.333953857421875, 0.43023681640625, 0.526519775390625, 0.622802734375, 0.719085693359375, 0.81536865234375, 0.911651611328125, 1.0079345703125, 1.104217529296875, 1.20050048828125, 1.296783447265625, 1.39306640625, 1.489349365234375, 1.58563232421875, 1.681915283203125, 1.7781982421875, 1.874481201171875, 1.97076416015625, 2.067047119140625, 2.163330078125, 2.259613037109375, 2.35589599609375, 2.452178955078125, 2.5484619140625, 2.644744873046875, 2.74102783203125, 2.837310791015625, 2.93359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 30.0, 54.0, 81.0, 172.0, 468.0, 1135.0, 1205.0, 480.0, 209.0, 75.0, 57.0, 19.0, 16.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.090606689453125, -3.00933837890625, -2.928070068359375, -2.8468017578125, -2.765533447265625, -2.68426513671875, -2.602996826171875, -2.521728515625, -2.440460205078125, -2.35919189453125, -2.277923583984375, -2.1966552734375, -2.115386962890625, -2.03411865234375, -1.952850341796875, -1.87158203125, -1.790313720703125, -1.70904541015625, -1.627777099609375, -1.5465087890625, -1.465240478515625, -1.38397216796875, -1.302703857421875, -1.221435546875, -1.140167236328125, -1.05889892578125, -0.977630615234375, -0.8963623046875, -0.815093994140625, -0.73382568359375, -0.652557373046875, -0.5712890625, -0.490020751953125, -0.40875244140625, -0.327484130859375, -0.2462158203125, -0.164947509765625, -0.08367919921875, -0.002410888671875, 0.078857421875, 0.160125732421875, 0.24139404296875, 0.322662353515625, 0.4039306640625, 0.485198974609375, 0.56646728515625, 0.647735595703125, 0.72900390625, 0.810272216796875, 0.89154052734375, 0.972808837890625, 1.0540771484375, 1.135345458984375, 1.21661376953125, 1.297882080078125, 1.379150390625, 1.460418701171875, 1.54168701171875, 1.622955322265625, 1.7042236328125, 1.785491943359375, 1.86676025390625, 1.948028564453125, 2.029296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 15.0, 58.0, 253.0, 387.0, 203.0, 47.0, 16.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.369407653808594, -18.183977127075195, -16.99854850769043, -15.813117980957031, -14.627687454223633, -13.44225788116455, -12.256828308105469, -11.07139778137207, -9.885968208312988, -8.700538635253906, -7.515108108520508, -6.329678535461426, -5.1442484855651855, -3.9588184356689453, -2.7733888626098633, -1.5879583358764648, -0.4025287628173828, 0.7829011678695679, 1.9683310985565186, 3.1537609100341797, 4.33919095993042, 5.52462100982666, 6.710050582885742, 7.895481109619141, 9.080910682678223, 10.266340255737305, 11.451770782470703, 12.637200355529785, 13.822629928588867, 15.008060455322266, 16.19348907470703, 17.378921508789062, 18.564350128173828, 19.749780654907227, 20.935209274291992, 22.12063980102539, 23.30607032775879, 24.491500854492188, 25.676929473876953, 26.86236000061035, 28.04779052734375, 29.23322105407715, 30.418649673461914, 31.604080200195312, 32.78950881958008, 33.97494125366211, 35.160369873046875, 36.345802307128906, 37.531227111816406, 38.71665573120117, 39.9020881652832, 41.08751678466797, 42.272945404052734, 43.458377838134766, 44.64380645751953, 45.82923889160156, 47.01466751098633, 48.200096130371094, 49.385528564453125, 50.57095718383789, 51.756385803222656, 52.94181823730469, 54.12724685668945, 55.31267547607422, 56.49810791015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 12.0, 11.0, 10.0, 23.0, 23.0, 32.0, 34.0, 39.0, 53.0, 48.0, 45.0, 49.0, 49.0, 59.0, 42.0, 50.0, 61.0, 54.0, 43.0, 37.0, 53.0, 32.0, 22.0, 22.0, 24.0, 15.0, 13.0, 7.0, 4.0, 7.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.749755382537842, -7.472809791564941, -7.195863723754883, -6.918918132781982, -6.641972064971924, -6.365026473999023, -6.088080406188965, -5.8111348152160645, -5.534189224243164, -5.257243633270264, -4.980297565460205, -4.703351974487305, -4.426405906677246, -4.149460315704346, -3.872514486312866, -3.5955686569213867, -3.318622589111328, -3.0416767597198486, -2.764730930328369, -2.4877853393554688, -2.21083927154541, -1.9338935613632202, -1.6569478511810303, -1.3800020217895508, -1.1030561923980713, -0.8261103630065918, -0.5491645932197571, -0.27221882343292236, 0.004727005958557129, 0.2816728353500366, 0.5586185455322266, 0.835564374923706, 1.1125097274780273, 1.3894555568695068, 1.6664013862609863, 1.9433470964431763, 2.2202930450439453, 2.4972386360168457, 2.774184465408325, 3.0511302947998047, 3.328076124191284, 3.6050219535827637, 3.881967782974243, 4.158913612365723, 4.435859203338623, 4.712805271148682, 4.989750862121582, 5.266696929931641, 5.543642520904541, 5.820588111877441, 6.0975341796875, 6.3744797706604, 6.651425838470459, 6.928371429443359, 7.205317497253418, 7.482263088226318, 7.759208679199219, 8.036154747009277, 8.31309986114502, 8.590045928955078, 8.866991996765137, 9.143938064575195, 9.420883178710938, 9.697829246520996, 9.974775314331055]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 12.0, 24.0, 27.0, 34.0, 62.0, 106.0, 145.0, 248.0, 504.0, 833.0, 1511.0, 3229.0, 7003.0, 16738.0, 45458.0, 136654.0, 401281.0, 290985.0, 89678.0, 31264.0, 12339.0, 5235.0, 2393.0, 1205.0, 636.0, 343.0, 213.0, 132.0, 73.0, 49.0, 38.0, 26.0, 9.0, 10.0, 11.0, 10.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9460601806640625, -1.890167236328125, -1.8342742919921875, -1.77838134765625, -1.7224884033203125, -1.666595458984375, -1.6107025146484375, -1.5548095703125, -1.4989166259765625, -1.443023681640625, -1.3871307373046875, -1.33123779296875, -1.2753448486328125, -1.219451904296875, -1.1635589599609375, -1.107666015625, -1.0517730712890625, -0.995880126953125, -0.9399871826171875, -0.88409423828125, -0.8282012939453125, -0.772308349609375, -0.7164154052734375, -0.6605224609375, -0.6046295166015625, -0.548736572265625, -0.4928436279296875, -0.43695068359375, -0.3810577392578125, -0.325164794921875, -0.2692718505859375, -0.21337890625, -0.1574859619140625, -0.101593017578125, -0.0457000732421875, 0.01019287109375, 0.0660858154296875, 0.121978759765625, 0.1778717041015625, 0.2337646484375, 0.2896575927734375, 0.345550537109375, 0.4014434814453125, 0.45733642578125, 0.5132293701171875, 0.569122314453125, 0.6250152587890625, 0.680908203125, 0.7368011474609375, 0.792694091796875, 0.8485870361328125, 0.90447998046875, 0.9603729248046875, 1.016265869140625, 1.0721588134765625, 1.1280517578125, 1.1839447021484375, 1.239837646484375, 1.2957305908203125, 1.35162353515625, 1.4075164794921875, 1.463409423828125, 1.5193023681640625, 1.5751953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 8.0, 15.0, 8.0, 21.0, 19.0, 19.0, 29.0, 44.0, 39.0, 39.0, 59.0, 46.0, 51.0, 50.0, 58.0, 54.0, 54.0, 34.0, 39.0, 59.0, 32.0, 42.0, 29.0, 33.0, 20.0, 11.0, 15.0, 9.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.98291015625, -0.9573593139648438, -0.9318084716796875, -0.9062576293945312, -0.880706787109375, -0.8551559448242188, -0.8296051025390625, -0.8040542602539062, -0.77850341796875, -0.7529525756835938, -0.7274017333984375, -0.7018508911132812, -0.676300048828125, -0.6507492065429688, -0.6251983642578125, -0.5996475219726562, -0.5740966796875, -0.5485458374023438, -0.5229949951171875, -0.49744415283203125, -0.471893310546875, -0.44634246826171875, -0.4207916259765625, -0.39524078369140625, -0.36968994140625, -0.34413909912109375, -0.3185882568359375, -0.29303741455078125, -0.267486572265625, -0.24193572998046875, -0.2163848876953125, -0.19083404541015625, -0.165283203125, -0.13973236083984375, -0.1141815185546875, -0.08863067626953125, -0.063079833984375, -0.03752899169921875, -0.0119781494140625, 0.01357269287109375, 0.03912353515625, 0.06467437744140625, 0.0902252197265625, 0.11577606201171875, 0.141326904296875, 0.16687774658203125, 0.1924285888671875, 0.21797943115234375, 0.2435302734375, 0.26908111572265625, 0.2946319580078125, 0.32018280029296875, 0.345733642578125, 0.37128448486328125, 0.3968353271484375, 0.42238616943359375, 0.44793701171875, 0.47348785400390625, 0.4990386962890625, 0.5245895385742188, 0.550140380859375, 0.5756912231445312, 0.6012420654296875, 0.6267929077148438, 0.65234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 10.0, 8.0, 36.0, 43.0, 49.0, 83.0, 128.0, 242.0, 391.0, 736.0, 1552.0, 4132.0, 18365.0, 135598.0, 740389.0, 122342.0, 17160.0, 4166.0, 1465.0, 678.0, 332.0, 201.0, 134.0, 90.0, 54.0, 48.0, 26.0, 15.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.631103515625, -2.52783203125, -2.424560546875, -2.3212890625, -2.218017578125, -2.11474609375, -2.011474609375, -1.908203125, -1.804931640625, -1.70166015625, -1.598388671875, -1.4951171875, -1.391845703125, -1.28857421875, -1.185302734375, -1.08203125, -0.978759765625, -0.87548828125, -0.772216796875, -0.6689453125, -0.565673828125, -0.46240234375, -0.359130859375, -0.255859375, -0.152587890625, -0.04931640625, 0.053955078125, 0.1572265625, 0.260498046875, 0.36376953125, 0.467041015625, 0.5703125, 0.673583984375, 0.77685546875, 0.880126953125, 0.9833984375, 1.086669921875, 1.18994140625, 1.293212890625, 1.396484375, 1.499755859375, 1.60302734375, 1.706298828125, 1.8095703125, 1.912841796875, 2.01611328125, 2.119384765625, 2.22265625, 2.325927734375, 2.42919921875, 2.532470703125, 2.6357421875, 2.739013671875, 2.84228515625, 2.945556640625, 3.048828125, 3.152099609375, 3.25537109375, 3.358642578125, 3.4619140625, 3.565185546875, 3.66845703125, 3.771728515625, 3.875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 8.0, 12.0, 11.0, 14.0, 18.0, 19.0, 22.0, 23.0, 30.0, 36.0, 36.0, 37.0, 39.0, 45.0, 45.0, 49.0, 39.0, 46.0, 58.0, 53.0, 37.0, 37.0, 49.0, 32.0, 25.0, 30.0, 16.0, 15.0, 14.0, 13.0, 13.0, 8.0, 10.0, 12.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.78515625, -2.70001220703125, -2.6148681640625, -2.52972412109375, -2.444580078125, -2.35943603515625, -2.2742919921875, -2.18914794921875, -2.10400390625, -2.01885986328125, -1.9337158203125, -1.84857177734375, -1.763427734375, -1.67828369140625, -1.5931396484375, -1.50799560546875, -1.4228515625, -1.33770751953125, -1.2525634765625, -1.16741943359375, -1.082275390625, -0.99713134765625, -0.9119873046875, -0.82684326171875, -0.74169921875, -0.65655517578125, -0.5714111328125, -0.48626708984375, -0.401123046875, -0.31597900390625, -0.2308349609375, -0.14569091796875, -0.060546875, 0.02459716796875, 0.1097412109375, 0.19488525390625, 0.280029296875, 0.36517333984375, 0.4503173828125, 0.53546142578125, 0.62060546875, 0.70574951171875, 0.7908935546875, 0.87603759765625, 0.961181640625, 1.04632568359375, 1.1314697265625, 1.21661376953125, 1.3017578125, 1.38690185546875, 1.4720458984375, 1.55718994140625, 1.642333984375, 1.72747802734375, 1.8126220703125, 1.89776611328125, 1.98291015625, 2.06805419921875, 2.1531982421875, 2.23834228515625, 2.323486328125, 2.40863037109375, 2.4937744140625, 2.57891845703125, 2.6640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 7.0, 12.0, 29.0, 47.0, 108.0, 345.0, 2171.0, 256132.0, 786085.0, 2970.0, 422.0, 122.0, 52.0, 15.0, 14.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.790130615234375, -3.64471435546875, -3.499298095703125, -3.3538818359375, -3.208465576171875, -3.06304931640625, -2.917633056640625, -2.772216796875, -2.626800537109375, -2.48138427734375, -2.335968017578125, -2.1905517578125, -2.045135498046875, -1.89971923828125, -1.754302978515625, -1.60888671875, -1.463470458984375, -1.31805419921875, -1.172637939453125, -1.0272216796875, -0.881805419921875, -0.73638916015625, -0.590972900390625, -0.445556640625, -0.300140380859375, -0.15472412109375, -0.009307861328125, 0.1361083984375, 0.281524658203125, 0.42694091796875, 0.572357177734375, 0.7177734375, 0.863189697265625, 1.00860595703125, 1.154022216796875, 1.2994384765625, 1.444854736328125, 1.59027099609375, 1.735687255859375, 1.881103515625, 2.026519775390625, 2.17193603515625, 2.317352294921875, 2.4627685546875, 2.608184814453125, 2.75360107421875, 2.899017333984375, 3.04443359375, 3.189849853515625, 3.33526611328125, 3.480682373046875, 3.6260986328125, 3.771514892578125, 3.91693115234375, 4.062347412109375, 4.207763671875, 4.353179931640625, 4.49859619140625, 4.644012451171875, 4.7894287109375, 4.934844970703125, 5.08026123046875, 5.225677490234375, 5.37109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 10.0, 8.0, 5.0, 8.0, 11.0, 20.0, 16.0, 34.0, 40.0, 63.0, 74.0, 108.0, 143.0, 130.0, 85.0, 66.0, 43.0, 34.0, 16.0, 24.0, 6.0, 13.0, 16.0, 4.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016164779663085938, -0.00015586242079734802, -0.00015007704496383667, -0.00014429166913032532, -0.00013850629329681396, -0.0001327209174633026, -0.00012693554162979126, -0.00012115016579627991, -0.00011536478996276855, -0.0001095794141292572, -0.00010379403829574585, -9.80086624622345e-05, -9.222328662872314e-05, -8.643791079521179e-05, -8.065253496170044e-05, -7.486715912818909e-05, -6.908178329467773e-05, -6.329640746116638e-05, -5.751103162765503e-05, -5.172565579414368e-05, -4.5940279960632324e-05, -4.015490412712097e-05, -3.436952829360962e-05, -2.8584152460098267e-05, -2.2798776626586914e-05, -1.701340079307556e-05, -1.1228024959564209e-05, -5.4426491260528564e-06, 3.427267074584961e-07, 6.128102540969849e-06, 1.1913478374481201e-05, 1.7698854207992554e-05, 2.3484230041503906e-05, 2.926960587501526e-05, 3.505498170852661e-05, 4.0840357542037964e-05, 4.6625733375549316e-05, 5.241110920906067e-05, 5.819648504257202e-05, 6.398186087608337e-05, 6.976723670959473e-05, 7.555261254310608e-05, 8.133798837661743e-05, 8.712336421012878e-05, 9.290874004364014e-05, 9.869411587715149e-05, 0.00010447949171066284, 0.0001102648675441742, 0.00011605024337768555, 0.0001218356192111969, 0.00012762099504470825, 0.0001334063708782196, 0.00013919174671173096, 0.0001449771225452423, 0.00015076249837875366, 0.00015654787421226501, 0.00016233325004577637, 0.00016811862587928772, 0.00017390400171279907, 0.00017968937754631042, 0.00018547475337982178, 0.00019126012921333313, 0.00019704550504684448, 0.00020283088088035583, 0.0002086162567138672]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 11.0, 15.0, 26.0, 40.0, 66.0, 114.0, 222.0, 477.0, 1117.0, 3599.0, 18200.0, 275592.0, 704149.0, 36440.0, 5583.0, 1672.0, 584.0, 264.0, 141.0, 74.0, 55.0, 29.0, 27.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.975067138671875, -0.92669677734375, -0.878326416015625, -0.8299560546875, -0.781585693359375, -0.73321533203125, -0.684844970703125, -0.636474609375, -0.588104248046875, -0.53973388671875, -0.491363525390625, -0.4429931640625, -0.394622802734375, -0.34625244140625, -0.297882080078125, -0.24951171875, -0.201141357421875, -0.15277099609375, -0.104400634765625, -0.0560302734375, -0.007659912109375, 0.04071044921875, 0.089080810546875, 0.137451171875, 0.185821533203125, 0.23419189453125, 0.282562255859375, 0.3309326171875, 0.379302978515625, 0.42767333984375, 0.476043701171875, 0.5244140625, 0.572784423828125, 0.62115478515625, 0.669525146484375, 0.7178955078125, 0.766265869140625, 0.81463623046875, 0.863006591796875, 0.911376953125, 0.959747314453125, 1.00811767578125, 1.056488037109375, 1.1048583984375, 1.153228759765625, 1.20159912109375, 1.249969482421875, 1.29833984375, 1.346710205078125, 1.39508056640625, 1.443450927734375, 1.4918212890625, 1.540191650390625, 1.58856201171875, 1.636932373046875, 1.685302734375, 1.733673095703125, 1.78204345703125, 1.830413818359375, 1.8787841796875, 1.927154541015625, 1.97552490234375, 2.023895263671875, 2.072265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 12.0, 10.0, 22.0, 36.0, 43.0, 65.0, 87.0, 107.0, 128.0, 121.0, 93.0, 73.0, 50.0, 49.0, 36.0, 17.0, 13.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.980621337890625, -0.94268798828125, -0.904754638671875, -0.8668212890625, -0.828887939453125, -0.79095458984375, -0.753021240234375, -0.715087890625, -0.677154541015625, -0.63922119140625, -0.601287841796875, -0.5633544921875, -0.525421142578125, -0.48748779296875, -0.449554443359375, -0.41162109375, -0.373687744140625, -0.33575439453125, -0.297821044921875, -0.2598876953125, -0.221954345703125, -0.18402099609375, -0.146087646484375, -0.108154296875, -0.070220947265625, -0.03228759765625, 0.005645751953125, 0.0435791015625, 0.081512451171875, 0.11944580078125, 0.157379150390625, 0.1953125, 0.233245849609375, 0.27117919921875, 0.309112548828125, 0.3470458984375, 0.384979248046875, 0.42291259765625, 0.460845947265625, 0.498779296875, 0.536712646484375, 0.57464599609375, 0.612579345703125, 0.6505126953125, 0.688446044921875, 0.72637939453125, 0.764312744140625, 0.80224609375, 0.840179443359375, 0.87811279296875, 0.916046142578125, 0.9539794921875, 0.991912841796875, 1.02984619140625, 1.067779541015625, 1.105712890625, 1.143646240234375, 1.18157958984375, 1.219512939453125, 1.2574462890625, 1.295379638671875, 1.33331298828125, 1.371246337890625, 1.4091796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 69.0, 183.0, 351.0, 229.0, 71.0, 31.0, 10.0, 10.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.86699676513672, -38.75015640258789, -37.63331604003906, -36.516475677490234, -35.399635314941406, -34.28279495239258, -33.16595458984375, -32.04911804199219, -30.932275772094727, -29.8154354095459, -28.69859504699707, -27.581754684448242, -26.464916229248047, -25.34807586669922, -24.23123550415039, -23.114395141601562, -21.997554779052734, -20.880714416503906, -19.763874053955078, -18.64703369140625, -17.530193328857422, -16.413352966308594, -15.296514511108398, -14.17967414855957, -13.062833786010742, -11.945993423461914, -10.829153060913086, -9.712313652038574, -8.595473289489746, -7.478632926940918, -6.361793041229248, -5.244953155517578, -4.12811279296875, -3.011272668838501, -1.894432544708252, -0.7775924205780029, 0.3392477035522461, 1.4560880661010742, 2.572927951812744, 3.689767837524414, 4.806608200073242, 5.92344856262207, 7.04028844833374, 8.15712833404541, 9.273968696594238, 10.390809059143066, 11.507648468017578, 12.624488830566406, 13.741329193115234, 14.858169555664062, 15.97500991821289, 17.09185028076172, 18.208690643310547, 19.325531005859375, 20.44236946105957, 21.5592098236084, 22.676050186157227, 23.792890548706055, 24.909730911254883, 26.02657127380371, 27.143409729003906, 28.260250091552734, 29.377090454101562, 30.49393081665039, 31.61077117919922]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 9.0, 10.0, 15.0, 11.0, 23.0, 19.0, 29.0, 29.0, 34.0, 40.0, 37.0, 45.0, 55.0, 45.0, 55.0, 51.0, 52.0, 52.0, 49.0, 43.0, 31.0, 34.0, 25.0, 19.0, 25.0, 24.0, 21.0, 19.0, 16.0, 13.0, 7.0, 13.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.482670783996582, -9.140835762023926, -8.79900074005127, -8.457165718078613, -8.115331649780273, -7.773496150970459, -7.431661605834961, -7.089826583862305, -6.747991561889648, -6.406156539916992, -6.064321517944336, -5.722486972808838, -5.380651950836182, -5.038816928863525, -4.696982383728027, -4.355147361755371, -4.013312339782715, -3.6714773178100586, -3.3296425342559814, -2.9878077507019043, -2.645972728729248, -2.304137706756592, -1.9623029232025146, -1.6204681396484375, -1.2786331176757812, -0.9367982149124146, -0.5949633121490479, -0.25312840938568115, 0.08870649337768555, 0.43054139614105225, 0.772376298904419, 1.114211082458496, 1.456045150756836, 1.7978800535202026, 2.1397149562835693, 2.4815497398376465, 2.8233847618103027, 3.165219783782959, 3.507054567337036, 3.8488893508911133, 4.1907243728637695, 4.532559394836426, 4.874394416809082, 5.21622896194458, 5.558063983917236, 5.899899005889893, 6.241733551025391, 6.583568572998047, 6.925403594970703, 7.267238616943359, 7.609073638916016, 7.950908184051514, 8.292743682861328, 8.634577751159668, 8.976412773132324, 9.31824779510498, 9.660082817077637, 10.001917839050293, 10.34375286102295, 10.685587882995605, 11.027421951293945, 11.369256973266602, 11.711091995239258, 12.052927017211914, 12.39476203918457]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 14.0, 4.0, 9.0, 23.0, 26.0, 34.0, 38.0, 59.0, 86.0, 121.0, 178.0, 294.0, 444.0, 804.0, 1394.0, 2636.0, 5661.0, 13338.0, 37410.0, 147057.0, 1218279.0, 2385928.0, 287098.0, 58793.0, 19009.0, 7535.0, 3557.0, 1805.0, 973.0, 558.0, 370.0, 233.0, 156.0, 98.0, 61.0, 57.0, 38.0, 26.0, 20.0, 12.0, 11.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.306640625, -1.2684173583984375, -1.230194091796875, -1.1919708251953125, -1.15374755859375, -1.1155242919921875, -1.077301025390625, -1.0390777587890625, -1.0008544921875, -0.9626312255859375, -0.924407958984375, -0.8861846923828125, -0.84796142578125, -0.8097381591796875, -0.771514892578125, -0.7332916259765625, -0.695068359375, -0.6568450927734375, -0.618621826171875, -0.5803985595703125, -0.54217529296875, -0.5039520263671875, -0.465728759765625, -0.4275054931640625, -0.3892822265625, -0.3510589599609375, -0.312835693359375, -0.2746124267578125, -0.23638916015625, -0.1981658935546875, -0.159942626953125, -0.1217193603515625, -0.08349609375, -0.0452728271484375, -0.007049560546875, 0.0311737060546875, 0.06939697265625, 0.1076202392578125, 0.145843505859375, 0.1840667724609375, 0.2222900390625, 0.2605133056640625, 0.298736572265625, 0.3369598388671875, 0.37518310546875, 0.4134063720703125, 0.451629638671875, 0.4898529052734375, 0.528076171875, 0.5662994384765625, 0.604522705078125, 0.6427459716796875, 0.68096923828125, 0.7191925048828125, 0.757415771484375, 0.7956390380859375, 0.8338623046875, 0.8720855712890625, 0.910308837890625, 0.9485321044921875, 0.98675537109375, 1.0249786376953125, 1.063201904296875, 1.1014251708984375, 1.1396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 20.0, 21.0, 30.0, 43.0, 49.0, 60.0, 67.0, 81.0, 81.0, 81.0, 69.0, 72.0, 68.0, 51.0, 57.0, 42.0, 26.0, 14.0, 19.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1061859130859375, -1.070770263671875, -1.0353546142578125, -0.99993896484375, -0.9645233154296875, -0.929107666015625, -0.8936920166015625, -0.8582763671875, -0.8228607177734375, -0.787445068359375, -0.7520294189453125, -0.71661376953125, -0.6811981201171875, -0.645782470703125, -0.6103668212890625, -0.574951171875, -0.5395355224609375, -0.504119873046875, -0.4687042236328125, -0.43328857421875, -0.3978729248046875, -0.362457275390625, -0.3270416259765625, -0.2916259765625, -0.2562103271484375, -0.220794677734375, -0.1853790283203125, -0.14996337890625, -0.1145477294921875, -0.079132080078125, -0.0437164306640625, -0.00830078125, 0.0271148681640625, 0.062530517578125, 0.0979461669921875, 0.13336181640625, 0.1687774658203125, 0.204193115234375, 0.2396087646484375, 0.2750244140625, 0.3104400634765625, 0.345855712890625, 0.3812713623046875, 0.41668701171875, 0.4521026611328125, 0.487518310546875, 0.5229339599609375, 0.558349609375, 0.5937652587890625, 0.629180908203125, 0.6645965576171875, 0.70001220703125, 0.7354278564453125, 0.770843505859375, 0.8062591552734375, 0.8416748046875, 0.8770904541015625, 0.912506103515625, 0.9479217529296875, 0.98333740234375, 1.0187530517578125, 1.054168701171875, 1.0895843505859375, 1.125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 12.0, 27.0, 23.0, 35.0, 51.0, 74.0, 137.0, 212.0, 415.0, 847.0, 2156.0, 6016.0, 20020.0, 86916.0, 983631.0, 2865149.0, 180300.0, 33731.0, 9169.0, 2966.0, 1187.0, 523.0, 276.0, 145.0, 79.0, 48.0, 36.0, 23.0, 22.0, 11.0, 10.0, 3.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.707122802734375, -1.65057373046875, -1.594024658203125, -1.5374755859375, -1.480926513671875, -1.42437744140625, -1.367828369140625, -1.311279296875, -1.254730224609375, -1.19818115234375, -1.141632080078125, -1.0850830078125, -1.028533935546875, -0.97198486328125, -0.915435791015625, -0.85888671875, -0.802337646484375, -0.74578857421875, -0.689239501953125, -0.6326904296875, -0.576141357421875, -0.51959228515625, -0.463043212890625, -0.406494140625, -0.349945068359375, -0.29339599609375, -0.236846923828125, -0.1802978515625, -0.123748779296875, -0.06719970703125, -0.010650634765625, 0.0458984375, 0.102447509765625, 0.15899658203125, 0.215545654296875, 0.2720947265625, 0.328643798828125, 0.38519287109375, 0.441741943359375, 0.498291015625, 0.554840087890625, 0.61138916015625, 0.667938232421875, 0.7244873046875, 0.781036376953125, 0.83758544921875, 0.894134521484375, 0.95068359375, 1.007232666015625, 1.06378173828125, 1.120330810546875, 1.1768798828125, 1.233428955078125, 1.28997802734375, 1.346527099609375, 1.403076171875, 1.459625244140625, 1.51617431640625, 1.572723388671875, 1.6292724609375, 1.685821533203125, 1.74237060546875, 1.798919677734375, 1.85546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 10.0, 11.0, 21.0, 16.0, 27.0, 28.0, 43.0, 40.0, 63.0, 111.0, 138.0, 210.0, 330.0, 494.0, 553.0, 584.0, 395.0, 275.0, 186.0, 120.0, 89.0, 62.0, 53.0, 39.0, 29.0, 18.0, 17.0, 12.0, 17.0, 14.0, 7.0, 3.0, 6.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.494140625, -1.4512481689453125, -1.408355712890625, -1.3654632568359375, -1.32257080078125, -1.2796783447265625, -1.236785888671875, -1.1938934326171875, -1.1510009765625, -1.1081085205078125, -1.065216064453125, -1.0223236083984375, -0.97943115234375, -0.9365386962890625, -0.893646240234375, -0.8507537841796875, -0.807861328125, -0.7649688720703125, -0.722076416015625, -0.6791839599609375, -0.63629150390625, -0.5933990478515625, -0.550506591796875, -0.5076141357421875, -0.4647216796875, -0.4218292236328125, -0.378936767578125, -0.3360443115234375, -0.29315185546875, -0.2502593994140625, -0.207366943359375, -0.1644744873046875, -0.12158203125, -0.0786895751953125, -0.035797119140625, 0.0070953369140625, 0.04998779296875, 0.0928802490234375, 0.135772705078125, 0.1786651611328125, 0.2215576171875, 0.2644500732421875, 0.307342529296875, 0.3502349853515625, 0.39312744140625, 0.4360198974609375, 0.478912353515625, 0.5218048095703125, 0.564697265625, 0.6075897216796875, 0.650482177734375, 0.6933746337890625, 0.73626708984375, 0.7791595458984375, 0.822052001953125, 0.8649444580078125, 0.9078369140625, 0.9507293701171875, 0.993621826171875, 1.0365142822265625, 1.07940673828125, 1.1222991943359375, 1.165191650390625, 1.2080841064453125, 1.2509765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 9.0, 13.0, 26.0, 64.0, 107.0, 164.0, 192.0, 161.0, 116.0, 62.0, 38.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.264766693115234, -22.661638259887695, -22.058509826660156, -21.45538330078125, -20.85225486755371, -20.249126434326172, -19.645998001098633, -19.042869567871094, -18.439743041992188, -17.83661460876465, -17.23348617553711, -16.630359649658203, -16.027231216430664, -15.424102783203125, -14.820974349975586, -14.217846870422363, -13.614718437194824, -13.011590003967285, -12.408462524414062, -11.805334091186523, -11.2022066116333, -10.599078178405762, -9.995950698852539, -9.392822265625, -8.789693832397461, -8.186565399169922, -7.583437919616699, -6.98030948638916, -6.3771820068359375, -5.774053573608398, -5.170925617218018, -4.567797660827637, -3.9646692276000977, -3.361541271209717, -2.758413314819336, -2.155285120010376, -1.5521571636199951, -0.9490292072296143, -0.3459010124206543, 0.25722694396972656, 0.8603549003601074, 1.4634828567504883, 2.066610813140869, 2.669739007949829, 3.27286696434021, 3.875994920730591, 4.479123115539551, 5.082251071929932, 5.6853790283203125, 6.288506984710693, 6.891634941101074, 7.494763374328613, 8.097890853881836, 8.701019287109375, 9.304147720336914, 9.907275199890137, 10.51040267944336, 11.113531112670898, 11.716658592224121, 12.31978702545166, 12.922914505004883, 13.526042938232422, 14.129171371459961, 14.732298851013184, 15.335427284240723]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 12.0, 15.0, 15.0, 17.0, 24.0, 14.0, 34.0, 36.0, 45.0, 55.0, 42.0, 72.0, 56.0, 63.0, 66.0, 65.0, 33.0, 49.0, 42.0, 42.0, 32.0, 20.0, 22.0, 33.0, 20.0, 25.0, 13.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.27517318725586, -9.972159385681152, -9.669144630432129, -9.366130828857422, -9.063117027282715, -8.760102272033691, -8.457088470458984, -8.154073715209961, -7.851059913635254, -7.548045635223389, -7.245031833648682, -6.942017555236816, -6.639003276824951, -6.335988998413086, -6.032975196838379, -5.729960918426514, -5.426947116851807, -5.123932838439941, -4.820919036865234, -4.517904758453369, -4.214890480041504, -3.9118764400482178, -3.6088624000549316, -3.3058481216430664, -3.0028340816497803, -2.699820041656494, -2.396805763244629, -2.0937917232513428, -1.790777564048767, -1.4877634048461914, -1.1847493648529053, -0.88173508644104, -0.5787210464477539, -0.2757069170475006, 0.027307212352752686, 0.3303213119506836, 0.6333354711532593, 0.936349630355835, 1.239363670349121, 1.5423779487609863, 1.8453919887542725, 2.1484060287475586, 2.451420307159424, 2.75443434715271, 3.057448387145996, 3.3604626655578613, 3.6634767055511475, 3.9664909839630127, 4.269505023956299, 4.572519302368164, 4.875533103942871, 5.178547382354736, 5.481561660766602, 5.784575462341309, 6.087589740753174, 6.390604019165039, 6.693617820739746, 6.996632099151611, 7.299645900726318, 7.602660179138184, 7.905674457550049, 8.208688735961914, 8.511702537536621, 8.814716339111328, 9.117731094360352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 5.0, 8.0, 21.0, 20.0, 25.0, 28.0, 52.0, 73.0, 115.0, 147.0, 241.0, 341.0, 552.0, 1085.0, 1862.0, 3515.0, 7308.0, 16444.0, 38229.0, 93208.0, 225661.0, 352007.0, 177667.0, 73458.0, 30568.0, 13069.0, 5974.0, 2937.0, 1592.0, 847.0, 477.0, 308.0, 216.0, 148.0, 81.0, 68.0, 61.0, 27.0, 31.0, 17.0, 10.0, 7.0, 11.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.546875, -1.501861572265625, -1.45684814453125, -1.411834716796875, -1.3668212890625, -1.321807861328125, -1.27679443359375, -1.231781005859375, -1.186767578125, -1.141754150390625, -1.09674072265625, -1.051727294921875, -1.0067138671875, -0.961700439453125, -0.91668701171875, -0.871673583984375, -0.82666015625, -0.781646728515625, -0.73663330078125, -0.691619873046875, -0.6466064453125, -0.601593017578125, -0.55657958984375, -0.511566162109375, -0.466552734375, -0.421539306640625, -0.37652587890625, -0.331512451171875, -0.2864990234375, -0.241485595703125, -0.19647216796875, -0.151458740234375, -0.1064453125, -0.061431884765625, -0.01641845703125, 0.028594970703125, 0.0736083984375, 0.118621826171875, 0.16363525390625, 0.208648681640625, 0.253662109375, 0.298675537109375, 0.34368896484375, 0.388702392578125, 0.4337158203125, 0.478729248046875, 0.52374267578125, 0.568756103515625, 0.61376953125, 0.658782958984375, 0.70379638671875, 0.748809814453125, 0.7938232421875, 0.838836669921875, 0.88385009765625, 0.928863525390625, 0.973876953125, 1.018890380859375, 1.06390380859375, 1.108917236328125, 1.1539306640625, 1.198944091796875, 1.24395751953125, 1.288970947265625, 1.333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 17.0, 26.0, 32.0, 50.0, 54.0, 53.0, 59.0, 72.0, 91.0, 81.0, 80.0, 81.0, 66.0, 60.0, 47.0, 27.0, 26.0, 20.0, 10.0, 12.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.11456298828125, -1.0787353515625, -1.04290771484375, -1.007080078125, -0.97125244140625, -0.9354248046875, -0.89959716796875, -0.86376953125, -0.82794189453125, -0.7921142578125, -0.75628662109375, -0.720458984375, -0.68463134765625, -0.6488037109375, -0.61297607421875, -0.5771484375, -0.54132080078125, -0.5054931640625, -0.46966552734375, -0.433837890625, -0.39801025390625, -0.3621826171875, -0.32635498046875, -0.29052734375, -0.25469970703125, -0.2188720703125, -0.18304443359375, -0.147216796875, -0.11138916015625, -0.0755615234375, -0.03973388671875, -0.00390625, 0.03192138671875, 0.0677490234375, 0.10357666015625, 0.139404296875, 0.17523193359375, 0.2110595703125, 0.24688720703125, 0.28271484375, 0.31854248046875, 0.3543701171875, 0.39019775390625, 0.426025390625, 0.46185302734375, 0.4976806640625, 0.53350830078125, 0.5693359375, 0.60516357421875, 0.6409912109375, 0.67681884765625, 0.712646484375, 0.74847412109375, 0.7843017578125, 0.82012939453125, 0.85595703125, 0.89178466796875, 0.9276123046875, 0.96343994140625, 0.999267578125, 1.03509521484375, 1.0709228515625, 1.10675048828125, 1.142578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 15.0, 22.0, 30.0, 47.0, 64.0, 125.0, 187.0, 346.0, 573.0, 1054.0, 2592.0, 9851.0, 116116.0, 847104.0, 59169.0, 6880.0, 2130.0, 939.0, 508.0, 289.0, 173.0, 117.0, 61.0, 50.0, 29.0, 22.0, 13.0, 8.0, 12.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.56463623046875, -4.4144287109375, -4.26422119140625, -4.114013671875, -3.96380615234375, -3.8135986328125, -3.66339111328125, -3.51318359375, -3.36297607421875, -3.2127685546875, -3.06256103515625, -2.912353515625, -2.76214599609375, -2.6119384765625, -2.46173095703125, -2.3115234375, -2.16131591796875, -2.0111083984375, -1.86090087890625, -1.710693359375, -1.56048583984375, -1.4102783203125, -1.26007080078125, -1.10986328125, -0.95965576171875, -0.8094482421875, -0.65924072265625, -0.509033203125, -0.35882568359375, -0.2086181640625, -0.05841064453125, 0.091796875, 0.24200439453125, 0.3922119140625, 0.54241943359375, 0.692626953125, 0.84283447265625, 0.9930419921875, 1.14324951171875, 1.29345703125, 1.44366455078125, 1.5938720703125, 1.74407958984375, 1.894287109375, 2.04449462890625, 2.1947021484375, 2.34490966796875, 2.4951171875, 2.64532470703125, 2.7955322265625, 2.94573974609375, 3.095947265625, 3.24615478515625, 3.3963623046875, 3.54656982421875, 3.69677734375, 3.84698486328125, 3.9971923828125, 4.14739990234375, 4.297607421875, 4.44781494140625, 4.5980224609375, 4.74822998046875, 4.8984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 2.0, 10.0, 10.0, 12.0, 14.0, 22.0, 17.0, 24.0, 24.0, 37.0, 44.0, 43.0, 43.0, 56.0, 58.0, 59.0, 50.0, 79.0, 63.0, 43.0, 42.0, 39.0, 42.0, 28.0, 20.0, 22.0, 20.0, 7.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.6328125, -3.51812744140625, -3.4034423828125, -3.28875732421875, -3.174072265625, -3.05938720703125, -2.9447021484375, -2.83001708984375, -2.71533203125, -2.60064697265625, -2.4859619140625, -2.37127685546875, -2.256591796875, -2.14190673828125, -2.0272216796875, -1.91253662109375, -1.7978515625, -1.68316650390625, -1.5684814453125, -1.45379638671875, -1.339111328125, -1.22442626953125, -1.1097412109375, -0.99505615234375, -0.88037109375, -0.76568603515625, -0.6510009765625, -0.53631591796875, -0.421630859375, -0.30694580078125, -0.1922607421875, -0.07757568359375, 0.037109375, 0.15179443359375, 0.2664794921875, 0.38116455078125, 0.495849609375, 0.61053466796875, 0.7252197265625, 0.83990478515625, 0.95458984375, 1.06927490234375, 1.1839599609375, 1.29864501953125, 1.413330078125, 1.52801513671875, 1.6427001953125, 1.75738525390625, 1.8720703125, 1.98675537109375, 2.1014404296875, 2.21612548828125, 2.330810546875, 2.44549560546875, 2.5601806640625, 2.67486572265625, 2.78955078125, 2.90423583984375, 3.0189208984375, 3.13360595703125, 3.248291015625, 3.36297607421875, 3.4776611328125, 3.59234619140625, 3.70703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 5.0, 7.0, 13.0, 14.0, 17.0, 13.0, 21.0, 36.0, 42.0, 69.0, 114.0, 155.0, 219.0, 419.0, 985.0, 2986.0, 14526.0, 168576.0, 792568.0, 57215.0, 7121.0, 1733.0, 697.0, 351.0, 186.0, 145.0, 70.0, 60.0, 41.0, 23.0, 29.0, 18.0, 13.0, 12.0, 9.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2494049072265625, -1.210723876953125, -1.1720428466796875, -1.13336181640625, -1.0946807861328125, -1.055999755859375, -1.0173187255859375, -0.9786376953125, -0.9399566650390625, -0.901275634765625, -0.8625946044921875, -0.82391357421875, -0.7852325439453125, -0.746551513671875, -0.7078704833984375, -0.669189453125, -0.6305084228515625, -0.591827392578125, -0.5531463623046875, -0.51446533203125, -0.4757843017578125, -0.437103271484375, -0.3984222412109375, -0.3597412109375, -0.3210601806640625, -0.282379150390625, -0.2436981201171875, -0.20501708984375, -0.1663360595703125, -0.127655029296875, -0.0889739990234375, -0.05029296875, -0.0116119384765625, 0.027069091796875, 0.0657501220703125, 0.10443115234375, 0.1431121826171875, 0.181793212890625, 0.2204742431640625, 0.2591552734375, 0.2978363037109375, 0.336517333984375, 0.3751983642578125, 0.41387939453125, 0.4525604248046875, 0.491241455078125, 0.5299224853515625, 0.568603515625, 0.6072845458984375, 0.645965576171875, 0.6846466064453125, 0.72332763671875, 0.7620086669921875, 0.800689697265625, 0.8393707275390625, 0.8780517578125, 0.9167327880859375, 0.955413818359375, 0.9940948486328125, 1.03277587890625, 1.0714569091796875, 1.110137939453125, 1.1488189697265625, 1.1875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 5.0, 6.0, 16.0, 11.0, 11.0, 16.0, 12.0, 18.0, 25.0, 34.0, 45.0, 55.0, 69.0, 90.0, 106.0, 79.0, 71.0, 65.0, 45.0, 28.0, 28.0, 24.0, 27.0, 13.0, 14.0, 21.0, 7.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013649463653564453, -0.00013159587979316711, -0.0001266971230506897, -0.00012179836630821228, -0.00011689960956573486, -0.00011200085282325745, -0.00010710209608078003, -0.00010220333933830261, -9.73045825958252e-05, -9.240582585334778e-05, -8.750706911087036e-05, -8.260831236839294e-05, -7.770955562591553e-05, -7.281079888343811e-05, -6.79120421409607e-05, -6.301328539848328e-05, -5.811452865600586e-05, -5.321577191352844e-05, -4.8317015171051025e-05, -4.341825842857361e-05, -3.851950168609619e-05, -3.3620744943618774e-05, -2.8721988201141357e-05, -2.382323145866394e-05, -1.8924474716186523e-05, -1.4025717973709106e-05, -9.12696123123169e-06, -4.2282044887542725e-06, 6.705522537231445e-07, 5.5693089962005615e-06, 1.0468065738677979e-05, 1.5366822481155396e-05, 2.0265579223632812e-05, 2.516433596611023e-05, 3.0063092708587646e-05, 3.4961849451065063e-05, 3.986060619354248e-05, 4.47593629360199e-05, 4.9658119678497314e-05, 5.455687642097473e-05, 5.945563316345215e-05, 6.435438990592957e-05, 6.925314664840698e-05, 7.41519033908844e-05, 7.905066013336182e-05, 8.394941687583923e-05, 8.884817361831665e-05, 9.374693036079407e-05, 9.864568710327148e-05, 0.0001035444438457489, 0.00010844320058822632, 0.00011334195733070374, 0.00011824071407318115, 0.00012313947081565857, 0.00012803822755813599, 0.0001329369843006134, 0.00013783574104309082, 0.00014273449778556824, 0.00014763325452804565, 0.00015253201127052307, 0.0001574307680130005, 0.0001623295247554779, 0.00016722828149795532, 0.00017212703824043274, 0.00017702579498291016]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 17.0, 14.0, 16.0, 17.0, 33.0, 46.0, 63.0, 84.0, 126.0, 195.0, 317.0, 629.0, 1329.0, 3839.0, 13773.0, 112238.0, 826733.0, 72269.0, 10952.0, 3202.0, 1243.0, 558.0, 300.0, 156.0, 112.0, 56.0, 55.0, 46.0, 32.0, 24.0, 14.0, 15.0, 10.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2555999755859375, -1.214324951171875, -1.1730499267578125, -1.13177490234375, -1.0904998779296875, -1.049224853515625, -1.0079498291015625, -0.9666748046875, -0.9253997802734375, -0.884124755859375, -0.8428497314453125, -0.80157470703125, -0.7602996826171875, -0.719024658203125, -0.6777496337890625, -0.636474609375, -0.5951995849609375, -0.553924560546875, -0.5126495361328125, -0.47137451171875, -0.4300994873046875, -0.388824462890625, -0.3475494384765625, -0.3062744140625, -0.2649993896484375, -0.223724365234375, -0.1824493408203125, -0.14117431640625, -0.0998992919921875, -0.058624267578125, -0.0173492431640625, 0.02392578125, 0.0652008056640625, 0.106475830078125, 0.1477508544921875, 0.18902587890625, 0.2303009033203125, 0.271575927734375, 0.3128509521484375, 0.3541259765625, 0.3954010009765625, 0.436676025390625, 0.4779510498046875, 0.51922607421875, 0.5605010986328125, 0.601776123046875, 0.6430511474609375, 0.684326171875, 0.7256011962890625, 0.766876220703125, 0.8081512451171875, 0.84942626953125, 0.8907012939453125, 0.931976318359375, 0.9732513427734375, 1.0145263671875, 1.0558013916015625, 1.097076416015625, 1.1383514404296875, 1.17962646484375, 1.2209014892578125, 1.262176513671875, 1.3034515380859375, 1.3447265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 10.0, 17.0, 23.0, 40.0, 37.0, 45.0, 63.0, 81.0, 93.0, 109.0, 112.0, 84.0, 76.0, 46.0, 33.0, 19.0, 18.0, 14.0, 8.0, 10.0, 4.0, 4.0, 7.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92626953125, -0.8948593139648438, -0.8634490966796875, -0.8320388793945312, -0.800628662109375, -0.7692184448242188, -0.7378082275390625, -0.7063980102539062, -0.67498779296875, -0.6435775756835938, -0.6121673583984375, -0.5807571411132812, -0.549346923828125, -0.5179367065429688, -0.4865264892578125, -0.45511627197265625, -0.4237060546875, -0.39229583740234375, -0.3608856201171875, -0.32947540283203125, -0.298065185546875, -0.26665496826171875, -0.2352447509765625, -0.20383453369140625, -0.17242431640625, -0.14101409912109375, -0.1096038818359375, -0.07819366455078125, -0.046783447265625, -0.01537322998046875, 0.0160369873046875, 0.04744720458984375, 0.078857421875, 0.11026763916015625, 0.1416778564453125, 0.17308807373046875, 0.204498291015625, 0.23590850830078125, 0.2673187255859375, 0.29872894287109375, 0.33013916015625, 0.36154937744140625, 0.3929595947265625, 0.42436981201171875, 0.455780029296875, 0.48719024658203125, 0.5186004638671875, 0.5500106811523438, 0.5814208984375, 0.6128311157226562, 0.6442413330078125, 0.6756515502929688, 0.707061767578125, 0.7384719848632812, 0.7698822021484375, 0.8012924194335938, 0.83270263671875, 0.8641128540039062, 0.8955230712890625, 0.9269332885742188, 0.958343505859375, 0.9897537231445312, 1.0211639404296875, 1.0525741577148438, 1.083984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 5.0, 16.0, 21.0, 48.0, 47.0, 102.0, 112.0, 178.0, 166.0, 105.0, 68.0, 51.0, 23.0, 11.0, 7.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.943916320800781, -15.443807601928711, -14.94369888305664, -14.44359016418457, -13.943480491638184, -13.443371772766113, -12.943263053894043, -12.443154335021973, -11.943044662475586, -11.442935943603516, -10.942827224731445, -10.442718505859375, -9.942608833312988, -9.442500114440918, -8.942391395568848, -8.442282676696777, -7.942173957824707, -7.442065238952637, -6.941956043243408, -6.441847324371338, -5.941738128662109, -5.441629409790039, -4.941520690917969, -4.441411972045898, -3.94130277633667, -3.4411938190460205, -2.941084861755371, -2.440976142883301, -1.9408671855926514, -1.440758228302002, -0.9406495094299316, -0.4405405521392822, 0.05956840515136719, 0.5596773028373718, 1.0597862005233765, 1.5598950386047363, 2.0600039958953857, 2.560112953186035, 3.0602216720581055, 3.560330629348755, 4.060439586639404, 4.560548305511475, 5.060657501220703, 5.560766220092773, 6.060874938964844, 6.560984134674072, 7.061092853546143, 7.561202049255371, 8.061310768127441, 8.561419486999512, 9.061528205871582, 9.561637878417969, 10.061746597290039, 10.56185531616211, 11.06196403503418, 11.56207275390625, 12.06218147277832, 12.56229019165039, 13.062398910522461, 13.562507629394531, 14.062617301940918, 14.562726020812988, 15.062834739685059, 15.562943458557129, 16.063053131103516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 9.0, 19.0, 15.0, 22.0, 20.0, 34.0, 21.0, 35.0, 40.0, 38.0, 30.0, 70.0, 86.0, 80.0, 72.0, 53.0, 49.0, 45.0, 37.0, 16.0, 28.0, 24.0, 25.0, 26.0, 11.0, 25.0, 18.0, 14.0, 3.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.230524063110352, -14.78946304321289, -14.348401069641113, -13.907340049743652, -13.466278076171875, -13.025217056274414, -12.584156036376953, -12.143094062805176, -11.702033042907715, -11.260972023010254, -10.819910049438477, -10.378849029541016, -9.937787055969238, -9.496726036071777, -9.0556640625, -8.614603042602539, -8.173542022705078, -7.732480525970459, -7.29141902923584, -6.850358009338379, -6.40929651260376, -5.968235015869141, -5.5271735191345215, -5.086112022399902, -4.645050048828125, -4.203988552093506, -3.762927293777466, -3.3218657970428467, -2.8808045387268066, -2.4397430419921875, -1.9986815452575684, -1.5576202869415283, -1.1165590286254883, -0.6754976511001587, -0.23443621397018433, 0.20662522315979004, 0.6476866006851196, 1.0887479782104492, 1.5298094749450684, 1.9708707332611084, 2.4119322299957275, 2.8529937267303467, 3.2940549850463867, 3.735116481781006, 4.176177978515625, 4.617238998413086, 5.058300971984863, 5.499361991882324, 5.940423488616943, 6.3814849853515625, 6.822546482086182, 7.263607978820801, 7.704668998718262, 8.145730972290039, 8.5867919921875, 9.027853012084961, 9.468914985656738, 9.9099760055542, 10.351037979125977, 10.792098999023438, 11.233160972595215, 11.674221992492676, 12.115283966064453, 12.556344985961914, 12.997406005859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 15.0, 20.0, 28.0, 38.0, 58.0, 100.0, 173.0, 324.0, 687.0, 1637.0, 4340.0, 15467.0, 83652.0, 1501718.0, 2434640.0, 122639.0, 19689.0, 5362.0, 1985.0, 803.0, 384.0, 241.0, 122.0, 51.0, 45.0, 23.0, 17.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.05059814453125, -1.9937744140625, -1.93695068359375, -1.880126953125, -1.82330322265625, -1.7664794921875, -1.70965576171875, -1.65283203125, -1.59600830078125, -1.5391845703125, -1.48236083984375, -1.425537109375, -1.36871337890625, -1.3118896484375, -1.25506591796875, -1.1982421875, -1.14141845703125, -1.0845947265625, -1.02777099609375, -0.970947265625, -0.91412353515625, -0.8572998046875, -0.80047607421875, -0.74365234375, -0.68682861328125, -0.6300048828125, -0.57318115234375, -0.516357421875, -0.45953369140625, -0.4027099609375, -0.34588623046875, -0.2890625, -0.23223876953125, -0.1754150390625, -0.11859130859375, -0.061767578125, -0.00494384765625, 0.0518798828125, 0.10870361328125, 0.16552734375, 0.22235107421875, 0.2791748046875, 0.33599853515625, 0.392822265625, 0.44964599609375, 0.5064697265625, 0.56329345703125, 0.6201171875, 0.67694091796875, 0.7337646484375, 0.79058837890625, 0.847412109375, 0.90423583984375, 0.9610595703125, 1.01788330078125, 1.07470703125, 1.13153076171875, 1.1883544921875, 1.24517822265625, 1.302001953125, 1.35882568359375, 1.4156494140625, 1.47247314453125, 1.529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 6.0, 9.0, 11.0, 7.0, 11.0, 16.0, 16.0, 24.0, 25.0, 25.0, 37.0, 26.0, 49.0, 50.0, 59.0, 56.0, 57.0, 54.0, 63.0, 50.0, 50.0, 52.0, 45.0, 48.0, 27.0, 26.0, 25.0, 13.0, 13.0, 15.0, 5.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.613189697265625, -0.58868408203125, -0.564178466796875, -0.5396728515625, -0.515167236328125, -0.49066162109375, -0.466156005859375, -0.441650390625, -0.417144775390625, -0.39263916015625, -0.368133544921875, -0.3436279296875, -0.319122314453125, -0.29461669921875, -0.270111083984375, -0.24560546875, -0.221099853515625, -0.19659423828125, -0.172088623046875, -0.1475830078125, -0.123077392578125, -0.09857177734375, -0.074066162109375, -0.049560546875, -0.025054931640625, -0.00054931640625, 0.023956298828125, 0.0484619140625, 0.072967529296875, 0.09747314453125, 0.121978759765625, 0.146484375, 0.170989990234375, 0.19549560546875, 0.220001220703125, 0.2445068359375, 0.269012451171875, 0.29351806640625, 0.318023681640625, 0.342529296875, 0.367034912109375, 0.39154052734375, 0.416046142578125, 0.4405517578125, 0.465057373046875, 0.48956298828125, 0.514068603515625, 0.53857421875, 0.563079833984375, 0.58758544921875, 0.612091064453125, 0.6365966796875, 0.661102294921875, 0.68560791015625, 0.710113525390625, 0.734619140625, 0.759124755859375, 0.78363037109375, 0.808135986328125, 0.8326416015625, 0.857147216796875, 0.88165283203125, 0.906158447265625, 0.9306640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 10.0, 8.0, 11.0, 23.0, 25.0, 49.0, 77.0, 109.0, 159.0, 272.0, 485.0, 915.0, 2233.0, 7710.0, 38747.0, 514684.0, 3425594.0, 170953.0, 23130.0, 5449.0, 1862.0, 752.0, 430.0, 249.0, 142.0, 79.0, 62.0, 23.0, 16.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.552734375, -2.4843292236328125, -2.415924072265625, -2.3475189208984375, -2.27911376953125, -2.2107086181640625, -2.142303466796875, -2.0738983154296875, -2.0054931640625, -1.9370880126953125, -1.868682861328125, -1.8002777099609375, -1.73187255859375, -1.6634674072265625, -1.595062255859375, -1.5266571044921875, -1.458251953125, -1.3898468017578125, -1.321441650390625, -1.2530364990234375, -1.18463134765625, -1.1162261962890625, -1.047821044921875, -0.9794158935546875, -0.9110107421875, -0.8426055908203125, -0.774200439453125, -0.7057952880859375, -0.63739013671875, -0.5689849853515625, -0.500579833984375, -0.4321746826171875, -0.36376953125, -0.2953643798828125, -0.226959228515625, -0.1585540771484375, -0.09014892578125, -0.0217437744140625, 0.046661376953125, 0.1150665283203125, 0.1834716796875, 0.2518768310546875, 0.320281982421875, 0.3886871337890625, 0.45709228515625, 0.5254974365234375, 0.593902587890625, 0.6623077392578125, 0.730712890625, 0.7991180419921875, 0.867523193359375, 0.9359283447265625, 1.00433349609375, 1.0727386474609375, 1.141143798828125, 1.2095489501953125, 1.2779541015625, 1.3463592529296875, 1.414764404296875, 1.4831695556640625, 1.55157470703125, 1.6199798583984375, 1.688385009765625, 1.7567901611328125, 1.8251953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 9.0, 31.0, 75.0, 165.0, 483.0, 1339.0, 1154.0, 429.0, 182.0, 77.0, 40.0, 30.0, 18.0, 11.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1341552734375, -4.022216796875, -3.9102783203125, -3.79833984375, -3.6864013671875, -3.574462890625, -3.4625244140625, -3.3505859375, -3.2386474609375, -3.126708984375, -3.0147705078125, -2.90283203125, -2.7908935546875, -2.678955078125, -2.5670166015625, -2.455078125, -2.3431396484375, -2.231201171875, -2.1192626953125, -2.00732421875, -1.8953857421875, -1.783447265625, -1.6715087890625, -1.5595703125, -1.4476318359375, -1.335693359375, -1.2237548828125, -1.11181640625, -0.9998779296875, -0.887939453125, -0.7760009765625, -0.6640625, -0.5521240234375, -0.440185546875, -0.3282470703125, -0.21630859375, -0.1043701171875, 0.007568359375, 0.1195068359375, 0.2314453125, 0.3433837890625, 0.455322265625, 0.5672607421875, 0.67919921875, 0.7911376953125, 0.903076171875, 1.0150146484375, 1.126953125, 1.2388916015625, 1.350830078125, 1.4627685546875, 1.57470703125, 1.6866455078125, 1.798583984375, 1.9105224609375, 2.0224609375, 2.1343994140625, 2.246337890625, 2.3582763671875, 2.47021484375, 2.5821533203125, 2.694091796875, 2.8060302734375, 2.91796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 13.0, 34.0, 104.0, 207.0, 309.0, 192.0, 67.0, 25.0, 14.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.147830963134766, -20.235191345214844, -19.322551727294922, -18.409912109375, -17.497272491455078, -16.584632873535156, -15.671993255615234, -14.759353637695312, -13.84671401977539, -12.934074401855469, -12.021434783935547, -11.108795166015625, -10.196155548095703, -9.283515930175781, -8.37087631225586, -7.458237171173096, -6.545598030090332, -5.63295841217041, -4.720318794250488, -3.8076794147491455, -2.8950397968292236, -1.9824004173278809, -1.069760799407959, -0.1571211814880371, 0.7555184364318848, 1.6681580543518066, 2.5807976722717285, 3.4934370517730713, 4.406076431274414, 5.318716049194336, 6.231355667114258, 7.14399528503418, 8.056634902954102, 8.969274520874023, 9.881914138793945, 10.794553756713867, 11.707193374633789, 12.619832992553711, 13.532472610473633, 14.445112228393555, 15.357751846313477, 16.2703914642334, 17.18303108215332, 18.095670700073242, 19.008310317993164, 19.920949935913086, 20.833589553833008, 21.74622917175293, 22.65886688232422, 23.57150650024414, 24.484146118164062, 25.396785736083984, 26.309425354003906, 27.222064971923828, 28.13470458984375, 29.047344207763672, 29.959983825683594, 30.872623443603516, 31.785263061523438, 32.69790267944336, 33.61054229736328, 34.5231819152832, 35.435821533203125, 36.34846115112305, 37.26110076904297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 27.0, 37.0, 62.0, 81.0, 88.0, 105.0, 114.0, 94.0, 106.0, 75.0, 55.0, 53.0, 42.0, 22.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.85193634033203, -26.208160400390625, -25.564382553100586, -24.920604705810547, -24.27682876586914, -23.633052825927734, -22.989274978637695, -22.345497131347656, -21.70172119140625, -21.057945251464844, -20.414167404174805, -19.770389556884766, -19.12661361694336, -18.482837677001953, -17.839059829711914, -17.195281982421875, -16.55150604248047, -15.907729148864746, -15.263952255249023, -14.6201753616333, -13.976398468017578, -13.332621574401855, -12.688844680786133, -12.04506778717041, -11.401290893554688, -10.757513999938965, -10.113737106323242, -9.46996021270752, -8.826183319091797, -8.182406425476074, -7.538629531860352, -6.894852638244629, -6.251073837280273, -5.607296943664551, -4.963520050048828, -4.3197431564331055, -3.675966262817383, -3.03218936920166, -2.3884124755859375, -1.7446355819702148, -1.1008586883544922, -0.45708179473876953, 0.18669509887695312, 0.8304719924926758, 1.4742488861083984, 2.118025779724121, 2.7618026733398438, 3.4055795669555664, 4.049356460571289, 4.693133354187012, 5.336910247802734, 5.980687141418457, 6.62446403503418, 7.268240928649902, 7.912017822265625, 8.555794715881348, 9.19957160949707, 9.843348503112793, 10.487125396728516, 11.130902290344238, 11.774679183959961, 12.418456077575684, 13.062232971191406, 13.706009864807129, 14.349786758422852]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 13.0, 11.0, 29.0, 24.0, 44.0, 46.0, 68.0, 101.0, 162.0, 277.0, 394.0, 772.0, 1319.0, 2748.0, 5870.0, 14332.0, 39033.0, 116296.0, 370094.0, 335377.0, 102836.0, 34694.0, 12976.0, 5452.0, 2527.0, 1322.0, 699.0, 328.0, 203.0, 143.0, 94.0, 59.0, 56.0, 31.0, 20.0, 17.0, 15.0, 13.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7041015625, -1.6507568359375, -1.597412109375, -1.5440673828125, -1.49072265625, -1.4373779296875, -1.384033203125, -1.3306884765625, -1.27734375, -1.2239990234375, -1.170654296875, -1.1173095703125, -1.06396484375, -1.0106201171875, -0.957275390625, -0.9039306640625, -0.8505859375, -0.7972412109375, -0.743896484375, -0.6905517578125, -0.63720703125, -0.5838623046875, -0.530517578125, -0.4771728515625, -0.423828125, -0.3704833984375, -0.317138671875, -0.2637939453125, -0.21044921875, -0.1571044921875, -0.103759765625, -0.0504150390625, 0.0029296875, 0.0562744140625, 0.109619140625, 0.1629638671875, 0.21630859375, 0.2696533203125, 0.322998046875, 0.3763427734375, 0.4296875, 0.4830322265625, 0.536376953125, 0.5897216796875, 0.64306640625, 0.6964111328125, 0.749755859375, 0.8031005859375, 0.8564453125, 0.9097900390625, 0.963134765625, 1.0164794921875, 1.06982421875, 1.1231689453125, 1.176513671875, 1.2298583984375, 1.283203125, 1.3365478515625, 1.389892578125, 1.4432373046875, 1.49658203125, 1.5499267578125, 1.603271484375, 1.6566162109375, 1.7099609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 4.0, 12.0, 7.0, 5.0, 16.0, 13.0, 22.0, 24.0, 25.0, 34.0, 21.0, 32.0, 38.0, 49.0, 44.0, 45.0, 45.0, 47.0, 38.0, 43.0, 45.0, 53.0, 42.0, 27.0, 43.0, 27.0, 34.0, 30.0, 24.0, 21.0, 15.0, 16.0, 10.0, 13.0, 5.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6650390625, -0.6449203491210938, -0.6248016357421875, -0.6046829223632812, -0.584564208984375, -0.5644454956054688, -0.5443267822265625, -0.5242080688476562, -0.50408935546875, -0.48397064208984375, -0.4638519287109375, -0.44373321533203125, -0.423614501953125, -0.40349578857421875, -0.3833770751953125, -0.36325836181640625, -0.3431396484375, -0.32302093505859375, -0.3029022216796875, -0.28278350830078125, -0.262664794921875, -0.24254608154296875, -0.2224273681640625, -0.20230865478515625, -0.18218994140625, -0.16207122802734375, -0.1419525146484375, -0.12183380126953125, -0.101715087890625, -0.08159637451171875, -0.0614776611328125, -0.04135894775390625, -0.021240234375, -0.00112152099609375, 0.0189971923828125, 0.03911590576171875, 0.059234619140625, 0.07935333251953125, 0.0994720458984375, 0.11959075927734375, 0.13970947265625, 0.15982818603515625, 0.1799468994140625, 0.20006561279296875, 0.220184326171875, 0.24030303955078125, 0.2604217529296875, 0.28054046630859375, 0.3006591796875, 0.32077789306640625, 0.3408966064453125, 0.36101531982421875, 0.381134033203125, 0.40125274658203125, 0.4213714599609375, 0.44149017333984375, 0.46160888671875, 0.48172760009765625, 0.5018463134765625, 0.5219650268554688, 0.542083740234375, 0.5622024536132812, 0.5823211669921875, 0.6024398803710938, 0.62255859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 23.0, 21.0, 63.0, 109.0, 248.0, 523.0, 1531.0, 6490.0, 171642.0, 847223.0, 16910.0, 2284.0, 759.0, 352.0, 151.0, 72.0, 44.0, 34.0, 14.0, 15.0, 6.0, 7.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8812255859375, -5.672607421875, -5.4639892578125, -5.25537109375, -5.0467529296875, -4.838134765625, -4.6295166015625, -4.4208984375, -4.2122802734375, -4.003662109375, -3.7950439453125, -3.58642578125, -3.3778076171875, -3.169189453125, -2.9605712890625, -2.751953125, -2.5433349609375, -2.334716796875, -2.1260986328125, -1.91748046875, -1.7088623046875, -1.500244140625, -1.2916259765625, -1.0830078125, -0.8743896484375, -0.665771484375, -0.4571533203125, -0.24853515625, -0.0399169921875, 0.168701171875, 0.3773193359375, 0.5859375, 0.7945556640625, 1.003173828125, 1.2117919921875, 1.42041015625, 1.6290283203125, 1.837646484375, 2.0462646484375, 2.2548828125, 2.4635009765625, 2.672119140625, 2.8807373046875, 3.08935546875, 3.2979736328125, 3.506591796875, 3.7152099609375, 3.923828125, 4.1324462890625, 4.341064453125, 4.5496826171875, 4.75830078125, 4.9669189453125, 5.175537109375, 5.3841552734375, 5.5927734375, 5.8013916015625, 6.010009765625, 6.2186279296875, 6.42724609375, 6.6358642578125, 6.844482421875, 7.0531005859375, 7.26171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 16.0, 21.0, 20.0, 31.0, 30.0, 31.0, 44.0, 49.0, 59.0, 41.0, 48.0, 53.0, 43.0, 50.0, 42.0, 53.0, 37.0, 39.0, 40.0, 24.0, 31.0, 22.0, 20.0, 9.0, 11.0, 7.0, 16.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.52288818359375, -2.4442138671875, -2.36553955078125, -2.286865234375, -2.20819091796875, -2.1295166015625, -2.05084228515625, -1.97216796875, -1.89349365234375, -1.8148193359375, -1.73614501953125, -1.657470703125, -1.57879638671875, -1.5001220703125, -1.42144775390625, -1.3427734375, -1.26409912109375, -1.1854248046875, -1.10675048828125, -1.028076171875, -0.94940185546875, -0.8707275390625, -0.79205322265625, -0.71337890625, -0.63470458984375, -0.5560302734375, -0.47735595703125, -0.398681640625, -0.32000732421875, -0.2413330078125, -0.16265869140625, -0.083984375, -0.00531005859375, 0.0733642578125, 0.15203857421875, 0.230712890625, 0.30938720703125, 0.3880615234375, 0.46673583984375, 0.54541015625, 0.62408447265625, 0.7027587890625, 0.78143310546875, 0.860107421875, 0.93878173828125, 1.0174560546875, 1.09613037109375, 1.1748046875, 1.25347900390625, 1.3321533203125, 1.41082763671875, 1.489501953125, 1.56817626953125, 1.6468505859375, 1.72552490234375, 1.80419921875, 1.88287353515625, 1.9615478515625, 2.04022216796875, 2.118896484375, 2.19757080078125, 2.2762451171875, 2.35491943359375, 2.43359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 11.0, 9.0, 22.0, 25.0, 37.0, 57.0, 88.0, 158.0, 455.0, 1713.0, 17066.0, 877163.0, 144508.0, 5616.0, 874.0, 281.0, 143.0, 74.0, 50.0, 35.0, 28.0, 22.0, 10.0, 18.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.34375, -2.274383544921875, -2.20501708984375, -2.135650634765625, -2.0662841796875, -1.996917724609375, -1.92755126953125, -1.858184814453125, -1.788818359375, -1.719451904296875, -1.65008544921875, -1.580718994140625, -1.5113525390625, -1.441986083984375, -1.37261962890625, -1.303253173828125, -1.23388671875, -1.164520263671875, -1.09515380859375, -1.025787353515625, -0.9564208984375, -0.887054443359375, -0.81768798828125, -0.748321533203125, -0.678955078125, -0.609588623046875, -0.54022216796875, -0.470855712890625, -0.4014892578125, -0.332122802734375, -0.26275634765625, -0.193389892578125, -0.1240234375, -0.054656982421875, 0.01470947265625, 0.084075927734375, 0.1534423828125, 0.222808837890625, 0.29217529296875, 0.361541748046875, 0.430908203125, 0.500274658203125, 0.56964111328125, 0.639007568359375, 0.7083740234375, 0.777740478515625, 0.84710693359375, 0.916473388671875, 0.98583984375, 1.055206298828125, 1.12457275390625, 1.193939208984375, 1.2633056640625, 1.332672119140625, 1.40203857421875, 1.471405029296875, 1.540771484375, 1.610137939453125, 1.67950439453125, 1.748870849609375, 1.8182373046875, 1.887603759765625, 1.95697021484375, 2.026336669921875, 2.095703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 2.0, 9.0, 5.0, 2.0, 9.0, 7.0, 10.0, 9.0, 19.0, 30.0, 29.0, 34.0, 51.0, 66.0, 89.0, 109.0, 117.0, 109.0, 72.0, 40.0, 29.0, 30.0, 14.0, 20.0, 14.0, 17.0, 15.0, 11.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016951560974121094, -0.00016369298100471497, -0.000157870352268219, -0.00015204772353172302, -0.00014622509479522705, -0.00014040246605873108, -0.0001345798373222351, -0.00012875720858573914, -0.00012293457984924316, -0.00011711195111274719, -0.00011128932237625122, -0.00010546669363975525, -9.964406490325928e-05, -9.38214361667633e-05, -8.799880743026733e-05, -8.217617869377136e-05, -7.635354995727539e-05, -7.053092122077942e-05, -6.470829248428345e-05, -5.8885663747787476e-05, -5.3063035011291504e-05, -4.724040627479553e-05, -4.141777753829956e-05, -3.559514880180359e-05, -2.9772520065307617e-05, -2.3949891328811646e-05, -1.8127262592315674e-05, -1.2304633855819702e-05, -6.4820051193237305e-06, -6.593763828277588e-07, 5.163252353668213e-06, 1.0985881090164185e-05, 1.6808509826660156e-05, 2.2631138563156128e-05, 2.84537672996521e-05, 3.427639603614807e-05, 4.009902477264404e-05, 4.5921653509140015e-05, 5.1744282245635986e-05, 5.756691098213196e-05, 6.338953971862793e-05, 6.92121684551239e-05, 7.503479719161987e-05, 8.085742592811584e-05, 8.668005466461182e-05, 9.250268340110779e-05, 9.832531213760376e-05, 0.00010414794087409973, 0.0001099705696105957, 0.00011579319834709167, 0.00012161582708358765, 0.00012743845582008362, 0.0001332610845565796, 0.00013908371329307556, 0.00014490634202957153, 0.0001507289707660675, 0.00015655159950256348, 0.00016237422823905945, 0.00016819685697555542, 0.0001740194857120514, 0.00017984211444854736, 0.00018566474318504333, 0.0001914873719215393, 0.00019731000065803528, 0.00020313262939453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 11.0, 9.0, 12.0, 15.0, 34.0, 41.0, 52.0, 101.0, 146.0, 217.0, 401.0, 732.0, 1939.0, 6212.0, 33971.0, 589893.0, 376174.0, 29410.0, 5667.0, 1790.0, 741.0, 384.0, 215.0, 99.0, 88.0, 61.0, 45.0, 22.0, 13.0, 20.0, 13.0, 8.0, 2.0, 4.0, 4.0, 2.0, 5.0], "bins": [-1.546875, -1.5108718872070312, -1.4748687744140625, -1.4388656616210938, -1.402862548828125, -1.3668594360351562, -1.3308563232421875, -1.2948532104492188, -1.25885009765625, -1.2228469848632812, -1.1868438720703125, -1.1508407592773438, -1.114837646484375, -1.0788345336914062, -1.0428314208984375, -1.0068283081054688, -0.9708251953125, -0.9348220825195312, -0.8988189697265625, -0.8628158569335938, -0.826812744140625, -0.7908096313476562, -0.7548065185546875, -0.7188034057617188, -0.68280029296875, -0.6467971801757812, -0.6107940673828125, -0.5747909545898438, -0.538787841796875, -0.5027847290039062, -0.4667816162109375, -0.43077850341796875, -0.394775390625, -0.35877227783203125, -0.3227691650390625, -0.28676605224609375, -0.250762939453125, -0.21475982666015625, -0.1787567138671875, -0.14275360107421875, -0.10675048828125, -0.07074737548828125, -0.0347442626953125, 0.00125885009765625, 0.037261962890625, 0.07326507568359375, 0.1092681884765625, 0.14527130126953125, 0.1812744140625, 0.21727752685546875, 0.2532806396484375, 0.28928375244140625, 0.325286865234375, 0.36128997802734375, 0.3972930908203125, 0.43329620361328125, 0.46929931640625, 0.5053024291992188, 0.5413055419921875, 0.5773086547851562, 0.613311767578125, 0.6493148803710938, 0.6853179931640625, 0.7213211059570312, 0.75732421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 13.0, 19.0, 28.0, 30.0, 32.0, 65.0, 108.0, 125.0, 127.0, 127.0, 70.0, 59.0, 43.0, 24.0, 21.0, 16.0, 10.0, 6.0, 16.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.865814208984375, -0.83612060546875, -0.806427001953125, -0.7767333984375, -0.747039794921875, -0.71734619140625, -0.687652587890625, -0.657958984375, -0.628265380859375, -0.59857177734375, -0.568878173828125, -0.5391845703125, -0.509490966796875, -0.47979736328125, -0.450103759765625, -0.42041015625, -0.390716552734375, -0.36102294921875, -0.331329345703125, -0.3016357421875, -0.271942138671875, -0.24224853515625, -0.212554931640625, -0.182861328125, -0.153167724609375, -0.12347412109375, -0.093780517578125, -0.0640869140625, -0.034393310546875, -0.00469970703125, 0.024993896484375, 0.0546875, 0.084381103515625, 0.11407470703125, 0.143768310546875, 0.1734619140625, 0.203155517578125, 0.23284912109375, 0.262542724609375, 0.292236328125, 0.321929931640625, 0.35162353515625, 0.381317138671875, 0.4110107421875, 0.440704345703125, 0.47039794921875, 0.500091552734375, 0.52978515625, 0.559478759765625, 0.58917236328125, 0.618865966796875, 0.6485595703125, 0.678253173828125, 0.70794677734375, 0.737640380859375, 0.767333984375, 0.797027587890625, 0.82672119140625, 0.856414794921875, 0.8861083984375, 0.915802001953125, 0.94549560546875, 0.975189208984375, 1.0048828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 24.0, 37.0, 140.0, 422.0, 234.0, 88.0, 28.0, 12.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.05577850341797, -51.840389251708984, -50.624996185302734, -49.40960693359375, -48.194217681884766, -46.97882843017578, -45.76343536376953, -44.54804611206055, -43.33265686035156, -42.11726760864258, -40.90187454223633, -39.686485290527344, -38.47109603881836, -37.255706787109375, -36.040313720703125, -34.82492446899414, -33.60953140258789, -32.394142150878906, -31.17875099182129, -29.963359832763672, -28.747970581054688, -27.53257942199707, -26.317188262939453, -25.10179901123047, -23.88640785217285, -22.671016693115234, -21.45562744140625, -20.240236282348633, -19.024845123291016, -17.80945587158203, -16.594064712524414, -15.378674507141113, -14.163284301757812, -12.947894096374512, -11.732503890991211, -10.517112731933594, -9.301722526550293, -8.086332321166992, -6.870941638946533, -5.655550956726074, -4.440160751342773, -3.2247703075408936, -2.0093798637390137, -0.7939894199371338, 0.4214010238647461, 1.6367912292480469, 2.852181911468506, 4.067572593688965, 5.282962799072266, 6.498353004455566, 7.713743686676025, 8.929134368896484, 10.144524574279785, 11.359914779663086, 12.575305938720703, 13.790696144104004, 15.006086349487305, 16.221477508544922, 17.436866760253906, 18.652257919311523, 19.86764907836914, 21.083038330078125, 22.298429489135742, 23.51382064819336, 24.729209899902344]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 23.0, 13.0, 15.0, 18.0, 28.0, 26.0, 31.0, 35.0, 37.0, 36.0, 44.0, 62.0, 81.0, 80.0, 56.0, 43.0, 49.0, 43.0, 26.0, 46.0, 25.0, 21.0, 14.0, 26.0, 14.0, 19.0, 8.0, 10.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.179211616516113, -9.824738502502441, -9.470264434814453, -9.115791320800781, -8.76131820678711, -8.406845092773438, -8.052371978759766, -7.697897911071777, -7.3434247970581055, -6.988951683044434, -6.6344780921936035, -6.280004501342773, -5.925531387329102, -5.57105827331543, -5.2165846824646, -4.8621110916137695, -4.507637977600098, -4.153164863586426, -3.7986912727355957, -3.4442179203033447, -3.0897445678710938, -2.7352712154388428, -2.380797863006592, -2.026324510574341, -1.6718511581420898, -1.3173778057098389, -0.9629044532775879, -0.6084311008453369, -0.25395774841308594, 0.10051560401916504, 0.454988956451416, 0.809462308883667, 1.1639366149902344, 1.5184099674224854, 1.8728833198547363, 2.2273566722869873, 2.5818300247192383, 2.9363033771514893, 3.2907767295837402, 3.645250082015991, 3.999723434448242, 4.354196548461914, 4.708670139312744, 5.063143730163574, 5.417616844177246, 5.772089958190918, 6.126563549041748, 6.481037139892578, 6.83551025390625, 7.189983367919922, 7.544456958770752, 7.898930549621582, 8.253403663635254, 8.607876777648926, 8.962350845336914, 9.316823959350586, 9.671297073364258, 10.02577018737793, 10.380243301391602, 10.73471736907959, 11.089190483093262, 11.443663597106934, 11.798137664794922, 12.152610778808594, 12.507083892822266]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 9.0, 5.0, 19.0, 27.0, 39.0, 84.0, 145.0, 294.0, 683.0, 1966.0, 7566.0, 53210.0, 2759006.0, 1327172.0, 35197.0, 6028.0, 1722.0, 587.0, 229.0, 117.0, 60.0, 43.0, 24.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.056640625, -2.98370361328125, -2.9107666015625, -2.83782958984375, -2.764892578125, -2.69195556640625, -2.6190185546875, -2.54608154296875, -2.47314453125, -2.40020751953125, -2.3272705078125, -2.25433349609375, -2.181396484375, -2.10845947265625, -2.0355224609375, -1.96258544921875, -1.8896484375, -1.81671142578125, -1.7437744140625, -1.67083740234375, -1.597900390625, -1.52496337890625, -1.4520263671875, -1.37908935546875, -1.30615234375, -1.23321533203125, -1.1602783203125, -1.08734130859375, -1.014404296875, -0.94146728515625, -0.8685302734375, -0.79559326171875, -0.72265625, -0.64971923828125, -0.5767822265625, -0.50384521484375, -0.430908203125, -0.35797119140625, -0.2850341796875, -0.21209716796875, -0.13916015625, -0.06622314453125, 0.0067138671875, 0.07965087890625, 0.152587890625, 0.22552490234375, 0.2984619140625, 0.37139892578125, 0.4443359375, 0.51727294921875, 0.5902099609375, 0.66314697265625, 0.736083984375, 0.80902099609375, 0.8819580078125, 0.95489501953125, 1.02783203125, 1.10076904296875, 1.1737060546875, 1.24664306640625, 1.319580078125, 1.39251708984375, 1.4654541015625, 1.53839111328125, 1.611328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 13.0, 18.0, 20.0, 21.0, 26.0, 35.0, 51.0, 52.0, 62.0, 65.0, 65.0, 72.0, 62.0, 76.0, 70.0, 63.0, 50.0, 40.0, 39.0, 30.0, 19.0, 15.0, 17.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8834609985351562, -0.8538360595703125, -0.8242111206054688, -0.794586181640625, -0.7649612426757812, -0.7353363037109375, -0.7057113647460938, -0.67608642578125, -0.6464614868164062, -0.6168365478515625, -0.5872116088867188, -0.557586669921875, -0.5279617309570312, -0.4983367919921875, -0.46871185302734375, -0.4390869140625, -0.40946197509765625, -0.3798370361328125, -0.35021209716796875, -0.320587158203125, -0.29096221923828125, -0.2613372802734375, -0.23171234130859375, -0.20208740234375, -0.17246246337890625, -0.1428375244140625, -0.11321258544921875, -0.083587646484375, -0.05396270751953125, -0.0243377685546875, 0.00528717041015625, 0.034912109375, 0.06453704833984375, 0.0941619873046875, 0.12378692626953125, 0.153411865234375, 0.18303680419921875, 0.2126617431640625, 0.24228668212890625, 0.27191162109375, 0.30153656005859375, 0.3311614990234375, 0.36078643798828125, 0.390411376953125, 0.42003631591796875, 0.4496612548828125, 0.47928619384765625, 0.5089111328125, 0.5385360717773438, 0.5681610107421875, 0.5977859497070312, 0.627410888671875, 0.6570358276367188, 0.6866607666015625, 0.7162857055664062, 0.74591064453125, 0.7755355834960938, 0.8051605224609375, 0.8347854614257812, 0.864410400390625, 0.8940353393554688, 0.9236602783203125, 0.9532852172851562, 0.98291015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 31.0, 50.0, 72.0, 123.0, 187.0, 394.0, 944.0, 2475.0, 10631.0, 128377.0, 3910957.0, 125088.0, 10239.0, 2599.0, 1032.0, 498.0, 248.0, 120.0, 76.0, 34.0, 28.0, 15.0, 12.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.09698486328125, -2.9986572265625, -2.90032958984375, -2.802001953125, -2.70367431640625, -2.6053466796875, -2.50701904296875, -2.40869140625, -2.31036376953125, -2.2120361328125, -2.11370849609375, -2.015380859375, -1.91705322265625, -1.8187255859375, -1.72039794921875, -1.6220703125, -1.52374267578125, -1.4254150390625, -1.32708740234375, -1.228759765625, -1.13043212890625, -1.0321044921875, -0.93377685546875, -0.83544921875, -0.73712158203125, -0.6387939453125, -0.54046630859375, -0.442138671875, -0.34381103515625, -0.2454833984375, -0.14715576171875, -0.048828125, 0.04949951171875, 0.1478271484375, 0.24615478515625, 0.344482421875, 0.44281005859375, 0.5411376953125, 0.63946533203125, 0.73779296875, 0.83612060546875, 0.9344482421875, 1.03277587890625, 1.131103515625, 1.22943115234375, 1.3277587890625, 1.42608642578125, 1.5244140625, 1.62274169921875, 1.7210693359375, 1.81939697265625, 1.917724609375, 2.01605224609375, 2.1143798828125, 2.21270751953125, 2.31103515625, 2.40936279296875, 2.5076904296875, 2.60601806640625, 2.704345703125, 2.80267333984375, 2.9010009765625, 2.99932861328125, 3.09765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 3.0, 17.0, 26.0, 40.0, 132.0, 447.0, 1507.0, 1384.0, 315.0, 110.0, 42.0, 27.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.033721923828125, -3.90728759765625, -3.780853271484375, -3.6544189453125, -3.527984619140625, -3.40155029296875, -3.275115966796875, -3.148681640625, -3.022247314453125, -2.89581298828125, -2.769378662109375, -2.6429443359375, -2.516510009765625, -2.39007568359375, -2.263641357421875, -2.13720703125, -2.010772705078125, -1.88433837890625, -1.757904052734375, -1.6314697265625, -1.505035400390625, -1.37860107421875, -1.252166748046875, -1.125732421875, -0.999298095703125, -0.87286376953125, -0.746429443359375, -0.6199951171875, -0.493560791015625, -0.36712646484375, -0.240692138671875, -0.1142578125, 0.012176513671875, 0.13861083984375, 0.265045166015625, 0.3914794921875, 0.517913818359375, 0.64434814453125, 0.770782470703125, 0.897216796875, 1.023651123046875, 1.15008544921875, 1.276519775390625, 1.4029541015625, 1.529388427734375, 1.65582275390625, 1.782257080078125, 1.90869140625, 2.035125732421875, 2.16156005859375, 2.287994384765625, 2.4144287109375, 2.540863037109375, 2.66729736328125, 2.793731689453125, 2.920166015625, 3.046600341796875, 3.17303466796875, 3.299468994140625, 3.4259033203125, 3.552337646484375, 3.67877197265625, 3.805206298828125, 3.931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 10.0, 10.0, 20.0, 59.0, 162.0, 261.0, 221.0, 148.0, 54.0, 25.0, 5.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.847034454345703, -21.13936996459961, -20.431703567504883, -19.72403907775879, -19.016374588012695, -18.30870819091797, -17.601043701171875, -16.89337921142578, -16.185712814331055, -15.478047370910645, -14.77038288116455, -14.06271743774414, -13.35505199432373, -12.64738655090332, -11.939722061157227, -11.232056617736816, -10.524392127990723, -9.816726684570312, -9.109062194824219, -8.401396751403809, -7.693731307983398, -6.9860663414001465, -6.2784013748168945, -5.570735931396484, -4.863070964813232, -4.1554059982299805, -3.4477405548095703, -2.7400755882263184, -2.0324103832244873, -1.3247451782226562, -0.6170802116394043, 0.09058523178100586, 0.7982501983642578, 1.5059154033660889, 2.21358060836792, 2.921245574951172, 3.628910779953003, 4.336575984954834, 5.044240951538086, 5.751906394958496, 6.459571361541748, 7.167236328125, 7.87490177154541, 8.58256721496582, 9.290231704711914, 9.997897148132324, 10.705562591552734, 11.413227081298828, 12.120892524719238, 12.828557968139648, 13.536222457885742, 14.243887901306152, 14.951553344726562, 15.659217834472656, 16.36688232421875, 17.074548721313477, 17.78221321105957, 18.489877700805664, 19.19754409790039, 19.905208587646484, 20.612873077392578, 21.320539474487305, 22.0282039642334, 22.735870361328125, 23.44353485107422]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 10.0, 25.0, 57.0, 99.0, 156.0, 211.0, 195.0, 121.0, 83.0, 27.0, 11.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.64105796813965, -24.809375762939453, -23.977691650390625, -23.146007537841797, -22.3143253326416, -21.482643127441406, -20.650959014892578, -19.81927490234375, -18.987592697143555, -18.15591049194336, -17.32422637939453, -16.492542266845703, -15.660860061645508, -14.829176902770996, -13.997493743896484, -13.165810585021973, -12.334127426147461, -11.50244426727295, -10.670761108398438, -9.839077949523926, -9.007394790649414, -8.175711631774902, -7.344028472900391, -6.512345314025879, -5.680662155151367, -4.8489789962768555, -4.017295837402344, -3.185612678527832, -2.3539295196533203, -1.5222463607788086, -0.6905632019042969, 0.14111995697021484, 0.9728012084960938, 1.8044843673706055, 2.636167526245117, 3.467850685119629, 4.299533843994141, 5.131217002868652, 5.962900161743164, 6.794583320617676, 7.6262664794921875, 8.4579496383667, 9.289632797241211, 10.121315956115723, 10.952999114990234, 11.784682273864746, 12.616365432739258, 13.44804859161377, 14.279731750488281, 15.111414909362793, 15.943098068237305, 16.7747802734375, 17.606464385986328, 18.438148498535156, 19.26983070373535, 20.101512908935547, 20.933197021484375, 21.764881134033203, 22.5965633392334, 23.428245544433594, 24.259929656982422, 25.09161376953125, 25.923295974731445, 26.75497817993164, 27.58666229248047]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 16.0, 23.0, 57.0, 90.0, 151.0, 249.0, 504.0, 1005.0, 2275.0, 6082.0, 20531.0, 95198.0, 439937.0, 379991.0, 75918.0, 17344.0, 5256.0, 2009.0, 866.0, 424.0, 218.0, 125.0, 84.0, 43.0, 30.0, 20.0, 24.0, 14.0, 12.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7566680908203125, -1.695953369140625, -1.6352386474609375, -1.57452392578125, -1.5138092041015625, -1.453094482421875, -1.3923797607421875, -1.3316650390625, -1.2709503173828125, -1.210235595703125, -1.1495208740234375, -1.08880615234375, -1.0280914306640625, -0.967376708984375, -0.9066619873046875, -0.845947265625, -0.7852325439453125, -0.724517822265625, -0.6638031005859375, -0.60308837890625, -0.5423736572265625, -0.481658935546875, -0.4209442138671875, -0.3602294921875, -0.2995147705078125, -0.238800048828125, -0.1780853271484375, -0.11737060546875, -0.0566558837890625, 0.004058837890625, 0.0647735595703125, 0.12548828125, 0.1862030029296875, 0.246917724609375, 0.3076324462890625, 0.36834716796875, 0.4290618896484375, 0.489776611328125, 0.5504913330078125, 0.6112060546875, 0.6719207763671875, 0.732635498046875, 0.7933502197265625, 0.85406494140625, 0.9147796630859375, 0.975494384765625, 1.0362091064453125, 1.096923828125, 1.1576385498046875, 1.218353271484375, 1.2790679931640625, 1.33978271484375, 1.4004974365234375, 1.461212158203125, 1.5219268798828125, 1.5826416015625, 1.6433563232421875, 1.704071044921875, 1.7647857666015625, 1.82550048828125, 1.8862152099609375, 1.946929931640625, 2.0076446533203125, 2.068359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 9.0, 11.0, 15.0, 19.0, 28.0, 32.0, 52.0, 40.0, 66.0, 83.0, 62.0, 71.0, 66.0, 68.0, 73.0, 61.0, 47.0, 46.0, 35.0, 37.0, 25.0, 14.0, 10.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8736343383789062, -0.8424835205078125, -0.8113327026367188, -0.780181884765625, -0.7490310668945312, -0.7178802490234375, -0.6867294311523438, -0.65557861328125, -0.6244277954101562, -0.5932769775390625, -0.5621261596679688, -0.530975341796875, -0.49982452392578125, -0.4686737060546875, -0.43752288818359375, -0.4063720703125, -0.37522125244140625, -0.3440704345703125, -0.31291961669921875, -0.281768798828125, -0.25061798095703125, -0.2194671630859375, -0.18831634521484375, -0.15716552734375, -0.12601470947265625, -0.0948638916015625, -0.06371307373046875, -0.032562255859375, -0.00141143798828125, 0.0297393798828125, 0.06089019775390625, 0.092041015625, 0.12319183349609375, 0.1543426513671875, 0.18549346923828125, 0.216644287109375, 0.24779510498046875, 0.2789459228515625, 0.31009674072265625, 0.34124755859375, 0.37239837646484375, 0.4035491943359375, 0.43470001220703125, 0.465850830078125, 0.49700164794921875, 0.5281524658203125, 0.5593032836914062, 0.5904541015625, 0.6216049194335938, 0.6527557373046875, 0.6839065551757812, 0.715057373046875, 0.7462081909179688, 0.7773590087890625, 0.8085098266601562, 0.83966064453125, 0.8708114624023438, 0.9019622802734375, 0.9331130981445312, 0.964263916015625, 0.9954147338867188, 1.0265655517578125, 1.0577163696289062, 1.0888671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 11.0, 21.0, 35.0, 56.0, 77.0, 158.0, 250.0, 525.0, 1400.0, 4369.0, 18172.0, 115158.0, 696503.0, 177232.0, 25714.0, 5752.0, 1759.0, 646.0, 321.0, 158.0, 72.0, 55.0, 30.0, 24.0, 15.0, 11.0, 8.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.3481597900390625, -2.280303955078125, -2.2124481201171875, -2.14459228515625, -2.0767364501953125, -2.008880615234375, -1.9410247802734375, -1.8731689453125, -1.8053131103515625, -1.737457275390625, -1.6696014404296875, -1.60174560546875, -1.5338897705078125, -1.466033935546875, -1.3981781005859375, -1.330322265625, -1.2624664306640625, -1.194610595703125, -1.1267547607421875, -1.05889892578125, -0.9910430908203125, -0.923187255859375, -0.8553314208984375, -0.7874755859375, -0.7196197509765625, -0.651763916015625, -0.5839080810546875, -0.51605224609375, -0.4481964111328125, -0.380340576171875, -0.3124847412109375, -0.24462890625, -0.1767730712890625, -0.108917236328125, -0.0410614013671875, 0.02679443359375, 0.0946502685546875, 0.162506103515625, 0.2303619384765625, 0.2982177734375, 0.3660736083984375, 0.433929443359375, 0.5017852783203125, 0.56964111328125, 0.6374969482421875, 0.705352783203125, 0.7732086181640625, 0.841064453125, 0.9089202880859375, 0.976776123046875, 1.0446319580078125, 1.11248779296875, 1.1803436279296875, 1.248199462890625, 1.3160552978515625, 1.3839111328125, 1.4517669677734375, 1.519622802734375, 1.5874786376953125, 1.65533447265625, 1.7231903076171875, 1.791046142578125, 1.8589019775390625, 1.9267578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 4.0, 4.0, 5.0, 15.0, 11.0, 16.0, 13.0, 24.0, 20.0, 21.0, 38.0, 26.0, 39.0, 38.0, 40.0, 45.0, 54.0, 46.0, 31.0, 59.0, 46.0, 40.0, 31.0, 34.0, 34.0, 41.0, 27.0, 34.0, 25.0, 18.0, 27.0, 18.0, 12.0, 12.0, 10.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7483673095703125, -1.683258056640625, -1.6181488037109375, -1.55303955078125, -1.4879302978515625, -1.422821044921875, -1.3577117919921875, -1.2926025390625, -1.2274932861328125, -1.162384033203125, -1.0972747802734375, -1.03216552734375, -0.9670562744140625, -0.901947021484375, -0.8368377685546875, -0.771728515625, -0.7066192626953125, -0.641510009765625, -0.5764007568359375, -0.51129150390625, -0.4461822509765625, -0.381072998046875, -0.3159637451171875, -0.2508544921875, -0.1857452392578125, -0.120635986328125, -0.0555267333984375, 0.00958251953125, 0.0746917724609375, 0.139801025390625, 0.2049102783203125, 0.27001953125, 0.3351287841796875, 0.400238037109375, 0.4653472900390625, 0.53045654296875, 0.5955657958984375, 0.660675048828125, 0.7257843017578125, 0.7908935546875, 0.8560028076171875, 0.921112060546875, 0.9862213134765625, 1.05133056640625, 1.1164398193359375, 1.181549072265625, 1.2466583251953125, 1.311767578125, 1.3768768310546875, 1.441986083984375, 1.5070953369140625, 1.57220458984375, 1.6373138427734375, 1.702423095703125, 1.7675323486328125, 1.8326416015625, 1.8977508544921875, 1.962860107421875, 2.0279693603515625, 2.09307861328125, 2.1581878662109375, 2.223297119140625, 2.2884063720703125, 2.353515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 14.0, 26.0, 41.0, 81.0, 172.0, 412.0, 1257.0, 4931.0, 25772.0, 209615.0, 722728.0, 68804.0, 10936.0, 2438.0, 765.0, 289.0, 127.0, 51.0, 32.0, 19.0, 17.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0227737426757812, -0.9967193603515625, -0.9706649780273438, -0.944610595703125, -0.9185562133789062, -0.8925018310546875, -0.8664474487304688, -0.84039306640625, -0.8143386840820312, -0.7882843017578125, -0.7622299194335938, -0.736175537109375, -0.7101211547851562, -0.6840667724609375, -0.6580123901367188, -0.6319580078125, -0.6059036254882812, -0.5798492431640625, -0.5537948608398438, -0.527740478515625, -0.5016860961914062, -0.4756317138671875, -0.44957733154296875, -0.42352294921875, -0.39746856689453125, -0.3714141845703125, -0.34535980224609375, -0.319305419921875, -0.29325103759765625, -0.2671966552734375, -0.24114227294921875, -0.215087890625, -0.18903350830078125, -0.1629791259765625, -0.13692474365234375, -0.110870361328125, -0.08481597900390625, -0.0587615966796875, -0.03270721435546875, -0.00665283203125, 0.01940155029296875, 0.0454559326171875, 0.07151031494140625, 0.097564697265625, 0.12361907958984375, 0.1496734619140625, 0.17572784423828125, 0.2017822265625, 0.22783660888671875, 0.2538909912109375, 0.27994537353515625, 0.305999755859375, 0.33205413818359375, 0.3581085205078125, 0.38416290283203125, 0.41021728515625, 0.43627166748046875, 0.4623260498046875, 0.48838043212890625, 0.514434814453125, 0.5404891967773438, 0.5665435791015625, 0.5925979614257812, 0.61865234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 4.0, 11.0, 14.0, 21.0, 22.0, 28.0, 32.0, 44.0, 53.0, 73.0, 82.0, 101.0, 101.0, 67.0, 70.0, 67.0, 44.0, 33.0, 24.0, 21.0, 11.0, 5.0, 15.0, 3.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011515617370605469, -0.00011120177805423737, -0.00010724738240242004, -0.00010329298675060272, -9.93385910987854e-05, -9.538419544696808e-05, -9.142979979515076e-05, -8.747540414333344e-05, -8.352100849151611e-05, -7.956661283969879e-05, -7.561221718788147e-05, -7.165782153606415e-05, -6.770342588424683e-05, -6.37490302324295e-05, -5.979463458061218e-05, -5.584023892879486e-05, -5.188584327697754e-05, -4.793144762516022e-05, -4.3977051973342896e-05, -4.0022656321525574e-05, -3.606826066970825e-05, -3.211386501789093e-05, -2.815946936607361e-05, -2.4205073714256287e-05, -2.0250678062438965e-05, -1.6296282410621643e-05, -1.2341886758804321e-05, -8.387491106987e-06, -4.433095455169678e-06, -4.78699803352356e-07, 3.475695848464966e-06, 7.430091500282288e-06, 1.138448715209961e-05, 1.533888280391693e-05, 1.9293278455734253e-05, 2.3247674107551575e-05, 2.7202069759368896e-05, 3.115646541118622e-05, 3.511086106300354e-05, 3.906525671482086e-05, 4.3019652366638184e-05, 4.6974048018455505e-05, 5.092844367027283e-05, 5.488283932209015e-05, 5.883723497390747e-05, 6.279163062572479e-05, 6.674602627754211e-05, 7.070042192935944e-05, 7.465481758117676e-05, 7.860921323299408e-05, 8.25636088848114e-05, 8.651800453662872e-05, 9.047240018844604e-05, 9.442679584026337e-05, 9.838119149208069e-05, 0.00010233558714389801, 0.00010628998279571533, 0.00011024437844753265, 0.00011419877409934998, 0.0001181531697511673, 0.00012210756540298462, 0.00012606196105480194, 0.00013001635670661926, 0.00013397075235843658, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 16.0, 24.0, 38.0, 61.0, 90.0, 133.0, 239.0, 402.0, 733.0, 1448.0, 3095.0, 7525.0, 21106.0, 71115.0, 273733.0, 525002.0, 98457.0, 28197.0, 9531.0, 3818.0, 1710.0, 838.0, 461.0, 247.0, 185.0, 100.0, 49.0, 40.0, 26.0, 27.0, 19.0, 8.0, 14.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.47021484375, -0.4546051025390625, -0.438995361328125, -0.4233856201171875, -0.40777587890625, -0.3921661376953125, -0.376556396484375, -0.3609466552734375, -0.3453369140625, -0.3297271728515625, -0.314117431640625, -0.2985076904296875, -0.28289794921875, -0.2672882080078125, -0.251678466796875, -0.2360687255859375, -0.220458984375, -0.2048492431640625, -0.189239501953125, -0.1736297607421875, -0.15802001953125, -0.1424102783203125, -0.126800537109375, -0.1111907958984375, -0.0955810546875, -0.0799713134765625, -0.064361572265625, -0.0487518310546875, -0.03314208984375, -0.0175323486328125, -0.001922607421875, 0.0136871337890625, 0.029296875, 0.0449066162109375, 0.060516357421875, 0.0761260986328125, 0.09173583984375, 0.1073455810546875, 0.122955322265625, 0.1385650634765625, 0.1541748046875, 0.1697845458984375, 0.185394287109375, 0.2010040283203125, 0.21661376953125, 0.2322235107421875, 0.247833251953125, 0.2634429931640625, 0.279052734375, 0.2946624755859375, 0.310272216796875, 0.3258819580078125, 0.34149169921875, 0.3571014404296875, 0.372711181640625, 0.3883209228515625, 0.4039306640625, 0.4195404052734375, 0.435150146484375, 0.4507598876953125, 0.46636962890625, 0.4819793701171875, 0.497589111328125, 0.5131988525390625, 0.52880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 8.0, 1.0, 6.0, 9.0, 16.0, 9.0, 20.0, 16.0, 21.0, 26.0, 42.0, 43.0, 45.0, 67.0, 66.0, 80.0, 75.0, 84.0, 57.0, 55.0, 44.0, 48.0, 29.0, 31.0, 27.0, 14.0, 10.0, 13.0, 9.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4137077331542969, -0.39894866943359375, -0.3841896057128906, -0.3694305419921875, -0.3546714782714844, -0.33991241455078125, -0.3251533508300781, -0.310394287109375, -0.2956352233886719, -0.28087615966796875, -0.2661170959472656, -0.2513580322265625, -0.23659896850585938, -0.22183990478515625, -0.20708084106445312, -0.19232177734375, -0.17756271362304688, -0.16280364990234375, -0.14804458618164062, -0.1332855224609375, -0.11852645874023438, -0.10376739501953125, -0.08900833129882812, -0.074249267578125, -0.059490203857421875, -0.04473114013671875, -0.029972076416015625, -0.0152130126953125, -0.000453948974609375, 0.01430511474609375, 0.029064178466796875, 0.0438232421875, 0.058582305908203125, 0.07334136962890625, 0.08810043334960938, 0.1028594970703125, 0.11761856079101562, 0.13237762451171875, 0.14713668823242188, 0.161895751953125, 0.17665481567382812, 0.19141387939453125, 0.20617294311523438, 0.2209320068359375, 0.23569107055664062, 0.25045013427734375, 0.2652091979980469, 0.27996826171875, 0.2947273254394531, 0.30948638916015625, 0.3242454528808594, 0.3390045166015625, 0.3537635803222656, 0.36852264404296875, 0.3832817077636719, 0.398040771484375, 0.4127998352050781, 0.42755889892578125, 0.4423179626464844, 0.4570770263671875, 0.4718360900878906, 0.48659515380859375, 0.5013542175292969, 0.51611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 15.0, 43.0, 90.0, 159.0, 347.0, 179.0, 89.0, 31.0, 20.0, 5.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.13393783569336, -22.502058029174805, -21.870176315307617, -21.238296508789062, -20.606414794921875, -19.97453498840332, -19.342655181884766, -18.710773468017578, -18.078893661499023, -17.44701385498047, -16.81513214111328, -16.183252334594727, -15.551371574401855, -14.919490814208984, -14.287610054016113, -13.655729293823242, -13.023848533630371, -12.3919677734375, -11.760087013244629, -11.128206253051758, -10.496326446533203, -9.864445686340332, -9.232564926147461, -8.600685119628906, -7.968803882598877, -7.336923122406006, -6.705042839050293, -6.073162078857422, -5.441281318664551, -4.809401035308838, -4.177520275115967, -3.545639991760254, -2.913759231567383, -2.281878709793091, -1.6499980688095093, -1.0181174278259277, -0.38623690605163574, 0.24564361572265625, 0.8775243759155273, 1.5094046592712402, 2.1412854194641113, 2.7731659412384033, 3.4050464630126953, 4.036927223205566, 4.6688079833984375, 5.30068826675415, 5.9325690269470215, 6.564449310302734, 7.1963300704956055, 7.828210830688477, 8.460091590881348, 9.091972351074219, 9.723852157592773, 10.355732917785645, 10.987613677978516, 11.61949348449707, 12.251375198364258, 12.883255958557129, 13.51513671875, 14.147016525268555, 14.778897285461426, 15.410778045654297, 16.042659759521484, 16.67453956604004, 17.306419372558594]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 19.0, 16.0, 14.0, 24.0, 26.0, 44.0, 39.0, 42.0, 48.0, 61.0, 95.0, 99.0, 82.0, 42.0, 43.0, 33.0, 40.0, 30.0, 38.0, 22.0, 20.0, 20.0, 6.0, 10.0, 9.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.887272834777832, -7.574706554412842, -7.262140274047852, -6.949573993682861, -6.637007713317871, -6.324440956115723, -6.011874675750732, -5.699308395385742, -5.386742115020752, -5.074175834655762, -4.7616095542907715, -4.449043273925781, -4.136476516723633, -3.8239104747772217, -3.5113439559936523, -3.198777675628662, -2.886211395263672, -2.5736451148986816, -2.2610788345336914, -1.948512315750122, -1.6359460353851318, -1.3233797550201416, -1.0108133554458618, -0.698246955871582, -0.3856806755065918, -0.07311433553695679, 0.23945200443267822, 0.5520183444023132, 0.8645846843719482, 1.1771509647369385, 1.4897173643112183, 1.802283763885498, 2.114849090576172, 2.427415370941162, 2.7399816513061523, 3.0525481700897217, 3.365114450454712, 3.677680730819702, 3.9902472496032715, 4.302813529968262, 4.615379810333252, 4.927946090698242, 5.240512371063232, 5.553078651428223, 5.865645408630371, 6.178211212158203, 6.490777969360352, 6.803344249725342, 7.115910530090332, 7.428476810455322, 7.7410430908203125, 8.053609848022461, 8.366175651550293, 8.678742408752441, 8.991308212280273, 9.303874969482422, 9.61644172668457, 9.929008483886719, 10.24157428741455, 10.5541410446167, 10.866706848144531, 11.17927360534668, 11.491839408874512, 11.80440616607666, 12.116971969604492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 14.0, 13.0, 16.0, 15.0, 29.0, 47.0, 68.0, 93.0, 167.0, 282.0, 524.0, 1003.0, 2080.0, 4828.0, 12791.0, 49607.0, 419744.0, 2971520.0, 640138.0, 65310.0, 15569.0, 5594.0, 2427.0, 1076.0, 537.0, 307.0, 169.0, 77.0, 70.0, 48.0, 39.0, 17.0, 18.0, 12.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.451171875, -1.4145050048828125, -1.377838134765625, -1.3411712646484375, -1.30450439453125, -1.2678375244140625, -1.231170654296875, -1.1945037841796875, -1.1578369140625, -1.1211700439453125, -1.084503173828125, -1.0478363037109375, -1.01116943359375, -0.9745025634765625, -0.937835693359375, -0.9011688232421875, -0.864501953125, -0.8278350830078125, -0.791168212890625, -0.7545013427734375, -0.71783447265625, -0.6811676025390625, -0.644500732421875, -0.6078338623046875, -0.5711669921875, -0.5345001220703125, -0.497833251953125, -0.4611663818359375, -0.42449951171875, -0.3878326416015625, -0.351165771484375, -0.3144989013671875, -0.27783203125, -0.2411651611328125, -0.204498291015625, -0.1678314208984375, -0.13116455078125, -0.0944976806640625, -0.057830810546875, -0.0211639404296875, 0.0155029296875, 0.0521697998046875, 0.088836669921875, 0.1255035400390625, 0.16217041015625, 0.1988372802734375, 0.235504150390625, 0.2721710205078125, 0.308837890625, 0.3455047607421875, 0.382171630859375, 0.4188385009765625, 0.45550537109375, 0.4921722412109375, 0.528839111328125, 0.5655059814453125, 0.6021728515625, 0.6388397216796875, 0.675506591796875, 0.7121734619140625, 0.74884033203125, 0.7855072021484375, 0.822174072265625, 0.8588409423828125, 0.8955078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 12.0, 15.0, 9.0, 26.0, 37.0, 46.0, 38.0, 42.0, 54.0, 56.0, 70.0, 78.0, 84.0, 69.0, 55.0, 61.0, 43.0, 50.0, 37.0, 25.0, 32.0, 15.0, 10.0, 6.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66552734375, -0.6387405395507812, -0.6119537353515625, -0.5851669311523438, -0.558380126953125, -0.5315933227539062, -0.5048065185546875, -0.47801971435546875, -0.45123291015625, -0.42444610595703125, -0.3976593017578125, -0.37087249755859375, -0.344085693359375, -0.31729888916015625, -0.2905120849609375, -0.26372528076171875, -0.2369384765625, -0.21015167236328125, -0.1833648681640625, -0.15657806396484375, -0.129791259765625, -0.10300445556640625, -0.0762176513671875, -0.04943084716796875, -0.02264404296875, 0.00414276123046875, 0.0309295654296875, 0.05771636962890625, 0.084503173828125, 0.11128997802734375, 0.1380767822265625, 0.16486358642578125, 0.191650390625, 0.21843719482421875, 0.2452239990234375, 0.27201080322265625, 0.298797607421875, 0.32558441162109375, 0.3523712158203125, 0.37915802001953125, 0.40594482421875, 0.43273162841796875, 0.4595184326171875, 0.48630523681640625, 0.513092041015625, 0.5398788452148438, 0.5666656494140625, 0.5934524536132812, 0.6202392578125, 0.6470260620117188, 0.6738128662109375, 0.7005996704101562, 0.727386474609375, 0.7541732788085938, 0.7809600830078125, 0.8077468872070312, 0.83453369140625, 0.8613204956054688, 0.8881072998046875, 0.9148941040039062, 0.941680908203125, 0.9684677124023438, 0.9952545166015625, 1.0220413208007812, 1.048828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 26.0, 32.0, 58.0, 87.0, 152.0, 276.0, 639.0, 1455.0, 4727.0, 18066.0, 126112.0, 2971672.0, 997993.0, 56643.0, 10937.0, 3187.0, 1156.0, 455.0, 212.0, 134.0, 82.0, 35.0, 34.0, 11.0, 15.0, 11.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.34722900390625, -1.2969970703125, -1.24676513671875, -1.196533203125, -1.14630126953125, -1.0960693359375, -1.04583740234375, -0.99560546875, -0.94537353515625, -0.8951416015625, -0.84490966796875, -0.794677734375, -0.74444580078125, -0.6942138671875, -0.64398193359375, -0.59375, -0.54351806640625, -0.4932861328125, -0.44305419921875, -0.392822265625, -0.34259033203125, -0.2923583984375, -0.24212646484375, -0.19189453125, -0.14166259765625, -0.0914306640625, -0.04119873046875, 0.009033203125, 0.05926513671875, 0.1094970703125, 0.15972900390625, 0.2099609375, 0.26019287109375, 0.3104248046875, 0.36065673828125, 0.410888671875, 0.46112060546875, 0.5113525390625, 0.56158447265625, 0.61181640625, 0.66204833984375, 0.7122802734375, 0.76251220703125, 0.812744140625, 0.86297607421875, 0.9132080078125, 0.96343994140625, 1.013671875, 1.06390380859375, 1.1141357421875, 1.16436767578125, 1.214599609375, 1.26483154296875, 1.3150634765625, 1.36529541015625, 1.41552734375, 1.46575927734375, 1.5159912109375, 1.56622314453125, 1.616455078125, 1.66668701171875, 1.7169189453125, 1.76715087890625, 1.8173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 7.0, 18.0, 18.0, 26.0, 50.0, 72.0, 113.0, 169.0, 305.0, 504.0, 738.0, 671.0, 499.0, 317.0, 173.0, 109.0, 79.0, 40.0, 48.0, 26.0, 20.0, 6.0, 10.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4109954833984375, -1.366912841796875, -1.3228302001953125, -1.27874755859375, -1.2346649169921875, -1.190582275390625, -1.1464996337890625, -1.1024169921875, -1.0583343505859375, -1.014251708984375, -0.9701690673828125, -0.92608642578125, -0.8820037841796875, -0.837921142578125, -0.7938385009765625, -0.749755859375, -0.7056732177734375, -0.661590576171875, -0.6175079345703125, -0.57342529296875, -0.5293426513671875, -0.485260009765625, -0.4411773681640625, -0.3970947265625, -0.3530120849609375, -0.308929443359375, -0.2648468017578125, -0.22076416015625, -0.1766815185546875, -0.132598876953125, -0.0885162353515625, -0.04443359375, -0.0003509521484375, 0.043731689453125, 0.0878143310546875, 0.13189697265625, 0.1759796142578125, 0.220062255859375, 0.2641448974609375, 0.3082275390625, 0.3523101806640625, 0.396392822265625, 0.4404754638671875, 0.48455810546875, 0.5286407470703125, 0.572723388671875, 0.6168060302734375, 0.660888671875, 0.7049713134765625, 0.749053955078125, 0.7931365966796875, 0.83721923828125, 0.8813018798828125, 0.925384521484375, 0.9694671630859375, 1.0135498046875, 1.0576324462890625, 1.101715087890625, 1.1457977294921875, 1.18988037109375, 1.2339630126953125, 1.278045654296875, 1.3221282958984375, 1.3662109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 10.0, 8.0, 10.0, 22.0, 25.0, 51.0, 66.0, 106.0, 150.0, 151.0, 141.0, 102.0, 59.0, 43.0, 22.0, 19.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021146774291992, -4.669943332672119, -4.318739414215088, -3.967535972595215, -3.616332530975342, -3.2651288509368896, -2.9139251708984375, -2.5627217292785645, -2.2115180492401123, -1.8603144884109497, -1.509110927581787, -1.157907247543335, -0.8067036867141724, -0.45550012588500977, -0.10429644584655762, 0.24690699577331543, 0.5981106758117676, 0.9493142366409302, 1.3005177974700928, 1.651721477508545, 2.002924919128418, 2.35412859916687, 2.7053322792053223, 3.0565357208251953, 3.4077394008636475, 3.7589430809020996, 4.110146522521973, 4.461350440979004, 4.812553882598877, 5.16375732421875, 5.514961242675781, 5.866164207458496, 6.217368125915527, 6.5685715675354, 6.919775485992432, 7.270978927612305, 7.622182369232178, 7.973385810852051, 8.324589729309082, 8.675792694091797, 9.026996612548828, 9.37820053100586, 9.729403495788574, 10.080607414245605, 10.431811332702637, 10.783014297485352, 11.134218215942383, 11.485422134399414, 11.836626052856445, 12.187829971313477, 12.539032936096191, 12.890236854553223, 13.241440773010254, 13.592643737792969, 13.94384765625, 14.295051574707031, 14.646254539489746, 14.997458457946777, 15.348661422729492, 15.699865341186523, 16.051069259643555, 16.402273178100586, 16.753475189208984, 17.104679107666016, 17.455883026123047]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 18.0, 13.0, 20.0, 28.0, 20.0, 31.0, 29.0, 37.0, 34.0, 36.0, 52.0, 35.0, 49.0, 45.0, 33.0, 49.0, 47.0, 34.0, 51.0, 38.0, 34.0, 27.0, 28.0, 30.0, 23.0, 17.0, 19.0, 28.0, 11.0, 10.0, 8.0, 11.0, 5.0, 8.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5354461669921875, -5.352889060974121, -5.170332431793213, -4.9877753257751465, -4.805218696594238, -4.622661590576172, -4.440104961395264, -4.257547855377197, -4.074991226196289, -3.8924343585968018, -3.7098774909973145, -3.527320623397827, -3.34476375579834, -3.1622068881988525, -2.9796500205993652, -2.797092914581299, -2.6145360469818115, -2.431979179382324, -2.249422311782837, -2.0668654441833496, -1.8843085765838623, -1.701751708984375, -1.5191947221755981, -1.3366378545761108, -1.1540809869766235, -0.9715241193771362, -0.7889672517776489, -0.6064103245735168, -0.42385345697402954, -0.24129658937454224, -0.058739662170410156, 0.12381720542907715, 0.30637407302856445, 0.48893094062805176, 0.6714878082275391, 0.8540447354316711, 1.0366015434265137, 1.219158411026001, 1.4017153978347778, 1.5842722654342651, 1.7668291330337524, 1.9493860006332397, 2.1319429874420166, 2.314499855041504, 2.497056722640991, 2.6796135902404785, 2.862170457839966, 3.044727325439453, 3.2272841930389404, 3.4098410606384277, 3.592397928237915, 3.7749547958374023, 3.9575116634368896, 4.140068531036377, 4.322625637054443, 4.505182266235352, 4.687739372253418, 4.870296478271484, 5.052853107452393, 5.235410213470459, 5.417966842651367, 5.600523948669434, 5.783080577850342, 5.965637683868408, 6.148194313049316]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 8.0, 2.0, 7.0, 7.0, 12.0, 19.0, 36.0, 37.0, 76.0, 89.0, 168.0, 238.0, 384.0, 811.0, 1595.0, 3775.0, 9919.0, 29689.0, 104195.0, 374157.0, 372939.0, 103676.0, 29636.0, 9834.0, 3716.0, 1636.0, 770.0, 413.0, 268.0, 162.0, 86.0, 54.0, 56.0, 20.0, 21.0, 15.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.470703125, -1.428680419921875, -1.38665771484375, -1.344635009765625, -1.3026123046875, -1.260589599609375, -1.21856689453125, -1.176544189453125, -1.134521484375, -1.092498779296875, -1.05047607421875, -1.008453369140625, -0.9664306640625, -0.924407958984375, -0.88238525390625, -0.840362548828125, -0.79833984375, -0.756317138671875, -0.71429443359375, -0.672271728515625, -0.6302490234375, -0.588226318359375, -0.54620361328125, -0.504180908203125, -0.462158203125, -0.420135498046875, -0.37811279296875, -0.336090087890625, -0.2940673828125, -0.252044677734375, -0.21002197265625, -0.167999267578125, -0.1259765625, -0.083953857421875, -0.04193115234375, 9.1552734375e-05, 0.0421142578125, 0.084136962890625, 0.12615966796875, 0.168182373046875, 0.210205078125, 0.252227783203125, 0.29425048828125, 0.336273193359375, 0.3782958984375, 0.420318603515625, 0.46234130859375, 0.504364013671875, 0.54638671875, 0.588409423828125, 0.63043212890625, 0.672454833984375, 0.7144775390625, 0.756500244140625, 0.79852294921875, 0.840545654296875, 0.882568359375, 0.924591064453125, 0.96661376953125, 1.008636474609375, 1.0506591796875, 1.092681884765625, 1.13470458984375, 1.176727294921875, 1.21875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 9.0, 13.0, 24.0, 23.0, 31.0, 39.0, 42.0, 43.0, 46.0, 55.0, 52.0, 70.0, 66.0, 76.0, 58.0, 56.0, 46.0, 56.0, 38.0, 39.0, 42.0, 16.0, 16.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.635040283203125, -0.60797119140625, -0.580902099609375, -0.5538330078125, -0.526763916015625, -0.49969482421875, -0.472625732421875, -0.445556640625, -0.418487548828125, -0.39141845703125, -0.364349365234375, -0.3372802734375, -0.310211181640625, -0.28314208984375, -0.256072998046875, -0.22900390625, -0.201934814453125, -0.17486572265625, -0.147796630859375, -0.1207275390625, -0.093658447265625, -0.06658935546875, -0.039520263671875, -0.012451171875, 0.014617919921875, 0.04168701171875, 0.068756103515625, 0.0958251953125, 0.122894287109375, 0.14996337890625, 0.177032470703125, 0.2041015625, 0.231170654296875, 0.25823974609375, 0.285308837890625, 0.3123779296875, 0.339447021484375, 0.36651611328125, 0.393585205078125, 0.420654296875, 0.447723388671875, 0.47479248046875, 0.501861572265625, 0.5289306640625, 0.555999755859375, 0.58306884765625, 0.610137939453125, 0.63720703125, 0.664276123046875, 0.69134521484375, 0.718414306640625, 0.7454833984375, 0.772552490234375, 0.79962158203125, 0.826690673828125, 0.853759765625, 0.880828857421875, 0.90789794921875, 0.934967041015625, 0.9620361328125, 0.989105224609375, 1.01617431640625, 1.043243408203125, 1.0703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 10.0, 11.0, 13.0, 33.0, 45.0, 47.0, 56.0, 85.0, 134.0, 243.0, 339.0, 701.0, 1339.0, 3667.0, 15877.0, 123012.0, 779121.0, 103363.0, 14015.0, 3479.0, 1282.0, 621.0, 352.0, 217.0, 148.0, 102.0, 65.0, 36.0, 31.0, 31.0, 15.0, 9.0, 12.0, 7.0, 7.0, 2.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.490234375, -2.420013427734375, -2.34979248046875, -2.279571533203125, -2.2093505859375, -2.139129638671875, -2.06890869140625, -1.998687744140625, -1.928466796875, -1.858245849609375, -1.78802490234375, -1.717803955078125, -1.6475830078125, -1.577362060546875, -1.50714111328125, -1.436920166015625, -1.36669921875, -1.296478271484375, -1.22625732421875, -1.156036376953125, -1.0858154296875, -1.015594482421875, -0.94537353515625, -0.875152587890625, -0.804931640625, -0.734710693359375, -0.66448974609375, -0.594268798828125, -0.5240478515625, -0.453826904296875, -0.38360595703125, -0.313385009765625, -0.2431640625, -0.172943115234375, -0.10272216796875, -0.032501220703125, 0.0377197265625, 0.107940673828125, 0.17816162109375, 0.248382568359375, 0.318603515625, 0.388824462890625, 0.45904541015625, 0.529266357421875, 0.5994873046875, 0.669708251953125, 0.73992919921875, 0.810150146484375, 0.88037109375, 0.950592041015625, 1.02081298828125, 1.091033935546875, 1.1612548828125, 1.231475830078125, 1.30169677734375, 1.371917724609375, 1.442138671875, 1.512359619140625, 1.58258056640625, 1.652801513671875, 1.7230224609375, 1.793243408203125, 1.86346435546875, 1.933685302734375, 2.00390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 17.0, 16.0, 10.0, 22.0, 30.0, 23.0, 44.0, 50.0, 51.0, 58.0, 44.0, 44.0, 65.0, 41.0, 46.0, 54.0, 39.0, 53.0, 39.0, 40.0, 42.0, 35.0, 19.0, 16.0, 12.0, 14.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.073699951171875, -1.99700927734375, -1.920318603515625, -1.8436279296875, -1.766937255859375, -1.69024658203125, -1.613555908203125, -1.536865234375, -1.460174560546875, -1.38348388671875, -1.306793212890625, -1.2301025390625, -1.153411865234375, -1.07672119140625, -1.000030517578125, -0.92333984375, -0.846649169921875, -0.76995849609375, -0.693267822265625, -0.6165771484375, -0.539886474609375, -0.46319580078125, -0.386505126953125, -0.309814453125, -0.233123779296875, -0.15643310546875, -0.079742431640625, -0.0030517578125, 0.073638916015625, 0.15032958984375, 0.227020263671875, 0.3037109375, 0.380401611328125, 0.45709228515625, 0.533782958984375, 0.6104736328125, 0.687164306640625, 0.76385498046875, 0.840545654296875, 0.917236328125, 0.993927001953125, 1.07061767578125, 1.147308349609375, 1.2239990234375, 1.300689697265625, 1.37738037109375, 1.454071044921875, 1.53076171875, 1.607452392578125, 1.68414306640625, 1.760833740234375, 1.8375244140625, 1.914215087890625, 1.99090576171875, 2.067596435546875, 2.144287109375, 2.220977783203125, 2.29766845703125, 2.374359130859375, 2.4510498046875, 2.527740478515625, 2.60443115234375, 2.681121826171875, 2.7578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 5.0, 6.0, 15.0, 19.0, 37.0, 43.0, 70.0, 81.0, 177.0, 287.0, 608.0, 1373.0, 3649.0, 11727.0, 48927.0, 636260.0, 291193.0, 38495.0, 9940.0, 3062.0, 1280.0, 549.0, 293.0, 172.0, 85.0, 62.0, 39.0, 25.0, 19.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5810546875, -0.5616378784179688, -0.5422210693359375, -0.5228042602539062, -0.503387451171875, -0.48397064208984375, -0.4645538330078125, -0.44513702392578125, -0.42572021484375, -0.40630340576171875, -0.3868865966796875, -0.36746978759765625, -0.348052978515625, -0.32863616943359375, -0.3092193603515625, -0.28980255126953125, -0.2703857421875, -0.25096893310546875, -0.2315521240234375, -0.21213531494140625, -0.192718505859375, -0.17330169677734375, -0.1538848876953125, -0.13446807861328125, -0.11505126953125, -0.09563446044921875, -0.0762176513671875, -0.05680084228515625, -0.037384033203125, -0.01796722412109375, 0.0014495849609375, 0.02086639404296875, 0.040283203125, 0.05970001220703125, 0.0791168212890625, 0.09853363037109375, 0.117950439453125, 0.13736724853515625, 0.1567840576171875, 0.17620086669921875, 0.19561767578125, 0.21503448486328125, 0.2344512939453125, 0.25386810302734375, 0.273284912109375, 0.29270172119140625, 0.3121185302734375, 0.33153533935546875, 0.3509521484375, 0.37036895751953125, 0.3897857666015625, 0.40920257568359375, 0.428619384765625, 0.44803619384765625, 0.4674530029296875, 0.48686981201171875, 0.50628662109375, 0.5257034301757812, 0.5451202392578125, 0.5645370483398438, 0.583953857421875, 0.6033706665039062, 0.6227874755859375, 0.6422042846679688, 0.66162109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 7.0, 9.0, 19.0, 18.0, 22.0, 34.0, 48.0, 54.0, 97.0, 98.0, 116.0, 103.0, 64.0, 51.0, 51.0, 27.0, 15.0, 26.0, 17.0, 15.0, 10.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010734796524047852, -0.00010401848703622818, -0.00010068900883197784, -9.735953062772751e-05, -9.403005242347717e-05, -9.070057421922684e-05, -8.73710960149765e-05, -8.404161781072617e-05, -8.071213960647583e-05, -7.73826614022255e-05, -7.405318319797516e-05, -7.072370499372482e-05, -6.739422678947449e-05, -6.406474858522415e-05, -6.0735270380973816e-05, -5.740579217672348e-05, -5.4076313972473145e-05, -5.074683576822281e-05, -4.741735756397247e-05, -4.408787935972214e-05, -4.07584011554718e-05, -3.7428922951221466e-05, -3.409944474697113e-05, -3.0769966542720795e-05, -2.744048833847046e-05, -2.4111010134220123e-05, -2.0781531929969788e-05, -1.7452053725719452e-05, -1.4122575521469116e-05, -1.079309731721878e-05, -7.463619112968445e-06, -4.134140908718109e-06, -8.046627044677734e-07, 2.5248154997825623e-06, 5.854293704032898e-06, 9.183771908283234e-06, 1.251325011253357e-05, 1.5842728316783905e-05, 1.917220652103424e-05, 2.2501684725284576e-05, 2.5831162929534912e-05, 2.9160641133785248e-05, 3.2490119338035583e-05, 3.581959754228592e-05, 3.9149075746536255e-05, 4.247855395078659e-05, 4.5808032155036926e-05, 4.913751035928726e-05, 5.24669885635376e-05, 5.579646676778793e-05, 5.912594497203827e-05, 6.24554231762886e-05, 6.578490138053894e-05, 6.911437958478928e-05, 7.244385778903961e-05, 7.577333599328995e-05, 7.910281419754028e-05, 8.243229240179062e-05, 8.576177060604095e-05, 8.909124881029129e-05, 9.242072701454163e-05, 9.575020521879196e-05, 9.90796834230423e-05, 0.00010240916162729263, 0.00010573863983154297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 16.0, 14.0, 38.0, 44.0, 55.0, 95.0, 170.0, 302.0, 524.0, 1305.0, 3948.0, 15899.0, 97910.0, 799065.0, 105554.0, 16860.0, 4104.0, 1360.0, 555.0, 297.0, 151.0, 94.0, 56.0, 45.0, 20.0, 19.0, 10.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.544708251953125, -0.52154541015625, -0.498382568359375, -0.4752197265625, -0.452056884765625, -0.42889404296875, -0.405731201171875, -0.382568359375, -0.359405517578125, -0.33624267578125, -0.313079833984375, -0.2899169921875, -0.266754150390625, -0.24359130859375, -0.220428466796875, -0.197265625, -0.174102783203125, -0.15093994140625, -0.127777099609375, -0.1046142578125, -0.081451416015625, -0.05828857421875, -0.035125732421875, -0.011962890625, 0.011199951171875, 0.03436279296875, 0.057525634765625, 0.0806884765625, 0.103851318359375, 0.12701416015625, 0.150177001953125, 0.17333984375, 0.196502685546875, 0.21966552734375, 0.242828369140625, 0.2659912109375, 0.289154052734375, 0.31231689453125, 0.335479736328125, 0.358642578125, 0.381805419921875, 0.40496826171875, 0.428131103515625, 0.4512939453125, 0.474456787109375, 0.49761962890625, 0.520782470703125, 0.5439453125, 0.567108154296875, 0.59027099609375, 0.613433837890625, 0.6365966796875, 0.659759521484375, 0.68292236328125, 0.706085205078125, 0.729248046875, 0.752410888671875, 0.77557373046875, 0.798736572265625, 0.8218994140625, 0.845062255859375, 0.86822509765625, 0.891387939453125, 0.91455078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 13.0, 15.0, 16.0, 28.0, 23.0, 27.0, 39.0, 50.0, 69.0, 95.0, 102.0, 109.0, 87.0, 54.0, 39.0, 40.0, 32.0, 19.0, 21.0, 14.0, 14.0, 7.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5390625, -0.5232086181640625, -0.507354736328125, -0.4915008544921875, -0.47564697265625, -0.4597930908203125, -0.443939208984375, -0.4280853271484375, -0.4122314453125, -0.3963775634765625, -0.380523681640625, -0.3646697998046875, -0.34881591796875, -0.3329620361328125, -0.317108154296875, -0.3012542724609375, -0.285400390625, -0.2695465087890625, -0.253692626953125, -0.2378387451171875, -0.22198486328125, -0.2061309814453125, -0.190277099609375, -0.1744232177734375, -0.1585693359375, -0.1427154541015625, -0.126861572265625, -0.1110076904296875, -0.09515380859375, -0.0792999267578125, -0.063446044921875, -0.0475921630859375, -0.03173828125, -0.0158843994140625, -3.0517578125e-05, 0.0158233642578125, 0.03167724609375, 0.0475311279296875, 0.063385009765625, 0.0792388916015625, 0.0950927734375, 0.1109466552734375, 0.126800537109375, 0.1426544189453125, 0.15850830078125, 0.1743621826171875, 0.190216064453125, 0.2060699462890625, 0.221923828125, 0.2377777099609375, 0.253631591796875, 0.2694854736328125, 0.28533935546875, 0.3011932373046875, 0.317047119140625, 0.3329010009765625, 0.3487548828125, 0.3646087646484375, 0.380462646484375, 0.3963165283203125, 0.41217041015625, 0.4280242919921875, 0.443878173828125, 0.4597320556640625, 0.4755859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 8.0, 18.0, 45.0, 117.0, 365.0, 285.0, 102.0, 26.0, 12.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.106849670410156, -33.36344909667969, -32.62004852294922, -31.876649856567383, -31.133251190185547, -30.389850616455078, -29.646451950073242, -28.903051376342773, -28.159652709960938, -27.41625213623047, -26.672853469848633, -25.929452896118164, -25.186054229736328, -24.44265365600586, -23.699254989624023, -22.955854415893555, -22.21245574951172, -21.46905517578125, -20.725656509399414, -19.982255935668945, -19.23885726928711, -18.49545669555664, -17.752058029174805, -17.008657455444336, -16.265256881713867, -15.521857261657715, -14.778457641601562, -14.03505802154541, -13.291658401489258, -12.548258781433105, -11.804859161376953, -11.061458587646484, -10.318059921264648, -9.574660301208496, -8.831260681152344, -8.087861061096191, -7.344461441040039, -6.601061820983887, -5.857661724090576, -5.114262104034424, -4.3708624839782715, -3.627462863922119, -2.884063243865967, -2.1406633853912354, -1.397263765335083, -0.6538641452789307, 0.08953571319580078, 0.8329353332519531, 1.5763349533081055, 2.319734573364258, 3.06313419342041, 3.8065340518951416, 4.549933433532715, 5.293333053588867, 6.036733150482178, 6.78013277053833, 7.523532390594482, 8.266932487487793, 9.010332107543945, 9.753731727600098, 10.49713134765625, 11.240530967712402, 11.983930587768555, 12.727330207824707, 13.47072982788086]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 10.0, 2.0, 10.0, 16.0, 7.0, 12.0, 19.0, 28.0, 16.0, 33.0, 23.0, 26.0, 42.0, 41.0, 58.0, 75.0, 106.0, 90.0, 55.0, 37.0, 49.0, 20.0, 38.0, 31.0, 30.0, 14.0, 19.0, 14.0, 19.0, 4.0, 6.0, 6.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-10.810636520385742, -10.506580352783203, -10.202524185180664, -9.898468017578125, -9.594411849975586, -9.290355682373047, -8.986299514770508, -8.682243347167969, -8.37818717956543, -8.07413101196289, -7.770074844360352, -7.4660186767578125, -7.161962509155273, -6.857906341552734, -6.553850173950195, -6.249794006347656, -5.945737361907959, -5.64168119430542, -5.337625026702881, -5.033568859100342, -4.729512691497803, -4.425456523895264, -4.121399879455566, -3.8173439502716064, -3.5132877826690674, -3.2092316150665283, -2.9051754474639893, -2.601119041442871, -2.297062873840332, -1.9930068254470825, -1.688950538635254, -1.3848943710327148, -1.0808382034301758, -0.7767820358276367, -0.4727258086204529, -0.16866958141326904, 0.13538658618927002, 0.4394427537918091, 0.7434990406036377, 1.0475552082061768, 1.3516113758087158, 1.6556675434112549, 1.959723711013794, 2.263780117034912, 2.567836284637451, 2.8718924522399902, 3.1759486198425293, 3.4800047874450684, 3.7840609550476074, 4.0881171226501465, 4.3921732902526855, 4.696229457855225, 5.000285625457764, 5.304341793060303, 5.6083984375, 5.912454605102539, 6.216510772705078, 6.520566940307617, 6.824623107910156, 7.128679275512695, 7.432735443115234, 7.736791610717773, 8.040847778320312, 8.344903945922852, 8.64896011352539]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 2.0, 12.0, 13.0, 18.0, 25.0, 47.0, 68.0, 97.0, 168.0, 346.0, 665.0, 1339.0, 3310.0, 9568.0, 40378.0, 309086.0, 2618778.0, 1081913.0, 100136.0, 18555.0, 5539.0, 2137.0, 941.0, 488.0, 236.0, 142.0, 95.0, 59.0, 40.0, 19.0, 16.0, 14.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2607421875, -1.223388671875, -1.18603515625, -1.148681640625, -1.111328125, -1.073974609375, -1.03662109375, -0.999267578125, -0.9619140625, -0.924560546875, -0.88720703125, -0.849853515625, -0.8125, -0.775146484375, -0.73779296875, -0.700439453125, -0.6630859375, -0.625732421875, -0.58837890625, -0.551025390625, -0.513671875, -0.476318359375, -0.43896484375, -0.401611328125, -0.3642578125, -0.326904296875, -0.28955078125, -0.252197265625, -0.21484375, -0.177490234375, -0.14013671875, -0.102783203125, -0.0654296875, -0.028076171875, 0.00927734375, 0.046630859375, 0.083984375, 0.121337890625, 0.15869140625, 0.196044921875, 0.2333984375, 0.270751953125, 0.30810546875, 0.345458984375, 0.3828125, 0.420166015625, 0.45751953125, 0.494873046875, 0.5322265625, 0.569580078125, 0.60693359375, 0.644287109375, 0.681640625, 0.718994140625, 0.75634765625, 0.793701171875, 0.8310546875, 0.868408203125, 0.90576171875, 0.943115234375, 0.98046875, 1.017822265625, 1.05517578125, 1.092529296875, 1.1298828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 12.0, 14.0, 16.0, 16.0, 24.0, 30.0, 41.0, 50.0, 27.0, 51.0, 48.0, 46.0, 60.0, 54.0, 65.0, 59.0, 41.0, 51.0, 48.0, 44.0, 43.0, 29.0, 34.0, 20.0, 11.0, 17.0, 9.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6767578125, -0.6533203125, -0.6298828125, -0.6064453125, -0.5830078125, -0.5595703125, -0.5361328125, -0.5126953125, -0.4892578125, -0.4658203125, -0.4423828125, -0.4189453125, -0.3955078125, -0.3720703125, -0.3486328125, -0.3251953125, -0.3017578125, -0.2783203125, -0.2548828125, -0.2314453125, -0.2080078125, -0.1845703125, -0.1611328125, -0.1376953125, -0.1142578125, -0.0908203125, -0.0673828125, -0.0439453125, -0.0205078125, 0.0029296875, 0.0263671875, 0.0498046875, 0.0732421875, 0.0966796875, 0.1201171875, 0.1435546875, 0.1669921875, 0.1904296875, 0.2138671875, 0.2373046875, 0.2607421875, 0.2841796875, 0.3076171875, 0.3310546875, 0.3544921875, 0.3779296875, 0.4013671875, 0.4248046875, 0.4482421875, 0.4716796875, 0.4951171875, 0.5185546875, 0.5419921875, 0.5654296875, 0.5888671875, 0.6123046875, 0.6357421875, 0.6591796875, 0.6826171875, 0.7060546875, 0.7294921875, 0.7529296875, 0.7763671875, 0.7998046875, 0.8232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 5.0, 9.0, 13.0, 9.0, 13.0, 24.0, 58.0, 76.0, 115.0, 156.0, 334.0, 803.0, 2116.0, 7418.0, 40789.0, 659587.0, 3289378.0, 167564.0, 18813.0, 4460.0, 1315.0, 559.0, 284.0, 151.0, 74.0, 41.0, 36.0, 24.0, 9.0, 13.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8123626708984375, -1.762420654296875, -1.7124786376953125, -1.66253662109375, -1.6125946044921875, -1.562652587890625, -1.5127105712890625, -1.4627685546875, -1.4128265380859375, -1.362884521484375, -1.3129425048828125, -1.26300048828125, -1.2130584716796875, -1.163116455078125, -1.1131744384765625, -1.063232421875, -1.0132904052734375, -0.963348388671875, -0.9134063720703125, -0.86346435546875, -0.8135223388671875, -0.763580322265625, -0.7136383056640625, -0.6636962890625, -0.6137542724609375, -0.563812255859375, -0.5138702392578125, -0.46392822265625, -0.4139862060546875, -0.364044189453125, -0.3141021728515625, -0.26416015625, -0.2142181396484375, -0.164276123046875, -0.1143341064453125, -0.06439208984375, -0.0144500732421875, 0.035491943359375, 0.0854339599609375, 0.1353759765625, 0.1853179931640625, 0.235260009765625, 0.2852020263671875, 0.33514404296875, 0.3850860595703125, 0.435028076171875, 0.4849700927734375, 0.534912109375, 0.5848541259765625, 0.634796142578125, 0.6847381591796875, 0.73468017578125, 0.7846221923828125, 0.834564208984375, 0.8845062255859375, 0.9344482421875, 0.9843902587890625, 1.034332275390625, 1.0842742919921875, 1.13421630859375, 1.1841583251953125, 1.234100341796875, 1.2840423583984375, 1.333984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 12.0, 26.0, 41.0, 37.0, 83.0, 93.0, 129.0, 203.0, 296.0, 394.0, 526.0, 556.0, 469.0, 347.0, 251.0, 150.0, 115.0, 69.0, 66.0, 38.0, 46.0, 19.0, 18.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0298614501953125, -0.993316650390625, -0.9567718505859375, -0.92022705078125, -0.8836822509765625, -0.847137451171875, -0.8105926513671875, -0.7740478515625, -0.7375030517578125, -0.700958251953125, -0.6644134521484375, -0.62786865234375, -0.5913238525390625, -0.554779052734375, -0.5182342529296875, -0.481689453125, -0.4451446533203125, -0.408599853515625, -0.3720550537109375, -0.33551025390625, -0.2989654541015625, -0.262420654296875, -0.2258758544921875, -0.1893310546875, -0.1527862548828125, -0.116241455078125, -0.0796966552734375, -0.04315185546875, -0.0066070556640625, 0.029937744140625, 0.0664825439453125, 0.10302734375, 0.1395721435546875, 0.176116943359375, 0.2126617431640625, 0.24920654296875, 0.2857513427734375, 0.322296142578125, 0.3588409423828125, 0.3953857421875, 0.4319305419921875, 0.468475341796875, 0.5050201416015625, 0.54156494140625, 0.5781097412109375, 0.614654541015625, 0.6511993408203125, 0.687744140625, 0.7242889404296875, 0.760833740234375, 0.7973785400390625, 0.83392333984375, 0.8704681396484375, 0.907012939453125, 0.9435577392578125, 0.9801025390625, 1.0166473388671875, 1.053192138671875, 1.0897369384765625, 1.12628173828125, 1.1628265380859375, 1.199371337890625, 1.2359161376953125, 1.2724609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 13.0, 29.0, 49.0, 94.0, 145.0, 181.0, 176.0, 125.0, 61.0, 49.0, 24.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.183838844299316, -7.769847869873047, -7.355856895446777, -6.941866397857666, -6.5278754234313965, -6.113884449005127, -5.699893951416016, -5.285902976989746, -4.871912002563477, -4.457921028137207, -4.0439300537109375, -3.629939556121826, -3.2159485816955566, -2.801957607269287, -2.3879668712615967, -1.9739761352539062, -1.5599851608276367, -1.1459943056106567, -0.7320034503936768, -0.3180125951766968, 0.0959782600402832, 0.5099692344665527, 0.9239599704742432, 1.3379507064819336, 1.7519416809082031, 2.1659326553344727, 2.579923391342163, 2.9939141273498535, 3.407905101776123, 3.8218960762023926, 4.235886573791504, 4.649877548217773, 5.063869476318359, 5.477860450744629, 5.891851425170898, 6.30584192276001, 6.719832897186279, 7.133823871612549, 7.54781436920166, 7.96180534362793, 8.3757963180542, 8.789787292480469, 9.203778266906738, 9.617769241333008, 10.031759262084961, 10.445751190185547, 10.8597412109375, 11.27373218536377, 11.687723159790039, 12.101714134216309, 12.515705108642578, 12.929696083068848, 13.343687057495117, 13.75767707824707, 14.17166805267334, 14.58565902709961, 14.999650001525879, 15.413640975952148, 15.827631950378418, 16.241622924804688, 16.65561294555664, 17.069604873657227, 17.48359489440918, 17.897586822509766, 18.31157684326172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 8.0, 19.0, 23.0, 23.0, 19.0, 33.0, 37.0, 38.0, 31.0, 51.0, 37.0, 41.0, 52.0, 43.0, 48.0, 44.0, 45.0, 32.0, 30.0, 47.0, 32.0, 39.0, 27.0, 24.0, 22.0, 23.0, 10.0, 12.0, 15.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0], "bins": [-6.707261085510254, -6.5287370681762695, -6.350213050842285, -6.171689033508301, -5.993165493011475, -5.81464147567749, -5.636117458343506, -5.4575934410095215, -5.279069423675537, -5.100545406341553, -4.922021389007568, -4.743497848510742, -4.564973831176758, -4.386449813842773, -4.207925796508789, -4.029401779174805, -3.8508780002593994, -3.672353982925415, -3.4938302040100098, -3.3153061866760254, -3.136782169342041, -2.9582581520080566, -2.7797343730926514, -2.601210355758667, -2.4226865768432617, -2.2441625595092773, -2.065638780593872, -1.8871147632598877, -1.7085907459259033, -1.5300668478012085, -1.3515429496765137, -1.1730189323425293, -0.9944949150085449, -0.8159709572792053, -0.6374469995498657, -0.4589231014251709, -0.2803991436958313, -0.1018751859664917, 0.07664871215820312, 0.2551727294921875, 0.4336966276168823, 0.6122205853462219, 0.7907445430755615, 0.9692684412002563, 1.1477923393249512, 1.3263163566589355, 1.5048402547836304, 1.6833642721176147, 1.8618881702423096, 2.040412187576294, 2.218935966491699, 2.3974599838256836, 2.575984001159668, 2.7545080184936523, 2.9330317974090576, 3.111555814743042, 3.2900795936584473, 3.4686036109924316, 3.647127389907837, 3.8256514072418213, 4.004175186157227, 4.182699203491211, 4.361223220825195, 4.53974723815918, 4.718271255493164]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 10.0, 7.0, 9.0, 11.0, 26.0, 40.0, 51.0, 92.0, 183.0, 334.0, 630.0, 1302.0, 2813.0, 6863.0, 17919.0, 54502.0, 206201.0, 492176.0, 186938.0, 50212.0, 16634.0, 6308.0, 2722.0, 1220.0, 603.0, 296.0, 186.0, 101.0, 70.0, 33.0, 21.0, 16.0, 6.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.087188720703125, -1.04449462890625, -1.001800537109375, -0.9591064453125, -0.916412353515625, -0.87371826171875, -0.831024169921875, -0.788330078125, -0.745635986328125, -0.70294189453125, -0.660247802734375, -0.6175537109375, -0.574859619140625, -0.53216552734375, -0.489471435546875, -0.44677734375, -0.404083251953125, -0.36138916015625, -0.318695068359375, -0.2760009765625, -0.233306884765625, -0.19061279296875, -0.147918701171875, -0.105224609375, -0.062530517578125, -0.01983642578125, 0.022857666015625, 0.0655517578125, 0.108245849609375, 0.15093994140625, 0.193634033203125, 0.236328125, 0.279022216796875, 0.32171630859375, 0.364410400390625, 0.4071044921875, 0.449798583984375, 0.49249267578125, 0.535186767578125, 0.577880859375, 0.620574951171875, 0.66326904296875, 0.705963134765625, 0.7486572265625, 0.791351318359375, 0.83404541015625, 0.876739501953125, 0.91943359375, 0.962127685546875, 1.00482177734375, 1.047515869140625, 1.0902099609375, 1.132904052734375, 1.17559814453125, 1.218292236328125, 1.260986328125, 1.303680419921875, 1.34637451171875, 1.389068603515625, 1.4317626953125, 1.474456787109375, 1.51715087890625, 1.559844970703125, 1.6025390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 21.0, 22.0, 27.0, 32.0, 27.0, 48.0, 43.0, 39.0, 44.0, 56.0, 65.0, 55.0, 46.0, 59.0, 44.0, 54.0, 27.0, 53.0, 32.0, 30.0, 34.0, 18.0, 11.0, 12.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6354446411132812, -0.6121978759765625, -0.5889511108398438, -0.565704345703125, -0.5424575805664062, -0.5192108154296875, -0.49596405029296875, -0.47271728515625, -0.44947052001953125, -0.4262237548828125, -0.40297698974609375, -0.379730224609375, -0.35648345947265625, -0.3332366943359375, -0.30998992919921875, -0.2867431640625, -0.26349639892578125, -0.2402496337890625, -0.21700286865234375, -0.193756103515625, -0.17050933837890625, -0.1472625732421875, -0.12401580810546875, -0.10076904296875, -0.07752227783203125, -0.0542755126953125, -0.03102874755859375, -0.007781982421875, 0.01546478271484375, 0.0387115478515625, 0.06195831298828125, 0.085205078125, 0.10845184326171875, 0.1316986083984375, 0.15494537353515625, 0.178192138671875, 0.20143890380859375, 0.2246856689453125, 0.24793243408203125, 0.27117919921875, 0.29442596435546875, 0.3176727294921875, 0.34091949462890625, 0.364166259765625, 0.38741302490234375, 0.4106597900390625, 0.43390655517578125, 0.4571533203125, 0.48040008544921875, 0.5036468505859375, 0.5268936157226562, 0.550140380859375, 0.5733871459960938, 0.5966339111328125, 0.6198806762695312, 0.64312744140625, 0.6663742065429688, 0.6896209716796875, 0.7128677368164062, 0.736114501953125, 0.7593612670898438, 0.7826080322265625, 0.8058547973632812, 0.8291015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 21.0, 18.0, 15.0, 31.0, 33.0, 46.0, 74.0, 95.0, 148.0, 218.0, 344.0, 507.0, 892.0, 1696.0, 4239.0, 17860.0, 171297.0, 785405.0, 51473.0, 8394.0, 2592.0, 1156.0, 669.0, 412.0, 266.0, 182.0, 138.0, 92.0, 60.0, 45.0, 42.0, 29.0, 17.0, 15.0, 2.0, 6.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.9354248046875, -1.866943359375, -1.7984619140625, -1.72998046875, -1.6614990234375, -1.593017578125, -1.5245361328125, -1.4560546875, -1.3875732421875, -1.319091796875, -1.2506103515625, -1.18212890625, -1.1136474609375, -1.045166015625, -0.9766845703125, -0.908203125, -0.8397216796875, -0.771240234375, -0.7027587890625, -0.63427734375, -0.5657958984375, -0.497314453125, -0.4288330078125, -0.3603515625, -0.2918701171875, -0.223388671875, -0.1549072265625, -0.08642578125, -0.0179443359375, 0.050537109375, 0.1190185546875, 0.1875, 0.2559814453125, 0.324462890625, 0.3929443359375, 0.46142578125, 0.5299072265625, 0.598388671875, 0.6668701171875, 0.7353515625, 0.8038330078125, 0.872314453125, 0.9407958984375, 1.00927734375, 1.0777587890625, 1.146240234375, 1.2147216796875, 1.283203125, 1.3516845703125, 1.420166015625, 1.4886474609375, 1.55712890625, 1.6256103515625, 1.694091796875, 1.7625732421875, 1.8310546875, 1.8995361328125, 1.968017578125, 2.0364990234375, 2.10498046875, 2.1734619140625, 2.241943359375, 2.3104248046875, 2.37890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 4.0, 3.0, 9.0, 9.0, 9.0, 13.0, 16.0, 21.0, 15.0, 31.0, 33.0, 31.0, 41.0, 47.0, 44.0, 61.0, 46.0, 55.0, 71.0, 58.0, 49.0, 61.0, 41.0, 28.0, 37.0, 33.0, 20.0, 16.0, 13.0, 13.0, 14.0, 12.0, 9.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.050048828125, -1.97314453125, -1.896240234375, -1.8193359375, -1.742431640625, -1.66552734375, -1.588623046875, -1.51171875, -1.434814453125, -1.35791015625, -1.281005859375, -1.2041015625, -1.127197265625, -1.05029296875, -0.973388671875, -0.896484375, -0.819580078125, -0.74267578125, -0.665771484375, -0.5888671875, -0.511962890625, -0.43505859375, -0.358154296875, -0.28125, -0.204345703125, -0.12744140625, -0.050537109375, 0.0263671875, 0.103271484375, 0.18017578125, 0.257080078125, 0.333984375, 0.410888671875, 0.48779296875, 0.564697265625, 0.6416015625, 0.718505859375, 0.79541015625, 0.872314453125, 0.94921875, 1.026123046875, 1.10302734375, 1.179931640625, 1.2568359375, 1.333740234375, 1.41064453125, 1.487548828125, 1.564453125, 1.641357421875, 1.71826171875, 1.795166015625, 1.8720703125, 1.948974609375, 2.02587890625, 2.102783203125, 2.1796875, 2.256591796875, 2.33349609375, 2.410400390625, 2.4873046875, 2.564208984375, 2.64111328125, 2.718017578125, 2.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 6.0, 6.0, 9.0, 22.0, 35.0, 65.0, 103.0, 163.0, 299.0, 695.0, 1749.0, 6163.0, 41817.0, 875283.0, 107005.0, 10750.0, 2565.0, 929.0, 369.0, 210.0, 112.0, 54.0, 39.0, 30.0, 20.0, 14.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.821533203125, -0.79638671875, -0.771240234375, -0.74609375, -0.720947265625, -0.69580078125, -0.670654296875, -0.6455078125, -0.620361328125, -0.59521484375, -0.570068359375, -0.544921875, -0.519775390625, -0.49462890625, -0.469482421875, -0.4443359375, -0.419189453125, -0.39404296875, -0.368896484375, -0.34375, -0.318603515625, -0.29345703125, -0.268310546875, -0.2431640625, -0.218017578125, -0.19287109375, -0.167724609375, -0.142578125, -0.117431640625, -0.09228515625, -0.067138671875, -0.0419921875, -0.016845703125, 0.00830078125, 0.033447265625, 0.05859375, 0.083740234375, 0.10888671875, 0.134033203125, 0.1591796875, 0.184326171875, 0.20947265625, 0.234619140625, 0.259765625, 0.284912109375, 0.31005859375, 0.335205078125, 0.3603515625, 0.385498046875, 0.41064453125, 0.435791015625, 0.4609375, 0.486083984375, 0.51123046875, 0.536376953125, 0.5615234375, 0.586669921875, 0.61181640625, 0.636962890625, 0.662109375, 0.687255859375, 0.71240234375, 0.737548828125, 0.7626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 15.0, 5.0, 11.0, 28.0, 30.0, 29.0, 39.0, 68.0, 102.0, 181.0, 153.0, 101.0, 63.0, 46.0, 24.0, 26.0, 15.0, 17.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013506412506103516, -0.00013003312051296234, -0.00012500211596488953, -0.00011997111141681671, -0.0001149401068687439, -0.00010990910232067108, -0.00010487809777259827, -9.984709322452545e-05, -9.481608867645264e-05, -8.978508412837982e-05, -8.475407958030701e-05, -7.972307503223419e-05, -7.469207048416138e-05, -6.966106593608856e-05, -6.463006138801575e-05, -5.959905683994293e-05, -5.456805229187012e-05, -4.95370477437973e-05, -4.450604319572449e-05, -3.947503864765167e-05, -3.444403409957886e-05, -2.9413029551506042e-05, -2.4382025003433228e-05, -1.9351020455360413e-05, -1.4320015907287598e-05, -9.289011359214783e-06, -4.258006811141968e-06, 7.729977369308472e-07, 5.804002285003662e-06, 1.0835006833076477e-05, 1.5866011381149292e-05, 2.0897015929222107e-05, 2.5928020477294922e-05, 3.095902502536774e-05, 3.599002957344055e-05, 4.102103412151337e-05, 4.605203866958618e-05, 5.1083043217658997e-05, 5.611404776573181e-05, 6.114505231380463e-05, 6.617605686187744e-05, 7.120706140995026e-05, 7.623806595802307e-05, 8.126907050609589e-05, 8.63000750541687e-05, 9.133107960224152e-05, 9.636208415031433e-05, 0.00010139308869838715, 0.00010642409324645996, 0.00011145509779453278, 0.00011648610234260559, 0.0001215171068906784, 0.00012654811143875122, 0.00013157911598682404, 0.00013661012053489685, 0.00014164112508296967, 0.00014667212963104248, 0.0001517031341791153, 0.0001567341387271881, 0.00016176514327526093, 0.00016679614782333374, 0.00017182715237140656, 0.00017685815691947937, 0.00018188916146755219, 0.000186920166015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 11.0, 7.0, 18.0, 19.0, 36.0, 48.0, 59.0, 81.0, 126.0, 203.0, 386.0, 732.0, 1499.0, 3406.0, 9508.0, 38936.0, 295212.0, 633376.0, 46993.0, 10678.0, 3712.0, 1560.0, 789.0, 461.0, 237.0, 132.0, 92.0, 63.0, 45.0, 35.0, 25.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.404052734375, -0.3885459899902344, -0.37303924560546875, -0.3575325012207031, -0.3420257568359375, -0.3265190124511719, -0.31101226806640625, -0.2955055236816406, -0.279998779296875, -0.2644920349121094, -0.24898529052734375, -0.23347854614257812, -0.2179718017578125, -0.20246505737304688, -0.18695831298828125, -0.17145156860351562, -0.15594482421875, -0.14043807983398438, -0.12493133544921875, -0.10942459106445312, -0.0939178466796875, -0.07841110229492188, -0.06290435791015625, -0.047397613525390625, -0.031890869140625, -0.016384124755859375, -0.00087738037109375, 0.014629364013671875, 0.0301361083984375, 0.045642852783203125, 0.06114959716796875, 0.07665634155273438, 0.0921630859375, 0.10766983032226562, 0.12317657470703125, 0.13868331909179688, 0.1541900634765625, 0.16969680786132812, 0.18520355224609375, 0.20071029663085938, 0.216217041015625, 0.23172378540039062, 0.24723052978515625, 0.2627372741699219, 0.2782440185546875, 0.2937507629394531, 0.30925750732421875, 0.3247642517089844, 0.34027099609375, 0.3557777404785156, 0.37128448486328125, 0.3867912292480469, 0.4022979736328125, 0.4178047180175781, 0.43331146240234375, 0.4488182067871094, 0.464324951171875, 0.4798316955566406, 0.49533843994140625, 0.5108451843261719, 0.5263519287109375, 0.5418586730957031, 0.5573654174804688, 0.5728721618652344, 0.58837890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 11.0, 9.0, 18.0, 14.0, 14.0, 29.0, 29.0, 35.0, 55.0, 56.0, 67.0, 111.0, 121.0, 98.0, 73.0, 63.0, 36.0, 34.0, 24.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 3.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3922462463378906, -0.37799835205078125, -0.3637504577636719, -0.3495025634765625, -0.3352546691894531, -0.32100677490234375, -0.3067588806152344, -0.292510986328125, -0.2782630920410156, -0.26401519775390625, -0.24976730346679688, -0.2355194091796875, -0.22127151489257812, -0.20702362060546875, -0.19277572631835938, -0.17852783203125, -0.16427993774414062, -0.15003204345703125, -0.13578414916992188, -0.1215362548828125, -0.10728836059570312, -0.09304046630859375, -0.07879257202148438, -0.064544677734375, -0.050296783447265625, -0.03604888916015625, -0.021800994873046875, -0.0075531005859375, 0.006694793701171875, 0.02094268798828125, 0.035190582275390625, 0.0494384765625, 0.06368637084960938, 0.07793426513671875, 0.09218215942382812, 0.1064300537109375, 0.12067794799804688, 0.13492584228515625, 0.14917373657226562, 0.163421630859375, 0.17766952514648438, 0.19191741943359375, 0.20616531372070312, 0.2204132080078125, 0.23466110229492188, 0.24890899658203125, 0.2631568908691406, 0.27740478515625, 0.2916526794433594, 0.30590057373046875, 0.3201484680175781, 0.3343963623046875, 0.3486442565917969, 0.36289215087890625, 0.3771400451660156, 0.391387939453125, 0.4056358337402344, 0.41988372802734375, 0.4341316223144531, 0.4483795166015625, 0.4626274108886719, 0.47687530517578125, 0.4911231994628906, 0.50537109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 14.0, 31.0, 114.0, 513.0, 235.0, 63.0, 19.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.60491180419922, -33.66425323486328, -32.72359085083008, -31.78293228149414, -30.84227180480957, -29.901611328125, -28.960952758789062, -28.020292282104492, -27.079631805419922, -26.13897132873535, -25.198312759399414, -24.257652282714844, -23.316991806030273, -22.376331329345703, -21.435672760009766, -20.495012283325195, -19.554351806640625, -18.613691329956055, -17.673032760620117, -16.732372283935547, -15.791711807250977, -14.851052284240723, -13.910392761230469, -12.969732284545898, -12.029073715209961, -11.088414192199707, -10.147753715515137, -9.207094192504883, -8.266433715820312, -7.325774192810059, -6.3851141929626465, -5.444454193115234, -4.503793716430664, -3.563133716583252, -2.62247371673584, -1.6818139553070068, -0.7411539554595947, 0.19950580596923828, 1.1401658058166504, 2.0808258056640625, 3.0214858055114746, 3.9621458053588867, 4.902805805206299, 5.843465805053711, 6.784125328063965, 7.724785327911377, 8.665445327758789, 9.60610580444336, 10.546765327453613, 11.487424850463867, 12.428085327148438, 13.368744850158691, 14.309405326843262, 15.250064849853516, 16.190725326538086, 17.131385803222656, 18.072044372558594, 19.012704849243164, 19.9533634185791, 20.894023895263672, 21.834684371948242, 22.775344848632812, 23.71600341796875, 24.65666389465332, 25.59732437133789]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 10.0, 13.0, 18.0, 15.0, 12.0, 14.0, 14.0, 30.0, 30.0, 34.0, 39.0, 47.0, 90.0, 140.0, 90.0, 58.0, 42.0, 32.0, 39.0, 23.0, 25.0, 11.0, 21.0, 16.0, 17.0, 14.0, 6.0, 9.0, 7.0, 10.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.924737930297852, -8.6578950881958, -8.39105224609375, -8.1242094039917, -7.857367038726807, -7.590524196624756, -7.323681354522705, -7.056838512420654, -6.789996147155762, -6.523153305053711, -6.25631046295166, -5.989467620849609, -5.722625255584717, -5.455782413482666, -5.188939571380615, -4.9220967292785645, -4.655253887176514, -4.388411045074463, -4.121568202972412, -3.8547255992889404, -3.5878829956054688, -3.321040153503418, -3.054197311401367, -2.7873544692993164, -2.5205118656158447, -2.253669023513794, -1.9868264198303223, -1.7199835777282715, -1.4531408548355103, -1.186298131942749, -0.9194552898406982, -0.652612566947937, -0.3857698440551758, -0.11892709136009216, 0.14791566133499146, 0.41475844383239746, 0.6816011667251587, 0.9484438896179199, 1.2152867317199707, 1.482129454612732, 1.7489721775054932, 2.015815019607544, 2.2826576232910156, 2.5495004653930664, 2.816343307495117, 3.083185911178589, 3.3500287532806396, 3.6168713569641113, 3.883714199066162, 4.150557041168213, 4.417399883270264, 4.684242248535156, 4.951085090637207, 5.217927932739258, 5.484770774841309, 5.751613616943359, 6.01845645904541, 6.285299301147461, 6.552142143249512, 6.8189849853515625, 7.085827350616455, 7.352670192718506, 7.619513034820557, 7.886355876922607, 8.1531982421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 6.0, 11.0, 12.0, 12.0, 29.0, 27.0, 30.0, 70.0, 134.0, 234.0, 406.0, 887.0, 2009.0, 5197.0, 17682.0, 97352.0, 955745.0, 2592758.0, 452376.0, 51312.0, 11485.0, 3669.0, 1398.0, 662.0, 331.0, 170.0, 98.0, 60.0, 48.0, 26.0, 11.0, 13.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.650390625, -1.602325439453125, -1.55426025390625, -1.506195068359375, -1.4581298828125, -1.410064697265625, -1.36199951171875, -1.313934326171875, -1.265869140625, -1.217803955078125, -1.16973876953125, -1.121673583984375, -1.0736083984375, -1.025543212890625, -0.97747802734375, -0.929412841796875, -0.88134765625, -0.833282470703125, -0.78521728515625, -0.737152099609375, -0.6890869140625, -0.641021728515625, -0.59295654296875, -0.544891357421875, -0.496826171875, -0.448760986328125, -0.40069580078125, -0.352630615234375, -0.3045654296875, -0.256500244140625, -0.20843505859375, -0.160369873046875, -0.1123046875, -0.064239501953125, -0.01617431640625, 0.031890869140625, 0.0799560546875, 0.128021240234375, 0.17608642578125, 0.224151611328125, 0.272216796875, 0.320281982421875, 0.36834716796875, 0.416412353515625, 0.4644775390625, 0.512542724609375, 0.56060791015625, 0.608673095703125, 0.65673828125, 0.704803466796875, 0.75286865234375, 0.800933837890625, 0.8489990234375, 0.897064208984375, 0.94512939453125, 0.993194580078125, 1.041259765625, 1.089324951171875, 1.13739013671875, 1.185455322265625, 1.2335205078125, 1.281585693359375, 1.32965087890625, 1.377716064453125, 1.42578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 5.0, 12.0, 14.0, 15.0, 13.0, 40.0, 24.0, 26.0, 32.0, 30.0, 33.0, 43.0, 42.0, 37.0, 47.0, 49.0, 49.0, 52.0, 40.0, 40.0, 44.0, 52.0, 29.0, 35.0, 25.0, 24.0, 27.0, 21.0, 17.0, 11.0, 14.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.490966796875, -0.4728431701660156, -0.45471954345703125, -0.4365959167480469, -0.4184722900390625, -0.4003486633300781, -0.38222503662109375, -0.3641014099121094, -0.345977783203125, -0.3278541564941406, -0.30973052978515625, -0.2916069030761719, -0.2734832763671875, -0.2553596496582031, -0.23723602294921875, -0.21911239624023438, -0.20098876953125, -0.18286514282226562, -0.16474151611328125, -0.14661788940429688, -0.1284942626953125, -0.11037063598632812, -0.09224700927734375, -0.07412338256835938, -0.055999755859375, -0.037876129150390625, -0.01975250244140625, -0.001628875732421875, 0.0164947509765625, 0.034618377685546875, 0.05274200439453125, 0.07086563110351562, 0.0889892578125, 0.10711288452148438, 0.12523651123046875, 0.14336013793945312, 0.1614837646484375, 0.17960739135742188, 0.19773101806640625, 0.21585464477539062, 0.233978271484375, 0.2521018981933594, 0.27022552490234375, 0.2883491516113281, 0.3064727783203125, 0.3245964050292969, 0.34272003173828125, 0.3608436584472656, 0.37896728515625, 0.3970909118652344, 0.41521453857421875, 0.4333381652832031, 0.4514617919921875, 0.4695854187011719, 0.48770904541015625, 0.5058326721191406, 0.523956298828125, 0.5420799255371094, 0.5602035522460938, 0.5783271789550781, 0.5964508056640625, 0.6145744323730469, 0.6326980590820312, 0.6508216857910156, 0.6689453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 10.0, 13.0, 15.0, 14.0, 36.0, 41.0, 44.0, 53.0, 110.0, 159.0, 229.0, 416.0, 749.0, 1570.0, 3829.0, 13870.0, 140130.0, 3774932.0, 231894.0, 17804.0, 4503.0, 1788.0, 835.0, 459.0, 269.0, 157.0, 99.0, 55.0, 49.0, 31.0, 34.0, 10.0, 19.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.626800537109375, -2.53485107421875, -2.442901611328125, -2.3509521484375, -2.259002685546875, -2.16705322265625, -2.075103759765625, -1.983154296875, -1.891204833984375, -1.79925537109375, -1.707305908203125, -1.6153564453125, -1.523406982421875, -1.43145751953125, -1.339508056640625, -1.24755859375, -1.155609130859375, -1.06365966796875, -0.971710205078125, -0.8797607421875, -0.787811279296875, -0.69586181640625, -0.603912353515625, -0.511962890625, -0.420013427734375, -0.32806396484375, -0.236114501953125, -0.1441650390625, -0.052215576171875, 0.03973388671875, 0.131683349609375, 0.2236328125, 0.315582275390625, 0.40753173828125, 0.499481201171875, 0.5914306640625, 0.683380126953125, 0.77532958984375, 0.867279052734375, 0.959228515625, 1.051177978515625, 1.14312744140625, 1.235076904296875, 1.3270263671875, 1.418975830078125, 1.51092529296875, 1.602874755859375, 1.69482421875, 1.786773681640625, 1.87872314453125, 1.970672607421875, 2.0626220703125, 2.154571533203125, 2.24652099609375, 2.338470458984375, 2.430419921875, 2.522369384765625, 2.61431884765625, 2.706268310546875, 2.7982177734375, 2.890167236328125, 2.98211669921875, 3.074066162109375, 3.166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 10.0, 23.0, 29.0, 32.0, 40.0, 70.0, 100.0, 114.0, 192.0, 248.0, 433.0, 536.0, 587.0, 455.0, 311.0, 259.0, 166.0, 129.0, 85.0, 56.0, 41.0, 29.0, 27.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.112213134765625, -2.04669189453125, -1.981170654296875, -1.9156494140625, -1.850128173828125, -1.78460693359375, -1.719085693359375, -1.653564453125, -1.588043212890625, -1.52252197265625, -1.457000732421875, -1.3914794921875, -1.325958251953125, -1.26043701171875, -1.194915771484375, -1.12939453125, -1.063873291015625, -0.99835205078125, -0.932830810546875, -0.8673095703125, -0.801788330078125, -0.73626708984375, -0.670745849609375, -0.605224609375, -0.539703369140625, -0.47418212890625, -0.408660888671875, -0.3431396484375, -0.277618408203125, -0.21209716796875, -0.146575927734375, -0.0810546875, -0.015533447265625, 0.04998779296875, 0.115509033203125, 0.1810302734375, 0.246551513671875, 0.31207275390625, 0.377593994140625, 0.443115234375, 0.508636474609375, 0.57415771484375, 0.639678955078125, 0.7052001953125, 0.770721435546875, 0.83624267578125, 0.901763916015625, 0.96728515625, 1.032806396484375, 1.09832763671875, 1.163848876953125, 1.2293701171875, 1.294891357421875, 1.36041259765625, 1.425933837890625, 1.491455078125, 1.556976318359375, 1.62249755859375, 1.688018798828125, 1.7535400390625, 1.819061279296875, 1.88458251953125, 1.950103759765625, 2.015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 5.0, 14.0, 11.0, 23.0, 36.0, 114.0, 199.0, 250.0, 173.0, 83.0, 45.0, 17.0, 11.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.30022430419922, -42.137691497802734, -40.97515869140625, -39.8126220703125, -38.650089263916016, -37.48755645751953, -36.32502365112305, -35.16249084472656, -33.99995422363281, -32.83742141723633, -31.67488670349121, -30.512353897094727, -29.34981918334961, -28.187286376953125, -27.02475357055664, -25.862220764160156, -24.699687957763672, -23.537155151367188, -22.37462043762207, -21.212087631225586, -20.04955291748047, -18.887020111083984, -17.7244873046875, -16.561954498291016, -15.399419784545898, -14.236886024475098, -13.074352264404297, -11.911819458007812, -10.749285697937012, -9.586751937866211, -8.424219131469727, -7.261685371398926, -6.099153518676758, -4.936619758605957, -3.7740864753723145, -2.6115529537200928, -1.449019432067871, -0.2864856719970703, 0.8760476112365723, 2.038580894470215, 3.2011146545410156, 4.363648414611816, 5.526181697845459, 6.688714981079102, 7.851248741149902, 9.013782501220703, 10.176315307617188, 11.338849067687988, 12.501382827758789, 13.66391658782959, 14.82645034790039, 15.988983154296875, 17.15151596069336, 18.314050674438477, 19.47658348083496, 20.639118194580078, 21.801651000976562, 22.964183807373047, 24.126718521118164, 25.28925132751465, 26.451786041259766, 27.61431884765625, 28.776851654052734, 29.93938446044922, 31.101919174194336]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 10.0, 11.0, 22.0, 15.0, 17.0, 30.0, 26.0, 29.0, 36.0, 44.0, 38.0, 53.0, 61.0, 57.0, 72.0, 65.0, 47.0, 47.0, 40.0, 42.0, 28.0, 39.0, 35.0, 26.0, 20.0, 15.0, 10.0, 13.0, 5.0, 6.0, 6.0, 11.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.77409839630127, -12.343695640563965, -11.91329288482666, -11.482890129089355, -11.05248737335205, -10.622084617614746, -10.191682815551758, -9.761280059814453, -9.330877304077148, -8.900474548339844, -8.470071792602539, -8.039669036865234, -7.60926628112793, -7.178863525390625, -6.7484612464904785, -6.318058490753174, -5.887655258178711, -5.457252502441406, -5.026849746704102, -4.596446990966797, -4.166044235229492, -3.7356417179107666, -3.305239200592041, -2.8748364448547363, -2.4444336891174316, -2.014030933380127, -1.5836282968521118, -1.1532256603240967, -0.722822904586792, -0.2924201488494873, 0.13798236846923828, 0.568385124206543, 0.9987869262695312, 1.429189682006836, 1.859592318534851, 2.289994955062866, 2.720397710800171, 3.1508004665374756, 3.581202983856201, 4.011605739593506, 4.4420084953308105, 4.872411251068115, 5.30281400680542, 5.733216285705566, 6.163619041442871, 6.594021797180176, 7.0244245529174805, 7.454827308654785, 7.88523006439209, 8.315632820129395, 8.7460355758667, 9.176438331604004, 9.606841087341309, 10.037243843078613, 10.467645645141602, 10.898048400878906, 11.328451156616211, 11.758853912353516, 12.18925666809082, 12.619659423828125, 13.05006217956543, 13.480464935302734, 13.910867691040039, 14.341270446777344, 14.771673202514648]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 16.0, 23.0, 25.0, 30.0, 59.0, 76.0, 100.0, 185.0, 321.0, 569.0, 1166.0, 2374.0, 5474.0, 15660.0, 52034.0, 274125.0, 571678.0, 87291.0, 23000.0, 7988.0, 3136.0, 1485.0, 746.0, 332.0, 217.0, 131.0, 76.0, 76.0, 48.0, 34.0, 13.0, 8.0, 11.0, 6.0, 3.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.240234375, -1.201690673828125, -1.16314697265625, -1.124603271484375, -1.0860595703125, -1.047515869140625, -1.00897216796875, -0.970428466796875, -0.931884765625, -0.893341064453125, -0.85479736328125, -0.816253662109375, -0.7777099609375, -0.739166259765625, -0.70062255859375, -0.662078857421875, -0.62353515625, -0.584991455078125, -0.54644775390625, -0.507904052734375, -0.4693603515625, -0.430816650390625, -0.39227294921875, -0.353729248046875, -0.315185546875, -0.276641845703125, -0.23809814453125, -0.199554443359375, -0.1610107421875, -0.122467041015625, -0.08392333984375, -0.045379638671875, -0.0068359375, 0.031707763671875, 0.07025146484375, 0.108795166015625, 0.1473388671875, 0.185882568359375, 0.22442626953125, 0.262969970703125, 0.301513671875, 0.340057373046875, 0.37860107421875, 0.417144775390625, 0.4556884765625, 0.494232177734375, 0.53277587890625, 0.571319580078125, 0.60986328125, 0.648406982421875, 0.68695068359375, 0.725494384765625, 0.7640380859375, 0.802581787109375, 0.84112548828125, 0.879669189453125, 0.918212890625, 0.956756591796875, 0.99530029296875, 1.033843994140625, 1.0723876953125, 1.110931396484375, 1.14947509765625, 1.188018798828125, 1.2265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 15.0, 15.0, 29.0, 33.0, 47.0, 42.0, 60.0, 44.0, 80.0, 68.0, 78.0, 71.0, 69.0, 74.0, 48.0, 44.0, 35.0, 34.0, 31.0, 22.0, 17.0, 12.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7572479248046875, -0.722503662109375, -0.6877593994140625, -0.65301513671875, -0.6182708740234375, -0.583526611328125, -0.5487823486328125, -0.5140380859375, -0.4792938232421875, -0.444549560546875, -0.4098052978515625, -0.37506103515625, -0.3403167724609375, -0.305572509765625, -0.2708282470703125, -0.236083984375, -0.2013397216796875, -0.166595458984375, -0.1318511962890625, -0.09710693359375, -0.0623626708984375, -0.027618408203125, 0.0071258544921875, 0.0418701171875, 0.0766143798828125, 0.111358642578125, 0.1461029052734375, 0.18084716796875, 0.2155914306640625, 0.250335693359375, 0.2850799560546875, 0.31982421875, 0.3545684814453125, 0.389312744140625, 0.4240570068359375, 0.45880126953125, 0.4935455322265625, 0.528289794921875, 0.5630340576171875, 0.5977783203125, 0.6325225830078125, 0.667266845703125, 0.7020111083984375, 0.73675537109375, 0.7714996337890625, 0.806243896484375, 0.8409881591796875, 0.875732421875, 0.9104766845703125, 0.945220947265625, 0.9799652099609375, 1.01470947265625, 1.0494537353515625, 1.084197998046875, 1.1189422607421875, 1.1536865234375, 1.1884307861328125, 1.223175048828125, 1.2579193115234375, 1.29266357421875, 1.3274078369140625, 1.362152099609375, 1.3968963623046875, 1.431640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 23.0, 36.0, 52.0, 86.0, 122.0, 156.0, 265.0, 373.0, 771.0, 1859.0, 6833.0, 49896.0, 891703.0, 82467.0, 9460.0, 2259.0, 862.0, 450.0, 269.0, 178.0, 106.0, 68.0, 48.0, 36.0, 32.0, 15.0, 15.0, 5.0, 12.0, 5.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5478515625, -1.5017852783203125, -1.455718994140625, -1.4096527099609375, -1.36358642578125, -1.3175201416015625, -1.271453857421875, -1.2253875732421875, -1.1793212890625, -1.1332550048828125, -1.087188720703125, -1.0411224365234375, -0.99505615234375, -0.9489898681640625, -0.902923583984375, -0.8568572998046875, -0.810791015625, -0.7647247314453125, -0.718658447265625, -0.6725921630859375, -0.62652587890625, -0.5804595947265625, -0.534393310546875, -0.4883270263671875, -0.4422607421875, -0.3961944580078125, -0.350128173828125, -0.3040618896484375, -0.25799560546875, -0.2119293212890625, -0.165863037109375, -0.1197967529296875, -0.07373046875, -0.0276641845703125, 0.018402099609375, 0.0644683837890625, 0.11053466796875, 0.1566009521484375, 0.202667236328125, 0.2487335205078125, 0.2947998046875, 0.3408660888671875, 0.386932373046875, 0.4329986572265625, 0.47906494140625, 0.5251312255859375, 0.571197509765625, 0.6172637939453125, 0.663330078125, 0.7093963623046875, 0.755462646484375, 0.8015289306640625, 0.84759521484375, 0.8936614990234375, 0.939727783203125, 0.9857940673828125, 1.0318603515625, 1.0779266357421875, 1.123992919921875, 1.1700592041015625, 1.21612548828125, 1.2621917724609375, 1.308258056640625, 1.3543243408203125, 1.400390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 10.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 15.0, 19.0, 21.0, 29.0, 28.0, 56.0, 54.0, 58.0, 62.0, 80.0, 59.0, 68.0, 64.0, 52.0, 40.0, 33.0, 34.0, 12.0, 21.0, 20.0, 19.0, 20.0, 8.0, 10.0, 9.0, 6.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.49609375, -2.41912841796875, -2.3421630859375, -2.26519775390625, -2.188232421875, -2.11126708984375, -2.0343017578125, -1.95733642578125, -1.88037109375, -1.80340576171875, -1.7264404296875, -1.64947509765625, -1.572509765625, -1.49554443359375, -1.4185791015625, -1.34161376953125, -1.2646484375, -1.18768310546875, -1.1107177734375, -1.03375244140625, -0.956787109375, -0.87982177734375, -0.8028564453125, -0.72589111328125, -0.64892578125, -0.57196044921875, -0.4949951171875, -0.41802978515625, -0.341064453125, -0.26409912109375, -0.1871337890625, -0.11016845703125, -0.033203125, 0.04376220703125, 0.1207275390625, 0.19769287109375, 0.274658203125, 0.35162353515625, 0.4285888671875, 0.50555419921875, 0.58251953125, 0.65948486328125, 0.7364501953125, 0.81341552734375, 0.890380859375, 0.96734619140625, 1.0443115234375, 1.12127685546875, 1.1982421875, 1.27520751953125, 1.3521728515625, 1.42913818359375, 1.506103515625, 1.58306884765625, 1.6600341796875, 1.73699951171875, 1.81396484375, 1.89093017578125, 1.9678955078125, 2.04486083984375, 2.121826171875, 2.19879150390625, 2.2757568359375, 2.35272216796875, 2.4296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 9.0, 11.0, 19.0, 29.0, 38.0, 53.0, 92.0, 157.0, 268.0, 520.0, 1216.0, 3597.0, 14236.0, 183021.0, 817976.0, 19849.0, 4517.0, 1501.0, 653.0, 308.0, 171.0, 89.0, 66.0, 37.0, 31.0, 25.0, 16.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.37534332275390625, -0.3649444580078125, -0.35454559326171875, -0.344146728515625, -0.33374786376953125, -0.3233489990234375, -0.31295013427734375, -0.30255126953125, -0.29215240478515625, -0.2817535400390625, -0.27135467529296875, -0.260955810546875, -0.25055694580078125, -0.2401580810546875, -0.22975921630859375, -0.2193603515625, -0.20896148681640625, -0.1985626220703125, -0.18816375732421875, -0.177764892578125, -0.16736602783203125, -0.1569671630859375, -0.14656829833984375, -0.13616943359375, -0.12577056884765625, -0.1153717041015625, -0.10497283935546875, -0.094573974609375, -0.08417510986328125, -0.0737762451171875, -0.06337738037109375, -0.052978515625, -0.04257965087890625, -0.0321807861328125, -0.02178192138671875, -0.011383056640625, -0.00098419189453125, 0.0094146728515625, 0.01981353759765625, 0.03021240234375, 0.04061126708984375, 0.0510101318359375, 0.06140899658203125, 0.071807861328125, 0.08220672607421875, 0.0926055908203125, 0.10300445556640625, 0.1134033203125, 0.12380218505859375, 0.1342010498046875, 0.14459991455078125, 0.154998779296875, 0.16539764404296875, 0.1757965087890625, 0.18619537353515625, 0.19659423828125, 0.20699310302734375, 0.2173919677734375, 0.22779083251953125, 0.238189697265625, 0.24858856201171875, 0.2589874267578125, 0.26938629150390625, 0.27978515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 7.0, 7.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 110.0, 146.0, 154.0, 155.0, 67.0, 39.0, 37.0, 24.0, 19.0, 10.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.636713027954102e-05, -8.399225771427155e-05, -8.161738514900208e-05, -7.92425125837326e-05, -7.686764001846313e-05, -7.449276745319366e-05, -7.21178948879242e-05, -6.974302232265472e-05, -6.736814975738525e-05, -6.499327719211578e-05, -6.261840462684631e-05, -6.024353206157684e-05, -5.786865949630737e-05, -5.54937869310379e-05, -5.311891436576843e-05, -5.074404180049896e-05, -4.836916923522949e-05, -4.599429666996002e-05, -4.361942410469055e-05, -4.124455153942108e-05, -3.886967897415161e-05, -3.649480640888214e-05, -3.411993384361267e-05, -3.17450612783432e-05, -2.937018871307373e-05, -2.699531614780426e-05, -2.462044358253479e-05, -2.224557101726532e-05, -1.987069845199585e-05, -1.749582588672638e-05, -1.512095332145691e-05, -1.2746080756187439e-05, -1.0371208190917969e-05, -7.996335625648499e-06, -5.621463060379028e-06, -3.246590495109558e-06, -8.717179298400879e-07, 1.5031546354293823e-06, 3.8780272006988525e-06, 6.252899765968323e-06, 8.627772331237793e-06, 1.1002644896507263e-05, 1.3377517461776733e-05, 1.5752390027046204e-05, 1.8127262592315674e-05, 2.0502135157585144e-05, 2.2877007722854614e-05, 2.5251880288124084e-05, 2.7626752853393555e-05, 3.0001625418663025e-05, 3.2376497983932495e-05, 3.4751370549201965e-05, 3.7126243114471436e-05, 3.9501115679740906e-05, 4.1875988245010376e-05, 4.4250860810279846e-05, 4.6625733375549316e-05, 4.900060594081879e-05, 5.137547850608826e-05, 5.375035107135773e-05, 5.61252236366272e-05, 5.850009620189667e-05, 6.087496876716614e-05, 6.324984133243561e-05, 6.562471389770508e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 21.0, 26.0, 23.0, 47.0, 67.0, 101.0, 157.0, 264.0, 418.0, 764.0, 1378.0, 2775.0, 6157.0, 16501.0, 63245.0, 809634.0, 108661.0, 22977.0, 7930.0, 3522.0, 1631.0, 885.0, 500.0, 282.0, 162.0, 114.0, 77.0, 62.0, 49.0, 32.0, 21.0, 13.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.19930648803710938, -0.19280242919921875, -0.18629837036132812, -0.1797943115234375, -0.17329025268554688, -0.16678619384765625, -0.16028213500976562, -0.153778076171875, -0.14727401733398438, -0.14076995849609375, -0.13426589965820312, -0.1277618408203125, -0.12125778198242188, -0.11475372314453125, -0.10824966430664062, -0.10174560546875, -0.09524154663085938, -0.08873748779296875, -0.08223342895507812, -0.0757293701171875, -0.06922531127929688, -0.06272125244140625, -0.056217193603515625, -0.049713134765625, -0.043209075927734375, -0.03670501708984375, -0.030200958251953125, -0.0236968994140625, -0.017192840576171875, -0.01068878173828125, -0.004184722900390625, 0.0023193359375, 0.008823394775390625, 0.01532745361328125, 0.021831512451171875, 0.0283355712890625, 0.034839630126953125, 0.04134368896484375, 0.047847747802734375, 0.054351806640625, 0.060855865478515625, 0.06735992431640625, 0.07386398315429688, 0.0803680419921875, 0.08687210083007812, 0.09337615966796875, 0.09988021850585938, 0.10638427734375, 0.11288833618164062, 0.11939239501953125, 0.12589645385742188, 0.1324005126953125, 0.13890457153320312, 0.14540863037109375, 0.15191268920898438, 0.158416748046875, 0.16492080688476562, 0.17142486572265625, 0.17792892456054688, 0.1844329833984375, 0.19093704223632812, 0.19744110107421875, 0.20394515991210938, 0.21044921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 2.0, 5.0, 7.0, 6.0, 14.0, 25.0, 11.0, 18.0, 27.0, 50.0, 76.0, 140.0, 156.0, 141.0, 86.0, 57.0, 40.0, 20.0, 20.0, 16.0, 23.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.339599609375, -0.33008575439453125, -0.3205718994140625, -0.31105804443359375, -0.301544189453125, -0.29203033447265625, -0.2825164794921875, -0.27300262451171875, -0.26348876953125, -0.25397491455078125, -0.2444610595703125, -0.23494720458984375, -0.225433349609375, -0.21591949462890625, -0.2064056396484375, -0.19689178466796875, -0.1873779296875, -0.17786407470703125, -0.1683502197265625, -0.15883636474609375, -0.149322509765625, -0.13980865478515625, -0.1302947998046875, -0.12078094482421875, -0.11126708984375, -0.10175323486328125, -0.0922393798828125, -0.08272552490234375, -0.073211669921875, -0.06369781494140625, -0.0541839599609375, -0.04467010498046875, -0.03515625, -0.02564239501953125, -0.0161285400390625, -0.00661468505859375, 0.002899169921875, 0.01241302490234375, 0.0219268798828125, 0.03144073486328125, 0.04095458984375, 0.05046844482421875, 0.0599822998046875, 0.06949615478515625, 0.079010009765625, 0.08852386474609375, 0.0980377197265625, 0.10755157470703125, 0.1170654296875, 0.12657928466796875, 0.1360931396484375, 0.14560699462890625, 0.155120849609375, 0.16463470458984375, 0.1741485595703125, 0.18366241455078125, 0.19317626953125, 0.20269012451171875, 0.2122039794921875, 0.22171783447265625, 0.231231689453125, 0.24074554443359375, 0.2502593994140625, 0.25977325439453125, 0.269287109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 11.0, 20.0, 23.0, 43.0, 64.0, 129.0, 482.0, 103.0, 50.0, 18.0, 14.0, 8.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.590933799743652, -12.262884140014648, -11.934834480285645, -11.606783866882324, -11.27873420715332, -10.950684547424316, -10.622634887695312, -10.294585227966309, -9.966535568237305, -9.6384859085083, -9.310436248779297, -8.982385635375977, -8.654335975646973, -8.326286315917969, -7.998236656188965, -7.670186996459961, -7.342136383056641, -7.014086723327637, -6.686036586761475, -6.357986927032471, -6.029936790466309, -5.701887130737305, -5.373837471008301, -5.045787811279297, -4.717737674713135, -4.389688014984131, -4.061637878417969, -3.733588218688965, -3.405538320541382, -3.077488422393799, -2.749438762664795, -2.421388864517212, -2.0933399200439453, -1.7652900218963623, -1.4372402429580688, -1.1091904640197754, -0.7811405658721924, -0.4530906677246094, -0.12504088878631592, 0.20300889015197754, 0.5310587882995605, 0.8591086268424988, 1.187158465385437, 1.5152082443237305, 1.8432581424713135, 2.1713080406188965, 2.4993577003479004, 2.8274075984954834, 3.1554574966430664, 3.4835073947906494, 3.8115572929382324, 4.139606952667236, 4.467657089233398, 4.795706748962402, 5.123756408691406, 5.45180606842041, 5.779856204986572, 6.107905864715576, 6.435956001281738, 6.764005661010742, 7.092055320739746, 7.420105457305908, 7.748155117034912, 8.076205253601074, 8.404254913330078]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 12.0, 12.0, 13.0, 16.0, 16.0, 21.0, 15.0, 27.0, 24.0, 24.0, 43.0, 185.0, 256.0, 54.0, 34.0, 19.0, 34.0, 25.0, 21.0, 18.0, 12.0, 13.0, 11.0, 8.0, 10.0, 9.0, 2.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.607936859130859, -7.3912434577941895, -7.1745500564575195, -6.95785665512085, -6.74116325378418, -6.52446985244751, -6.30777645111084, -6.091082572937012, -5.8743896484375, -5.65769624710083, -5.44100284576416, -5.22430944442749, -5.00761604309082, -4.79092264175415, -4.5742292404174805, -4.357535362243652, -4.140841960906982, -3.9241485595703125, -3.7074551582336426, -3.4907617568969727, -3.2740683555603027, -3.057374954223633, -2.840681314468384, -2.623987913131714, -2.407294511795044, -2.190601110458374, -1.973907709121704, -1.7572141885757446, -1.5405207872390747, -1.3238273859024048, -1.1071338653564453, -0.8904404640197754, -0.6737470626831055, -0.45705363154411316, -0.24036020040512085, -0.023666739463806152, 0.19302666187286377, 0.4097200632095337, 0.6264135837554932, 0.8431069850921631, 1.059800386428833, 1.276493787765503, 1.4931871891021729, 1.7098807096481323, 1.9265741109848022, 2.1432676315307617, 2.3599610328674316, 2.5766544342041016, 2.7933478355407715, 3.0100412368774414, 3.2267346382141113, 3.4434280395507812, 3.660121440887451, 3.876814842224121, 4.093508720397949, 4.310201644897461, 4.526895523071289, 4.743588924407959, 4.960282325744629, 5.176975727081299, 5.393669128417969, 5.610362529754639, 5.827055931091309, 6.043749809265137, 6.260442733764648]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 6.0, 8.0, 17.0, 19.0, 32.0, 38.0, 42.0, 43.0, 55.0, 139.0, 254.0, 67.0, 46.0, 43.0, 28.0, 24.0, 22.0, 25.0, 17.0, 17.0, 9.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.891357421875, -0.86279296875, -0.834228515625, -0.8056640625, -0.777099609375, -0.74853515625, -0.719970703125, -0.69140625, -0.662841796875, -0.63427734375, -0.605712890625, -0.5771484375, -0.548583984375, -0.52001953125, -0.491455078125, -0.462890625, -0.434326171875, -0.40576171875, -0.377197265625, -0.3486328125, -0.320068359375, -0.29150390625, -0.262939453125, -0.234375, -0.205810546875, -0.17724609375, -0.148681640625, -0.1201171875, -0.091552734375, -0.06298828125, -0.034423828125, -0.005859375, 0.022705078125, 0.05126953125, 0.079833984375, 0.1083984375, 0.136962890625, 0.16552734375, 0.194091796875, 0.22265625, 0.251220703125, 0.27978515625, 0.308349609375, 0.3369140625, 0.365478515625, 0.39404296875, 0.422607421875, 0.451171875, 0.479736328125, 0.50830078125, 0.536865234375, 0.5654296875, 0.593994140625, 0.62255859375, 0.651123046875, 0.6796875, 0.708251953125, 0.73681640625, 0.765380859375, 0.7939453125, 0.822509765625, 0.85107421875, 0.879638671875, 0.908203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 10.0, 11.0, 13.0, 17.0, 22.0, 23.0, 48.0, 98.0, 222.0, 628.0, 2842.0, 32289.0, 8343188.0, 7162.0, 1235.0, 369.0, 147.0, 86.0, 42.0, 33.0, 12.0, 11.0, 14.0, 16.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-10.011630058288574, -9.680545806884766, -9.34946060180664, -9.018376350402832, -8.687292098999023, -8.356207847595215, -8.025123596191406, -7.694038391113281, -7.362954139709473, -7.031869888305664, -6.700785160064697, -6.3697004318237305, -6.038616180419922, -5.707531929016113, -5.3764472007751465, -5.04536247253418, -4.714278221130371, -4.3831939697265625, -4.052109241485596, -3.721024751663208, -3.3899402618408203, -3.0588557720184326, -2.727771282196045, -2.3966867923736572, -2.0656023025512695, -1.7345178127288818, -1.4034333229064941, -1.0723488330841064, -0.7412643432617188, -0.41017985343933105, -0.07909536361694336, 0.25198912620544434, 0.5830726623535156, 0.9141571521759033, 1.245241641998291, 1.5763261318206787, 1.9074106216430664, 2.238495111465454, 2.569579601287842, 2.9006640911102295, 3.231748580932617, 3.562833070755005, 3.8939175605773926, 4.225002288818359, 4.556086540222168, 4.887170791625977, 5.218255519866943, 5.54934024810791, 5.880424499511719, 6.211508750915527, 6.542593479156494, 6.873678207397461, 7.2047624588012695, 7.535846710205078, 7.866931438446045, 8.198016166687012, 8.52910041809082, 8.860184669494629, 9.191268920898438, 9.522354125976562, 9.853438377380371, 10.18452262878418, 10.515607833862305, 10.846692085266113, 11.177776336669922]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 11.0, 5.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.871780395507812, -14.41817569732666, -13.964570999145508, -13.510966300964355, -13.057361602783203, -12.60375690460205, -12.150152206420898, -11.696547508239746, -11.242942810058594, -10.789338111877441, -10.335733413696289, -9.882128715515137, -9.428524017333984, -8.974919319152832, -8.52131462097168, -8.067709922790527, -7.614105224609375, -7.160500526428223, -6.70689582824707, -6.253291130065918, -5.799686431884766, -5.346081733703613, -4.892477035522461, -4.438872337341309, -3.9852676391601562, -3.531662940979004, -3.0780582427978516, -2.624453544616699, -2.170848846435547, -1.7172441482543945, -1.2636394500732422, -0.8100347518920898, -0.3564291000366211, 0.09717559814453125, 0.5507802963256836, 1.004384994506836, 1.4579896926879883, 1.9115943908691406, 2.365199089050293, 2.8188037872314453, 3.2724084854125977, 3.72601318359375, 4.179617881774902, 4.633222579956055, 5.086827278137207, 5.540431976318359, 5.994036674499512, 6.447641372680664, 6.901246070861816, 7.354850769042969, 7.808455467224121, 8.262060165405273, 8.715664863586426, 9.169269561767578, 9.62287425994873, 10.076478958129883, 10.530083656311035, 10.983688354492188, 11.43729305267334, 11.890897750854492, 12.344502449035645, 12.798107147216797, 13.25171184539795, 13.705316543579102, 14.158921241760254]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 18.0, 16.0, 21.0, 34.0, 54.0, 71.0, 75.0, 121.0, 153.0, 232.0, 387.0, 679.0, 1330.0, 3075.0, 8772.0, 26407.0, 85508.0, 208518.0, 127887.0, 40188.0, 12588.0, 4308.0, 1657.0, 759.0, 383.0, 265.0, 188.0, 132.0, 101.0, 65.0, 52.0, 40.0, 35.0, 34.0, 26.0, 19.0, 9.0, 13.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4296875, -6.2200927734375, -6.010498046875, -5.8009033203125, -5.59130859375, -5.3817138671875, -5.172119140625, -4.9625244140625, -4.7529296875, -4.5433349609375, -4.333740234375, -4.1241455078125, -3.91455078125, -3.7049560546875, -3.495361328125, -3.2857666015625, -3.076171875, -2.8665771484375, -2.656982421875, -2.4473876953125, -2.23779296875, -2.0281982421875, -1.818603515625, -1.6090087890625, -1.3994140625, -1.1898193359375, -0.980224609375, -0.7706298828125, -0.56103515625, -0.3514404296875, -0.141845703125, 0.0677490234375, 0.27734375, 0.4869384765625, 0.696533203125, 0.9061279296875, 1.11572265625, 1.3253173828125, 1.534912109375, 1.7445068359375, 1.9541015625, 2.1636962890625, 2.373291015625, 2.5828857421875, 2.79248046875, 3.0020751953125, 3.211669921875, 3.4212646484375, 3.630859375, 3.8404541015625, 4.050048828125, 4.2596435546875, 4.46923828125, 4.6788330078125, 4.888427734375, 5.0980224609375, 5.3076171875, 5.5172119140625, 5.726806640625, 5.9364013671875, 6.14599609375, 6.3555908203125, 6.565185546875, 6.7747802734375, 6.984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 14.0, 18.0, 20.0, 28.0, 45.0, 43.0, 64.0, 92.0, 98.0, 105.0, 87.0, 93.0, 60.0, 53.0, 74.0, 30.0, 15.0, 25.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8467559814453125, -0.807769775390625, -0.7687835693359375, -0.72979736328125, -0.6908111572265625, -0.651824951171875, -0.6128387451171875, -0.5738525390625, -0.5348663330078125, -0.495880126953125, -0.4568939208984375, -0.41790771484375, -0.3789215087890625, -0.339935302734375, -0.3009490966796875, -0.261962890625, -0.2229766845703125, -0.183990478515625, -0.1450042724609375, -0.10601806640625, -0.0670318603515625, -0.028045654296875, 0.0109405517578125, 0.0499267578125, 0.0889129638671875, 0.127899169921875, 0.1668853759765625, 0.20587158203125, 0.2448577880859375, 0.283843994140625, 0.3228302001953125, 0.36181640625, 0.4008026123046875, 0.439788818359375, 0.4787750244140625, 0.51776123046875, 0.5567474365234375, 0.595733642578125, 0.6347198486328125, 0.6737060546875, 0.7126922607421875, 0.751678466796875, 0.7906646728515625, 0.82965087890625, 0.8686370849609375, 0.907623291015625, 0.9466094970703125, 0.985595703125, 1.0245819091796875, 1.063568115234375, 1.1025543212890625, 1.14154052734375, 1.1805267333984375, 1.219512939453125, 1.2584991455078125, 1.2974853515625, 1.3364715576171875, 1.375457763671875, 1.4144439697265625, 1.45343017578125, 1.4924163818359375, 1.531402587890625, 1.5703887939453125, 1.609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 12.0, 8.0, 24.0, 35.0, 54.0, 77.0, 71.0, 68.0, 59.0, 34.0, 13.0, 15.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21453857421875, -7.9825663566589355, -7.750594139099121, -7.518621921539307, -7.286649703979492, -7.054677486419678, -6.822705268859863, -6.590733051300049, -6.358760833740234, -6.12678861618042, -5.8948163986206055, -5.662844181060791, -5.430871963500977, -5.198899745941162, -4.966927528381348, -4.734955310821533, -4.502983093261719, -4.271010875701904, -4.03903865814209, -3.8070664405822754, -3.575094223022461, -3.3431220054626465, -3.111149787902832, -2.8791775703430176, -2.647205352783203, -2.4152331352233887, -2.183260917663574, -1.9512887001037598, -1.7193164825439453, -1.4873442649841309, -1.2553720474243164, -1.023399829864502, -0.7914276123046875, -0.559455394744873, -0.3274831771850586, -0.09551095962524414, 0.1364612579345703, 0.36843347549438477, 0.6004056930541992, 0.8323779106140137, 1.0643501281738281, 1.2963223457336426, 1.528294563293457, 1.7602667808532715, 1.992238998413086, 2.2242112159729004, 2.456183433532715, 2.6881556510925293, 2.9201278686523438, 3.152100086212158, 3.3840723037719727, 3.616044521331787, 3.8480167388916016, 4.079988956451416, 4.3119611740112305, 4.543933391571045, 4.775905609130859, 5.007877826690674, 5.239850044250488, 5.471822261810303, 5.703794479370117, 5.935766696929932, 6.167738914489746, 6.3997111320495605, 6.631683349609375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 5.0, 9.0, 23.0, 58.0, 135.0, 120.0, 51.0, 18.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.148806095123291, -5.946475028991699, -5.744144439697266, -5.541813373565674, -5.339482307434082, -5.137151718139648, -4.934820652008057, -4.732489585876465, -4.530158996582031, -4.3278279304504395, -4.125497341156006, -3.923166275024414, -3.7208352088928223, -3.5185043811798096, -3.316173553466797, -3.113842487335205, -2.9115114212036133, -2.7091805934906006, -2.506849527359009, -2.304518699645996, -2.1021876335144043, -1.8998568058013916, -1.697525978088379, -1.4951950311660767, -1.2928640842437744, -1.0905331373214722, -0.8882022500038147, -0.6858713626861572, -0.483540415763855, -0.28120946884155273, -0.07887864112854004, 0.12345230579376221, 0.32578277587890625, 0.5281137228012085, 0.730444610118866, 0.9327754974365234, 1.1351064443588257, 1.337437391281128, 1.5397682189941406, 1.7420991659164429, 1.9444301128387451, 2.146760940551758, 2.3490920066833496, 2.5514228343963623, 2.753753662109375, 2.956084728240967, 3.1584155559539795, 3.360746383666992, 3.563077449798584, 3.7654082775115967, 3.9677393436431885, 4.170070171356201, 4.372401237487793, 4.574731826782227, 4.777062892913818, 4.97939395904541, 5.181724548339844, 5.3840556144714355, 5.586386203765869, 5.788717269897461, 5.991048336029053, 6.1933794021606445, 6.395709991455078, 6.59804105758667, 6.800372123718262]}, "eval/loss": 5.628564834594727, "eval/wer": 1.5293172212631705, "eval/runtime": 963.4096, "eval/samples_per_second": 2.742, "eval/steps_per_second": 0.344, "train/train_runtime": 28486.3453, "train/train_samples_per_second": 5.009, "train/train_steps_per_second": 0.157, "train/total_flos": 0.0, "train/train_loss": 6.089906092074955} \ No newline at end of file +{"train/loss": 4.4894, "train/learning_rate": 3.4682080924855494e-08, "train/epoch": 5.0, "train/global_step": 4460, "_runtime": 29952, "_timestamp": 1646257635, "_step": 4463, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 99.0, 21.0, 7.0, 6.0, 3.0, 3.0, 8.0, 1.0, 30037.0, 216.0, 45.0, 17.0, 10.0, 9.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.90625, -37.05322265625, -36.2001953125, -35.34716796875, -34.494140625, -33.64111328125, -32.7880859375, -31.93505859375, -31.08203125, -30.22900390625, -29.3759765625, -28.52294921875, -27.669921875, -26.81689453125, -25.9638671875, -25.11083984375, -24.2578125, -23.40478515625, -22.5517578125, -21.69873046875, -20.845703125, -19.99267578125, -19.1396484375, -18.28662109375, -17.43359375, -16.58056640625, -15.7275390625, -14.87451171875, -14.021484375, -13.16845703125, -12.3154296875, -11.46240234375, -10.609375, -9.75634765625, -8.9033203125, -8.05029296875, -7.197265625, -6.34423828125, -5.4912109375, -4.63818359375, -3.78515625, -2.93212890625, -2.0791015625, -1.22607421875, -0.373046875, 0.47998046875, 1.3330078125, 2.18603515625, 3.0390625, 3.89208984375, 4.7451171875, 5.59814453125, 6.451171875, 7.30419921875, 8.1572265625, 9.01025390625, 9.86328125, 10.71630859375, 11.5693359375, 12.42236328125, 13.275390625, 14.12841796875, 14.9814453125, 15.83447265625, 16.6875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 7.0, 4.0, 4.0, 6.0, 12.0, 9.0, 14.0, 21.0, 15.0, 24.0, 20.0, 27.0, 33.0, 33.0, 27.0, 43.0, 30.0, 41.0, 36.0, 46.0, 47.0, 38.0, 46.0, 42.0, 43.0, 36.0, 41.0, 30.0, 37.0, 29.0, 19.0, 30.0, 25.0, 12.0, 11.0, 6.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.805110931396484, -9.561691284179688, -9.318270683288574, -9.074851036071777, -8.83143138885498, -8.588010787963867, -8.34459114074707, -8.101171493530273, -7.857751369476318, -7.614331245422363, -7.370911598205566, -7.127491474151611, -6.884071350097656, -6.640651702880859, -6.397231578826904, -6.153811454772949, -5.910391807556152, -5.666971683502197, -5.4235520362854, -5.180131912231445, -4.936712265014648, -4.693292140960693, -4.449872016906738, -4.206452369689941, -3.9630322456359863, -3.7196123600006104, -3.4761924743652344, -3.2327723503112793, -2.9893524646759033, -2.7459325790405273, -2.5025124549865723, -2.2590925693511963, -2.0156731605529785, -1.7722532749176025, -1.528833270072937, -1.2854132652282715, -1.0419933795928955, -0.7985734939575195, -0.555153489112854, -0.3117334842681885, -0.0683135986328125, 0.17510634660720825, 0.418526291847229, 0.6619462370872498, 0.9053661823272705, 1.1487860679626465, 1.392206072807312, 1.6356260776519775, 1.8790459632873535, 2.1224658489227295, 2.3658857345581055, 2.6093058586120605, 2.8527257442474365, 3.0961456298828125, 3.3395657539367676, 3.5829856395721436, 3.8264055252075195, 4.069825649261475, 4.3132452964782715, 4.556665420532227, 4.800085067749023, 5.0435051918029785, 5.286925315856934, 5.5303449630737305, 5.7737650871276855]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 8.0, 18.0, 13.0, 11.0, 20.0, 17.0, 17.0, 32.0, 21.0, 36.0, 31.0, 45.0, 40.0, 37.0, 50.0, 38.0, 42.0, 51.0, 40.0, 46.0, 35.0, 37.0, 23.0, 35.0, 31.0, 34.0, 24.0, 28.0, 20.0, 19.0, 16.0, 18.0, 13.0, 5.0, 4.0, 3.0, 5.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.515730857849121, -7.263637065887451, -7.011543273925781, -6.759449481964111, -6.507355690002441, -6.255261421203613, -6.003167629241943, -5.751073837280273, -5.4989800453186035, -5.246886253356934, -4.994792461395264, -4.742698669433594, -4.490604400634766, -4.238511085510254, -3.986416816711426, -3.734323024749756, -3.482229232788086, -3.230135440826416, -2.978041648864746, -2.725947618484497, -2.473853826522827, -2.2217600345611572, -1.9696661233901978, -1.7175722122192383, -1.4654784202575684, -1.2133846282958984, -0.961290717124939, -0.7091968655586243, -0.45710301399230957, -0.20500922203063965, 0.047084689140319824, 0.2991786003112793, 0.5512733459472656, 0.8033671975135803, 1.055461049079895, 1.3075549602508545, 1.5596487522125244, 1.8117425441741943, 2.0638365745544434, 2.3159303665161133, 2.568024158477783, 2.820117950439453, 3.072211742401123, 3.324305772781372, 3.576399564743042, 3.828493356704712, 4.080587387084961, 4.332681179046631, 4.584774971008301, 4.836868762969971, 5.088962554931641, 5.3410563468933105, 5.5931501388549805, 5.845244407653809, 6.0973381996154785, 6.349431991577148, 6.601525783538818, 6.853619575500488, 7.105713367462158, 7.357807159423828, 7.609901428222656, 7.861994743347168, 8.114089012145996, 8.366182327270508, 8.618276596069336]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 16.0, 19.0, 35.0, 68.0, 95.0, 158.0, 251.0, 411.0, 623.0, 1083.0, 1743.0, 2828.0, 4714.0, 7535.0, 11752.0, 18425.0, 27274.0, 40217.0, 57174.0, 77683.0, 101516.0, 139276.0, 158053.0, 112234.0, 85687.0, 64222.0, 45651.0, 31301.0, 21287.0, 13941.0, 8838.0, 5490.0, 3435.0, 2130.0, 1269.0, 783.0, 509.0, 310.0, 202.0, 112.0, 59.0, 50.0, 27.0, 22.0, 15.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.625, -23.904541015625, -23.18408203125, -22.463623046875, -21.7431640625, -21.022705078125, -20.30224609375, -19.581787109375, -18.861328125, -18.140869140625, -17.42041015625, -16.699951171875, -15.9794921875, -15.259033203125, -14.53857421875, -13.818115234375, -13.09765625, -12.377197265625, -11.65673828125, -10.936279296875, -10.2158203125, -9.495361328125, -8.77490234375, -8.054443359375, -7.333984375, -6.613525390625, -5.89306640625, -5.172607421875, -4.4521484375, -3.731689453125, -3.01123046875, -2.290771484375, -1.5703125, -0.849853515625, -0.12939453125, 0.591064453125, 1.3115234375, 2.031982421875, 2.75244140625, 3.472900390625, 4.193359375, 4.913818359375, 5.63427734375, 6.354736328125, 7.0751953125, 7.795654296875, 8.51611328125, 9.236572265625, 9.95703125, 10.677490234375, 11.39794921875, 12.118408203125, 12.8388671875, 13.559326171875, 14.27978515625, 15.000244140625, 15.720703125, 16.441162109375, 17.16162109375, 17.882080078125, 18.6025390625, 19.322998046875, 20.04345703125, 20.763916015625, 21.484375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 25.0, 18.0, 13.0, 26.0, 38.0, 43.0, 42.0, 41.0, 53.0, 61.0, 65.0, 69.0, 62.0, 61.0, 49.0, 32.0, 31.0, 23.0, 24.0, 27.0, 26.0, 12.0, 18.0, 14.0, 15.0, 9.0, 3.0, 5.0, 5.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.316650390625, -8.98486328125, -8.653076171875, -8.3212890625, -7.989501953125, -7.65771484375, -7.325927734375, -6.994140625, -6.662353515625, -6.33056640625, -5.998779296875, -5.6669921875, -5.335205078125, -5.00341796875, -4.671630859375, -4.33984375, -4.008056640625, -3.67626953125, -3.344482421875, -3.0126953125, -2.680908203125, -2.34912109375, -2.017333984375, -1.685546875, -1.353759765625, -1.02197265625, -0.690185546875, -0.3583984375, -0.026611328125, 0.30517578125, 0.636962890625, 0.96875, 1.300537109375, 1.63232421875, 1.964111328125, 2.2958984375, 2.627685546875, 2.95947265625, 3.291259765625, 3.623046875, 3.954833984375, 4.28662109375, 4.618408203125, 4.9501953125, 5.281982421875, 5.61376953125, 5.945556640625, 6.27734375, 6.609130859375, 6.94091796875, 7.272705078125, 7.6044921875, 7.936279296875, 8.26806640625, 8.599853515625, 8.931640625, 9.263427734375, 9.59521484375, 9.927001953125, 10.2587890625, 10.590576171875, 10.92236328125, 11.254150390625, 11.5859375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 6.0, 9.0, 13.0, 10.0, 16.0, 16.0, 22.0, 28.0, 28.0, 36.0, 31.0, 39.0, 64.0, 54.0, 49.0, 53.0, 59.0, 43.0, 55.0, 50.0, 34.0, 46.0, 38.0, 37.0, 26.0, 29.0, 19.0, 15.0, 15.0, 8.0, 12.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.451366424560547, -6.244081974029541, -6.036797523498535, -5.829513072967529, -5.622228622436523, -5.414944171905518, -5.207659721374512, -5.000375747680664, -4.7930908203125, -4.585806369781494, -4.378521919250488, -4.171237468719482, -3.9639530181884766, -3.7566685676574707, -3.549384355545044, -3.342099905014038, -3.1348156929016113, -2.9275312423706055, -2.7202467918395996, -2.5129623413085938, -2.305677890777588, -2.098393440246582, -1.8911092281341553, -1.6838247776031494, -1.4765403270721436, -1.2692558765411377, -1.0619714260101318, -0.8546870946884155, -0.6474026441574097, -0.4401181936264038, -0.2328338623046875, -0.02554941177368164, 0.18173551559448242, 0.3890199363231659, 0.5963043570518494, 0.8035887479782104, 1.0108731985092163, 1.2181576490402222, 1.4254419803619385, 1.6327264308929443, 1.8400108814239502, 2.047295331954956, 2.254579782485962, 2.4618639945983887, 2.6691484451293945, 2.8764328956604004, 3.0837173461914062, 3.291001796722412, 3.498286247253418, 3.705570697784424, 3.9128551483154297, 4.1201395988464355, 4.327424049377441, 4.534708499908447, 4.741992950439453, 4.949276924133301, 5.156561851501465, 5.363846302032471, 5.571130752563477, 5.778415203094482, 5.985699653625488, 6.192984104156494, 6.4002685546875, 6.607552528381348, 6.8148369789123535]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 8.0, 6.0, 13.0, 11.0, 16.0, 23.0, 15.0, 31.0, 28.0, 38.0, 33.0, 35.0, 45.0, 45.0, 48.0, 45.0, 57.0, 41.0, 48.0, 38.0, 36.0, 39.0, 43.0, 33.0, 45.0, 30.0, 29.0, 25.0, 24.0, 7.0, 14.0, 11.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.627979278564453, -5.424100875854492, -5.220222473144531, -5.01634407043457, -4.812465667724609, -4.608587265014648, -4.404709339141846, -4.200830936431885, -3.996952533721924, -3.793074131011963, -3.589195728302002, -3.38531756401062, -3.181439161300659, -2.9775607585906982, -2.7736825942993164, -2.5698041915893555, -2.3659257888793945, -2.1620473861694336, -1.9581691026687622, -1.7542908191680908, -1.5504124164581299, -1.346534013748169, -1.1426557302474976, -0.9387774467468262, -0.7348990440368652, -0.5310207009315491, -0.3271423578262329, -0.12326401472091675, 0.08061432838439941, 0.28449273109436035, 0.48837101459503174, 0.6922492980957031, 0.8961272239685059, 1.1000056266784668, 1.3038839101791382, 1.5077621936798096, 1.7116405963897705, 1.9155189990997314, 2.1193971633911133, 2.323275566101074, 2.527153968811035, 2.731032371520996, 2.934910774230957, 3.138788938522339, 3.3426673412323, 3.5465457439422607, 3.7504239082336426, 3.9543023109436035, 4.1581807136535645, 4.362059116363525, 4.565937519073486, 4.769815921783447, 4.97369384765625, 5.177572250366211, 5.381450653076172, 5.585329055786133, 5.789207458496094, 5.993085861206055, 6.196964263916016, 6.400842666625977, 6.6047210693359375, 6.808599472045898, 7.012477397918701, 7.216355800628662, 7.420234203338623]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 21.0, 25.0, 34.0, 39.0, 78.0, 102.0, 146.0, 199.0, 330.0, 532.0, 806.0, 1317.0, 2168.0, 3330.0, 5413.0, 8947.0, 14418.0, 23731.0, 38487.0, 62220.0, 101652.0, 165023.0, 262525.0, 398320.0, 545724.0, 634460.0, 601583.0, 471734.0, 321557.0, 203793.0, 126650.0, 76489.0, 47312.0, 29068.0, 17646.0, 10741.0, 6525.0, 4180.0, 2508.0, 1584.0, 995.0, 677.0, 394.0, 235.0, 176.0, 132.0, 77.0, 54.0, 30.0, 27.0, 20.0, 15.0, 5.0, 10.0, 6.0, 4.0], "bins": [-4.8046875, -4.6622314453125, -4.519775390625, -4.3773193359375, -4.23486328125, -4.0924072265625, -3.949951171875, -3.8074951171875, -3.6650390625, -3.5225830078125, -3.380126953125, -3.2376708984375, -3.09521484375, -2.9527587890625, -2.810302734375, -2.6678466796875, -2.525390625, -2.3829345703125, -2.240478515625, -2.0980224609375, -1.95556640625, -1.8131103515625, -1.670654296875, -1.5281982421875, -1.3857421875, -1.2432861328125, -1.100830078125, -0.9583740234375, -0.81591796875, -0.6734619140625, -0.531005859375, -0.3885498046875, -0.24609375, -0.1036376953125, 0.038818359375, 0.1812744140625, 0.32373046875, 0.4661865234375, 0.608642578125, 0.7510986328125, 0.8935546875, 1.0360107421875, 1.178466796875, 1.3209228515625, 1.46337890625, 1.6058349609375, 1.748291015625, 1.8907470703125, 2.033203125, 2.1756591796875, 2.318115234375, 2.4605712890625, 2.60302734375, 2.7454833984375, 2.887939453125, 3.0303955078125, 3.1728515625, 3.3153076171875, 3.457763671875, 3.6002197265625, 3.74267578125, 3.8851318359375, 4.027587890625, 4.1700439453125, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 11.0, 12.0, 6.0, 15.0, 18.0, 21.0, 19.0, 25.0, 31.0, 39.0, 35.0, 38.0, 35.0, 46.0, 44.0, 52.0, 25.0, 31.0, 38.0, 43.0, 38.0, 44.0, 43.0, 41.0, 33.0, 37.0, 25.0, 21.0, 21.0, 18.0, 13.0, 10.0, 11.0, 10.0, 13.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1845703125, -4.037109375, -3.8896484375, -3.7421875, -3.5947265625, -3.447265625, -3.2998046875, -3.15234375, -3.0048828125, -2.857421875, -2.7099609375, -2.5625, -2.4150390625, -2.267578125, -2.1201171875, -1.97265625, -1.8251953125, -1.677734375, -1.5302734375, -1.3828125, -1.2353515625, -1.087890625, -0.9404296875, -0.79296875, -0.6455078125, -0.498046875, -0.3505859375, -0.203125, -0.0556640625, 0.091796875, 0.2392578125, 0.38671875, 0.5341796875, 0.681640625, 0.8291015625, 0.9765625, 1.1240234375, 1.271484375, 1.4189453125, 1.56640625, 1.7138671875, 1.861328125, 2.0087890625, 2.15625, 2.3037109375, 2.451171875, 2.5986328125, 2.74609375, 2.8935546875, 3.041015625, 3.1884765625, 3.3359375, 3.4833984375, 3.630859375, 3.7783203125, 3.92578125, 4.0732421875, 4.220703125, 4.3681640625, 4.515625, 4.6630859375, 4.810546875, 4.9580078125, 5.10546875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 13.0, 20.0, 32.0, 45.0, 50.0, 106.0, 162.0, 265.0, 438.0, 731.0, 1176.0, 2094.0, 3319.0, 5919.0, 9896.0, 16776.0, 27900.0, 46589.0, 76213.0, 122406.0, 190160.0, 285649.0, 405693.0, 530305.0, 598291.0, 555293.0, 436782.0, 312968.0, 211478.0, 136680.0, 85377.0, 52662.0, 31946.0, 19276.0, 11207.0, 6706.0, 3895.0, 2339.0, 1372.0, 789.0, 465.0, 278.0, 195.0, 109.0, 84.0, 53.0, 27.0, 21.0, 7.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 16.0, 29.0, 33.0, 46.0, 58.0, 83.0, 104.0, 103.0, 140.0, 167.0, 208.0, 213.0, 236.0, 257.0, 287.0, 284.0, 267.0, 258.0, 214.0, 203.0, 145.0, 125.0, 120.0, 99.0, 70.0, 65.0, 62.0, 31.0, 38.0, 22.0, 16.0, 9.0, 9.0, 12.0, 7.0, 3.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.33740234375, -2.2646484375, -2.19189453125, -2.119140625, -2.04638671875, -1.9736328125, -1.90087890625, -1.828125, -1.75537109375, -1.6826171875, -1.60986328125, -1.537109375, -1.46435546875, -1.3916015625, -1.31884765625, -1.24609375, -1.17333984375, -1.1005859375, -1.02783203125, -0.955078125, -0.88232421875, -0.8095703125, -0.73681640625, -0.6640625, -0.59130859375, -0.5185546875, -0.44580078125, -0.373046875, -0.30029296875, -0.2275390625, -0.15478515625, -0.08203125, -0.00927734375, 0.0634765625, 0.13623046875, 0.208984375, 0.28173828125, 0.3544921875, 0.42724609375, 0.5, 0.57275390625, 0.6455078125, 0.71826171875, 0.791015625, 0.86376953125, 0.9365234375, 1.00927734375, 1.08203125, 1.15478515625, 1.2275390625, 1.30029296875, 1.373046875, 1.44580078125, 1.5185546875, 1.59130859375, 1.6640625, 1.73681640625, 1.8095703125, 1.88232421875, 1.955078125, 2.02783203125, 2.1005859375, 2.17333984375, 2.24609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 19.0, 25.0, 28.0, 32.0, 28.0, 33.0, 56.0, 61.0, 54.0, 71.0, 48.0, 50.0, 69.0, 50.0, 52.0, 48.0, 36.0, 38.0, 30.0, 34.0, 21.0, 20.0, 11.0, 8.0, 7.0, 4.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.364202499389648, -7.164638042449951, -6.965073585510254, -6.765509605407715, -6.565945148468018, -6.36638069152832, -6.166816234588623, -5.967251777648926, -5.767687797546387, -5.5681233406066895, -5.368558883666992, -5.168994903564453, -4.969430446624756, -4.769865989685059, -4.570301532745361, -4.370737075805664, -4.171173095703125, -3.9716086387634277, -3.7720444202423096, -3.5724799633026123, -3.372915744781494, -3.173351287841797, -2.9737868309020996, -2.7742226123809814, -2.574657917022705, -2.375093460083008, -2.1755292415618896, -1.9759647846221924, -1.7764005661010742, -1.576836109161377, -1.3772717714309692, -1.1777074337005615, -0.9781432151794434, -0.7785788774490356, -0.5790145397186279, -0.37945014238357544, -0.17988580465316772, 0.01967853307723999, 0.21924293041229248, 0.4188072681427002, 0.6183716058731079, 0.8179359436035156, 1.0175002813339233, 1.217064619064331, 1.4166290760040283, 1.6161932945251465, 1.8157577514648438, 2.015322208404541, 2.214886426925659, 2.4144508838653564, 2.6140151023864746, 2.813579559326172, 3.01314377784729, 3.2127082347869873, 3.4122724533081055, 3.6118369102478027, 3.8114013671875, 4.010965824127197, 4.2105302810668945, 4.410094261169434, 4.609658718109131, 4.809223175048828, 5.008787631988525, 5.208352088928223, 5.407916069030762]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 14.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 16.0, 23.0, 15.0, 26.0, 24.0, 27.0, 23.0, 36.0, 32.0, 34.0, 31.0, 48.0, 30.0, 41.0, 31.0, 48.0, 45.0, 41.0, 33.0, 29.0, 28.0, 31.0, 29.0, 27.0, 22.0, 23.0, 19.0, 16.0, 18.0, 12.0, 8.0, 7.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.708048343658447, -4.56910514831543, -4.430161952972412, -4.2912187576293945, -4.152275562286377, -4.013332366943359, -3.8743889331817627, -3.735445737838745, -3.5965025424957275, -3.45755934715271, -3.3186161518096924, -3.179672956466675, -3.040729522705078, -2.9017863273620605, -2.762843132019043, -2.6238999366760254, -2.484956741333008, -2.3460135459899902, -2.2070703506469727, -2.068127155303955, -1.929183840751648, -1.7902406454086304, -1.6512973308563232, -1.5123541355133057, -1.373410940170288, -1.2344677448272705, -1.095524549484253, -0.9565812349319458, -0.8176380395889282, -0.6786948442459106, -0.5397515892982483, -0.40080833435058594, -0.26186561584472656, -0.1229223906993866, 0.01602083444595337, 0.15496405959129333, 0.2939072847366333, 0.4328504800796509, 0.5717937350273132, 0.7107369899749756, 0.8496801853179932, 0.9886233806610107, 1.1275665760040283, 1.2665098905563354, 1.405453085899353, 1.5443962812423706, 1.6833395957946777, 1.8222827911376953, 1.961225986480713, 2.1001691818237305, 2.239112377166748, 2.3780555725097656, 2.516998767852783, 2.655941963195801, 2.7948853969573975, 2.933828592300415, 3.0727717876434326, 3.21171498298645, 3.3506581783294678, 3.4896013736724854, 3.628544807434082, 3.7674880027770996, 3.906431198120117, 4.045374393463135, 4.184317588806152]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 25.0, 30.0, 41.0, 64.0, 81.0, 140.0, 250.0, 371.0, 638.0, 930.0, 1547.0, 2532.0, 4204.0, 7248.0, 13091.0, 24033.0, 47192.0, 95628.0, 187896.0, 268893.0, 191403.0, 97959.0, 48615.0, 24462.0, 13171.0, 7180.0, 4278.0, 2462.0, 1504.0, 987.0, 614.0, 401.0, 234.0, 155.0, 107.0, 67.0, 39.0, 20.0, 15.0, 16.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19921875, -4.04083251953125, -3.8824462890625, -3.72406005859375, -3.565673828125, -3.40728759765625, -3.2489013671875, -3.09051513671875, -2.93212890625, -2.77374267578125, -2.6153564453125, -2.45697021484375, -2.298583984375, -2.14019775390625, -1.9818115234375, -1.82342529296875, -1.6650390625, -1.50665283203125, -1.3482666015625, -1.18988037109375, -1.031494140625, -0.87310791015625, -0.7147216796875, -0.55633544921875, -0.39794921875, -0.23956298828125, -0.0811767578125, 0.07720947265625, 0.235595703125, 0.39398193359375, 0.5523681640625, 0.71075439453125, 0.869140625, 1.02752685546875, 1.1859130859375, 1.34429931640625, 1.502685546875, 1.66107177734375, 1.8194580078125, 1.97784423828125, 2.13623046875, 2.29461669921875, 2.4530029296875, 2.61138916015625, 2.769775390625, 2.92816162109375, 3.0865478515625, 3.24493408203125, 3.4033203125, 3.56170654296875, 3.7200927734375, 3.87847900390625, 4.036865234375, 4.19525146484375, 4.3536376953125, 4.51202392578125, 4.67041015625, 4.82879638671875, 4.9871826171875, 5.14556884765625, 5.303955078125, 5.46234130859375, 5.6207275390625, 5.77911376953125, 5.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 10.0, 14.0, 17.0, 22.0, 12.0, 25.0, 26.0, 31.0, 27.0, 43.0, 30.0, 44.0, 36.0, 49.0, 38.0, 58.0, 35.0, 29.0, 46.0, 37.0, 36.0, 33.0, 39.0, 27.0, 33.0, 37.0, 23.0, 17.0, 18.0, 9.0, 10.0, 11.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.41796875, -5.26171875, -5.10546875, -4.94921875, -4.79296875, -4.63671875, -4.48046875, -4.32421875, -4.16796875, -4.01171875, -3.85546875, -3.69921875, -3.54296875, -3.38671875, -3.23046875, -3.07421875, -2.91796875, -2.76171875, -2.60546875, -2.44921875, -2.29296875, -2.13671875, -1.98046875, -1.82421875, -1.66796875, -1.51171875, -1.35546875, -1.19921875, -1.04296875, -0.88671875, -0.73046875, -0.57421875, -0.41796875, -0.26171875, -0.10546875, 0.05078125, 0.20703125, 0.36328125, 0.51953125, 0.67578125, 0.83203125, 0.98828125, 1.14453125, 1.30078125, 1.45703125, 1.61328125, 1.76953125, 1.92578125, 2.08203125, 2.23828125, 2.39453125, 2.55078125, 2.70703125, 2.86328125, 3.01953125, 3.17578125, 3.33203125, 3.48828125, 3.64453125, 3.80078125, 3.95703125, 4.11328125, 4.26953125, 4.42578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 13.0, 8.0, 10.0, 12.0, 20.0, 34.0, 40.0, 49.0, 64.0, 75.0, 158.0, 207.0, 267.0, 443.0, 608.0, 944.0, 1514.0, 2507.0, 4383.0, 8156.0, 16576.0, 38212.0, 103439.0, 298008.0, 351266.0, 132584.0, 47082.0, 19555.0, 9520.0, 4990.0, 2832.0, 1735.0, 1065.0, 654.0, 459.0, 319.0, 210.0, 148.0, 85.0, 68.0, 63.0, 39.0, 34.0, 28.0, 11.0, 12.0, 15.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-4.38671875, -4.2457275390625, -4.104736328125, -3.9637451171875, -3.82275390625, -3.6817626953125, -3.540771484375, -3.3997802734375, -3.2587890625, -3.1177978515625, -2.976806640625, -2.8358154296875, -2.69482421875, -2.5538330078125, -2.412841796875, -2.2718505859375, -2.130859375, -1.9898681640625, -1.848876953125, -1.7078857421875, -1.56689453125, -1.4259033203125, -1.284912109375, -1.1439208984375, -1.0029296875, -0.8619384765625, -0.720947265625, -0.5799560546875, -0.43896484375, -0.2979736328125, -0.156982421875, -0.0159912109375, 0.125, 0.2659912109375, 0.406982421875, 0.5479736328125, 0.68896484375, 0.8299560546875, 0.970947265625, 1.1119384765625, 1.2529296875, 1.3939208984375, 1.534912109375, 1.6759033203125, 1.81689453125, 1.9578857421875, 2.098876953125, 2.2398681640625, 2.380859375, 2.5218505859375, 2.662841796875, 2.8038330078125, 2.94482421875, 3.0858154296875, 3.226806640625, 3.3677978515625, 3.5087890625, 3.6497802734375, 3.790771484375, 3.9317626953125, 4.07275390625, 4.2137451171875, 4.354736328125, 4.4957275390625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 5.0, 8.0, 17.0, 14.0, 16.0, 16.0, 18.0, 18.0, 20.0, 22.0, 29.0, 37.0, 31.0, 32.0, 31.0, 32.0, 36.0, 29.0, 30.0, 43.0, 44.0, 43.0, 36.0, 48.0, 33.0, 38.0, 32.0, 27.0, 22.0, 30.0, 29.0, 27.0, 11.0, 19.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.741546630859375, -2.64324951171875, -2.544952392578125, -2.4466552734375, -2.348358154296875, -2.25006103515625, -2.151763916015625, -2.053466796875, -1.955169677734375, -1.85687255859375, -1.758575439453125, -1.6602783203125, -1.561981201171875, -1.46368408203125, -1.365386962890625, -1.26708984375, -1.168792724609375, -1.07049560546875, -0.972198486328125, -0.8739013671875, -0.775604248046875, -0.67730712890625, -0.579010009765625, -0.480712890625, -0.382415771484375, -0.28411865234375, -0.185821533203125, -0.0875244140625, 0.010772705078125, 0.10906982421875, 0.207366943359375, 0.3056640625, 0.403961181640625, 0.50225830078125, 0.600555419921875, 0.6988525390625, 0.797149658203125, 0.89544677734375, 0.993743896484375, 1.092041015625, 1.190338134765625, 1.28863525390625, 1.386932373046875, 1.4852294921875, 1.583526611328125, 1.68182373046875, 1.780120849609375, 1.87841796875, 1.976715087890625, 2.07501220703125, 2.173309326171875, 2.2716064453125, 2.369903564453125, 2.46820068359375, 2.566497802734375, 2.664794921875, 2.763092041015625, 2.86138916015625, 2.959686279296875, 3.0579833984375, 3.156280517578125, 3.25457763671875, 3.352874755859375, 3.451171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 6.0, 16.0, 18.0, 19.0, 33.0, 49.0, 84.0, 126.0, 213.0, 301.0, 480.0, 878.0, 1626.0, 4419.0, 28056.0, 978213.0, 25996.0, 4214.0, 1618.0, 831.0, 512.0, 292.0, 189.0, 113.0, 77.0, 58.0, 26.0, 20.0, 16.0, 11.0, 12.0, 9.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.064453125, -18.31640625, -17.568359375, -16.8203125, -16.072265625, -15.32421875, -14.576171875, -13.828125, -13.080078125, -12.33203125, -11.583984375, -10.8359375, -10.087890625, -9.33984375, -8.591796875, -7.84375, -7.095703125, -6.34765625, -5.599609375, -4.8515625, -4.103515625, -3.35546875, -2.607421875, -1.859375, -1.111328125, -0.36328125, 0.384765625, 1.1328125, 1.880859375, 2.62890625, 3.376953125, 4.125, 4.873046875, 5.62109375, 6.369140625, 7.1171875, 7.865234375, 8.61328125, 9.361328125, 10.109375, 10.857421875, 11.60546875, 12.353515625, 13.1015625, 13.849609375, 14.59765625, 15.345703125, 16.09375, 16.841796875, 17.58984375, 18.337890625, 19.0859375, 19.833984375, 20.58203125, 21.330078125, 22.078125, 22.826171875, 23.57421875, 24.322265625, 25.0703125, 25.818359375, 26.56640625, 27.314453125, 28.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 11.0, 33.0, 58.0, 221.0, 408.0, 136.0, 47.0, 23.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008211135864257812, -0.0007940083742141724, -0.0007669031620025635, -0.0007397979497909546, -0.0007126927375793457, -0.0006855875253677368, -0.0006584823131561279, -0.000631377100944519, -0.0006042718887329102, -0.0005771666765213013, -0.0005500614643096924, -0.0005229562520980835, -0.0004958510398864746, -0.0004687458276748657, -0.00044164061546325684, -0.00041453540325164795, -0.00038743019104003906, -0.0003603249788284302, -0.0003332197666168213, -0.0003061145544052124, -0.0002790093421936035, -0.00025190412998199463, -0.00022479891777038574, -0.00019769370555877686, -0.00017058849334716797, -0.00014348328113555908, -0.0001163780689239502, -8.927285671234131e-05, -6.216764450073242e-05, -3.5062432289123535e-05, -7.957220077514648e-06, 1.9147992134094238e-05, 4.6253204345703125e-05, 7.335841655731201e-05, 0.0001004636287689209, 0.00012756884098052979, 0.00015467405319213867, 0.00018177926540374756, 0.00020888447761535645, 0.00023598968982696533, 0.0002630949020385742, 0.0002902001142501831, 0.000317305326461792, 0.0003444105386734009, 0.00037151575088500977, 0.00039862096309661865, 0.00042572617530822754, 0.0004528313875198364, 0.0004799365997314453, 0.0005070418119430542, 0.0005341470241546631, 0.000561252236366272, 0.0005883574485778809, 0.0006154626607894897, 0.0006425678730010986, 0.0006696730852127075, 0.0006967782974243164, 0.0007238835096359253, 0.0007509887218475342, 0.0007780939340591431, 0.000805199146270752, 0.0008323043584823608, 0.0008594095706939697, 0.0008865147829055786, 0.0009136199951171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 19.0, 8.0, 26.0, 32.0, 40.0, 56.0, 74.0, 115.0, 164.0, 220.0, 303.0, 411.0, 588.0, 824.0, 1158.0, 1546.0, 2312.0, 3710.0, 6001.0, 11396.0, 26493.0, 90347.0, 429666.0, 351747.0, 71797.0, 22815.0, 10104.0, 5605.0, 3465.0, 2207.0, 1549.0, 1081.0, 689.0, 552.0, 407.0, 291.0, 200.0, 156.0, 105.0, 70.0, 58.0, 38.0, 36.0, 31.0, 17.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.42608642578125, -5.2506103515625, -5.07513427734375, -4.899658203125, -4.72418212890625, -4.5487060546875, -4.37322998046875, -4.19775390625, -4.02227783203125, -3.8468017578125, -3.67132568359375, -3.495849609375, -3.32037353515625, -3.1448974609375, -2.96942138671875, -2.7939453125, -2.61846923828125, -2.4429931640625, -2.26751708984375, -2.092041015625, -1.91656494140625, -1.7410888671875, -1.56561279296875, -1.39013671875, -1.21466064453125, -1.0391845703125, -0.86370849609375, -0.688232421875, -0.51275634765625, -0.3372802734375, -0.16180419921875, 0.013671875, 0.18914794921875, 0.3646240234375, 0.54010009765625, 0.715576171875, 0.89105224609375, 1.0665283203125, 1.24200439453125, 1.41748046875, 1.59295654296875, 1.7684326171875, 1.94390869140625, 2.119384765625, 2.29486083984375, 2.4703369140625, 2.64581298828125, 2.8212890625, 2.99676513671875, 3.1722412109375, 3.34771728515625, 3.523193359375, 3.69866943359375, 3.8741455078125, 4.04962158203125, 4.22509765625, 4.40057373046875, 4.5760498046875, 4.75152587890625, 4.927001953125, 5.10247802734375, 5.2779541015625, 5.45343017578125, 5.62890625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 9.0, 8.0, 12.0, 28.0, 48.0, 99.0, 160.0, 208.0, 178.0, 102.0, 58.0, 23.0, 13.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.50732421875, -2.4345703125, -2.36181640625, -2.2890625, -2.21630859375, -2.1435546875, -2.07080078125, -1.998046875, -1.92529296875, -1.8525390625, -1.77978515625, -1.70703125, -1.63427734375, -1.5615234375, -1.48876953125, -1.416015625, -1.34326171875, -1.2705078125, -1.19775390625, -1.125, -1.05224609375, -0.9794921875, -0.90673828125, -0.833984375, -0.76123046875, -0.6884765625, -0.61572265625, -0.54296875, -0.47021484375, -0.3974609375, -0.32470703125, -0.251953125, -0.17919921875, -0.1064453125, -0.03369140625, 0.0390625, 0.11181640625, 0.1845703125, 0.25732421875, 0.330078125, 0.40283203125, 0.4755859375, 0.54833984375, 0.62109375, 0.69384765625, 0.7666015625, 0.83935546875, 0.912109375, 0.98486328125, 1.0576171875, 1.13037109375, 1.203125, 1.27587890625, 1.3486328125, 1.42138671875, 1.494140625, 1.56689453125, 1.6396484375, 1.71240234375, 1.78515625, 1.85791015625, 1.9306640625, 2.00341796875, 2.076171875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 4.0, 8.0, 17.0, 8.0, 6.0, 14.0, 25.0, 20.0, 32.0, 26.0, 36.0, 29.0, 47.0, 41.0, 44.0, 64.0, 49.0, 57.0, 54.0, 40.0, 51.0, 39.0, 37.0, 42.0, 44.0, 24.0, 24.0, 22.0, 22.0, 19.0, 7.0, 7.0, 8.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.619289875030518, -5.4501519203186035, -5.281014442443848, -5.111876487731934, -4.942739009857178, -4.773601055145264, -4.604463577270508, -4.435325622558594, -4.266188144683838, -4.097050189971924, -3.927912712097168, -3.758774995803833, -3.589637279510498, -3.420499563217163, -3.251361846923828, -3.082223892211914, -2.913086175918579, -2.743948459625244, -2.574810743331909, -2.405673027038574, -2.2365353107452393, -2.0673975944519043, -1.8982597589492798, -1.7291220426559448, -1.5599843263626099, -1.390846610069275, -1.22170889377594, -1.0525710582733154, -0.8834334015846252, -0.7142956852912903, -0.5451579093933105, -0.3760201930999756, -0.20688247680664062, -0.03774474561214447, 0.13139298558235168, 0.30053073167800903, 0.469668447971344, 0.638806164264679, 0.8079439401626587, 0.9770816564559937, 1.1462193727493286, 1.3153570890426636, 1.4844948053359985, 1.653632640838623, 1.822770357131958, 1.991908073425293, 2.161045789718628, 2.330183506011963, 2.499321222305298, 2.668458938598633, 2.8375966548919678, 3.0067343711853027, 3.1758720874786377, 3.3450098037719727, 3.5141477584838867, 3.6832852363586426, 3.8524231910705566, 4.021561145782471, 4.190698623657227, 4.359836578369141, 4.5289740562438965, 4.6981120109558105, 4.867249488830566, 5.0363874435424805, 5.205524921417236]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 5.0, 6.0, 8.0, 10.0, 17.0, 19.0, 15.0, 7.0, 26.0, 21.0, 23.0, 30.0, 32.0, 29.0, 27.0, 35.0, 26.0, 38.0, 37.0, 37.0, 48.0, 30.0, 41.0, 42.0, 36.0, 28.0, 28.0, 30.0, 34.0, 23.0, 33.0, 23.0, 17.0, 21.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-4.382673263549805, -4.250843048095703, -4.119012355804443, -3.987182140350342, -3.8553519248962402, -3.7235214710235596, -3.591691017150879, -3.4598608016967773, -3.328030586242676, -3.196200132369995, -3.0643699169158936, -2.932539463043213, -2.8007092475891113, -2.6688787937164307, -2.53704833984375, -2.4052181243896484, -2.2733876705169678, -2.141557216644287, -2.0097270011901855, -1.8778965473175049, -1.7460663318634033, -1.6142358779907227, -1.4824055433273315, -1.3505752086639404, -1.2187448740005493, -1.0869145393371582, -0.9550842046737671, -0.8232538104057312, -0.6914234757423401, -0.559593141078949, -0.4277627468109131, -0.295932412147522, -0.16410207748413086, -0.03227172791957855, 0.09955862164497375, 0.23138898611068726, 0.36321932077407837, 0.4950496554374695, 0.6268800497055054, 0.7587103843688965, 0.8905407190322876, 1.0223710536956787, 1.1542013883590698, 1.286031723022461, 1.4178621768951416, 1.5496923923492432, 1.6815228462219238, 1.813353180885315, 1.945183515548706, 2.0770139694213867, 2.2088441848754883, 2.340674638748169, 2.4725048542022705, 2.604335308074951, 2.7361655235290527, 2.8679959774017334, 2.999826431274414, 3.1316568851470947, 3.2634871006011963, 3.395317554473877, 3.5271477699279785, 3.658978223800659, 3.79080867767334, 3.9226388931274414, 4.054469108581543]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 12.0, 30.0, 44.0, 53.0, 101.0, 161.0, 264.0, 402.0, 631.0, 978.0, 1594.0, 2510.0, 4238.0, 6575.0, 10311.0, 16142.0, 24500.0, 36111.0, 51080.0, 68924.0, 86676.0, 101723.0, 111442.0, 111356.0, 101975.0, 86930.0, 68407.0, 51169.0, 36173.0, 24162.0, 16151.0, 10241.0, 6521.0, 4033.0, 2610.0, 1686.0, 981.0, 636.0, 372.0, 237.0, 167.0, 98.0, 45.0, 31.0, 21.0, 11.0, 5.0, 16.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.58984375, -4.45074462890625, -4.3116455078125, -4.17254638671875, -4.033447265625, -3.89434814453125, -3.7552490234375, -3.61614990234375, -3.47705078125, -3.33795166015625, -3.1988525390625, -3.05975341796875, -2.920654296875, -2.78155517578125, -2.6424560546875, -2.50335693359375, -2.3642578125, -2.22515869140625, -2.0860595703125, -1.94696044921875, -1.807861328125, -1.66876220703125, -1.5296630859375, -1.39056396484375, -1.25146484375, -1.11236572265625, -0.9732666015625, -0.83416748046875, -0.695068359375, -0.55596923828125, -0.4168701171875, -0.27777099609375, -0.138671875, 0.00042724609375, 0.1395263671875, 0.27862548828125, 0.417724609375, 0.55682373046875, 0.6959228515625, 0.83502197265625, 0.97412109375, 1.11322021484375, 1.2523193359375, 1.39141845703125, 1.530517578125, 1.66961669921875, 1.8087158203125, 1.94781494140625, 2.0869140625, 2.22601318359375, 2.3651123046875, 2.50421142578125, 2.643310546875, 2.78240966796875, 2.9215087890625, 3.06060791015625, 3.19970703125, 3.33880615234375, 3.4779052734375, 3.61700439453125, 3.756103515625, 3.89520263671875, 4.0343017578125, 4.17340087890625, 4.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 7.0, 8.0, 10.0, 13.0, 23.0, 24.0, 21.0, 17.0, 25.0, 37.0, 38.0, 30.0, 31.0, 40.0, 53.0, 34.0, 33.0, 50.0, 48.0, 36.0, 37.0, 42.0, 33.0, 24.0, 28.0, 41.0, 28.0, 23.0, 27.0, 18.0, 16.0, 14.0, 15.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-5.015625, -4.8765869140625, -4.737548828125, -4.5985107421875, -4.45947265625, -4.3204345703125, -4.181396484375, -4.0423583984375, -3.9033203125, -3.7642822265625, -3.625244140625, -3.4862060546875, -3.34716796875, -3.2081298828125, -3.069091796875, -2.9300537109375, -2.791015625, -2.6519775390625, -2.512939453125, -2.3739013671875, -2.23486328125, -2.0958251953125, -1.956787109375, -1.8177490234375, -1.6787109375, -1.5396728515625, -1.400634765625, -1.2615966796875, -1.12255859375, -0.9835205078125, -0.844482421875, -0.7054443359375, -0.56640625, -0.4273681640625, -0.288330078125, -0.1492919921875, -0.01025390625, 0.1287841796875, 0.267822265625, 0.4068603515625, 0.5458984375, 0.6849365234375, 0.823974609375, 0.9630126953125, 1.10205078125, 1.2410888671875, 1.380126953125, 1.5191650390625, 1.658203125, 1.7972412109375, 1.936279296875, 2.0753173828125, 2.21435546875, 2.3533935546875, 2.492431640625, 2.6314697265625, 2.7705078125, 2.9095458984375, 3.048583984375, 3.1876220703125, 3.32666015625, 3.4656982421875, 3.604736328125, 3.7437744140625, 3.8828125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 19.0, 17.0, 33.0, 43.0, 66.0, 146.0, 238.0, 322.0, 505.0, 746.0, 1313.0, 2147.0, 3458.0, 5567.0, 9152.0, 14708.0, 23169.0, 35971.0, 53307.0, 75009.0, 98540.0, 117690.0, 126550.0, 121282.0, 104971.0, 81787.0, 59596.0, 40778.0, 26961.0, 16761.0, 10474.0, 6610.0, 3907.0, 2542.0, 1585.0, 915.0, 560.0, 393.0, 262.0, 171.0, 94.0, 61.0, 43.0, 29.0, 20.0, 8.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2734375, -5.1119384765625, -4.950439453125, -4.7889404296875, -4.62744140625, -4.4659423828125, -4.304443359375, -4.1429443359375, -3.9814453125, -3.8199462890625, -3.658447265625, -3.4969482421875, -3.33544921875, -3.1739501953125, -3.012451171875, -2.8509521484375, -2.689453125, -2.5279541015625, -2.366455078125, -2.2049560546875, -2.04345703125, -1.8819580078125, -1.720458984375, -1.5589599609375, -1.3974609375, -1.2359619140625, -1.074462890625, -0.9129638671875, -0.75146484375, -0.5899658203125, -0.428466796875, -0.2669677734375, -0.10546875, 0.0560302734375, 0.217529296875, 0.3790283203125, 0.54052734375, 0.7020263671875, 0.863525390625, 1.0250244140625, 1.1865234375, 1.3480224609375, 1.509521484375, 1.6710205078125, 1.83251953125, 1.9940185546875, 2.155517578125, 2.3170166015625, 2.478515625, 2.6400146484375, 2.801513671875, 2.9630126953125, 3.12451171875, 3.2860107421875, 3.447509765625, 3.6090087890625, 3.7705078125, 3.9320068359375, 4.093505859375, 4.2550048828125, 4.41650390625, 4.5780029296875, 4.739501953125, 4.9010009765625, 5.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 13.0, 16.0, 12.0, 19.0, 19.0, 21.0, 22.0, 30.0, 35.0, 35.0, 38.0, 37.0, 47.0, 55.0, 51.0, 44.0, 39.0, 49.0, 47.0, 39.0, 39.0, 38.0, 30.0, 23.0, 25.0, 24.0, 20.0, 14.0, 13.0, 12.0, 10.0, 8.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.063262939453125, -2.96441650390625, -2.865570068359375, -2.7667236328125, -2.667877197265625, -2.56903076171875, -2.470184326171875, -2.371337890625, -2.272491455078125, -2.17364501953125, -2.074798583984375, -1.9759521484375, -1.877105712890625, -1.77825927734375, -1.679412841796875, -1.58056640625, -1.481719970703125, -1.38287353515625, -1.284027099609375, -1.1851806640625, -1.086334228515625, -0.98748779296875, -0.888641357421875, -0.789794921875, -0.690948486328125, -0.59210205078125, -0.493255615234375, -0.3944091796875, -0.295562744140625, -0.19671630859375, -0.097869873046875, 0.0009765625, 0.099822998046875, 0.19866943359375, 0.297515869140625, 0.3963623046875, 0.495208740234375, 0.59405517578125, 0.692901611328125, 0.791748046875, 0.890594482421875, 0.98944091796875, 1.088287353515625, 1.1871337890625, 1.285980224609375, 1.38482666015625, 1.483673095703125, 1.58251953125, 1.681365966796875, 1.78021240234375, 1.879058837890625, 1.9779052734375, 2.076751708984375, 2.17559814453125, 2.274444580078125, 2.373291015625, 2.472137451171875, 2.57098388671875, 2.669830322265625, 2.7686767578125, 2.867523193359375, 2.96636962890625, 3.065216064453125, 3.1640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 11.0, 13.0, 23.0, 22.0, 34.0, 41.0, 64.0, 92.0, 120.0, 168.0, 234.0, 373.0, 542.0, 821.0, 1304.0, 2198.0, 3693.0, 6567.0, 12338.0, 23544.0, 45969.0, 85466.0, 141070.0, 190806.0, 192863.0, 145926.0, 90202.0, 48539.0, 25288.0, 13051.0, 6923.0, 3818.0, 2247.0, 1377.0, 877.0, 594.0, 401.0, 252.0, 178.0, 139.0, 94.0, 83.0, 53.0, 32.0, 31.0, 10.0, 22.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.11846923828125, -2.0455322265625, -1.97259521484375, -1.899658203125, -1.82672119140625, -1.7537841796875, -1.68084716796875, -1.60791015625, -1.53497314453125, -1.4620361328125, -1.38909912109375, -1.316162109375, -1.24322509765625, -1.1702880859375, -1.09735107421875, -1.0244140625, -0.95147705078125, -0.8785400390625, -0.80560302734375, -0.732666015625, -0.65972900390625, -0.5867919921875, -0.51385498046875, -0.44091796875, -0.36798095703125, -0.2950439453125, -0.22210693359375, -0.149169921875, -0.07623291015625, -0.0032958984375, 0.06964111328125, 0.142578125, 0.21551513671875, 0.2884521484375, 0.36138916015625, 0.434326171875, 0.50726318359375, 0.5802001953125, 0.65313720703125, 0.72607421875, 0.79901123046875, 0.8719482421875, 0.94488525390625, 1.017822265625, 1.09075927734375, 1.1636962890625, 1.23663330078125, 1.3095703125, 1.38250732421875, 1.4554443359375, 1.52838134765625, 1.601318359375, 1.67425537109375, 1.7471923828125, 1.82012939453125, 1.89306640625, 1.96600341796875, 2.0389404296875, 2.11187744140625, 2.184814453125, 2.25775146484375, 2.3306884765625, 2.40362548828125, 2.4765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 7.0, 2.0, 4.0, 10.0, 16.0, 20.0, 28.0, 22.0, 42.0, 34.0, 45.0, 58.0, 55.0, 72.0, 65.0, 87.0, 68.0, 60.0, 62.0, 50.0, 44.0, 41.0, 28.0, 24.0, 13.0, 13.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021754205226898193, -0.0002097785472869873, -0.00020201504230499268, -0.00019425153732299805, -0.00018648803234100342, -0.0001787245273590088, -0.00017096102237701416, -0.00016319751739501953, -0.0001554340124130249, -0.00014767050743103027, -0.00013990700244903564, -0.00013214349746704102, -0.0001243799924850464, -0.00011661648750305176, -0.00010885298252105713, -0.0001010894775390625, -9.332597255706787e-05, -8.556246757507324e-05, -7.779896259307861e-05, -7.003545761108398e-05, -6.227195262908936e-05, -5.4508447647094727e-05, -4.67449426651001e-05, -3.898143768310547e-05, -3.121793270111084e-05, -2.345442771911621e-05, -1.5690922737121582e-05, -7.927417755126953e-06, -1.6391277313232422e-07, 7.599592208862305e-06, 1.5363097190856934e-05, 2.3126602172851562e-05, 3.089010715484619e-05, 3.865361213684082e-05, 4.641711711883545e-05, 5.418062210083008e-05, 6.194412708282471e-05, 6.970763206481934e-05, 7.747113704681396e-05, 8.52346420288086e-05, 9.299814701080322e-05, 0.00010076165199279785, 0.00010852515697479248, 0.00011628866195678711, 0.00012405216693878174, 0.00013181567192077637, 0.000139579176902771, 0.00014734268188476562, 0.00015510618686676025, 0.00016286969184875488, 0.0001706331968307495, 0.00017839670181274414, 0.00018616020679473877, 0.0001939237117767334, 0.00020168721675872803, 0.00020945072174072266, 0.00021721422672271729, 0.00022497773170471191, 0.00023274123668670654, 0.00024050474166870117, 0.0002482682466506958, 0.00025603175163269043, 0.00026379525661468506, 0.0002715587615966797]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 1.0, 9.0, 12.0, 16.0, 12.0, 14.0, 26.0, 32.0, 42.0, 61.0, 84.0, 114.0, 116.0, 190.0, 275.0, 495.0, 821.0, 1465.0, 2728.0, 5407.0, 10136.0, 19336.0, 37308.0, 67574.0, 111863.0, 157183.0, 181363.0, 165040.0, 120948.0, 75988.0, 42284.0, 22590.0, 11659.0, 5953.0, 3126.0, 1674.0, 908.0, 575.0, 367.0, 217.0, 143.0, 98.0, 80.0, 58.0, 35.0, 38.0, 23.0, 20.0, 8.0, 13.0, 8.0, 11.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-2.029296875, -1.9670562744140625, -1.904815673828125, -1.8425750732421875, -1.78033447265625, -1.7180938720703125, -1.655853271484375, -1.5936126708984375, -1.5313720703125, -1.4691314697265625, -1.406890869140625, -1.3446502685546875, -1.28240966796875, -1.2201690673828125, -1.157928466796875, -1.0956878662109375, -1.033447265625, -0.9712066650390625, -0.908966064453125, -0.8467254638671875, -0.78448486328125, -0.7222442626953125, -0.660003662109375, -0.5977630615234375, -0.5355224609375, -0.4732818603515625, -0.411041259765625, -0.3488006591796875, -0.28656005859375, -0.2243194580078125, -0.162078857421875, -0.0998382568359375, -0.03759765625, 0.0246429443359375, 0.086883544921875, 0.1491241455078125, 0.21136474609375, 0.2736053466796875, 0.335845947265625, 0.3980865478515625, 0.4603271484375, 0.5225677490234375, 0.584808349609375, 0.6470489501953125, 0.70928955078125, 0.7715301513671875, 0.833770751953125, 0.8960113525390625, 0.958251953125, 1.0204925537109375, 1.082733154296875, 1.1449737548828125, 1.20721435546875, 1.2694549560546875, 1.331695556640625, 1.3939361572265625, 1.4561767578125, 1.5184173583984375, 1.580657958984375, 1.6428985595703125, 1.70513916015625, 1.7673797607421875, 1.829620361328125, 1.8918609619140625, 1.9541015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 4.0, 10.0, 12.0, 17.0, 14.0, 35.0, 36.0, 44.0, 38.0, 39.0, 42.0, 61.0, 64.0, 62.0, 63.0, 60.0, 55.0, 50.0, 50.0, 43.0, 44.0, 24.0, 30.0, 26.0, 13.0, 12.0, 11.0, 6.0, 9.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6356277465820312, -0.6130523681640625, -0.5904769897460938, -0.567901611328125, -0.5453262329101562, -0.5227508544921875, -0.5001754760742188, -0.47760009765625, -0.45502471923828125, -0.4324493408203125, -0.40987396240234375, -0.387298583984375, -0.36472320556640625, -0.3421478271484375, -0.31957244873046875, -0.2969970703125, -0.27442169189453125, -0.2518463134765625, -0.22927093505859375, -0.206695556640625, -0.18412017822265625, -0.1615447998046875, -0.13896942138671875, -0.11639404296875, -0.09381866455078125, -0.0712432861328125, -0.04866790771484375, -0.026092529296875, -0.00351715087890625, 0.0190582275390625, 0.04163360595703125, 0.064208984375, 0.08678436279296875, 0.1093597412109375, 0.13193511962890625, 0.154510498046875, 0.17708587646484375, 0.1996612548828125, 0.22223663330078125, 0.24481201171875, 0.26738739013671875, 0.2899627685546875, 0.31253814697265625, 0.335113525390625, 0.35768890380859375, 0.3802642822265625, 0.40283966064453125, 0.4254150390625, 0.44799041748046875, 0.4705657958984375, 0.49314117431640625, 0.515716552734375, 0.5382919311523438, 0.5608673095703125, 0.5834426879882812, 0.60601806640625, 0.6285934448242188, 0.6511688232421875, 0.6737442016601562, 0.696319580078125, 0.7188949584960938, 0.7414703369140625, 0.7640457153320312, 0.78662109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 5.0, 11.0, 14.0, 12.0, 13.0, 13.0, 16.0, 21.0, 19.0, 35.0, 28.0, 33.0, 35.0, 43.0, 45.0, 64.0, 53.0, 45.0, 55.0, 44.0, 47.0, 35.0, 29.0, 39.0, 39.0, 34.0, 28.0, 27.0, 25.0, 21.0, 8.0, 11.0, 13.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.122591495513916, -4.962081432342529, -4.801571369171143, -4.641060829162598, -4.480550765991211, -4.320040702819824, -4.1595306396484375, -3.9990203380584717, -3.838510036468506, -3.677999973297119, -3.5174896717071533, -3.3569796085357666, -3.196469306945801, -3.035959243774414, -2.8754491806030273, -2.7149388790130615, -2.554428815841675, -2.393918752670288, -2.2334084510803223, -2.0728983879089355, -1.9123880863189697, -1.751878023147583, -1.5913678407669067, -1.4308576583862305, -1.2703474760055542, -1.109837293624878, -0.9493271112442017, -0.7888169884681702, -0.6283068060874939, -0.4677966237068176, -0.30728650093078613, -0.14677631855010986, 0.013733863830566406, 0.17424403131008148, 0.33475419878959656, 0.49526435136795044, 0.6557745337486267, 0.816284716129303, 0.9767948389053345, 1.1373050212860107, 1.297815203666687, 1.4583253860473633, 1.6188355684280396, 1.7793457508087158, 1.9398558139801025, 2.1003661155700684, 2.260876178741455, 2.421386241912842, 2.5818965435028076, 2.7424066066741943, 2.90291690826416, 3.063426971435547, 3.2239372730255127, 3.3844473361968994, 3.5449576377868652, 3.705467700958252, 3.8659777641296387, 4.026487827301025, 4.186997890472412, 4.347508430480957, 4.508018493652344, 4.6685285568237305, 4.829038619995117, 4.989548683166504, 5.150059223175049]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 10.0, 12.0, 15.0, 22.0, 14.0, 30.0, 24.0, 31.0, 29.0, 30.0, 36.0, 53.0, 35.0, 39.0, 42.0, 50.0, 44.0, 47.0, 34.0, 34.0, 36.0, 44.0, 29.0, 31.0, 34.0, 22.0, 21.0, 16.0, 20.0, 11.0, 13.0, 10.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021089553833008, -4.866550922393799, -4.71201229095459, -4.557473182678223, -4.402934551239014, -4.248395919799805, -4.093857288360596, -3.9393186569213867, -3.7847800254821777, -3.6302413940429688, -3.4757025241851807, -3.3211638927459717, -3.1666252613067627, -3.0120863914489746, -2.8575477600097656, -2.7030091285705566, -2.5484702587127686, -2.3939316272735596, -2.2393927574157715, -2.0848541259765625, -1.9303154945373535, -1.775776743888855, -1.6212379932403564, -1.4666993618011475, -1.312160611152649, -1.1576218605041504, -1.0030832290649414, -0.8485444784164429, -0.6940057873725891, -0.5394670963287354, -0.3849283456802368, -0.23038971424102783, -0.0758509635925293, 0.07868774235248566, 0.2332264482975006, 0.38776516914367676, 0.5423038601875305, 0.6968425512313843, 0.8513813018798828, 1.0059199333190918, 1.1604586839675903, 1.3149974346160889, 1.4695360660552979, 1.6240748167037964, 1.778613567352295, 1.933152198791504, 2.087690830230713, 2.242229461669922, 2.39676833152771, 2.551306962966919, 2.705845832824707, 2.860384464263916, 3.014923095703125, 3.169461727142334, 3.324000597000122, 3.478539228439331, 3.633078098297119, 3.787616729736328, 3.942155599594116, 4.096693992614746, 4.251233100891113, 4.405771732330322, 4.560310363769531, 4.71484899520874, 4.869387626647949]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 6.0, 7.0, 23.0, 20.0, 57.0, 79.0, 129.0, 240.0, 389.0, 644.0, 1086.0, 1690.0, 2903.0, 4884.0, 7936.0, 13549.0, 22353.0, 37250.0, 61627.0, 101512.0, 163475.0, 256915.0, 380127.0, 509729.0, 596424.0, 583854.0, 486224.0, 353835.0, 234928.0, 147725.0, 90589.0, 54667.0, 32431.0, 19222.0, 11378.0, 6745.0, 3961.0, 2298.0, 1391.0, 827.0, 479.0, 264.0, 172.0, 107.0, 53.0, 35.0, 21.0, 15.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.25, -4.128204345703125, -4.00640869140625, -3.884613037109375, -3.7628173828125, -3.641021728515625, -3.51922607421875, -3.397430419921875, -3.275634765625, -3.153839111328125, -3.03204345703125, -2.910247802734375, -2.7884521484375, -2.666656494140625, -2.54486083984375, -2.423065185546875, -2.30126953125, -2.179473876953125, -2.05767822265625, -1.935882568359375, -1.8140869140625, -1.692291259765625, -1.57049560546875, -1.448699951171875, -1.326904296875, -1.205108642578125, -1.08331298828125, -0.961517333984375, -0.8397216796875, -0.717926025390625, -0.59613037109375, -0.474334716796875, -0.3525390625, -0.230743408203125, -0.10894775390625, 0.012847900390625, 0.1346435546875, 0.256439208984375, 0.37823486328125, 0.500030517578125, 0.621826171875, 0.743621826171875, 0.86541748046875, 0.987213134765625, 1.1090087890625, 1.230804443359375, 1.35260009765625, 1.474395751953125, 1.59619140625, 1.717987060546875, 1.83978271484375, 1.961578369140625, 2.0833740234375, 2.205169677734375, 2.32696533203125, 2.448760986328125, 2.570556640625, 2.692352294921875, 2.81414794921875, 2.935943603515625, 3.0577392578125, 3.179534912109375, 3.30133056640625, 3.423126220703125, 3.544921875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 6.0, 11.0, 4.0, 7.0, 14.0, 14.0, 19.0, 17.0, 18.0, 26.0, 28.0, 38.0, 37.0, 27.0, 44.0, 35.0, 50.0, 34.0, 43.0, 57.0, 42.0, 41.0, 30.0, 50.0, 40.0, 39.0, 34.0, 32.0, 21.0, 26.0, 15.0, 23.0, 15.0, 11.0, 8.0, 11.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.479644775390625, -3.35577392578125, -3.231903076171875, -3.1080322265625, -2.984161376953125, -2.86029052734375, -2.736419677734375, -2.612548828125, -2.488677978515625, -2.36480712890625, -2.240936279296875, -2.1170654296875, -1.993194580078125, -1.86932373046875, -1.745452880859375, -1.62158203125, -1.497711181640625, -1.37384033203125, -1.249969482421875, -1.1260986328125, -1.002227783203125, -0.87835693359375, -0.754486083984375, -0.630615234375, -0.506744384765625, -0.38287353515625, -0.259002685546875, -0.1351318359375, -0.011260986328125, 0.11260986328125, 0.236480712890625, 0.3603515625, 0.484222412109375, 0.60809326171875, 0.731964111328125, 0.8558349609375, 0.979705810546875, 1.10357666015625, 1.227447509765625, 1.351318359375, 1.475189208984375, 1.59906005859375, 1.722930908203125, 1.8468017578125, 1.970672607421875, 2.09454345703125, 2.218414306640625, 2.34228515625, 2.466156005859375, 2.59002685546875, 2.713897705078125, 2.8377685546875, 2.961639404296875, 3.08551025390625, 3.209381103515625, 3.333251953125, 3.457122802734375, 3.58099365234375, 3.704864501953125, 3.8287353515625, 3.952606201171875, 4.07647705078125, 4.200347900390625, 4.32421875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 16.0, 15.0, 31.0, 70.0, 82.0, 164.0, 277.0, 460.0, 914.0, 1554.0, 2873.0, 5252.0, 9363.0, 17180.0, 29773.0, 51312.0, 86806.0, 142476.0, 221547.0, 327103.0, 444346.0, 539694.0, 570593.0, 520358.0, 416514.0, 299272.0, 199450.0, 126904.0, 76408.0, 44967.0, 25758.0, 14409.0, 8047.0, 4601.0, 2482.0, 1438.0, 781.0, 448.0, 216.0, 147.0, 78.0, 38.0, 24.0, 20.0, 7.0, 8.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.359375, -4.23614501953125, -4.1129150390625, -3.98968505859375, -3.866455078125, -3.74322509765625, -3.6199951171875, -3.49676513671875, -3.37353515625, -3.25030517578125, -3.1270751953125, -3.00384521484375, -2.880615234375, -2.75738525390625, -2.6341552734375, -2.51092529296875, -2.3876953125, -2.26446533203125, -2.1412353515625, -2.01800537109375, -1.894775390625, -1.77154541015625, -1.6483154296875, -1.52508544921875, -1.40185546875, -1.27862548828125, -1.1553955078125, -1.03216552734375, -0.908935546875, -0.78570556640625, -0.6624755859375, -0.53924560546875, -0.416015625, -0.29278564453125, -0.1695556640625, -0.04632568359375, 0.076904296875, 0.20013427734375, 0.3233642578125, 0.44659423828125, 0.56982421875, 0.69305419921875, 0.8162841796875, 0.93951416015625, 1.062744140625, 1.18597412109375, 1.3092041015625, 1.43243408203125, 1.5556640625, 1.67889404296875, 1.8021240234375, 1.92535400390625, 2.048583984375, 2.17181396484375, 2.2950439453125, 2.41827392578125, 2.54150390625, 2.66473388671875, 2.7879638671875, 2.91119384765625, 3.034423828125, 3.15765380859375, 3.2808837890625, 3.40411376953125, 3.52734375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 11.0, 14.0, 12.0, 13.0, 25.0, 32.0, 33.0, 45.0, 44.0, 60.0, 93.0, 88.0, 118.0, 137.0, 160.0, 183.0, 183.0, 214.0, 236.0, 252.0, 241.0, 258.0, 233.0, 186.0, 204.0, 166.0, 132.0, 136.0, 107.0, 96.0, 70.0, 69.0, 47.0, 32.0, 28.0, 29.0, 17.0, 21.0, 15.0, 9.0, 5.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.650390625, -1.595611572265625, -1.54083251953125, -1.486053466796875, -1.4312744140625, -1.376495361328125, -1.32171630859375, -1.266937255859375, -1.212158203125, -1.157379150390625, -1.10260009765625, -1.047821044921875, -0.9930419921875, -0.938262939453125, -0.88348388671875, -0.828704833984375, -0.77392578125, -0.719146728515625, -0.66436767578125, -0.609588623046875, -0.5548095703125, -0.500030517578125, -0.44525146484375, -0.390472412109375, -0.335693359375, -0.280914306640625, -0.22613525390625, -0.171356201171875, -0.1165771484375, -0.061798095703125, -0.00701904296875, 0.047760009765625, 0.1025390625, 0.157318115234375, 0.21209716796875, 0.266876220703125, 0.3216552734375, 0.376434326171875, 0.43121337890625, 0.485992431640625, 0.540771484375, 0.595550537109375, 0.65032958984375, 0.705108642578125, 0.7598876953125, 0.814666748046875, 0.86944580078125, 0.924224853515625, 0.97900390625, 1.033782958984375, 1.08856201171875, 1.143341064453125, 1.1981201171875, 1.252899169921875, 1.30767822265625, 1.362457275390625, 1.417236328125, 1.472015380859375, 1.52679443359375, 1.581573486328125, 1.6363525390625, 1.691131591796875, 1.74591064453125, 1.800689697265625, 1.85546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 14.0, 17.0, 9.0, 16.0, 22.0, 30.0, 33.0, 36.0, 46.0, 35.0, 50.0, 43.0, 53.0, 56.0, 51.0, 52.0, 52.0, 39.0, 45.0, 36.0, 42.0, 39.0, 29.0, 22.0, 31.0, 15.0, 10.0, 15.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9960076808929443, -3.8486523628234863, -3.7012972831726074, -3.5539419651031494, -3.4065866470336914, -3.2592313289642334, -3.1118760108947754, -2.9645209312438965, -2.8171656131744385, -2.6698102951049805, -2.5224552154541016, -2.3750998973846436, -2.2277445793151855, -2.0803892612457275, -1.933034062385559, -1.7856788635253906, -1.6383235454559326, -1.4909682273864746, -1.3436130285263062, -1.1962578296661377, -1.0489025115966797, -0.9015472531318665, -0.7541919946670532, -0.6068367958068848, -0.45948147773742676, -0.3121262192726135, -0.1647709608078003, -0.01741570234298706, 0.12993955612182617, 0.2772948145866394, 0.42465007305145264, 0.5720052719116211, 0.7193608283996582, 0.8667160868644714, 1.0140713453292847, 1.1614265441894531, 1.3087818622589111, 1.4561371803283691, 1.6034923791885376, 1.750847578048706, 1.898202896118164, 2.045558214187622, 2.19291353225708, 2.340268611907959, 2.487623929977417, 2.634979248046875, 2.782334327697754, 2.929689645767212, 3.07704496383667, 3.224400281906128, 3.371755599975586, 3.519110679626465, 3.666465997695923, 3.813821315765381, 3.9611763954162598, 4.108531951904297, 4.255887031555176, 4.403242111206055, 4.550597667694092, 4.697952747344971, 4.845308303833008, 4.992663383483887, 5.140018463134766, 5.2873735427856445, 5.434729099273682]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 7.0, 11.0, 11.0, 8.0, 13.0, 14.0, 17.0, 14.0, 22.0, 28.0, 26.0, 27.0, 26.0, 32.0, 41.0, 43.0, 33.0, 49.0, 32.0, 38.0, 43.0, 48.0, 27.0, 49.0, 40.0, 39.0, 30.0, 34.0, 23.0, 30.0, 21.0, 18.0, 21.0, 13.0, 16.0, 9.0, 8.0, 6.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.188475131988525, -4.064115047454834, -3.9397549629211426, -3.815394878387451, -3.6910347938537598, -3.5666747093200684, -3.442314624786377, -3.3179545402526855, -3.193594455718994, -3.0692343711853027, -2.9448742866516113, -2.82051420211792, -2.6961541175842285, -2.571794033050537, -2.4474339485168457, -2.3230738639831543, -2.198714017868042, -2.0743539333343506, -1.9499938488006592, -1.8256337642669678, -1.7012736797332764, -1.576913595199585, -1.452553629875183, -1.3281935453414917, -1.2038334608078003, -1.0794733762741089, -0.9551132917404175, -0.8307532668113708, -0.7063931822776794, -0.582033097743988, -0.4576730728149414, -0.33331298828125, -0.2089526653289795, -0.08459259569644928, 0.03976747393608093, 0.16412752866744995, 0.28848761320114136, 0.41284769773483276, 0.5372077226638794, 0.6615678071975708, 0.7859278917312622, 0.9102879762649536, 1.034648060798645, 1.1590080261230469, 1.2833681106567383, 1.4077281951904297, 1.532088279724121, 1.6564483642578125, 1.780808448791504, 1.9051685333251953, 2.0295286178588867, 2.153888702392578, 2.2782487869262695, 2.402608871459961, 2.5269689559936523, 2.6513290405273438, 2.775689125061035, 2.9000492095947266, 3.024409294128418, 3.1487693786621094, 3.273129463195801, 3.397489547729492, 3.5218496322631836, 3.646209716796875, 3.7705695629119873]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 12.0, 20.0, 21.0, 40.0, 43.0, 75.0, 118.0, 201.0, 270.0, 446.0, 753.0, 1254.0, 2168.0, 3897.0, 7795.0, 16462.0, 37349.0, 88790.0, 210077.0, 326745.0, 199994.0, 84234.0, 35627.0, 15628.0, 7339.0, 3846.0, 2159.0, 1229.0, 720.0, 419.0, 287.0, 169.0, 100.0, 91.0, 48.0, 36.0, 21.0, 17.0, 12.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.27288818359375, -5.0809326171875, -4.88897705078125, -4.697021484375, -4.50506591796875, -4.3131103515625, -4.12115478515625, -3.92919921875, -3.73724365234375, -3.5452880859375, -3.35333251953125, -3.161376953125, -2.96942138671875, -2.7774658203125, -2.58551025390625, -2.3935546875, -2.20159912109375, -2.0096435546875, -1.81768798828125, -1.625732421875, -1.43377685546875, -1.2418212890625, -1.04986572265625, -0.85791015625, -0.66595458984375, -0.4739990234375, -0.28204345703125, -0.090087890625, 0.10186767578125, 0.2938232421875, 0.48577880859375, 0.677734375, 0.86968994140625, 1.0616455078125, 1.25360107421875, 1.445556640625, 1.63751220703125, 1.8294677734375, 2.02142333984375, 2.21337890625, 2.40533447265625, 2.5972900390625, 2.78924560546875, 2.981201171875, 3.17315673828125, 3.3651123046875, 3.55706787109375, 3.7490234375, 3.94097900390625, 4.1329345703125, 4.32489013671875, 4.516845703125, 4.70880126953125, 4.9007568359375, 5.09271240234375, 5.28466796875, 5.47662353515625, 5.6685791015625, 5.86053466796875, 6.052490234375, 6.24444580078125, 6.4364013671875, 6.62835693359375, 6.8203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 9.0, 12.0, 11.0, 13.0, 9.0, 20.0, 15.0, 14.0, 22.0, 34.0, 20.0, 32.0, 30.0, 25.0, 30.0, 31.0, 40.0, 40.0, 46.0, 44.0, 37.0, 33.0, 45.0, 44.0, 30.0, 35.0, 21.0, 31.0, 24.0, 22.0, 18.0, 22.0, 19.0, 21.0, 14.0, 19.0, 13.0, 6.0, 9.0, 10.0, 3.0, 1.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.728515625, -3.610595703125, -3.49267578125, -3.374755859375, -3.2568359375, -3.138916015625, -3.02099609375, -2.903076171875, -2.78515625, -2.667236328125, -2.54931640625, -2.431396484375, -2.3134765625, -2.195556640625, -2.07763671875, -1.959716796875, -1.841796875, -1.723876953125, -1.60595703125, -1.488037109375, -1.3701171875, -1.252197265625, -1.13427734375, -1.016357421875, -0.8984375, -0.780517578125, -0.66259765625, -0.544677734375, -0.4267578125, -0.308837890625, -0.19091796875, -0.072998046875, 0.044921875, 0.162841796875, 0.28076171875, 0.398681640625, 0.5166015625, 0.634521484375, 0.75244140625, 0.870361328125, 0.98828125, 1.106201171875, 1.22412109375, 1.342041015625, 1.4599609375, 1.577880859375, 1.69580078125, 1.813720703125, 1.931640625, 2.049560546875, 2.16748046875, 2.285400390625, 2.4033203125, 2.521240234375, 2.63916015625, 2.757080078125, 2.875, 2.992919921875, 3.11083984375, 3.228759765625, 3.3466796875, 3.464599609375, 3.58251953125, 3.700439453125, 3.818359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 12.0, 20.0, 27.0, 37.0, 52.0, 86.0, 98.0, 141.0, 180.0, 271.0, 363.0, 508.0, 722.0, 1086.0, 1759.0, 2833.0, 4528.0, 8055.0, 15187.0, 31146.0, 69167.0, 161390.0, 309219.0, 240138.0, 106288.0, 46141.0, 21544.0, 11107.0, 5991.0, 3616.0, 2211.0, 1424.0, 978.0, 662.0, 455.0, 333.0, 229.0, 148.0, 107.0, 80.0, 60.0, 48.0, 22.0, 23.0, 21.0, 11.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-4.29296875, -4.16943359375, -4.0458984375, -3.92236328125, -3.798828125, -3.67529296875, -3.5517578125, -3.42822265625, -3.3046875, -3.18115234375, -3.0576171875, -2.93408203125, -2.810546875, -2.68701171875, -2.5634765625, -2.43994140625, -2.31640625, -2.19287109375, -2.0693359375, -1.94580078125, -1.822265625, -1.69873046875, -1.5751953125, -1.45166015625, -1.328125, -1.20458984375, -1.0810546875, -0.95751953125, -0.833984375, -0.71044921875, -0.5869140625, -0.46337890625, -0.33984375, -0.21630859375, -0.0927734375, 0.03076171875, 0.154296875, 0.27783203125, 0.4013671875, 0.52490234375, 0.6484375, 0.77197265625, 0.8955078125, 1.01904296875, 1.142578125, 1.26611328125, 1.3896484375, 1.51318359375, 1.63671875, 1.76025390625, 1.8837890625, 2.00732421875, 2.130859375, 2.25439453125, 2.3779296875, 2.50146484375, 2.625, 2.74853515625, 2.8720703125, 2.99560546875, 3.119140625, 3.24267578125, 3.3662109375, 3.48974609375, 3.61328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 8.0, 10.0, 12.0, 13.0, 13.0, 19.0, 13.0, 20.0, 19.0, 28.0, 28.0, 18.0, 27.0, 32.0, 42.0, 43.0, 24.0, 33.0, 31.0, 32.0, 39.0, 48.0, 38.0, 40.0, 42.0, 34.0, 41.0, 24.0, 34.0, 24.0, 21.0, 19.0, 20.0, 14.0, 15.0, 17.0, 7.0, 14.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.404296875, -2.32501220703125, -2.2457275390625, -2.16644287109375, -2.087158203125, -2.00787353515625, -1.9285888671875, -1.84930419921875, -1.77001953125, -1.69073486328125, -1.6114501953125, -1.53216552734375, -1.452880859375, -1.37359619140625, -1.2943115234375, -1.21502685546875, -1.1357421875, -1.05645751953125, -0.9771728515625, -0.89788818359375, -0.818603515625, -0.73931884765625, -0.6600341796875, -0.58074951171875, -0.50146484375, -0.42218017578125, -0.3428955078125, -0.26361083984375, -0.184326171875, -0.10504150390625, -0.0257568359375, 0.05352783203125, 0.1328125, 0.21209716796875, 0.2913818359375, 0.37066650390625, 0.449951171875, 0.52923583984375, 0.6085205078125, 0.68780517578125, 0.76708984375, 0.84637451171875, 0.9256591796875, 1.00494384765625, 1.084228515625, 1.16351318359375, 1.2427978515625, 1.32208251953125, 1.4013671875, 1.48065185546875, 1.5599365234375, 1.63922119140625, 1.718505859375, 1.79779052734375, 1.8770751953125, 1.95635986328125, 2.03564453125, 2.11492919921875, 2.1942138671875, 2.27349853515625, 2.352783203125, 2.43206787109375, 2.5113525390625, 2.59063720703125, 2.669921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 7.0, 16.0, 29.0, 47.0, 63.0, 104.0, 187.0, 272.0, 453.0, 649.0, 1083.0, 1812.0, 3224.0, 6522.0, 15726.0, 61687.0, 695563.0, 210619.0, 29825.0, 10017.0, 4678.0, 2360.0, 1365.0, 771.0, 487.0, 339.0, 234.0, 136.0, 105.0, 58.0, 35.0, 22.0, 19.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.0645751953125, -5.867431640625, -5.6702880859375, -5.47314453125, -5.2760009765625, -5.078857421875, -4.8817138671875, -4.6845703125, -4.4874267578125, -4.290283203125, -4.0931396484375, -3.89599609375, -3.6988525390625, -3.501708984375, -3.3045654296875, -3.107421875, -2.9102783203125, -2.713134765625, -2.5159912109375, -2.31884765625, -2.1217041015625, -1.924560546875, -1.7274169921875, -1.5302734375, -1.3331298828125, -1.135986328125, -0.9388427734375, -0.74169921875, -0.5445556640625, -0.347412109375, -0.1502685546875, 0.046875, 0.2440185546875, 0.441162109375, 0.6383056640625, 0.83544921875, 1.0325927734375, 1.229736328125, 1.4268798828125, 1.6240234375, 1.8211669921875, 2.018310546875, 2.2154541015625, 2.41259765625, 2.6097412109375, 2.806884765625, 3.0040283203125, 3.201171875, 3.3983154296875, 3.595458984375, 3.7926025390625, 3.98974609375, 4.1868896484375, 4.384033203125, 4.5811767578125, 4.7783203125, 4.9754638671875, 5.172607421875, 5.3697509765625, 5.56689453125, 5.7640380859375, 5.961181640625, 6.1583251953125, 6.35546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 10.0, 9.0, 22.0, 27.0, 68.0, 142.0, 287.0, 206.0, 94.0, 51.0, 20.0, 22.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008754730224609375, -0.0008528754115104675, -0.0008302778005599976, -0.0008076801896095276, -0.0007850825786590576, -0.0007624849677085876, -0.0007398873567581177, -0.0007172897458076477, -0.0006946921348571777, -0.0006720945239067078, -0.0006494969129562378, -0.0006268993020057678, -0.0006043016910552979, -0.0005817040801048279, -0.0005591064691543579, -0.0005365088582038879, -0.000513911247253418, -0.000491313636302948, -0.00046871602535247803, -0.00044611841440200806, -0.0004235208034515381, -0.0004009231925010681, -0.00037832558155059814, -0.0003557279706001282, -0.0003331303596496582, -0.00031053274869918823, -0.00028793513774871826, -0.0002653375267982483, -0.00024273991584777832, -0.00022014230489730835, -0.00019754469394683838, -0.0001749470829963684, -0.00015234947204589844, -0.00012975186109542847, -0.0001071542501449585, -8.455663919448853e-05, -6.195902824401855e-05, -3.9361417293548584e-05, -1.6763806343078613e-05, 5.833804607391357e-06, 2.8431415557861328e-05, 5.10290265083313e-05, 7.362663745880127e-05, 9.622424840927124e-05, 0.00011882185935974121, 0.00014141947031021118, 0.00016401708126068115, 0.00018661469221115112, 0.0002092123031616211, 0.00023180991411209106, 0.00025440752506256104, 0.000277005136013031, 0.000299602746963501, 0.00032220035791397095, 0.0003447979688644409, 0.0003673955798149109, 0.00038999319076538086, 0.00041259080171585083, 0.0004351884126663208, 0.00045778602361679077, 0.00048038363456726074, 0.0005029812455177307, 0.0005255788564682007, 0.0005481764674186707, 0.0005707740783691406]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 16.0, 23.0, 32.0, 48.0, 52.0, 85.0, 126.0, 179.0, 230.0, 373.0, 496.0, 657.0, 986.0, 1409.0, 2205.0, 3412.0, 5424.0, 9344.0, 18558.0, 42486.0, 120809.0, 370820.0, 304261.0, 93817.0, 34234.0, 15770.0, 8360.0, 4780.0, 3125.0, 2008.0, 1319.0, 909.0, 615.0, 477.0, 316.0, 236.0, 145.0, 121.0, 87.0, 65.0, 37.0, 27.0, 17.0, 13.0, 9.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.935546875, -3.808135986328125, -3.68072509765625, -3.553314208984375, -3.4259033203125, -3.298492431640625, -3.17108154296875, -3.043670654296875, -2.916259765625, -2.788848876953125, -2.66143798828125, -2.534027099609375, -2.4066162109375, -2.279205322265625, -2.15179443359375, -2.024383544921875, -1.89697265625, -1.769561767578125, -1.64215087890625, -1.514739990234375, -1.3873291015625, -1.259918212890625, -1.13250732421875, -1.005096435546875, -0.877685546875, -0.750274658203125, -0.62286376953125, -0.495452880859375, -0.3680419921875, -0.240631103515625, -0.11322021484375, 0.014190673828125, 0.1416015625, 0.269012451171875, 0.39642333984375, 0.523834228515625, 0.6512451171875, 0.778656005859375, 0.90606689453125, 1.033477783203125, 1.160888671875, 1.288299560546875, 1.41571044921875, 1.543121337890625, 1.6705322265625, 1.797943115234375, 1.92535400390625, 2.052764892578125, 2.18017578125, 2.307586669921875, 2.43499755859375, 2.562408447265625, 2.6898193359375, 2.817230224609375, 2.94464111328125, 3.072052001953125, 3.199462890625, 3.326873779296875, 3.45428466796875, 3.581695556640625, 3.7091064453125, 3.836517333984375, 3.96392822265625, 4.091339111328125, 4.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 4.0, 4.0, 4.0, 6.0, 15.0, 14.0, 19.0, 31.0, 40.0, 63.0, 49.0, 71.0, 72.0, 103.0, 92.0, 86.0, 69.0, 60.0, 46.0, 27.0, 25.0, 15.0, 13.0, 11.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.97802734375, -0.95001220703125, -0.9219970703125, -0.89398193359375, -0.865966796875, -0.83795166015625, -0.8099365234375, -0.78192138671875, -0.75390625, -0.72589111328125, -0.6978759765625, -0.66986083984375, -0.641845703125, -0.61383056640625, -0.5858154296875, -0.55780029296875, -0.52978515625, -0.50177001953125, -0.4737548828125, -0.44573974609375, -0.417724609375, -0.38970947265625, -0.3616943359375, -0.33367919921875, -0.3056640625, -0.27764892578125, -0.2496337890625, -0.22161865234375, -0.193603515625, -0.16558837890625, -0.1375732421875, -0.10955810546875, -0.08154296875, -0.05352783203125, -0.0255126953125, 0.00250244140625, 0.030517578125, 0.05853271484375, 0.0865478515625, 0.11456298828125, 0.142578125, 0.17059326171875, 0.1986083984375, 0.22662353515625, 0.254638671875, 0.28265380859375, 0.3106689453125, 0.33868408203125, 0.36669921875, 0.39471435546875, 0.4227294921875, 0.45074462890625, 0.478759765625, 0.50677490234375, 0.5347900390625, 0.56280517578125, 0.5908203125, 0.61883544921875, 0.6468505859375, 0.67486572265625, 0.702880859375, 0.73089599609375, 0.7589111328125, 0.78692626953125, 0.81494140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 18.0, 17.0, 30.0, 26.0, 30.0, 40.0, 45.0, 37.0, 37.0, 37.0, 35.0, 39.0, 49.0, 54.0, 49.0, 42.0, 33.0, 38.0, 24.0, 32.0, 32.0, 26.0, 31.0, 17.0, 24.0, 19.0, 11.0, 12.0, 6.0, 6.0, 13.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6007587909698486, -3.4782354831695557, -3.3557121753692627, -3.2331888675689697, -3.1106653213500977, -2.9881420135498047, -2.8656187057495117, -2.7430953979492188, -2.620572090148926, -2.498048782348633, -2.37552547454834, -2.253002166748047, -2.130478858947754, -2.007955551147461, -1.8854320049285889, -1.762908697128296, -1.640385389328003, -1.51786208152771, -1.395338773727417, -1.2728153467178345, -1.1502920389175415, -1.0277687311172485, -0.9052453637123108, -0.782721996307373, -0.6601986885070801, -0.5376753807067871, -0.41515201330184937, -0.292628675699234, -0.17010533809661865, -0.047582030296325684, 0.07494133710861206, 0.1974647045135498, 0.3199882507324219, 0.44251158833503723, 0.5650349259376526, 0.6875582933425903, 0.8100816011428833, 0.9326049089431763, 1.0551283359527588, 1.1776516437530518, 1.3001749515533447, 1.4226982593536377, 1.5452215671539307, 1.6677449941635132, 1.7902683019638062, 1.9127916097640991, 2.0353150367736816, 2.1578383445739746, 2.2803616523742676, 2.4028849601745605, 2.5254082679748535, 2.6479315757751465, 2.7704548835754395, 2.8929781913757324, 3.0155017375946045, 3.1380250453948975, 3.2605483531951904, 3.3830716609954834, 3.5055949687957764, 3.6281182765960693, 3.7506418228149414, 3.8731651306152344, 3.9956884384155273, 4.11821174621582, 4.240735054016113]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 13.0, 11.0, 7.0, 15.0, 12.0, 21.0, 12.0, 23.0, 17.0, 26.0, 25.0, 29.0, 33.0, 39.0, 30.0, 42.0, 40.0, 43.0, 52.0, 30.0, 38.0, 39.0, 41.0, 49.0, 39.0, 34.0, 34.0, 19.0, 25.0, 26.0, 23.0, 14.0, 15.0, 14.0, 12.0, 7.0, 3.0, 12.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.016229152679443, -3.8973805904388428, -3.778532028198242, -3.6596834659576416, -3.540834903717041, -3.4219865798950195, -3.303138017654419, -3.1842894554138184, -3.0654408931732178, -2.946592330932617, -2.8277437686920166, -2.708895206451416, -2.5900468826293945, -2.471198081970215, -2.3523497581481934, -2.2335011959075928, -2.114652633666992, -1.9958040714263916, -1.876955509185791, -1.75810706615448, -1.6392585039138794, -1.5204099416732788, -1.4015614986419678, -1.2827129364013672, -1.1638643741607666, -1.045015811920166, -0.9261673092842102, -0.8073188066482544, -0.6884702444076538, -0.5696216821670532, -0.4507731795310974, -0.3319246768951416, -0.21307611465454102, -0.09422758221626282, 0.02462095022201538, 0.14346948266029358, 0.2623180150985718, 0.38116657733917236, 0.5000150799751282, 0.618863582611084, 0.7377121448516846, 0.8565607070922852, 0.975409209728241, 1.0942577123641968, 1.2131062746047974, 1.331954836845398, 1.450803279876709, 1.5696518421173096, 1.6885004043579102, 1.8073489665985107, 1.9261975288391113, 2.045046091079712, 2.1638946533203125, 2.282742977142334, 2.4015915393829346, 2.520440101623535, 2.6392886638641357, 2.7581372261047363, 2.876985788345337, 2.9958343505859375, 3.114682674407959, 3.2335314750671387, 3.35237979888916, 3.4712283611297607, 3.5900769233703613]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 13.0, 12.0, 16.0, 31.0, 41.0, 61.0, 97.0, 136.0, 200.0, 310.0, 487.0, 710.0, 1082.0, 1701.0, 2751.0, 4259.0, 6712.0, 10392.0, 16315.0, 24860.0, 37364.0, 53346.0, 72787.0, 92835.0, 110228.0, 118796.0, 115629.0, 102177.0, 82811.0, 62211.0, 44310.0, 30027.0, 19990.0, 12816.0, 8378.0, 5220.0, 3376.0, 2107.0, 1356.0, 857.0, 602.0, 352.0, 246.0, 183.0, 134.0, 65.0, 48.0, 36.0, 20.0, 19.0, 13.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 11.0, 9.0, 16.0, 12.0, 15.0, 18.0, 30.0, 18.0, 19.0, 39.0, 23.0, 26.0, 35.0, 41.0, 40.0, 32.0, 43.0, 41.0, 42.0, 42.0, 46.0, 36.0, 46.0, 41.0, 38.0, 29.0, 26.0, 36.0, 26.0, 18.0, 16.0, 14.0, 14.0, 10.0, 10.0, 7.0, 4.0, 8.0, 1.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.865234375, -3.747894287109375, -3.63055419921875, -3.513214111328125, -3.3958740234375, -3.278533935546875, -3.16119384765625, -3.043853759765625, -2.926513671875, -2.809173583984375, -2.69183349609375, -2.574493408203125, -2.4571533203125, -2.339813232421875, -2.22247314453125, -2.105133056640625, -1.98779296875, -1.870452880859375, -1.75311279296875, -1.635772705078125, -1.5184326171875, -1.401092529296875, -1.28375244140625, -1.166412353515625, -1.049072265625, -0.931732177734375, -0.81439208984375, -0.697052001953125, -0.5797119140625, -0.462371826171875, -0.34503173828125, -0.227691650390625, -0.1103515625, 0.006988525390625, 0.12432861328125, 0.241668701171875, 0.3590087890625, 0.476348876953125, 0.59368896484375, 0.711029052734375, 0.828369140625, 0.945709228515625, 1.06304931640625, 1.180389404296875, 1.2977294921875, 1.415069580078125, 1.53240966796875, 1.649749755859375, 1.76708984375, 1.884429931640625, 2.00177001953125, 2.119110107421875, 2.2364501953125, 2.353790283203125, 2.47113037109375, 2.588470458984375, 2.705810546875, 2.823150634765625, 2.94049072265625, 3.057830810546875, 3.1751708984375, 3.292510986328125, 3.40985107421875, 3.527191162109375, 3.64453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 13.0, 14.0, 29.0, 43.0, 79.0, 125.0, 191.0, 292.0, 549.0, 790.0, 1393.0, 2312.0, 3759.0, 6144.0, 10282.0, 16606.0, 26349.0, 40187.0, 58723.0, 81777.0, 105485.0, 121920.0, 126443.0, 118413.0, 99664.0, 76025.0, 53878.0, 35964.0, 23340.0, 14671.0, 9080.0, 5587.0, 3328.0, 2023.0, 1261.0, 683.0, 440.0, 285.0, 152.0, 82.0, 72.0, 40.0, 23.0, 15.0, 10.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.15625, -4.0194091796875, -3.882568359375, -3.7457275390625, -3.60888671875, -3.4720458984375, -3.335205078125, -3.1983642578125, -3.0615234375, -2.9246826171875, -2.787841796875, -2.6510009765625, -2.51416015625, -2.3773193359375, -2.240478515625, -2.1036376953125, -1.966796875, -1.8299560546875, -1.693115234375, -1.5562744140625, -1.41943359375, -1.2825927734375, -1.145751953125, -1.0089111328125, -0.8720703125, -0.7352294921875, -0.598388671875, -0.4615478515625, -0.32470703125, -0.1878662109375, -0.051025390625, 0.0858154296875, 0.22265625, 0.3594970703125, 0.496337890625, 0.6331787109375, 0.77001953125, 0.9068603515625, 1.043701171875, 1.1805419921875, 1.3173828125, 1.4542236328125, 1.591064453125, 1.7279052734375, 1.86474609375, 2.0015869140625, 2.138427734375, 2.2752685546875, 2.412109375, 2.5489501953125, 2.685791015625, 2.8226318359375, 2.95947265625, 3.0963134765625, 3.233154296875, 3.3699951171875, 3.5068359375, 3.6436767578125, 3.780517578125, 3.9173583984375, 4.05419921875, 4.1910400390625, 4.327880859375, 4.4647216796875, 4.6015625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 10.0, 11.0, 18.0, 8.0, 11.0, 14.0, 22.0, 21.0, 31.0, 28.0, 31.0, 39.0, 36.0, 24.0, 37.0, 41.0, 41.0, 46.0, 44.0, 38.0, 44.0, 53.0, 29.0, 41.0, 36.0, 27.0, 20.0, 29.0, 25.0, 17.0, 18.0, 15.0, 21.0, 18.0, 11.0, 8.0, 8.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.303192138671875, -2.22552490234375, -2.147857666015625, -2.0701904296875, -1.992523193359375, -1.91485595703125, -1.837188720703125, -1.759521484375, -1.681854248046875, -1.60418701171875, -1.526519775390625, -1.4488525390625, -1.371185302734375, -1.29351806640625, -1.215850830078125, -1.13818359375, -1.060516357421875, -0.98284912109375, -0.905181884765625, -0.8275146484375, -0.749847412109375, -0.67218017578125, -0.594512939453125, -0.516845703125, -0.439178466796875, -0.36151123046875, -0.283843994140625, -0.2061767578125, -0.128509521484375, -0.05084228515625, 0.026824951171875, 0.1044921875, 0.182159423828125, 0.25982666015625, 0.337493896484375, 0.4151611328125, 0.492828369140625, 0.57049560546875, 0.648162841796875, 0.725830078125, 0.803497314453125, 0.88116455078125, 0.958831787109375, 1.0364990234375, 1.114166259765625, 1.19183349609375, 1.269500732421875, 1.34716796875, 1.424835205078125, 1.50250244140625, 1.580169677734375, 1.6578369140625, 1.735504150390625, 1.81317138671875, 1.890838623046875, 1.968505859375, 2.046173095703125, 2.12384033203125, 2.201507568359375, 2.2791748046875, 2.356842041015625, 2.43450927734375, 2.512176513671875, 2.58984375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 13.0, 22.0, 19.0, 42.0, 54.0, 78.0, 110.0, 167.0, 191.0, 348.0, 452.0, 686.0, 991.0, 1628.0, 2673.0, 4959.0, 9748.0, 21169.0, 48439.0, 111224.0, 213081.0, 267553.0, 191670.0, 95153.0, 40639.0, 17735.0, 8366.0, 4438.0, 2430.0, 1563.0, 908.0, 598.0, 430.0, 284.0, 207.0, 155.0, 81.0, 72.0, 44.0, 36.0, 22.0, 20.0, 15.0, 15.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.25616455078125, -3.1490478515625, -3.04193115234375, -2.934814453125, -2.82769775390625, -2.7205810546875, -2.61346435546875, -2.50634765625, -2.39923095703125, -2.2921142578125, -2.18499755859375, -2.077880859375, -1.97076416015625, -1.8636474609375, -1.75653076171875, -1.6494140625, -1.54229736328125, -1.4351806640625, -1.32806396484375, -1.220947265625, -1.11383056640625, -1.0067138671875, -0.89959716796875, -0.79248046875, -0.68536376953125, -0.5782470703125, -0.47113037109375, -0.364013671875, -0.25689697265625, -0.1497802734375, -0.04266357421875, 0.064453125, 0.17156982421875, 0.2786865234375, 0.38580322265625, 0.492919921875, 0.60003662109375, 0.7071533203125, 0.81427001953125, 0.92138671875, 1.02850341796875, 1.1356201171875, 1.24273681640625, 1.349853515625, 1.45697021484375, 1.5640869140625, 1.67120361328125, 1.7783203125, 1.88543701171875, 1.9925537109375, 2.09967041015625, 2.206787109375, 2.31390380859375, 2.4210205078125, 2.52813720703125, 2.63525390625, 2.74237060546875, 2.8494873046875, 2.95660400390625, 3.063720703125, 3.17083740234375, 3.2779541015625, 3.38507080078125, 3.4921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 5.0, 13.0, 9.0, 9.0, 31.0, 27.0, 32.0, 57.0, 61.0, 71.0, 70.0, 68.0, 78.0, 82.0, 59.0, 62.0, 53.0, 31.0, 39.0, 28.0, 30.0, 22.0, 21.0, 5.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003304481506347656, -0.00032163411378860474, -0.00031282007694244385, -0.00030400604009628296, -0.00029519200325012207, -0.0002863779664039612, -0.0002775639295578003, -0.0002687498927116394, -0.0002599358558654785, -0.0002511218190193176, -0.00024230778217315674, -0.00023349374532699585, -0.00022467970848083496, -0.00021586567163467407, -0.00020705163478851318, -0.0001982375979423523, -0.0001894235610961914, -0.00018060952425003052, -0.00017179548740386963, -0.00016298145055770874, -0.00015416741371154785, -0.00014535337686538696, -0.00013653934001922607, -0.00012772530317306519, -0.0001189112663269043, -0.00011009722948074341, -0.00010128319263458252, -9.246915578842163e-05, -8.365511894226074e-05, -7.484108209609985e-05, -6.602704524993896e-05, -5.7213008403778076e-05, -4.839897155761719e-05, -3.95849347114563e-05, -3.077089786529541e-05, -2.195686101913452e-05, -1.3142824172973633e-05, -4.328787326812744e-06, 4.4852495193481445e-06, 1.3299286365509033e-05, 2.2113323211669922e-05, 3.092736005783081e-05, 3.97413969039917e-05, 4.855543375015259e-05, 5.7369470596313477e-05, 6.618350744247437e-05, 7.499754428863525e-05, 8.381158113479614e-05, 9.262561798095703e-05, 0.00010143965482711792, 0.00011025369167327881, 0.0001190677285194397, 0.00012788176536560059, 0.00013669580221176147, 0.00014550983905792236, 0.00015432387590408325, 0.00016313791275024414, 0.00017195194959640503, 0.00018076598644256592, 0.0001895800232887268, 0.0001983940601348877, 0.00020720809698104858, 0.00021602213382720947, 0.00022483617067337036, 0.00023365020751953125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 20.0, 23.0, 54.0, 61.0, 86.0, 168.0, 233.0, 325.0, 496.0, 722.0, 1231.0, 2039.0, 3574.0, 6433.0, 11765.0, 22186.0, 41990.0, 77182.0, 129225.0, 180852.0, 194642.0, 155637.0, 98937.0, 55483.0, 29726.0, 15757.0, 8454.0, 4484.0, 2549.0, 1542.0, 862.0, 593.0, 395.0, 220.0, 184.0, 134.0, 81.0, 64.0, 42.0, 25.0, 21.0, 15.0, 13.0, 13.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4609375, -2.386871337890625, -2.31280517578125, -2.238739013671875, -2.1646728515625, -2.090606689453125, -2.01654052734375, -1.942474365234375, -1.868408203125, -1.794342041015625, -1.72027587890625, -1.646209716796875, -1.5721435546875, -1.498077392578125, -1.42401123046875, -1.349945068359375, -1.27587890625, -1.201812744140625, -1.12774658203125, -1.053680419921875, -0.9796142578125, -0.905548095703125, -0.83148193359375, -0.757415771484375, -0.683349609375, -0.609283447265625, -0.53521728515625, -0.461151123046875, -0.3870849609375, -0.313018798828125, -0.23895263671875, -0.164886474609375, -0.0908203125, -0.016754150390625, 0.05731201171875, 0.131378173828125, 0.2054443359375, 0.279510498046875, 0.35357666015625, 0.427642822265625, 0.501708984375, 0.575775146484375, 0.64984130859375, 0.723907470703125, 0.7979736328125, 0.872039794921875, 0.94610595703125, 1.020172119140625, 1.09423828125, 1.168304443359375, 1.24237060546875, 1.316436767578125, 1.3905029296875, 1.464569091796875, 1.53863525390625, 1.612701416015625, 1.686767578125, 1.760833740234375, 1.83489990234375, 1.908966064453125, 1.9830322265625, 2.057098388671875, 2.13116455078125, 2.205230712890625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 4.0, 9.0, 15.0, 12.0, 16.0, 13.0, 23.0, 22.0, 28.0, 31.0, 46.0, 37.0, 50.0, 47.0, 60.0, 49.0, 53.0, 49.0, 54.0, 60.0, 47.0, 46.0, 32.0, 36.0, 30.0, 24.0, 19.0, 15.0, 15.0, 9.0, 8.0, 5.0, 4.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.79541015625, -0.7714614868164062, -0.7475128173828125, -0.7235641479492188, -0.699615478515625, -0.6756668090820312, -0.6517181396484375, -0.6277694702148438, -0.60382080078125, -0.5798721313476562, -0.5559234619140625, -0.5319747924804688, -0.508026123046875, -0.48407745361328125, -0.4601287841796875, -0.43618011474609375, -0.4122314453125, -0.38828277587890625, -0.3643341064453125, -0.34038543701171875, -0.316436767578125, -0.29248809814453125, -0.2685394287109375, -0.24459075927734375, -0.22064208984375, -0.19669342041015625, -0.1727447509765625, -0.14879608154296875, -0.124847412109375, -0.10089874267578125, -0.0769500732421875, -0.05300140380859375, -0.029052734375, -0.00510406494140625, 0.0188446044921875, 0.04279327392578125, 0.066741943359375, 0.09069061279296875, 0.1146392822265625, 0.13858795166015625, 0.16253662109375, 0.18648529052734375, 0.2104339599609375, 0.23438262939453125, 0.258331298828125, 0.28227996826171875, 0.3062286376953125, 0.33017730712890625, 0.3541259765625, 0.37807464599609375, 0.4020233154296875, 0.42597198486328125, 0.449920654296875, 0.47386932373046875, 0.4978179931640625, 0.5217666625976562, 0.54571533203125, 0.5696640014648438, 0.5936126708984375, 0.6175613403320312, 0.641510009765625, 0.6654586791992188, 0.6894073486328125, 0.7133560180664062, 0.7373046875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 14.0, 9.0, 8.0, 11.0, 12.0, 18.0, 22.0, 28.0, 24.0, 22.0, 37.0, 40.0, 45.0, 44.0, 44.0, 53.0, 47.0, 41.0, 45.0, 44.0, 46.0, 29.0, 41.0, 39.0, 22.0, 27.0, 25.0, 23.0, 21.0, 22.0, 11.0, 16.0, 13.0, 7.0, 9.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6092023849487305, -3.489184856414795, -3.3691673278808594, -3.249149799346924, -3.1291322708129883, -3.0091147422790527, -2.889097213745117, -2.7690794467926025, -2.649061918258667, -2.5290443897247314, -2.409026861190796, -2.2890093326568604, -2.168991804122925, -2.04897403717041, -1.9289566278457642, -1.808938980102539, -1.688921570777893, -1.5689040422439575, -1.448886513710022, -1.3288688659667969, -1.2088513374328613, -1.0888338088989258, -0.9688162803649902, -0.8487986922264099, -0.7287811636924744, -0.6087636351585388, -0.4887460470199585, -0.36872851848602295, -0.24871096014976501, -0.12869340181350708, -0.008675873279571533, 0.11134171485900879, 0.23135924339294434, 0.35137680172920227, 0.4713943600654602, 0.5914118885993958, 0.7114294767379761, 0.8314470052719116, 0.9514645338058472, 1.0714821815490723, 1.1914997100830078, 1.3115172386169434, 1.431534767150879, 1.5515522956848145, 1.6715699434280396, 1.791587471961975, 1.9116050004959106, 2.0316226482391357, 2.151639938354492, 2.2716574668884277, 2.3916749954223633, 2.511692523956299, 2.6317100524902344, 2.75172758102417, 2.8717451095581055, 2.99176287651062, 3.1117804050445557, 3.231797933578491, 3.3518154621124268, 3.4718329906463623, 3.591850519180298, 3.7118682861328125, 3.831885814666748, 3.9519033432006836, 4.071920871734619]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 9.0, 8.0, 9.0, 15.0, 12.0, 14.0, 10.0, 10.0, 15.0, 23.0, 19.0, 34.0, 30.0, 37.0, 32.0, 44.0, 49.0, 31.0, 42.0, 45.0, 45.0, 35.0, 38.0, 36.0, 42.0, 33.0, 42.0, 26.0, 32.0, 17.0, 23.0, 20.0, 16.0, 22.0, 9.0, 12.0, 8.0, 14.0, 11.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.8113772869110107, -3.691875696182251, -3.572374105453491, -3.4528725147247314, -3.3333709239959717, -3.213869333267212, -3.094367742538452, -2.9748661518096924, -2.8553645610809326, -2.735862970352173, -2.616361379623413, -2.4968597888946533, -2.3773581981658936, -2.257856607437134, -2.138355016708374, -2.0188534259796143, -1.8993518352508545, -1.7798502445220947, -1.660348653793335, -1.5408470630645752, -1.4213454723358154, -1.3018438816070557, -1.182342290878296, -1.0628407001495361, -0.9433391094207764, -0.8238375186920166, -0.7043359279632568, -0.5848343372344971, -0.4653327465057373, -0.34583115577697754, -0.22632956504821777, -0.10682797431945801, 0.012673377990722656, 0.13217496871948242, 0.2516765594482422, 0.37117815017700195, 0.4906797409057617, 0.6101813316345215, 0.7296829223632812, 0.849184513092041, 0.9686861038208008, 1.0881876945495605, 1.2076892852783203, 1.32719087600708, 1.4466924667358398, 1.5661940574645996, 1.6856956481933594, 1.8051972389221191, 1.924698829650879, 2.0442004203796387, 2.1637020111083984, 2.283203601837158, 2.402705192565918, 2.5222067832946777, 2.6417083740234375, 2.7612099647521973, 2.880711555480957, 3.000213146209717, 3.1197147369384766, 3.2392163276672363, 3.358717918395996, 3.478219509124756, 3.5977210998535156, 3.7172226905822754, 3.836724281311035]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 10.0, 10.0, 8.0, 19.0, 29.0, 41.0, 71.0, 147.0, 202.0, 342.0, 498.0, 861.0, 1453.0, 2343.0, 3724.0, 6109.0, 9958.0, 16278.0, 26585.0, 42211.0, 67967.0, 107281.0, 166552.0, 249078.0, 354256.0, 459905.0, 533483.0, 541889.0, 477075.0, 374384.0, 267073.0, 179271.0, 115153.0, 72621.0, 45410.0, 28037.0, 16967.0, 10563.0, 6354.0, 3959.0, 2421.0, 1408.0, 870.0, 564.0, 318.0, 201.0, 123.0, 85.0, 52.0, 30.0, 14.0, 16.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.919921875, -2.826019287109375, -2.73211669921875, -2.638214111328125, -2.5443115234375, -2.450408935546875, -2.35650634765625, -2.262603759765625, -2.168701171875, -2.074798583984375, -1.98089599609375, -1.886993408203125, -1.7930908203125, -1.699188232421875, -1.60528564453125, -1.511383056640625, -1.41748046875, -1.323577880859375, -1.22967529296875, -1.135772705078125, -1.0418701171875, -0.947967529296875, -0.85406494140625, -0.760162353515625, -0.666259765625, -0.572357177734375, -0.47845458984375, -0.384552001953125, -0.2906494140625, -0.196746826171875, -0.10284423828125, -0.008941650390625, 0.0849609375, 0.178863525390625, 0.27276611328125, 0.366668701171875, 0.4605712890625, 0.554473876953125, 0.64837646484375, 0.742279052734375, 0.836181640625, 0.930084228515625, 1.02398681640625, 1.117889404296875, 1.2117919921875, 1.305694580078125, 1.39959716796875, 1.493499755859375, 1.58740234375, 1.681304931640625, 1.77520751953125, 1.869110107421875, 1.9630126953125, 2.056915283203125, 2.15081787109375, 2.244720458984375, 2.338623046875, 2.432525634765625, 2.52642822265625, 2.620330810546875, 2.7142333984375, 2.808135986328125, 2.90203857421875, 2.995941162109375, 3.08984375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 2.0, 7.0, 12.0, 10.0, 16.0, 8.0, 14.0, 13.0, 21.0, 20.0, 18.0, 27.0, 31.0, 44.0, 36.0, 37.0, 33.0, 38.0, 35.0, 42.0, 33.0, 51.0, 44.0, 40.0, 38.0, 29.0, 28.0, 27.0, 27.0, 24.0, 29.0, 20.0, 17.0, 22.0, 21.0, 21.0, 8.0, 12.0, 9.0, 5.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.526580810546875, -2.43597412109375, -2.345367431640625, -2.2547607421875, -2.164154052734375, -2.07354736328125, -1.982940673828125, -1.892333984375, -1.801727294921875, -1.71112060546875, -1.620513916015625, -1.5299072265625, -1.439300537109375, -1.34869384765625, -1.258087158203125, -1.16748046875, -1.076873779296875, -0.98626708984375, -0.895660400390625, -0.8050537109375, -0.714447021484375, -0.62384033203125, -0.533233642578125, -0.442626953125, -0.352020263671875, -0.26141357421875, -0.170806884765625, -0.0802001953125, 0.010406494140625, 0.10101318359375, 0.191619873046875, 0.2822265625, 0.372833251953125, 0.46343994140625, 0.554046630859375, 0.6446533203125, 0.735260009765625, 0.82586669921875, 0.916473388671875, 1.007080078125, 1.097686767578125, 1.18829345703125, 1.278900146484375, 1.3695068359375, 1.460113525390625, 1.55072021484375, 1.641326904296875, 1.73193359375, 1.822540283203125, 1.91314697265625, 2.003753662109375, 2.0943603515625, 2.184967041015625, 2.27557373046875, 2.366180419921875, 2.456787109375, 2.547393798828125, 2.63800048828125, 2.728607177734375, 2.8192138671875, 2.909820556640625, 3.00042724609375, 3.091033935546875, 3.181640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 24.0, 29.0, 41.0, 67.0, 145.0, 267.0, 450.0, 807.0, 1671.0, 3110.0, 6082.0, 11950.0, 22364.0, 41566.0, 76856.0, 134260.0, 224595.0, 348208.0, 488313.0, 596026.0, 619137.0, 544317.0, 410737.0, 275480.0, 171091.0, 98577.0, 55544.0, 29649.0, 15491.0, 8332.0, 4204.0, 2271.0, 1262.0, 618.0, 307.0, 188.0, 102.0, 57.0, 37.0, 21.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.998046875, -3.8812255859375, -3.764404296875, -3.6475830078125, -3.53076171875, -3.4139404296875, -3.297119140625, -3.1802978515625, -3.0634765625, -2.9466552734375, -2.829833984375, -2.7130126953125, -2.59619140625, -2.4793701171875, -2.362548828125, -2.2457275390625, -2.12890625, -2.0120849609375, -1.895263671875, -1.7784423828125, -1.66162109375, -1.5447998046875, -1.427978515625, -1.3111572265625, -1.1943359375, -1.0775146484375, -0.960693359375, -0.8438720703125, -0.72705078125, -0.6102294921875, -0.493408203125, -0.3765869140625, -0.259765625, -0.1429443359375, -0.026123046875, 0.0906982421875, 0.20751953125, 0.3243408203125, 0.441162109375, 0.5579833984375, 0.6748046875, 0.7916259765625, 0.908447265625, 1.0252685546875, 1.14208984375, 1.2589111328125, 1.375732421875, 1.4925537109375, 1.609375, 1.7261962890625, 1.843017578125, 1.9598388671875, 2.07666015625, 2.1934814453125, 2.310302734375, 2.4271240234375, 2.5439453125, 2.6607666015625, 2.777587890625, 2.8944091796875, 3.01123046875, 3.1280517578125, 3.244873046875, 3.3616943359375, 3.478515625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 14.0, 25.0, 28.0, 27.0, 54.0, 54.0, 71.0, 96.0, 82.0, 128.0, 155.0, 168.0, 216.0, 235.0, 258.0, 247.0, 242.0, 253.0, 255.0, 245.0, 203.0, 192.0, 173.0, 128.0, 123.0, 86.0, 73.0, 65.0, 35.0, 37.0, 26.0, 23.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6337890625, -1.582061767578125, -1.53033447265625, -1.478607177734375, -1.4268798828125, -1.375152587890625, -1.32342529296875, -1.271697998046875, -1.219970703125, -1.168243408203125, -1.11651611328125, -1.064788818359375, -1.0130615234375, -0.961334228515625, -0.90960693359375, -0.857879638671875, -0.80615234375, -0.754425048828125, -0.70269775390625, -0.650970458984375, -0.5992431640625, -0.547515869140625, -0.49578857421875, -0.444061279296875, -0.392333984375, -0.340606689453125, -0.28887939453125, -0.237152099609375, -0.1854248046875, -0.133697509765625, -0.08197021484375, -0.030242919921875, 0.021484375, 0.073211669921875, 0.12493896484375, 0.176666259765625, 0.2283935546875, 0.280120849609375, 0.33184814453125, 0.383575439453125, 0.435302734375, 0.487030029296875, 0.53875732421875, 0.590484619140625, 0.6422119140625, 0.693939208984375, 0.74566650390625, 0.797393798828125, 0.84912109375, 0.900848388671875, 0.95257568359375, 1.004302978515625, 1.0560302734375, 1.107757568359375, 1.15948486328125, 1.211212158203125, 1.262939453125, 1.314666748046875, 1.36639404296875, 1.418121337890625, 1.4698486328125, 1.521575927734375, 1.57330322265625, 1.625030517578125, 1.6767578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 6.0, 11.0, 8.0, 5.0, 9.0, 14.0, 16.0, 20.0, 27.0, 30.0, 16.0, 27.0, 49.0, 35.0, 40.0, 43.0, 49.0, 50.0, 49.0, 45.0, 39.0, 47.0, 53.0, 38.0, 43.0, 32.0, 35.0, 25.0, 18.0, 19.0, 20.0, 18.0, 18.0, 13.0, 6.0, 8.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.854025363922119, -3.737438917160034, -3.620852470397949, -3.5042660236358643, -3.3876795768737793, -3.2710931301116943, -3.1545066833496094, -3.0379204750061035, -2.9213337898254395, -2.8047473430633545, -2.6881608963012695, -2.5715744495391846, -2.4549880027770996, -2.3384015560150146, -2.2218151092529297, -2.105228900909424, -1.9886424541473389, -1.872056007385254, -1.755469560623169, -1.638883113861084, -1.522296667098999, -1.405710220336914, -1.2891238927841187, -1.1725374460220337, -1.0559509992599487, -0.9393645524978638, -0.8227781057357788, -0.7061917185783386, -0.5896052718162537, -0.4730188250541687, -0.3564324378967285, -0.23984599113464355, -0.1232595443725586, -0.006673112511634827, 0.10991331934928894, 0.2264997363090515, 0.3430861830711365, 0.45967262983322144, 0.5762590169906616, 0.6928454637527466, 0.8094319105148315, 0.9260183572769165, 1.0426048040390015, 1.1591911315917969, 1.2757775783538818, 1.3923640251159668, 1.5089504718780518, 1.6255369186401367, 1.7421233654022217, 1.8587098121643066, 1.9752962589263916, 2.0918827056884766, 2.2084691524505615, 2.3250555992126465, 2.4416418075561523, 2.5582284927368164, 2.6748147010803223, 2.7914011478424072, 2.907987594604492, 3.024574041366577, 3.141160488128662, 3.257746934890747, 3.374333381652832, 3.490919589996338, 3.607506275177002]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 3.0, 5.0, 10.0, 8.0, 16.0, 14.0, 8.0, 17.0, 20.0, 20.0, 24.0, 27.0, 31.0, 34.0, 42.0, 29.0, 33.0, 36.0, 42.0, 40.0, 44.0, 50.0, 45.0, 44.0, 31.0, 33.0, 42.0, 34.0, 21.0, 32.0, 23.0, 24.0, 24.0, 14.0, 9.0, 10.0, 11.0, 12.0, 5.0, 9.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.6561279296875, -3.55086612701416, -3.4456043243408203, -3.3403425216674805, -3.2350807189941406, -3.129818916320801, -3.024557113647461, -2.919295310974121, -2.8140335083007812, -2.7087717056274414, -2.6035099029541016, -2.4982481002807617, -2.392986297607422, -2.287724494934082, -2.182462692260742, -2.0772008895874023, -1.9719388484954834, -1.8666770458221436, -1.7614152431488037, -1.6561534404754639, -1.550891637802124, -1.4456298351287842, -1.3403679132461548, -1.235106110572815, -1.129844307899475, -1.0245825052261353, -0.9193207025527954, -0.8140588402748108, -0.708797037601471, -0.6035352349281311, -0.4982733726501465, -0.39301156997680664, -0.2877495288848877, -0.18248771131038666, -0.07722589373588562, 0.02803593873977661, 0.13329774141311646, 0.2385595440864563, 0.3438214063644409, 0.44908320903778076, 0.5543450117111206, 0.6596068143844604, 0.7648686170578003, 0.8701304793357849, 0.9753922820091248, 1.0806541442871094, 1.1859159469604492, 1.291177749633789, 1.396439552307129, 1.5017013549804688, 1.6069631576538086, 1.7122249603271484, 1.8174867630004883, 1.9227485656738281, 2.028010368347168, 2.133272171020508, 2.2385339736938477, 2.3437957763671875, 2.4490575790405273, 2.554319381713867, 2.659581184387207, 2.764842987060547, 2.8701047897338867, 2.9753665924072266, 3.0806286334991455]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 6.0, 19.0, 26.0, 49.0, 63.0, 96.0, 146.0, 222.0, 302.0, 430.0, 629.0, 925.0, 1337.0, 1958.0, 2953.0, 4453.0, 6807.0, 10514.0, 16383.0, 26178.0, 41741.0, 67147.0, 105428.0, 155079.0, 182426.0, 149921.0, 100633.0, 63528.0, 39225.0, 24912.0, 15551.0, 10067.0, 6485.0, 4162.0, 2790.0, 1890.0, 1256.0, 839.0, 613.0, 435.0, 278.0, 202.0, 164.0, 105.0, 62.0, 42.0, 28.0, 16.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.613372802734375, -2.52752685546875, -2.441680908203125, -2.3558349609375, -2.269989013671875, -2.18414306640625, -2.098297119140625, -2.012451171875, -1.926605224609375, -1.84075927734375, -1.754913330078125, -1.6690673828125, -1.583221435546875, -1.49737548828125, -1.411529541015625, -1.32568359375, -1.239837646484375, -1.15399169921875, -1.068145751953125, -0.9822998046875, -0.896453857421875, -0.81060791015625, -0.724761962890625, -0.638916015625, -0.553070068359375, -0.46722412109375, -0.381378173828125, -0.2955322265625, -0.209686279296875, -0.12384033203125, -0.037994384765625, 0.0478515625, 0.133697509765625, 0.21954345703125, 0.305389404296875, 0.3912353515625, 0.477081298828125, 0.56292724609375, 0.648773193359375, 0.734619140625, 0.820465087890625, 0.90631103515625, 0.992156982421875, 1.0780029296875, 1.163848876953125, 1.24969482421875, 1.335540771484375, 1.42138671875, 1.507232666015625, 1.59307861328125, 1.678924560546875, 1.7647705078125, 1.850616455078125, 1.93646240234375, 2.022308349609375, 2.108154296875, 2.194000244140625, 2.27984619140625, 2.365692138671875, 2.4515380859375, 2.537384033203125, 2.62322998046875, 2.709075927734375, 2.794921875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 11.0, 8.0, 15.0, 14.0, 17.0, 26.0, 20.0, 13.0, 27.0, 30.0, 27.0, 33.0, 37.0, 35.0, 45.0, 40.0, 47.0, 43.0, 40.0, 29.0, 46.0, 29.0, 39.0, 32.0, 31.0, 35.0, 25.0, 26.0, 32.0, 22.0, 22.0, 8.0, 14.0, 10.0, 7.0, 8.0, 11.0, 10.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.5625, -3.45538330078125, -3.3482666015625, -3.24114990234375, -3.134033203125, -3.02691650390625, -2.9197998046875, -2.81268310546875, -2.70556640625, -2.59844970703125, -2.4913330078125, -2.38421630859375, -2.277099609375, -2.16998291015625, -2.0628662109375, -1.95574951171875, -1.8486328125, -1.74151611328125, -1.6343994140625, -1.52728271484375, -1.420166015625, -1.31304931640625, -1.2059326171875, -1.09881591796875, -0.99169921875, -0.88458251953125, -0.7774658203125, -0.67034912109375, -0.563232421875, -0.45611572265625, -0.3489990234375, -0.24188232421875, -0.134765625, -0.02764892578125, 0.0794677734375, 0.18658447265625, 0.293701171875, 0.40081787109375, 0.5079345703125, 0.61505126953125, 0.72216796875, 0.82928466796875, 0.9364013671875, 1.04351806640625, 1.150634765625, 1.25775146484375, 1.3648681640625, 1.47198486328125, 1.5791015625, 1.68621826171875, 1.7933349609375, 1.90045166015625, 2.007568359375, 2.11468505859375, 2.2218017578125, 2.32891845703125, 2.43603515625, 2.54315185546875, 2.6502685546875, 2.75738525390625, 2.864501953125, 2.97161865234375, 3.0787353515625, 3.18585205078125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 13.0, 6.0, 13.0, 30.0, 29.0, 47.0, 73.0, 107.0, 177.0, 238.0, 378.0, 578.0, 1010.0, 1621.0, 2760.0, 4887.0, 8876.0, 16460.0, 33230.0, 70466.0, 153697.0, 283381.0, 241621.0, 118397.0, 54255.0, 25792.0, 13323.0, 7056.0, 3998.0, 2349.0, 1389.0, 799.0, 488.0, 352.0, 199.0, 136.0, 98.0, 70.0, 45.0, 32.0, 16.0, 13.0, 12.0, 8.0, 8.0, 4.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.973846435546875, -2.87738037109375, -2.780914306640625, -2.6844482421875, -2.587982177734375, -2.49151611328125, -2.395050048828125, -2.298583984375, -2.202117919921875, -2.10565185546875, -2.009185791015625, -1.9127197265625, -1.816253662109375, -1.71978759765625, -1.623321533203125, -1.52685546875, -1.430389404296875, -1.33392333984375, -1.237457275390625, -1.1409912109375, -1.044525146484375, -0.94805908203125, -0.851593017578125, -0.755126953125, -0.658660888671875, -0.56219482421875, -0.465728759765625, -0.3692626953125, -0.272796630859375, -0.17633056640625, -0.079864501953125, 0.0166015625, 0.113067626953125, 0.20953369140625, 0.305999755859375, 0.4024658203125, 0.498931884765625, 0.59539794921875, 0.691864013671875, 0.788330078125, 0.884796142578125, 0.98126220703125, 1.077728271484375, 1.1741943359375, 1.270660400390625, 1.36712646484375, 1.463592529296875, 1.56005859375, 1.656524658203125, 1.75299072265625, 1.849456787109375, 1.9459228515625, 2.042388916015625, 2.13885498046875, 2.235321044921875, 2.331787109375, 2.428253173828125, 2.52471923828125, 2.621185302734375, 2.7176513671875, 2.814117431640625, 2.91058349609375, 3.007049560546875, 3.103515625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 11.0, 7.0, 10.0, 10.0, 14.0, 11.0, 11.0, 26.0, 22.0, 20.0, 19.0, 43.0, 23.0, 30.0, 30.0, 31.0, 35.0, 30.0, 39.0, 39.0, 47.0, 37.0, 34.0, 44.0, 44.0, 41.0, 26.0, 40.0, 26.0, 25.0, 20.0, 26.0, 21.0, 11.0, 16.0, 12.0, 12.0, 10.0, 6.0, 6.0, 9.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.01171875, -1.9432373046875, -1.874755859375, -1.8062744140625, -1.73779296875, -1.6693115234375, -1.600830078125, -1.5323486328125, -1.4638671875, -1.3953857421875, -1.326904296875, -1.2584228515625, -1.18994140625, -1.1214599609375, -1.052978515625, -0.9844970703125, -0.916015625, -0.8475341796875, -0.779052734375, -0.7105712890625, -0.64208984375, -0.5736083984375, -0.505126953125, -0.4366455078125, -0.3681640625, -0.2996826171875, -0.231201171875, -0.1627197265625, -0.09423828125, -0.0257568359375, 0.042724609375, 0.1112060546875, 0.1796875, 0.2481689453125, 0.316650390625, 0.3851318359375, 0.45361328125, 0.5220947265625, 0.590576171875, 0.6590576171875, 0.7275390625, 0.7960205078125, 0.864501953125, 0.9329833984375, 1.00146484375, 1.0699462890625, 1.138427734375, 1.2069091796875, 1.275390625, 1.3438720703125, 1.412353515625, 1.4808349609375, 1.54931640625, 1.6177978515625, 1.686279296875, 1.7547607421875, 1.8232421875, 1.8917236328125, 1.960205078125, 2.0286865234375, 2.09716796875, 2.1656494140625, 2.234130859375, 2.3026123046875, 2.37109375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 10.0, 9.0, 13.0, 11.0, 25.0, 47.0, 61.0, 75.0, 98.0, 133.0, 199.0, 269.0, 348.0, 497.0, 724.0, 1111.0, 1626.0, 2412.0, 3848.0, 6490.0, 11274.0, 22789.0, 59159.0, 281531.0, 497077.0, 92870.0, 30456.0, 14030.0, 7763.0, 4579.0, 2891.0, 1921.0, 1232.0, 837.0, 602.0, 451.0, 302.0, 198.0, 160.0, 132.0, 70.0, 62.0, 41.0, 40.0, 24.0, 16.0, 8.0, 11.0, 5.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.455078125, -3.340576171875, -3.22607421875, -3.111572265625, -2.9970703125, -2.882568359375, -2.76806640625, -2.653564453125, -2.5390625, -2.424560546875, -2.31005859375, -2.195556640625, -2.0810546875, -1.966552734375, -1.85205078125, -1.737548828125, -1.623046875, -1.508544921875, -1.39404296875, -1.279541015625, -1.1650390625, -1.050537109375, -0.93603515625, -0.821533203125, -0.70703125, -0.592529296875, -0.47802734375, -0.363525390625, -0.2490234375, -0.134521484375, -0.02001953125, 0.094482421875, 0.208984375, 0.323486328125, 0.43798828125, 0.552490234375, 0.6669921875, 0.781494140625, 0.89599609375, 1.010498046875, 1.125, 1.239501953125, 1.35400390625, 1.468505859375, 1.5830078125, 1.697509765625, 1.81201171875, 1.926513671875, 2.041015625, 2.155517578125, 2.27001953125, 2.384521484375, 2.4990234375, 2.613525390625, 2.72802734375, 2.842529296875, 2.95703125, 3.071533203125, 3.18603515625, 3.300537109375, 3.4150390625, 3.529541015625, 3.64404296875, 3.758544921875, 3.873046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 0.0, 7.0, 6.0, 4.0, 6.0, 7.0, 16.0, 12.0, 23.0, 39.0, 40.0, 58.0, 94.0, 160.0, 164.0, 111.0, 69.0, 39.0, 31.0, 23.0, 13.0, 15.0, 8.0, 12.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003421306610107422, -0.00032897666096687317, -0.00031582266092300415, -0.00030266866087913513, -0.0002895146608352661, -0.0002763606607913971, -0.0002632066607475281, -0.00025005266070365906, -0.00023689866065979004, -0.00022374466061592102, -0.000210590660572052, -0.00019743666052818298, -0.00018428266048431396, -0.00017112866044044495, -0.00015797466039657593, -0.0001448206603527069, -0.0001316666603088379, -0.00011851266026496887, -0.00010535866022109985, -9.220466017723083e-05, -7.905066013336182e-05, -6.58966600894928e-05, -5.274266004562378e-05, -3.958866000175476e-05, -2.6434659957885742e-05, -1.3280659914016724e-05, -1.2665987014770508e-07, 1.3027340173721313e-05, 2.6181340217590332e-05, 3.933534026145935e-05, 5.248934030532837e-05, 6.564334034919739e-05, 7.87973403930664e-05, 9.195134043693542e-05, 0.00010510534048080444, 0.00011825934052467346, 0.00013141334056854248, 0.0001445673406124115, 0.00015772134065628052, 0.00017087534070014954, 0.00018402934074401855, 0.00019718334078788757, 0.0002103373408317566, 0.0002234913408756256, 0.00023664534091949463, 0.00024979934096336365, 0.00026295334100723267, 0.0002761073410511017, 0.0002892613410949707, 0.0003024153411388397, 0.00031556934118270874, 0.00032872334122657776, 0.0003418773412704468, 0.0003550313413143158, 0.0003681853413581848, 0.00038133934140205383, 0.00039449334144592285, 0.00040764734148979187, 0.0004208013415336609, 0.0004339553415775299, 0.0004471093416213989, 0.00046026334166526794, 0.00047341734170913696, 0.000486571341753006, 0.000499725341796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 11.0, 9.0, 16.0, 24.0, 49.0, 55.0, 81.0, 102.0, 168.0, 244.0, 350.0, 533.0, 827.0, 1240.0, 1911.0, 3218.0, 5084.0, 8338.0, 14519.0, 27435.0, 61338.0, 165420.0, 393606.0, 213638.0, 76011.0, 32646.0, 16700.0, 9547.0, 5602.0, 3580.0, 2175.0, 1437.0, 942.0, 560.0, 351.0, 257.0, 155.0, 103.0, 73.0, 63.0, 45.0, 29.0, 22.0, 11.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.375, -3.26824951171875, -3.1614990234375, -3.05474853515625, -2.947998046875, -2.84124755859375, -2.7344970703125, -2.62774658203125, -2.52099609375, -2.41424560546875, -2.3074951171875, -2.20074462890625, -2.093994140625, -1.98724365234375, -1.8804931640625, -1.77374267578125, -1.6669921875, -1.56024169921875, -1.4534912109375, -1.34674072265625, -1.239990234375, -1.13323974609375, -1.0264892578125, -0.91973876953125, -0.81298828125, -0.70623779296875, -0.5994873046875, -0.49273681640625, -0.385986328125, -0.27923583984375, -0.1724853515625, -0.06573486328125, 0.041015625, 0.14776611328125, 0.2545166015625, 0.36126708984375, 0.468017578125, 0.57476806640625, 0.6815185546875, 0.78826904296875, 0.89501953125, 1.00177001953125, 1.1085205078125, 1.21527099609375, 1.322021484375, 1.42877197265625, 1.5355224609375, 1.64227294921875, 1.7490234375, 1.85577392578125, 1.9625244140625, 2.06927490234375, 2.176025390625, 2.28277587890625, 2.3895263671875, 2.49627685546875, 2.60302734375, 2.70977783203125, 2.8165283203125, 2.92327880859375, 3.030029296875, 3.13677978515625, 3.2435302734375, 3.35028076171875, 3.45703125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 5.0, 12.0, 14.0, 14.0, 27.0, 20.0, 21.0, 37.0, 30.0, 47.0, 74.0, 63.0, 89.0, 115.0, 86.0, 54.0, 54.0, 38.0, 48.0, 25.0, 17.0, 29.0, 12.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77734375, -0.7531204223632812, -0.7288970947265625, -0.7046737670898438, -0.680450439453125, -0.6562271118164062, -0.6320037841796875, -0.6077804565429688, -0.58355712890625, -0.5593338012695312, -0.5351104736328125, -0.5108871459960938, -0.486663818359375, -0.46244049072265625, -0.4382171630859375, -0.41399383544921875, -0.3897705078125, -0.36554718017578125, -0.3413238525390625, -0.31710052490234375, -0.292877197265625, -0.26865386962890625, -0.2444305419921875, -0.22020721435546875, -0.19598388671875, -0.17176055908203125, -0.1475372314453125, -0.12331390380859375, -0.099090576171875, -0.07486724853515625, -0.0506439208984375, -0.02642059326171875, -0.002197265625, 0.02202606201171875, 0.0462493896484375, 0.07047271728515625, 0.094696044921875, 0.11891937255859375, 0.1431427001953125, 0.16736602783203125, 0.19158935546875, 0.21581268310546875, 0.2400360107421875, 0.26425933837890625, 0.288482666015625, 0.31270599365234375, 0.3369293212890625, 0.36115264892578125, 0.3853759765625, 0.40959930419921875, 0.4338226318359375, 0.45804595947265625, 0.482269287109375, 0.5064926147460938, 0.5307159423828125, 0.5549392700195312, 0.57916259765625, 0.6033859252929688, 0.6276092529296875, 0.6518325805664062, 0.676055908203125, 0.7002792358398438, 0.7245025634765625, 0.7487258911132812, 0.77294921875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 12.0, 15.0, 15.0, 17.0, 24.0, 34.0, 27.0, 23.0, 43.0, 46.0, 44.0, 48.0, 42.0, 54.0, 56.0, 53.0, 57.0, 54.0, 53.0, 43.0, 32.0, 45.0, 27.0, 21.0, 20.0, 17.0, 16.0, 8.0, 7.0, 7.0, 5.0, 3.0, 8.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982191801071167, -3.8511953353881836, -3.7201988697052, -3.589202404022217, -3.4582056999206543, -3.327209234237671, -3.1962127685546875, -3.065216302871704, -2.9342198371887207, -2.8032233715057373, -2.672226905822754, -2.5412302017211914, -2.410233736038208, -2.2792372703552246, -2.148240804672241, -2.017244338989258, -1.8862476348876953, -1.755251169204712, -1.624254584312439, -1.4932581186294556, -1.3622615337371826, -1.2312650680541992, -1.1002686023712158, -0.9692720770835876, -0.8382755517959595, -0.7072790265083313, -0.5762825012207031, -0.4452860355377197, -0.31428951025009155, -0.18329298496246338, -0.05229651927947998, 0.0787000060081482, 0.20969676971435547, 0.34069329500198364, 0.47168979048728943, 0.6026862859725952, 0.7336828112602234, 0.8646793365478516, 0.995675802230835, 1.1266722679138184, 1.2576688528060913, 1.3886653184890747, 1.5196619033813477, 1.650658369064331, 1.7816548347473145, 1.9126514196395874, 2.0436477661132812, 2.1746444702148438, 2.305640935897827, 2.4366374015808105, 2.567633867263794, 2.6986303329467773, 2.82962703704834, 2.9606235027313232, 3.0916199684143066, 3.22261643409729, 3.3536128997802734, 3.484609365463257, 3.6156058311462402, 3.7466025352478027, 3.877599000930786, 4.0085954666137695, 4.139592170715332, 4.270588397979736, 4.401585102081299]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 3.0, 6.0, 13.0, 15.0, 16.0, 11.0, 12.0, 21.0, 27.0, 24.0, 25.0, 35.0, 37.0, 26.0, 43.0, 33.0, 39.0, 41.0, 47.0, 46.0, 46.0, 42.0, 40.0, 36.0, 27.0, 39.0, 34.0, 19.0, 31.0, 17.0, 32.0, 12.0, 22.0, 14.0, 9.0, 13.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.6701035499572754, -3.5632424354553223, -3.4563815593719482, -3.349520444869995, -3.242659330368042, -3.135798454284668, -3.028937339782715, -2.9220762252807617, -2.8152151107788086, -2.7083539962768555, -2.6014931201934814, -2.4946320056915283, -2.387770891189575, -2.280910015106201, -2.174048900604248, -2.067187786102295, -1.960326910018921, -1.8534659147262573, -1.7466048002243042, -1.6397438049316406, -1.5328826904296875, -1.426021695137024, -1.3191606998443604, -1.2122995853424072, -1.1054385900497437, -0.9985775351524353, -0.891716480255127, -0.7848554849624634, -0.677994430065155, -0.5711333751678467, -0.4642723798751831, -0.35741132497787476, -0.2505500316619873, -0.14368899166584015, -0.03682795166969299, 0.07003307342529297, 0.17689412832260132, 0.28375518321990967, 0.39061617851257324, 0.4974772334098816, 0.6043382883071899, 0.7111993432044983, 0.8180603981018066, 0.9249213933944702, 1.0317823886871338, 1.138643503189087, 1.2455044984817505, 1.352365493774414, 1.4592266082763672, 1.5660876035690308, 1.6729487180709839, 1.7798097133636475, 1.8866708278656006, 1.9935318231582642, 2.1003928184509277, 2.207253932952881, 2.314115047454834, 2.420976161956787, 2.527837038040161, 2.6346981525421143, 2.7415592670440674, 2.8484201431274414, 2.9552812576293945, 3.0621423721313477, 3.1690032482147217]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 9.0, 3.0, 2.0, 19.0, 13.0, 41.0, 60.0, 88.0, 153.0, 186.0, 323.0, 506.0, 689.0, 1133.0, 1786.0, 2650.0, 4091.0, 6081.0, 9229.0, 13578.0, 19701.0, 27911.0, 39051.0, 51711.0, 67357.0, 82172.0, 94945.0, 102395.0, 102096.0, 94698.0, 82118.0, 66362.0, 51554.0, 38081.0, 27809.0, 19560.0, 13222.0, 9183.0, 6142.0, 4073.0, 2701.0, 1830.0, 1139.0, 728.0, 537.0, 295.0, 193.0, 122.0, 88.0, 52.0, 34.0, 25.0, 19.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.361328125, -3.259429931640625, -3.15753173828125, -3.055633544921875, -2.9537353515625, -2.851837158203125, -2.74993896484375, -2.648040771484375, -2.546142578125, -2.444244384765625, -2.34234619140625, -2.240447998046875, -2.1385498046875, -2.036651611328125, -1.93475341796875, -1.832855224609375, -1.73095703125, -1.629058837890625, -1.52716064453125, -1.425262451171875, -1.3233642578125, -1.221466064453125, -1.11956787109375, -1.017669677734375, -0.915771484375, -0.813873291015625, -0.71197509765625, -0.610076904296875, -0.5081787109375, -0.406280517578125, -0.30438232421875, -0.202484130859375, -0.1005859375, 0.001312255859375, 0.10321044921875, 0.205108642578125, 0.3070068359375, 0.408905029296875, 0.51080322265625, 0.612701416015625, 0.714599609375, 0.816497802734375, 0.91839599609375, 1.020294189453125, 1.1221923828125, 1.224090576171875, 1.32598876953125, 1.427886962890625, 1.52978515625, 1.631683349609375, 1.73358154296875, 1.835479736328125, 1.9373779296875, 2.039276123046875, 2.14117431640625, 2.243072509765625, 2.344970703125, 2.446868896484375, 2.54876708984375, 2.650665283203125, 2.7525634765625, 2.854461669921875, 2.95635986328125, 3.058258056640625, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 13.0, 15.0, 21.0, 14.0, 23.0, 32.0, 39.0, 26.0, 33.0, 36.0, 32.0, 30.0, 33.0, 36.0, 38.0, 53.0, 39.0, 45.0, 36.0, 38.0, 34.0, 28.0, 41.0, 25.0, 32.0, 22.0, 29.0, 15.0, 21.0, 17.0, 10.0, 9.0, 18.0, 11.0, 7.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.447265625, -3.344970703125, -3.24267578125, -3.140380859375, -3.0380859375, -2.935791015625, -2.83349609375, -2.731201171875, -2.62890625, -2.526611328125, -2.42431640625, -2.322021484375, -2.2197265625, -2.117431640625, -2.01513671875, -1.912841796875, -1.810546875, -1.708251953125, -1.60595703125, -1.503662109375, -1.4013671875, -1.299072265625, -1.19677734375, -1.094482421875, -0.9921875, -0.889892578125, -0.78759765625, -0.685302734375, -0.5830078125, -0.480712890625, -0.37841796875, -0.276123046875, -0.173828125, -0.071533203125, 0.03076171875, 0.133056640625, 0.2353515625, 0.337646484375, 0.43994140625, 0.542236328125, 0.64453125, 0.746826171875, 0.84912109375, 0.951416015625, 1.0537109375, 1.156005859375, 1.25830078125, 1.360595703125, 1.462890625, 1.565185546875, 1.66748046875, 1.769775390625, 1.8720703125, 1.974365234375, 2.07666015625, 2.178955078125, 2.28125, 2.383544921875, 2.48583984375, 2.588134765625, 2.6904296875, 2.792724609375, 2.89501953125, 2.997314453125, 3.099609375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 25.0, 23.0, 54.0, 83.0, 93.0, 195.0, 318.0, 519.0, 810.0, 1446.0, 2322.0, 3945.0, 6564.0, 10437.0, 16807.0, 26084.0, 39631.0, 57727.0, 78152.0, 99556.0, 115591.0, 121551.0, 116269.0, 100996.0, 79646.0, 58073.0, 40366.0, 26835.0, 17084.0, 10741.0, 6526.0, 3997.0, 2389.0, 1450.0, 866.0, 535.0, 337.0, 198.0, 123.0, 66.0, 49.0, 19.0, 14.0, 14.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.681640625, -3.564849853515625, -3.44805908203125, -3.331268310546875, -3.2144775390625, -3.097686767578125, -2.98089599609375, -2.864105224609375, -2.747314453125, -2.630523681640625, -2.51373291015625, -2.396942138671875, -2.2801513671875, -2.163360595703125, -2.04656982421875, -1.929779052734375, -1.81298828125, -1.696197509765625, -1.57940673828125, -1.462615966796875, -1.3458251953125, -1.229034423828125, -1.11224365234375, -0.995452880859375, -0.878662109375, -0.761871337890625, -0.64508056640625, -0.528289794921875, -0.4114990234375, -0.294708251953125, -0.17791748046875, -0.061126708984375, 0.0556640625, 0.172454833984375, 0.28924560546875, 0.406036376953125, 0.5228271484375, 0.639617919921875, 0.75640869140625, 0.873199462890625, 0.989990234375, 1.106781005859375, 1.22357177734375, 1.340362548828125, 1.4571533203125, 1.573944091796875, 1.69073486328125, 1.807525634765625, 1.92431640625, 2.041107177734375, 2.15789794921875, 2.274688720703125, 2.3914794921875, 2.508270263671875, 2.62506103515625, 2.741851806640625, 2.858642578125, 2.975433349609375, 3.09222412109375, 3.209014892578125, 3.3258056640625, 3.442596435546875, 3.55938720703125, 3.676177978515625, 3.79296875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 1.0, 8.0, 12.0, 10.0, 10.0, 12.0, 21.0, 17.0, 24.0, 21.0, 25.0, 16.0, 29.0, 36.0, 32.0, 46.0, 37.0, 43.0, 37.0, 43.0, 50.0, 36.0, 43.0, 41.0, 40.0, 39.0, 28.0, 33.0, 31.0, 26.0, 19.0, 27.0, 15.0, 12.0, 15.0, 14.0, 6.0, 10.0, 9.0, 5.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.103607177734375, -2.03533935546875, -1.967071533203125, -1.8988037109375, -1.830535888671875, -1.76226806640625, -1.694000244140625, -1.625732421875, -1.557464599609375, -1.48919677734375, -1.420928955078125, -1.3526611328125, -1.284393310546875, -1.21612548828125, -1.147857666015625, -1.07958984375, -1.011322021484375, -0.94305419921875, -0.874786376953125, -0.8065185546875, -0.738250732421875, -0.66998291015625, -0.601715087890625, -0.533447265625, -0.465179443359375, -0.39691162109375, -0.328643798828125, -0.2603759765625, -0.192108154296875, -0.12384033203125, -0.055572509765625, 0.0126953125, 0.080963134765625, 0.14923095703125, 0.217498779296875, 0.2857666015625, 0.354034423828125, 0.42230224609375, 0.490570068359375, 0.558837890625, 0.627105712890625, 0.69537353515625, 0.763641357421875, 0.8319091796875, 0.900177001953125, 0.96844482421875, 1.036712646484375, 1.10498046875, 1.173248291015625, 1.24151611328125, 1.309783935546875, 1.3780517578125, 1.446319580078125, 1.51458740234375, 1.582855224609375, 1.651123046875, 1.719390869140625, 1.78765869140625, 1.855926513671875, 1.9241943359375, 1.992462158203125, 2.06072998046875, 2.128997802734375, 2.197265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 7.0, 9.0, 14.0, 26.0, 35.0, 54.0, 74.0, 114.0, 171.0, 214.0, 309.0, 464.0, 659.0, 1069.0, 1631.0, 2518.0, 4450.0, 8460.0, 17438.0, 38248.0, 89579.0, 190745.0, 277061.0, 217166.0, 107261.0, 46866.0, 20808.0, 9741.0, 5282.0, 2869.0, 1758.0, 1043.0, 773.0, 482.0, 371.0, 228.0, 183.0, 123.0, 83.0, 43.0, 30.0, 25.0, 27.0, 17.0, 12.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.968170166015625, -3.84649658203125, -3.724822998046875, -3.6031494140625, -3.481475830078125, -3.35980224609375, -3.238128662109375, -3.116455078125, -2.994781494140625, -2.87310791015625, -2.751434326171875, -2.6297607421875, -2.508087158203125, -2.38641357421875, -2.264739990234375, -2.14306640625, -2.021392822265625, -1.89971923828125, -1.778045654296875, -1.6563720703125, -1.534698486328125, -1.41302490234375, -1.291351318359375, -1.169677734375, -1.048004150390625, -0.92633056640625, -0.804656982421875, -0.6829833984375, -0.561309814453125, -0.43963623046875, -0.317962646484375, -0.1962890625, -0.074615478515625, 0.04705810546875, 0.168731689453125, 0.2904052734375, 0.412078857421875, 0.53375244140625, 0.655426025390625, 0.777099609375, 0.898773193359375, 1.02044677734375, 1.142120361328125, 1.2637939453125, 1.385467529296875, 1.50714111328125, 1.628814697265625, 1.75048828125, 1.872161865234375, 1.99383544921875, 2.115509033203125, 2.2371826171875, 2.358856201171875, 2.48052978515625, 2.602203369140625, 2.723876953125, 2.845550537109375, 2.96722412109375, 3.088897705078125, 3.2105712890625, 3.332244873046875, 3.45391845703125, 3.575592041015625, 3.697265625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 23.0, 20.0, 38.0, 32.0, 57.0, 57.0, 95.0, 85.0, 123.0, 93.0, 78.0, 56.0, 70.0, 35.0, 29.0, 25.0, 16.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0005211830139160156, -0.0005088746547698975, -0.0004965662956237793, -0.00048425793647766113, -0.00047194957733154297, -0.0004596412181854248, -0.00044733285903930664, -0.0004350244998931885, -0.0004227161407470703, -0.00041040778160095215, -0.000398099422454834, -0.0003857910633087158, -0.00037348270416259766, -0.0003611743450164795, -0.00034886598587036133, -0.00033655762672424316, -0.000324249267578125, -0.00031194090843200684, -0.00029963254928588867, -0.0002873241901397705, -0.00027501583099365234, -0.0002627074718475342, -0.000250399112701416, -0.00023809075355529785, -0.0002257823944091797, -0.00021347403526306152, -0.00020116567611694336, -0.0001888573169708252, -0.00017654895782470703, -0.00016424059867858887, -0.0001519322395324707, -0.00013962388038635254, -0.00012731552124023438, -0.00011500716209411621, -0.00010269880294799805, -9.039044380187988e-05, -7.808208465576172e-05, -6.577372550964355e-05, -5.346536636352539e-05, -4.1157007217407227e-05, -2.8848648071289062e-05, -1.65402889251709e-05, -4.231929779052734e-06, 8.07642936706543e-06, 2.0384788513183594e-05, 3.269314765930176e-05, 4.500150680541992e-05, 5.7309865951538086e-05, 6.961822509765625e-05, 8.192658424377441e-05, 9.423494338989258e-05, 0.00010654330253601074, 0.0001188516616821289, 0.00013116002082824707, 0.00014346837997436523, 0.0001557767391204834, 0.00016808509826660156, 0.00018039345741271973, 0.0001927018165588379, 0.00020501017570495605, 0.00021731853485107422, 0.00022962689399719238, 0.00024193525314331055, 0.0002542436122894287, 0.0002665519714355469]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 20.0, 27.0, 33.0, 48.0, 85.0, 124.0, 174.0, 317.0, 464.0, 704.0, 1134.0, 1798.0, 3086.0, 5074.0, 8710.0, 14711.0, 24937.0, 41823.0, 68069.0, 102617.0, 138919.0, 159228.0, 150393.0, 117837.0, 81310.0, 51355.0, 30510.0, 18253.0, 10589.0, 6284.0, 3758.0, 2324.0, 1433.0, 816.0, 580.0, 329.0, 230.0, 150.0, 95.0, 63.0, 52.0, 26.0, 18.0, 14.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.0050048828125, -1.939697265625, -1.8743896484375, -1.80908203125, -1.7437744140625, -1.678466796875, -1.6131591796875, -1.5478515625, -1.4825439453125, -1.417236328125, -1.3519287109375, -1.28662109375, -1.2213134765625, -1.156005859375, -1.0906982421875, -1.025390625, -0.9600830078125, -0.894775390625, -0.8294677734375, -0.76416015625, -0.6988525390625, -0.633544921875, -0.5682373046875, -0.5029296875, -0.4376220703125, -0.372314453125, -0.3070068359375, -0.24169921875, -0.1763916015625, -0.111083984375, -0.0457763671875, 0.01953125, 0.0848388671875, 0.150146484375, 0.2154541015625, 0.28076171875, 0.3460693359375, 0.411376953125, 0.4766845703125, 0.5419921875, 0.6072998046875, 0.672607421875, 0.7379150390625, 0.80322265625, 0.8685302734375, 0.933837890625, 0.9991455078125, 1.064453125, 1.1297607421875, 1.195068359375, 1.2603759765625, 1.32568359375, 1.3909912109375, 1.456298828125, 1.5216064453125, 1.5869140625, 1.6522216796875, 1.717529296875, 1.7828369140625, 1.84814453125, 1.9134521484375, 1.978759765625, 2.0440673828125, 2.109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 7.0, 23.0, 14.0, 19.0, 19.0, 25.0, 28.0, 42.0, 45.0, 67.0, 62.0, 57.0, 51.0, 63.0, 66.0, 62.0, 56.0, 50.0, 41.0, 29.0, 35.0, 25.0, 19.0, 17.0, 19.0, 12.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.750335693359375, -0.72283935546875, -0.695343017578125, -0.6678466796875, -0.640350341796875, -0.61285400390625, -0.585357666015625, -0.557861328125, -0.530364990234375, -0.50286865234375, -0.475372314453125, -0.4478759765625, -0.420379638671875, -0.39288330078125, -0.365386962890625, -0.337890625, -0.310394287109375, -0.28289794921875, -0.255401611328125, -0.2279052734375, -0.200408935546875, -0.17291259765625, -0.145416259765625, -0.117919921875, -0.090423583984375, -0.06292724609375, -0.035430908203125, -0.0079345703125, 0.019561767578125, 0.04705810546875, 0.074554443359375, 0.10205078125, 0.129547119140625, 0.15704345703125, 0.184539794921875, 0.2120361328125, 0.239532470703125, 0.26702880859375, 0.294525146484375, 0.322021484375, 0.349517822265625, 0.37701416015625, 0.404510498046875, 0.4320068359375, 0.459503173828125, 0.48699951171875, 0.514495849609375, 0.5419921875, 0.569488525390625, 0.59698486328125, 0.624481201171875, 0.6519775390625, 0.679473876953125, 0.70697021484375, 0.734466552734375, 0.761962890625, 0.789459228515625, 0.81695556640625, 0.844451904296875, 0.8719482421875, 0.899444580078125, 0.92694091796875, 0.954437255859375, 0.98193359375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 8.0, 8.0, 12.0, 16.0, 12.0, 11.0, 9.0, 20.0, 20.0, 26.0, 29.0, 31.0, 44.0, 31.0, 44.0, 47.0, 43.0, 34.0, 38.0, 56.0, 45.0, 43.0, 42.0, 34.0, 39.0, 44.0, 30.0, 23.0, 20.0, 15.0, 23.0, 18.0, 13.0, 10.0, 12.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3753297328948975, -3.2676143646240234, -3.1598987579345703, -3.0521833896636963, -2.9444680213928223, -2.8367526531219482, -2.729037284851074, -2.621321678161621, -2.513606309890747, -2.405890941619873, -2.29817533493042, -2.190459966659546, -2.082744598388672, -1.9750292301177979, -1.8673137426376343, -1.7595982551574707, -1.6518828868865967, -1.5441675186157227, -1.436452031135559, -1.3287365436553955, -1.2210211753845215, -1.1133058071136475, -1.0055903196334839, -0.8978748917579651, -0.7901594638824463, -0.6824440360069275, -0.5747286081314087, -0.4670131802558899, -0.3592977523803711, -0.2515823245048523, -0.1438668966293335, -0.0361514687538147, 0.0715641975402832, 0.179279625415802, 0.2869950532913208, 0.3947104811668396, 0.5024259090423584, 0.6101413369178772, 0.717856764793396, 0.8255721926689148, 0.9332876205444336, 1.0410029888153076, 1.1487184762954712, 1.2564339637756348, 1.3641493320465088, 1.4718647003173828, 1.5795801877975464, 1.68729567527771, 1.795011043548584, 1.902726411819458, 2.010441780090332, 2.118157386779785, 2.225872755050659, 2.333588123321533, 2.4413037300109863, 2.5490190982818604, 2.6567344665527344, 2.7644498348236084, 2.8721652030944824, 2.9798808097839355, 3.0875961780548096, 3.1953115463256836, 3.3030271530151367, 3.4107425212860107, 3.5184578895568848]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 7.0, 13.0, 15.0, 25.0, 21.0, 14.0, 22.0, 27.0, 29.0, 25.0, 34.0, 38.0, 31.0, 39.0, 52.0, 41.0, 37.0, 47.0, 37.0, 49.0, 57.0, 22.0, 32.0, 34.0, 26.0, 19.0, 26.0, 23.0, 21.0, 12.0, 10.0, 19.0, 19.0, 12.0, 8.0, 9.0, 5.0, 2.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.945760726928711, -2.8403706550598145, -2.734980583190918, -2.6295905113220215, -2.524200677871704, -2.4188106060028076, -2.313420534133911, -2.2080304622650146, -2.1026406288146973, -1.9972505569458008, -1.8918606042861938, -1.7864705324172974, -1.6810805797576904, -1.575690507888794, -1.4703004360198975, -1.364910364151001, -1.2595202922821045, -1.154130220413208, -1.048740267753601, -0.9433501958847046, -0.8379601836204529, -0.7325701713562012, -0.6271800994873047, -0.521790087223053, -0.41640007495880127, -0.31101006269454956, -0.20562002062797546, -0.10022997856140137, 0.005160033702850342, 0.11055004596710205, 0.21594011783599854, 0.32133013010025024, 0.42672038078308105, 0.5321103930473328, 0.6375004053115845, 0.742890477180481, 0.8482804894447327, 0.9536705017089844, 1.0590605735778809, 1.1644506454467773, 1.2698405981063843, 1.3752306699752808, 1.4806206226348877, 1.5860106945037842, 1.6914007663726807, 1.7967907190322876, 1.902180790901184, 2.007570743560791, 2.1129608154296875, 2.218350887298584, 2.3237409591674805, 2.429131031036377, 2.5345208644866943, 2.639910936355591, 2.7453010082244873, 2.850691080093384, 2.956080913543701, 3.0614709854125977, 3.166861057281494, 3.2722511291503906, 3.377640962600708, 3.4830310344696045, 3.588421106338501, 3.6938111782073975, 3.799201250076294]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 13.0, 42.0, 50.0, 90.0, 144.0, 253.0, 415.0, 766.0, 1288.0, 2212.0, 3723.0, 6901.0, 12516.0, 22660.0, 40935.0, 75409.0, 135952.0, 239532.0, 395004.0, 572624.0, 692871.0, 669715.0, 520854.0, 343113.0, 202895.0, 114621.0, 62913.0, 34303.0, 18776.0, 10421.0, 5706.0, 3186.0, 1796.0, 1026.0, 627.0, 345.0, 204.0, 152.0, 86.0, 39.0, 32.0, 23.0, 12.0, 7.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.263671875, -3.15789794921875, -3.0521240234375, -2.94635009765625, -2.840576171875, -2.73480224609375, -2.6290283203125, -2.52325439453125, -2.41748046875, -2.31170654296875, -2.2059326171875, -2.10015869140625, -1.994384765625, -1.88861083984375, -1.7828369140625, -1.67706298828125, -1.5712890625, -1.46551513671875, -1.3597412109375, -1.25396728515625, -1.148193359375, -1.04241943359375, -0.9366455078125, -0.83087158203125, -0.72509765625, -0.61932373046875, -0.5135498046875, -0.40777587890625, -0.302001953125, -0.19622802734375, -0.0904541015625, 0.01531982421875, 0.12109375, 0.22686767578125, 0.3326416015625, 0.43841552734375, 0.544189453125, 0.64996337890625, 0.7557373046875, 0.86151123046875, 0.96728515625, 1.07305908203125, 1.1788330078125, 1.28460693359375, 1.390380859375, 1.49615478515625, 1.6019287109375, 1.70770263671875, 1.8134765625, 1.91925048828125, 2.0250244140625, 2.13079833984375, 2.236572265625, 2.34234619140625, 2.4481201171875, 2.55389404296875, 2.65966796875, 2.76544189453125, 2.8712158203125, 2.97698974609375, 3.082763671875, 3.18853759765625, 3.2943115234375, 3.40008544921875, 3.505859375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 6.0, 18.0, 16.0, 17.0, 16.0, 21.0, 21.0, 17.0, 23.0, 33.0, 27.0, 42.0, 40.0, 32.0, 45.0, 51.0, 40.0, 53.0, 42.0, 36.0, 51.0, 48.0, 40.0, 26.0, 27.0, 27.0, 23.0, 15.0, 23.0, 16.0, 23.0, 13.0, 12.0, 7.0, 8.0, 4.0, 6.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.29656982421875, -2.2122802734375, -2.12799072265625, -2.043701171875, -1.95941162109375, -1.8751220703125, -1.79083251953125, -1.70654296875, -1.62225341796875, -1.5379638671875, -1.45367431640625, -1.369384765625, -1.28509521484375, -1.2008056640625, -1.11651611328125, -1.0322265625, -0.94793701171875, -0.8636474609375, -0.77935791015625, -0.695068359375, -0.61077880859375, -0.5264892578125, -0.44219970703125, -0.35791015625, -0.27362060546875, -0.1893310546875, -0.10504150390625, -0.020751953125, 0.06353759765625, 0.1478271484375, 0.23211669921875, 0.31640625, 0.40069580078125, 0.4849853515625, 0.56927490234375, 0.653564453125, 0.73785400390625, 0.8221435546875, 0.90643310546875, 0.99072265625, 1.07501220703125, 1.1593017578125, 1.24359130859375, 1.327880859375, 1.41217041015625, 1.4964599609375, 1.58074951171875, 1.6650390625, 1.74932861328125, 1.8336181640625, 1.91790771484375, 2.002197265625, 2.08648681640625, 2.1707763671875, 2.25506591796875, 2.33935546875, 2.42364501953125, 2.5079345703125, 2.59222412109375, 2.676513671875, 2.76080322265625, 2.8450927734375, 2.92938232421875, 3.013671875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 28.0, 29.0, 44.0, 66.0, 110.0, 171.0, 317.0, 460.0, 730.0, 1145.0, 1851.0, 3119.0, 4697.0, 7517.0, 11720.0, 18551.0, 28126.0, 44187.0, 65869.0, 98796.0, 142659.0, 201026.0, 270242.0, 344086.0, 409945.0, 450180.0, 448690.0, 407470.0, 342459.0, 268034.0, 197844.0, 140808.0, 96534.0, 65353.0, 43292.0, 28456.0, 17860.0, 11682.0, 7422.0, 4683.0, 2922.0, 1929.0, 1211.0, 743.0, 440.0, 297.0, 170.0, 104.0, 83.0, 37.0, 30.0, 24.0, 10.0, 10.0, 5.0, 5.0, 1.0], "bins": [-2.427734375, -2.3541259765625, -2.280517578125, -2.2069091796875, -2.13330078125, -2.0596923828125, -1.986083984375, -1.9124755859375, -1.8388671875, -1.7652587890625, -1.691650390625, -1.6180419921875, -1.54443359375, -1.4708251953125, -1.397216796875, -1.3236083984375, -1.25, -1.1763916015625, -1.102783203125, -1.0291748046875, -0.95556640625, -0.8819580078125, -0.808349609375, -0.7347412109375, -0.6611328125, -0.5875244140625, -0.513916015625, -0.4403076171875, -0.36669921875, -0.2930908203125, -0.219482421875, -0.1458740234375, -0.072265625, 0.0013427734375, 0.074951171875, 0.1485595703125, 0.22216796875, 0.2957763671875, 0.369384765625, 0.4429931640625, 0.5166015625, 0.5902099609375, 0.663818359375, 0.7374267578125, 0.81103515625, 0.8846435546875, 0.958251953125, 1.0318603515625, 1.10546875, 1.1790771484375, 1.252685546875, 1.3262939453125, 1.39990234375, 1.4735107421875, 1.547119140625, 1.6207275390625, 1.6943359375, 1.7679443359375, 1.841552734375, 1.9151611328125, 1.98876953125, 2.0623779296875, 2.135986328125, 2.2095947265625, 2.283203125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 1.0, 6.0, 8.0, 13.0, 20.0, 15.0, 15.0, 32.0, 43.0, 63.0, 44.0, 59.0, 69.0, 90.0, 91.0, 114.0, 138.0, 152.0, 169.0, 176.0, 178.0, 220.0, 212.0, 223.0, 223.0, 204.0, 178.0, 187.0, 160.0, 173.0, 117.0, 122.0, 101.0, 71.0, 77.0, 70.0, 59.0, 44.0, 23.0, 23.0, 20.0, 18.0, 14.0, 11.0, 6.0, 10.0, 4.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.195556640625, -1.15966796875, -1.123779296875, -1.087890625, -1.052001953125, -1.01611328125, -0.980224609375, -0.9443359375, -0.908447265625, -0.87255859375, -0.836669921875, -0.80078125, -0.764892578125, -0.72900390625, -0.693115234375, -0.6572265625, -0.621337890625, -0.58544921875, -0.549560546875, -0.513671875, -0.477783203125, -0.44189453125, -0.406005859375, -0.3701171875, -0.334228515625, -0.29833984375, -0.262451171875, -0.2265625, -0.190673828125, -0.15478515625, -0.118896484375, -0.0830078125, -0.047119140625, -0.01123046875, 0.024658203125, 0.060546875, 0.096435546875, 0.13232421875, 0.168212890625, 0.2041015625, 0.239990234375, 0.27587890625, 0.311767578125, 0.34765625, 0.383544921875, 0.41943359375, 0.455322265625, 0.4912109375, 0.527099609375, 0.56298828125, 0.598876953125, 0.634765625, 0.670654296875, 0.70654296875, 0.742431640625, 0.7783203125, 0.814208984375, 0.85009765625, 0.885986328125, 0.921875, 0.957763671875, 0.99365234375, 1.029541015625, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 4.0, 1.0, 3.0, 6.0, 8.0, 8.0, 9.0, 10.0, 17.0, 17.0, 19.0, 15.0, 28.0, 27.0, 31.0, 30.0, 35.0, 31.0, 37.0, 34.0, 41.0, 34.0, 47.0, 40.0, 45.0, 38.0, 33.0, 41.0, 40.0, 42.0, 24.0, 25.0, 27.0, 25.0, 19.0, 17.0, 12.0, 10.0, 12.0, 16.0, 8.0, 7.0, 5.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.152416706085205, -3.0596210956573486, -2.966825485229492, -2.874030113220215, -2.7812345027923584, -2.688438892364502, -2.5956432819366455, -2.502847671508789, -2.4100522994995117, -2.3172566890716553, -2.224461078643799, -2.1316657066345215, -2.038870096206665, -1.9460744857788086, -1.8532788753509521, -1.7604832649230957, -1.6676876544952393, -1.5748920440673828, -1.482096552848816, -1.3893009424209595, -1.2965054512023926, -1.2037098407745361, -1.1109142303466797, -1.0181186199188232, -0.9253231287002563, -0.8325275778770447, -0.739732027053833, -0.6469364166259766, -0.5541408658027649, -0.4613453149795532, -0.3685497045516968, -0.2757541537284851, -0.18295836448669434, -0.09016279876232147, 0.0026327669620513916, 0.09542834758758545, 0.18822389841079712, 0.2810194492340088, 0.37381505966186523, 0.4666106104850769, 0.5594061613082886, 0.6522017121315002, 0.7449972629547119, 0.8377928733825684, 0.93058842420578, 1.0233839750289917, 1.1161795854568481, 1.208975076675415, 1.3017706871032715, 1.394566297531128, 1.4873617887496948, 1.5801573991775513, 1.6729528903961182, 1.7657485008239746, 1.858544111251831, 1.9513397216796875, 2.044135093688965, 2.1369307041168213, 2.2297263145446777, 2.322521686553955, 2.4153172969818115, 2.508112907409668, 2.6009085178375244, 2.693704128265381, 2.7864997386932373]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 22.0, 14.0, 19.0, 14.0, 15.0, 28.0, 24.0, 26.0, 32.0, 35.0, 34.0, 39.0, 39.0, 36.0, 40.0, 42.0, 51.0, 39.0, 33.0, 33.0, 41.0, 32.0, 40.0, 24.0, 20.0, 30.0, 16.0, 23.0, 21.0, 17.0, 13.0, 13.0, 15.0, 7.0, 9.0, 12.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.8398711681365967, -2.7512996196746826, -2.6627280712127686, -2.5741565227508545, -2.4855849742889404, -2.3970134258270264, -2.3084418773651123, -2.2198703289031982, -2.131298780441284, -2.04272723197937, -1.954155683517456, -1.865584135055542, -1.777012586593628, -1.6884410381317139, -1.5998694896697998, -1.5112979412078857, -1.4227263927459717, -1.3341548442840576, -1.2455832958221436, -1.1570117473602295, -1.0684401988983154, -0.9798686504364014, -0.8912971019744873, -0.8027255535125732, -0.7141540050506592, -0.6255824565887451, -0.537010908126831, -0.448439359664917, -0.35986781120300293, -0.27129626274108887, -0.1827247142791748, -0.09415316581726074, -0.005581855773925781, 0.08298969268798828, 0.17156124114990234, 0.2601327896118164, 0.34870433807373047, 0.43727588653564453, 0.5258474349975586, 0.6144189834594727, 0.7029905319213867, 0.7915620803833008, 0.8801336288452148, 0.9687051773071289, 1.057276725769043, 1.145848274230957, 1.234419822692871, 1.3229913711547852, 1.4115629196166992, 1.5001344680786133, 1.5887060165405273, 1.6772775650024414, 1.7658491134643555, 1.8544206619262695, 1.9429922103881836, 2.0315637588500977, 2.1201353073120117, 2.208706855773926, 2.29727840423584, 2.385849952697754, 2.474421501159668, 2.562993049621582, 2.651564598083496, 2.74013614654541, 2.828707695007324]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 2.0, 2.0, 4.0, 13.0, 21.0, 22.0, 29.0, 49.0, 68.0, 92.0, 115.0, 192.0, 271.0, 337.0, 484.0, 699.0, 1083.0, 1524.0, 2506.0, 3839.0, 6468.0, 11483.0, 22072.0, 46646.0, 104451.0, 237465.0, 313001.0, 157298.0, 68453.0, 31705.0, 15762.0, 8478.0, 4894.0, 3008.0, 1921.0, 1273.0, 818.0, 602.0, 399.0, 289.0, 204.0, 131.0, 117.0, 73.0, 55.0, 37.0, 32.0, 12.0, 17.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.9017333984375, -3.768310546875, -3.6348876953125, -3.50146484375, -3.3680419921875, -3.234619140625, -3.1011962890625, -2.9677734375, -2.8343505859375, -2.700927734375, -2.5675048828125, -2.43408203125, -2.3006591796875, -2.167236328125, -2.0338134765625, -1.900390625, -1.7669677734375, -1.633544921875, -1.5001220703125, -1.36669921875, -1.2332763671875, -1.099853515625, -0.9664306640625, -0.8330078125, -0.6995849609375, -0.566162109375, -0.4327392578125, -0.29931640625, -0.1658935546875, -0.032470703125, 0.1009521484375, 0.234375, 0.3677978515625, 0.501220703125, 0.6346435546875, 0.76806640625, 0.9014892578125, 1.034912109375, 1.1683349609375, 1.3017578125, 1.4351806640625, 1.568603515625, 1.7020263671875, 1.83544921875, 1.9688720703125, 2.102294921875, 2.2357177734375, 2.369140625, 2.5025634765625, 2.635986328125, 2.7694091796875, 2.90283203125, 3.0362548828125, 3.169677734375, 3.3031005859375, 3.4365234375, 3.5699462890625, 3.703369140625, 3.8367919921875, 3.97021484375, 4.1036376953125, 4.237060546875, 4.3704833984375, 4.50390625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 9.0, 10.0, 6.0, 11.0, 16.0, 16.0, 16.0, 19.0, 23.0, 38.0, 32.0, 21.0, 33.0, 30.0, 28.0, 46.0, 38.0, 36.0, 42.0, 35.0, 39.0, 42.0, 39.0, 22.0, 46.0, 29.0, 31.0, 32.0, 27.0, 22.0, 20.0, 21.0, 13.0, 14.0, 14.0, 14.0, 8.0, 8.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.80859375, -2.71929931640625, -2.6300048828125, -2.54071044921875, -2.451416015625, -2.36212158203125, -2.2728271484375, -2.18353271484375, -2.09423828125, -2.00494384765625, -1.9156494140625, -1.82635498046875, -1.737060546875, -1.64776611328125, -1.5584716796875, -1.46917724609375, -1.3798828125, -1.29058837890625, -1.2012939453125, -1.11199951171875, -1.022705078125, -0.93341064453125, -0.8441162109375, -0.75482177734375, -0.66552734375, -0.57623291015625, -0.4869384765625, -0.39764404296875, -0.308349609375, -0.21905517578125, -0.1297607421875, -0.04046630859375, 0.048828125, 0.13812255859375, 0.2274169921875, 0.31671142578125, 0.406005859375, 0.49530029296875, 0.5845947265625, 0.67388916015625, 0.76318359375, 0.85247802734375, 0.9417724609375, 1.03106689453125, 1.120361328125, 1.20965576171875, 1.2989501953125, 1.38824462890625, 1.4775390625, 1.56683349609375, 1.6561279296875, 1.74542236328125, 1.834716796875, 1.92401123046875, 2.0133056640625, 2.10260009765625, 2.19189453125, 2.28118896484375, 2.3704833984375, 2.45977783203125, 2.549072265625, 2.63836669921875, 2.7276611328125, 2.81695556640625, 2.90625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 14.0, 27.0, 29.0, 42.0, 56.0, 89.0, 127.0, 200.0, 265.0, 501.0, 719.0, 1161.0, 1938.0, 3525.0, 6547.0, 13789.0, 31677.0, 84733.0, 254156.0, 391021.0, 159702.0, 54669.0, 21714.0, 9856.0, 5035.0, 2731.0, 1539.0, 979.0, 544.0, 339.0, 236.0, 173.0, 116.0, 85.0, 56.0, 34.0, 30.0, 20.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.539306640625, -3.41845703125, -3.297607421875, -3.1767578125, -3.055908203125, -2.93505859375, -2.814208984375, -2.693359375, -2.572509765625, -2.45166015625, -2.330810546875, -2.2099609375, -2.089111328125, -1.96826171875, -1.847412109375, -1.7265625, -1.605712890625, -1.48486328125, -1.364013671875, -1.2431640625, -1.122314453125, -1.00146484375, -0.880615234375, -0.759765625, -0.638916015625, -0.51806640625, -0.397216796875, -0.2763671875, -0.155517578125, -0.03466796875, 0.086181640625, 0.20703125, 0.327880859375, 0.44873046875, 0.569580078125, 0.6904296875, 0.811279296875, 0.93212890625, 1.052978515625, 1.173828125, 1.294677734375, 1.41552734375, 1.536376953125, 1.6572265625, 1.778076171875, 1.89892578125, 2.019775390625, 2.140625, 2.261474609375, 2.38232421875, 2.503173828125, 2.6240234375, 2.744873046875, 2.86572265625, 2.986572265625, 3.107421875, 3.228271484375, 3.34912109375, 3.469970703125, 3.5908203125, 3.711669921875, 3.83251953125, 3.953369140625, 4.07421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 8.0, 10.0, 10.0, 16.0, 23.0, 28.0, 23.0, 31.0, 35.0, 32.0, 40.0, 44.0, 29.0, 52.0, 55.0, 45.0, 45.0, 41.0, 42.0, 47.0, 33.0, 37.0, 47.0, 33.0, 28.0, 31.0, 21.0, 22.0, 18.0, 17.0, 15.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.701263427734375, -2.62518310546875, -2.549102783203125, -2.4730224609375, -2.396942138671875, -2.32086181640625, -2.244781494140625, -2.168701171875, -2.092620849609375, -2.01654052734375, -1.940460205078125, -1.8643798828125, -1.788299560546875, -1.71221923828125, -1.636138916015625, -1.56005859375, -1.483978271484375, -1.40789794921875, -1.331817626953125, -1.2557373046875, -1.179656982421875, -1.10357666015625, -1.027496337890625, -0.951416015625, -0.875335693359375, -0.79925537109375, -0.723175048828125, -0.6470947265625, -0.571014404296875, -0.49493408203125, -0.418853759765625, -0.3427734375, -0.266693115234375, -0.19061279296875, -0.114532470703125, -0.0384521484375, 0.037628173828125, 0.11370849609375, 0.189788818359375, 0.265869140625, 0.341949462890625, 0.41802978515625, 0.494110107421875, 0.5701904296875, 0.646270751953125, 0.72235107421875, 0.798431396484375, 0.87451171875, 0.950592041015625, 1.02667236328125, 1.102752685546875, 1.1788330078125, 1.254913330078125, 1.33099365234375, 1.407073974609375, 1.483154296875, 1.559234619140625, 1.63531494140625, 1.711395263671875, 1.7874755859375, 1.863555908203125, 1.93963623046875, 2.015716552734375, 2.091796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 19.0, 19.0, 15.0, 37.0, 43.0, 56.0, 83.0, 112.0, 133.0, 146.0, 205.0, 248.0, 409.0, 535.0, 765.0, 1223.0, 2007.0, 3742.0, 7620.0, 20970.0, 106441.0, 767546.0, 98922.0, 20142.0, 7623.0, 3575.0, 1962.0, 1206.0, 739.0, 500.0, 370.0, 270.0, 219.0, 165.0, 119.0, 88.0, 60.0, 49.0, 40.0, 22.0, 23.0, 16.0, 18.0, 5.0, 10.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.41796875, -5.25616455078125, -5.0943603515625, -4.93255615234375, -4.770751953125, -4.60894775390625, -4.4471435546875, -4.28533935546875, -4.12353515625, -3.96173095703125, -3.7999267578125, -3.63812255859375, -3.476318359375, -3.31451416015625, -3.1527099609375, -2.99090576171875, -2.8291015625, -2.66729736328125, -2.5054931640625, -2.34368896484375, -2.181884765625, -2.02008056640625, -1.8582763671875, -1.69647216796875, -1.53466796875, -1.37286376953125, -1.2110595703125, -1.04925537109375, -0.887451171875, -0.72564697265625, -0.5638427734375, -0.40203857421875, -0.240234375, -0.07843017578125, 0.0833740234375, 0.24517822265625, 0.406982421875, 0.56878662109375, 0.7305908203125, 0.89239501953125, 1.05419921875, 1.21600341796875, 1.3778076171875, 1.53961181640625, 1.701416015625, 1.86322021484375, 2.0250244140625, 2.18682861328125, 2.3486328125, 2.51043701171875, 2.6722412109375, 2.83404541015625, 2.995849609375, 3.15765380859375, 3.3194580078125, 3.48126220703125, 3.64306640625, 3.80487060546875, 3.9666748046875, 4.12847900390625, 4.290283203125, 4.45208740234375, 4.6138916015625, 4.77569580078125, 4.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 3.0, 12.0, 19.0, 30.0, 55.0, 110.0, 185.0, 244.0, 125.0, 73.0, 43.0, 28.0, 13.0, 8.0, 7.0, 6.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004253387451171875, -0.00041211768984794617, -0.00039889663457870483, -0.0003856755793094635, -0.00037245452404022217, -0.00035923346877098083, -0.0003460124135017395, -0.00033279135823249817, -0.00031957030296325684, -0.0003063492476940155, -0.00029312819242477417, -0.00027990713715553284, -0.0002666860818862915, -0.00025346502661705017, -0.00024024397134780884, -0.0002270229160785675, -0.00021380186080932617, -0.00020058080554008484, -0.0001873597502708435, -0.00017413869500160217, -0.00016091763973236084, -0.0001476965844631195, -0.00013447552919387817, -0.00012125447392463684, -0.00010803341865539551, -9.481236338615417e-05, -8.159130811691284e-05, -6.837025284767151e-05, -5.5149197578430176e-05, -4.192814230918884e-05, -2.870708703994751e-05, -1.5486031770706177e-05, -2.2649765014648438e-06, 1.095607876777649e-05, 2.4177134037017822e-05, 3.7398189306259155e-05, 5.061924457550049e-05, 6.384029984474182e-05, 7.706135511398315e-05, 9.028241038322449e-05, 0.00010350346565246582, 0.00011672452092170715, 0.00012994557619094849, 0.00014316663146018982, 0.00015638768672943115, 0.00016960874199867249, 0.00018282979726791382, 0.00019605085253715515, 0.00020927190780639648, 0.00022249296307563782, 0.00023571401834487915, 0.0002489350736141205, 0.0002621561288833618, 0.00027537718415260315, 0.0002885982394218445, 0.0003018192946910858, 0.00031504034996032715, 0.0003282614052295685, 0.0003414824604988098, 0.00035470351576805115, 0.0003679245710372925, 0.0003811456263065338, 0.00039436668157577515, 0.0004075877368450165, 0.0004208087921142578]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 11.0, 19.0, 33.0, 56.0, 72.0, 88.0, 133.0, 163.0, 199.0, 288.0, 435.0, 678.0, 1041.0, 1640.0, 2424.0, 3801.0, 6716.0, 12820.0, 29486.0, 90729.0, 436349.0, 337131.0, 71840.0, 24842.0, 11313.0, 6151.0, 3524.0, 2198.0, 1399.0, 947.0, 586.0, 403.0, 274.0, 211.0, 149.0, 116.0, 83.0, 54.0, 44.0, 36.0, 22.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.845703125, -3.721282958984375, -3.59686279296875, -3.472442626953125, -3.3480224609375, -3.223602294921875, -3.09918212890625, -2.974761962890625, -2.850341796875, -2.725921630859375, -2.60150146484375, -2.477081298828125, -2.3526611328125, -2.228240966796875, -2.10382080078125, -1.979400634765625, -1.85498046875, -1.730560302734375, -1.60614013671875, -1.481719970703125, -1.3572998046875, -1.232879638671875, -1.10845947265625, -0.984039306640625, -0.859619140625, -0.735198974609375, -0.61077880859375, -0.486358642578125, -0.3619384765625, -0.237518310546875, -0.11309814453125, 0.011322021484375, 0.1357421875, 0.260162353515625, 0.38458251953125, 0.509002685546875, 0.6334228515625, 0.757843017578125, 0.88226318359375, 1.006683349609375, 1.131103515625, 1.255523681640625, 1.37994384765625, 1.504364013671875, 1.6287841796875, 1.753204345703125, 1.87762451171875, 2.002044677734375, 2.12646484375, 2.250885009765625, 2.37530517578125, 2.499725341796875, 2.6241455078125, 2.748565673828125, 2.87298583984375, 2.997406005859375, 3.121826171875, 3.246246337890625, 3.37066650390625, 3.495086669921875, 3.6195068359375, 3.743927001953125, 3.86834716796875, 3.992767333984375, 4.1171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 9.0, 14.0, 13.0, 9.0, 29.0, 42.0, 55.0, 104.0, 188.0, 165.0, 107.0, 62.0, 55.0, 32.0, 20.0, 21.0, 14.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.974609375, -0.9459228515625, -0.917236328125, -0.8885498046875, -0.85986328125, -0.8311767578125, -0.802490234375, -0.7738037109375, -0.7451171875, -0.7164306640625, -0.687744140625, -0.6590576171875, -0.63037109375, -0.6016845703125, -0.572998046875, -0.5443115234375, -0.515625, -0.4869384765625, -0.458251953125, -0.4295654296875, -0.40087890625, -0.3721923828125, -0.343505859375, -0.3148193359375, -0.2861328125, -0.2574462890625, -0.228759765625, -0.2000732421875, -0.17138671875, -0.1427001953125, -0.114013671875, -0.0853271484375, -0.056640625, -0.0279541015625, 0.000732421875, 0.0294189453125, 0.05810546875, 0.0867919921875, 0.115478515625, 0.1441650390625, 0.1728515625, 0.2015380859375, 0.230224609375, 0.2589111328125, 0.28759765625, 0.3162841796875, 0.344970703125, 0.3736572265625, 0.40234375, 0.4310302734375, 0.459716796875, 0.4884033203125, 0.51708984375, 0.5457763671875, 0.574462890625, 0.6031494140625, 0.6318359375, 0.6605224609375, 0.689208984375, 0.7178955078125, 0.74658203125, 0.7752685546875, 0.803955078125, 0.8326416015625, 0.861328125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 4.0, 1.0, 13.0, 12.0, 6.0, 15.0, 13.0, 26.0, 23.0, 26.0, 27.0, 27.0, 32.0, 28.0, 35.0, 32.0, 36.0, 34.0, 42.0, 32.0, 57.0, 52.0, 44.0, 34.0, 37.0, 32.0, 28.0, 24.0, 33.0, 25.0, 17.0, 17.0, 19.0, 21.0, 19.0, 10.0, 11.0, 7.0, 6.0, 11.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.174232006072998, -3.0808262825012207, -2.9874205589294434, -2.894014596939087, -2.8006088733673096, -2.7072031497955322, -2.613797426223755, -2.5203914642333984, -2.426985740661621, -2.3335800170898438, -2.2401742935180664, -2.14676833152771, -2.0533626079559326, -1.9599568843841553, -1.866551160812378, -1.773145318031311, -1.6797395944595337, -1.5863338708877563, -1.4929280281066895, -1.399522304534912, -1.3061164617538452, -1.2127107381820679, -1.119304895401001, -1.0258991718292236, -0.9324933886528015, -0.8390876054763794, -0.7456818222999573, -0.6522760391235352, -0.5588703155517578, -0.4654645025730133, -0.3720587491989136, -0.27865296602249146, -0.18524718284606934, -0.09184140712022781, 0.0015643686056137085, 0.09497013688087463, 0.18837592005729675, 0.28178170323371887, 0.3751874566078186, 0.4685932397842407, 0.5619990229606628, 0.655404806137085, 0.7488105893135071, 0.8422163724899292, 0.9356220960617065, 1.0290279388427734, 1.1224336624145508, 1.2158393859863281, 1.309245228767395, 1.4026509523391724, 1.4960567951202393, 1.5894625186920166, 1.6828683614730835, 1.7762740850448608, 1.8696799278259277, 1.963085651397705, 2.0564913749694824, 2.1498970985412598, 2.243302822113037, 2.3367087841033936, 2.430114507675171, 2.5235202312469482, 2.6169259548187256, 2.710331916809082, 2.8037376403808594]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 2.0, 20.0, 16.0, 15.0, 11.0, 15.0, 19.0, 20.0, 28.0, 32.0, 28.0, 29.0, 28.0, 48.0, 49.0, 27.0, 36.0, 45.0, 37.0, 44.0, 39.0, 37.0, 48.0, 34.0, 41.0, 25.0, 20.0, 18.0, 22.0, 29.0, 12.0, 21.0, 21.0, 12.0, 11.0, 13.0, 10.0, 3.0, 9.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.7933664321899414, -2.7040176391601562, -2.614668846130371, -2.525320053100586, -2.4359710216522217, -2.3466222286224365, -2.2572734355926514, -2.167924642562866, -2.078575611114502, -1.9892268180847168, -1.899877905845642, -1.810529112815857, -1.7211802005767822, -1.631831407546997, -1.542482614517212, -1.4531338214874268, -1.3637850284576416, -1.2744362354278564, -1.1850873231887817, -1.0957385301589966, -1.0063896179199219, -0.9170408248901367, -0.8276920318603516, -0.7383431792259216, -0.6489943265914917, -0.5596454739570618, -0.4702966511249542, -0.3809478282928467, -0.29159897565841675, -0.20225012302398682, -0.11290132999420166, -0.02355247735977173, 0.0657963752746582, 0.15514521300792694, 0.24449405074119568, 0.3338428735733032, 0.42319172620773315, 0.5125405788421631, 0.6018893718719482, 0.6912382245063782, 0.7805870771408081, 0.869935929775238, 0.959284782409668, 1.0486335754394531, 1.1379823684692383, 1.227331280708313, 1.3166800737380981, 1.4060289859771729, 1.495377779006958, 1.5847265720367432, 1.6740754842758179, 1.763424277305603, 1.8527731895446777, 1.942121982574463, 2.031470775604248, 2.120819568634033, 2.2101683616638184, 2.2995171546936035, 2.3888659477233887, 2.478214740753174, 2.567563772201538, 2.6569125652313232, 2.7462613582611084, 2.8356101512908936, 2.924959182739258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 14.0, 23.0, 45.0, 66.0, 93.0, 130.0, 221.0, 299.0, 523.0, 730.0, 1283.0, 1939.0, 3103.0, 4794.0, 7696.0, 11811.0, 18349.0, 28291.0, 41647.0, 58858.0, 79424.0, 100235.0, 115517.0, 119991.0, 112949.0, 96590.0, 76039.0, 55562.0, 38503.0, 26410.0, 17105.0, 10993.0, 7077.0, 4440.0, 2772.0, 1825.0, 1125.0, 730.0, 506.0, 347.0, 192.0, 104.0, 62.0, 41.0, 41.0, 22.0, 16.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.765625, -3.65618896484375, -3.5467529296875, -3.43731689453125, -3.327880859375, -3.21844482421875, -3.1090087890625, -2.99957275390625, -2.89013671875, -2.78070068359375, -2.6712646484375, -2.56182861328125, -2.452392578125, -2.34295654296875, -2.2335205078125, -2.12408447265625, -2.0146484375, -1.90521240234375, -1.7957763671875, -1.68634033203125, -1.576904296875, -1.46746826171875, -1.3580322265625, -1.24859619140625, -1.13916015625, -1.02972412109375, -0.9202880859375, -0.81085205078125, -0.701416015625, -0.59197998046875, -0.4825439453125, -0.37310791015625, -0.263671875, -0.15423583984375, -0.0447998046875, 0.06463623046875, 0.174072265625, 0.28350830078125, 0.3929443359375, 0.50238037109375, 0.61181640625, 0.72125244140625, 0.8306884765625, 0.94012451171875, 1.049560546875, 1.15899658203125, 1.2684326171875, 1.37786865234375, 1.4873046875, 1.59674072265625, 1.7061767578125, 1.81561279296875, 1.925048828125, 2.03448486328125, 2.1439208984375, 2.25335693359375, 2.36279296875, 2.47222900390625, 2.5816650390625, 2.69110107421875, 2.800537109375, 2.90997314453125, 3.0194091796875, 3.12884521484375, 3.23828125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 15.0, 16.0, 11.0, 26.0, 23.0, 25.0, 24.0, 24.0, 37.0, 29.0, 34.0, 31.0, 45.0, 39.0, 36.0, 44.0, 37.0, 43.0, 45.0, 31.0, 36.0, 39.0, 39.0, 27.0, 17.0, 29.0, 25.0, 20.0, 15.0, 15.0, 16.0, 11.0, 12.0, 13.0, 9.0, 12.0, 6.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.330169677734375, -2.24432373046875, -2.158477783203125, -2.0726318359375, -1.986785888671875, -1.90093994140625, -1.815093994140625, -1.729248046875, -1.643402099609375, -1.55755615234375, -1.471710205078125, -1.3858642578125, -1.300018310546875, -1.21417236328125, -1.128326416015625, -1.04248046875, -0.956634521484375, -0.87078857421875, -0.784942626953125, -0.6990966796875, -0.613250732421875, -0.52740478515625, -0.441558837890625, -0.355712890625, -0.269866943359375, -0.18402099609375, -0.098175048828125, -0.0123291015625, 0.073516845703125, 0.15936279296875, 0.245208740234375, 0.3310546875, 0.416900634765625, 0.50274658203125, 0.588592529296875, 0.6744384765625, 0.760284423828125, 0.84613037109375, 0.931976318359375, 1.017822265625, 1.103668212890625, 1.18951416015625, 1.275360107421875, 1.3612060546875, 1.447052001953125, 1.53289794921875, 1.618743896484375, 1.70458984375, 1.790435791015625, 1.87628173828125, 1.962127685546875, 2.0479736328125, 2.133819580078125, 2.21966552734375, 2.305511474609375, 2.391357421875, 2.477203369140625, 2.56304931640625, 2.648895263671875, 2.7347412109375, 2.820587158203125, 2.90643310546875, 2.992279052734375, 3.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 16.0, 21.0, 31.0, 45.0, 95.0, 123.0, 188.0, 301.0, 490.0, 748.0, 1207.0, 1884.0, 3011.0, 4532.0, 7134.0, 11006.0, 16454.0, 25095.0, 36265.0, 50526.0, 67738.0, 85888.0, 101337.0, 110327.0, 110202.0, 101222.0, 85537.0, 67968.0, 50687.0, 35781.0, 24820.0, 16604.0, 11159.0, 7252.0, 4701.0, 2849.0, 1895.0, 1226.0, 820.0, 481.0, 309.0, 207.0, 136.0, 86.0, 51.0, 40.0, 20.0, 14.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.984375, -2.89111328125, -2.7978515625, -2.70458984375, -2.611328125, -2.51806640625, -2.4248046875, -2.33154296875, -2.23828125, -2.14501953125, -2.0517578125, -1.95849609375, -1.865234375, -1.77197265625, -1.6787109375, -1.58544921875, -1.4921875, -1.39892578125, -1.3056640625, -1.21240234375, -1.119140625, -1.02587890625, -0.9326171875, -0.83935546875, -0.74609375, -0.65283203125, -0.5595703125, -0.46630859375, -0.373046875, -0.27978515625, -0.1865234375, -0.09326171875, 0.0, 0.09326171875, 0.1865234375, 0.27978515625, 0.373046875, 0.46630859375, 0.5595703125, 0.65283203125, 0.74609375, 0.83935546875, 0.9326171875, 1.02587890625, 1.119140625, 1.21240234375, 1.3056640625, 1.39892578125, 1.4921875, 1.58544921875, 1.6787109375, 1.77197265625, 1.865234375, 1.95849609375, 2.0517578125, 2.14501953125, 2.23828125, 2.33154296875, 2.4248046875, 2.51806640625, 2.611328125, 2.70458984375, 2.7978515625, 2.89111328125, 2.984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 14.0, 13.0, 15.0, 23.0, 20.0, 23.0, 33.0, 36.0, 44.0, 28.0, 42.0, 27.0, 38.0, 33.0, 43.0, 37.0, 42.0, 43.0, 34.0, 41.0, 37.0, 38.0, 25.0, 26.0, 22.0, 24.0, 20.0, 27.0, 20.0, 17.0, 9.0, 13.0, 10.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.7958984375, -1.739959716796875, -1.68402099609375, -1.628082275390625, -1.5721435546875, -1.516204833984375, -1.46026611328125, -1.404327392578125, -1.348388671875, -1.292449951171875, -1.23651123046875, -1.180572509765625, -1.1246337890625, -1.068695068359375, -1.01275634765625, -0.956817626953125, -0.90087890625, -0.844940185546875, -0.78900146484375, -0.733062744140625, -0.6771240234375, -0.621185302734375, -0.56524658203125, -0.509307861328125, -0.453369140625, -0.397430419921875, -0.34149169921875, -0.285552978515625, -0.2296142578125, -0.173675537109375, -0.11773681640625, -0.061798095703125, -0.005859375, 0.050079345703125, 0.10601806640625, 0.161956787109375, 0.2178955078125, 0.273834228515625, 0.32977294921875, 0.385711669921875, 0.441650390625, 0.497589111328125, 0.55352783203125, 0.609466552734375, 0.6654052734375, 0.721343994140625, 0.77728271484375, 0.833221435546875, 0.88916015625, 0.945098876953125, 1.00103759765625, 1.056976318359375, 1.1129150390625, 1.168853759765625, 1.22479248046875, 1.280731201171875, 1.336669921875, 1.392608642578125, 1.44854736328125, 1.504486083984375, 1.5604248046875, 1.616363525390625, 1.67230224609375, 1.728240966796875, 1.7841796875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 16.0, 21.0, 34.0, 35.0, 56.0, 69.0, 114.0, 148.0, 228.0, 311.0, 460.0, 663.0, 1018.0, 1496.0, 2350.0, 3549.0, 5894.0, 9731.0, 17415.0, 33431.0, 66910.0, 132532.0, 217598.0, 231647.0, 153825.0, 79651.0, 39736.0, 20362.0, 11113.0, 6506.0, 3977.0, 2474.0, 1688.0, 1082.0, 768.0, 524.0, 347.0, 229.0, 160.0, 111.0, 89.0, 76.0, 32.0, 19.0, 25.0, 12.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.34783935546875, -3.2366943359375, -3.12554931640625, -3.014404296875, -2.90325927734375, -2.7921142578125, -2.68096923828125, -2.56982421875, -2.45867919921875, -2.3475341796875, -2.23638916015625, -2.125244140625, -2.01409912109375, -1.9029541015625, -1.79180908203125, -1.6806640625, -1.56951904296875, -1.4583740234375, -1.34722900390625, -1.236083984375, -1.12493896484375, -1.0137939453125, -0.90264892578125, -0.79150390625, -0.68035888671875, -0.5692138671875, -0.45806884765625, -0.346923828125, -0.23577880859375, -0.1246337890625, -0.01348876953125, 0.09765625, 0.20880126953125, 0.3199462890625, 0.43109130859375, 0.542236328125, 0.65338134765625, 0.7645263671875, 0.87567138671875, 0.98681640625, 1.09796142578125, 1.2091064453125, 1.32025146484375, 1.431396484375, 1.54254150390625, 1.6536865234375, 1.76483154296875, 1.8759765625, 1.98712158203125, 2.0982666015625, 2.20941162109375, 2.320556640625, 2.43170166015625, 2.5428466796875, 2.65399169921875, 2.76513671875, 2.87628173828125, 2.9874267578125, 3.09857177734375, 3.209716796875, 3.32086181640625, 3.4320068359375, 3.54315185546875, 3.654296875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 10.0, 15.0, 27.0, 32.0, 42.0, 79.0, 85.0, 96.0, 111.0, 94.0, 71.0, 81.0, 63.0, 47.0, 38.0, 19.0, 18.0, 13.0, 13.0, 11.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047779083251953125, -0.00046325474977493286, -0.00044871866703033447, -0.0004341825842857361, -0.0004196465015411377, -0.0004051104187965393, -0.0003905743360519409, -0.00037603825330734253, -0.00036150217056274414, -0.00034696608781814575, -0.00033243000507354736, -0.000317893922328949, -0.0003033578395843506, -0.0002888217568397522, -0.0002742856740951538, -0.0002597495913505554, -0.00024521350860595703, -0.00023067742586135864, -0.00021614134311676025, -0.00020160526037216187, -0.00018706917762756348, -0.0001725330948829651, -0.0001579970121383667, -0.0001434609293937683, -0.00012892484664916992, -0.00011438876390457153, -9.985268115997314e-05, -8.531659841537476e-05, -7.078051567077637e-05, -5.624443292617798e-05, -4.170835018157959e-05, -2.71722674369812e-05, -1.2636184692382812e-05, 1.8998980522155762e-06, 1.6435980796813965e-05, 3.0972063541412354e-05, 4.550814628601074e-05, 6.004422903060913e-05, 7.458031177520752e-05, 8.911639451980591e-05, 0.0001036524772644043, 0.00011818856000900269, 0.00013272464275360107, 0.00014726072549819946, 0.00016179680824279785, 0.00017633289098739624, 0.00019086897373199463, 0.00020540505647659302, 0.0002199411392211914, 0.0002344772219657898, 0.0002490133047103882, 0.00026354938745498657, 0.00027808547019958496, 0.00029262155294418335, 0.00030715763568878174, 0.0003216937184333801, 0.0003362298011779785, 0.0003507658839225769, 0.0003653019666671753, 0.0003798380494117737, 0.00039437413215637207, 0.00040891021490097046, 0.00042344629764556885, 0.00043798238039016724, 0.0004525184631347656]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 14.0, 22.0, 27.0, 33.0, 35.0, 64.0, 112.0, 168.0, 228.0, 360.0, 512.0, 842.0, 1307.0, 2104.0, 3298.0, 5192.0, 8411.0, 14035.0, 23373.0, 38006.0, 61430.0, 93142.0, 128271.0, 152090.0, 150744.0, 124570.0, 88632.0, 58383.0, 36039.0, 22086.0, 13382.0, 8056.0, 4998.0, 3038.0, 1966.0, 1197.0, 777.0, 552.0, 328.0, 222.0, 150.0, 123.0, 67.0, 48.0, 35.0, 26.0, 14.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-2.1484375, -2.083221435546875, -2.01800537109375, -1.952789306640625, -1.8875732421875, -1.822357177734375, -1.75714111328125, -1.691925048828125, -1.626708984375, -1.561492919921875, -1.49627685546875, -1.431060791015625, -1.3658447265625, -1.300628662109375, -1.23541259765625, -1.170196533203125, -1.10498046875, -1.039764404296875, -0.97454833984375, -0.909332275390625, -0.8441162109375, -0.778900146484375, -0.71368408203125, -0.648468017578125, -0.583251953125, -0.518035888671875, -0.45281982421875, -0.387603759765625, -0.3223876953125, -0.257171630859375, -0.19195556640625, -0.126739501953125, -0.0615234375, 0.003692626953125, 0.06890869140625, 0.134124755859375, 0.1993408203125, 0.264556884765625, 0.32977294921875, 0.394989013671875, 0.460205078125, 0.525421142578125, 0.59063720703125, 0.655853271484375, 0.7210693359375, 0.786285400390625, 0.85150146484375, 0.916717529296875, 0.98193359375, 1.047149658203125, 1.11236572265625, 1.177581787109375, 1.2427978515625, 1.308013916015625, 1.37322998046875, 1.438446044921875, 1.503662109375, 1.568878173828125, 1.63409423828125, 1.699310302734375, 1.7645263671875, 1.829742431640625, 1.89495849609375, 1.960174560546875, 2.025390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 8.0, 5.0, 8.0, 7.0, 9.0, 7.0, 11.0, 13.0, 18.0, 13.0, 15.0, 23.0, 32.0, 20.0, 35.0, 44.0, 49.0, 44.0, 47.0, 40.0, 47.0, 53.0, 39.0, 45.0, 46.0, 43.0, 45.0, 30.0, 42.0, 22.0, 25.0, 17.0, 19.0, 18.0, 10.0, 12.0, 7.0, 8.0, 7.0, 3.0, 4.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.88916015625, -0.86395263671875, -0.8387451171875, -0.81353759765625, -0.788330078125, -0.76312255859375, -0.7379150390625, -0.71270751953125, -0.6875, -0.66229248046875, -0.6370849609375, -0.61187744140625, -0.586669921875, -0.56146240234375, -0.5362548828125, -0.51104736328125, -0.48583984375, -0.46063232421875, -0.4354248046875, -0.41021728515625, -0.385009765625, -0.35980224609375, -0.3345947265625, -0.30938720703125, -0.2841796875, -0.25897216796875, -0.2337646484375, -0.20855712890625, -0.183349609375, -0.15814208984375, -0.1329345703125, -0.10772705078125, -0.08251953125, -0.05731201171875, -0.0321044921875, -0.00689697265625, 0.018310546875, 0.04351806640625, 0.0687255859375, 0.09393310546875, 0.119140625, 0.14434814453125, 0.1695556640625, 0.19476318359375, 0.219970703125, 0.24517822265625, 0.2703857421875, 0.29559326171875, 0.32080078125, 0.34600830078125, 0.3712158203125, 0.39642333984375, 0.421630859375, 0.44683837890625, 0.4720458984375, 0.49725341796875, 0.5224609375, 0.54766845703125, 0.5728759765625, 0.59808349609375, 0.623291015625, 0.64849853515625, 0.6737060546875, 0.69891357421875, 0.72412109375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 13.0, 23.0, 23.0, 18.0, 20.0, 31.0, 27.0, 28.0, 23.0, 28.0, 30.0, 45.0, 36.0, 44.0, 45.0, 43.0, 45.0, 44.0, 40.0, 45.0, 33.0, 49.0, 31.0, 27.0, 22.0, 29.0, 26.0, 16.0, 20.0, 17.0, 3.0, 11.0, 10.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.302363872528076, -3.2079219818115234, -3.1134800910949707, -3.019038200378418, -2.924596071243286, -2.8301541805267334, -2.7357122898101807, -2.641270399093628, -2.546828269958496, -2.4523863792419434, -2.3579444885253906, -2.263502597808838, -2.169060468673706, -2.0746185779571533, -1.9801766872406006, -1.8857347965240479, -1.7912929058074951, -1.6968510150909424, -1.6024090051651, -1.5079671144485474, -1.413525104522705, -1.3190832138061523, -1.2246413230895996, -1.1301994323730469, -1.0357574224472046, -0.9413154721260071, -0.8468735218048096, -0.7524316310882568, -0.6579896807670593, -0.5635477304458618, -0.4691058397293091, -0.3746638894081116, -0.28022170066833496, -0.18577976524829865, -0.09133782982826233, 0.003104090690612793, 0.0975460410118103, 0.1919879913330078, 0.28642988204956055, 0.38087183237075806, 0.47531378269195557, 0.5697557330131531, 0.6641976833343506, 0.7586395740509033, 0.8530815243721008, 0.9475234746932983, 1.041965365409851, 1.1364073753356934, 1.230849266052246, 1.3252911567687988, 1.4197331666946411, 1.5141750574111938, 1.6086170673370361, 1.7030589580535889, 1.7975008487701416, 1.8919427394866943, 1.9863847494125366, 2.080826759338379, 2.1752686500549316, 2.2697105407714844, 2.364152431488037, 2.45859432220459, 2.5530362129211426, 2.6474783420562744, 2.741920232772827]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 11.0, 11.0, 10.0, 13.0, 14.0, 18.0, 23.0, 24.0, 28.0, 28.0, 32.0, 32.0, 26.0, 51.0, 42.0, 41.0, 41.0, 37.0, 44.0, 47.0, 34.0, 29.0, 43.0, 32.0, 30.0, 39.0, 30.0, 30.0, 21.0, 14.0, 16.0, 17.0, 15.0, 18.0, 9.0, 2.0, 10.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.664181709289551, -2.571289300918579, -2.4783968925476074, -2.3855044841766357, -2.292612075805664, -2.1997196674346924, -2.1068272590637207, -2.01393461227417, -1.9210423231124878, -1.8281499147415161, -1.7352575063705444, -1.6423649787902832, -1.5494725704193115, -1.4565801620483398, -1.3636877536773682, -1.2707953453063965, -1.1779029369354248, -1.0850105285644531, -0.9921181201934814, -0.899225652217865, -0.8063332438468933, -0.7134408354759216, -0.6205483675003052, -0.5276559591293335, -0.4347635507583618, -0.34187114238739014, -0.24897870421409607, -0.156086266040802, -0.06319385766983032, 0.029698550701141357, 0.12259101867675781, 0.2154834270477295, 0.30837583541870117, 0.40126824378967285, 0.4941606819629669, 0.587053120136261, 0.6799455285072327, 0.7728379368782043, 0.8657304048538208, 0.9586228132247925, 1.0515152215957642, 1.1444076299667358, 1.2373000383377075, 1.3301925659179688, 1.4230849742889404, 1.515977382659912, 1.6088697910308838, 1.7017621994018555, 1.7946546077728271, 1.8875470161437988, 1.9804394245147705, 2.073331832885742, 2.166224241256714, 2.2591166496276855, 2.3520092964172363, 2.444901466369629, 2.5377941131591797, 2.6306865215301514, 2.723578929901123, 2.8164713382720947, 2.9093637466430664, 3.002256155014038, 3.0951485633850098, 3.1880412101745605, 3.280933380126953]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 13.0, 25.0, 31.0, 42.0, 62.0, 136.0, 215.0, 377.0, 618.0, 1086.0, 1722.0, 3036.0, 5018.0, 8500.0, 14598.0, 24543.0, 41199.0, 69894.0, 114159.0, 185315.0, 285838.0, 412390.0, 531399.0, 593869.0, 560884.0, 454996.0, 326476.0, 217120.0, 135424.0, 83259.0, 49723.0, 29332.0, 17410.0, 10443.0, 6141.0, 3608.0, 2082.0, 1373.0, 757.0, 475.0, 251.0, 164.0, 106.0, 69.0, 40.0, 22.0, 15.0, 6.0, 8.0, 5.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.6796875, -2.600067138671875, -2.52044677734375, -2.440826416015625, -2.3612060546875, -2.281585693359375, -2.20196533203125, -2.122344970703125, -2.042724609375, -1.963104248046875, -1.88348388671875, -1.803863525390625, -1.7242431640625, -1.644622802734375, -1.56500244140625, -1.485382080078125, -1.40576171875, -1.326141357421875, -1.24652099609375, -1.166900634765625, -1.0872802734375, -1.007659912109375, -0.92803955078125, -0.848419189453125, -0.768798828125, -0.689178466796875, -0.60955810546875, -0.529937744140625, -0.4503173828125, -0.370697021484375, -0.29107666015625, -0.211456298828125, -0.1318359375, -0.052215576171875, 0.02740478515625, 0.107025146484375, 0.1866455078125, 0.266265869140625, 0.34588623046875, 0.425506591796875, 0.505126953125, 0.584747314453125, 0.66436767578125, 0.743988037109375, 0.8236083984375, 0.903228759765625, 0.98284912109375, 1.062469482421875, 1.14208984375, 1.221710205078125, 1.30133056640625, 1.380950927734375, 1.4605712890625, 1.540191650390625, 1.61981201171875, 1.699432373046875, 1.779052734375, 1.858673095703125, 1.93829345703125, 2.017913818359375, 2.0975341796875, 2.177154541015625, 2.25677490234375, 2.336395263671875, 2.416015625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 12.0, 9.0, 17.0, 16.0, 13.0, 21.0, 25.0, 27.0, 27.0, 34.0, 38.0, 32.0, 41.0, 46.0, 37.0, 39.0, 48.0, 33.0, 46.0, 44.0, 40.0, 36.0, 38.0, 38.0, 35.0, 33.0, 23.0, 23.0, 17.0, 14.0, 12.0, 14.0, 8.0, 11.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.029296875, -1.95849609375, -1.8876953125, -1.81689453125, -1.74609375, -1.67529296875, -1.6044921875, -1.53369140625, -1.462890625, -1.39208984375, -1.3212890625, -1.25048828125, -1.1796875, -1.10888671875, -1.0380859375, -0.96728515625, -0.896484375, -0.82568359375, -0.7548828125, -0.68408203125, -0.61328125, -0.54248046875, -0.4716796875, -0.40087890625, -0.330078125, -0.25927734375, -0.1884765625, -0.11767578125, -0.046875, 0.02392578125, 0.0947265625, 0.16552734375, 0.236328125, 0.30712890625, 0.3779296875, 0.44873046875, 0.51953125, 0.59033203125, 0.6611328125, 0.73193359375, 0.802734375, 0.87353515625, 0.9443359375, 1.01513671875, 1.0859375, 1.15673828125, 1.2275390625, 1.29833984375, 1.369140625, 1.43994140625, 1.5107421875, 1.58154296875, 1.65234375, 1.72314453125, 1.7939453125, 1.86474609375, 1.935546875, 2.00634765625, 2.0771484375, 2.14794921875, 2.21875, 2.28955078125, 2.3603515625, 2.43115234375, 2.501953125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 33.0, 41.0, 71.0, 126.0, 200.0, 358.0, 611.0, 1054.0, 1768.0, 3103.0, 5271.0, 9154.0, 16049.0, 27037.0, 45753.0, 75324.0, 122266.0, 189562.0, 278947.0, 383194.0, 481017.0, 535683.0, 526642.0, 454338.0, 353029.0, 250271.0, 167287.0, 106250.0, 65386.0, 38969.0, 23369.0, 13525.0, 7743.0, 4542.0, 2602.0, 1592.0, 848.0, 530.0, 286.0, 184.0, 106.0, 70.0, 39.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.587890625, -2.511444091796875, -2.43499755859375, -2.358551025390625, -2.2821044921875, -2.205657958984375, -2.12921142578125, -2.052764892578125, -1.976318359375, -1.899871826171875, -1.82342529296875, -1.746978759765625, -1.6705322265625, -1.594085693359375, -1.51763916015625, -1.441192626953125, -1.36474609375, -1.288299560546875, -1.21185302734375, -1.135406494140625, -1.0589599609375, -0.982513427734375, -0.90606689453125, -0.829620361328125, -0.753173828125, -0.676727294921875, -0.60028076171875, -0.523834228515625, -0.4473876953125, -0.370941162109375, -0.29449462890625, -0.218048095703125, -0.1416015625, -0.065155029296875, 0.01129150390625, 0.087738037109375, 0.1641845703125, 0.240631103515625, 0.31707763671875, 0.393524169921875, 0.469970703125, 0.546417236328125, 0.62286376953125, 0.699310302734375, 0.7757568359375, 0.852203369140625, 0.92864990234375, 1.005096435546875, 1.08154296875, 1.157989501953125, 1.23443603515625, 1.310882568359375, 1.3873291015625, 1.463775634765625, 1.54022216796875, 1.616668701171875, 1.693115234375, 1.769561767578125, 1.84600830078125, 1.922454833984375, 1.9989013671875, 2.075347900390625, 2.15179443359375, 2.228240966796875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 12.0, 7.0, 14.0, 20.0, 31.0, 41.0, 40.0, 61.0, 53.0, 82.0, 100.0, 112.0, 117.0, 142.0, 137.0, 182.0, 187.0, 213.0, 232.0, 185.0, 211.0, 206.0, 201.0, 193.0, 172.0, 167.0, 151.0, 115.0, 114.0, 108.0, 93.0, 78.0, 58.0, 52.0, 44.0, 28.0, 33.0, 21.0, 15.0, 16.0, 3.0, 6.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0595703125, -1.0271148681640625, -0.994659423828125, -0.9622039794921875, -0.92974853515625, -0.8972930908203125, -0.864837646484375, -0.8323822021484375, -0.7999267578125, -0.7674713134765625, -0.735015869140625, -0.7025604248046875, -0.67010498046875, -0.6376495361328125, -0.605194091796875, -0.5727386474609375, -0.540283203125, -0.5078277587890625, -0.475372314453125, -0.4429168701171875, -0.41046142578125, -0.3780059814453125, -0.345550537109375, -0.3130950927734375, -0.2806396484375, -0.2481842041015625, -0.215728759765625, -0.1832733154296875, -0.15081787109375, -0.1183624267578125, -0.085906982421875, -0.0534515380859375, -0.02099609375, 0.0114593505859375, 0.043914794921875, 0.0763702392578125, 0.10882568359375, 0.1412811279296875, 0.173736572265625, 0.2061920166015625, 0.2386474609375, 0.2711029052734375, 0.303558349609375, 0.3360137939453125, 0.36846923828125, 0.4009246826171875, 0.433380126953125, 0.4658355712890625, 0.498291015625, 0.5307464599609375, 0.563201904296875, 0.5956573486328125, 0.62811279296875, 0.6605682373046875, 0.693023681640625, 0.7254791259765625, 0.7579345703125, 0.7903900146484375, 0.822845458984375, 0.8553009033203125, 0.88775634765625, 0.9202117919921875, 0.952667236328125, 0.9851226806640625, 1.017578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 6.0, 10.0, 7.0, 16.0, 17.0, 23.0, 23.0, 32.0, 34.0, 28.0, 41.0, 36.0, 40.0, 53.0, 62.0, 46.0, 46.0, 54.0, 47.0, 53.0, 45.0, 38.0, 36.0, 33.0, 31.0, 23.0, 21.0, 12.0, 14.0, 17.0, 14.0, 5.0, 8.0, 9.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3508079051971436, -3.2532224655151367, -3.155637264251709, -3.0580520629882812, -2.9604666233062744, -2.8628811836242676, -2.76529598236084, -2.667710781097412, -2.5701253414154053, -2.4725399017333984, -2.3749547004699707, -2.277369499206543, -2.179784059524536, -2.0821986198425293, -1.9846134185791016, -1.8870280981063843, -1.789442777633667, -1.6918574571609497, -1.5942721366882324, -1.4966868162155151, -1.3991014957427979, -1.3015161752700806, -1.2039308547973633, -1.106345534324646, -1.0087602138519287, -0.9111748933792114, -0.8135895729064941, -0.7160042524337769, -0.6184189319610596, -0.5208336114883423, -0.423248291015625, -0.3256629705429077, -0.22807741165161133, -0.13049209117889404, -0.03290677070617676, 0.06467854976654053, 0.1622638702392578, 0.2598491907119751, 0.3574345111846924, 0.45501983165740967, 0.552605152130127, 0.6501904726028442, 0.7477757930755615, 0.8453611135482788, 0.9429464340209961, 1.0405317544937134, 1.1381170749664307, 1.235702395439148, 1.3332877159118652, 1.4308730363845825, 1.5284583568572998, 1.626043677330017, 1.7236289978027344, 1.8212143182754517, 1.918799638748169, 2.016385078430176, 2.1139702796936035, 2.2115554809570312, 2.309140920639038, 2.406726360321045, 2.5043115615844727, 2.6018967628479004, 2.6994822025299072, 2.797067642211914, 2.894652843475342]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 2.0, 3.0, 6.0, 16.0, 14.0, 8.0, 16.0, 30.0, 23.0, 27.0, 27.0, 28.0, 34.0, 26.0, 32.0, 49.0, 49.0, 48.0, 42.0, 41.0, 34.0, 30.0, 39.0, 29.0, 39.0, 40.0, 33.0, 30.0, 30.0, 26.0, 18.0, 25.0, 19.0, 17.0, 12.0, 8.0, 6.0, 12.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.750286102294922, -2.670217990875244, -2.5901501178741455, -2.5100820064544678, -2.430014133453369, -2.3499460220336914, -2.2698781490325928, -2.189810037612915, -2.1097421646118164, -2.0296740531921387, -1.94960618019104, -1.8695381879806519, -1.7894701957702637, -1.7094022035598755, -1.6293342113494873, -1.5492660999298096, -1.4691981077194214, -1.3891301155090332, -1.309062123298645, -1.2289941310882568, -1.1489261388778687, -1.0688581466674805, -0.9887900948524475, -0.9087221026420593, -0.8286541104316711, -0.748586118221283, -0.6685181260108948, -0.5884500741958618, -0.5083820819854736, -0.42831411957740784, -0.34824609756469727, -0.2681781053543091, -0.1881101131439209, -0.10804211348295212, -0.027974113821983337, 0.05209389328956604, 0.13216188549995422, 0.2122298777103424, 0.292297899723053, 0.37236589193344116, 0.45243388414382935, 0.5325018763542175, 0.6125698685646057, 0.6926379203796387, 0.7727059125900269, 0.852773904800415, 0.9328418970108032, 1.0129098892211914, 1.0929778814315796, 1.1730458736419678, 1.253113865852356, 1.3331818580627441, 1.4132498502731323, 1.4933178424835205, 1.5733859539031982, 1.6534538269042969, 1.7335219383239746, 1.8135899305343628, 1.893657922744751, 1.9737259149551392, 2.0537939071655273, 2.133862018585205, 2.2139298915863037, 2.2939980030059814, 2.37406587600708]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 17.0, 27.0, 25.0, 36.0, 45.0, 76.0, 119.0, 178.0, 251.0, 441.0, 734.0, 1246.0, 2374.0, 4394.0, 8666.0, 18709.0, 39206.0, 83009.0, 169491.0, 265414.0, 223873.0, 120114.0, 57149.0, 26871.0, 12506.0, 6161.0, 3138.0, 1664.0, 974.0, 584.0, 362.0, 238.0, 150.0, 97.0, 69.0, 48.0, 28.0, 13.0, 7.0, 12.0, 10.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.46484375, -2.38720703125, -2.3095703125, -2.23193359375, -2.154296875, -2.07666015625, -1.9990234375, -1.92138671875, -1.84375, -1.76611328125, -1.6884765625, -1.61083984375, -1.533203125, -1.45556640625, -1.3779296875, -1.30029296875, -1.22265625, -1.14501953125, -1.0673828125, -0.98974609375, -0.912109375, -0.83447265625, -0.7568359375, -0.67919921875, -0.6015625, -0.52392578125, -0.4462890625, -0.36865234375, -0.291015625, -0.21337890625, -0.1357421875, -0.05810546875, 0.01953125, 0.09716796875, 0.1748046875, 0.25244140625, 0.330078125, 0.40771484375, 0.4853515625, 0.56298828125, 0.640625, 0.71826171875, 0.7958984375, 0.87353515625, 0.951171875, 1.02880859375, 1.1064453125, 1.18408203125, 1.26171875, 1.33935546875, 1.4169921875, 1.49462890625, 1.572265625, 1.64990234375, 1.7275390625, 1.80517578125, 1.8828125, 1.96044921875, 2.0380859375, 2.11572265625, 2.193359375, 2.27099609375, 2.3486328125, 2.42626953125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 6.0, 5.0, 11.0, 6.0, 12.0, 16.0, 10.0, 20.0, 22.0, 24.0, 18.0, 18.0, 39.0, 33.0, 39.0, 35.0, 38.0, 45.0, 44.0, 39.0, 40.0, 39.0, 38.0, 31.0, 32.0, 40.0, 35.0, 28.0, 23.0, 30.0, 33.0, 31.0, 19.0, 12.0, 15.0, 13.0, 10.0, 12.0, 11.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71484375, -2.633209228515625, -2.55157470703125, -2.469940185546875, -2.3883056640625, -2.306671142578125, -2.22503662109375, -2.143402099609375, -2.061767578125, -1.980133056640625, -1.89849853515625, -1.816864013671875, -1.7352294921875, -1.653594970703125, -1.57196044921875, -1.490325927734375, -1.40869140625, -1.327056884765625, -1.24542236328125, -1.163787841796875, -1.0821533203125, -1.000518798828125, -0.91888427734375, -0.837249755859375, -0.755615234375, -0.673980712890625, -0.59234619140625, -0.510711669921875, -0.4290771484375, -0.347442626953125, -0.26580810546875, -0.184173583984375, -0.1025390625, -0.020904541015625, 0.06072998046875, 0.142364501953125, 0.2239990234375, 0.305633544921875, 0.38726806640625, 0.468902587890625, 0.550537109375, 0.632171630859375, 0.71380615234375, 0.795440673828125, 0.8770751953125, 0.958709716796875, 1.04034423828125, 1.121978759765625, 1.20361328125, 1.285247802734375, 1.36688232421875, 1.448516845703125, 1.5301513671875, 1.611785888671875, 1.69342041015625, 1.775054931640625, 1.856689453125, 1.938323974609375, 2.01995849609375, 2.101593017578125, 2.1832275390625, 2.264862060546875, 2.34649658203125, 2.428131103515625, 2.509765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 11.0, 11.0, 22.0, 25.0, 37.0, 51.0, 73.0, 114.0, 174.0, 279.0, 396.0, 624.0, 976.0, 1635.0, 2886.0, 5246.0, 9743.0, 19743.0, 41563.0, 89975.0, 191591.0, 294144.0, 203112.0, 96953.0, 44387.0, 21044.0, 10648.0, 5398.0, 2984.0, 1767.0, 1083.0, 633.0, 440.0, 234.0, 206.0, 118.0, 64.0, 58.0, 33.0, 26.0, 17.0, 11.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.669525146484375, -1.60662841796875, -1.543731689453125, -1.4808349609375, -1.417938232421875, -1.35504150390625, -1.292144775390625, -1.229248046875, -1.166351318359375, -1.10345458984375, -1.040557861328125, -0.9776611328125, -0.914764404296875, -0.85186767578125, -0.788970947265625, -0.72607421875, -0.663177490234375, -0.60028076171875, -0.537384033203125, -0.4744873046875, -0.411590576171875, -0.34869384765625, -0.285797119140625, -0.222900390625, -0.160003662109375, -0.09710693359375, -0.034210205078125, 0.0286865234375, 0.091583251953125, 0.15447998046875, 0.217376708984375, 0.2802734375, 0.343170166015625, 0.40606689453125, 0.468963623046875, 0.5318603515625, 0.594757080078125, 0.65765380859375, 0.720550537109375, 0.783447265625, 0.846343994140625, 0.90924072265625, 0.972137451171875, 1.0350341796875, 1.097930908203125, 1.16082763671875, 1.223724365234375, 1.28662109375, 1.349517822265625, 1.41241455078125, 1.475311279296875, 1.5382080078125, 1.601104736328125, 1.66400146484375, 1.726898193359375, 1.789794921875, 1.852691650390625, 1.91558837890625, 1.978485107421875, 2.0413818359375, 2.104278564453125, 2.16717529296875, 2.230072021484375, 2.29296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 3.0, 6.0, 11.0, 9.0, 17.0, 15.0, 16.0, 20.0, 30.0, 27.0, 36.0, 38.0, 31.0, 44.0, 39.0, 42.0, 46.0, 48.0, 46.0, 35.0, 44.0, 41.0, 36.0, 32.0, 30.0, 41.0, 27.0, 29.0, 22.0, 22.0, 16.0, 19.0, 11.0, 14.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.61602783203125, -1.5562744140625, -1.49652099609375, -1.436767578125, -1.37701416015625, -1.3172607421875, -1.25750732421875, -1.19775390625, -1.13800048828125, -1.0782470703125, -1.01849365234375, -0.958740234375, -0.89898681640625, -0.8392333984375, -0.77947998046875, -0.7197265625, -0.65997314453125, -0.6002197265625, -0.54046630859375, -0.480712890625, -0.42095947265625, -0.3612060546875, -0.30145263671875, -0.24169921875, -0.18194580078125, -0.1221923828125, -0.06243896484375, -0.002685546875, 0.05706787109375, 0.1168212890625, 0.17657470703125, 0.236328125, 0.29608154296875, 0.3558349609375, 0.41558837890625, 0.475341796875, 0.53509521484375, 0.5948486328125, 0.65460205078125, 0.71435546875, 0.77410888671875, 0.8338623046875, 0.89361572265625, 0.953369140625, 1.01312255859375, 1.0728759765625, 1.13262939453125, 1.1923828125, 1.25213623046875, 1.3118896484375, 1.37164306640625, 1.431396484375, 1.49114990234375, 1.5509033203125, 1.61065673828125, 1.67041015625, 1.73016357421875, 1.7899169921875, 1.84967041015625, 1.909423828125, 1.96917724609375, 2.0289306640625, 2.08868408203125, 2.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 14.0, 16.0, 23.0, 17.0, 20.0, 37.0, 44.0, 53.0, 71.0, 87.0, 132.0, 177.0, 209.0, 313.0, 436.0, 599.0, 1003.0, 1487.0, 2583.0, 4692.0, 10438.0, 31674.0, 187744.0, 665094.0, 101128.0, 22067.0, 8155.0, 3914.0, 2080.0, 1276.0, 855.0, 547.0, 417.0, 290.0, 186.0, 156.0, 113.0, 98.0, 61.0, 51.0, 48.0, 38.0, 19.0, 16.0, 16.0, 10.0, 11.0, 10.0, 8.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.28515625, -2.2122802734375, -2.139404296875, -2.0665283203125, -1.99365234375, -1.9207763671875, -1.847900390625, -1.7750244140625, -1.7021484375, -1.6292724609375, -1.556396484375, -1.4835205078125, -1.41064453125, -1.3377685546875, -1.264892578125, -1.1920166015625, -1.119140625, -1.0462646484375, -0.973388671875, -0.9005126953125, -0.82763671875, -0.7547607421875, -0.681884765625, -0.6090087890625, -0.5361328125, -0.4632568359375, -0.390380859375, -0.3175048828125, -0.24462890625, -0.1717529296875, -0.098876953125, -0.0260009765625, 0.046875, 0.1197509765625, 0.192626953125, 0.2655029296875, 0.33837890625, 0.4112548828125, 0.484130859375, 0.5570068359375, 0.6298828125, 0.7027587890625, 0.775634765625, 0.8485107421875, 0.92138671875, 0.9942626953125, 1.067138671875, 1.1400146484375, 1.212890625, 1.2857666015625, 1.358642578125, 1.4315185546875, 1.50439453125, 1.5772705078125, 1.650146484375, 1.7230224609375, 1.7958984375, 1.8687744140625, 1.941650390625, 2.0145263671875, 2.08740234375, 2.1602783203125, 2.233154296875, 2.3060302734375, 2.37890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 14.0, 16.0, 26.0, 52.0, 55.0, 113.0, 118.0, 114.0, 126.0, 92.0, 86.0, 44.0, 35.0, 16.0, 10.0, 12.0, 11.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00014328956604003906, -0.00013889558613300323, -0.0001345016062259674, -0.00013010762631893158, -0.00012571364641189575, -0.00012131966650485992, -0.0001169256865978241, -0.00011253170669078827, -0.00010813772678375244, -0.00010374374687671661, -9.934976696968079e-05, -9.495578706264496e-05, -9.056180715560913e-05, -8.61678272485733e-05, -8.177384734153748e-05, -7.737986743450165e-05, -7.298588752746582e-05, -6.859190762042999e-05, -6.419792771339417e-05, -5.980394780635834e-05, -5.540996789932251e-05, -5.101598799228668e-05, -4.6622008085250854e-05, -4.222802817821503e-05, -3.78340482711792e-05, -3.344006836414337e-05, -2.9046088457107544e-05, -2.4652108550071716e-05, -2.025812864303589e-05, -1.586414873600006e-05, -1.1470168828964233e-05, -7.076188921928406e-06, -2.682209014892578e-06, 1.7117708921432495e-06, 6.105750799179077e-06, 1.0499730706214905e-05, 1.4893710613250732e-05, 1.928769052028656e-05, 2.3681670427322388e-05, 2.8075650334358215e-05, 3.246963024139404e-05, 3.686361014842987e-05, 4.12575900554657e-05, 4.5651569962501526e-05, 5.0045549869537354e-05, 5.443952977657318e-05, 5.883350968360901e-05, 6.322748959064484e-05, 6.762146949768066e-05, 7.201544940471649e-05, 7.640942931175232e-05, 8.080340921878815e-05, 8.519738912582397e-05, 8.95913690328598e-05, 9.398534893989563e-05, 9.837932884693146e-05, 0.00010277330875396729, 0.00010716728866100311, 0.00011156126856803894, 0.00011595524847507477, 0.0001203492283821106, 0.00012474320828914642, 0.00012913718819618225, 0.00013353116810321808, 0.0001379251480102539]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 9.0, 13.0, 16.0, 17.0, 37.0, 36.0, 42.0, 64.0, 103.0, 157.0, 179.0, 245.0, 329.0, 498.0, 680.0, 924.0, 1231.0, 1853.0, 2985.0, 4684.0, 8207.0, 17532.0, 44549.0, 130059.0, 336648.0, 308034.0, 113843.0, 39050.0, 15756.0, 7590.0, 4355.0, 2657.0, 1758.0, 1201.0, 914.0, 620.0, 461.0, 338.0, 223.0, 175.0, 137.0, 94.0, 72.0, 66.0, 31.0, 20.0, 17.0, 18.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.455291748046875, -1.40667724609375, -1.358062744140625, -1.3094482421875, -1.260833740234375, -1.21221923828125, -1.163604736328125, -1.114990234375, -1.066375732421875, -1.01776123046875, -0.969146728515625, -0.9205322265625, -0.871917724609375, -0.82330322265625, -0.774688720703125, -0.72607421875, -0.677459716796875, -0.62884521484375, -0.580230712890625, -0.5316162109375, -0.483001708984375, -0.43438720703125, -0.385772705078125, -0.337158203125, -0.288543701171875, -0.23992919921875, -0.191314697265625, -0.1427001953125, -0.094085693359375, -0.04547119140625, 0.003143310546875, 0.0517578125, 0.100372314453125, 0.14898681640625, 0.197601318359375, 0.2462158203125, 0.294830322265625, 0.34344482421875, 0.392059326171875, 0.440673828125, 0.489288330078125, 0.53790283203125, 0.586517333984375, 0.6351318359375, 0.683746337890625, 0.73236083984375, 0.780975341796875, 0.82958984375, 0.878204345703125, 0.92681884765625, 0.975433349609375, 1.0240478515625, 1.072662353515625, 1.12127685546875, 1.169891357421875, 1.218505859375, 1.267120361328125, 1.31573486328125, 1.364349365234375, 1.4129638671875, 1.461578369140625, 1.51019287109375, 1.558807373046875, 1.607421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 5.0, 13.0, 12.0, 10.0, 28.0, 20.0, 31.0, 44.0, 63.0, 68.0, 76.0, 105.0, 103.0, 76.0, 69.0, 56.0, 45.0, 39.0, 21.0, 18.0, 13.0, 12.0, 11.0, 7.0, 2.0, 2.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.365966796875, -0.3542289733886719, -0.34249114990234375, -0.3307533264160156, -0.3190155029296875, -0.3072776794433594, -0.29553985595703125, -0.2838020324707031, -0.272064208984375, -0.2603263854980469, -0.24858856201171875, -0.23685073852539062, -0.2251129150390625, -0.21337509155273438, -0.20163726806640625, -0.18989944458007812, -0.17816162109375, -0.16642379760742188, -0.15468597412109375, -0.14294815063476562, -0.1312103271484375, -0.11947250366210938, -0.10773468017578125, -0.09599685668945312, -0.084259033203125, -0.07252120971679688, -0.06078338623046875, -0.049045562744140625, -0.0373077392578125, -0.025569915771484375, -0.01383209228515625, -0.002094268798828125, 0.0096435546875, 0.021381378173828125, 0.03311920166015625, 0.044857025146484375, 0.0565948486328125, 0.06833267211914062, 0.08007049560546875, 0.09180831909179688, 0.103546142578125, 0.11528396606445312, 0.12702178955078125, 0.13875961303710938, 0.1504974365234375, 0.16223526000976562, 0.17397308349609375, 0.18571090698242188, 0.19744873046875, 0.20918655395507812, 0.22092437744140625, 0.23266220092773438, 0.2444000244140625, 0.2561378479003906, 0.26787567138671875, 0.2796134948730469, 0.291351318359375, 0.3030891418457031, 0.31482696533203125, 0.3265647888183594, 0.3383026123046875, 0.3500404357910156, 0.36177825927734375, 0.3735160827636719, 0.38525390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 10.0, 18.0, 20.0, 12.0, 20.0, 32.0, 27.0, 27.0, 31.0, 30.0, 33.0, 56.0, 55.0, 62.0, 51.0, 46.0, 54.0, 43.0, 46.0, 46.0, 42.0, 39.0, 26.0, 31.0, 34.0, 20.0, 9.0, 12.0, 13.0, 16.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265214204788208, -3.1674351692199707, -3.0696561336517334, -2.971877098083496, -2.874098062515259, -2.7763190269470215, -2.678539991378784, -2.580760955810547, -2.4829819202423096, -2.3852028846740723, -2.287423849105835, -2.1896448135375977, -2.0918657779693604, -1.994086742401123, -1.8963077068328857, -1.7985286712646484, -1.7007497549057007, -1.6029707193374634, -1.505191683769226, -1.4074126482009888, -1.3096336126327515, -1.2118545770645142, -1.1140756607055664, -1.016296625137329, -0.918517529964447, -0.8207384943962097, -0.7229594588279724, -0.6251804828643799, -0.5274014472961426, -0.4296223819255829, -0.33184337615966797, -0.23406434059143066, -0.13628530502319336, -0.03850627690553665, 0.059272751212120056, 0.15705177187919617, 0.25483080744743347, 0.3526098430156708, 0.4503888487815857, 0.548167884349823, 0.6459469199180603, 0.7437259554862976, 0.8415049910545349, 0.9392839670181274, 1.0370630025863647, 1.134842038154602, 1.2326210737228394, 1.3304001092910767, 1.428179144859314, 1.5259581804275513, 1.6237372159957886, 1.7215162515640259, 1.8192952871322632, 1.9170743227005005, 2.0148532390594482, 2.1126322746276855, 2.210411310195923, 2.30819034576416, 2.4059693813323975, 2.5037484169006348, 2.601527452468872, 2.6993064880371094, 2.7970855236053467, 2.894864559173584, 2.9926435947418213]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 1.0, 3.0, 7.0, 13.0, 12.0, 11.0, 18.0, 20.0, 30.0, 31.0, 23.0, 27.0, 25.0, 28.0, 39.0, 48.0, 48.0, 38.0, 34.0, 45.0, 48.0, 28.0, 33.0, 31.0, 35.0, 38.0, 35.0, 30.0, 23.0, 36.0, 20.0, 23.0, 19.0, 19.0, 16.0, 10.0, 4.0, 12.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.642449140548706, -2.5643460750579834, -2.4862427711486816, -2.408139705657959, -2.3300366401672363, -2.2519335746765137, -2.173830270767212, -2.0957272052764893, -2.0176239013671875, -1.9395207166671753, -1.8614176511764526, -1.7833144664764404, -1.7052114009857178, -1.6271082162857056, -1.5490050315856934, -1.4709019660949707, -1.392798900604248, -1.3146957159042358, -1.2365926504135132, -1.158489465713501, -1.0803864002227783, -1.0022832155227661, -0.9241800308227539, -0.8460769057273865, -0.767973780632019, -0.6898706555366516, -0.6117675304412842, -0.533664345741272, -0.45556122064590454, -0.3774580955505371, -0.2993549406528473, -0.22125178575515747, -0.14314889907836914, -0.06504575908184052, 0.01305738091468811, 0.09116052091121674, 0.16926366090774536, 0.2473667860031128, 0.3254699409008026, 0.40357309579849243, 0.48167622089385986, 0.5597793459892273, 0.6378824710845947, 0.7159856557846069, 0.7940887808799744, 0.8721919059753418, 0.950295090675354, 1.0283982753753662, 1.1065013408660889, 1.184604525566101, 1.2627075910568237, 1.340810775756836, 1.4189138412475586, 1.4970170259475708, 1.575120210647583, 1.6532232761383057, 1.7313264608383179, 1.80942964553833, 1.8875327110290527, 1.965635895729065, 2.043739080429077, 2.1218421459198, 2.1999452114105225, 2.278048515319824, 2.356151580810547]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 13.0, 17.0, 37.0, 36.0, 61.0, 97.0, 158.0, 210.0, 363.0, 574.0, 894.0, 1542.0, 2436.0, 3994.0, 6380.0, 9952.0, 15611.0, 23825.0, 35609.0, 51795.0, 70984.0, 91955.0, 110038.0, 119786.0, 117408.0, 104729.0, 84257.0, 63918.0, 45160.0, 30615.0, 20240.0, 13445.0, 8208.0, 5314.0, 3329.0, 2143.0, 1316.0, 769.0, 509.0, 328.0, 169.0, 115.0, 80.0, 53.0, 33.0, 24.0, 12.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.826171875, -2.74005126953125, -2.6539306640625, -2.56781005859375, -2.481689453125, -2.39556884765625, -2.3094482421875, -2.22332763671875, -2.13720703125, -2.05108642578125, -1.9649658203125, -1.87884521484375, -1.792724609375, -1.70660400390625, -1.6204833984375, -1.53436279296875, -1.4482421875, -1.36212158203125, -1.2760009765625, -1.18988037109375, -1.103759765625, -1.01763916015625, -0.9315185546875, -0.84539794921875, -0.75927734375, -0.67315673828125, -0.5870361328125, -0.50091552734375, -0.414794921875, -0.32867431640625, -0.2425537109375, -0.15643310546875, -0.0703125, 0.01580810546875, 0.1019287109375, 0.18804931640625, 0.274169921875, 0.36029052734375, 0.4464111328125, 0.53253173828125, 0.61865234375, 0.70477294921875, 0.7908935546875, 0.87701416015625, 0.963134765625, 1.04925537109375, 1.1353759765625, 1.22149658203125, 1.3076171875, 1.39373779296875, 1.4798583984375, 1.56597900390625, 1.652099609375, 1.73822021484375, 1.8243408203125, 1.91046142578125, 1.99658203125, 2.08270263671875, 2.1688232421875, 2.25494384765625, 2.341064453125, 2.42718505859375, 2.5133056640625, 2.59942626953125, 2.685546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 10.0, 4.0, 16.0, 14.0, 17.0, 22.0, 17.0, 27.0, 27.0, 36.0, 32.0, 32.0, 35.0, 45.0, 32.0, 44.0, 47.0, 34.0, 37.0, 38.0, 48.0, 36.0, 38.0, 23.0, 34.0, 35.0, 21.0, 23.0, 29.0, 19.0, 24.0, 22.0, 14.0, 10.0, 10.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.6484375, -2.57012939453125, -2.4918212890625, -2.41351318359375, -2.335205078125, -2.25689697265625, -2.1785888671875, -2.10028076171875, -2.02197265625, -1.94366455078125, -1.8653564453125, -1.78704833984375, -1.708740234375, -1.63043212890625, -1.5521240234375, -1.47381591796875, -1.3955078125, -1.31719970703125, -1.2388916015625, -1.16058349609375, -1.082275390625, -1.00396728515625, -0.9256591796875, -0.84735107421875, -0.76904296875, -0.69073486328125, -0.6124267578125, -0.53411865234375, -0.455810546875, -0.37750244140625, -0.2991943359375, -0.22088623046875, -0.142578125, -0.06427001953125, 0.0140380859375, 0.09234619140625, 0.170654296875, 0.24896240234375, 0.3272705078125, 0.40557861328125, 0.48388671875, 0.56219482421875, 0.6405029296875, 0.71881103515625, 0.797119140625, 0.87542724609375, 0.9537353515625, 1.03204345703125, 1.1103515625, 1.18865966796875, 1.2669677734375, 1.34527587890625, 1.423583984375, 1.50189208984375, 1.5802001953125, 1.65850830078125, 1.73681640625, 1.81512451171875, 1.8934326171875, 1.97174072265625, 2.050048828125, 2.12835693359375, 2.2066650390625, 2.28497314453125, 2.36328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 13.0, 13.0, 10.0, 16.0, 33.0, 48.0, 86.0, 86.0, 128.0, 190.0, 325.0, 462.0, 739.0, 1079.0, 1589.0, 2474.0, 3640.0, 5332.0, 8377.0, 12243.0, 18133.0, 26326.0, 37081.0, 51792.0, 67703.0, 84323.0, 98260.0, 107617.0, 107504.0, 98450.0, 83229.0, 66027.0, 49940.0, 36218.0, 25937.0, 17412.0, 11973.0, 8121.0, 5262.0, 3438.0, 2274.0, 1558.0, 1041.0, 623.0, 485.0, 303.0, 195.0, 132.0, 107.0, 71.0, 59.0, 28.0, 10.0, 20.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0], "bins": [-2.330078125, -2.257171630859375, -2.18426513671875, -2.111358642578125, -2.0384521484375, -1.965545654296875, -1.89263916015625, -1.819732666015625, -1.746826171875, -1.673919677734375, -1.60101318359375, -1.528106689453125, -1.4552001953125, -1.382293701171875, -1.30938720703125, -1.236480712890625, -1.16357421875, -1.090667724609375, -1.01776123046875, -0.944854736328125, -0.8719482421875, -0.799041748046875, -0.72613525390625, -0.653228759765625, -0.580322265625, -0.507415771484375, -0.43450927734375, -0.361602783203125, -0.2886962890625, -0.215789794921875, -0.14288330078125, -0.069976806640625, 0.0029296875, 0.075836181640625, 0.14874267578125, 0.221649169921875, 0.2945556640625, 0.367462158203125, 0.44036865234375, 0.513275146484375, 0.586181640625, 0.659088134765625, 0.73199462890625, 0.804901123046875, 0.8778076171875, 0.950714111328125, 1.02362060546875, 1.096527099609375, 1.16943359375, 1.242340087890625, 1.31524658203125, 1.388153076171875, 1.4610595703125, 1.533966064453125, 1.60687255859375, 1.679779052734375, 1.752685546875, 1.825592041015625, 1.89849853515625, 1.971405029296875, 2.0443115234375, 2.117218017578125, 2.19012451171875, 2.263031005859375, 2.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 5.0, 5.0, 9.0, 9.0, 7.0, 16.0, 14.0, 11.0, 17.0, 21.0, 25.0, 20.0, 33.0, 26.0, 38.0, 35.0, 40.0, 32.0, 32.0, 40.0, 45.0, 37.0, 50.0, 38.0, 28.0, 30.0, 33.0, 30.0, 29.0, 17.0, 20.0, 22.0, 18.0, 20.0, 20.0, 26.0, 12.0, 13.0, 14.0, 13.0, 11.0, 5.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.43359375, -1.387115478515625, -1.34063720703125, -1.294158935546875, -1.2476806640625, -1.201202392578125, -1.15472412109375, -1.108245849609375, -1.061767578125, -1.015289306640625, -0.96881103515625, -0.922332763671875, -0.8758544921875, -0.829376220703125, -0.78289794921875, -0.736419677734375, -0.68994140625, -0.643463134765625, -0.59698486328125, -0.550506591796875, -0.5040283203125, -0.457550048828125, -0.41107177734375, -0.364593505859375, -0.318115234375, -0.271636962890625, -0.22515869140625, -0.178680419921875, -0.1322021484375, -0.085723876953125, -0.03924560546875, 0.007232666015625, 0.0537109375, 0.100189208984375, 0.14666748046875, 0.193145751953125, 0.2396240234375, 0.286102294921875, 0.33258056640625, 0.379058837890625, 0.425537109375, 0.472015380859375, 0.51849365234375, 0.564971923828125, 0.6114501953125, 0.657928466796875, 0.70440673828125, 0.750885009765625, 0.79736328125, 0.843841552734375, 0.89031982421875, 0.936798095703125, 0.9832763671875, 1.029754638671875, 1.07623291015625, 1.122711181640625, 1.169189453125, 1.215667724609375, 1.26214599609375, 1.308624267578125, 1.3551025390625, 1.401580810546875, 1.44805908203125, 1.494537353515625, 1.541015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 20.0, 28.0, 47.0, 56.0, 70.0, 116.0, 175.0, 244.0, 368.0, 528.0, 736.0, 1116.0, 1884.0, 3040.0, 5412.0, 9753.0, 19544.0, 43548.0, 100710.0, 209204.0, 280337.0, 198141.0, 92559.0, 40248.0, 18322.0, 9207.0, 5009.0, 2899.0, 1810.0, 1038.0, 726.0, 498.0, 348.0, 254.0, 167.0, 114.0, 81.0, 52.0, 31.0, 21.0, 22.0, 13.0, 16.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.954742431640625, -2.85089111328125, -2.747039794921875, -2.6431884765625, -2.539337158203125, -2.43548583984375, -2.331634521484375, -2.227783203125, -2.123931884765625, -2.02008056640625, -1.916229248046875, -1.8123779296875, -1.708526611328125, -1.60467529296875, -1.500823974609375, -1.39697265625, -1.293121337890625, -1.18927001953125, -1.085418701171875, -0.9815673828125, -0.877716064453125, -0.77386474609375, -0.670013427734375, -0.566162109375, -0.462310791015625, -0.35845947265625, -0.254608154296875, -0.1507568359375, -0.046905517578125, 0.05694580078125, 0.160797119140625, 0.2646484375, 0.368499755859375, 0.47235107421875, 0.576202392578125, 0.6800537109375, 0.783905029296875, 0.88775634765625, 0.991607666015625, 1.095458984375, 1.199310302734375, 1.30316162109375, 1.407012939453125, 1.5108642578125, 1.614715576171875, 1.71856689453125, 1.822418212890625, 1.92626953125, 2.030120849609375, 2.13397216796875, 2.237823486328125, 2.3416748046875, 2.445526123046875, 2.54937744140625, 2.653228759765625, 2.757080078125, 2.860931396484375, 2.96478271484375, 3.068634033203125, 3.1724853515625, 3.276336669921875, 3.38018798828125, 3.484039306640625, 3.587890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 6.0, 14.0, 8.0, 20.0, 38.0, 64.0, 75.0, 109.0, 111.0, 107.0, 124.0, 91.0, 65.0, 52.0, 33.0, 23.0, 20.0, 4.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004410743713378906, -0.0004278421401977539, -0.0004146099090576172, -0.00040137767791748047, -0.00038814544677734375, -0.00037491321563720703, -0.0003616809844970703, -0.0003484487533569336, -0.0003352165222167969, -0.00032198429107666016, -0.00030875205993652344, -0.0002955198287963867, -0.00028228759765625, -0.0002690553665161133, -0.00025582313537597656, -0.00024259090423583984, -0.00022935867309570312, -0.0002161264419555664, -0.0002028942108154297, -0.00018966197967529297, -0.00017642974853515625, -0.00016319751739501953, -0.0001499652862548828, -0.0001367330551147461, -0.00012350082397460938, -0.00011026859283447266, -9.703636169433594e-05, -8.380413055419922e-05, -7.05718994140625e-05, -5.733966827392578e-05, -4.410743713378906e-05, -3.0875205993652344e-05, -1.7642974853515625e-05, -4.410743713378906e-06, 8.821487426757812e-06, 2.205371856689453e-05, 3.528594970703125e-05, 4.851818084716797e-05, 6.175041198730469e-05, 7.49826431274414e-05, 8.821487426757812e-05, 0.00010144710540771484, 0.00011467933654785156, 0.00012791156768798828, 0.000141143798828125, 0.00015437602996826172, 0.00016760826110839844, 0.00018084049224853516, 0.00019407272338867188, 0.0002073049545288086, 0.0002205371856689453, 0.00023376941680908203, 0.00024700164794921875, 0.00026023387908935547, 0.0002734661102294922, 0.0002866983413696289, 0.0002999305725097656, 0.00031316280364990234, 0.00032639503479003906, 0.0003396272659301758, 0.0003528594970703125, 0.0003660917282104492, 0.00037932395935058594, 0.00039255619049072266, 0.0004057884216308594]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 7.0, 16.0, 21.0, 36.0, 39.0, 55.0, 59.0, 115.0, 178.0, 278.0, 408.0, 621.0, 940.0, 1536.0, 2281.0, 3789.0, 6237.0, 10406.0, 18017.0, 30099.0, 50877.0, 83858.0, 126549.0, 163657.0, 169286.0, 138581.0, 94878.0, 58745.0, 35242.0, 20592.0, 11919.0, 7235.0, 4366.0, 2700.0, 1789.0, 1070.0, 684.0, 459.0, 290.0, 195.0, 135.0, 99.0, 58.0, 51.0, 29.0, 20.0, 16.0, 6.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.78515625, -1.7278289794921875, -1.670501708984375, -1.6131744384765625, -1.55584716796875, -1.4985198974609375, -1.441192626953125, -1.3838653564453125, -1.3265380859375, -1.2692108154296875, -1.211883544921875, -1.1545562744140625, -1.09722900390625, -1.0399017333984375, -0.982574462890625, -0.9252471923828125, -0.867919921875, -0.8105926513671875, -0.753265380859375, -0.6959381103515625, -0.63861083984375, -0.5812835693359375, -0.523956298828125, -0.4666290283203125, -0.4093017578125, -0.3519744873046875, -0.294647216796875, -0.2373199462890625, -0.17999267578125, -0.1226654052734375, -0.065338134765625, -0.0080108642578125, 0.04931640625, 0.1066436767578125, 0.163970947265625, 0.2212982177734375, 0.27862548828125, 0.3359527587890625, 0.393280029296875, 0.4506072998046875, 0.5079345703125, 0.5652618408203125, 0.622589111328125, 0.6799163818359375, 0.73724365234375, 0.7945709228515625, 0.851898193359375, 0.9092254638671875, 0.966552734375, 1.0238800048828125, 1.081207275390625, 1.1385345458984375, 1.19586181640625, 1.2531890869140625, 1.310516357421875, 1.3678436279296875, 1.4251708984375, 1.4824981689453125, 1.539825439453125, 1.5971527099609375, 1.65447998046875, 1.7118072509765625, 1.769134521484375, 1.8264617919921875, 1.8837890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 9.0, 11.0, 6.0, 8.0, 15.0, 14.0, 15.0, 23.0, 22.0, 32.0, 37.0, 31.0, 38.0, 51.0, 49.0, 39.0, 45.0, 45.0, 50.0, 60.0, 58.0, 34.0, 33.0, 31.0, 39.0, 31.0, 23.0, 21.0, 24.0, 8.0, 19.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.51513671875, -0.49948883056640625, -0.4838409423828125, -0.46819305419921875, -0.452545166015625, -0.43689727783203125, -0.4212493896484375, -0.40560150146484375, -0.38995361328125, -0.37430572509765625, -0.3586578369140625, -0.34300994873046875, -0.327362060546875, -0.31171417236328125, -0.2960662841796875, -0.28041839599609375, -0.2647705078125, -0.24912261962890625, -0.2334747314453125, -0.21782684326171875, -0.202178955078125, -0.18653106689453125, -0.1708831787109375, -0.15523529052734375, -0.13958740234375, -0.12393951416015625, -0.1082916259765625, -0.09264373779296875, -0.076995849609375, -0.06134796142578125, -0.0457000732421875, -0.03005218505859375, -0.014404296875, 0.00124359130859375, 0.0168914794921875, 0.03253936767578125, 0.048187255859375, 0.06383514404296875, 0.0794830322265625, 0.09513092041015625, 0.11077880859375, 0.12642669677734375, 0.1420745849609375, 0.15772247314453125, 0.173370361328125, 0.18901824951171875, 0.2046661376953125, 0.22031402587890625, 0.2359619140625, 0.25160980224609375, 0.2672576904296875, 0.28290557861328125, 0.298553466796875, 0.31420135498046875, 0.3298492431640625, 0.34549713134765625, 0.36114501953125, 0.37679290771484375, 0.3924407958984375, 0.40808868408203125, 0.423736572265625, 0.43938446044921875, 0.4550323486328125, 0.47068023681640625, 0.486328125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 7.0, 6.0, 9.0, 12.0, 18.0, 20.0, 20.0, 18.0, 23.0, 25.0, 30.0, 27.0, 40.0, 38.0, 53.0, 49.0, 32.0, 47.0, 50.0, 56.0, 43.0, 36.0, 44.0, 40.0, 33.0, 25.0, 26.0, 30.0, 24.0, 17.0, 18.0, 13.0, 17.0, 11.0, 2.0, 9.0, 8.0, 5.0, 2.0, 2.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.74275541305542, -2.6544618606567383, -2.5661680698394775, -2.477874279022217, -2.389580726623535, -2.3012871742248535, -2.2129933834075928, -2.124699592590332, -2.0364060401916504, -1.9481123685836792, -1.859818696975708, -1.7715250253677368, -1.6832313537597656, -1.5949376821517944, -1.5066440105438232, -1.418350338935852, -1.3300566673278809, -1.2417629957199097, -1.1534693241119385, -1.0651756525039673, -0.9768819808959961, -0.8885883092880249, -0.8002946376800537, -0.7120009660720825, -0.6237072944641113, -0.5354136228561401, -0.44711995124816895, -0.35882627964019775, -0.27053260803222656, -0.18223893642425537, -0.09394526481628418, -0.005651593208312988, 0.0826418399810791, 0.1709355115890503, 0.2592291831970215, 0.3475228548049927, 0.43581652641296387, 0.5241101980209351, 0.6124038696289062, 0.7006975412368774, 0.7889912128448486, 0.8772848844528198, 0.965578556060791, 1.0538722276687622, 1.1421658992767334, 1.2304595708847046, 1.3187532424926758, 1.407046914100647, 1.4953405857086182, 1.5836342573165894, 1.6719279289245605, 1.7602216005325317, 1.848515272140503, 1.9368089437484741, 2.0251026153564453, 2.113396167755127, 2.2016899585723877, 2.2899837493896484, 2.37827730178833, 2.4665708541870117, 2.5548646450042725, 2.643158435821533, 2.731451988220215, 2.8197455406188965, 2.9080393314361572]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 12.0, 17.0, 13.0, 12.0, 18.0, 18.0, 11.0, 21.0, 21.0, 22.0, 29.0, 25.0, 35.0, 44.0, 31.0, 45.0, 38.0, 35.0, 41.0, 38.0, 50.0, 36.0, 35.0, 30.0, 35.0, 29.0, 31.0, 25.0, 26.0, 20.0, 23.0, 24.0, 17.0, 17.0, 13.0, 9.0, 7.0, 8.0, 1.0, 7.0, 7.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5127570629119873, -2.4362292289733887, -2.35970139503479, -2.2831737995147705, -2.206645965576172, -2.1301181316375732, -2.0535902976989746, -1.977062463760376, -1.900534749031067, -1.8240069150924683, -1.7474792003631592, -1.6709513664245605, -1.594423532485962, -1.5178958177566528, -1.4413679838180542, -1.3648402690887451, -1.2883124351501465, -1.2117846012115479, -1.1352568864822388, -1.0587290525436401, -0.9822012782096863, -0.9056735038757324, -0.8291456699371338, -0.7526178956031799, -0.6760901212692261, -0.5995623469352722, -0.5230345726013184, -0.4465067386627197, -0.36997896432876587, -0.293451189994812, -0.21692338585853577, -0.14039558172225952, -0.06386804580688477, 0.012659743428230286, 0.08918753266334534, 0.1657153218984604, 0.24224311113357544, 0.3187708854675293, 0.39529868960380554, 0.4718264937400818, 0.5483542680740356, 0.6248820424079895, 0.7014098167419434, 0.777937650680542, 0.8544654250144958, 0.9309931993484497, 1.0075210332870483, 1.0840487480163574, 1.160576581954956, 1.2371044158935547, 1.3136321306228638, 1.3901599645614624, 1.4666876792907715, 1.5432155132293701, 1.6197433471679688, 1.6962711811065674, 1.7727988958358765, 1.849326729774475, 1.9258544445037842, 2.002382278442383, 2.0789101123809814, 2.15543794631958, 2.2319655418395996, 2.3084933757781982, 2.385021209716797]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 6.0, 10.0, 21.0, 21.0, 41.0, 82.0, 159.0, 239.0, 390.0, 668.0, 1130.0, 1920.0, 3135.0, 5245.0, 8943.0, 15356.0, 26283.0, 43784.0, 73951.0, 121924.0, 195773.0, 300346.0, 427972.0, 543121.0, 593948.0, 550498.0, 439748.0, 312250.0, 205893.0, 128274.0, 78963.0, 46810.0, 27504.0, 16233.0, 9442.0, 5712.0, 3344.0, 2006.0, 1213.0, 724.0, 465.0, 299.0, 164.0, 114.0, 60.0, 31.0, 42.0, 11.0, 8.0, 1.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8932037353515625, -1.824493408203125, -1.7557830810546875, -1.68707275390625, -1.6183624267578125, -1.549652099609375, -1.4809417724609375, -1.4122314453125, -1.3435211181640625, -1.274810791015625, -1.2061004638671875, -1.13739013671875, -1.0686798095703125, -0.999969482421875, -0.9312591552734375, -0.862548828125, -0.7938385009765625, -0.725128173828125, -0.6564178466796875, -0.58770751953125, -0.5189971923828125, -0.450286865234375, -0.3815765380859375, -0.3128662109375, -0.2441558837890625, -0.175445556640625, -0.1067352294921875, -0.03802490234375, 0.0306854248046875, 0.099395751953125, 0.1681060791015625, 0.23681640625, 0.3055267333984375, 0.374237060546875, 0.4429473876953125, 0.51165771484375, 0.5803680419921875, 0.649078369140625, 0.7177886962890625, 0.7864990234375, 0.8552093505859375, 0.923919677734375, 0.9926300048828125, 1.06134033203125, 1.1300506591796875, 1.198760986328125, 1.2674713134765625, 1.336181640625, 1.4048919677734375, 1.473602294921875, 1.5423126220703125, 1.61102294921875, 1.6797332763671875, 1.748443603515625, 1.8171539306640625, 1.8858642578125, 1.9545745849609375, 2.023284912109375, 2.0919952392578125, 2.16070556640625, 2.2294158935546875, 2.298126220703125, 2.3668365478515625, 2.435546875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 12.0, 13.0, 19.0, 8.0, 17.0, 29.0, 30.0, 17.0, 36.0, 35.0, 32.0, 40.0, 40.0, 38.0, 45.0, 37.0, 45.0, 44.0, 46.0, 44.0, 38.0, 34.0, 35.0, 26.0, 31.0, 24.0, 26.0, 26.0, 15.0, 20.0, 12.0, 16.0, 16.0, 11.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9421234130859375, -1.882293701171875, -1.8224639892578125, -1.76263427734375, -1.7028045654296875, -1.642974853515625, -1.5831451416015625, -1.5233154296875, -1.4634857177734375, -1.403656005859375, -1.3438262939453125, -1.28399658203125, -1.2241668701171875, -1.164337158203125, -1.1045074462890625, -1.044677734375, -0.9848480224609375, -0.925018310546875, -0.8651885986328125, -0.80535888671875, -0.7455291748046875, -0.685699462890625, -0.6258697509765625, -0.5660400390625, -0.5062103271484375, -0.446380615234375, -0.3865509033203125, -0.32672119140625, -0.2668914794921875, -0.207061767578125, -0.1472320556640625, -0.08740234375, -0.0275726318359375, 0.032257080078125, 0.0920867919921875, 0.15191650390625, 0.2117462158203125, 0.271575927734375, 0.3314056396484375, 0.3912353515625, 0.4510650634765625, 0.510894775390625, 0.5707244873046875, 0.63055419921875, 0.6903839111328125, 0.750213623046875, 0.8100433349609375, 0.869873046875, 0.9297027587890625, 0.989532470703125, 1.0493621826171875, 1.10919189453125, 1.1690216064453125, 1.228851318359375, 1.2886810302734375, 1.3485107421875, 1.4083404541015625, 1.468170166015625, 1.5279998779296875, 1.58782958984375, 1.6476593017578125, 1.707489013671875, 1.7673187255859375, 1.8271484375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 9.0, 8.0, 19.0, 37.0, 48.0, 70.0, 121.0, 167.0, 305.0, 522.0, 747.0, 1175.0, 1888.0, 3016.0, 4639.0, 7535.0, 11887.0, 18713.0, 29477.0, 45899.0, 70096.0, 105526.0, 151809.0, 214589.0, 287922.0, 365575.0, 428604.0, 462047.0, 449901.0, 399661.0, 328065.0, 250259.0, 182285.0, 127444.0, 85086.0, 57148.0, 37173.0, 23739.0, 15027.0, 9676.0, 5978.0, 3814.0, 2405.0, 1584.0, 941.0, 611.0, 388.0, 230.0, 144.0, 83.0, 92.0, 36.0, 26.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0], "bins": [-1.8271484375, -1.7713623046875, -1.715576171875, -1.6597900390625, -1.60400390625, -1.5482177734375, -1.492431640625, -1.4366455078125, -1.380859375, -1.3250732421875, -1.269287109375, -1.2135009765625, -1.15771484375, -1.1019287109375, -1.046142578125, -0.9903564453125, -0.9345703125, -0.8787841796875, -0.822998046875, -0.7672119140625, -0.71142578125, -0.6556396484375, -0.599853515625, -0.5440673828125, -0.48828125, -0.4324951171875, -0.376708984375, -0.3209228515625, -0.26513671875, -0.2093505859375, -0.153564453125, -0.0977783203125, -0.0419921875, 0.0137939453125, 0.069580078125, 0.1253662109375, 0.18115234375, 0.2369384765625, 0.292724609375, 0.3485107421875, 0.404296875, 0.4600830078125, 0.515869140625, 0.5716552734375, 0.62744140625, 0.6832275390625, 0.739013671875, 0.7947998046875, 0.8505859375, 0.9063720703125, 0.962158203125, 1.0179443359375, 1.07373046875, 1.1295166015625, 1.185302734375, 1.2410888671875, 1.296875, 1.3526611328125, 1.408447265625, 1.4642333984375, 1.52001953125, 1.5758056640625, 1.631591796875, 1.6873779296875, 1.7431640625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 7.0, 17.0, 15.0, 19.0, 14.0, 21.0, 18.0, 38.0, 35.0, 45.0, 55.0, 65.0, 106.0, 108.0, 117.0, 120.0, 146.0, 155.0, 174.0, 173.0, 199.0, 202.0, 188.0, 197.0, 193.0, 198.0, 167.0, 179.0, 164.0, 144.0, 129.0, 104.0, 106.0, 79.0, 56.0, 84.0, 58.0, 39.0, 27.0, 20.0, 23.0, 21.0, 9.0, 8.0, 12.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.88037109375, -0.8539810180664062, -0.8275909423828125, -0.8012008666992188, -0.774810791015625, -0.7484207153320312, -0.7220306396484375, -0.6956405639648438, -0.66925048828125, -0.6428604125976562, -0.6164703369140625, -0.5900802612304688, -0.563690185546875, -0.5373001098632812, -0.5109100341796875, -0.48451995849609375, -0.4581298828125, -0.43173980712890625, -0.4053497314453125, -0.37895965576171875, -0.352569580078125, -0.32617950439453125, -0.2997894287109375, -0.27339935302734375, -0.24700927734375, -0.22061920166015625, -0.1942291259765625, -0.16783905029296875, -0.141448974609375, -0.11505889892578125, -0.0886688232421875, -0.06227874755859375, -0.035888671875, -0.00949859619140625, 0.0168914794921875, 0.04328155517578125, 0.069671630859375, 0.09606170654296875, 0.1224517822265625, 0.14884185791015625, 0.17523193359375, 0.20162200927734375, 0.2280120849609375, 0.25440216064453125, 0.280792236328125, 0.30718231201171875, 0.3335723876953125, 0.35996246337890625, 0.3863525390625, 0.41274261474609375, 0.4391326904296875, 0.46552276611328125, 0.491912841796875, 0.5183029174804688, 0.5446929931640625, 0.5710830688476562, 0.59747314453125, 0.6238632202148438, 0.6502532958984375, 0.6766433715820312, 0.703033447265625, 0.7294235229492188, 0.7558135986328125, 0.7822036743164062, 0.80859375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 11.0, 11.0, 18.0, 21.0, 28.0, 26.0, 25.0, 44.0, 35.0, 38.0, 41.0, 48.0, 41.0, 53.0, 54.0, 62.0, 55.0, 44.0, 40.0, 44.0, 34.0, 41.0, 40.0, 27.0, 22.0, 13.0, 16.0, 12.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.011713743209839, -2.9235851764678955, -2.835456609725952, -2.747328042984009, -2.6591994762420654, -2.571070909500122, -2.482942581176758, -2.3948140144348145, -2.306685447692871, -2.2185568809509277, -2.1304283142089844, -2.042299747467041, -1.9541711807250977, -1.8660426139831543, -1.7779141664505005, -1.6897855997085571, -1.6016569137573242, -1.5135283470153809, -1.4253997802734375, -1.3372712135314941, -1.2491426467895508, -1.1610140800476074, -1.0728856325149536, -0.9847570657730103, -0.8966284990310669, -0.8084999322891235, -0.7203713655471802, -0.6322428584098816, -0.5441142916679382, -0.4559857249259949, -0.3678572177886963, -0.27972865104675293, -0.19160032272338867, -0.1034717708826065, -0.01534321904182434, 0.07278531789779663, 0.16091388463974, 0.24904245138168335, 0.33717095851898193, 0.4252995252609253, 0.5134280920028687, 0.601556658744812, 0.6896852254867554, 0.777813732624054, 0.8659422993659973, 0.9540708661079407, 1.0421993732452393, 1.1303279399871826, 1.218456506729126, 1.3065850734710693, 1.3947136402130127, 1.482842206954956, 1.5709707736968994, 1.6590993404388428, 1.7472277879714966, 1.83535635471344, 1.9234849214553833, 2.011613368988037, 2.0997419357299805, 2.187870502471924, 2.275999069213867, 2.3641276359558105, 2.452256202697754, 2.5403847694396973, 2.6285133361816406]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 6.0, 12.0, 12.0, 14.0, 12.0, 15.0, 16.0, 16.0, 22.0, 19.0, 35.0, 35.0, 24.0, 23.0, 22.0, 24.0, 34.0, 42.0, 40.0, 31.0, 47.0, 35.0, 44.0, 37.0, 34.0, 27.0, 35.0, 27.0, 32.0, 26.0, 15.0, 26.0, 20.0, 15.0, 13.0, 16.0, 16.0, 15.0, 7.0, 11.0, 7.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.096761703491211, -2.035475492477417, -1.9741891622543335, -1.91290283203125, -1.851616621017456, -1.790330410003662, -1.7290440797805786, -1.6677577495574951, -1.6064715385437012, -1.5451853275299072, -1.4838989973068237, -1.4226126670837402, -1.3613264560699463, -1.3000402450561523, -1.2387539148330688, -1.1774675846099854, -1.1161813735961914, -1.0548951625823975, -0.993608832359314, -0.9323225617408752, -0.8710362911224365, -0.8097500205039978, -0.7484637498855591, -0.6871774792671204, -0.6258912086486816, -0.5646049380302429, -0.5033186674118042, -0.4420323967933655, -0.38074612617492676, -0.31945985555648804, -0.2581735849380493, -0.1968873143196106, -0.13560104370117188, -0.07431477308273315, -0.013028502464294434, 0.04825776815414429, 0.10954403877258301, 0.17083030939102173, 0.23211658000946045, 0.29340285062789917, 0.3546891212463379, 0.4159753918647766, 0.47726166248321533, 0.538547933101654, 0.5998342037200928, 0.6611204743385315, 0.7224067449569702, 0.7836930155754089, 0.8449792861938477, 0.9062655568122864, 0.9675518274307251, 1.0288381576538086, 1.0901243686676025, 1.1514105796813965, 1.21269690990448, 1.2739832401275635, 1.3352694511413574, 1.3965556621551514, 1.4578419923782349, 1.5191283226013184, 1.5804145336151123, 1.6417007446289062, 1.7029870748519897, 1.7642734050750732, 1.8255596160888672]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 10.0, 9.0, 20.0, 18.0, 25.0, 37.0, 46.0, 61.0, 91.0, 128.0, 177.0, 265.0, 417.0, 556.0, 812.0, 1361.0, 2705.0, 5607.0, 14257.0, 43241.0, 140649.0, 375635.0, 308765.0, 101030.0, 31303.0, 10988.0, 4435.0, 2184.0, 1269.0, 779.0, 503.0, 344.0, 251.0, 156.0, 122.0, 82.0, 51.0, 43.0, 29.0, 28.0, 20.0, 16.0, 6.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.629638671875, -2.54443359375, -2.459228515625, -2.3740234375, -2.288818359375, -2.20361328125, -2.118408203125, -2.033203125, -1.947998046875, -1.86279296875, -1.777587890625, -1.6923828125, -1.607177734375, -1.52197265625, -1.436767578125, -1.3515625, -1.266357421875, -1.18115234375, -1.095947265625, -1.0107421875, -0.925537109375, -0.84033203125, -0.755126953125, -0.669921875, -0.584716796875, -0.49951171875, -0.414306640625, -0.3291015625, -0.243896484375, -0.15869140625, -0.073486328125, 0.01171875, 0.096923828125, 0.18212890625, 0.267333984375, 0.3525390625, 0.437744140625, 0.52294921875, 0.608154296875, 0.693359375, 0.778564453125, 0.86376953125, 0.948974609375, 1.0341796875, 1.119384765625, 1.20458984375, 1.289794921875, 1.375, 1.460205078125, 1.54541015625, 1.630615234375, 1.7158203125, 1.801025390625, 1.88623046875, 1.971435546875, 2.056640625, 2.141845703125, 2.22705078125, 2.312255859375, 2.3974609375, 2.482666015625, 2.56787109375, 2.653076171875, 2.73828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 14.0, 10.0, 9.0, 14.0, 9.0, 7.0, 10.0, 13.0, 21.0, 20.0, 21.0, 26.0, 28.0, 34.0, 31.0, 28.0, 30.0, 35.0, 32.0, 34.0, 35.0, 46.0, 47.0, 38.0, 38.0, 33.0, 33.0, 21.0, 30.0, 28.0, 24.0, 22.0, 14.0, 29.0, 15.0, 15.0, 22.0, 18.0, 10.0, 8.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0], "bins": [-2.134765625, -2.0708160400390625, -2.006866455078125, -1.9429168701171875, -1.87896728515625, -1.8150177001953125, -1.751068115234375, -1.6871185302734375, -1.6231689453125, -1.5592193603515625, -1.495269775390625, -1.4313201904296875, -1.36737060546875, -1.3034210205078125, -1.239471435546875, -1.1755218505859375, -1.111572265625, -1.0476226806640625, -0.983673095703125, -0.9197235107421875, -0.85577392578125, -0.7918243408203125, -0.727874755859375, -0.6639251708984375, -0.5999755859375, -0.5360260009765625, -0.472076416015625, -0.4081268310546875, -0.34417724609375, -0.2802276611328125, -0.216278076171875, -0.1523284912109375, -0.08837890625, -0.0244293212890625, 0.039520263671875, 0.1034698486328125, 0.16741943359375, 0.2313690185546875, 0.295318603515625, 0.3592681884765625, 0.4232177734375, 0.4871673583984375, 0.551116943359375, 0.6150665283203125, 0.67901611328125, 0.7429656982421875, 0.806915283203125, 0.8708648681640625, 0.934814453125, 0.9987640380859375, 1.062713623046875, 1.1266632080078125, 1.19061279296875, 1.2545623779296875, 1.318511962890625, 1.3824615478515625, 1.4464111328125, 1.5103607177734375, 1.574310302734375, 1.6382598876953125, 1.70220947265625, 1.7661590576171875, 1.830108642578125, 1.8940582275390625, 1.9580078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 9.0, 5.0, 12.0, 15.0, 19.0, 20.0, 35.0, 42.0, 65.0, 84.0, 101.0, 149.0, 214.0, 318.0, 477.0, 797.0, 1312.0, 2466.0, 5516.0, 13967.0, 39360.0, 128808.0, 370817.0, 324835.0, 104280.0, 32704.0, 11659.0, 4724.0, 2312.0, 1175.0, 725.0, 433.0, 311.0, 216.0, 177.0, 96.0, 76.0, 49.0, 41.0, 24.0, 24.0, 21.0, 17.0, 9.0, 10.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 3.0], "bins": [-2.76171875, -2.6826171875, -2.603515625, -2.5244140625, -2.4453125, -2.3662109375, -2.287109375, -2.2080078125, -2.12890625, -2.0498046875, -1.970703125, -1.8916015625, -1.8125, -1.7333984375, -1.654296875, -1.5751953125, -1.49609375, -1.4169921875, -1.337890625, -1.2587890625, -1.1796875, -1.1005859375, -1.021484375, -0.9423828125, -0.86328125, -0.7841796875, -0.705078125, -0.6259765625, -0.546875, -0.4677734375, -0.388671875, -0.3095703125, -0.23046875, -0.1513671875, -0.072265625, 0.0068359375, 0.0859375, 0.1650390625, 0.244140625, 0.3232421875, 0.40234375, 0.4814453125, 0.560546875, 0.6396484375, 0.71875, 0.7978515625, 0.876953125, 0.9560546875, 1.03515625, 1.1142578125, 1.193359375, 1.2724609375, 1.3515625, 1.4306640625, 1.509765625, 1.5888671875, 1.66796875, 1.7470703125, 1.826171875, 1.9052734375, 1.984375, 2.0634765625, 2.142578125, 2.2216796875, 2.30078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 8.0, 8.0, 14.0, 11.0, 11.0, 14.0, 24.0, 22.0, 28.0, 26.0, 27.0, 22.0, 38.0, 39.0, 23.0, 30.0, 40.0, 43.0, 51.0, 49.0, 53.0, 40.0, 38.0, 34.0, 46.0, 36.0, 40.0, 23.0, 24.0, 19.0, 28.0, 18.0, 16.0, 7.0, 10.0, 10.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.734375, -1.6830291748046875, -1.631683349609375, -1.5803375244140625, -1.52899169921875, -1.4776458740234375, -1.426300048828125, -1.3749542236328125, -1.3236083984375, -1.2722625732421875, -1.220916748046875, -1.1695709228515625, -1.11822509765625, -1.0668792724609375, -1.015533447265625, -0.9641876220703125, -0.912841796875, -0.8614959716796875, -0.810150146484375, -0.7588043212890625, -0.70745849609375, -0.6561126708984375, -0.604766845703125, -0.5534210205078125, -0.5020751953125, -0.4507293701171875, -0.399383544921875, -0.3480377197265625, -0.29669189453125, -0.2453460693359375, -0.194000244140625, -0.1426544189453125, -0.09130859375, -0.0399627685546875, 0.011383056640625, 0.0627288818359375, 0.11407470703125, 0.1654205322265625, 0.216766357421875, 0.2681121826171875, 0.3194580078125, 0.3708038330078125, 0.422149658203125, 0.4734954833984375, 0.52484130859375, 0.5761871337890625, 0.627532958984375, 0.6788787841796875, 0.730224609375, 0.7815704345703125, 0.832916259765625, 0.8842620849609375, 0.93560791015625, 0.9869537353515625, 1.038299560546875, 1.0896453857421875, 1.1409912109375, 1.1923370361328125, 1.243682861328125, 1.2950286865234375, 1.34637451171875, 1.3977203369140625, 1.449066162109375, 1.5004119873046875, 1.5517578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 10.0, 9.0, 8.0, 19.0, 28.0, 21.0, 31.0, 52.0, 91.0, 116.0, 173.0, 269.0, 380.0, 556.0, 871.0, 1501.0, 2573.0, 4553.0, 10212.0, 30174.0, 135434.0, 560332.0, 229287.0, 44475.0, 13761.0, 5808.0, 3035.0, 1658.0, 1054.0, 670.0, 436.0, 302.0, 189.0, 126.0, 79.0, 66.0, 49.0, 40.0, 34.0, 16.0, 19.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.205078125, -1.1681671142578125, -1.131256103515625, -1.0943450927734375, -1.05743408203125, -1.0205230712890625, -0.983612060546875, -0.9467010498046875, -0.9097900390625, -0.8728790283203125, -0.835968017578125, -0.7990570068359375, -0.76214599609375, -0.7252349853515625, -0.688323974609375, -0.6514129638671875, -0.614501953125, -0.5775909423828125, -0.540679931640625, -0.5037689208984375, -0.46685791015625, -0.4299468994140625, -0.393035888671875, -0.3561248779296875, -0.3192138671875, -0.2823028564453125, -0.245391845703125, -0.2084808349609375, -0.17156982421875, -0.1346588134765625, -0.097747802734375, -0.0608367919921875, -0.02392578125, 0.0129852294921875, 0.049896240234375, 0.0868072509765625, 0.12371826171875, 0.1606292724609375, 0.197540283203125, 0.2344512939453125, 0.2713623046875, 0.3082733154296875, 0.345184326171875, 0.3820953369140625, 0.41900634765625, 0.4559173583984375, 0.492828369140625, 0.5297393798828125, 0.566650390625, 0.6035614013671875, 0.640472412109375, 0.6773834228515625, 0.71429443359375, 0.7512054443359375, 0.788116455078125, 0.8250274658203125, 0.8619384765625, 0.8988494873046875, 0.935760498046875, 0.9726715087890625, 1.00958251953125, 1.0464935302734375, 1.083404541015625, 1.1203155517578125, 1.1572265625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 10.0, 20.0, 31.0, 34.0, 38.0, 54.0, 67.0, 70.0, 62.0, 74.0, 94.0, 76.0, 68.0, 47.0, 35.0, 41.0, 26.0, 30.0, 21.0, 18.0, 8.0, 9.0, 4.0, 4.0, 1.0, 7.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.99758529663086e-05, -6.81411474943161e-05, -6.630644202232361e-05, -6.447173655033112e-05, -6.263703107833862e-05, -6.080232560634613e-05, -5.896762013435364e-05, -5.7132914662361145e-05, -5.529820919036865e-05, -5.346350371837616e-05, -5.162879824638367e-05, -4.9794092774391174e-05, -4.795938730239868e-05, -4.612468183040619e-05, -4.4289976358413696e-05, -4.2455270886421204e-05, -4.062056541442871e-05, -3.878585994243622e-05, -3.6951154470443726e-05, -3.511644899845123e-05, -3.328174352645874e-05, -3.144703805446625e-05, -2.9612332582473755e-05, -2.7777627110481262e-05, -2.594292163848877e-05, -2.4108216166496277e-05, -2.2273510694503784e-05, -2.043880522251129e-05, -1.86040997505188e-05, -1.6769394278526306e-05, -1.4934688806533813e-05, -1.309998333454132e-05, -1.1265277862548828e-05, -9.430572390556335e-06, -7.595866918563843e-06, -5.76116144657135e-06, -3.926455974578857e-06, -2.0917505025863647e-06, -2.5704503059387207e-07, 1.5776604413986206e-06, 3.4123659133911133e-06, 5.247071385383606e-06, 7.081776857376099e-06, 8.916482329368591e-06, 1.0751187801361084e-05, 1.2585893273353577e-05, 1.442059874534607e-05, 1.6255304217338562e-05, 1.8090009689331055e-05, 1.9924715161323547e-05, 2.175942063331604e-05, 2.3594126105308533e-05, 2.5428831577301025e-05, 2.7263537049293518e-05, 2.909824252128601e-05, 3.0932947993278503e-05, 3.2767653465270996e-05, 3.460235893726349e-05, 3.643706440925598e-05, 3.8271769881248474e-05, 4.010647535324097e-05, 4.194118082523346e-05, 4.377588629722595e-05, 4.5610591769218445e-05, 4.744529724121094e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 14.0, 15.0, 30.0, 39.0, 55.0, 83.0, 105.0, 178.0, 249.0, 384.0, 560.0, 839.0, 1297.0, 1942.0, 3400.0, 5662.0, 10182.0, 19208.0, 38796.0, 81446.0, 169774.0, 276304.0, 218826.0, 110166.0, 52086.0, 25528.0, 13194.0, 7150.0, 4109.0, 2352.0, 1586.0, 958.0, 682.0, 441.0, 288.0, 199.0, 135.0, 95.0, 63.0, 40.0, 21.0, 16.0, 17.0, 6.0, 10.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7031707763671875, -0.680267333984375, -0.6573638916015625, -0.63446044921875, -0.6115570068359375, -0.588653564453125, -0.5657501220703125, -0.5428466796875, -0.5199432373046875, -0.497039794921875, -0.4741363525390625, -0.45123291015625, -0.4283294677734375, -0.405426025390625, -0.3825225830078125, -0.359619140625, -0.3367156982421875, -0.313812255859375, -0.2909088134765625, -0.26800537109375, -0.2451019287109375, -0.222198486328125, -0.1992950439453125, -0.1763916015625, -0.1534881591796875, -0.130584716796875, -0.1076812744140625, -0.08477783203125, -0.0618743896484375, -0.038970947265625, -0.0160675048828125, 0.0068359375, 0.0297393798828125, 0.052642822265625, 0.0755462646484375, 0.09844970703125, 0.1213531494140625, 0.144256591796875, 0.1671600341796875, 0.1900634765625, 0.2129669189453125, 0.235870361328125, 0.2587738037109375, 0.28167724609375, 0.3045806884765625, 0.327484130859375, 0.3503875732421875, 0.373291015625, 0.3961944580078125, 0.419097900390625, 0.4420013427734375, 0.46490478515625, 0.4878082275390625, 0.510711669921875, 0.5336151123046875, 0.5565185546875, 0.5794219970703125, 0.602325439453125, 0.6252288818359375, 0.64813232421875, 0.6710357666015625, 0.693939208984375, 0.7168426513671875, 0.73974609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 6.0, 12.0, 22.0, 28.0, 25.0, 55.0, 65.0, 77.0, 97.0, 116.0, 105.0, 97.0, 74.0, 64.0, 43.0, 22.0, 28.0, 9.0, 13.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2656707763671875, -0.254974365234375, -0.2442779541015625, -0.23358154296875, -0.2228851318359375, -0.212188720703125, -0.2014923095703125, -0.1907958984375, -0.1800994873046875, -0.169403076171875, -0.1587066650390625, -0.14801025390625, -0.1373138427734375, -0.126617431640625, -0.1159210205078125, -0.105224609375, -0.0945281982421875, -0.083831787109375, -0.0731353759765625, -0.06243896484375, -0.0517425537109375, -0.041046142578125, -0.0303497314453125, -0.0196533203125, -0.0089569091796875, 0.001739501953125, 0.0124359130859375, 0.02313232421875, 0.0338287353515625, 0.044525146484375, 0.0552215576171875, 0.06591796875, 0.0766143798828125, 0.087310791015625, 0.0980072021484375, 0.10870361328125, 0.1194000244140625, 0.130096435546875, 0.1407928466796875, 0.1514892578125, 0.1621856689453125, 0.172882080078125, 0.1835784912109375, 0.19427490234375, 0.2049713134765625, 0.215667724609375, 0.2263641357421875, 0.237060546875, 0.2477569580078125, 0.258453369140625, 0.2691497802734375, 0.27984619140625, 0.2905426025390625, 0.301239013671875, 0.3119354248046875, 0.3226318359375, 0.3333282470703125, 0.344024658203125, 0.3547210693359375, 0.36541748046875, 0.3761138916015625, 0.386810302734375, 0.3975067138671875, 0.408203125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 4.0, 7.0, 11.0, 6.0, 8.0, 18.0, 28.0, 29.0, 18.0, 41.0, 36.0, 43.0, 33.0, 42.0, 48.0, 54.0, 45.0, 73.0, 54.0, 51.0, 46.0, 39.0, 39.0, 42.0, 39.0, 28.0, 26.0, 16.0, 12.0, 16.0, 13.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.925477981567383, -2.8365590572357178, -2.7476401329040527, -2.6587212085723877, -2.5698022842407227, -2.4808833599090576, -2.3919644355773926, -2.3030452728271484, -2.2141265869140625, -2.1252076625823975, -2.0362887382507324, -1.9473698139190674, -1.8584508895874023, -1.7695319652557373, -1.6806129217147827, -1.5916939973831177, -1.502774953842163, -1.413856029510498, -1.324937105178833, -1.236018180847168, -1.147099256515503, -1.058180332183838, -0.9692612886428833, -0.8803423643112183, -0.7914234399795532, -0.7025045156478882, -0.6135855913162231, -0.5246666073799133, -0.4357476830482483, -0.34682875871658325, -0.25790977478027344, -0.1689908504486084, -0.08007168769836426, 0.008847251534461975, 0.09776619076728821, 0.18668514490127563, 0.2756040692329407, 0.3645229935646057, 0.4534419775009155, 0.5423609018325806, 0.6312798261642456, 0.7201987504959106, 0.8091176748275757, 0.8980366587638855, 0.9869555830955505, 1.0758745670318604, 1.1647934913635254, 1.2537124156951904, 1.3426313400268555, 1.4315502643585205, 1.5204691886901855, 1.6093881130218506, 1.6983070373535156, 1.7872259616851807, 1.8761450052261353, 1.9650639295578003, 2.053982734680176, 2.142901659011841, 2.231820583343506, 2.320739507675171, 2.409658432006836, 2.498577356338501, 2.587496280670166, 2.67641544342041, 2.765334367752075]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 4.0, 6.0, 4.0, 12.0, 8.0, 10.0, 16.0, 10.0, 16.0, 11.0, 18.0, 32.0, 28.0, 22.0, 30.0, 34.0, 24.0, 16.0, 29.0, 36.0, 40.0, 47.0, 46.0, 40.0, 32.0, 41.0, 35.0, 39.0, 40.0, 33.0, 22.0, 21.0, 24.0, 22.0, 17.0, 22.0, 10.0, 15.0, 15.0, 16.0, 13.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.1321260929107666, -2.0693349838256836, -2.0065436363220215, -1.9437525272369385, -1.880961298942566, -1.8181700706481934, -1.7553788423538208, -1.6925876140594482, -1.6297965049743652, -1.5670052766799927, -1.5042140483856201, -1.441422939300537, -1.3786317110061646, -1.315840482711792, -1.2530492544174194, -1.1902580261230469, -1.1274667978286743, -1.0646755695343018, -1.0018843412399292, -0.9390931725502014, -0.8763020038604736, -0.8135107755661011, -0.7507195472717285, -0.687928318977356, -0.6251371502876282, -0.5623459219932556, -0.49955475330352783, -0.4367635250091553, -0.3739723265171051, -0.31118112802505493, -0.24838989973068237, -0.1855987012386322, -0.12280738353729248, -0.06001617759466171, 0.002775028347969055, 0.06556624174118042, 0.1283574402332306, 0.19114863872528076, 0.2539398670196533, 0.3167310655117035, 0.37952226400375366, 0.44231346249580383, 0.505104660987854, 0.5678958892822266, 0.6306871175765991, 0.6934782862663269, 0.7562695145606995, 0.8190606832504272, 0.8818519115447998, 0.9446431398391724, 1.007434368133545, 1.070225477218628, 1.1330167055130005, 1.195807933807373, 1.2585991621017456, 1.3213903903961182, 1.3841814994812012, 1.4469727277755737, 1.5097639560699463, 1.5725550651550293, 1.6353462934494019, 1.6981375217437744, 1.760928750038147, 1.8237199783325195, 1.886511206626892]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 13.0, 13.0, 15.0, 38.0, 58.0, 85.0, 113.0, 178.0, 277.0, 402.0, 590.0, 847.0, 1352.0, 1984.0, 2889.0, 4574.0, 6788.0, 9948.0, 15071.0, 21892.0, 31813.0, 44284.0, 60720.0, 79197.0, 95565.0, 108340.0, 111284.0, 104707.0, 90615.0, 73121.0, 55075.0, 39756.0, 27912.0, 19219.0, 13079.0, 8825.0, 5909.0, 4038.0, 2730.0, 1805.0, 1146.0, 801.0, 496.0, 345.0, 214.0, 139.0, 87.0, 65.0, 34.0, 39.0, 21.0, 8.0, 9.0, 10.0, 6.0, 5.0, 5.0], "bins": [-2.111328125, -2.0479888916015625, -1.984649658203125, -1.9213104248046875, -1.85797119140625, -1.7946319580078125, -1.731292724609375, -1.6679534912109375, -1.6046142578125, -1.5412750244140625, -1.477935791015625, -1.4145965576171875, -1.35125732421875, -1.2879180908203125, -1.224578857421875, -1.1612396240234375, -1.097900390625, -1.0345611572265625, -0.971221923828125, -0.9078826904296875, -0.84454345703125, -0.7812042236328125, -0.717864990234375, -0.6545257568359375, -0.5911865234375, -0.5278472900390625, -0.464508056640625, -0.4011688232421875, -0.33782958984375, -0.2744903564453125, -0.211151123046875, -0.1478118896484375, -0.08447265625, -0.0211334228515625, 0.042205810546875, 0.1055450439453125, 0.16888427734375, 0.2322235107421875, 0.295562744140625, 0.3589019775390625, 0.4222412109375, 0.4855804443359375, 0.548919677734375, 0.6122589111328125, 0.67559814453125, 0.7389373779296875, 0.802276611328125, 0.8656158447265625, 0.928955078125, 0.9922943115234375, 1.055633544921875, 1.1189727783203125, 1.18231201171875, 1.2456512451171875, 1.308990478515625, 1.3723297119140625, 1.4356689453125, 1.4990081787109375, 1.562347412109375, 1.6256866455078125, 1.68902587890625, 1.7523651123046875, 1.815704345703125, 1.8790435791015625, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 10.0, 19.0, 16.0, 19.0, 19.0, 17.0, 19.0, 34.0, 21.0, 30.0, 27.0, 35.0, 36.0, 40.0, 38.0, 51.0, 36.0, 40.0, 45.0, 52.0, 36.0, 39.0, 28.0, 34.0, 29.0, 18.0, 16.0, 29.0, 21.0, 21.0, 17.0, 16.0, 11.0, 7.0, 7.0, 13.0, 11.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.974609375, -1.91070556640625, -1.8468017578125, -1.78289794921875, -1.718994140625, -1.65509033203125, -1.5911865234375, -1.52728271484375, -1.46337890625, -1.39947509765625, -1.3355712890625, -1.27166748046875, -1.207763671875, -1.14385986328125, -1.0799560546875, -1.01605224609375, -0.9521484375, -0.88824462890625, -0.8243408203125, -0.76043701171875, -0.696533203125, -0.63262939453125, -0.5687255859375, -0.50482177734375, -0.44091796875, -0.37701416015625, -0.3131103515625, -0.24920654296875, -0.185302734375, -0.12139892578125, -0.0574951171875, 0.00640869140625, 0.0703125, 0.13421630859375, 0.1981201171875, 0.26202392578125, 0.325927734375, 0.38983154296875, 0.4537353515625, 0.51763916015625, 0.58154296875, 0.64544677734375, 0.7093505859375, 0.77325439453125, 0.837158203125, 0.90106201171875, 0.9649658203125, 1.02886962890625, 1.0927734375, 1.15667724609375, 1.2205810546875, 1.28448486328125, 1.348388671875, 1.41229248046875, 1.4761962890625, 1.54010009765625, 1.60400390625, 1.66790771484375, 1.7318115234375, 1.79571533203125, 1.859619140625, 1.92352294921875, 1.9874267578125, 2.05133056640625, 2.115234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 7.0, 22.0, 20.0, 33.0, 57.0, 106.0, 160.0, 276.0, 439.0, 734.0, 1193.0, 2015.0, 3604.0, 5963.0, 9842.0, 16141.0, 26400.0, 40745.0, 60684.0, 85314.0, 110673.0, 128409.0, 131738.0, 120376.0, 97600.0, 72003.0, 49639.0, 32462.0, 20363.0, 12548.0, 7641.0, 4443.0, 2739.0, 1672.0, 993.0, 591.0, 340.0, 237.0, 144.0, 84.0, 45.0, 30.0, 9.0, 12.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.7716064453125, -1.701416015625, -1.6312255859375, -1.56103515625, -1.4908447265625, -1.420654296875, -1.3504638671875, -1.2802734375, -1.2100830078125, -1.139892578125, -1.0697021484375, -0.99951171875, -0.9293212890625, -0.859130859375, -0.7889404296875, -0.71875, -0.6485595703125, -0.578369140625, -0.5081787109375, -0.43798828125, -0.3677978515625, -0.297607421875, -0.2274169921875, -0.1572265625, -0.0870361328125, -0.016845703125, 0.0533447265625, 0.12353515625, 0.1937255859375, 0.263916015625, 0.3341064453125, 0.404296875, 0.4744873046875, 0.544677734375, 0.6148681640625, 0.68505859375, 0.7552490234375, 0.825439453125, 0.8956298828125, 0.9658203125, 1.0360107421875, 1.106201171875, 1.1763916015625, 1.24658203125, 1.3167724609375, 1.386962890625, 1.4571533203125, 1.52734375, 1.5975341796875, 1.667724609375, 1.7379150390625, 1.80810546875, 1.8782958984375, 1.948486328125, 2.0186767578125, 2.0888671875, 2.1590576171875, 2.229248046875, 2.2994384765625, 2.36962890625, 2.4398193359375, 2.510009765625, 2.5802001953125, 2.650390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 9.0, 21.0, 17.0, 12.0, 23.0, 26.0, 25.0, 21.0, 39.0, 28.0, 45.0, 31.0, 39.0, 41.0, 39.0, 51.0, 43.0, 47.0, 46.0, 45.0, 34.0, 41.0, 46.0, 33.0, 29.0, 23.0, 13.0, 22.0, 10.0, 18.0, 14.0, 6.0, 13.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.344024658203125, -1.29742431640625, -1.250823974609375, -1.2042236328125, -1.157623291015625, -1.11102294921875, -1.064422607421875, -1.017822265625, -0.971221923828125, -0.92462158203125, -0.878021240234375, -0.8314208984375, -0.784820556640625, -0.73822021484375, -0.691619873046875, -0.64501953125, -0.598419189453125, -0.55181884765625, -0.505218505859375, -0.4586181640625, -0.412017822265625, -0.36541748046875, -0.318817138671875, -0.272216796875, -0.225616455078125, -0.17901611328125, -0.132415771484375, -0.0858154296875, -0.039215087890625, 0.00738525390625, 0.053985595703125, 0.1005859375, 0.147186279296875, 0.19378662109375, 0.240386962890625, 0.2869873046875, 0.333587646484375, 0.38018798828125, 0.426788330078125, 0.473388671875, 0.519989013671875, 0.56658935546875, 0.613189697265625, 0.6597900390625, 0.706390380859375, 0.75299072265625, 0.799591064453125, 0.84619140625, 0.892791748046875, 0.93939208984375, 0.985992431640625, 1.0325927734375, 1.079193115234375, 1.12579345703125, 1.172393798828125, 1.218994140625, 1.265594482421875, 1.31219482421875, 1.358795166015625, 1.4053955078125, 1.451995849609375, 1.49859619140625, 1.545196533203125, 1.591796875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 24.0, 30.0, 38.0, 48.0, 91.0, 99.0, 190.0, 250.0, 426.0, 647.0, 917.0, 1489.0, 2503.0, 4192.0, 7742.0, 15272.0, 31301.0, 69323.0, 162597.0, 299850.0, 243930.0, 110974.0, 48205.0, 22566.0, 11142.0, 5880.0, 3379.0, 1930.0, 1237.0, 799.0, 476.0, 318.0, 227.0, 137.0, 91.0, 71.0, 48.0, 35.0, 23.0, 19.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.289764404296875, -3.17132568359375, -3.052886962890625, -2.9344482421875, -2.816009521484375, -2.69757080078125, -2.579132080078125, -2.460693359375, -2.342254638671875, -2.22381591796875, -2.105377197265625, -1.9869384765625, -1.868499755859375, -1.75006103515625, -1.631622314453125, -1.51318359375, -1.394744873046875, -1.27630615234375, -1.157867431640625, -1.0394287109375, -0.920989990234375, -0.80255126953125, -0.684112548828125, -0.565673828125, -0.447235107421875, -0.32879638671875, -0.210357666015625, -0.0919189453125, 0.026519775390625, 0.14495849609375, 0.263397216796875, 0.3818359375, 0.500274658203125, 0.61871337890625, 0.737152099609375, 0.8555908203125, 0.974029541015625, 1.09246826171875, 1.210906982421875, 1.329345703125, 1.447784423828125, 1.56622314453125, 1.684661865234375, 1.8031005859375, 1.921539306640625, 2.03997802734375, 2.158416748046875, 2.27685546875, 2.395294189453125, 2.51373291015625, 2.632171630859375, 2.7506103515625, 2.869049072265625, 2.98748779296875, 3.105926513671875, 3.224365234375, 3.342803955078125, 3.46124267578125, 3.579681396484375, 3.6981201171875, 3.816558837890625, 3.93499755859375, 4.053436279296875, 4.171875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 8.0, 15.0, 19.0, 17.0, 23.0, 31.0, 51.0, 59.0, 55.0, 66.0, 90.0, 70.0, 56.0, 76.0, 49.0, 52.0, 46.0, 42.0, 19.0, 27.0, 15.0, 18.0, 5.0, 12.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00020325183868408203, -0.00019521452486515045, -0.00018717721104621887, -0.0001791398972272873, -0.0001711025834083557, -0.00016306526958942413, -0.00015502795577049255, -0.00014699064195156097, -0.0001389533281326294, -0.00013091601431369781, -0.00012287870049476624, -0.00011484138667583466, -0.00010680407285690308, -9.87667590379715e-05, -9.072944521903992e-05, -8.269213140010834e-05, -7.465481758117676e-05, -6.661750376224518e-05, -5.85801899433136e-05, -5.054287612438202e-05, -4.250556230545044e-05, -3.446824848651886e-05, -2.643093466758728e-05, -1.83936208486557e-05, -1.0356307029724121e-05, -2.3189932107925415e-06, 5.718320608139038e-06, 1.3755634427070618e-05, 2.1792948246002197e-05, 2.9830262064933777e-05, 3.7867575883865356e-05, 4.5904889702796936e-05, 5.3942203521728516e-05, 6.19795173406601e-05, 7.001683115959167e-05, 7.805414497852325e-05, 8.609145879745483e-05, 9.412877261638641e-05, 0.00010216608643531799, 0.00011020340025424957, 0.00011824071407318115, 0.00012627802789211273, 0.0001343153417110443, 0.0001423526555299759, 0.00015038996934890747, 0.00015842728316783905, 0.00016646459698677063, 0.0001745019108057022, 0.0001825392246246338, 0.00019057653844356537, 0.00019861385226249695, 0.00020665116608142853, 0.0002146884799003601, 0.0002227257937192917, 0.00023076310753822327, 0.00023880042135715485, 0.0002468377351760864, 0.000254875048995018, 0.0002629123628139496, 0.00027094967663288116, 0.00027898699045181274, 0.0002870243042707443, 0.0002950616180896759, 0.0003030989319086075, 0.00031113624572753906]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 12.0, 17.0, 24.0, 37.0, 43.0, 83.0, 109.0, 158.0, 232.0, 340.0, 500.0, 727.0, 1038.0, 1526.0, 2483.0, 3754.0, 6155.0, 10440.0, 17877.0, 32690.0, 60087.0, 108852.0, 175784.0, 213301.0, 172608.0, 105094.0, 58427.0, 31708.0, 17327.0, 10101.0, 6087.0, 3734.0, 2395.0, 1488.0, 1046.0, 702.0, 469.0, 319.0, 233.0, 151.0, 118.0, 76.0, 64.0, 42.0, 34.0, 16.0, 15.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.132720947265625, -2.06036376953125, -1.988006591796875, -1.9156494140625, -1.843292236328125, -1.77093505859375, -1.698577880859375, -1.626220703125, -1.553863525390625, -1.48150634765625, -1.409149169921875, -1.3367919921875, -1.264434814453125, -1.19207763671875, -1.119720458984375, -1.04736328125, -0.975006103515625, -0.90264892578125, -0.830291748046875, -0.7579345703125, -0.685577392578125, -0.61322021484375, -0.540863037109375, -0.468505859375, -0.396148681640625, -0.32379150390625, -0.251434326171875, -0.1790771484375, -0.106719970703125, -0.03436279296875, 0.037994384765625, 0.1103515625, 0.182708740234375, 0.25506591796875, 0.327423095703125, 0.3997802734375, 0.472137451171875, 0.54449462890625, 0.616851806640625, 0.689208984375, 0.761566162109375, 0.83392333984375, 0.906280517578125, 0.9786376953125, 1.050994873046875, 1.12335205078125, 1.195709228515625, 1.26806640625, 1.340423583984375, 1.41278076171875, 1.485137939453125, 1.5574951171875, 1.629852294921875, 1.70220947265625, 1.774566650390625, 1.846923828125, 1.919281005859375, 1.99163818359375, 2.063995361328125, 2.1363525390625, 2.208709716796875, 2.28106689453125, 2.353424072265625, 2.42578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 6.0, 10.0, 15.0, 14.0, 14.0, 28.0, 30.0, 28.0, 41.0, 47.0, 55.0, 89.0, 61.0, 77.0, 67.0, 65.0, 54.0, 47.0, 44.0, 44.0, 23.0, 30.0, 17.0, 14.0, 17.0, 10.0, 7.0, 3.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8664016723632812, -0.8397369384765625, -0.8130722045898438, -0.786407470703125, -0.7597427368164062, -0.7330780029296875, -0.7064132690429688, -0.67974853515625, -0.6530838012695312, -0.6264190673828125, -0.5997543334960938, -0.573089599609375, -0.5464248657226562, -0.5197601318359375, -0.49309539794921875, -0.4664306640625, -0.43976593017578125, -0.4131011962890625, -0.38643646240234375, -0.359771728515625, -0.33310699462890625, -0.3064422607421875, -0.27977752685546875, -0.25311279296875, -0.22644805908203125, -0.1997833251953125, -0.17311859130859375, -0.146453857421875, -0.11978912353515625, -0.0931243896484375, -0.06645965576171875, -0.039794921875, -0.01313018798828125, 0.0135345458984375, 0.04019927978515625, 0.066864013671875, 0.09352874755859375, 0.1201934814453125, 0.14685821533203125, 0.17352294921875, 0.20018768310546875, 0.2268524169921875, 0.25351715087890625, 0.280181884765625, 0.30684661865234375, 0.3335113525390625, 0.36017608642578125, 0.3868408203125, 0.41350555419921875, 0.4401702880859375, 0.46683502197265625, 0.493499755859375, 0.5201644897460938, 0.5468292236328125, 0.5734939575195312, 0.60015869140625, 0.6268234252929688, 0.6534881591796875, 0.6801528930664062, 0.706817626953125, 0.7334823608398438, 0.7601470947265625, 0.7868118286132812, 0.8134765625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 16.0, 11.0, 13.0, 17.0, 31.0, 29.0, 35.0, 34.0, 33.0, 43.0, 31.0, 42.0, 48.0, 46.0, 47.0, 55.0, 52.0, 45.0, 47.0, 34.0, 47.0, 24.0, 25.0, 33.0, 31.0, 22.0, 11.0, 22.0, 16.0, 5.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6193525791168213, -2.537788152694702, -2.456223487854004, -2.3746590614318848, -2.2930946350097656, -2.2115302085876465, -2.1299655437469482, -2.048401117324829, -1.96683669090271, -1.8852721452713013, -1.8037077188491821, -1.7221431732177734, -1.6405787467956543, -1.5590142011642456, -1.477449655532837, -1.3958852291107178, -1.314320683479309, -1.2327561378479004, -1.1511917114257812, -1.0696271657943726, -0.9880627393722534, -0.9064981937408447, -0.8249337077140808, -0.7433692216873169, -0.661804735660553, -0.5802402496337891, -0.49867576360702515, -0.41711124777793884, -0.3355467617511749, -0.253982275724411, -0.1724177598953247, -0.09085327386856079, -0.009288787841796875, 0.07227570563554764, 0.15384019911289215, 0.23540470004081726, 0.3169691860675812, 0.3985336720943451, 0.4800981879234314, 0.5616626739501953, 0.6432271599769592, 0.7247916460037231, 0.8063561320304871, 0.887920618057251, 0.9694851636886597, 1.0510495901107788, 1.1326141357421875, 1.2141785621643066, 1.2957431077957153, 1.377307653427124, 1.4588720798492432, 1.5404366254806519, 1.622001051902771, 1.7035655975341797, 1.7851300239562988, 1.8666945695877075, 1.9482591152191162, 2.0298235416412354, 2.1113882064819336, 2.1929526329040527, 2.274517059326172, 2.356081485748291, 2.4376461505889893, 2.5192105770111084, 2.6007750034332275]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 4.0, 11.0, 11.0, 12.0, 13.0, 11.0, 21.0, 13.0, 20.0, 25.0, 30.0, 24.0, 30.0, 28.0, 33.0, 33.0, 34.0, 31.0, 42.0, 34.0, 41.0, 35.0, 43.0, 52.0, 32.0, 39.0, 29.0, 32.0, 29.0, 32.0, 20.0, 31.0, 18.0, 11.0, 12.0, 12.0, 9.0, 8.0, 8.0, 9.0, 5.0, 7.0, 1.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.2677392959594727, -2.201488494873047, -2.135237693786621, -2.0689868927001953, -2.0027360916137695, -1.9364852905273438, -1.870234489440918, -1.8039836883544922, -1.7377328872680664, -1.6714820861816406, -1.6052312850952148, -1.538980484008789, -1.4727296829223633, -1.4064788818359375, -1.3402280807495117, -1.273977279663086, -1.2077263593673706, -1.1414755582809448, -1.075224757194519, -1.0089739561080933, -0.9427231550216675, -0.8764723539352417, -0.8102214932441711, -0.7439706921577454, -0.6777198910713196, -0.6114690899848938, -0.545218288898468, -0.47896745800971985, -0.41271665692329407, -0.3464658558368683, -0.2802150249481201, -0.21396422386169434, -0.147713303565979, -0.08146249502897263, -0.015211686491966248, 0.05103912949562073, 0.11728993058204651, 0.1835407316684723, 0.24979156255722046, 0.31604236364364624, 0.382293164730072, 0.4485439658164978, 0.5147947669029236, 0.5810456275939941, 0.6472964286804199, 0.7135472297668457, 0.7797980308532715, 0.8460488319396973, 0.912299633026123, 0.9785504341125488, 1.0448012351989746, 1.1110520362854004, 1.1773028373718262, 1.243553638458252, 1.3098044395446777, 1.3760552406311035, 1.4423060417175293, 1.508556842803955, 1.5748076438903809, 1.6410584449768066, 1.7073092460632324, 1.7735600471496582, 1.839810848236084, 1.9060616493225098, 1.972312569618225]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 11.0, 17.0, 27.0, 29.0, 62.0, 97.0, 121.0, 240.0, 347.0, 570.0, 910.0, 1470.0, 2229.0, 3561.0, 5886.0, 9420.0, 15350.0, 24762.0, 39929.0, 63640.0, 100979.0, 155739.0, 235136.0, 336935.0, 446928.0, 529459.0, 548992.0, 491119.0, 387947.0, 277860.0, 187169.0, 121414.0, 77488.0, 48558.0, 30053.0, 18491.0, 11992.0, 7183.0, 4417.0, 2896.0, 1747.0, 1111.0, 720.0, 448.0, 292.0, 170.0, 143.0, 85.0, 47.0, 30.0, 20.0, 14.0, 10.0, 5.0, 13.0, 1.0, 1.0, 2.0], "bins": [-1.78125, -1.7259368896484375, -1.670623779296875, -1.6153106689453125, -1.55999755859375, -1.5046844482421875, -1.449371337890625, -1.3940582275390625, -1.3387451171875, -1.2834320068359375, -1.228118896484375, -1.1728057861328125, -1.11749267578125, -1.0621795654296875, -1.006866455078125, -0.9515533447265625, -0.896240234375, -0.8409271240234375, -0.785614013671875, -0.7303009033203125, -0.67498779296875, -0.6196746826171875, -0.564361572265625, -0.5090484619140625, -0.4537353515625, -0.3984222412109375, -0.343109130859375, -0.2877960205078125, -0.23248291015625, -0.1771697998046875, -0.121856689453125, -0.0665435791015625, -0.01123046875, 0.0440826416015625, 0.099395751953125, 0.1547088623046875, 0.21002197265625, 0.2653350830078125, 0.320648193359375, 0.3759613037109375, 0.4312744140625, 0.4865875244140625, 0.541900634765625, 0.5972137451171875, 0.65252685546875, 0.7078399658203125, 0.763153076171875, 0.8184661865234375, 0.873779296875, 0.9290924072265625, 0.984405517578125, 1.0397186279296875, 1.09503173828125, 1.1503448486328125, 1.205657958984375, 1.2609710693359375, 1.3162841796875, 1.3715972900390625, 1.426910400390625, 1.4822235107421875, 1.53753662109375, 1.5928497314453125, 1.648162841796875, 1.7034759521484375, 1.7587890625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 13.0, 11.0, 13.0, 9.0, 19.0, 13.0, 25.0, 22.0, 32.0, 30.0, 30.0, 37.0, 30.0, 33.0, 45.0, 54.0, 43.0, 51.0, 43.0, 44.0, 41.0, 41.0, 51.0, 33.0, 28.0, 29.0, 30.0, 22.0, 25.0, 18.0, 13.0, 8.0, 14.0, 6.0, 10.0, 3.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9931640625, -1.9395599365234375, -1.885955810546875, -1.8323516845703125, -1.77874755859375, -1.7251434326171875, -1.671539306640625, -1.6179351806640625, -1.5643310546875, -1.5107269287109375, -1.457122802734375, -1.4035186767578125, -1.34991455078125, -1.2963104248046875, -1.242706298828125, -1.1891021728515625, -1.135498046875, -1.0818939208984375, -1.028289794921875, -0.9746856689453125, -0.92108154296875, -0.8674774169921875, -0.813873291015625, -0.7602691650390625, -0.7066650390625, -0.6530609130859375, -0.599456787109375, -0.5458526611328125, -0.49224853515625, -0.4386444091796875, -0.385040283203125, -0.3314361572265625, -0.27783203125, -0.2242279052734375, -0.170623779296875, -0.1170196533203125, -0.06341552734375, -0.0098114013671875, 0.043792724609375, 0.0973968505859375, 0.1510009765625, 0.2046051025390625, 0.258209228515625, 0.3118133544921875, 0.36541748046875, 0.4190216064453125, 0.472625732421875, 0.5262298583984375, 0.579833984375, 0.6334381103515625, 0.687042236328125, 0.7406463623046875, 0.79425048828125, 0.8478546142578125, 0.901458740234375, 0.9550628662109375, 1.0086669921875, 1.0622711181640625, 1.115875244140625, 1.1694793701171875, 1.22308349609375, 1.2766876220703125, 1.330291748046875, 1.3838958740234375, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 14.0, 18.0, 31.0, 43.0, 97.0, 110.0, 204.0, 326.0, 611.0, 993.0, 1628.0, 2723.0, 4560.0, 8034.0, 13451.0, 22727.0, 37434.0, 61894.0, 99186.0, 154213.0, 229733.0, 323447.0, 422384.0, 499957.0, 524608.0, 487044.0, 404648.0, 305777.0, 213974.0, 142143.0, 90702.0, 56274.0, 34481.0, 20740.0, 12222.0, 7384.0, 4226.0, 2523.0, 1455.0, 885.0, 548.0, 318.0, 183.0, 132.0, 69.0, 42.0, 35.0, 20.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6689453125, -1.6140594482421875, -1.559173583984375, -1.5042877197265625, -1.44940185546875, -1.3945159912109375, -1.339630126953125, -1.2847442626953125, -1.2298583984375, -1.1749725341796875, -1.120086669921875, -1.0652008056640625, -1.01031494140625, -0.9554290771484375, -0.900543212890625, -0.8456573486328125, -0.790771484375, -0.7358856201171875, -0.680999755859375, -0.6261138916015625, -0.57122802734375, -0.5163421630859375, -0.461456298828125, -0.4065704345703125, -0.3516845703125, -0.2967987060546875, -0.241912841796875, -0.1870269775390625, -0.13214111328125, -0.0772552490234375, -0.022369384765625, 0.0325164794921875, 0.08740234375, 0.1422882080078125, 0.197174072265625, 0.2520599365234375, 0.30694580078125, 0.3618316650390625, 0.416717529296875, 0.4716033935546875, 0.5264892578125, 0.5813751220703125, 0.636260986328125, 0.6911468505859375, 0.74603271484375, 0.8009185791015625, 0.855804443359375, 0.9106903076171875, 0.965576171875, 1.0204620361328125, 1.075347900390625, 1.1302337646484375, 1.18511962890625, 1.2400054931640625, 1.294891357421875, 1.3497772216796875, 1.4046630859375, 1.4595489501953125, 1.514434814453125, 1.5693206787109375, 1.62420654296875, 1.6790924072265625, 1.733978271484375, 1.7888641357421875, 1.84375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 11.0, 22.0, 21.0, 27.0, 27.0, 31.0, 52.0, 51.0, 75.0, 91.0, 83.0, 112.0, 130.0, 118.0, 152.0, 163.0, 176.0, 203.0, 191.0, 216.0, 231.0, 201.0, 204.0, 192.0, 181.0, 172.0, 140.0, 123.0, 115.0, 103.0, 74.0, 80.0, 57.0, 43.0, 47.0, 35.0, 27.0, 23.0, 13.0, 10.0, 5.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7119140625, -0.6884918212890625, -0.665069580078125, -0.6416473388671875, -0.61822509765625, -0.5948028564453125, -0.571380615234375, -0.5479583740234375, -0.5245361328125, -0.5011138916015625, -0.477691650390625, -0.4542694091796875, -0.43084716796875, -0.4074249267578125, -0.384002685546875, -0.3605804443359375, -0.337158203125, -0.3137359619140625, -0.290313720703125, -0.2668914794921875, -0.24346923828125, -0.2200469970703125, -0.196624755859375, -0.1732025146484375, -0.1497802734375, -0.1263580322265625, -0.102935791015625, -0.0795135498046875, -0.05609130859375, -0.0326690673828125, -0.009246826171875, 0.0141754150390625, 0.03759765625, 0.0610198974609375, 0.084442138671875, 0.1078643798828125, 0.13128662109375, 0.1547088623046875, 0.178131103515625, 0.2015533447265625, 0.2249755859375, 0.2483978271484375, 0.271820068359375, 0.2952423095703125, 0.31866455078125, 0.3420867919921875, 0.365509033203125, 0.3889312744140625, 0.412353515625, 0.4357757568359375, 0.459197998046875, 0.4826202392578125, 0.50604248046875, 0.5294647216796875, 0.552886962890625, 0.5763092041015625, 0.5997314453125, 0.6231536865234375, 0.646575927734375, 0.6699981689453125, 0.69342041015625, 0.7168426513671875, 0.740264892578125, 0.7636871337890625, 0.787109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 8.0, 6.0, 10.0, 9.0, 17.0, 16.0, 27.0, 31.0, 34.0, 30.0, 59.0, 60.0, 63.0, 60.0, 69.0, 70.0, 62.0, 38.0, 42.0, 43.0, 56.0, 33.0, 33.0, 22.0, 31.0, 24.0, 20.0, 7.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.988922595977783, -2.9013919830322266, -2.813861131668091, -2.726330518722534, -2.6387999057769775, -2.551269054412842, -2.463738441467285, -2.3762078285217285, -2.288677215576172, -2.2011466026306152, -2.1136157512664795, -2.026085138320923, -1.9385545253753662, -1.85102379322052, -1.7634930610656738, -1.6759624481201172, -1.5884315967559814, -1.5009008646011353, -1.4133702516555786, -1.3258395195007324, -1.2383089065551758, -1.1507781744003296, -1.0632474422454834, -0.975716769695282, -0.8881860971450806, -0.8006554245948792, -0.7131247520446777, -0.6255940198898315, -0.5380633473396301, -0.4505326747894287, -0.3630019426345825, -0.2754712700843811, -0.1879405975341797, -0.10040991008281708, -0.012879222631454468, 0.07465147972106934, 0.16218215227127075, 0.24971282482147217, 0.33724355697631836, 0.4247742295265198, 0.5123049020767212, 0.5998355746269226, 0.687366247177124, 0.7748969793319702, 0.8624276518821716, 0.949958324432373, 1.0374890565872192, 1.1250197887420654, 1.212550401687622, 1.3000811338424683, 1.387611746788025, 1.475142478942871, 1.5626730918884277, 1.650203824043274, 1.7377345561981201, 1.8252651691436768, 1.912795901298523, 2.000326633453369, 2.087857246398926, 2.1753878593444824, 2.262918710708618, 2.350449323654175, 2.4379801750183105, 2.525510787963867, 2.613041400909424]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 8.0, 6.0, 10.0, 11.0, 14.0, 15.0, 16.0, 15.0, 18.0, 28.0, 24.0, 21.0, 29.0, 31.0, 33.0, 34.0, 39.0, 34.0, 40.0, 30.0, 46.0, 30.0, 38.0, 35.0, 37.0, 26.0, 30.0, 30.0, 21.0, 24.0, 31.0, 21.0, 16.0, 21.0, 18.0, 14.0, 15.0, 13.0, 12.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.6044965982437134, -1.5532957315444946, -1.5020948648452759, -1.4508939981460571, -1.3996931314468384, -1.3484922647476196, -1.2972913980484009, -1.2460905313491821, -1.1948896646499634, -1.1436887979507446, -1.0924879312515259, -1.0412870645523071, -0.9900861978530884, -0.9388853311538696, -0.8876844644546509, -0.8364835977554321, -0.7852827310562134, -0.7340818643569946, -0.6828809976577759, -0.6316801309585571, -0.5804792642593384, -0.5292783975601196, -0.4780775308609009, -0.42687666416168213, -0.3756757974624634, -0.32447493076324463, -0.2732740640640259, -0.22207319736480713, -0.17087233066558838, -0.11967146396636963, -0.06847059726715088, -0.01726973056793213, 0.03393101692199707, 0.08513188362121582, 0.13633275032043457, 0.18753361701965332, 0.23873448371887207, 0.2899353504180908, 0.34113621711730957, 0.3923370838165283, 0.44353795051574707, 0.4947388172149658, 0.5459396839141846, 0.5971405506134033, 0.6483414173126221, 0.6995422840118408, 0.7507431507110596, 0.8019440174102783, 0.8531448841094971, 0.9043457508087158, 0.9555466175079346, 1.0067474842071533, 1.057948350906372, 1.1091492176055908, 1.1603500843048096, 1.2115509510040283, 1.262751817703247, 1.3139526844024658, 1.3651535511016846, 1.4163544178009033, 1.467555284500122, 1.5187561511993408, 1.5699570178985596, 1.6211578845977783, 1.672358751296997]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 28.0, 18.0, 40.0, 55.0, 76.0, 81.0, 137.0, 178.0, 266.0, 399.0, 557.0, 779.0, 1109.0, 1719.0, 2903.0, 5997.0, 17535.0, 72549.0, 313259.0, 452580.0, 130021.0, 29278.0, 8687.0, 3818.0, 2127.0, 1303.0, 860.0, 690.0, 394.0, 329.0, 229.0, 160.0, 97.0, 80.0, 55.0, 37.0, 33.0, 20.0, 16.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.939453125, -2.84814453125, -2.7568359375, -2.66552734375, -2.57421875, -2.48291015625, -2.3916015625, -2.30029296875, -2.208984375, -2.11767578125, -2.0263671875, -1.93505859375, -1.84375, -1.75244140625, -1.6611328125, -1.56982421875, -1.478515625, -1.38720703125, -1.2958984375, -1.20458984375, -1.11328125, -1.02197265625, -0.9306640625, -0.83935546875, -0.748046875, -0.65673828125, -0.5654296875, -0.47412109375, -0.3828125, -0.29150390625, -0.2001953125, -0.10888671875, -0.017578125, 0.07373046875, 0.1650390625, 0.25634765625, 0.34765625, 0.43896484375, 0.5302734375, 0.62158203125, 0.712890625, 0.80419921875, 0.8955078125, 0.98681640625, 1.078125, 1.16943359375, 1.2607421875, 1.35205078125, 1.443359375, 1.53466796875, 1.6259765625, 1.71728515625, 1.80859375, 1.89990234375, 1.9912109375, 2.08251953125, 2.173828125, 2.26513671875, 2.3564453125, 2.44775390625, 2.5390625, 2.63037109375, 2.7216796875, 2.81298828125, 2.904296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 8.0, 12.0, 7.0, 12.0, 17.0, 17.0, 17.0, 23.0, 26.0, 22.0, 39.0, 28.0, 34.0, 35.0, 39.0, 33.0, 31.0, 29.0, 38.0, 47.0, 34.0, 46.0, 44.0, 31.0, 28.0, 32.0, 30.0, 31.0, 25.0, 18.0, 19.0, 24.0, 28.0, 19.0, 8.0, 7.0, 11.0, 3.0, 7.0, 7.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7255859375, -1.6685028076171875, -1.611419677734375, -1.5543365478515625, -1.49725341796875, -1.4401702880859375, -1.383087158203125, -1.3260040283203125, -1.2689208984375, -1.2118377685546875, -1.154754638671875, -1.0976715087890625, -1.04058837890625, -0.9835052490234375, -0.926422119140625, -0.8693389892578125, -0.812255859375, -0.7551727294921875, -0.698089599609375, -0.6410064697265625, -0.58392333984375, -0.5268402099609375, -0.469757080078125, -0.4126739501953125, -0.3555908203125, -0.2985076904296875, -0.241424560546875, -0.1843414306640625, -0.12725830078125, -0.0701751708984375, -0.013092041015625, 0.0439910888671875, 0.10107421875, 0.1581573486328125, 0.215240478515625, 0.2723236083984375, 0.32940673828125, 0.3864898681640625, 0.443572998046875, 0.5006561279296875, 0.5577392578125, 0.6148223876953125, 0.671905517578125, 0.7289886474609375, 0.78607177734375, 0.8431549072265625, 0.900238037109375, 0.9573211669921875, 1.014404296875, 1.0714874267578125, 1.128570556640625, 1.1856536865234375, 1.24273681640625, 1.2998199462890625, 1.356903076171875, 1.4139862060546875, 1.4710693359375, 1.5281524658203125, 1.585235595703125, 1.6423187255859375, 1.69940185546875, 1.7564849853515625, 1.813568115234375, 1.8706512451171875, 1.927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 16.0, 17.0, 22.0, 29.0, 42.0, 51.0, 71.0, 94.0, 128.0, 167.0, 199.0, 293.0, 417.0, 628.0, 1095.0, 1970.0, 4683.0, 12812.0, 41546.0, 155245.0, 454129.0, 270118.0, 70632.0, 20574.0, 6905.0, 2748.0, 1354.0, 739.0, 480.0, 340.0, 235.0, 168.0, 150.0, 129.0, 75.0, 53.0, 50.0, 34.0, 18.0, 20.0, 20.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.1875, -2.113861083984375, -2.04022216796875, -1.966583251953125, -1.8929443359375, -1.819305419921875, -1.74566650390625, -1.672027587890625, -1.598388671875, -1.524749755859375, -1.45111083984375, -1.377471923828125, -1.3038330078125, -1.230194091796875, -1.15655517578125, -1.082916259765625, -1.00927734375, -0.935638427734375, -0.86199951171875, -0.788360595703125, -0.7147216796875, -0.641082763671875, -0.56744384765625, -0.493804931640625, -0.420166015625, -0.346527099609375, -0.27288818359375, -0.199249267578125, -0.1256103515625, -0.051971435546875, 0.02166748046875, 0.095306396484375, 0.1689453125, 0.242584228515625, 0.31622314453125, 0.389862060546875, 0.4635009765625, 0.537139892578125, 0.61077880859375, 0.684417724609375, 0.758056640625, 0.831695556640625, 0.90533447265625, 0.978973388671875, 1.0526123046875, 1.126251220703125, 1.19989013671875, 1.273529052734375, 1.34716796875, 1.420806884765625, 1.49444580078125, 1.568084716796875, 1.6417236328125, 1.715362548828125, 1.78900146484375, 1.862640380859375, 1.936279296875, 2.009918212890625, 2.08355712890625, 2.157196044921875, 2.2308349609375, 2.304473876953125, 2.37811279296875, 2.451751708984375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 7.0, 13.0, 16.0, 8.0, 8.0, 23.0, 11.0, 20.0, 19.0, 30.0, 28.0, 32.0, 26.0, 26.0, 38.0, 27.0, 41.0, 45.0, 42.0, 46.0, 41.0, 42.0, 45.0, 29.0, 36.0, 30.0, 32.0, 23.0, 24.0, 37.0, 21.0, 20.0, 15.0, 15.0, 18.0, 6.0, 14.0, 6.0, 12.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.072052001953125, -1.03472900390625, -0.997406005859375, -0.9600830078125, -0.922760009765625, -0.88543701171875, -0.848114013671875, -0.810791015625, -0.773468017578125, -0.73614501953125, -0.698822021484375, -0.6614990234375, -0.624176025390625, -0.58685302734375, -0.549530029296875, -0.51220703125, -0.474884033203125, -0.43756103515625, -0.400238037109375, -0.3629150390625, -0.325592041015625, -0.28826904296875, -0.250946044921875, -0.213623046875, -0.176300048828125, -0.13897705078125, -0.101654052734375, -0.0643310546875, -0.027008056640625, 0.01031494140625, 0.047637939453125, 0.0849609375, 0.122283935546875, 0.15960693359375, 0.196929931640625, 0.2342529296875, 0.271575927734375, 0.30889892578125, 0.346221923828125, 0.383544921875, 0.420867919921875, 0.45819091796875, 0.495513916015625, 0.5328369140625, 0.570159912109375, 0.60748291015625, 0.644805908203125, 0.68212890625, 0.719451904296875, 0.75677490234375, 0.794097900390625, 0.8314208984375, 0.868743896484375, 0.90606689453125, 0.943389892578125, 0.980712890625, 1.018035888671875, 1.05535888671875, 1.092681884765625, 1.1300048828125, 1.167327880859375, 1.20465087890625, 1.241973876953125, 1.279296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 9.0, 10.0, 12.0, 17.0, 25.0, 30.0, 53.0, 68.0, 118.0, 139.0, 197.0, 278.0, 422.0, 618.0, 959.0, 1456.0, 2382.0, 4098.0, 8088.0, 18773.0, 58960.0, 243558.0, 485528.0, 153105.0, 39866.0, 14057.0, 6401.0, 3440.0, 2025.0, 1266.0, 841.0, 496.0, 375.0, 259.0, 150.0, 113.0, 109.0, 61.0, 42.0, 29.0, 28.0, 26.0, 13.0, 12.0, 12.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.70556640625, -0.68231201171875, -0.6590576171875, -0.63580322265625, -0.612548828125, -0.58929443359375, -0.5660400390625, -0.54278564453125, -0.51953125, -0.49627685546875, -0.4730224609375, -0.44976806640625, -0.426513671875, -0.40325927734375, -0.3800048828125, -0.35675048828125, -0.33349609375, -0.31024169921875, -0.2869873046875, -0.26373291015625, -0.240478515625, -0.21722412109375, -0.1939697265625, -0.17071533203125, -0.1474609375, -0.12420654296875, -0.1009521484375, -0.07769775390625, -0.054443359375, -0.03118896484375, -0.0079345703125, 0.01531982421875, 0.03857421875, 0.06182861328125, 0.0850830078125, 0.10833740234375, 0.131591796875, 0.15484619140625, 0.1781005859375, 0.20135498046875, 0.224609375, 0.24786376953125, 0.2711181640625, 0.29437255859375, 0.317626953125, 0.34088134765625, 0.3641357421875, 0.38739013671875, 0.41064453125, 0.43389892578125, 0.4571533203125, 0.48040771484375, 0.503662109375, 0.52691650390625, 0.5501708984375, 0.57342529296875, 0.5966796875, 0.61993408203125, 0.6431884765625, 0.66644287109375, 0.689697265625, 0.71295166015625, 0.7362060546875, 0.75946044921875, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 19.0, 34.0, 36.0, 59.0, 111.0, 151.0, 139.0, 136.0, 99.0, 74.0, 33.0, 25.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.861852645874023e-05, -7.612258195877075e-05, -7.362663745880127e-05, -7.113069295883179e-05, -6.86347484588623e-05, -6.613880395889282e-05, -6.364285945892334e-05, -6.114691495895386e-05, -5.8650970458984375e-05, -5.615502595901489e-05, -5.365908145904541e-05, -5.116313695907593e-05, -4.8667192459106445e-05, -4.617124795913696e-05, -4.367530345916748e-05, -4.1179358959198e-05, -3.8683414459228516e-05, -3.618746995925903e-05, -3.369152545928955e-05, -3.119558095932007e-05, -2.8699636459350586e-05, -2.6203691959381104e-05, -2.370774745941162e-05, -2.121180295944214e-05, -1.8715858459472656e-05, -1.6219913959503174e-05, -1.3723969459533691e-05, -1.1228024959564209e-05, -8.732080459594727e-06, -6.236135959625244e-06, -3.7401914596557617e-06, -1.2442469596862793e-06, 1.2516975402832031e-06, 3.7476420402526855e-06, 6.243586540222168e-06, 8.73953104019165e-06, 1.1235475540161133e-05, 1.3731420040130615e-05, 1.6227364540100098e-05, 1.872330904006958e-05, 2.1219253540039062e-05, 2.3715198040008545e-05, 2.6211142539978027e-05, 2.870708703994751e-05, 3.120303153991699e-05, 3.3698976039886475e-05, 3.619492053985596e-05, 3.869086503982544e-05, 4.118680953979492e-05, 4.3682754039764404e-05, 4.617869853973389e-05, 4.867464303970337e-05, 5.117058753967285e-05, 5.3666532039642334e-05, 5.6162476539611816e-05, 5.86584210395813e-05, 6.115436553955078e-05, 6.365031003952026e-05, 6.614625453948975e-05, 6.864219903945923e-05, 7.113814353942871e-05, 7.36340880393982e-05, 7.613003253936768e-05, 7.862597703933716e-05, 8.112192153930664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 3.0, 10.0, 25.0, 30.0, 54.0, 57.0, 88.0, 128.0, 172.0, 250.0, 389.0, 580.0, 783.0, 1313.0, 1985.0, 3159.0, 5028.0, 8559.0, 15204.0, 28684.0, 57454.0, 115493.0, 211057.0, 252402.0, 166083.0, 85360.0, 42431.0, 21734.0, 11677.0, 6845.0, 4109.0, 2504.0, 1643.0, 1078.0, 689.0, 489.0, 309.0, 196.0, 145.0, 126.0, 71.0, 51.0, 30.0, 16.0, 15.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.58349609375, -0.5659637451171875, -0.548431396484375, -0.5308990478515625, -0.51336669921875, -0.4958343505859375, -0.478302001953125, -0.4607696533203125, -0.4432373046875, -0.4257049560546875, -0.408172607421875, -0.3906402587890625, -0.37310791015625, -0.3555755615234375, -0.338043212890625, -0.3205108642578125, -0.302978515625, -0.2854461669921875, -0.267913818359375, -0.2503814697265625, -0.23284912109375, -0.2153167724609375, -0.197784423828125, -0.1802520751953125, -0.1627197265625, -0.1451873779296875, -0.127655029296875, -0.1101226806640625, -0.09259033203125, -0.0750579833984375, -0.057525634765625, -0.0399932861328125, -0.0224609375, -0.0049285888671875, 0.012603759765625, 0.0301361083984375, 0.04766845703125, 0.0652008056640625, 0.082733154296875, 0.1002655029296875, 0.1177978515625, 0.1353302001953125, 0.152862548828125, 0.1703948974609375, 0.18792724609375, 0.2054595947265625, 0.222991943359375, 0.2405242919921875, 0.258056640625, 0.2755889892578125, 0.293121337890625, 0.3106536865234375, 0.32818603515625, 0.3457183837890625, 0.363250732421875, 0.3807830810546875, 0.3983154296875, 0.4158477783203125, 0.433380126953125, 0.4509124755859375, 0.46844482421875, 0.4859771728515625, 0.503509521484375, 0.5210418701171875, 0.53857421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 18.0, 17.0, 33.0, 52.0, 47.0, 93.0, 141.0, 148.0, 135.0, 88.0, 67.0, 48.0, 24.0, 25.0, 13.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.285369873046875, -0.27630615234375, -0.267242431640625, -0.2581787109375, -0.249114990234375, -0.24005126953125, -0.230987548828125, -0.221923828125, -0.212860107421875, -0.20379638671875, -0.194732666015625, -0.1856689453125, -0.176605224609375, -0.16754150390625, -0.158477783203125, -0.1494140625, -0.140350341796875, -0.13128662109375, -0.122222900390625, -0.1131591796875, -0.104095458984375, -0.09503173828125, -0.085968017578125, -0.076904296875, -0.067840576171875, -0.05877685546875, -0.049713134765625, -0.0406494140625, -0.031585693359375, -0.02252197265625, -0.013458251953125, -0.00439453125, 0.004669189453125, 0.01373291015625, 0.022796630859375, 0.0318603515625, 0.040924072265625, 0.04998779296875, 0.059051513671875, 0.068115234375, 0.077178955078125, 0.08624267578125, 0.095306396484375, 0.1043701171875, 0.113433837890625, 0.12249755859375, 0.131561279296875, 0.140625, 0.149688720703125, 0.15875244140625, 0.167816162109375, 0.1768798828125, 0.185943603515625, 0.19500732421875, 0.204071044921875, 0.213134765625, 0.222198486328125, 0.23126220703125, 0.240325927734375, 0.2493896484375, 0.258453369140625, 0.26751708984375, 0.276580810546875, 0.28564453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 14.0, 25.0, 18.0, 26.0, 32.0, 33.0, 50.0, 49.0, 60.0, 69.0, 62.0, 68.0, 49.0, 51.0, 47.0, 47.0, 52.0, 45.0, 43.0, 28.0, 19.0, 29.0, 16.0, 16.0, 9.0, 5.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.003823757171631, -2.9175076484680176, -2.8311917781829834, -2.74487566947937, -2.658559560775757, -2.5722436904907227, -2.4859275817871094, -2.399611473083496, -2.313295364379883, -2.2269792556762695, -2.1406633853912354, -2.054347276687622, -1.9680311679840088, -1.881715178489685, -1.7953991889953613, -1.709083080291748, -1.6227672100067139, -1.5364512205123901, -1.4501351118087769, -1.3638191223144531, -1.2775030136108398, -1.1911870241165161, -1.1048710346221924, -1.018554925918579, -0.9322389364242554, -0.8459228873252869, -0.7596068382263184, -0.6732908487319946, -0.5869747996330261, -0.5006587505340576, -0.4143427610397339, -0.3280267119407654, -0.24171066284179688, -0.15539462864398956, -0.06907859444618225, 0.017237424850463867, 0.10355347394943237, 0.18986952304840088, 0.2761855125427246, 0.3625015616416931, 0.4488176107406616, 0.5351336598396301, 0.6214497089385986, 0.7077656984329224, 0.7940817475318909, 0.8803977966308594, 0.9667137861251831, 1.0530297756195068, 1.1393458843231201, 1.2256618738174438, 1.3119779825210571, 1.3982939720153809, 1.4846100807189941, 1.5709260702133179, 1.6572420597076416, 1.7435581684112549, 1.8298741579055786, 1.9161901473999023, 2.0025062561035156, 2.088822364807129, 2.175138235092163, 2.2614543437957764, 2.3477702140808105, 2.434086322784424, 2.520402431488037]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 8.0, 8.0, 8.0, 15.0, 16.0, 12.0, 13.0, 16.0, 18.0, 19.0, 29.0, 24.0, 26.0, 27.0, 28.0, 37.0, 37.0, 46.0, 30.0, 41.0, 30.0, 37.0, 38.0, 38.0, 41.0, 17.0, 38.0, 24.0, 30.0, 22.0, 23.0, 21.0, 26.0, 16.0, 22.0, 12.0, 15.0, 12.0, 17.0, 4.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5719082355499268, -1.5209792852401733, -1.4700504541397095, -1.419121503829956, -1.3681925535202026, -1.3172636032104492, -1.2663347721099854, -1.215405821800232, -1.1644768714904785, -1.113547921180725, -1.0626190900802612, -1.0116901397705078, -0.9607611894607544, -0.9098322987556458, -0.8589034080505371, -0.8079744577407837, -0.7570456266403198, -0.7061167359352112, -0.6551877856254578, -0.6042588949203491, -0.5533299446105957, -0.5024010539054871, -0.4514721632003784, -0.4005432426929474, -0.34961432218551636, -0.2986854016780853, -0.2477564960718155, -0.19682759046554565, -0.14589866995811462, -0.0949697494506836, -0.04404085874557495, 0.006888061761856079, 0.05781710147857666, 0.1087460145354271, 0.15967492759227753, 0.21060383319854736, 0.2615327537059784, 0.3124616742134094, 0.36339056491851807, 0.4143194854259491, 0.4652484059333801, 0.5161772966384888, 0.5671062469482422, 0.6180351376533508, 0.6689640283584595, 0.7198929786682129, 0.7708218693733215, 0.8217507600784302, 0.8726797103881836, 0.9236086010932922, 0.9745375514030457, 1.0254664421081543, 1.0763953924179077, 1.1273243427276611, 1.178253173828125, 1.2291821241378784, 1.2801110744476318, 1.3310400247573853, 1.3819688558578491, 1.4328978061676025, 1.483826756477356, 1.5347557067871094, 1.5856845378875732, 1.6366134881973267, 1.6875423192977905]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 12.0, 23.0, 21.0, 36.0, 46.0, 68.0, 86.0, 141.0, 189.0, 324.0, 470.0, 663.0, 1151.0, 1766.0, 2768.0, 4536.0, 7436.0, 12099.0, 19240.0, 31222.0, 48183.0, 70618.0, 96769.0, 120000.0, 133898.0, 129632.0, 111419.0, 86059.0, 61073.0, 40393.0, 25955.0, 16270.0, 9791.0, 5963.0, 3684.0, 2295.0, 1468.0, 935.0, 576.0, 415.0, 255.0, 177.0, 120.0, 100.0, 71.0, 41.0, 34.0, 27.0, 12.0, 5.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.0078125, -1.944671630859375, -1.88153076171875, -1.818389892578125, -1.7552490234375, -1.692108154296875, -1.62896728515625, -1.565826416015625, -1.502685546875, -1.439544677734375, -1.37640380859375, -1.313262939453125, -1.2501220703125, -1.186981201171875, -1.12384033203125, -1.060699462890625, -0.99755859375, -0.934417724609375, -0.87127685546875, -0.808135986328125, -0.7449951171875, -0.681854248046875, -0.61871337890625, -0.555572509765625, -0.492431640625, -0.429290771484375, -0.36614990234375, -0.303009033203125, -0.2398681640625, -0.176727294921875, -0.11358642578125, -0.050445556640625, 0.0126953125, 0.075836181640625, 0.13897705078125, 0.202117919921875, 0.2652587890625, 0.328399658203125, 0.39154052734375, 0.454681396484375, 0.517822265625, 0.580963134765625, 0.64410400390625, 0.707244873046875, 0.7703857421875, 0.833526611328125, 0.89666748046875, 0.959808349609375, 1.02294921875, 1.086090087890625, 1.14923095703125, 1.212371826171875, 1.2755126953125, 1.338653564453125, 1.40179443359375, 1.464935302734375, 1.528076171875, 1.591217041015625, 1.65435791015625, 1.717498779296875, 1.7806396484375, 1.843780517578125, 1.90692138671875, 1.970062255859375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 8.0, 8.0, 13.0, 11.0, 8.0, 12.0, 19.0, 15.0, 19.0, 14.0, 23.0, 32.0, 27.0, 36.0, 29.0, 40.0, 37.0, 30.0, 37.0, 41.0, 35.0, 33.0, 43.0, 32.0, 29.0, 25.0, 39.0, 27.0, 21.0, 25.0, 28.0, 26.0, 23.0, 20.0, 20.0, 14.0, 16.0, 15.0, 12.0, 9.0, 9.0, 7.0, 1.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.716796875, -1.66448974609375, -1.6121826171875, -1.55987548828125, -1.507568359375, -1.45526123046875, -1.4029541015625, -1.35064697265625, -1.29833984375, -1.24603271484375, -1.1937255859375, -1.14141845703125, -1.089111328125, -1.03680419921875, -0.9844970703125, -0.93218994140625, -0.8798828125, -0.82757568359375, -0.7752685546875, -0.72296142578125, -0.670654296875, -0.61834716796875, -0.5660400390625, -0.51373291015625, -0.46142578125, -0.40911865234375, -0.3568115234375, -0.30450439453125, -0.252197265625, -0.19989013671875, -0.1475830078125, -0.09527587890625, -0.04296875, 0.00933837890625, 0.0616455078125, 0.11395263671875, 0.166259765625, 0.21856689453125, 0.2708740234375, 0.32318115234375, 0.37548828125, 0.42779541015625, 0.4801025390625, 0.53240966796875, 0.584716796875, 0.63702392578125, 0.6893310546875, 0.74163818359375, 0.7939453125, 0.84625244140625, 0.8985595703125, 0.95086669921875, 1.003173828125, 1.05548095703125, 1.1077880859375, 1.16009521484375, 1.21240234375, 1.26470947265625, 1.3170166015625, 1.36932373046875, 1.421630859375, 1.47393798828125, 1.5262451171875, 1.57855224609375, 1.630859375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 9.0, 11.0, 14.0, 17.0, 40.0, 86.0, 105.0, 167.0, 279.0, 422.0, 730.0, 1154.0, 2061.0, 3396.0, 5667.0, 9379.0, 15524.0, 25357.0, 40040.0, 60773.0, 86530.0, 113300.0, 132039.0, 134892.0, 121972.0, 98041.0, 70846.0, 47234.0, 30604.0, 19060.0, 11476.0, 6904.0, 4156.0, 2483.0, 1509.0, 840.0, 532.0, 378.0, 210.0, 125.0, 64.0, 49.0, 37.0, 27.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.818359375, -1.758148193359375, -1.69793701171875, -1.637725830078125, -1.5775146484375, -1.517303466796875, -1.45709228515625, -1.396881103515625, -1.336669921875, -1.276458740234375, -1.21624755859375, -1.156036376953125, -1.0958251953125, -1.035614013671875, -0.97540283203125, -0.915191650390625, -0.85498046875, -0.794769287109375, -0.73455810546875, -0.674346923828125, -0.6141357421875, -0.553924560546875, -0.49371337890625, -0.433502197265625, -0.373291015625, -0.313079833984375, -0.25286865234375, -0.192657470703125, -0.1324462890625, -0.072235107421875, -0.01202392578125, 0.048187255859375, 0.1083984375, 0.168609619140625, 0.22882080078125, 0.289031982421875, 0.3492431640625, 0.409454345703125, 0.46966552734375, 0.529876708984375, 0.590087890625, 0.650299072265625, 0.71051025390625, 0.770721435546875, 0.8309326171875, 0.891143798828125, 0.95135498046875, 1.011566162109375, 1.07177734375, 1.131988525390625, 1.19219970703125, 1.252410888671875, 1.3126220703125, 1.372833251953125, 1.43304443359375, 1.493255615234375, 1.553466796875, 1.613677978515625, 1.67388916015625, 1.734100341796875, 1.7943115234375, 1.854522705078125, 1.91473388671875, 1.974945068359375, 2.03515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 4.0, 12.0, 13.0, 11.0, 26.0, 24.0, 23.0, 23.0, 28.0, 30.0, 42.0, 37.0, 32.0, 40.0, 35.0, 30.0, 46.0, 40.0, 45.0, 40.0, 40.0, 35.0, 41.0, 36.0, 28.0, 43.0, 41.0, 24.0, 26.0, 26.0, 7.0, 16.0, 11.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1051483154296875, -1.064788818359375, -1.0244293212890625, -0.98406982421875, -0.9437103271484375, -0.903350830078125, -0.8629913330078125, -0.8226318359375, -0.7822723388671875, -0.741912841796875, -0.7015533447265625, -0.66119384765625, -0.6208343505859375, -0.580474853515625, -0.5401153564453125, -0.499755859375, -0.4593963623046875, -0.419036865234375, -0.3786773681640625, -0.33831787109375, -0.2979583740234375, -0.257598876953125, -0.2172393798828125, -0.1768798828125, -0.1365203857421875, -0.096160888671875, -0.0558013916015625, -0.01544189453125, 0.0249176025390625, 0.065277099609375, 0.1056365966796875, 0.14599609375, 0.1863555908203125, 0.226715087890625, 0.2670745849609375, 0.30743408203125, 0.3477935791015625, 0.388153076171875, 0.4285125732421875, 0.4688720703125, 0.5092315673828125, 0.549591064453125, 0.5899505615234375, 0.63031005859375, 0.6706695556640625, 0.711029052734375, 0.7513885498046875, 0.791748046875, 0.8321075439453125, 0.872467041015625, 0.9128265380859375, 0.95318603515625, 0.9935455322265625, 1.033905029296875, 1.0742645263671875, 1.1146240234375, 1.1549835205078125, 1.195343017578125, 1.2357025146484375, 1.27606201171875, 1.3164215087890625, 1.356781005859375, 1.3971405029296875, 1.4375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 6.0, 9.0, 7.0, 15.0, 18.0, 27.0, 42.0, 54.0, 91.0, 132.0, 244.0, 378.0, 561.0, 890.0, 1353.0, 2354.0, 4015.0, 7058.0, 13559.0, 27707.0, 62300.0, 142593.0, 264452.0, 261435.0, 140674.0, 60859.0, 27342.0, 13171.0, 7080.0, 3984.0, 2315.0, 1462.0, 827.0, 512.0, 349.0, 231.0, 150.0, 99.0, 49.0, 41.0, 33.0, 24.0, 20.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.766204833984375, -2.67694091796875, -2.587677001953125, -2.4984130859375, -2.409149169921875, -2.31988525390625, -2.230621337890625, -2.141357421875, -2.052093505859375, -1.96282958984375, -1.873565673828125, -1.7843017578125, -1.695037841796875, -1.60577392578125, -1.516510009765625, -1.42724609375, -1.337982177734375, -1.24871826171875, -1.159454345703125, -1.0701904296875, -0.980926513671875, -0.89166259765625, -0.802398681640625, -0.713134765625, -0.623870849609375, -0.53460693359375, -0.445343017578125, -0.3560791015625, -0.266815185546875, -0.17755126953125, -0.088287353515625, 0.0009765625, 0.090240478515625, 0.17950439453125, 0.268768310546875, 0.3580322265625, 0.447296142578125, 0.53656005859375, 0.625823974609375, 0.715087890625, 0.804351806640625, 0.89361572265625, 0.982879638671875, 1.0721435546875, 1.161407470703125, 1.25067138671875, 1.339935302734375, 1.42919921875, 1.518463134765625, 1.60772705078125, 1.696990966796875, 1.7862548828125, 1.875518798828125, 1.96478271484375, 2.054046630859375, 2.143310546875, 2.232574462890625, 2.32183837890625, 2.411102294921875, 2.5003662109375, 2.589630126953125, 2.67889404296875, 2.768157958984375, 2.857421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 1.0, 11.0, 12.0, 14.0, 19.0, 25.0, 27.0, 17.0, 26.0, 35.0, 50.0, 51.0, 47.0, 58.0, 64.0, 65.0, 59.0, 50.0, 43.0, 48.0, 37.0, 33.0, 40.0, 16.0, 22.0, 21.0, 11.0, 17.0, 11.0, 5.0, 4.0, 9.0, 4.0, 4.0, 12.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014257431030273438, -0.00013802573084831238, -0.00013347715139389038, -0.00012892857193946838, -0.0001243799924850464, -0.00011983141303062439, -0.00011528283357620239, -0.0001107342541217804, -0.0001061856746673584, -0.0001016370952129364, -9.70885157585144e-05, -9.253993630409241e-05, -8.799135684967041e-05, -8.344277739524841e-05, -7.889419794082642e-05, -7.434561848640442e-05, -6.979703903198242e-05, -6.524845957756042e-05, -6.069988012313843e-05, -5.615130066871643e-05, -5.1602721214294434e-05, -4.7054141759872437e-05, -4.250556230545044e-05, -3.795698285102844e-05, -3.3408403396606445e-05, -2.8859823942184448e-05, -2.431124448776245e-05, -1.9762665033340454e-05, -1.5214085578918457e-05, -1.066550612449646e-05, -6.116926670074463e-06, -1.5683472156524658e-06, 2.9802322387695312e-06, 7.528811693191528e-06, 1.2077391147613525e-05, 1.6625970602035522e-05, 2.117455005645752e-05, 2.5723129510879517e-05, 3.0271708965301514e-05, 3.482028841972351e-05, 3.936886787414551e-05, 4.3917447328567505e-05, 4.84660267829895e-05, 5.30146062374115e-05, 5.7563185691833496e-05, 6.211176514625549e-05, 6.666034460067749e-05, 7.120892405509949e-05, 7.575750350952148e-05, 8.030608296394348e-05, 8.485466241836548e-05, 8.940324187278748e-05, 9.395182132720947e-05, 9.850040078163147e-05, 0.00010304898023605347, 0.00010759755969047546, 0.00011214613914489746, 0.00011669471859931946, 0.00012124329805374146, 0.00012579187750816345, 0.00013034045696258545, 0.00013488903641700745, 0.00013943761587142944, 0.00014398619532585144, 0.00014853477478027344]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 16.0, 19.0, 27.0, 38.0, 75.0, 124.0, 186.0, 275.0, 481.0, 726.0, 1162.0, 1838.0, 3203.0, 5907.0, 11868.0, 25592.0, 61875.0, 151549.0, 284343.0, 266415.0, 133290.0, 53471.0, 22510.0, 10459.0, 5378.0, 3100.0, 1772.0, 1105.0, 631.0, 395.0, 250.0, 179.0, 100.0, 65.0, 41.0, 24.0, 22.0, 18.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.83880615234375, -2.7498779296875, -2.66094970703125, -2.572021484375, -2.48309326171875, -2.3941650390625, -2.30523681640625, -2.21630859375, -2.12738037109375, -2.0384521484375, -1.94952392578125, -1.860595703125, -1.77166748046875, -1.6827392578125, -1.59381103515625, -1.5048828125, -1.41595458984375, -1.3270263671875, -1.23809814453125, -1.149169921875, -1.06024169921875, -0.9713134765625, -0.88238525390625, -0.79345703125, -0.70452880859375, -0.6156005859375, -0.52667236328125, -0.437744140625, -0.34881591796875, -0.2598876953125, -0.17095947265625, -0.08203125, 0.00689697265625, 0.0958251953125, 0.18475341796875, 0.273681640625, 0.36260986328125, 0.4515380859375, 0.54046630859375, 0.62939453125, 0.71832275390625, 0.8072509765625, 0.89617919921875, 0.985107421875, 1.07403564453125, 1.1629638671875, 1.25189208984375, 1.3408203125, 1.42974853515625, 1.5186767578125, 1.60760498046875, 1.696533203125, 1.78546142578125, 1.8743896484375, 1.96331787109375, 2.05224609375, 2.14117431640625, 2.2301025390625, 2.31903076171875, 2.407958984375, 2.49688720703125, 2.5858154296875, 2.67474365234375, 2.763671875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 5.0, 14.0, 15.0, 19.0, 22.0, 31.0, 36.0, 44.0, 55.0, 85.0, 65.0, 89.0, 70.0, 73.0, 63.0, 56.0, 43.0, 39.0, 29.0, 25.0, 31.0, 14.0, 12.0, 12.0, 7.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7098464965820312, -0.6843414306640625, -0.6588363647460938, -0.633331298828125, -0.6078262329101562, -0.5823211669921875, -0.5568161010742188, -0.53131103515625, -0.5058059692382812, -0.4803009033203125, -0.45479583740234375, -0.429290771484375, -0.40378570556640625, -0.3782806396484375, -0.35277557373046875, -0.3272705078125, -0.30176544189453125, -0.2762603759765625, -0.25075531005859375, -0.225250244140625, -0.19974517822265625, -0.1742401123046875, -0.14873504638671875, -0.12322998046875, -0.09772491455078125, -0.0722198486328125, -0.04671478271484375, -0.021209716796875, 0.00429534912109375, 0.0298004150390625, 0.05530548095703125, 0.080810546875, 0.10631561279296875, 0.1318206787109375, 0.15732574462890625, 0.182830810546875, 0.20833587646484375, 0.2338409423828125, 0.25934600830078125, 0.28485107421875, 0.31035614013671875, 0.3358612060546875, 0.36136627197265625, 0.386871337890625, 0.41237640380859375, 0.4378814697265625, 0.46338653564453125, 0.4888916015625, 0.5143966674804688, 0.5399017333984375, 0.5654067993164062, 0.590911865234375, 0.6164169311523438, 0.6419219970703125, 0.6674270629882812, 0.69293212890625, 0.7184371948242188, 0.7439422607421875, 0.7694473266601562, 0.794952392578125, 0.8204574584960938, 0.8459625244140625, 0.8714675903320312, 0.89697265625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 22.0, 18.0, 16.0, 25.0, 39.0, 45.0, 47.0, 59.0, 62.0, 77.0, 66.0, 69.0, 51.0, 45.0, 46.0, 53.0, 54.0, 35.0, 26.0, 22.0, 29.0, 19.0, 10.0, 15.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564897298812866, -2.4802913665771484, -2.3956854343414307, -2.311079502105713, -2.226473331451416, -2.1418673992156982, -2.0572614669799805, -1.9726555347442627, -1.8880494832992554, -1.8034435510635376, -1.7188374996185303, -1.6342315673828125, -1.5496256351470947, -1.4650195837020874, -1.3804136514663696, -1.2958076000213623, -1.2112016677856445, -1.1265957355499268, -1.0419896841049194, -0.9573837518692017, -0.8727777600288391, -0.7881717681884766, -0.7035658359527588, -0.6189598441123962, -0.5343538522720337, -0.44974786043167114, -0.365141898393631, -0.2805359363555908, -0.19592994451522827, -0.11132395267486572, -0.02671802043914795, 0.0578879714012146, 0.14249420166015625, 0.2271001785993576, 0.31170615553855896, 0.3963121175765991, 0.48091810941696167, 0.5655241012573242, 0.650130033493042, 0.7347360253334045, 0.8193420171737671, 0.9039480090141296, 0.9885540008544922, 1.07315993309021, 1.1577658653259277, 1.242371916770935, 1.3269778490066528, 1.4115839004516602, 1.496189832687378, 1.5807957649230957, 1.665401816368103, 1.7500077486038208, 1.8346138000488281, 1.919219732284546, 2.0038256645202637, 2.0884315967559814, 2.173037528991699, 2.257643461227417, 2.3422493934631348, 2.4268555641174316, 2.5114614963531494, 2.596067428588867, 2.680673360824585, 2.7652792930603027, 2.8498854637145996]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 1.0, 7.0, 6.0, 10.0, 10.0, 10.0, 6.0, 13.0, 19.0, 15.0, 18.0, 22.0, 20.0, 23.0, 26.0, 32.0, 37.0, 30.0, 22.0, 34.0, 31.0, 38.0, 39.0, 34.0, 33.0, 35.0, 27.0, 35.0, 37.0, 38.0, 25.0, 19.0, 20.0, 26.0, 24.0, 14.0, 20.0, 24.0, 10.0, 15.0, 10.0, 17.0, 11.0, 10.0, 5.0, 8.0, 10.0, 9.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.6389598846435547, -1.5876710414886475, -1.5363821983337402, -1.485093355178833, -1.4338045120239258, -1.3825156688690186, -1.3312268257141113, -1.279937982559204, -1.2286491394042969, -1.1773602962493896, -1.1260714530944824, -1.0747826099395752, -1.023493766784668, -0.9722049236297607, -0.9209160804748535, -0.8696272373199463, -0.8183384537696838, -0.7670496106147766, -0.7157607674598694, -0.6644719243049622, -0.6131830811500549, -0.5618942975997925, -0.5106054544448853, -0.45931658148765564, -0.4080277383327484, -0.3567388951778412, -0.30545005202293396, -0.2541612386703491, -0.2028723806142807, -0.15158355236053467, -0.10029470920562744, -0.049005866050720215, 0.0022829771041870117, 0.05357181653380394, 0.10486065596342087, 0.1561494916677475, 0.20743833482265472, 0.25872716307640076, 0.310016006231308, 0.3613048493862152, 0.41259369254112244, 0.46388253569602966, 0.5151713490486145, 0.5664601922035217, 0.617749035358429, 0.6690378785133362, 0.7203267216682434, 0.7716155648231506, 0.8229044079780579, 0.8741932511329651, 0.9254820942878723, 0.9767709374427795, 1.028059720993042, 1.0793485641479492, 1.1306374073028564, 1.1819262504577637, 1.233215093612671, 1.2845039367675781, 1.3357927799224854, 1.3870816230773926, 1.4383704662322998, 1.489659309387207, 1.5409481525421143, 1.5922369956970215, 1.6435258388519287]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 11.0, 12.0, 11.0, 28.0, 59.0, 95.0, 174.0, 299.0, 496.0, 850.0, 1501.0, 2740.0, 4621.0, 8159.0, 14452.0, 25672.0, 45516.0, 82119.0, 141962.0, 240000.0, 379876.0, 542413.0, 655204.0, 643477.0, 518130.0, 357821.0, 222909.0, 131684.0, 75607.0, 42503.0, 23913.0, 13638.0, 7811.0, 4365.0, 2568.0, 1522.0, 867.0, 481.0, 291.0, 188.0, 86.0, 65.0, 44.0, 24.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7557373046875, -1.698974609375, -1.6422119140625, -1.58544921875, -1.5286865234375, -1.471923828125, -1.4151611328125, -1.3583984375, -1.3016357421875, -1.244873046875, -1.1881103515625, -1.13134765625, -1.0745849609375, -1.017822265625, -0.9610595703125, -0.904296875, -0.8475341796875, -0.790771484375, -0.7340087890625, -0.67724609375, -0.6204833984375, -0.563720703125, -0.5069580078125, -0.4501953125, -0.3934326171875, -0.336669921875, -0.2799072265625, -0.22314453125, -0.1663818359375, -0.109619140625, -0.0528564453125, 0.00390625, 0.0606689453125, 0.117431640625, 0.1741943359375, 0.23095703125, 0.2877197265625, 0.344482421875, 0.4012451171875, 0.4580078125, 0.5147705078125, 0.571533203125, 0.6282958984375, 0.68505859375, 0.7418212890625, 0.798583984375, 0.8553466796875, 0.912109375, 0.9688720703125, 1.025634765625, 1.0823974609375, 1.13916015625, 1.1959228515625, 1.252685546875, 1.3094482421875, 1.3662109375, 1.4229736328125, 1.479736328125, 1.5364990234375, 1.59326171875, 1.6500244140625, 1.706787109375, 1.7635498046875, 1.8203125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 3.0, 4.0, 6.0, 3.0, 9.0, 11.0, 14.0, 12.0, 24.0, 19.0, 21.0, 25.0, 24.0, 28.0, 25.0, 29.0, 32.0, 44.0, 45.0, 28.0, 36.0, 37.0, 24.0, 35.0, 37.0, 32.0, 39.0, 40.0, 31.0, 38.0, 17.0, 14.0, 21.0, 32.0, 23.0, 19.0, 15.0, 21.0, 10.0, 15.0, 11.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.092803955078125, -1.05474853515625, -1.016693115234375, -0.9786376953125, -0.940582275390625, -0.90252685546875, -0.864471435546875, -0.826416015625, -0.788360595703125, -0.75030517578125, -0.712249755859375, -0.6741943359375, -0.636138916015625, -0.59808349609375, -0.560028076171875, -0.52197265625, -0.483917236328125, -0.44586181640625, -0.407806396484375, -0.3697509765625, -0.331695556640625, -0.29364013671875, -0.255584716796875, -0.217529296875, -0.179473876953125, -0.14141845703125, -0.103363037109375, -0.0653076171875, -0.027252197265625, 0.01080322265625, 0.048858642578125, 0.0869140625, 0.124969482421875, 0.16302490234375, 0.201080322265625, 0.2391357421875, 0.277191162109375, 0.31524658203125, 0.353302001953125, 0.391357421875, 0.429412841796875, 0.46746826171875, 0.505523681640625, 0.5435791015625, 0.581634521484375, 0.61968994140625, 0.657745361328125, 0.69580078125, 0.733856201171875, 0.77191162109375, 0.809967041015625, 0.8480224609375, 0.886077880859375, 0.92413330078125, 0.962188720703125, 1.000244140625, 1.038299560546875, 1.07635498046875, 1.114410400390625, 1.1524658203125, 1.190521240234375, 1.22857666015625, 1.266632080078125, 1.3046875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 18.0, 20.0, 35.0, 40.0, 83.0, 141.0, 224.0, 346.0, 567.0, 926.0, 1627.0, 2772.0, 4575.0, 7682.0, 13066.0, 21424.0, 35434.0, 57835.0, 90700.0, 141182.0, 207486.0, 296111.0, 388439.0, 470461.0, 511125.0, 492721.0, 423943.0, 332004.0, 241209.0, 164834.0, 108412.0, 69008.0, 43399.0, 26501.0, 16049.0, 9531.0, 5809.0, 3382.0, 2065.0, 1233.0, 721.0, 473.0, 262.0, 159.0, 97.0, 57.0, 37.0, 31.0, 9.0, 9.0, 2.0, 6.0, 2.0, 0.0, 4.0], "bins": [-1.5302734375, -1.48486328125, -1.439453125, -1.39404296875, -1.3486328125, -1.30322265625, -1.2578125, -1.21240234375, -1.1669921875, -1.12158203125, -1.076171875, -1.03076171875, -0.9853515625, -0.93994140625, -0.89453125, -0.84912109375, -0.8037109375, -0.75830078125, -0.712890625, -0.66748046875, -0.6220703125, -0.57666015625, -0.53125, -0.48583984375, -0.4404296875, -0.39501953125, -0.349609375, -0.30419921875, -0.2587890625, -0.21337890625, -0.16796875, -0.12255859375, -0.0771484375, -0.03173828125, 0.013671875, 0.05908203125, 0.1044921875, 0.14990234375, 0.1953125, 0.24072265625, 0.2861328125, 0.33154296875, 0.376953125, 0.42236328125, 0.4677734375, 0.51318359375, 0.55859375, 0.60400390625, 0.6494140625, 0.69482421875, 0.740234375, 0.78564453125, 0.8310546875, 0.87646484375, 0.921875, 0.96728515625, 1.0126953125, 1.05810546875, 1.103515625, 1.14892578125, 1.1943359375, 1.23974609375, 1.28515625, 1.33056640625, 1.3759765625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 2.0, 10.0, 7.0, 7.0, 7.0, 14.0, 18.0, 15.0, 39.0, 41.0, 48.0, 42.0, 50.0, 51.0, 67.0, 84.0, 123.0, 133.0, 134.0, 176.0, 139.0, 160.0, 165.0, 195.0, 203.0, 204.0, 192.0, 195.0, 172.0, 183.0, 155.0, 145.0, 140.0, 136.0, 122.0, 70.0, 75.0, 77.0, 64.0, 46.0, 31.0, 32.0, 27.0, 16.0, 12.0, 12.0, 13.0, 14.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.55126953125, -0.5328826904296875, -0.514495849609375, -0.4961090087890625, -0.47772216796875, -0.4593353271484375, -0.440948486328125, -0.4225616455078125, -0.4041748046875, -0.3857879638671875, -0.367401123046875, -0.3490142822265625, -0.33062744140625, -0.3122406005859375, -0.293853759765625, -0.2754669189453125, -0.257080078125, -0.2386932373046875, -0.220306396484375, -0.2019195556640625, -0.18353271484375, -0.1651458740234375, -0.146759033203125, -0.1283721923828125, -0.1099853515625, -0.0915985107421875, -0.073211669921875, -0.0548248291015625, -0.03643798828125, -0.0180511474609375, 0.000335693359375, 0.0187225341796875, 0.037109375, 0.0554962158203125, 0.073883056640625, 0.0922698974609375, 0.11065673828125, 0.1290435791015625, 0.147430419921875, 0.1658172607421875, 0.1842041015625, 0.2025909423828125, 0.220977783203125, 0.2393646240234375, 0.25775146484375, 0.2761383056640625, 0.294525146484375, 0.3129119873046875, 0.331298828125, 0.3496856689453125, 0.368072509765625, 0.3864593505859375, 0.40484619140625, 0.4232330322265625, 0.441619873046875, 0.4600067138671875, 0.4783935546875, 0.4967803955078125, 0.515167236328125, 0.5335540771484375, 0.55194091796875, 0.5703277587890625, 0.588714599609375, 0.6071014404296875, 0.62548828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 13.0, 11.0, 24.0, 19.0, 20.0, 25.0, 26.0, 34.0, 47.0, 49.0, 48.0, 57.0, 55.0, 50.0, 56.0, 61.0, 58.0, 40.0, 39.0, 50.0, 35.0, 35.0, 24.0, 21.0, 16.0, 15.0, 13.0, 9.0, 5.0, 15.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2901968955993652, -2.22659969329834, -2.1630024909973145, -2.099405288696289, -2.0358080863952637, -1.9722108840942383, -1.9086135625839233, -1.845016360282898, -1.7814191579818726, -1.7178219556808472, -1.6542247533798218, -1.5906275510787964, -1.5270302295684814, -1.463433027267456, -1.3998358249664307, -1.3362386226654053, -1.2726414203643799, -1.2090442180633545, -1.145447015762329, -1.0818498134613037, -1.0182526111602783, -0.9546553492546082, -0.891058087348938, -0.8274608850479126, -0.7638636827468872, -0.7002664804458618, -0.6366692781448364, -0.5730720162391663, -0.5094748139381409, -0.4458776116371155, -0.3822803795337677, -0.3186831474304199, -0.25508618354797363, -0.19148896634578705, -0.12789174914360046, -0.06429453194141388, -0.0006973147392272949, 0.0628998875617981, 0.12649711966514587, 0.19009435176849365, 0.25369155406951904, 0.31728875637054443, 0.3808859884738922, 0.44448322057724, 0.5080804228782654, 0.5716776251792908, 0.6352748870849609, 0.6988720893859863, 0.7624692916870117, 0.8260664939880371, 0.8896636962890625, 0.9532609581947327, 1.0168581008911133, 1.0804553031921387, 1.1440526247024536, 1.207649827003479, 1.2712470293045044, 1.3348442316055298, 1.3984414339065552, 1.4620386362075806, 1.5256359577178955, 1.589233160018921, 1.6528303623199463, 1.7164275646209717, 1.780024766921997]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 8.0, 3.0, 7.0, 7.0, 8.0, 17.0, 18.0, 26.0, 24.0, 28.0, 19.0, 25.0, 34.0, 25.0, 25.0, 36.0, 37.0, 44.0, 40.0, 27.0, 42.0, 38.0, 41.0, 35.0, 38.0, 41.0, 32.0, 31.0, 25.0, 19.0, 19.0, 18.0, 25.0, 17.0, 13.0, 23.0, 14.0, 16.0, 6.0, 9.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4026124477386475, -1.3561328649520874, -1.3096531629562378, -1.2631735801696777, -1.2166939973831177, -1.1702144145965576, -1.123734712600708, -1.077255129814148, -1.030775547027588, -0.9842959046363831, -0.937816321849823, -0.8913366794586182, -0.8448570966720581, -0.7983774542808533, -0.7518978118896484, -0.7054182291030884, -0.6589385867118835, -0.6124589443206787, -0.5659793615341187, -0.5194997191429138, -0.47302013635635376, -0.4265404939651489, -0.3800608813762665, -0.33358126878738403, -0.2871016561985016, -0.24062204360961914, -0.1941424310207367, -0.14766280353069305, -0.10118319094181061, -0.05470357835292816, -0.008223950862884521, 0.038255661725997925, 0.08473527431488037, 0.13121488690376282, 0.17769449949264526, 0.2241741269826889, 0.27065372467041016, 0.317133367061615, 0.36361297965049744, 0.4100925922393799, 0.45657220482826233, 0.5030518174171448, 0.5495314598083496, 0.5960110425949097, 0.6424906849861145, 0.6889702677726746, 0.7354499101638794, 0.7819294929504395, 0.8284091353416443, 0.8748887777328491, 0.9213683605194092, 0.967848002910614, 1.0143276453018188, 1.060807228088379, 1.107286810874939, 1.153766393661499, 1.2002460956573486, 1.2467256784439087, 1.2932053804397583, 1.3396849632263184, 1.3861645460128784, 1.4326441287994385, 1.479123830795288, 1.5256034135818481, 1.5720829963684082]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 10.0, 9.0, 11.0, 13.0, 28.0, 29.0, 61.0, 82.0, 121.0, 179.0, 248.0, 435.0, 640.0, 1021.0, 1576.0, 2510.0, 3968.0, 6737.0, 11412.0, 19522.0, 34020.0, 60081.0, 101959.0, 159776.0, 199411.0, 171531.0, 112984.0, 67200.0, 38475.0, 22061.0, 12841.0, 7491.0, 4485.0, 2777.0, 1767.0, 1038.0, 672.0, 470.0, 295.0, 191.0, 129.0, 93.0, 69.0, 46.0, 26.0, 18.0, 15.0, 4.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.78271484375, -0.7579498291015625, -0.733184814453125, -0.7084197998046875, -0.68365478515625, -0.6588897705078125, -0.634124755859375, -0.6093597412109375, -0.5845947265625, -0.5598297119140625, -0.535064697265625, -0.5102996826171875, -0.48553466796875, -0.4607696533203125, -0.436004638671875, -0.4112396240234375, -0.386474609375, -0.3617095947265625, -0.336944580078125, -0.3121795654296875, -0.28741455078125, -0.2626495361328125, -0.237884521484375, -0.2131195068359375, -0.1883544921875, -0.1635894775390625, -0.138824462890625, -0.1140594482421875, -0.08929443359375, -0.0645294189453125, -0.039764404296875, -0.0149993896484375, 0.009765625, 0.0345306396484375, 0.059295654296875, 0.0840606689453125, 0.10882568359375, 0.1335906982421875, 0.158355712890625, 0.1831207275390625, 0.2078857421875, 0.2326507568359375, 0.257415771484375, 0.2821807861328125, 0.30694580078125, 0.3317108154296875, 0.356475830078125, 0.3812408447265625, 0.406005859375, 0.4307708740234375, 0.455535888671875, 0.4803009033203125, 0.50506591796875, 0.5298309326171875, 0.554595947265625, 0.5793609619140625, 0.6041259765625, 0.6288909912109375, 0.653656005859375, 0.6784210205078125, 0.70318603515625, 0.7279510498046875, 0.752716064453125, 0.7774810791015625, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 10.0, 6.0, 11.0, 10.0, 19.0, 20.0, 28.0, 24.0, 26.0, 37.0, 29.0, 26.0, 35.0, 36.0, 40.0, 35.0, 35.0, 41.0, 34.0, 40.0, 39.0, 37.0, 38.0, 36.0, 31.0, 40.0, 25.0, 28.0, 28.0, 10.0, 17.0, 20.0, 17.0, 14.0, 14.0, 8.0, 6.0, 6.0, 9.0, 10.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.46624755859375, -1.4149169921875, -1.36358642578125, -1.312255859375, -1.26092529296875, -1.2095947265625, -1.15826416015625, -1.10693359375, -1.05560302734375, -1.0042724609375, -0.95294189453125, -0.901611328125, -0.85028076171875, -0.7989501953125, -0.74761962890625, -0.6962890625, -0.64495849609375, -0.5936279296875, -0.54229736328125, -0.490966796875, -0.43963623046875, -0.3883056640625, -0.33697509765625, -0.28564453125, -0.23431396484375, -0.1829833984375, -0.13165283203125, -0.080322265625, -0.02899169921875, 0.0223388671875, 0.07366943359375, 0.125, 0.17633056640625, 0.2276611328125, 0.27899169921875, 0.330322265625, 0.38165283203125, 0.4329833984375, 0.48431396484375, 0.53564453125, 0.58697509765625, 0.6383056640625, 0.68963623046875, 0.740966796875, 0.79229736328125, 0.8436279296875, 0.89495849609375, 0.9462890625, 0.99761962890625, 1.0489501953125, 1.10028076171875, 1.151611328125, 1.20294189453125, 1.2542724609375, 1.30560302734375, 1.35693359375, 1.40826416015625, 1.4595947265625, 1.51092529296875, 1.562255859375, 1.61358642578125, 1.6649169921875, 1.71624755859375, 1.767578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 6.0, 7.0, 11.0, 39.0, 44.0, 68.0, 113.0, 178.0, 248.0, 425.0, 684.0, 1098.0, 1796.0, 3009.0, 5298.0, 9575.0, 17182.0, 32353.0, 61138.0, 115634.0, 201279.0, 240623.0, 164357.0, 89781.0, 46939.0, 25070.0, 13530.0, 7438.0, 4281.0, 2435.0, 1492.0, 917.0, 536.0, 357.0, 204.0, 153.0, 88.0, 70.0, 41.0, 27.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9951171875, -0.9669265747070312, -0.9387359619140625, -0.9105453491210938, -0.882354736328125, -0.8541641235351562, -0.8259735107421875, -0.7977828979492188, -0.76959228515625, -0.7414016723632812, -0.7132110595703125, -0.6850204467773438, -0.656829833984375, -0.6286392211914062, -0.6004486083984375, -0.5722579956054688, -0.5440673828125, -0.5158767700195312, -0.4876861572265625, -0.45949554443359375, -0.431304931640625, -0.40311431884765625, -0.3749237060546875, -0.34673309326171875, -0.31854248046875, -0.29035186767578125, -0.2621612548828125, -0.23397064208984375, -0.205780029296875, -0.17758941650390625, -0.1493988037109375, -0.12120819091796875, -0.093017578125, -0.06482696533203125, -0.0366363525390625, -0.00844573974609375, 0.019744873046875, 0.04793548583984375, 0.0761260986328125, 0.10431671142578125, 0.13250732421875, 0.16069793701171875, 0.1888885498046875, 0.21707916259765625, 0.245269775390625, 0.27346038818359375, 0.3016510009765625, 0.32984161376953125, 0.3580322265625, 0.38622283935546875, 0.4144134521484375, 0.44260406494140625, 0.470794677734375, 0.49898529052734375, 0.5271759033203125, 0.5553665161132812, 0.58355712890625, 0.6117477416992188, 0.6399383544921875, 0.6681289672851562, 0.696319580078125, 0.7245101928710938, 0.7527008056640625, 0.7808914184570312, 0.80908203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 5.0, 15.0, 11.0, 13.0, 15.0, 14.0, 19.0, 22.0, 37.0, 21.0, 20.0, 32.0, 26.0, 33.0, 34.0, 46.0, 49.0, 53.0, 36.0, 43.0, 47.0, 43.0, 33.0, 41.0, 36.0, 26.0, 29.0, 32.0, 25.0, 22.0, 15.0, 23.0, 14.0, 13.0, 6.0, 6.0, 7.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.222137451171875, -1.18548583984375, -1.148834228515625, -1.1121826171875, -1.075531005859375, -1.03887939453125, -1.002227783203125, -0.965576171875, -0.928924560546875, -0.89227294921875, -0.855621337890625, -0.8189697265625, -0.782318115234375, -0.74566650390625, -0.709014892578125, -0.67236328125, -0.635711669921875, -0.59906005859375, -0.562408447265625, -0.5257568359375, -0.489105224609375, -0.45245361328125, -0.415802001953125, -0.379150390625, -0.342498779296875, -0.30584716796875, -0.269195556640625, -0.2325439453125, -0.195892333984375, -0.15924072265625, -0.122589111328125, -0.0859375, -0.049285888671875, -0.01263427734375, 0.024017333984375, 0.0606689453125, 0.097320556640625, 0.13397216796875, 0.170623779296875, 0.207275390625, 0.243927001953125, 0.28057861328125, 0.317230224609375, 0.3538818359375, 0.390533447265625, 0.42718505859375, 0.463836669921875, 0.50048828125, 0.537139892578125, 0.57379150390625, 0.610443115234375, 0.6470947265625, 0.683746337890625, 0.72039794921875, 0.757049560546875, 0.793701171875, 0.830352783203125, 0.86700439453125, 0.903656005859375, 0.9403076171875, 0.976959228515625, 1.01361083984375, 1.050262451171875, 1.0869140625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 55.0, 77.0, 57.0, 112.0, 134.0, 196.0, 289.0, 410.0, 652.0, 1003.0, 1492.0, 2554.0, 4423.0, 8168.0, 17700.0, 46551.0, 162096.0, 466474.0, 228420.0, 62504.0, 22321.0, 9739.0, 5028.0, 2895.0, 1729.0, 1072.0, 717.0, 507.0, 328.0, 220.0, 161.0, 104.0, 81.0, 50.0, 57.0, 26.0, 21.0, 14.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4549674987792969, -0.43849945068359375, -0.4220314025878906, -0.4055633544921875, -0.3890953063964844, -0.37262725830078125, -0.3561592102050781, -0.339691162109375, -0.3232231140136719, -0.30675506591796875, -0.2902870178222656, -0.2738189697265625, -0.2573509216308594, -0.24088287353515625, -0.22441482543945312, -0.20794677734375, -0.19147872924804688, -0.17501068115234375, -0.15854263305664062, -0.1420745849609375, -0.12560653686523438, -0.10913848876953125, -0.09267044067382812, -0.076202392578125, -0.059734344482421875, -0.04326629638671875, -0.026798248291015625, -0.0103302001953125, 0.006137847900390625, 0.02260589599609375, 0.039073944091796875, 0.0555419921875, 0.07201004028320312, 0.08847808837890625, 0.10494613647460938, 0.1214141845703125, 0.13788223266601562, 0.15435028076171875, 0.17081832885742188, 0.187286376953125, 0.20375442504882812, 0.22022247314453125, 0.23669052124023438, 0.2531585693359375, 0.2696266174316406, 0.28609466552734375, 0.3025627136230469, 0.31903076171875, 0.3354988098144531, 0.35196685791015625, 0.3684349060058594, 0.3849029541015625, 0.4013710021972656, 0.41783905029296875, 0.4343070983886719, 0.450775146484375, 0.4672431945800781, 0.48371124267578125, 0.5001792907714844, 0.5166473388671875, 0.5331153869628906, 0.5495834350585938, 0.5660514831542969, 0.58251953125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 9.0, 5.0, 4.0, 15.0, 14.0, 21.0, 18.0, 19.0, 26.0, 36.0, 25.0, 35.0, 36.0, 49.0, 42.0, 56.0, 46.0, 60.0, 43.0, 51.0, 63.0, 40.0, 41.0, 31.0, 40.0, 30.0, 23.0, 20.0, 21.0, 16.0, 10.0, 8.0, 9.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.1083280444145203e-05, -2.0410865545272827e-05, -1.973845064640045e-05, -1.9066035747528076e-05, -1.83936208486557e-05, -1.7721205949783325e-05, -1.704879105091095e-05, -1.6376376152038574e-05, -1.57039612531662e-05, -1.5031546354293823e-05, -1.4359131455421448e-05, -1.3686716556549072e-05, -1.3014301657676697e-05, -1.2341886758804321e-05, -1.1669471859931946e-05, -1.099705696105957e-05, -1.0324642062187195e-05, -9.65222716331482e-06, -8.979812264442444e-06, -8.307397365570068e-06, -7.634982466697693e-06, -6.962567567825317e-06, -6.290152668952942e-06, -5.617737770080566e-06, -4.945322871208191e-06, -4.2729079723358154e-06, -3.60049307346344e-06, -2.9280781745910645e-06, -2.255663275718689e-06, -1.5832483768463135e-06, -9.10833477973938e-07, -2.384185791015625e-07, 4.33996319770813e-07, 1.1064112186431885e-06, 1.778826117515564e-06, 2.4512410163879395e-06, 3.123655915260315e-06, 3.7960708141326904e-06, 4.468485713005066e-06, 5.140900611877441e-06, 5.813315510749817e-06, 6.485730409622192e-06, 7.158145308494568e-06, 7.830560207366943e-06, 8.502975106239319e-06, 9.175390005111694e-06, 9.84780490398407e-06, 1.0520219802856445e-05, 1.119263470172882e-05, 1.1865049600601196e-05, 1.2537464499473572e-05, 1.3209879398345947e-05, 1.3882294297218323e-05, 1.4554709196090698e-05, 1.5227124094963074e-05, 1.589953899383545e-05, 1.6571953892707825e-05, 1.72443687915802e-05, 1.7916783690452576e-05, 1.858919858932495e-05, 1.9261613488197327e-05, 1.9934028387069702e-05, 2.0606443285942078e-05, 2.1278858184814453e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 11.0, 15.0, 10.0, 24.0, 39.0, 77.0, 104.0, 185.0, 273.0, 466.0, 835.0, 1397.0, 2392.0, 4420.0, 8511.0, 17373.0, 36830.0, 82607.0, 186052.0, 306803.0, 216254.0, 98906.0, 43293.0, 20199.0, 9900.0, 5053.0, 2725.0, 1492.0, 913.0, 550.0, 305.0, 206.0, 118.0, 59.0, 57.0, 36.0, 26.0, 13.0, 9.0, 3.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4791755676269531, -0.46298980712890625, -0.4468040466308594, -0.4306182861328125, -0.4144325256347656, -0.39824676513671875, -0.3820610046386719, -0.365875244140625, -0.3496894836425781, -0.33350372314453125, -0.3173179626464844, -0.3011322021484375, -0.2849464416503906, -0.26876068115234375, -0.2525749206542969, -0.23638916015625, -0.22020339965820312, -0.20401763916015625, -0.18783187866210938, -0.1716461181640625, -0.15546035766601562, -0.13927459716796875, -0.12308883666992188, -0.106903076171875, -0.09071731567382812, -0.07453155517578125, -0.058345794677734375, -0.0421600341796875, -0.025974273681640625, -0.00978851318359375, 0.006397247314453125, 0.0225830078125, 0.038768768310546875, 0.05495452880859375, 0.07114028930664062, 0.0873260498046875, 0.10351181030273438, 0.11969757080078125, 0.13588333129882812, 0.152069091796875, 0.16825485229492188, 0.18444061279296875, 0.20062637329101562, 0.2168121337890625, 0.23299789428710938, 0.24918365478515625, 0.2653694152832031, 0.28155517578125, 0.2977409362792969, 0.31392669677734375, 0.3301124572753906, 0.3462982177734375, 0.3624839782714844, 0.37866973876953125, 0.3948554992675781, 0.411041259765625, 0.4272270202636719, 0.44341278076171875, 0.4595985412597656, 0.4757843017578125, 0.4919700622558594, 0.5081558227539062, 0.5243415832519531, 0.54052734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 14.0, 8.0, 7.0, 16.0, 9.0, 20.0, 18.0, 16.0, 24.0, 20.0, 24.0, 35.0, 42.0, 40.0, 65.0, 59.0, 51.0, 59.0, 55.0, 56.0, 54.0, 42.0, 38.0, 25.0, 29.0, 28.0, 19.0, 19.0, 18.0, 13.0, 10.0, 4.0, 9.0, 6.0, 12.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.097412109375, -0.09454917907714844, -0.09168624877929688, -0.08882331848144531, -0.08596038818359375, -0.08309745788574219, -0.08023452758789062, -0.07737159729003906, -0.0745086669921875, -0.07164573669433594, -0.06878280639648438, -0.06591987609863281, -0.06305694580078125, -0.06019401550292969, -0.057331085205078125, -0.05446815490722656, -0.051605224609375, -0.04874229431152344, -0.045879364013671875, -0.04301643371582031, -0.04015350341796875, -0.03729057312011719, -0.034427642822265625, -0.03156471252441406, -0.0287017822265625, -0.025838851928710938, -0.022975921630859375, -0.020112991333007812, -0.01725006103515625, -0.014387130737304688, -0.011524200439453125, -0.008661270141601562, -0.00579833984375, -0.0029354095458984375, -7.2479248046875e-05, 0.0027904510498046875, 0.00565338134765625, 0.008516311645507812, 0.011379241943359375, 0.014242172241210938, 0.0171051025390625, 0.019968032836914062, 0.022830963134765625, 0.025693893432617188, 0.02855682373046875, 0.03141975402832031, 0.034282684326171875, 0.03714561462402344, 0.040008544921875, 0.04287147521972656, 0.045734405517578125, 0.04859733581542969, 0.05146026611328125, 0.05432319641113281, 0.057186126708984375, 0.06004905700683594, 0.0629119873046875, 0.06577491760253906, 0.06863784790039062, 0.07150077819824219, 0.07436370849609375, 0.07722663879394531, 0.08008956909179688, 0.08295249938964844, 0.0858154296875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 8.0, 9.0, 15.0, 21.0, 19.0, 28.0, 26.0, 36.0, 36.0, 31.0, 53.0, 37.0, 65.0, 50.0, 61.0, 55.0, 50.0, 43.0, 54.0, 44.0, 37.0, 43.0, 31.0, 19.0, 21.0, 19.0, 18.0, 11.0, 10.0, 9.0, 6.0, 3.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1656153202056885, -2.103355646133423, -2.041095733642578, -1.978835940361023, -1.9165761470794678, -1.8543163537979126, -1.7920565605163574, -1.7297967672348022, -1.667536973953247, -1.605277180671692, -1.5430173873901367, -1.4807575941085815, -1.4184978008270264, -1.3562380075454712, -1.293978214263916, -1.2317184209823608, -1.1694586277008057, -1.1071988344192505, -1.0449390411376953, -0.9826792478561401, -0.920419454574585, -0.8581596612930298, -0.7958998680114746, -0.7336400747299194, -0.6713804006576538, -0.6091206073760986, -0.5468608140945435, -0.4846010208129883, -0.4223412275314331, -0.3600814640522003, -0.29782167077064514, -0.23556187748908997, -0.1733020544052124, -0.11104226112365723, -0.04878247529268265, 0.013477310538291931, 0.0757371038198471, 0.1379968822002411, 0.20025667548179626, 0.26251646876335144, 0.3247762620449066, 0.3870360553264618, 0.44929584860801697, 0.5115556120872498, 0.5738154053688049, 0.6360751986503601, 0.6983349919319153, 0.7605947852134705, 0.8228545784950256, 0.8851143717765808, 0.947374165058136, 1.0096338987350464, 1.0718936920166016, 1.1341534852981567, 1.196413278579712, 1.258673071861267, 1.3209328651428223, 1.3831926584243774, 1.4454524517059326, 1.5077122449874878, 1.569972038269043, 1.6322318315505981, 1.6944916248321533, 1.7567514181137085, 1.8190112113952637]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 6.0, 5.0, 5.0, 11.0, 12.0, 9.0, 25.0, 27.0, 24.0, 21.0, 21.0, 30.0, 29.0, 28.0, 24.0, 29.0, 42.0, 43.0, 35.0, 32.0, 39.0, 48.0, 37.0, 34.0, 35.0, 42.0, 29.0, 27.0, 23.0, 20.0, 24.0, 22.0, 21.0, 16.0, 15.0, 15.0, 19.0, 13.0, 9.0, 8.0, 11.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3607033491134644, -1.3150500059127808, -1.2693967819213867, -1.2237434387207031, -1.1780900955200195, -1.132436752319336, -1.0867834091186523, -1.0411301851272583, -0.9954768419265747, -0.9498234987258911, -0.9041702151298523, -0.8585169315338135, -0.8128635883331299, -0.7672102451324463, -0.7215569615364075, -0.6759036779403687, -0.6302503347396851, -0.5845969915390015, -0.5389437079429626, -0.49329039454460144, -0.44763708114624023, -0.40198376774787903, -0.3563304543495178, -0.3106771409511566, -0.2650238275527954, -0.2193705141544342, -0.173717200756073, -0.1280638873577118, -0.08241057395935059, -0.03675726056098938, 0.008896052837371826, 0.05454936623573303, 0.10020256042480469, 0.1458558738231659, 0.1915091872215271, 0.2371625006198883, 0.2828158140182495, 0.3284691274166107, 0.3741224408149719, 0.41977575421333313, 0.46542906761169434, 0.5110824108123779, 0.5567356944084167, 0.6023889780044556, 0.6480423212051392, 0.6936956644058228, 0.7393489480018616, 0.7850022315979004, 0.830655574798584, 0.8763089179992676, 0.9219622015953064, 0.9676154851913452, 1.0132688283920288, 1.0589221715927124, 1.1045753955841064, 1.15022873878479, 1.1958820819854736, 1.2415354251861572, 1.2871887683868408, 1.3328419923782349, 1.3784953355789185, 1.424148678779602, 1.469801902770996, 1.5154552459716797, 1.5611085891723633]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 12.0, 18.0, 23.0, 50.0, 54.0, 87.0, 139.0, 231.0, 361.0, 564.0, 839.0, 1272.0, 1955.0, 3119.0, 4894.0, 7515.0, 11383.0, 17296.0, 25425.0, 36209.0, 50124.0, 67055.0, 84012.0, 99669.0, 108911.0, 109134.0, 100086.0, 85735.0, 67929.0, 50990.0, 36845.0, 25873.0, 17287.0, 11838.0, 7746.0, 4876.0, 3256.0, 2045.0, 1343.0, 849.0, 535.0, 343.0, 226.0, 152.0, 95.0, 41.0, 33.0, 28.0, 28.0, 7.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2749176025390625, -1.232452392578125, -1.1899871826171875, -1.14752197265625, -1.1050567626953125, -1.062591552734375, -1.0201263427734375, -0.9776611328125, -0.9351959228515625, -0.892730712890625, -0.8502655029296875, -0.80780029296875, -0.7653350830078125, -0.722869873046875, -0.6804046630859375, -0.637939453125, -0.5954742431640625, -0.553009033203125, -0.5105438232421875, -0.46807861328125, -0.4256134033203125, -0.383148193359375, -0.3406829833984375, -0.2982177734375, -0.2557525634765625, -0.213287353515625, -0.1708221435546875, -0.12835693359375, -0.0858917236328125, -0.043426513671875, -0.0009613037109375, 0.04150390625, 0.0839691162109375, 0.126434326171875, 0.1688995361328125, 0.21136474609375, 0.2538299560546875, 0.296295166015625, 0.3387603759765625, 0.3812255859375, 0.4236907958984375, 0.466156005859375, 0.5086212158203125, 0.55108642578125, 0.5935516357421875, 0.636016845703125, 0.6784820556640625, 0.720947265625, 0.7634124755859375, 0.805877685546875, 0.8483428955078125, 0.89080810546875, 0.9332733154296875, 0.975738525390625, 1.0182037353515625, 1.0606689453125, 1.1031341552734375, 1.145599365234375, 1.1880645751953125, 1.23052978515625, 1.2729949951171875, 1.315460205078125, 1.3579254150390625, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 11.0, 13.0, 15.0, 22.0, 18.0, 20.0, 27.0, 29.0, 26.0, 18.0, 34.0, 25.0, 33.0, 40.0, 38.0, 40.0, 33.0, 48.0, 40.0, 40.0, 46.0, 31.0, 20.0, 27.0, 27.0, 23.0, 31.0, 17.0, 20.0, 24.0, 13.0, 17.0, 19.0, 16.0, 10.0, 8.0, 8.0, 4.0, 6.0, 1.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.5146484375, -1.4691009521484375, -1.423553466796875, -1.3780059814453125, -1.33245849609375, -1.2869110107421875, -1.241363525390625, -1.1958160400390625, -1.1502685546875, -1.1047210693359375, -1.059173583984375, -1.0136260986328125, -0.96807861328125, -0.9225311279296875, -0.876983642578125, -0.8314361572265625, -0.785888671875, -0.7403411865234375, -0.694793701171875, -0.6492462158203125, -0.60369873046875, -0.5581512451171875, -0.512603759765625, -0.4670562744140625, -0.4215087890625, -0.3759613037109375, -0.330413818359375, -0.2848663330078125, -0.23931884765625, -0.1937713623046875, -0.148223876953125, -0.1026763916015625, -0.05712890625, -0.0115814208984375, 0.033966064453125, 0.0795135498046875, 0.12506103515625, 0.1706085205078125, 0.216156005859375, 0.2617034912109375, 0.3072509765625, 0.3527984619140625, 0.398345947265625, 0.4438934326171875, 0.48944091796875, 0.5349884033203125, 0.580535888671875, 0.6260833740234375, 0.671630859375, 0.7171783447265625, 0.762725830078125, 0.8082733154296875, 0.85382080078125, 0.8993682861328125, 0.944915771484375, 0.9904632568359375, 1.0360107421875, 1.0815582275390625, 1.127105712890625, 1.1726531982421875, 1.21820068359375, 1.2637481689453125, 1.309295654296875, 1.3548431396484375, 1.400390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 15.0, 26.0, 34.0, 64.0, 90.0, 154.0, 214.0, 373.0, 565.0, 886.0, 1422.0, 2326.0, 3504.0, 5587.0, 8588.0, 13287.0, 20391.0, 30099.0, 43180.0, 59122.0, 77582.0, 95084.0, 108012.0, 112504.0, 106995.0, 94487.0, 77092.0, 58695.0, 42529.0, 29508.0, 19641.0, 12991.0, 8564.0, 5412.0, 3494.0, 2273.0, 1331.0, 874.0, 569.0, 356.0, 229.0, 158.0, 90.0, 52.0, 33.0, 24.0, 12.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.40625, -1.3642425537109375, -1.322235107421875, -1.2802276611328125, -1.23822021484375, -1.1962127685546875, -1.154205322265625, -1.1121978759765625, -1.0701904296875, -1.0281829833984375, -0.986175537109375, -0.9441680908203125, -0.90216064453125, -0.8601531982421875, -0.818145751953125, -0.7761383056640625, -0.734130859375, -0.6921234130859375, -0.650115966796875, -0.6081085205078125, -0.56610107421875, -0.5240936279296875, -0.482086181640625, -0.4400787353515625, -0.3980712890625, -0.3560638427734375, -0.314056396484375, -0.2720489501953125, -0.23004150390625, -0.1880340576171875, -0.146026611328125, -0.1040191650390625, -0.06201171875, -0.0200042724609375, 0.022003173828125, 0.0640106201171875, 0.10601806640625, 0.1480255126953125, 0.190032958984375, 0.2320404052734375, 0.2740478515625, 0.3160552978515625, 0.358062744140625, 0.4000701904296875, 0.44207763671875, 0.4840850830078125, 0.526092529296875, 0.5680999755859375, 0.610107421875, 0.6521148681640625, 0.694122314453125, 0.7361297607421875, 0.77813720703125, 0.8201446533203125, 0.862152099609375, 0.9041595458984375, 0.9461669921875, 0.9881744384765625, 1.030181884765625, 1.0721893310546875, 1.11419677734375, 1.1562042236328125, 1.198211669921875, 1.2402191162109375, 1.2822265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 2.0, 8.0, 12.0, 5.0, 14.0, 10.0, 12.0, 19.0, 18.0, 16.0, 23.0, 27.0, 13.0, 33.0, 24.0, 30.0, 31.0, 31.0, 31.0, 35.0, 31.0, 33.0, 35.0, 42.0, 42.0, 42.0, 39.0, 21.0, 42.0, 25.0, 30.0, 31.0, 22.0, 23.0, 18.0, 21.0, 17.0, 17.0, 11.0, 9.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9072265625, -0.8786849975585938, -0.8501434326171875, -0.8216018676757812, -0.793060302734375, -0.7645187377929688, -0.7359771728515625, -0.7074356079101562, -0.67889404296875, -0.6503524780273438, -0.6218109130859375, -0.5932693481445312, -0.564727783203125, -0.5361862182617188, -0.5076446533203125, -0.47910308837890625, -0.4505615234375, -0.42201995849609375, -0.3934783935546875, -0.36493682861328125, -0.336395263671875, -0.30785369873046875, -0.2793121337890625, -0.25077056884765625, -0.22222900390625, -0.19368743896484375, -0.1651458740234375, -0.13660430908203125, -0.108062744140625, -0.07952117919921875, -0.0509796142578125, -0.02243804931640625, 0.006103515625, 0.03464508056640625, 0.0631866455078125, 0.09172821044921875, 0.120269775390625, 0.14881134033203125, 0.1773529052734375, 0.20589447021484375, 0.23443603515625, 0.26297760009765625, 0.2915191650390625, 0.32006072998046875, 0.348602294921875, 0.37714385986328125, 0.4056854248046875, 0.43422698974609375, 0.4627685546875, 0.49131011962890625, 0.5198516845703125, 0.5483932495117188, 0.576934814453125, 0.6054763793945312, 0.6340179443359375, 0.6625595092773438, 0.69110107421875, 0.7196426391601562, 0.7481842041015625, 0.7767257690429688, 0.805267333984375, 0.8338088989257812, 0.8623504638671875, 0.8908920288085938, 0.91943359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 8.0, 16.0, 14.0, 24.0, 38.0, 48.0, 80.0, 126.0, 185.0, 286.0, 466.0, 680.0, 1139.0, 1975.0, 3384.0, 5995.0, 11202.0, 21092.0, 39146.0, 73194.0, 124782.0, 182377.0, 200390.0, 159393.0, 100831.0, 55619.0, 30179.0, 15855.0, 8473.0, 4718.0, 2667.0, 1543.0, 925.0, 556.0, 346.0, 246.0, 158.0, 118.0, 61.0, 60.0, 40.0, 27.0, 26.0, 16.0, 6.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.2763671875, -1.2368316650390625, -1.197296142578125, -1.1577606201171875, -1.11822509765625, -1.0786895751953125, -1.039154052734375, -0.9996185302734375, -0.9600830078125, -0.9205474853515625, -0.881011962890625, -0.8414764404296875, -0.80194091796875, -0.7624053955078125, -0.722869873046875, -0.6833343505859375, -0.643798828125, -0.6042633056640625, -0.564727783203125, -0.5251922607421875, -0.48565673828125, -0.4461212158203125, -0.406585693359375, -0.3670501708984375, -0.3275146484375, -0.2879791259765625, -0.248443603515625, -0.2089080810546875, -0.16937255859375, -0.1298370361328125, -0.090301513671875, -0.0507659912109375, -0.01123046875, 0.0283050537109375, 0.067840576171875, 0.1073760986328125, 0.14691162109375, 0.1864471435546875, 0.225982666015625, 0.2655181884765625, 0.3050537109375, 0.3445892333984375, 0.384124755859375, 0.4236602783203125, 0.46319580078125, 0.5027313232421875, 0.542266845703125, 0.5818023681640625, 0.621337890625, 0.6608734130859375, 0.700408935546875, 0.7399444580078125, 0.77947998046875, 0.8190155029296875, 0.858551025390625, 0.8980865478515625, 0.9376220703125, 0.9771575927734375, 1.016693115234375, 1.0562286376953125, 1.09576416015625, 1.1352996826171875, 1.174835205078125, 1.2143707275390625, 1.25390625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 3.0, 9.0, 12.0, 12.0, 12.0, 23.0, 34.0, 32.0, 38.0, 44.0, 49.0, 57.0, 48.0, 64.0, 60.0, 44.0, 61.0, 60.0, 52.0, 37.0, 46.0, 33.0, 40.0, 19.0, 19.0, 22.0, 13.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010466575622558594, -0.00010150019079446793, -9.833462536334991e-05, -9.51690599322319e-05, -9.200349450111389e-05, -8.883792906999588e-05, -8.567236363887787e-05, -8.250679820775986e-05, -7.934123277664185e-05, -7.617566734552383e-05, -7.301010191440582e-05, -6.984453648328781e-05, -6.66789710521698e-05, -6.351340562105179e-05, -6.034784018993378e-05, -5.7182274758815765e-05, -5.4016709327697754e-05, -5.085114389657974e-05, -4.768557846546173e-05, -4.452001303434372e-05, -4.135444760322571e-05, -3.8188882172107697e-05, -3.5023316740989685e-05, -3.1857751309871674e-05, -2.8692185878753662e-05, -2.552662044763565e-05, -2.236105501651764e-05, -1.9195489585399628e-05, -1.6029924154281616e-05, -1.2864358723163605e-05, -9.698793292045593e-06, -6.533227860927582e-06, -3.3676624298095703e-06, -2.0209699869155884e-07, 2.9634684324264526e-06, 6.129033863544464e-06, 9.294599294662476e-06, 1.2460164725780487e-05, 1.56257301568985e-05, 1.879129558801651e-05, 2.195686101913452e-05, 2.5122426450252533e-05, 2.8287991881370544e-05, 3.1453557312488556e-05, 3.461912274360657e-05, 3.778468817472458e-05, 4.095025360584259e-05, 4.41158190369606e-05, 4.728138446807861e-05, 5.0446949899196625e-05, 5.3612515330314636e-05, 5.677808076143265e-05, 5.994364619255066e-05, 6.310921162366867e-05, 6.627477705478668e-05, 6.94403424859047e-05, 7.26059079170227e-05, 7.577147334814072e-05, 7.893703877925873e-05, 8.210260421037674e-05, 8.526816964149475e-05, 8.843373507261276e-05, 9.159930050373077e-05, 9.476486593484879e-05, 9.79304313659668e-05]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 11.0, 17.0, 17.0, 40.0, 38.0, 42.0, 63.0, 79.0, 145.0, 222.0, 301.0, 461.0, 755.0, 1174.0, 1822.0, 2861.0, 4667.0, 7651.0, 12413.0, 19913.0, 32585.0, 51298.0, 79006.0, 112705.0, 143082.0, 152351.0, 134546.0, 102270.0, 69718.0, 44877.0, 28237.0, 17182.0, 10528.0, 6524.0, 4006.0, 2549.0, 1504.0, 1038.0, 628.0, 403.0, 251.0, 179.0, 107.0, 81.0, 58.0, 49.0, 29.0, 23.0, 13.0, 14.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0], "bins": [-0.9375, -0.9085159301757812, -0.8795318603515625, -0.8505477905273438, -0.821563720703125, -0.7925796508789062, -0.7635955810546875, -0.7346115112304688, -0.70562744140625, -0.6766433715820312, -0.6476593017578125, -0.6186752319335938, -0.589691162109375, -0.5607070922851562, -0.5317230224609375, -0.5027389526367188, -0.4737548828125, -0.44477081298828125, -0.4157867431640625, -0.38680267333984375, -0.357818603515625, -0.32883453369140625, -0.2998504638671875, -0.27086639404296875, -0.24188232421875, -0.21289825439453125, -0.1839141845703125, -0.15493011474609375, -0.125946044921875, -0.09696197509765625, -0.0679779052734375, -0.03899383544921875, -0.010009765625, 0.01897430419921875, 0.0479583740234375, 0.07694244384765625, 0.105926513671875, 0.13491058349609375, 0.1638946533203125, 0.19287872314453125, 0.22186279296875, 0.25084686279296875, 0.2798309326171875, 0.30881500244140625, 0.337799072265625, 0.36678314208984375, 0.3957672119140625, 0.42475128173828125, 0.4537353515625, 0.48271942138671875, 0.5117034912109375, 0.5406875610351562, 0.569671630859375, 0.5986557006835938, 0.6276397705078125, 0.6566238403320312, 0.68560791015625, 0.7145919799804688, 0.7435760498046875, 0.7725601196289062, 0.801544189453125, 0.8305282592773438, 0.8595123291015625, 0.8884963989257812, 0.91748046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 7.0, 4.0, 10.0, 12.0, 20.0, 16.0, 22.0, 31.0, 28.0, 31.0, 32.0, 39.0, 44.0, 50.0, 60.0, 58.0, 63.0, 50.0, 54.0, 55.0, 57.0, 43.0, 35.0, 31.0, 30.0, 30.0, 21.0, 17.0, 11.0, 12.0, 9.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47867584228515625, -0.4656524658203125, -0.45262908935546875, -0.439605712890625, -0.42658233642578125, -0.4135589599609375, -0.40053558349609375, -0.38751220703125, -0.37448883056640625, -0.3614654541015625, -0.34844207763671875, -0.335418701171875, -0.32239532470703125, -0.3093719482421875, -0.29634857177734375, -0.2833251953125, -0.27030181884765625, -0.2572784423828125, -0.24425506591796875, -0.231231689453125, -0.21820831298828125, -0.2051849365234375, -0.19216156005859375, -0.17913818359375, -0.16611480712890625, -0.1530914306640625, -0.14006805419921875, -0.127044677734375, -0.11402130126953125, -0.1009979248046875, -0.08797454833984375, -0.074951171875, -0.06192779541015625, -0.0489044189453125, -0.03588104248046875, -0.022857666015625, -0.00983428955078125, 0.0031890869140625, 0.01621246337890625, 0.02923583984375, 0.04225921630859375, 0.0552825927734375, 0.06830596923828125, 0.081329345703125, 0.09435272216796875, 0.1073760986328125, 0.12039947509765625, 0.1334228515625, 0.14644622802734375, 0.1594696044921875, 0.17249298095703125, 0.185516357421875, 0.19853973388671875, 0.2115631103515625, 0.22458648681640625, 0.23760986328125, 0.25063323974609375, 0.2636566162109375, 0.27667999267578125, 0.289703369140625, 0.30272674560546875, 0.3157501220703125, 0.32877349853515625, 0.341796875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 13.0, 12.0, 15.0, 9.0, 26.0, 20.0, 29.0, 34.0, 40.0, 39.0, 37.0, 52.0, 46.0, 45.0, 56.0, 49.0, 57.0, 49.0, 38.0, 55.0, 48.0, 31.0, 31.0, 25.0, 20.0, 15.0, 24.0, 11.0, 12.0, 12.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8894098997116089, -1.829939365386963, -1.770468831062317, -1.710998296737671, -1.651527762413025, -1.592057228088379, -1.5325868129730225, -1.4731162786483765, -1.4136457443237305, -1.3541752099990845, -1.2947046756744385, -1.2352341413497925, -1.1757636070251465, -1.11629319190979, -1.0568225383758545, -0.997352123260498, -0.9378815293312073, -0.8784109950065613, -0.8189404606819153, -0.7594699859619141, -0.6999994516372681, -0.6405289173126221, -0.5810583829879761, -0.5215878486633301, -0.46211734414100647, -0.4026468098163605, -0.34317630529403687, -0.28370577096939087, -0.22423525154590607, -0.16476473212242126, -0.10529419779777527, -0.04582369327545166, 0.013646841049194336, 0.07311736047267914, 0.13258787989616394, 0.19205841422080994, 0.25152891874313354, 0.31099945306777954, 0.37046998739242554, 0.42994049191474915, 0.48941102623939514, 0.5488815307617188, 0.6083520650863647, 0.6678225994110107, 0.7272931337356567, 0.7867636680603027, 0.8462342023849487, 0.90570467710495, 0.965175211429596, 1.0246456861495972, 1.0841162204742432, 1.1435867547988892, 1.2030572891235352, 1.2625278234481812, 1.3219983577728271, 1.3814688920974731, 1.4409394264221191, 1.5004099607467651, 1.5598804950714111, 1.6193510293960571, 1.6788215637207031, 1.7382919788360596, 1.7977626323699951, 1.8572330474853516, 1.9167035818099976]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 1.0, 8.0, 9.0, 7.0, 12.0, 11.0, 9.0, 12.0, 13.0, 14.0, 35.0, 24.0, 17.0, 29.0, 31.0, 42.0, 30.0, 34.0, 35.0, 27.0, 41.0, 45.0, 41.0, 31.0, 41.0, 38.0, 39.0, 44.0, 29.0, 37.0, 26.0, 17.0, 21.0, 24.0, 21.0, 12.0, 10.0, 13.0, 17.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.371199607849121, -1.3224812746047974, -1.2737629413604736, -1.22504460811615, -1.1763262748718262, -1.1276079416275024, -1.0788896083831787, -1.0301713943481445, -0.981453001499176, -0.9327346682548523, -0.8840163350105286, -0.8352980613708496, -0.7865797281265259, -0.7378613948822021, -0.6891430616378784, -0.6404247283935547, -0.591706395149231, -0.5429880619049072, -0.4942697286605835, -0.44555142521858215, -0.3968330919742584, -0.3481147587299347, -0.29939645528793335, -0.2506781220436096, -0.2019597887992859, -0.15324145555496216, -0.10452313721179962, -0.055804818868637085, -0.0070864856243133545, 0.041631847620010376, 0.09035015106201172, 0.13906848430633545, 0.18778681755065918, 0.2365051507949829, 0.28522348403930664, 0.333941787481308, 0.3826601207256317, 0.43137845396995544, 0.4800967574119568, 0.5288150906562805, 0.5775334239006042, 0.626251757144928, 0.6749700903892517, 0.7236883640289307, 0.7724066972732544, 0.8211250305175781, 0.8698433637619019, 0.9185616970062256, 0.9672800302505493, 1.015998363494873, 1.0647166967391968, 1.1134350299835205, 1.1621533632278442, 1.210871696472168, 1.2595899105072021, 1.3083083629608154, 1.3570265769958496, 1.4057449102401733, 1.454463243484497, 1.5031815767288208, 1.5518999099731445, 1.6006182432174683, 1.649336576461792, 1.6980547904968262, 1.7467732429504395]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 12.0, 27.0, 39.0, 49.0, 79.0, 135.0, 225.0, 378.0, 655.0, 1170.0, 1907.0, 3451.0, 5958.0, 10651.0, 19230.0, 33416.0, 58904.0, 103499.0, 176924.0, 289343.0, 440194.0, 593615.0, 663971.0, 602063.0, 453475.0, 300291.0, 184695.0, 107892.0, 61816.0, 35026.0, 19654.0, 11040.0, 6208.0, 3646.0, 2000.0, 1098.0, 603.0, 379.0, 236.0, 125.0, 81.0, 51.0, 27.0, 23.0, 7.0, 10.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.609375, -1.559906005859375, -1.51043701171875, -1.460968017578125, -1.4114990234375, -1.362030029296875, -1.31256103515625, -1.263092041015625, -1.213623046875, -1.164154052734375, -1.11468505859375, -1.065216064453125, -1.0157470703125, -0.966278076171875, -0.91680908203125, -0.867340087890625, -0.81787109375, -0.768402099609375, -0.71893310546875, -0.669464111328125, -0.6199951171875, -0.570526123046875, -0.52105712890625, -0.471588134765625, -0.422119140625, -0.372650146484375, -0.32318115234375, -0.273712158203125, -0.2242431640625, -0.174774169921875, -0.12530517578125, -0.075836181640625, -0.0263671875, 0.023101806640625, 0.07257080078125, 0.122039794921875, 0.1715087890625, 0.220977783203125, 0.27044677734375, 0.319915771484375, 0.369384765625, 0.418853759765625, 0.46832275390625, 0.517791748046875, 0.5672607421875, 0.616729736328125, 0.66619873046875, 0.715667724609375, 0.76513671875, 0.814605712890625, 0.86407470703125, 0.913543701171875, 0.9630126953125, 1.012481689453125, 1.06195068359375, 1.111419677734375, 1.160888671875, 1.210357666015625, 1.25982666015625, 1.309295654296875, 1.3587646484375, 1.408233642578125, 1.45770263671875, 1.507171630859375, 1.556640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 12.0, 6.0, 7.0, 13.0, 9.0, 13.0, 14.0, 26.0, 23.0, 30.0, 20.0, 35.0, 25.0, 39.0, 36.0, 27.0, 37.0, 35.0, 33.0, 41.0, 34.0, 40.0, 28.0, 40.0, 36.0, 31.0, 33.0, 32.0, 26.0, 22.0, 22.0, 20.0, 11.0, 14.0, 17.0, 21.0, 15.0, 11.0, 7.0, 12.0, 5.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93505859375, -0.9029006958007812, -0.8707427978515625, -0.8385848999023438, -0.806427001953125, -0.7742691040039062, -0.7421112060546875, -0.7099533081054688, -0.67779541015625, -0.6456375122070312, -0.6134796142578125, -0.5813217163085938, -0.549163818359375, -0.5170059204101562, -0.4848480224609375, -0.45269012451171875, -0.4205322265625, -0.38837432861328125, -0.3562164306640625, -0.32405853271484375, -0.291900634765625, -0.25974273681640625, -0.2275848388671875, -0.19542694091796875, -0.16326904296875, -0.13111114501953125, -0.0989532470703125, -0.06679534912109375, -0.034637451171875, -0.00247955322265625, 0.0296783447265625, 0.06183624267578125, 0.093994140625, 0.12615203857421875, 0.1583099365234375, 0.19046783447265625, 0.222625732421875, 0.25478363037109375, 0.2869415283203125, 0.31909942626953125, 0.35125732421875, 0.38341522216796875, 0.4155731201171875, 0.44773101806640625, 0.479888916015625, 0.5120468139648438, 0.5442047119140625, 0.5763626098632812, 0.6085205078125, 0.6406784057617188, 0.6728363037109375, 0.7049942016601562, 0.737152099609375, 0.7693099975585938, 0.8014678955078125, 0.8336257934570312, 0.86578369140625, 0.8979415893554688, 0.9300994873046875, 0.9622573852539062, 0.994415283203125, 1.0265731811523438, 1.0587310791015625, 1.0908889770507812, 1.123046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 10.0, 16.0, 18.0, 36.0, 67.0, 119.0, 149.0, 267.0, 470.0, 755.0, 1308.0, 2118.0, 3435.0, 5913.0, 9869.0, 16485.0, 27229.0, 44764.0, 72471.0, 113592.0, 175828.0, 255213.0, 352056.0, 443335.0, 506013.0, 513012.0, 463209.0, 375762.0, 278724.0, 193409.0, 128425.0, 81391.0, 50984.0, 30690.0, 18794.0, 11265.0, 6935.0, 4039.0, 2419.0, 1484.0, 884.0, 508.0, 314.0, 189.0, 113.0, 80.0, 58.0, 30.0, 14.0, 12.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.3486328125, -1.30792236328125, -1.2672119140625, -1.22650146484375, -1.185791015625, -1.14508056640625, -1.1043701171875, -1.06365966796875, -1.02294921875, -0.98223876953125, -0.9415283203125, -0.90081787109375, -0.860107421875, -0.81939697265625, -0.7786865234375, -0.73797607421875, -0.697265625, -0.65655517578125, -0.6158447265625, -0.57513427734375, -0.534423828125, -0.49371337890625, -0.4530029296875, -0.41229248046875, -0.37158203125, -0.33087158203125, -0.2901611328125, -0.24945068359375, -0.208740234375, -0.16802978515625, -0.1273193359375, -0.08660888671875, -0.0458984375, -0.00518798828125, 0.0355224609375, 0.07623291015625, 0.116943359375, 0.15765380859375, 0.1983642578125, 0.23907470703125, 0.27978515625, 0.32049560546875, 0.3612060546875, 0.40191650390625, 0.442626953125, 0.48333740234375, 0.5240478515625, 0.56475830078125, 0.60546875, 0.64617919921875, 0.6868896484375, 0.72760009765625, 0.768310546875, 0.80902099609375, 0.8497314453125, 0.89044189453125, 0.93115234375, 0.97186279296875, 1.0125732421875, 1.05328369140625, 1.093994140625, 1.13470458984375, 1.1754150390625, 1.21612548828125, 1.2568359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 9.0, 5.0, 8.0, 13.0, 14.0, 28.0, 29.0, 25.0, 44.0, 61.0, 65.0, 83.0, 88.0, 90.0, 108.0, 127.0, 149.0, 176.0, 197.0, 186.0, 208.0, 228.0, 216.0, 199.0, 203.0, 173.0, 185.0, 173.0, 134.0, 138.0, 111.0, 111.0, 101.0, 67.0, 69.0, 46.0, 43.0, 43.0, 33.0, 21.0, 12.0, 13.0, 8.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5343780517578125, -0.516998291015625, -0.4996185302734375, -0.48223876953125, -0.4648590087890625, -0.447479248046875, -0.4300994873046875, -0.4127197265625, -0.3953399658203125, -0.377960205078125, -0.3605804443359375, -0.34320068359375, -0.3258209228515625, -0.308441162109375, -0.2910614013671875, -0.273681640625, -0.2563018798828125, -0.238922119140625, -0.2215423583984375, -0.20416259765625, -0.1867828369140625, -0.169403076171875, -0.1520233154296875, -0.1346435546875, -0.1172637939453125, -0.099884033203125, -0.0825042724609375, -0.06512451171875, -0.0477447509765625, -0.030364990234375, -0.0129852294921875, 0.00439453125, 0.0217742919921875, 0.039154052734375, 0.0565338134765625, 0.07391357421875, 0.0912933349609375, 0.108673095703125, 0.1260528564453125, 0.1434326171875, 0.1608123779296875, 0.178192138671875, 0.1955718994140625, 0.21295166015625, 0.2303314208984375, 0.247711181640625, 0.2650909423828125, 0.282470703125, 0.2998504638671875, 0.317230224609375, 0.3346099853515625, 0.35198974609375, 0.3693695068359375, 0.386749267578125, 0.4041290283203125, 0.4215087890625, 0.4388885498046875, 0.456268310546875, 0.4736480712890625, 0.49102783203125, 0.5084075927734375, 0.525787353515625, 0.5431671142578125, 0.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 5.0, 8.0, 6.0, 15.0, 15.0, 29.0, 25.0, 38.0, 39.0, 42.0, 46.0, 48.0, 69.0, 72.0, 57.0, 68.0, 53.0, 69.0, 53.0, 46.0, 38.0, 34.0, 21.0, 19.0, 28.0, 11.0, 10.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8024777173995972, -1.7369765043258667, -1.6714752912521362, -1.6059740781784058, -1.5404728651046753, -1.4749716520309448, -1.409470558166504, -1.3439693450927734, -1.278468132019043, -1.2129669189453125, -1.147465705871582, -1.0819644927978516, -1.016463279724121, -0.9509620666503906, -0.8854609131813049, -0.8199597001075745, -0.7544584274291992, -0.6889572143554688, -0.6234560012817383, -0.5579547882080078, -0.49245360493659973, -0.42695239186286926, -0.3614512085914612, -0.2959499955177307, -0.23044878244400024, -0.16494756937026978, -0.0994463711977005, -0.033945173025131226, 0.03155604004859924, 0.09705725312232971, 0.1625584363937378, 0.22805964946746826, 0.2935607433319092, 0.35906195640563965, 0.4245631694793701, 0.4900643527507782, 0.555565595626831, 0.6210668087005615, 0.6865679621696472, 0.7520691752433777, 0.8175703883171082, 0.8830716013908386, 0.9485728144645691, 1.0140739679336548, 1.0795751810073853, 1.1450763940811157, 1.2105776071548462, 1.2760788202285767, 1.3415800333023071, 1.4070812463760376, 1.472582459449768, 1.5380836725234985, 1.603584885597229, 1.6690860986709595, 1.7345871925354004, 1.8000884056091309, 1.8655896186828613, 1.9310908317565918, 1.9965920448303223, 2.0620932579040527, 2.127594470977783, 2.1930956840515137, 2.258596897125244, 2.3240981101989746, 2.389599323272705]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 4.0, 3.0, 8.0, 8.0, 17.0, 11.0, 10.0, 22.0, 13.0, 21.0, 24.0, 29.0, 29.0, 30.0, 35.0, 30.0, 35.0, 38.0, 29.0, 33.0, 35.0, 43.0, 43.0, 33.0, 40.0, 41.0, 38.0, 33.0, 34.0, 28.0, 24.0, 26.0, 25.0, 17.0, 11.0, 7.0, 12.0, 19.0, 13.0, 10.0, 10.0, 2.0, 8.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.269423007965088, -1.2290480136871338, -1.1886730194091797, -1.1482980251312256, -1.1079230308532715, -1.0675479173660278, -1.0271729230880737, -0.9867979288101196, -0.9464229345321655, -0.9060479402542114, -0.8656729459762573, -0.8252978920936584, -0.7849228978157043, -0.7445479035377502, -0.7041728496551514, -0.6637978553771973, -0.6234228610992432, -0.5830478668212891, -0.542672872543335, -0.5022978186607361, -0.461922824382782, -0.4215478301048279, -0.3811728060245514, -0.3407977819442749, -0.3004227876663208, -0.2600477933883667, -0.2196727693080902, -0.17929776012897491, -0.13892275094985962, -0.09854774177074432, -0.05817273259162903, -0.01779770851135254, 0.022577285766601562, 0.06295229494571686, 0.10332730412483215, 0.14370231330394745, 0.18407732248306274, 0.22445233166217804, 0.26482734084129333, 0.3052023649215698, 0.3455773591995239, 0.385952353477478, 0.4263273775577545, 0.466702401638031, 0.5070773959159851, 0.5474523901939392, 0.5878274440765381, 0.6282024383544922, 0.6685774326324463, 0.7089524269104004, 0.7493274211883545, 0.7897024750709534, 0.8300774693489075, 0.8704524636268616, 0.9108275175094604, 0.9512025117874146, 0.9915775060653687, 1.0319525003433228, 1.0723274946212769, 1.112702488899231, 1.1530776023864746, 1.1934525966644287, 1.2338275909423828, 1.274202585220337, 1.314577579498291]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 9.0, 12.0, 20.0, 43.0, 38.0, 70.0, 96.0, 146.0, 195.0, 279.0, 424.0, 633.0, 875.0, 1368.0, 2180.0, 3483.0, 5805.0, 9731.0, 16791.0, 29913.0, 52774.0, 91020.0, 147701.0, 200017.0, 184602.0, 124050.0, 74536.0, 42984.0, 23994.0, 13773.0, 7985.0, 4761.0, 2828.0, 1706.0, 1259.0, 759.0, 508.0, 339.0, 253.0, 174.0, 131.0, 97.0, 60.0, 36.0, 32.0, 19.0, 14.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.72021484375, -0.69891357421875, -0.6776123046875, -0.65631103515625, -0.635009765625, -0.61370849609375, -0.5924072265625, -0.57110595703125, -0.5498046875, -0.52850341796875, -0.5072021484375, -0.48590087890625, -0.464599609375, -0.44329833984375, -0.4219970703125, -0.40069580078125, -0.37939453125, -0.35809326171875, -0.3367919921875, -0.31549072265625, -0.294189453125, -0.27288818359375, -0.2515869140625, -0.23028564453125, -0.208984375, -0.18768310546875, -0.1663818359375, -0.14508056640625, -0.123779296875, -0.10247802734375, -0.0811767578125, -0.05987548828125, -0.03857421875, -0.01727294921875, 0.0040283203125, 0.02532958984375, 0.046630859375, 0.06793212890625, 0.0892333984375, 0.11053466796875, 0.1318359375, 0.15313720703125, 0.1744384765625, 0.19573974609375, 0.217041015625, 0.23834228515625, 0.2596435546875, 0.28094482421875, 0.30224609375, 0.32354736328125, 0.3448486328125, 0.36614990234375, 0.387451171875, 0.40875244140625, 0.4300537109375, 0.45135498046875, 0.47265625, 0.49395751953125, 0.5152587890625, 0.53656005859375, 0.557861328125, 0.57916259765625, 0.6004638671875, 0.62176513671875, 0.64306640625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 9.0, 6.0, 8.0, 13.0, 11.0, 15.0, 17.0, 12.0, 24.0, 24.0, 32.0, 21.0, 30.0, 31.0, 30.0, 37.0, 46.0, 36.0, 34.0, 42.0, 48.0, 31.0, 33.0, 48.0, 36.0, 42.0, 34.0, 32.0, 20.0, 22.0, 25.0, 23.0, 12.0, 24.0, 14.0, 13.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.408203125, -1.36297607421875, -1.3177490234375, -1.27252197265625, -1.227294921875, -1.18206787109375, -1.1368408203125, -1.09161376953125, -1.04638671875, -1.00115966796875, -0.9559326171875, -0.91070556640625, -0.865478515625, -0.82025146484375, -0.7750244140625, -0.72979736328125, -0.6845703125, -0.63934326171875, -0.5941162109375, -0.54888916015625, -0.503662109375, -0.45843505859375, -0.4132080078125, -0.36798095703125, -0.32275390625, -0.27752685546875, -0.2322998046875, -0.18707275390625, -0.141845703125, -0.09661865234375, -0.0513916015625, -0.00616455078125, 0.0390625, 0.08428955078125, 0.1295166015625, 0.17474365234375, 0.219970703125, 0.26519775390625, 0.3104248046875, 0.35565185546875, 0.40087890625, 0.44610595703125, 0.4913330078125, 0.53656005859375, 0.581787109375, 0.62701416015625, 0.6722412109375, 0.71746826171875, 0.7626953125, 0.80792236328125, 0.8531494140625, 0.89837646484375, 0.943603515625, 0.98883056640625, 1.0340576171875, 1.07928466796875, 1.12451171875, 1.16973876953125, 1.2149658203125, 1.26019287109375, 1.305419921875, 1.35064697265625, 1.3958740234375, 1.44110107421875, 1.486328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 7.0, 1.0, 11.0, 12.0, 24.0, 34.0, 52.0, 66.0, 105.0, 138.0, 231.0, 358.0, 622.0, 1085.0, 2223.0, 4879.0, 12454.0, 38183.0, 130315.0, 389692.0, 322990.0, 97387.0, 29203.0, 10148.0, 4073.0, 1819.0, 936.0, 549.0, 348.0, 215.0, 117.0, 93.0, 62.0, 29.0, 31.0, 24.0, 17.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4833984375, -1.4396209716796875, -1.395843505859375, -1.3520660400390625, -1.30828857421875, -1.2645111083984375, -1.220733642578125, -1.1769561767578125, -1.1331787109375, -1.0894012451171875, -1.045623779296875, -1.0018463134765625, -0.95806884765625, -0.9142913818359375, -0.870513916015625, -0.8267364501953125, -0.782958984375, -0.7391815185546875, -0.695404052734375, -0.6516265869140625, -0.60784912109375, -0.5640716552734375, -0.520294189453125, -0.4765167236328125, -0.4327392578125, -0.3889617919921875, -0.345184326171875, -0.3014068603515625, -0.25762939453125, -0.2138519287109375, -0.170074462890625, -0.1262969970703125, -0.08251953125, -0.0387420654296875, 0.005035400390625, 0.0488128662109375, 0.09259033203125, 0.1363677978515625, 0.180145263671875, 0.2239227294921875, 0.2677001953125, 0.3114776611328125, 0.355255126953125, 0.3990325927734375, 0.44281005859375, 0.4865875244140625, 0.530364990234375, 0.5741424560546875, 0.617919921875, 0.6616973876953125, 0.705474853515625, 0.7492523193359375, 0.79302978515625, 0.8368072509765625, 0.880584716796875, 0.9243621826171875, 0.9681396484375, 1.0119171142578125, 1.055694580078125, 1.0994720458984375, 1.14324951171875, 1.1870269775390625, 1.230804443359375, 1.2745819091796875, 1.318359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 2.0, 3.0, 8.0, 13.0, 12.0, 13.0, 14.0, 16.0, 14.0, 17.0, 18.0, 27.0, 26.0, 20.0, 33.0, 27.0, 38.0, 45.0, 34.0, 29.0, 35.0, 44.0, 41.0, 46.0, 42.0, 27.0, 27.0, 37.0, 33.0, 25.0, 24.0, 22.0, 19.0, 22.0, 27.0, 19.0, 17.0, 17.0, 11.0, 11.0, 7.0, 5.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9482421875, -0.9193344116210938, -0.8904266357421875, -0.8615188598632812, -0.832611083984375, -0.8037033081054688, -0.7747955322265625, -0.7458877563476562, -0.71697998046875, -0.6880722045898438, -0.6591644287109375, -0.6302566528320312, -0.601348876953125, -0.5724411010742188, -0.5435333251953125, -0.5146255493164062, -0.4857177734375, -0.45680999755859375, -0.4279022216796875, -0.39899444580078125, -0.370086669921875, -0.34117889404296875, -0.3122711181640625, -0.28336334228515625, -0.25445556640625, -0.22554779052734375, -0.1966400146484375, -0.16773223876953125, -0.138824462890625, -0.10991668701171875, -0.0810089111328125, -0.05210113525390625, -0.023193359375, 0.00571441650390625, 0.0346221923828125, 0.06352996826171875, 0.092437744140625, 0.12134552001953125, 0.1502532958984375, 0.17916107177734375, 0.20806884765625, 0.23697662353515625, 0.2658843994140625, 0.29479217529296875, 0.323699951171875, 0.35260772705078125, 0.3815155029296875, 0.41042327880859375, 0.4393310546875, 0.46823883056640625, 0.4971466064453125, 0.5260543823242188, 0.554962158203125, 0.5838699340820312, 0.6127777099609375, 0.6416854858398438, 0.67059326171875, 0.6995010375976562, 0.7284088134765625, 0.7573165893554688, 0.786224365234375, 0.8151321411132812, 0.8440399169921875, 0.8729476928710938, 0.90185546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 9.0, 12.0, 16.0, 23.0, 31.0, 49.0, 56.0, 78.0, 100.0, 157.0, 193.0, 277.0, 382.0, 552.0, 923.0, 1438.0, 2798.0, 6708.0, 28105.0, 601080.0, 371774.0, 21285.0, 5694.0, 2531.0, 1413.0, 835.0, 544.0, 383.0, 292.0, 191.0, 170.0, 102.0, 89.0, 64.0, 48.0, 41.0, 19.0, 23.0, 21.0, 14.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2080078125, -1.1662445068359375, -1.124481201171875, -1.0827178955078125, -1.04095458984375, -0.9991912841796875, -0.957427978515625, -0.9156646728515625, -0.8739013671875, -0.8321380615234375, -0.790374755859375, -0.7486114501953125, -0.70684814453125, -0.6650848388671875, -0.623321533203125, -0.5815582275390625, -0.539794921875, -0.4980316162109375, -0.456268310546875, -0.4145050048828125, -0.37274169921875, -0.3309783935546875, -0.289215087890625, -0.2474517822265625, -0.2056884765625, -0.1639251708984375, -0.122161865234375, -0.0803985595703125, -0.03863525390625, 0.0031280517578125, 0.044891357421875, 0.0866546630859375, 0.12841796875, 0.1701812744140625, 0.211944580078125, 0.2537078857421875, 0.29547119140625, 0.3372344970703125, 0.378997802734375, 0.4207611083984375, 0.4625244140625, 0.5042877197265625, 0.546051025390625, 0.5878143310546875, 0.62957763671875, 0.6713409423828125, 0.713104248046875, 0.7548675537109375, 0.796630859375, 0.8383941650390625, 0.880157470703125, 0.9219207763671875, 0.96368408203125, 1.0054473876953125, 1.047210693359375, 1.0889739990234375, 1.1307373046875, 1.1725006103515625, 1.214263916015625, 1.2560272216796875, 1.29779052734375, 1.3395538330078125, 1.381317138671875, 1.4230804443359375, 1.46484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 10.0, 7.0, 37.0, 166.0, 378.0, 271.0, 90.0, 23.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017905235290527344, -0.00017454568296670914, -0.00017003901302814484, -0.00016553234308958054, -0.00016102567315101624, -0.00015651900321245193, -0.00015201233327388763, -0.00014750566333532333, -0.00014299899339675903, -0.00013849232345819473, -0.00013398565351963043, -0.00012947898358106613, -0.00012497231364250183, -0.00012046564370393753, -0.00011595897376537323, -0.00011145230382680893, -0.00010694563388824463, -0.00010243896394968033, -9.793229401111603e-05, -9.342562407255173e-05, -8.891895413398743e-05, -8.441228419542313e-05, -7.990561425685883e-05, -7.539894431829453e-05, -7.089227437973022e-05, -6.638560444116592e-05, -6.187893450260162e-05, -5.737226456403732e-05, -5.286559462547302e-05, -4.835892468690872e-05, -4.385225474834442e-05, -3.934558480978012e-05, -3.483891487121582e-05, -3.033224493265152e-05, -2.582557499408722e-05, -2.131890505552292e-05, -1.6812235116958618e-05, -1.2305565178394318e-05, -7.798895239830017e-06, -3.2922253012657166e-06, 1.214444637298584e-06, 5.7211145758628845e-06, 1.0227784514427185e-05, 1.4734454452991486e-05, 1.9241124391555786e-05, 2.3747794330120087e-05, 2.8254464268684387e-05, 3.276113420724869e-05, 3.726780414581299e-05, 4.177447408437729e-05, 4.628114402294159e-05, 5.078781396150589e-05, 5.529448390007019e-05, 5.980115383863449e-05, 6.430782377719879e-05, 6.881449371576309e-05, 7.332116365432739e-05, 7.782783359289169e-05, 8.2334503531456e-05, 8.68411734700203e-05, 9.13478434085846e-05, 9.58545133471489e-05, 0.0001003611832857132, 0.0001048678532242775, 0.0001093745231628418]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 13.0, 18.0, 22.0, 33.0, 32.0, 56.0, 84.0, 101.0, 159.0, 233.0, 403.0, 732.0, 1164.0, 2207.0, 4459.0, 10179.0, 27892.0, 102862.0, 413747.0, 356340.0, 85602.0, 24236.0, 9093.0, 3952.0, 2007.0, 1109.0, 622.0, 392.0, 254.0, 155.0, 96.0, 66.0, 53.0, 42.0, 29.0, 25.0, 18.0, 9.0, 5.0, 5.0, 5.0, 5.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.75830078125, -0.7359542846679688, -0.7136077880859375, -0.6912612915039062, -0.668914794921875, -0.6465682983398438, -0.6242218017578125, -0.6018753051757812, -0.57952880859375, -0.5571823120117188, -0.5348358154296875, -0.5124893188476562, -0.490142822265625, -0.46779632568359375, -0.4454498291015625, -0.42310333251953125, -0.4007568359375, -0.37841033935546875, -0.3560638427734375, -0.33371734619140625, -0.311370849609375, -0.28902435302734375, -0.2666778564453125, -0.24433135986328125, -0.22198486328125, -0.19963836669921875, -0.1772918701171875, -0.15494537353515625, -0.132598876953125, -0.11025238037109375, -0.0879058837890625, -0.06555938720703125, -0.043212890625, -0.02086639404296875, 0.0014801025390625, 0.02382659912109375, 0.046173095703125, 0.06851959228515625, 0.0908660888671875, 0.11321258544921875, 0.13555908203125, 0.15790557861328125, 0.1802520751953125, 0.20259857177734375, 0.224945068359375, 0.24729156494140625, 0.2696380615234375, 0.29198455810546875, 0.3143310546875, 0.33667755126953125, 0.3590240478515625, 0.38137054443359375, 0.403717041015625, 0.42606353759765625, 0.4484100341796875, 0.47075653076171875, 0.49310302734375, 0.5154495239257812, 0.5377960205078125, 0.5601425170898438, 0.582489013671875, 0.6048355102539062, 0.6271820068359375, 0.6495285034179688, 0.671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 15.0, 18.0, 20.0, 35.0, 60.0, 128.0, 212.0, 219.0, 114.0, 70.0, 35.0, 33.0, 12.0, 9.0, 3.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.343505859375, -0.33570098876953125, -0.3278961181640625, -0.32009124755859375, -0.312286376953125, -0.30448150634765625, -0.2966766357421875, -0.28887176513671875, -0.28106689453125, -0.27326202392578125, -0.2654571533203125, -0.25765228271484375, -0.249847412109375, -0.24204254150390625, -0.2342376708984375, -0.22643280029296875, -0.2186279296875, -0.21082305908203125, -0.2030181884765625, -0.19521331787109375, -0.187408447265625, -0.17960357666015625, -0.1717987060546875, -0.16399383544921875, -0.15618896484375, -0.14838409423828125, -0.1405792236328125, -0.13277435302734375, -0.124969482421875, -0.11716461181640625, -0.1093597412109375, -0.10155487060546875, -0.09375, -0.08594512939453125, -0.0781402587890625, -0.07033538818359375, -0.062530517578125, -0.05472564697265625, -0.0469207763671875, -0.03911590576171875, -0.03131103515625, -0.02350616455078125, -0.0157012939453125, -0.00789642333984375, -9.1552734375e-05, 0.00771331787109375, 0.0155181884765625, 0.02332305908203125, 0.0311279296875, 0.03893280029296875, 0.0467376708984375, 0.05454254150390625, 0.062347412109375, 0.07015228271484375, 0.0779571533203125, 0.08576202392578125, 0.09356689453125, 0.10137176513671875, 0.1091766357421875, 0.11698150634765625, 0.124786376953125, 0.13259124755859375, 0.1403961181640625, 0.14820098876953125, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 2.0, 12.0, 11.0, 11.0, 17.0, 20.0, 25.0, 34.0, 35.0, 37.0, 45.0, 50.0, 59.0, 78.0, 57.0, 64.0, 53.0, 62.0, 65.0, 46.0, 43.0, 33.0, 33.0, 20.0, 15.0, 20.0, 13.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7161957025527954, -1.6523724794387817, -1.5885493755340576, -1.524726152420044, -1.4609029293060303, -1.3970797061920166, -1.333256483078003, -1.2694333791732788, -1.2056101560592651, -1.1417869329452515, -1.0779638290405273, -1.0141406059265137, -0.9503173828125, -0.8864941596984863, -0.8226709961891174, -0.7588478326797485, -0.6950246095657349, -0.6312013864517212, -0.5673782229423523, -0.5035550594329834, -0.4397318363189697, -0.37590864300727844, -0.31208544969558716, -0.24826225638389587, -0.1844390630722046, -0.1206158697605133, -0.05679267644882202, 0.007030516862869263, 0.07085371017456055, 0.13467690348625183, 0.19850009679794312, 0.2623232901096344, 0.32614636421203613, 0.3899695575237274, 0.4537927508354187, 0.5176159143447876, 0.5814391374588013, 0.6452623605728149, 0.7090855240821838, 0.7729086875915527, 0.8367319107055664, 0.9005551338195801, 0.964378297328949, 1.0282014608383179, 1.0920246839523315, 1.1558479070663452, 1.2196710109710693, 1.283494234085083, 1.3473174571990967, 1.4111406803131104, 1.474963903427124, 1.5387870073318481, 1.6026102304458618, 1.6664334535598755, 1.7302565574645996, 1.7940797805786133, 1.857903003692627, 1.9217262268066406, 1.9855494499206543, 2.049372673034668, 2.1131958961486816, 2.177018880844116, 2.24084210395813, 2.3046653270721436, 2.3684885501861572]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 3.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 15.0, 12.0, 22.0, 29.0, 29.0, 24.0, 28.0, 35.0, 30.0, 38.0, 37.0, 31.0, 33.0, 34.0, 46.0, 40.0, 37.0, 42.0, 38.0, 35.0, 31.0, 35.0, 28.0, 28.0, 21.0, 31.0, 12.0, 13.0, 12.0, 10.0, 16.0, 11.0, 12.0, 10.0, 2.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2592148780822754, -1.2190552949905396, -1.1788957118988037, -1.1387361288070679, -1.098576545715332, -1.0584168434143066, -1.0182572603225708, -0.978097677230835, -0.9379380941390991, -0.8977785110473633, -0.8576189279556274, -0.8174592852592468, -0.777299702167511, -0.7371401190757751, -0.6969804763793945, -0.6568208932876587, -0.6166613101959229, -0.576501727104187, -0.5363421440124512, -0.49618250131607056, -0.4560229182243347, -0.4158633351325989, -0.37570372223854065, -0.3355441093444824, -0.2953845262527466, -0.25522494316101074, -0.21506533026695251, -0.17490573227405548, -0.13474613428115845, -0.09458653628826141, -0.05442693829536438, -0.014267325401306152, 0.025892257690429688, 0.06605185568332672, 0.10621145367622375, 0.1463710516691208, 0.18653064966201782, 0.22669024765491486, 0.2668498456478119, 0.3070094585418701, 0.34716904163360596, 0.3873286247253418, 0.4274882376194, 0.46764785051345825, 0.5078074336051941, 0.5479670166969299, 0.5881266593933105, 0.6282862424850464, 0.6684458255767822, 0.7086054086685181, 0.7487649917602539, 0.7889246344566345, 0.8290842175483704, 0.8692438006401062, 0.9094034433364868, 0.9495630264282227, 0.9897226095199585, 1.0298821926116943, 1.0700417757034302, 1.110201358795166, 1.1503610610961914, 1.1905206441879272, 1.230680227279663, 1.270839810371399, 1.3109993934631348]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 8.0, 10.0, 23.0, 29.0, 54.0, 75.0, 126.0, 178.0, 292.0, 452.0, 695.0, 1067.0, 1650.0, 2535.0, 3781.0, 5759.0, 8684.0, 12999.0, 19103.0, 27869.0, 38388.0, 52981.0, 69031.0, 84784.0, 98282.0, 105789.0, 104631.0, 96323.0, 82034.0, 65992.0, 49762.0, 36587.0, 25666.0, 17795.0, 12116.0, 7964.0, 5170.0, 3386.0, 2239.0, 1430.0, 974.0, 638.0, 414.0, 273.0, 177.0, 131.0, 65.0, 60.0, 36.0, 13.0, 8.0, 10.0, 14.0, 8.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1064453125, -1.0717620849609375, -1.037078857421875, -1.0023956298828125, -0.96771240234375, -0.9330291748046875, -0.898345947265625, -0.8636627197265625, -0.8289794921875, -0.7942962646484375, -0.759613037109375, -0.7249298095703125, -0.69024658203125, -0.6555633544921875, -0.620880126953125, -0.5861968994140625, -0.551513671875, -0.5168304443359375, -0.482147216796875, -0.4474639892578125, -0.41278076171875, -0.3780975341796875, -0.343414306640625, -0.3087310791015625, -0.2740478515625, -0.2393646240234375, -0.204681396484375, -0.1699981689453125, -0.13531494140625, -0.1006317138671875, -0.065948486328125, -0.0312652587890625, 0.00341796875, 0.0381011962890625, 0.072784423828125, 0.1074676513671875, 0.14215087890625, 0.1768341064453125, 0.211517333984375, 0.2462005615234375, 0.2808837890625, 0.3155670166015625, 0.350250244140625, 0.3849334716796875, 0.41961669921875, 0.4542999267578125, 0.488983154296875, 0.5236663818359375, 0.558349609375, 0.5930328369140625, 0.627716064453125, 0.6623992919921875, 0.69708251953125, 0.7317657470703125, 0.766448974609375, 0.8011322021484375, 0.8358154296875, 0.8704986572265625, 0.905181884765625, 0.9398651123046875, 0.97454833984375, 1.0092315673828125, 1.043914794921875, 1.0785980224609375, 1.11328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 7.0, 2.0, 5.0, 9.0, 7.0, 12.0, 16.0, 8.0, 18.0, 13.0, 18.0, 25.0, 13.0, 33.0, 36.0, 38.0, 26.0, 30.0, 42.0, 38.0, 31.0, 33.0, 33.0, 40.0, 44.0, 33.0, 45.0, 38.0, 28.0, 40.0, 28.0, 30.0, 21.0, 21.0, 25.0, 16.0, 8.0, 19.0, 12.0, 9.0, 10.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2978515625, -1.257110595703125, -1.21636962890625, -1.175628662109375, -1.1348876953125, -1.094146728515625, -1.05340576171875, -1.012664794921875, -0.971923828125, -0.931182861328125, -0.89044189453125, -0.849700927734375, -0.8089599609375, -0.768218994140625, -0.72747802734375, -0.686737060546875, -0.64599609375, -0.605255126953125, -0.56451416015625, -0.523773193359375, -0.4830322265625, -0.442291259765625, -0.40155029296875, -0.360809326171875, -0.320068359375, -0.279327392578125, -0.23858642578125, -0.197845458984375, -0.1571044921875, -0.116363525390625, -0.07562255859375, -0.034881591796875, 0.005859375, 0.046600341796875, 0.08734130859375, 0.128082275390625, 0.1688232421875, 0.209564208984375, 0.25030517578125, 0.291046142578125, 0.331787109375, 0.372528076171875, 0.41326904296875, 0.454010009765625, 0.4947509765625, 0.535491943359375, 0.57623291015625, 0.616973876953125, 0.65771484375, 0.698455810546875, 0.73919677734375, 0.779937744140625, 0.8206787109375, 0.861419677734375, 0.90216064453125, 0.942901611328125, 0.983642578125, 1.024383544921875, 1.06512451171875, 1.105865478515625, 1.1466064453125, 1.187347412109375, 1.22808837890625, 1.268829345703125, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 10.0, 22.0, 27.0, 39.0, 58.0, 90.0, 129.0, 171.0, 314.0, 443.0, 744.0, 1100.0, 1716.0, 2556.0, 3836.0, 6056.0, 8960.0, 13489.0, 19406.0, 27707.0, 38876.0, 52246.0, 68236.0, 83640.0, 96278.0, 103027.0, 102151.0, 94264.0, 82405.0, 66456.0, 51550.0, 37958.0, 27116.0, 19018.0, 12697.0, 8868.0, 5848.0, 3931.0, 2471.0, 1627.0, 1030.0, 683.0, 464.0, 296.0, 204.0, 121.0, 78.0, 45.0, 48.0, 21.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0], "bins": [-1.1064453125, -1.0728759765625, -1.039306640625, -1.0057373046875, -0.97216796875, -0.9385986328125, -0.905029296875, -0.8714599609375, -0.837890625, -0.8043212890625, -0.770751953125, -0.7371826171875, -0.70361328125, -0.6700439453125, -0.636474609375, -0.6029052734375, -0.5693359375, -0.5357666015625, -0.502197265625, -0.4686279296875, -0.43505859375, -0.4014892578125, -0.367919921875, -0.3343505859375, -0.30078125, -0.2672119140625, -0.233642578125, -0.2000732421875, -0.16650390625, -0.1329345703125, -0.099365234375, -0.0657958984375, -0.0322265625, 0.0013427734375, 0.034912109375, 0.0684814453125, 0.10205078125, 0.1356201171875, 0.169189453125, 0.2027587890625, 0.236328125, 0.2698974609375, 0.303466796875, 0.3370361328125, 0.37060546875, 0.4041748046875, 0.437744140625, 0.4713134765625, 0.5048828125, 0.5384521484375, 0.572021484375, 0.6055908203125, 0.63916015625, 0.6727294921875, 0.706298828125, 0.7398681640625, 0.7734375, 0.8070068359375, 0.840576171875, 0.8741455078125, 0.90771484375, 0.9412841796875, 0.974853515625, 1.0084228515625, 1.0419921875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 15.0, 18.0, 17.0, 12.0, 21.0, 18.0, 22.0, 23.0, 18.0, 36.0, 30.0, 36.0, 39.0, 44.0, 40.0, 34.0, 43.0, 37.0, 35.0, 47.0, 37.0, 43.0, 49.0, 33.0, 30.0, 23.0, 38.0, 14.0, 24.0, 24.0, 14.0, 10.0, 11.0, 10.0, 3.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7753677368164062, -0.7480010986328125, -0.7206344604492188, -0.693267822265625, -0.6659011840820312, -0.6385345458984375, -0.6111679077148438, -0.58380126953125, -0.5564346313476562, -0.5290679931640625, -0.5017013549804688, -0.474334716796875, -0.44696807861328125, -0.4196014404296875, -0.39223480224609375, -0.3648681640625, -0.33750152587890625, -0.3101348876953125, -0.28276824951171875, -0.255401611328125, -0.22803497314453125, -0.2006683349609375, -0.17330169677734375, -0.14593505859375, -0.11856842041015625, -0.0912017822265625, -0.06383514404296875, -0.036468505859375, -0.00910186767578125, 0.0182647705078125, 0.04563140869140625, 0.072998046875, 0.10036468505859375, 0.1277313232421875, 0.15509796142578125, 0.182464599609375, 0.20983123779296875, 0.2371978759765625, 0.26456451416015625, 0.29193115234375, 0.31929779052734375, 0.3466644287109375, 0.37403106689453125, 0.401397705078125, 0.42876434326171875, 0.4561309814453125, 0.48349761962890625, 0.5108642578125, 0.5382308959960938, 0.5655975341796875, 0.5929641723632812, 0.620330810546875, 0.6476974487304688, 0.6750640869140625, 0.7024307250976562, 0.72979736328125, 0.7571640014648438, 0.7845306396484375, 0.8118972778320312, 0.839263916015625, 0.8666305541992188, 0.8939971923828125, 0.9213638305664062, 0.94873046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 9.0, 13.0, 31.0, 42.0, 61.0, 91.0, 178.0, 238.0, 365.0, 583.0, 965.0, 1513.0, 2474.0, 4178.0, 7039.0, 12463.0, 21956.0, 39284.0, 68589.0, 112228.0, 163587.0, 187293.0, 160961.0, 109378.0, 66472.0, 37843.0, 21280.0, 12082.0, 6906.0, 4105.0, 2366.0, 1444.0, 928.0, 562.0, 376.0, 210.0, 155.0, 95.0, 72.0, 41.0, 29.0, 20.0, 12.0, 15.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.92236328125, -0.894805908203125, -0.86724853515625, -0.839691162109375, -0.8121337890625, -0.784576416015625, -0.75701904296875, -0.729461669921875, -0.701904296875, -0.674346923828125, -0.64678955078125, -0.619232177734375, -0.5916748046875, -0.564117431640625, -0.53656005859375, -0.509002685546875, -0.4814453125, -0.453887939453125, -0.42633056640625, -0.398773193359375, -0.3712158203125, -0.343658447265625, -0.31610107421875, -0.288543701171875, -0.260986328125, -0.233428955078125, -0.20587158203125, -0.178314208984375, -0.1507568359375, -0.123199462890625, -0.09564208984375, -0.068084716796875, -0.04052734375, -0.012969970703125, 0.01458740234375, 0.042144775390625, 0.0697021484375, 0.097259521484375, 0.12481689453125, 0.152374267578125, 0.179931640625, 0.207489013671875, 0.23504638671875, 0.262603759765625, 0.2901611328125, 0.317718505859375, 0.34527587890625, 0.372833251953125, 0.400390625, 0.427947998046875, 0.45550537109375, 0.483062744140625, 0.5106201171875, 0.538177490234375, 0.56573486328125, 0.593292236328125, 0.620849609375, 0.648406982421875, 0.67596435546875, 0.703521728515625, 0.7310791015625, 0.758636474609375, 0.78619384765625, 0.813751220703125, 0.84130859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 12.0, 17.0, 25.0, 27.0, 29.0, 28.0, 27.0, 45.0, 38.0, 42.0, 42.0, 62.0, 62.0, 72.0, 48.0, 51.0, 43.0, 48.0, 47.0, 32.0, 29.0, 33.0, 23.0, 18.0, 14.0, 14.0, 12.0, 8.0, 5.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.390975952148438e-05, -7.155537605285645e-05, -6.920099258422852e-05, -6.684660911560059e-05, -6.449222564697266e-05, -6.213784217834473e-05, -5.97834587097168e-05, -5.742907524108887e-05, -5.507469177246094e-05, -5.272030830383301e-05, -5.036592483520508e-05, -4.801154136657715e-05, -4.565715789794922e-05, -4.330277442932129e-05, -4.094839096069336e-05, -3.859400749206543e-05, -3.62396240234375e-05, -3.388524055480957e-05, -3.153085708618164e-05, -2.917647361755371e-05, -2.682209014892578e-05, -2.446770668029785e-05, -2.2113323211669922e-05, -1.9758939743041992e-05, -1.7404556274414062e-05, -1.5050172805786133e-05, -1.2695789337158203e-05, -1.0341405868530273e-05, -7.987022399902344e-06, -5.632638931274414e-06, -3.2782554626464844e-06, -9.238719940185547e-07, 1.430511474609375e-06, 3.7848949432373047e-06, 6.139278411865234e-06, 8.493661880493164e-06, 1.0848045349121094e-05, 1.3202428817749023e-05, 1.5556812286376953e-05, 1.7911195755004883e-05, 2.0265579223632812e-05, 2.2619962692260742e-05, 2.4974346160888672e-05, 2.73287296295166e-05, 2.968311309814453e-05, 3.203749656677246e-05, 3.439188003540039e-05, 3.674626350402832e-05, 3.910064697265625e-05, 4.145503044128418e-05, 4.380941390991211e-05, 4.616379737854004e-05, 4.851818084716797e-05, 5.08725643157959e-05, 5.322694778442383e-05, 5.558133125305176e-05, 5.793571472167969e-05, 6.029009819030762e-05, 6.264448165893555e-05, 6.499886512756348e-05, 6.73532485961914e-05, 6.970763206481934e-05, 7.206201553344727e-05, 7.44163990020752e-05, 7.677078247070312e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 16.0, 20.0, 27.0, 49.0, 58.0, 104.0, 154.0, 224.0, 366.0, 613.0, 1018.0, 1768.0, 2840.0, 4807.0, 8372.0, 14733.0, 25419.0, 44505.0, 75655.0, 118628.0, 159821.0, 174986.0, 149433.0, 106494.0, 66374.0, 39158.0, 22162.0, 12750.0, 7421.0, 4107.0, 2534.0, 1479.0, 924.0, 536.0, 363.0, 232.0, 154.0, 92.0, 55.0, 35.0, 18.0, 18.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.84765625, -0.82147216796875, -0.7952880859375, -0.76910400390625, -0.742919921875, -0.71673583984375, -0.6905517578125, -0.66436767578125, -0.63818359375, -0.61199951171875, -0.5858154296875, -0.55963134765625, -0.533447265625, -0.50726318359375, -0.4810791015625, -0.45489501953125, -0.4287109375, -0.40252685546875, -0.3763427734375, -0.35015869140625, -0.323974609375, -0.29779052734375, -0.2716064453125, -0.24542236328125, -0.21923828125, -0.19305419921875, -0.1668701171875, -0.14068603515625, -0.114501953125, -0.08831787109375, -0.0621337890625, -0.03594970703125, -0.009765625, 0.01641845703125, 0.0426025390625, 0.06878662109375, 0.094970703125, 0.12115478515625, 0.1473388671875, 0.17352294921875, 0.19970703125, 0.22589111328125, 0.2520751953125, 0.27825927734375, 0.304443359375, 0.33062744140625, 0.3568115234375, 0.38299560546875, 0.4091796875, 0.43536376953125, 0.4615478515625, 0.48773193359375, 0.513916015625, 0.54010009765625, 0.5662841796875, 0.59246826171875, 0.61865234375, 0.64483642578125, 0.6710205078125, 0.69720458984375, 0.723388671875, 0.74957275390625, 0.7757568359375, 0.80194091796875, 0.828125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 10.0, 17.0, 12.0, 22.0, 25.0, 27.0, 44.0, 46.0, 56.0, 54.0, 65.0, 75.0, 68.0, 78.0, 64.0, 67.0, 43.0, 42.0, 35.0, 27.0, 22.0, 17.0, 22.0, 13.0, 11.0, 3.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38722991943359375, -0.3760223388671875, -0.36481475830078125, -0.353607177734375, -0.34239959716796875, -0.3311920166015625, -0.31998443603515625, -0.30877685546875, -0.29756927490234375, -0.2863616943359375, -0.27515411376953125, -0.263946533203125, -0.25273895263671875, -0.2415313720703125, -0.23032379150390625, -0.2191162109375, -0.20790863037109375, -0.1967010498046875, -0.18549346923828125, -0.174285888671875, -0.16307830810546875, -0.1518707275390625, -0.14066314697265625, -0.12945556640625, -0.11824798583984375, -0.1070404052734375, -0.09583282470703125, -0.084625244140625, -0.07341766357421875, -0.0622100830078125, -0.05100250244140625, -0.039794921875, -0.02858734130859375, -0.0173797607421875, -0.00617218017578125, 0.005035400390625, 0.01624298095703125, 0.0274505615234375, 0.03865814208984375, 0.04986572265625, 0.06107330322265625, 0.0722808837890625, 0.08348846435546875, 0.094696044921875, 0.10590362548828125, 0.1171112060546875, 0.12831878662109375, 0.1395263671875, 0.15073394775390625, 0.1619415283203125, 0.17314910888671875, 0.184356689453125, 0.19556427001953125, 0.2067718505859375, 0.21797943115234375, 0.22918701171875, 0.24039459228515625, 0.2516021728515625, 0.26280975341796875, 0.274017333984375, 0.28522491455078125, 0.2964324951171875, 0.30764007568359375, 0.31884765625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 11.0, 7.0, 12.0, 19.0, 26.0, 30.0, 35.0, 33.0, 33.0, 57.0, 59.0, 64.0, 63.0, 70.0, 61.0, 64.0, 71.0, 52.0, 47.0, 38.0, 30.0, 23.0, 17.0, 18.0, 23.0, 9.0, 4.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96602463722229, -1.89926016330719, -1.8324956893920898, -1.7657313346862793, -1.6989668607711792, -1.632202386856079, -1.5654380321502686, -1.4986735582351685, -1.4319090843200684, -1.3651446104049683, -1.2983801364898682, -1.2316157817840576, -1.1648513078689575, -1.0980868339538574, -1.0313224792480469, -0.9645580053329468, -0.8977935314178467, -0.8310290575027466, -0.7642646431922913, -0.6975002288818359, -0.6307357549667358, -0.5639712810516357, -0.4972068667411804, -0.4304424226284027, -0.363677978515625, -0.2969135344028473, -0.23014909029006958, -0.16338464617729187, -0.09662020206451416, -0.02985575795173645, 0.03690868616104126, 0.10367313027381897, 0.17043781280517578, 0.2372022569179535, 0.3039667010307312, 0.3707311451435089, 0.4374955892562866, 0.5042600631713867, 0.571024477481842, 0.6377888917922974, 0.7045533657073975, 0.7713178396224976, 0.8380822539329529, 0.9048466682434082, 0.9716111421585083, 1.0383756160736084, 1.105139970779419, 1.171904444694519, 1.2386689186096191, 1.3054333925247192, 1.3721978664398193, 1.4389622211456299, 1.50572669506073, 1.57249116897583, 1.6392555236816406, 1.7060199975967407, 1.7727844715118408, 1.839548945426941, 1.906313419342041, 1.9730777740478516, 2.039842128753662, 2.1066067218780518, 2.1733710765838623, 2.240135669708252, 2.3069000244140625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 1.0, 5.0, 2.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 9.0, 8.0, 12.0, 9.0, 14.0, 17.0, 17.0, 29.0, 22.0, 20.0, 30.0, 22.0, 25.0, 29.0, 36.0, 37.0, 30.0, 24.0, 41.0, 46.0, 43.0, 31.0, 30.0, 40.0, 40.0, 33.0, 32.0, 33.0, 18.0, 14.0, 23.0, 16.0, 25.0, 13.0, 12.0, 16.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1299009323120117, -1.0913114547729492, -1.0527218580245972, -1.0141323804855347, -0.9755429029464722, -0.9369533658027649, -0.8983638286590576, -0.8597743511199951, -0.8211848139762878, -0.7825952768325806, -0.7440057992935181, -0.7054162621498108, -0.6668267250061035, -0.628237247467041, -0.5896477103233337, -0.5510581731796265, -0.512468695640564, -0.4738791882991791, -0.4352896809577942, -0.3967001438140869, -0.358110636472702, -0.31952112913131714, -0.28093159198760986, -0.24234208464622498, -0.2037525773048401, -0.1651630699634552, -0.12657354772090912, -0.08798403292894363, -0.04939451813697815, -0.010805010795593262, 0.02778451144695282, 0.0663740336894989, 0.10496342182159424, 0.14355292916297913, 0.1821424514055252, 0.2207319736480713, 0.2593214809894562, 0.29791098833084106, 0.33650052547454834, 0.3750900328159332, 0.4136795401573181, 0.452269047498703, 0.4908585548400879, 0.5294480919837952, 0.5680376291275024, 0.6066271066665649, 0.6452166438102722, 0.6838061809539795, 0.722395658493042, 0.7609851956367493, 0.7995746731758118, 0.838164210319519, 0.8767536878585815, 0.9153432250022888, 0.9539327621459961, 0.9925222396850586, 1.031111717224121, 1.0697011947631836, 1.1082907915115356, 1.1468802690505981, 1.1854697465896606, 1.2240593433380127, 1.2626488208770752, 1.3012382984161377, 1.3398278951644897]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 11.0, 22.0, 35.0, 56.0, 97.0, 163.0, 267.0, 412.0, 617.0, 1047.0, 1675.0, 2741.0, 4423.0, 7275.0, 11679.0, 19559.0, 31746.0, 52151.0, 84917.0, 136164.0, 215054.0, 320890.0, 445944.0, 551682.0, 584934.0, 526040.0, 409265.0, 287414.0, 189352.0, 119317.0, 73346.0, 45020.0, 27438.0, 16638.0, 10245.0, 6144.0, 3970.0, 2380.0, 1519.0, 949.0, 625.0, 398.0, 268.0, 156.0, 81.0, 64.0, 39.0, 22.0, 18.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.0457611083984375, -1.007537841796875, -0.9693145751953125, -0.93109130859375, -0.8928680419921875, -0.854644775390625, -0.8164215087890625, -0.7781982421875, -0.7399749755859375, -0.701751708984375, -0.6635284423828125, -0.62530517578125, -0.5870819091796875, -0.548858642578125, -0.5106353759765625, -0.472412109375, -0.4341888427734375, -0.395965576171875, -0.3577423095703125, -0.31951904296875, -0.2812957763671875, -0.243072509765625, -0.2048492431640625, -0.1666259765625, -0.1284027099609375, -0.090179443359375, -0.0519561767578125, -0.01373291015625, 0.0244903564453125, 0.062713623046875, 0.1009368896484375, 0.13916015625, 0.1773834228515625, 0.215606689453125, 0.2538299560546875, 0.29205322265625, 0.3302764892578125, 0.368499755859375, 0.4067230224609375, 0.4449462890625, 0.4831695556640625, 0.521392822265625, 0.5596160888671875, 0.59783935546875, 0.6360626220703125, 0.674285888671875, 0.7125091552734375, 0.750732421875, 0.7889556884765625, 0.827178955078125, 0.8654022216796875, 0.90362548828125, 0.9418487548828125, 0.980072021484375, 1.0182952880859375, 1.0565185546875, 1.0947418212890625, 1.132965087890625, 1.1711883544921875, 1.20941162109375, 1.2476348876953125, 1.285858154296875, 1.3240814208984375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 11.0, 17.0, 21.0, 18.0, 16.0, 24.0, 27.0, 33.0, 26.0, 30.0, 40.0, 44.0, 41.0, 32.0, 40.0, 50.0, 46.0, 38.0, 39.0, 36.0, 48.0, 39.0, 33.0, 31.0, 18.0, 24.0, 22.0, 20.0, 21.0, 19.0, 12.0, 8.0, 5.0, 9.0, 11.0, 4.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0205078125, -0.987518310546875, -0.95452880859375, -0.921539306640625, -0.8885498046875, -0.855560302734375, -0.82257080078125, -0.789581298828125, -0.756591796875, -0.723602294921875, -0.69061279296875, -0.657623291015625, -0.6246337890625, -0.591644287109375, -0.55865478515625, -0.525665283203125, -0.49267578125, -0.459686279296875, -0.42669677734375, -0.393707275390625, -0.3607177734375, -0.327728271484375, -0.29473876953125, -0.261749267578125, -0.228759765625, -0.195770263671875, -0.16278076171875, -0.129791259765625, -0.0968017578125, -0.063812255859375, -0.03082275390625, 0.002166748046875, 0.03515625, 0.068145751953125, 0.10113525390625, 0.134124755859375, 0.1671142578125, 0.200103759765625, 0.23309326171875, 0.266082763671875, 0.299072265625, 0.332061767578125, 0.36505126953125, 0.398040771484375, 0.4310302734375, 0.464019775390625, 0.49700927734375, 0.529998779296875, 0.56298828125, 0.595977783203125, 0.62896728515625, 0.661956787109375, 0.6949462890625, 0.727935791015625, 0.76092529296875, 0.793914794921875, 0.826904296875, 0.859893798828125, 0.89288330078125, 0.925872802734375, 0.9588623046875, 0.991851806640625, 1.02484130859375, 1.057830810546875, 1.0908203125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 7.0, 8.0, 10.0, 21.0, 33.0, 42.0, 81.0, 86.0, 161.0, 251.0, 405.0, 686.0, 1126.0, 1752.0, 2789.0, 4616.0, 7535.0, 12585.0, 20347.0, 33214.0, 53900.0, 85864.0, 132855.0, 197985.0, 282884.0, 376772.0, 460876.0, 508345.0, 497358.0, 434073.0, 344207.0, 251626.0, 174302.0, 115185.0, 73336.0, 45993.0, 28355.0, 17249.0, 10592.0, 6422.0, 3939.0, 2386.0, 1518.0, 959.0, 563.0, 398.0, 211.0, 131.0, 89.0, 68.0, 40.0, 15.0, 19.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.070556640625, -1.03466796875, -0.998779296875, -0.962890625, -0.927001953125, -0.89111328125, -0.855224609375, -0.8193359375, -0.783447265625, -0.74755859375, -0.711669921875, -0.67578125, -0.639892578125, -0.60400390625, -0.568115234375, -0.5322265625, -0.496337890625, -0.46044921875, -0.424560546875, -0.388671875, -0.352783203125, -0.31689453125, -0.281005859375, -0.2451171875, -0.209228515625, -0.17333984375, -0.137451171875, -0.1015625, -0.065673828125, -0.02978515625, 0.006103515625, 0.0419921875, 0.077880859375, 0.11376953125, 0.149658203125, 0.185546875, 0.221435546875, 0.25732421875, 0.293212890625, 0.3291015625, 0.364990234375, 0.40087890625, 0.436767578125, 0.47265625, 0.508544921875, 0.54443359375, 0.580322265625, 0.6162109375, 0.652099609375, 0.68798828125, 0.723876953125, 0.759765625, 0.795654296875, 0.83154296875, 0.867431640625, 0.9033203125, 0.939208984375, 0.97509765625, 1.010986328125, 1.046875, 1.082763671875, 1.11865234375, 1.154541015625, 1.1904296875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 6.0, 11.0, 12.0, 17.0, 34.0, 34.0, 33.0, 42.0, 49.0, 46.0, 72.0, 80.0, 107.0, 120.0, 154.0, 151.0, 166.0, 190.0, 192.0, 201.0, 213.0, 230.0, 240.0, 201.0, 206.0, 165.0, 164.0, 153.0, 132.0, 119.0, 100.0, 88.0, 67.0, 49.0, 58.0, 34.0, 23.0, 25.0, 18.0, 9.0, 10.0, 12.0, 11.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.480224609375, -0.4644126892089844, -0.44860076904296875, -0.4327888488769531, -0.4169769287109375, -0.4011650085449219, -0.38535308837890625, -0.3695411682128906, -0.353729248046875, -0.3379173278808594, -0.32210540771484375, -0.3062934875488281, -0.2904815673828125, -0.2746696472167969, -0.25885772705078125, -0.24304580688476562, -0.22723388671875, -0.21142196655273438, -0.19561004638671875, -0.17979812622070312, -0.1639862060546875, -0.14817428588867188, -0.13236236572265625, -0.11655044555664062, -0.100738525390625, -0.08492660522460938, -0.06911468505859375, -0.053302764892578125, -0.0374908447265625, -0.021678924560546875, -0.00586700439453125, 0.009944915771484375, 0.0257568359375, 0.041568756103515625, 0.05738067626953125, 0.07319259643554688, 0.0890045166015625, 0.10481643676757812, 0.12062835693359375, 0.13644027709960938, 0.152252197265625, 0.16806411743164062, 0.18387603759765625, 0.19968795776367188, 0.2154998779296875, 0.23131179809570312, 0.24712371826171875, 0.2629356384277344, 0.27874755859375, 0.2945594787597656, 0.31037139892578125, 0.3261833190917969, 0.3419952392578125, 0.3578071594238281, 0.37361907958984375, 0.3894309997558594, 0.405242919921875, 0.4210548400878906, 0.43686676025390625, 0.4526786804199219, 0.4684906005859375, 0.4843025207519531, 0.5001144409179688, 0.5159263610839844, 0.53173828125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 7.0, 9.0, 9.0, 10.0, 14.0, 18.0, 24.0, 23.0, 32.0, 37.0, 44.0, 46.0, 51.0, 66.0, 67.0, 52.0, 71.0, 53.0, 52.0, 37.0, 42.0, 38.0, 35.0, 31.0, 27.0, 20.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 4.0, 8.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5019704103469849, -1.4478763341903687, -1.393782377243042, -1.3396883010864258, -1.2855942249298096, -1.231500267982483, -1.1774061918258667, -1.12331223487854, -1.0692181587219238, -1.0151240825653076, -0.961030125617981, -0.9069360494613647, -0.8528420329093933, -0.7987480163574219, -0.7446539402008057, -0.6905599236488342, -0.6364659070968628, -0.5823718905448914, -0.5282778739929199, -0.4741837978363037, -0.4200897812843323, -0.36599576473236084, -0.311901718378067, -0.2578076720237732, -0.20371365547180176, -0.14961962401866913, -0.0955255925655365, -0.04143156111240387, 0.01266247034072876, 0.0667564868927002, 0.12085053324699402, 0.17494457960128784, 0.22903847694396973, 0.28313249349594116, 0.337226539850235, 0.3913205862045288, 0.44541460275650024, 0.4995086193084717, 0.5536026954650879, 0.6076967120170593, 0.6617907285690308, 0.7158847451210022, 0.7699787616729736, 0.8240728378295898, 0.8781668543815613, 0.9322608709335327, 0.9863549470901489, 1.0404489040374756, 1.0945429801940918, 1.148637056350708, 1.2027310132980347, 1.2568250894546509, 1.3109190464019775, 1.3650131225585938, 1.41910719871521, 1.4732012748718262, 1.5272952318191528, 1.581389307975769, 1.6354832649230957, 1.689577341079712, 1.7436714172363281, 1.7977653741836548, 1.851859450340271, 1.9059534072875977, 1.9600474834442139]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 14.0, 12.0, 4.0, 7.0, 9.0, 20.0, 15.0, 15.0, 21.0, 20.0, 38.0, 21.0, 32.0, 28.0, 28.0, 35.0, 37.0, 38.0, 42.0, 44.0, 29.0, 30.0, 35.0, 37.0, 34.0, 27.0, 29.0, 34.0, 34.0, 22.0, 25.0, 23.0, 23.0, 20.0, 11.0, 15.0, 16.0, 17.0, 16.0, 6.0, 6.0, 4.0, 8.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.111849308013916, -1.0768101215362549, -1.0417709350585938, -1.0067317485809326, -0.9716925621032715, -0.9366533756256104, -0.9016141295433044, -0.8665749430656433, -0.8315357565879822, -0.796496570110321, -0.7614573836326599, -0.7264181971549988, -0.6913789510726929, -0.6563397645950317, -0.6213005781173706, -0.5862613916397095, -0.5512222051620483, -0.5161830186843872, -0.4811438322067261, -0.44610461592674255, -0.4110654294490814, -0.3760262429714203, -0.34098702669143677, -0.30594784021377563, -0.2709086537361145, -0.23586946725845337, -0.20083026587963104, -0.16579106450080872, -0.13075187802314758, -0.09571269154548645, -0.060673490166664124, -0.025634288787841797, 0.009405016899108887, 0.044444210827350616, 0.07948340475559235, 0.11452259868383408, 0.1495617926120758, 0.18460097908973694, 0.21964018046855927, 0.2546793818473816, 0.2897185683250427, 0.32475775480270386, 0.359796941280365, 0.3948361575603485, 0.42987534403800964, 0.4649145305156708, 0.4999537467956543, 0.5349929332733154, 0.5700321197509766, 0.6050713062286377, 0.6401104927062988, 0.67514967918396, 0.7101888656616211, 0.7452280521392822, 0.7802672982215881, 0.8153064846992493, 0.8503456711769104, 0.8853848576545715, 0.9204240441322327, 0.9554632306098938, 0.9905024766921997, 1.0255416631698608, 1.060580849647522, 1.095620036125183, 1.1306592226028442]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 1.0, 10.0, 8.0, 15.0, 21.0, 24.0, 22.0, 54.0, 63.0, 88.0, 141.0, 198.0, 277.0, 439.0, 731.0, 1047.0, 1769.0, 2715.0, 4535.0, 7041.0, 11846.0, 19658.0, 32748.0, 53931.0, 87933.0, 135080.0, 176522.0, 173044.0, 127677.0, 82773.0, 50333.0, 30352.0, 18346.0, 11088.0, 6773.0, 4067.0, 2531.0, 1661.0, 1032.0, 662.0, 406.0, 300.0, 183.0, 128.0, 91.0, 45.0, 59.0, 29.0, 19.0, 11.0, 9.0, 10.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.416748046875, -0.40234375, -0.387939453125, -0.37353515625, -0.359130859375, -0.3447265625, -0.330322265625, -0.31591796875, -0.301513671875, -0.287109375, -0.272705078125, -0.25830078125, -0.243896484375, -0.2294921875, -0.215087890625, -0.20068359375, -0.186279296875, -0.171875, -0.157470703125, -0.14306640625, -0.128662109375, -0.1142578125, -0.099853515625, -0.08544921875, -0.071044921875, -0.056640625, -0.042236328125, -0.02783203125, -0.013427734375, 0.0009765625, 0.015380859375, 0.02978515625, 0.044189453125, 0.05859375, 0.072998046875, 0.08740234375, 0.101806640625, 0.1162109375, 0.130615234375, 0.14501953125, 0.159423828125, 0.173828125, 0.188232421875, 0.20263671875, 0.217041015625, 0.2314453125, 0.245849609375, 0.26025390625, 0.274658203125, 0.2890625, 0.303466796875, 0.31787109375, 0.332275390625, 0.3466796875, 0.361083984375, 0.37548828125, 0.389892578125, 0.404296875, 0.418701171875, 0.43310546875, 0.447509765625, 0.4619140625, 0.476318359375, 0.49072265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 11.0, 12.0, 14.0, 10.0, 16.0, 12.0, 18.0, 33.0, 23.0, 27.0, 36.0, 27.0, 27.0, 46.0, 35.0, 41.0, 43.0, 40.0, 38.0, 45.0, 30.0, 42.0, 42.0, 36.0, 31.0, 25.0, 32.0, 23.0, 31.0, 20.0, 24.0, 12.0, 19.0, 11.0, 13.0, 7.0, 13.0, 6.0, 2.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2594757080078125, -1.219146728515625, -1.1788177490234375, -1.13848876953125, -1.0981597900390625, -1.057830810546875, -1.0175018310546875, -0.9771728515625, -0.9368438720703125, -0.896514892578125, -0.8561859130859375, -0.81585693359375, -0.7755279541015625, -0.735198974609375, -0.6948699951171875, -0.654541015625, -0.6142120361328125, -0.573883056640625, -0.5335540771484375, -0.49322509765625, -0.4528961181640625, -0.412567138671875, -0.3722381591796875, -0.3319091796875, -0.2915802001953125, -0.251251220703125, -0.2109222412109375, -0.17059326171875, -0.1302642822265625, -0.089935302734375, -0.0496063232421875, -0.00927734375, 0.0310516357421875, 0.071380615234375, 0.1117095947265625, 0.15203857421875, 0.1923675537109375, 0.232696533203125, 0.2730255126953125, 0.3133544921875, 0.3536834716796875, 0.394012451171875, 0.4343414306640625, 0.47467041015625, 0.5149993896484375, 0.555328369140625, 0.5956573486328125, 0.635986328125, 0.6763153076171875, 0.716644287109375, 0.7569732666015625, 0.79730224609375, 0.8376312255859375, 0.877960205078125, 0.9182891845703125, 0.9586181640625, 0.9989471435546875, 1.039276123046875, 1.0796051025390625, 1.11993408203125, 1.1602630615234375, 1.200592041015625, 1.2409210205078125, 1.28125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 10.0, 10.0, 20.0, 36.0, 42.0, 66.0, 105.0, 174.0, 210.0, 367.0, 569.0, 1026.0, 1787.0, 3248.0, 6200.0, 11638.0, 23402.0, 47637.0, 96681.0, 184208.0, 259963.0, 198395.0, 106425.0, 52593.0, 25850.0, 12901.0, 6659.0, 3507.0, 1894.0, 1119.0, 631.0, 464.0, 264.0, 163.0, 99.0, 68.0, 48.0, 26.0, 20.0, 14.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6123046875, -0.593505859375, -0.57470703125, -0.555908203125, -0.537109375, -0.518310546875, -0.49951171875, -0.480712890625, -0.4619140625, -0.443115234375, -0.42431640625, -0.405517578125, -0.38671875, -0.367919921875, -0.34912109375, -0.330322265625, -0.3115234375, -0.292724609375, -0.27392578125, -0.255126953125, -0.236328125, -0.217529296875, -0.19873046875, -0.179931640625, -0.1611328125, -0.142333984375, -0.12353515625, -0.104736328125, -0.0859375, -0.067138671875, -0.04833984375, -0.029541015625, -0.0107421875, 0.008056640625, 0.02685546875, 0.045654296875, 0.064453125, 0.083251953125, 0.10205078125, 0.120849609375, 0.1396484375, 0.158447265625, 0.17724609375, 0.196044921875, 0.21484375, 0.233642578125, 0.25244140625, 0.271240234375, 0.2900390625, 0.308837890625, 0.32763671875, 0.346435546875, 0.365234375, 0.384033203125, 0.40283203125, 0.421630859375, 0.4404296875, 0.459228515625, 0.47802734375, 0.496826171875, 0.515625, 0.534423828125, 0.55322265625, 0.572021484375, 0.5908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 12.0, 7.0, 17.0, 19.0, 17.0, 26.0, 31.0, 35.0, 34.0, 29.0, 32.0, 39.0, 34.0, 40.0, 41.0, 42.0, 47.0, 42.0, 37.0, 44.0, 51.0, 30.0, 34.0, 34.0, 32.0, 23.0, 18.0, 17.0, 17.0, 21.0, 16.0, 11.0, 7.0, 14.0, 2.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7228012084960938, -0.6951141357421875, -0.6674270629882812, -0.639739990234375, -0.6120529174804688, -0.5843658447265625, -0.5566787719726562, -0.52899169921875, -0.5013046264648438, -0.4736175537109375, -0.44593048095703125, -0.418243408203125, -0.39055633544921875, -0.3628692626953125, -0.33518218994140625, -0.3074951171875, -0.27980804443359375, -0.2521209716796875, -0.22443389892578125, -0.196746826171875, -0.16905975341796875, -0.1413726806640625, -0.11368560791015625, -0.08599853515625, -0.05831146240234375, -0.0306243896484375, -0.00293731689453125, 0.024749755859375, 0.05243682861328125, 0.0801239013671875, 0.10781097412109375, 0.135498046875, 0.16318511962890625, 0.1908721923828125, 0.21855926513671875, 0.246246337890625, 0.27393341064453125, 0.3016204833984375, 0.32930755615234375, 0.35699462890625, 0.38468170166015625, 0.4123687744140625, 0.44005584716796875, 0.467742919921875, 0.49542999267578125, 0.5231170654296875, 0.5508041381835938, 0.5784912109375, 0.6061782836914062, 0.6338653564453125, 0.6615524291992188, 0.689239501953125, 0.7169265747070312, 0.7446136474609375, 0.7723007202148438, 0.79998779296875, 0.8276748657226562, 0.8553619384765625, 0.8830490112304688, 0.910736083984375, 0.9384231567382812, 0.9661102294921875, 0.9937973022460938, 1.021484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 18.0, 21.0, 29.0, 32.0, 45.0, 78.0, 123.0, 131.0, 184.0, 244.0, 346.0, 439.0, 569.0, 871.0, 1205.0, 1694.0, 2662.0, 3800.0, 5977.0, 9812.0, 16993.0, 31692.0, 65999.0, 149403.0, 301991.0, 238409.0, 105710.0, 48787.0, 24321.0, 13262.0, 8045.0, 5030.0, 3163.0, 2192.0, 1452.0, 1065.0, 732.0, 555.0, 368.0, 308.0, 209.0, 185.0, 84.0, 92.0, 64.0, 43.0, 29.0, 26.0, 19.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0], "bins": [-0.2322998046875, -0.22542572021484375, -0.2185516357421875, -0.21167755126953125, -0.204803466796875, -0.19792938232421875, -0.1910552978515625, -0.18418121337890625, -0.17730712890625, -0.17043304443359375, -0.1635589599609375, -0.15668487548828125, -0.149810791015625, -0.14293670654296875, -0.1360626220703125, -0.12918853759765625, -0.122314453125, -0.11544036865234375, -0.1085662841796875, -0.10169219970703125, -0.094818115234375, -0.08794403076171875, -0.0810699462890625, -0.07419586181640625, -0.06732177734375, -0.06044769287109375, -0.0535736083984375, -0.04669952392578125, -0.039825439453125, -0.03295135498046875, -0.0260772705078125, -0.01920318603515625, -0.0123291015625, -0.00545501708984375, 0.0014190673828125, 0.00829315185546875, 0.015167236328125, 0.02204132080078125, 0.0289154052734375, 0.03578948974609375, 0.04266357421875, 0.04953765869140625, 0.0564117431640625, 0.06328582763671875, 0.070159912109375, 0.07703399658203125, 0.0839080810546875, 0.09078216552734375, 0.09765625, 0.10453033447265625, 0.1114044189453125, 0.11827850341796875, 0.125152587890625, 0.13202667236328125, 0.1389007568359375, 0.14577484130859375, 0.15264892578125, 0.15952301025390625, 0.1663970947265625, 0.17327117919921875, 0.180145263671875, 0.18701934814453125, 0.1938934326171875, 0.20076751708984375, 0.2076416015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 9.0, 13.0, 5.0, 13.0, 19.0, 15.0, 26.0, 30.0, 31.0, 39.0, 70.0, 64.0, 76.0, 85.0, 82.0, 72.0, 78.0, 62.0, 53.0, 24.0, 27.0, 24.0, 15.0, 17.0, 10.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.2709369659423828e-05, -2.2079795598983765e-05, -2.14502215385437e-05, -2.0820647478103638e-05, -2.0191073417663574e-05, -1.956149935722351e-05, -1.8931925296783447e-05, -1.8302351236343384e-05, -1.767277717590332e-05, -1.7043203115463257e-05, -1.6413629055023193e-05, -1.578405499458313e-05, -1.5154480934143066e-05, -1.4524906873703003e-05, -1.389533281326294e-05, -1.3265758752822876e-05, -1.2636184692382812e-05, -1.2006610631942749e-05, -1.1377036571502686e-05, -1.0747462511062622e-05, -1.0117888450622559e-05, -9.488314390182495e-06, -8.858740329742432e-06, -8.229166269302368e-06, -7.599592208862305e-06, -6.970018148422241e-06, -6.340444087982178e-06, -5.710870027542114e-06, -5.081295967102051e-06, -4.451721906661987e-06, -3.822147846221924e-06, -3.1925737857818604e-06, -2.562999725341797e-06, -1.9334256649017334e-06, -1.30385160446167e-06, -6.742775440216064e-07, -4.470348358154297e-08, 5.848705768585205e-07, 1.214444637298584e-06, 1.8440186977386475e-06, 2.473592758178711e-06, 3.1031668186187744e-06, 3.732740879058838e-06, 4.362314939498901e-06, 4.991888999938965e-06, 5.621463060379028e-06, 6.251037120819092e-06, 6.880611181259155e-06, 7.510185241699219e-06, 8.139759302139282e-06, 8.769333362579346e-06, 9.39890742301941e-06, 1.0028481483459473e-05, 1.0658055543899536e-05, 1.12876296043396e-05, 1.1917203664779663e-05, 1.2546777725219727e-05, 1.317635178565979e-05, 1.3805925846099854e-05, 1.4435499906539917e-05, 1.506507396697998e-05, 1.5694648027420044e-05, 1.6324222087860107e-05, 1.695379614830017e-05, 1.7583370208740234e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 3.0, 18.0, 12.0, 25.0, 32.0, 40.0, 72.0, 115.0, 160.0, 248.0, 414.0, 642.0, 935.0, 1456.0, 2144.0, 3403.0, 5216.0, 8202.0, 13302.0, 21351.0, 34753.0, 58266.0, 99458.0, 161448.0, 206357.0, 166801.0, 104936.0, 61770.0, 36595.0, 22115.0, 13847.0, 8758.0, 5522.0, 3507.0, 2361.0, 1517.0, 1005.0, 611.0, 377.0, 267.0, 154.0, 114.0, 73.0, 40.0, 38.0, 21.0, 28.0, 7.0, 7.0, 10.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.2200927734375, -0.21372222900390625, -0.2073516845703125, -0.20098114013671875, -0.194610595703125, -0.18824005126953125, -0.1818695068359375, -0.17549896240234375, -0.16912841796875, -0.16275787353515625, -0.1563873291015625, -0.15001678466796875, -0.143646240234375, -0.13727569580078125, -0.1309051513671875, -0.12453460693359375, -0.1181640625, -0.11179351806640625, -0.1054229736328125, -0.09905242919921875, -0.092681884765625, -0.08631134033203125, -0.0799407958984375, -0.07357025146484375, -0.06719970703125, -0.06082916259765625, -0.0544586181640625, -0.04808807373046875, -0.041717529296875, -0.03534698486328125, -0.0289764404296875, -0.02260589599609375, -0.0162353515625, -0.00986480712890625, -0.0034942626953125, 0.00287628173828125, 0.009246826171875, 0.01561737060546875, 0.0219879150390625, 0.02835845947265625, 0.03472900390625, 0.04109954833984375, 0.0474700927734375, 0.05384063720703125, 0.060211181640625, 0.06658172607421875, 0.0729522705078125, 0.07932281494140625, 0.085693359375, 0.09206390380859375, 0.0984344482421875, 0.10480499267578125, 0.111175537109375, 0.11754608154296875, 0.1239166259765625, 0.13028717041015625, 0.13665771484375, 0.14302825927734375, 0.1493988037109375, 0.15576934814453125, 0.162139892578125, 0.16851043701171875, 0.1748809814453125, 0.18125152587890625, 0.1876220703125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 6.0, 14.0, 12.0, 14.0, 26.0, 34.0, 25.0, 36.0, 58.0, 62.0, 73.0, 79.0, 84.0, 93.0, 54.0, 63.0, 51.0, 29.0, 42.0, 37.0, 29.0, 17.0, 16.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0675048828125, -0.0648794174194336, -0.06225395202636719, -0.05962848663330078, -0.057003021240234375, -0.05437755584716797, -0.05175209045410156, -0.049126625061035156, -0.04650115966796875, -0.043875694274902344, -0.04125022888183594, -0.03862476348876953, -0.035999298095703125, -0.03337383270263672, -0.030748367309570312, -0.028122901916503906, -0.0254974365234375, -0.022871971130371094, -0.020246505737304688, -0.01762104034423828, -0.014995574951171875, -0.012370109558105469, -0.009744644165039062, -0.007119178771972656, -0.00449371337890625, -0.0018682479858398438, 0.0007572174072265625, 0.0033826828002929688, 0.006008148193359375, 0.008633613586425781, 0.011259078979492188, 0.013884544372558594, 0.016510009765625, 0.019135475158691406, 0.021760940551757812, 0.02438640594482422, 0.027011871337890625, 0.02963733673095703, 0.03226280212402344, 0.034888267517089844, 0.03751373291015625, 0.040139198303222656, 0.04276466369628906, 0.04539012908935547, 0.048015594482421875, 0.05064105987548828, 0.05326652526855469, 0.055891990661621094, 0.0585174560546875, 0.061142921447753906, 0.06376838684082031, 0.06639385223388672, 0.06901931762695312, 0.07164478302001953, 0.07427024841308594, 0.07689571380615234, 0.07952117919921875, 0.08214664459228516, 0.08477210998535156, 0.08739757537841797, 0.09002304077148438, 0.09264850616455078, 0.09527397155761719, 0.0978994369506836, 0.10052490234375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 10.0, 11.0, 11.0, 19.0, 22.0, 29.0, 35.0, 22.0, 51.0, 42.0, 63.0, 50.0, 69.0, 59.0, 54.0, 65.0, 42.0, 47.0, 49.0, 36.0, 25.0, 34.0, 28.0, 21.0, 16.0, 18.0, 10.0, 11.0, 2.0, 4.0, 3.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4869941473007202, -1.433651328086853, -1.3803086280822754, -1.3269658088684082, -1.273622989654541, -1.2202801704406738, -1.1669373512268066, -1.113594651222229, -1.0602518320083618, -1.0069090127944946, -0.9535662531852722, -0.9002234935760498, -0.8468806743621826, -0.7935378551483154, -0.740195095539093, -0.6868523359298706, -0.6335095167160034, -0.5801666975021362, -0.5268239378929138, -0.473481148481369, -0.4201383590698242, -0.3667955696582794, -0.3134527802467346, -0.2601099908351898, -0.20676720142364502, -0.15342441201210022, -0.10008162260055542, -0.04673883318901062, 0.00660395622253418, 0.05994674563407898, 0.11328953504562378, 0.16663232445716858, 0.21997511386871338, 0.2733179032802582, 0.326660692691803, 0.3800034821033478, 0.4333462715148926, 0.4866890609264374, 0.5400318503379822, 0.5933746099472046, 0.6467174291610718, 0.700060248374939, 0.7534030079841614, 0.8067457675933838, 0.860088586807251, 0.9134314060211182, 0.9667741656303406, 1.020116925239563, 1.0734597444534302, 1.1268025636672974, 1.180145263671875, 1.2334880828857422, 1.2868309020996094, 1.3401737213134766, 1.3935165405273438, 1.4468592405319214, 1.5002020597457886, 1.5535448789596558, 1.6068875789642334, 1.6602303981781006, 1.7135732173919678, 1.766916036605835, 1.8202588558197021, 1.8736015558242798, 1.926944375038147]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 4.0, 12.0, 13.0, 5.0, 8.0, 7.0, 17.0, 17.0, 19.0, 17.0, 24.0, 28.0, 29.0, 26.0, 30.0, 36.0, 35.0, 33.0, 40.0, 43.0, 30.0, 45.0, 29.0, 37.0, 36.0, 32.0, 22.0, 34.0, 33.0, 36.0, 23.0, 21.0, 26.0, 21.0, 17.0, 16.0, 12.0, 23.0, 10.0, 16.0, 7.0, 5.0, 7.0, 2.0, 5.0, 2.0, 8.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.1195793151855469, -1.0842653512954712, -1.048951506614685, -1.0136375427246094, -0.9783235788345337, -0.9430096745491028, -0.9076957702636719, -0.8723818063735962, -0.8370679020881653, -0.8017539978027344, -0.7664400339126587, -0.7311261296272278, -0.6958122253417969, -0.6604982614517212, -0.6251843571662903, -0.5898704528808594, -0.5545564889907837, -0.5192425847053528, -0.4839286208152771, -0.4486147165298462, -0.4133007824420929, -0.3779868483543396, -0.3426729440689087, -0.3073590099811554, -0.2720450758934021, -0.2367311418056488, -0.2014172226190567, -0.1661033034324646, -0.1307893693447113, -0.09547543525695801, -0.060161516070365906, -0.024847596883773804, 0.010466217994689941, 0.04578014463186264, 0.08109407126903534, 0.11640799790620804, 0.15172192454338074, 0.18703585863113403, 0.22234977781772614, 0.25766369700431824, 0.29297763109207153, 0.32829156517982483, 0.3636054992675781, 0.39891940355300903, 0.43423333764076233, 0.4695472717285156, 0.5048611760139465, 0.5401750802993774, 0.5754890441894531, 0.610802948474884, 0.6461169123649597, 0.6814308166503906, 0.7167447805404663, 0.7520586848258972, 0.7873725891113281, 0.8226865530014038, 0.8580004572868347, 0.8933143615722656, 0.9286283254623413, 0.9639422297477722, 0.9992561340332031, 1.0345700979232788, 1.0698840618133545, 1.1051979064941406, 1.1405118703842163]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 9.0, 9.0, 21.0, 23.0, 26.0, 35.0, 58.0, 78.0, 145.0, 182.0, 279.0, 420.0, 617.0, 833.0, 1273.0, 1946.0, 2980.0, 4437.0, 6468.0, 9511.0, 14122.0, 20150.0, 28597.0, 39687.0, 52228.0, 67427.0, 81790.0, 93884.0, 100042.0, 99973.0, 92837.0, 81267.0, 66285.0, 51557.0, 38564.0, 28347.0, 19676.0, 13907.0, 9248.0, 6521.0, 4258.0, 2877.0, 1954.0, 1284.0, 899.0, 561.0, 425.0, 268.0, 168.0, 130.0, 77.0, 68.0, 40.0, 37.0, 20.0, 12.0, 11.0, 10.0, 2.0, 0.0, 2.0], "bins": [-0.9580078125, -0.9280471801757812, -0.8980865478515625, -0.8681259155273438, -0.838165283203125, -0.8082046508789062, -0.7782440185546875, -0.7482833862304688, -0.71832275390625, -0.6883621215820312, -0.6584014892578125, -0.6284408569335938, -0.598480224609375, -0.5685195922851562, -0.5385589599609375, -0.5085983276367188, -0.4786376953125, -0.44867706298828125, -0.4187164306640625, -0.38875579833984375, -0.358795166015625, -0.32883453369140625, -0.2988739013671875, -0.26891326904296875, -0.23895263671875, -0.20899200439453125, -0.1790313720703125, -0.14907073974609375, -0.119110107421875, -0.08914947509765625, -0.0591888427734375, -0.02922821044921875, 0.000732421875, 0.03069305419921875, 0.0606536865234375, 0.09061431884765625, 0.120574951171875, 0.15053558349609375, 0.1804962158203125, 0.21045684814453125, 0.24041748046875, 0.27037811279296875, 0.3003387451171875, 0.33029937744140625, 0.360260009765625, 0.39022064208984375, 0.4201812744140625, 0.45014190673828125, 0.4801025390625, 0.5100631713867188, 0.5400238037109375, 0.5699844360351562, 0.599945068359375, 0.6299057006835938, 0.6598663330078125, 0.6898269653320312, 0.71978759765625, 0.7497482299804688, 0.7797088623046875, 0.8096694946289062, 0.839630126953125, 0.8695907592773438, 0.8995513916015625, 0.9295120239257812, 0.95947265625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 9.0, 15.0, 9.0, 14.0, 18.0, 16.0, 18.0, 32.0, 18.0, 27.0, 27.0, 35.0, 32.0, 39.0, 38.0, 42.0, 42.0, 35.0, 45.0, 34.0, 30.0, 40.0, 39.0, 31.0, 31.0, 29.0, 32.0, 36.0, 20.0, 22.0, 28.0, 14.0, 24.0, 15.0, 13.0, 6.0, 7.0, 10.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.2323455810546875, -1.193206787109375, -1.1540679931640625, -1.11492919921875, -1.0757904052734375, -1.036651611328125, -0.9975128173828125, -0.9583740234375, -0.9192352294921875, -0.880096435546875, -0.8409576416015625, -0.80181884765625, -0.7626800537109375, -0.723541259765625, -0.6844024658203125, -0.645263671875, -0.6061248779296875, -0.566986083984375, -0.5278472900390625, -0.48870849609375, -0.4495697021484375, -0.410430908203125, -0.3712921142578125, -0.3321533203125, -0.2930145263671875, -0.253875732421875, -0.2147369384765625, -0.17559814453125, -0.1364593505859375, -0.097320556640625, -0.0581817626953125, -0.01904296875, 0.0200958251953125, 0.059234619140625, 0.0983734130859375, 0.13751220703125, 0.1766510009765625, 0.215789794921875, 0.2549285888671875, 0.2940673828125, 0.3332061767578125, 0.372344970703125, 0.4114837646484375, 0.45062255859375, 0.4897613525390625, 0.528900146484375, 0.5680389404296875, 0.607177734375, 0.6463165283203125, 0.685455322265625, 0.7245941162109375, 0.76373291015625, 0.8028717041015625, 0.842010498046875, 0.8811492919921875, 0.9202880859375, 0.9594268798828125, 0.998565673828125, 1.0377044677734375, 1.07684326171875, 1.1159820556640625, 1.155120849609375, 1.1942596435546875, 1.2333984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 10.0, 8.0, 11.0, 22.0, 29.0, 68.0, 67.0, 119.0, 184.0, 317.0, 494.0, 762.0, 1152.0, 2022.0, 3092.0, 4905.0, 8088.0, 12717.0, 20001.0, 30216.0, 44584.0, 62767.0, 83348.0, 102451.0, 116277.0, 118908.0, 110914.0, 93998.0, 73122.0, 53166.0, 37010.0, 24681.0, 15944.0, 10088.0, 6514.0, 3982.0, 2479.0, 1537.0, 959.0, 526.0, 366.0, 207.0, 155.0, 102.0, 67.0, 40.0, 28.0, 19.0, 9.0, 14.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.1669921875, -1.13189697265625, -1.0968017578125, -1.06170654296875, -1.026611328125, -0.99151611328125, -0.9564208984375, -0.92132568359375, -0.88623046875, -0.85113525390625, -0.8160400390625, -0.78094482421875, -0.745849609375, -0.71075439453125, -0.6756591796875, -0.64056396484375, -0.60546875, -0.57037353515625, -0.5352783203125, -0.50018310546875, -0.465087890625, -0.42999267578125, -0.3948974609375, -0.35980224609375, -0.32470703125, -0.28961181640625, -0.2545166015625, -0.21942138671875, -0.184326171875, -0.14923095703125, -0.1141357421875, -0.07904052734375, -0.0439453125, -0.00885009765625, 0.0262451171875, 0.06134033203125, 0.096435546875, 0.13153076171875, 0.1666259765625, 0.20172119140625, 0.23681640625, 0.27191162109375, 0.3070068359375, 0.34210205078125, 0.377197265625, 0.41229248046875, 0.4473876953125, 0.48248291015625, 0.517578125, 0.55267333984375, 0.5877685546875, 0.62286376953125, 0.657958984375, 0.69305419921875, 0.7281494140625, 0.76324462890625, 0.79833984375, 0.83343505859375, 0.8685302734375, 0.90362548828125, 0.938720703125, 0.97381591796875, 1.0089111328125, 1.04400634765625, 1.0791015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 8.0, 17.0, 23.0, 19.0, 23.0, 29.0, 28.0, 30.0, 29.0, 28.0, 31.0, 34.0, 40.0, 48.0, 45.0, 29.0, 33.0, 38.0, 35.0, 42.0, 32.0, 40.0, 26.0, 29.0, 29.0, 31.0, 19.0, 22.0, 13.0, 16.0, 16.0, 13.0, 17.0, 3.0, 14.0, 11.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.701171875, -0.6784591674804688, -0.6557464599609375, -0.6330337524414062, -0.610321044921875, -0.5876083374023438, -0.5648956298828125, -0.5421829223632812, -0.51947021484375, -0.49675750732421875, -0.4740447998046875, -0.45133209228515625, -0.428619384765625, -0.40590667724609375, -0.3831939697265625, -0.36048126220703125, -0.3377685546875, -0.31505584716796875, -0.2923431396484375, -0.26963043212890625, -0.246917724609375, -0.22420501708984375, -0.2014923095703125, -0.17877960205078125, -0.15606689453125, -0.13335418701171875, -0.1106414794921875, -0.08792877197265625, -0.065216064453125, -0.04250335693359375, -0.0197906494140625, 0.00292205810546875, 0.025634765625, 0.04834747314453125, 0.0710601806640625, 0.09377288818359375, 0.116485595703125, 0.13919830322265625, 0.1619110107421875, 0.18462371826171875, 0.20733642578125, 0.23004913330078125, 0.2527618408203125, 0.27547454833984375, 0.298187255859375, 0.32089996337890625, 0.3436126708984375, 0.36632537841796875, 0.3890380859375, 0.41175079345703125, 0.4344635009765625, 0.45717620849609375, 0.479888916015625, 0.5026016235351562, 0.5253143310546875, 0.5480270385742188, 0.57073974609375, 0.5934524536132812, 0.6161651611328125, 0.6388778686523438, 0.661590576171875, 0.6843032836914062, 0.7070159912109375, 0.7297286987304688, 0.75244140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 3.0, 9.0, 7.0, 13.0, 16.0, 29.0, 39.0, 43.0, 82.0, 137.0, 235.0, 319.0, 584.0, 978.0, 1580.0, 2731.0, 4820.0, 8641.0, 16403.0, 31157.0, 58939.0, 107061.0, 169935.0, 206219.0, 179453.0, 117424.0, 66069.0, 34905.0, 18197.0, 9790.0, 5309.0, 2977.0, 1718.0, 1037.0, 649.0, 366.0, 227.0, 145.0, 88.0, 66.0, 43.0, 32.0, 20.0, 18.0, 11.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.98583984375, -0.95733642578125, -0.9288330078125, -0.90032958984375, -0.871826171875, -0.84332275390625, -0.8148193359375, -0.78631591796875, -0.7578125, -0.72930908203125, -0.7008056640625, -0.67230224609375, -0.643798828125, -0.61529541015625, -0.5867919921875, -0.55828857421875, -0.52978515625, -0.50128173828125, -0.4727783203125, -0.44427490234375, -0.415771484375, -0.38726806640625, -0.3587646484375, -0.33026123046875, -0.3017578125, -0.27325439453125, -0.2447509765625, -0.21624755859375, -0.187744140625, -0.15924072265625, -0.1307373046875, -0.10223388671875, -0.07373046875, -0.04522705078125, -0.0167236328125, 0.01177978515625, 0.040283203125, 0.06878662109375, 0.0972900390625, 0.12579345703125, 0.154296875, 0.18280029296875, 0.2113037109375, 0.23980712890625, 0.268310546875, 0.29681396484375, 0.3253173828125, 0.35382080078125, 0.38232421875, 0.41082763671875, 0.4393310546875, 0.46783447265625, 0.496337890625, 0.52484130859375, 0.5533447265625, 0.58184814453125, 0.6103515625, 0.63885498046875, 0.6673583984375, 0.69586181640625, 0.724365234375, 0.75286865234375, 0.7813720703125, 0.80987548828125, 0.83837890625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 20.0, 14.0, 20.0, 22.0, 32.0, 29.0, 37.0, 50.0, 51.0, 50.0, 70.0, 48.0, 48.0, 61.0, 46.0, 69.0, 51.0, 41.0, 33.0, 38.0, 27.0, 18.0, 13.0, 19.0, 12.0, 14.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.426738739013672e-05, -7.211044430732727e-05, -6.995350122451782e-05, -6.779655814170837e-05, -6.563961505889893e-05, -6.348267197608948e-05, -6.132572889328003e-05, -5.916878581047058e-05, -5.701184272766113e-05, -5.4854899644851685e-05, -5.2697956562042236e-05, -5.054101347923279e-05, -4.838407039642334e-05, -4.622712731361389e-05, -4.407018423080444e-05, -4.1913241147994995e-05, -3.975629806518555e-05, -3.75993549823761e-05, -3.544241189956665e-05, -3.32854688167572e-05, -3.1128525733947754e-05, -2.8971582651138306e-05, -2.6814639568328857e-05, -2.465769648551941e-05, -2.250075340270996e-05, -2.0343810319900513e-05, -1.8186867237091064e-05, -1.6029924154281616e-05, -1.3872981071472168e-05, -1.171603798866272e-05, -9.559094905853271e-06, -7.402151823043823e-06, -5.245208740234375e-06, -3.0882656574249268e-06, -9.313225746154785e-07, 1.2256205081939697e-06, 3.382563591003418e-06, 5.539506673812866e-06, 7.696449756622314e-06, 9.853392839431763e-06, 1.2010335922241211e-05, 1.416727900505066e-05, 1.6324222087860107e-05, 1.8481165170669556e-05, 2.0638108253479004e-05, 2.2795051336288452e-05, 2.49519944190979e-05, 2.710893750190735e-05, 2.9265880584716797e-05, 3.1422823667526245e-05, 3.357976675033569e-05, 3.573670983314514e-05, 3.789365291595459e-05, 4.005059599876404e-05, 4.2207539081573486e-05, 4.4364482164382935e-05, 4.652142524719238e-05, 4.867836833000183e-05, 5.083531141281128e-05, 5.299225449562073e-05, 5.5149197578430176e-05, 5.7306140661239624e-05, 5.946308374404907e-05, 6.162002682685852e-05, 6.377696990966797e-05]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 3.0, 12.0, 15.0, 23.0, 36.0, 44.0, 74.0, 99.0, 142.0, 203.0, 282.0, 478.0, 713.0, 1120.0, 1600.0, 2595.0, 3883.0, 6021.0, 9513.0, 15378.0, 24343.0, 37686.0, 56452.0, 82289.0, 110634.0, 132661.0, 137119.0, 123755.0, 98314.0, 70054.0, 47818.0, 30862.0, 19866.0, 12479.0, 7609.0, 5040.0, 3219.0, 2080.0, 1329.0, 904.0, 634.0, 387.0, 257.0, 175.0, 117.0, 75.0, 63.0, 32.0, 24.0, 13.0, 12.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5724029541015625, -0.553497314453125, -0.5345916748046875, -0.51568603515625, -0.4967803955078125, -0.477874755859375, -0.4589691162109375, -0.4400634765625, -0.4211578369140625, -0.402252197265625, -0.3833465576171875, -0.36444091796875, -0.3455352783203125, -0.326629638671875, -0.3077239990234375, -0.288818359375, -0.2699127197265625, -0.251007080078125, -0.2321014404296875, -0.21319580078125, -0.1942901611328125, -0.175384521484375, -0.1564788818359375, -0.1375732421875, -0.1186676025390625, -0.099761962890625, -0.0808563232421875, -0.06195068359375, -0.0430450439453125, -0.024139404296875, -0.0052337646484375, 0.013671875, 0.0325775146484375, 0.051483154296875, 0.0703887939453125, 0.08929443359375, 0.1082000732421875, 0.127105712890625, 0.1460113525390625, 0.1649169921875, 0.1838226318359375, 0.202728271484375, 0.2216339111328125, 0.24053955078125, 0.2594451904296875, 0.278350830078125, 0.2972564697265625, 0.316162109375, 0.3350677490234375, 0.353973388671875, 0.3728790283203125, 0.39178466796875, 0.4106903076171875, 0.429595947265625, 0.4485015869140625, 0.4674072265625, 0.4863128662109375, 0.505218505859375, 0.5241241455078125, 0.54302978515625, 0.5619354248046875, 0.580841064453125, 0.5997467041015625, 0.61865234375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 3.0, 10.0, 7.0, 6.0, 5.0, 12.0, 18.0, 18.0, 29.0, 26.0, 26.0, 40.0, 30.0, 51.0, 35.0, 58.0, 45.0, 55.0, 52.0, 60.0, 53.0, 48.0, 51.0, 38.0, 40.0, 39.0, 19.0, 19.0, 23.0, 13.0, 16.0, 10.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22766685485839844, -0.21961593627929688, -0.2115650177001953, -0.20351409912109375, -0.1954631805419922, -0.18741226196289062, -0.17936134338378906, -0.1713104248046875, -0.16325950622558594, -0.15520858764648438, -0.1471576690673828, -0.13910675048828125, -0.1310558319091797, -0.12300491333007812, -0.11495399475097656, -0.106903076171875, -0.09885215759277344, -0.09080123901367188, -0.08275032043457031, -0.07469940185546875, -0.06664848327636719, -0.058597564697265625, -0.05054664611816406, -0.0424957275390625, -0.03444480895996094, -0.026393890380859375, -0.018342971801757812, -0.01029205322265625, -0.0022411346435546875, 0.005809783935546875, 0.013860702514648438, 0.02191162109375, 0.029962539672851562, 0.038013458251953125, 0.04606437683105469, 0.05411529541015625, 0.06216621398925781, 0.07021713256835938, 0.07826805114746094, 0.0863189697265625, 0.09436988830566406, 0.10242080688476562, 0.11047172546386719, 0.11852264404296875, 0.1265735626220703, 0.13462448120117188, 0.14267539978027344, 0.150726318359375, 0.15877723693847656, 0.16682815551757812, 0.1748790740966797, 0.18292999267578125, 0.1909809112548828, 0.19903182983398438, 0.20708274841308594, 0.2151336669921875, 0.22318458557128906, 0.23123550415039062, 0.2392864227294922, 0.24733734130859375, 0.2553882598876953, 0.2634391784667969, 0.27149009704589844, 0.279541015625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 9.0, 5.0, 6.0, 7.0, 16.0, 15.0, 21.0, 23.0, 38.0, 29.0, 47.0, 48.0, 44.0, 52.0, 50.0, 56.0, 71.0, 50.0, 58.0, 47.0, 43.0, 42.0, 35.0, 32.0, 27.0, 22.0, 22.0, 16.0, 13.0, 5.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4840911626815796, -1.4314384460449219, -1.3787857294082642, -1.3261330127716064, -1.2734804153442383, -1.2208276987075806, -1.1681749820709229, -1.1155222654342651, -1.0628695487976074, -1.0102168321609497, -0.9575641751289368, -0.904911458492279, -0.8522588014602661, -0.7996060848236084, -0.7469533681869507, -0.694300651550293, -0.6416480541229248, -0.5889953374862671, -0.5363426804542542, -0.48368996381759644, -0.4310372769832611, -0.3783845901489258, -0.32573187351226807, -0.27307918667793274, -0.2204264998435974, -0.16777381300926208, -0.11512111127376556, -0.06246840953826904, -0.009815722703933716, 0.04283696413040161, 0.09548968076705933, 0.14814236760139465, 0.20079493522644043, 0.25344762206077576, 0.3061003088951111, 0.3587530255317688, 0.4114057123661041, 0.46405839920043945, 0.5167111158370972, 0.5693638324737549, 0.6220164895057678, 0.6746692061424255, 0.7273218631744385, 0.7799745798110962, 0.8326272964477539, 0.8852799534797668, 0.9379326701164246, 0.9905853271484375, 1.0432380437850952, 1.095890760421753, 1.1485434770584106, 1.2011961936950684, 1.2538487911224365, 1.3065015077590942, 1.359154224395752, 1.4118069410324097, 1.4644596576690674, 1.517112374305725, 1.5697650909423828, 1.622417688369751, 1.6750704050064087, 1.7277231216430664, 1.7803758382797241, 1.8330285549163818, 1.88568115234375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 8.0, 13.0, 18.0, 16.0, 12.0, 27.0, 26.0, 29.0, 25.0, 37.0, 28.0, 26.0, 41.0, 37.0, 37.0, 37.0, 42.0, 36.0, 30.0, 32.0, 38.0, 39.0, 31.0, 26.0, 25.0, 30.0, 23.0, 27.0, 26.0, 17.0, 14.0, 14.0, 13.0, 13.0, 11.0, 12.0, 15.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 3.0], "bins": [-1.2504222393035889, -1.2146520614624023, -1.1788820028305054, -1.1431118249893188, -1.1073417663574219, -1.0715715885162354, -1.0358015298843384, -1.0000313520431519, -0.9642612934112549, -0.9284911751747131, -0.8927210569381714, -0.8569509387016296, -0.8211808204650879, -0.7854107022285461, -0.7496405839920044, -0.7138704061508179, -0.6781002879142761, -0.6423301696777344, -0.6065600514411926, -0.5707899332046509, -0.5350198149681091, -0.4992496967315674, -0.46347954869270325, -0.4277094304561615, -0.39193931221961975, -0.356169193983078, -0.32039907574653625, -0.2846289277076721, -0.24885882437229156, -0.21308870613574982, -0.17731857299804688, -0.14154845476150513, -0.10577833652496338, -0.07000821828842163, -0.034238092601299286, 0.001532033085823059, 0.03730215132236481, 0.07307226955890656, 0.1088424026966095, 0.14461252093315125, 0.180382639169693, 0.21615275740623474, 0.2519228756427765, 0.2876930236816406, 0.3234631419181824, 0.3592332601547241, 0.39500337839126587, 0.4307734966278076, 0.46654361486434937, 0.5023137331008911, 0.5380838513374329, 0.5738539695739746, 0.6096240878105164, 0.6453942060470581, 0.6811643838882446, 0.7169344425201416, 0.7527046203613281, 0.7884747385978699, 0.8242448568344116, 0.8600149750709534, 0.8957850933074951, 0.9315552115440369, 0.9673253297805786, 1.0030955076217651, 1.038865566253662]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 6.0, 4.0, 5.0, 14.0, 27.0, 51.0, 55.0, 87.0, 141.0, 202.0, 342.0, 526.0, 773.0, 1209.0, 1954.0, 3154.0, 5054.0, 8268.0, 13544.0, 22511.0, 37272.0, 62087.0, 102599.0, 165864.0, 261436.0, 385996.0, 514907.0, 595147.0, 580517.0, 478583.0, 348549.0, 230901.0, 146224.0, 89542.0, 53929.0, 32804.0, 19336.0, 11745.0, 7175.0, 4370.0, 2751.0, 1632.0, 1050.0, 640.0, 454.0, 287.0, 210.0, 126.0, 83.0, 46.0, 35.0, 22.0, 13.0, 6.0, 9.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0], "bins": [-1.1181640625, -1.0819244384765625, -1.045684814453125, -1.0094451904296875, -0.97320556640625, -0.9369659423828125, -0.900726318359375, -0.8644866943359375, -0.8282470703125, -0.7920074462890625, -0.755767822265625, -0.7195281982421875, -0.68328857421875, -0.6470489501953125, -0.610809326171875, -0.5745697021484375, -0.538330078125, -0.5020904541015625, -0.465850830078125, -0.4296112060546875, -0.39337158203125, -0.3571319580078125, -0.320892333984375, -0.2846527099609375, -0.2484130859375, -0.2121734619140625, -0.175933837890625, -0.1396942138671875, -0.10345458984375, -0.0672149658203125, -0.030975341796875, 0.0052642822265625, 0.04150390625, 0.0777435302734375, 0.113983154296875, 0.1502227783203125, 0.18646240234375, 0.2227020263671875, 0.258941650390625, 0.2951812744140625, 0.3314208984375, 0.3676605224609375, 0.403900146484375, 0.4401397705078125, 0.47637939453125, 0.5126190185546875, 0.548858642578125, 0.5850982666015625, 0.621337890625, 0.6575775146484375, 0.693817138671875, 0.7300567626953125, 0.76629638671875, 0.8025360107421875, 0.838775634765625, 0.8750152587890625, 0.9112548828125, 0.9474945068359375, 0.983734130859375, 1.0199737548828125, 1.05621337890625, 1.0924530029296875, 1.128692626953125, 1.1649322509765625, 1.201171875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 3.0, 13.0, 10.0, 10.0, 11.0, 10.0, 17.0, 22.0, 17.0, 31.0, 25.0, 39.0, 40.0, 33.0, 28.0, 37.0, 26.0, 43.0, 40.0, 39.0, 29.0, 39.0, 39.0, 39.0, 26.0, 35.0, 31.0, 33.0, 25.0, 28.0, 16.0, 23.0, 23.0, 18.0, 11.0, 11.0, 12.0, 16.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.86962890625, -0.842926025390625, -0.81622314453125, -0.789520263671875, -0.7628173828125, -0.736114501953125, -0.70941162109375, -0.682708740234375, -0.656005859375, -0.629302978515625, -0.60260009765625, -0.575897216796875, -0.5491943359375, -0.522491455078125, -0.49578857421875, -0.469085693359375, -0.4423828125, -0.415679931640625, -0.38897705078125, -0.362274169921875, -0.3355712890625, -0.308868408203125, -0.28216552734375, -0.255462646484375, -0.228759765625, -0.202056884765625, -0.17535400390625, -0.148651123046875, -0.1219482421875, -0.095245361328125, -0.06854248046875, -0.041839599609375, -0.01513671875, 0.011566162109375, 0.03826904296875, 0.064971923828125, 0.0916748046875, 0.118377685546875, 0.14508056640625, 0.171783447265625, 0.198486328125, 0.225189208984375, 0.25189208984375, 0.278594970703125, 0.3052978515625, 0.332000732421875, 0.35870361328125, 0.385406494140625, 0.412109375, 0.438812255859375, 0.46551513671875, 0.492218017578125, 0.5189208984375, 0.545623779296875, 0.57232666015625, 0.599029541015625, 0.625732421875, 0.652435302734375, 0.67913818359375, 0.705841064453125, 0.7325439453125, 0.759246826171875, 0.78594970703125, 0.812652587890625, 0.83935546875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 10.0, 18.0, 27.0, 53.0, 75.0, 140.0, 176.0, 299.0, 464.0, 772.0, 1244.0, 2035.0, 3147.0, 5348.0, 8621.0, 14054.0, 23110.0, 37565.0, 58740.0, 92549.0, 141389.0, 208076.0, 289879.0, 379392.0, 455817.0, 496042.0, 482191.0, 420586.0, 337083.0, 247941.0, 173525.0, 115371.0, 75168.0, 47425.0, 29394.0, 18006.0, 11169.0, 6637.0, 4120.0, 2539.0, 1571.0, 950.0, 580.0, 356.0, 231.0, 139.0, 93.0, 60.0, 42.0, 26.0, 20.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.001953125, -0.9693756103515625, -0.936798095703125, -0.9042205810546875, -0.87164306640625, -0.8390655517578125, -0.806488037109375, -0.7739105224609375, -0.7413330078125, -0.7087554931640625, -0.676177978515625, -0.6436004638671875, -0.61102294921875, -0.5784454345703125, -0.545867919921875, -0.5132904052734375, -0.480712890625, -0.4481353759765625, -0.415557861328125, -0.3829803466796875, -0.35040283203125, -0.3178253173828125, -0.285247802734375, -0.2526702880859375, -0.2200927734375, -0.1875152587890625, -0.154937744140625, -0.1223602294921875, -0.08978271484375, -0.0572052001953125, -0.024627685546875, 0.0079498291015625, 0.04052734375, 0.0731048583984375, 0.105682373046875, 0.1382598876953125, 0.17083740234375, 0.2034149169921875, 0.235992431640625, 0.2685699462890625, 0.3011474609375, 0.3337249755859375, 0.366302490234375, 0.3988800048828125, 0.43145751953125, 0.4640350341796875, 0.496612548828125, 0.5291900634765625, 0.561767578125, 0.5943450927734375, 0.626922607421875, 0.6595001220703125, 0.69207763671875, 0.7246551513671875, 0.757232666015625, 0.7898101806640625, 0.8223876953125, 0.8549652099609375, 0.887542724609375, 0.9201202392578125, 0.95269775390625, 0.9852752685546875, 1.017852783203125, 1.0504302978515625, 1.0830078125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 8.0, 10.0, 21.0, 28.0, 31.0, 37.0, 62.0, 68.0, 64.0, 92.0, 124.0, 139.0, 153.0, 184.0, 233.0, 217.0, 261.0, 220.0, 245.0, 226.0, 217.0, 203.0, 190.0, 163.0, 163.0, 134.0, 131.0, 121.0, 73.0, 54.0, 43.0, 46.0, 23.0, 18.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5153656005859375, -0.499481201171875, -0.4835968017578125, -0.46771240234375, -0.4518280029296875, -0.435943603515625, -0.4200592041015625, -0.4041748046875, -0.3882904052734375, -0.372406005859375, -0.3565216064453125, -0.34063720703125, -0.3247528076171875, -0.308868408203125, -0.2929840087890625, -0.277099609375, -0.2612152099609375, -0.245330810546875, -0.2294464111328125, -0.21356201171875, -0.1976776123046875, -0.181793212890625, -0.1659088134765625, -0.1500244140625, -0.1341400146484375, -0.118255615234375, -0.1023712158203125, -0.08648681640625, -0.0706024169921875, -0.054718017578125, -0.0388336181640625, -0.02294921875, -0.0070648193359375, 0.008819580078125, 0.0247039794921875, 0.04058837890625, 0.0564727783203125, 0.072357177734375, 0.0882415771484375, 0.1041259765625, 0.1200103759765625, 0.135894775390625, 0.1517791748046875, 0.16766357421875, 0.1835479736328125, 0.199432373046875, 0.2153167724609375, 0.231201171875, 0.2470855712890625, 0.262969970703125, 0.2788543701171875, 0.29473876953125, 0.3106231689453125, 0.326507568359375, 0.3423919677734375, 0.3582763671875, 0.3741607666015625, 0.390045166015625, 0.4059295654296875, 0.42181396484375, 0.4376983642578125, 0.453582763671875, 0.4694671630859375, 0.4853515625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 18.0, 17.0, 25.0, 29.0, 38.0, 34.0, 45.0, 47.0, 45.0, 56.0, 63.0, 65.0, 61.0, 46.0, 63.0, 40.0, 35.0, 31.0, 29.0, 30.0, 31.0, 18.0, 23.0, 22.0, 7.0, 7.0, 10.0, 6.0, 3.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7404402494430542, -1.6902867555618286, -1.6401333808898926, -1.589979887008667, -1.5398263931274414, -1.4896728992462158, -1.4395195245742798, -1.3893660306930542, -1.3392125368118286, -1.289059042930603, -1.238905668258667, -1.1887521743774414, -1.1385986804962158, -1.0884451866149902, -1.0382918119430542, -0.9881383180618286, -0.9379848837852478, -0.887831449508667, -0.8376779556274414, -0.7875245213508606, -0.737371027469635, -0.6872175931930542, -0.6370640993118286, -0.5869106650352478, -0.536757230758667, -0.4866037666797638, -0.4364503026008606, -0.3862968683242798, -0.3361433744430542, -0.2859899401664734, -0.2358364760875702, -0.185683012008667, -0.1355295181274414, -0.08537605404853821, -0.03522259742021561, 0.014930859208106995, 0.06508432328701019, 0.1152377724647522, 0.1653912365436554, 0.2155447006225586, 0.2656981647014618, 0.315851628780365, 0.3660050928592682, 0.4161585569381714, 0.4663119912147522, 0.516465425491333, 0.5666189193725586, 0.6167724132537842, 0.666925847530365, 0.7170792818069458, 0.7672327756881714, 0.8173862099647522, 0.8675397038459778, 0.9176931381225586, 0.9678466320037842, 1.0180001258850098, 1.0681535005569458, 1.1183069944381714, 1.1684603691101074, 1.218613862991333, 1.2687673568725586, 1.3189208507537842, 1.3690742254257202, 1.4192277193069458, 1.4693812131881714]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 33.0, 31.0, 49.0, 32.0, 43.0, 33.0, 42.0, 45.0, 38.0, 41.0, 46.0, 48.0, 35.0, 43.0, 32.0, 41.0, 34.0, 29.0, 22.0, 29.0, 18.0, 22.0, 18.0, 18.0, 10.0, 13.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1312960386276245, -1.0931018590927124, -1.0549076795578003, -1.0167135000228882, -0.9785193204879761, -0.940325140953064, -0.9021309614181519, -0.8639367818832397, -0.8257426023483276, -0.7875484228134155, -0.7493542432785034, -0.7111600637435913, -0.6729658842086792, -0.6347717046737671, -0.596577525138855, -0.5583833456039429, -0.520189106464386, -0.4819949269294739, -0.44380074739456177, -0.40560656785964966, -0.36741238832473755, -0.32921820878982544, -0.29102399945259094, -0.25282981991767883, -0.21463564038276672, -0.17644146084785461, -0.1382472813129425, -0.1000530868768692, -0.06185890734195709, -0.023664727807044983, 0.01452946662902832, 0.05272364616394043, 0.09091782569885254, 0.12911200523376465, 0.16730618476867676, 0.20550037920475006, 0.24369455873966217, 0.2818887233734131, 0.3200829327106476, 0.3582771122455597, 0.3964712917804718, 0.4346654713153839, 0.472859650850296, 0.5110538601875305, 0.5492480397224426, 0.5874422192573547, 0.6256363987922668, 0.663830578327179, 0.7020247578620911, 0.7402189373970032, 0.7784131169319153, 0.8166072964668274, 0.8548014760017395, 0.8929956555366516, 0.9311898946762085, 0.9693840742111206, 1.0075782537460327, 1.0457724332809448, 1.083966612815857, 1.122160792350769, 1.1603549718856812, 1.1985491514205933, 1.2367433309555054, 1.2749375104904175, 1.3131316900253296]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 11.0, 22.0, 16.0, 46.0, 63.0, 92.0, 134.0, 198.0, 265.0, 442.0, 722.0, 1011.0, 1595.0, 2449.0, 3737.0, 5824.0, 8756.0, 13578.0, 20997.0, 32060.0, 48982.0, 73299.0, 105470.0, 140775.0, 155347.0, 133909.0, 99948.0, 68504.0, 45225.0, 29942.0, 19296.0, 12498.0, 8209.0, 5180.0, 3422.0, 2184.0, 1536.0, 928.0, 632.0, 396.0, 281.0, 194.0, 134.0, 76.0, 51.0, 37.0, 31.0, 26.0, 8.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.358642578125, -0.3485145568847656, -0.33838653564453125, -0.3282585144042969, -0.3181304931640625, -0.3080024719238281, -0.29787445068359375, -0.2877464294433594, -0.277618408203125, -0.2674903869628906, -0.25736236572265625, -0.24723434448242188, -0.2371063232421875, -0.22697830200195312, -0.21685028076171875, -0.20672225952148438, -0.19659423828125, -0.18646621704101562, -0.17633819580078125, -0.16621017456054688, -0.1560821533203125, -0.14595413208007812, -0.13582611083984375, -0.12569808959960938, -0.115570068359375, -0.10544204711914062, -0.09531402587890625, -0.08518600463867188, -0.0750579833984375, -0.06492996215820312, -0.05480194091796875, -0.044673919677734375, -0.0345458984375, -0.024417877197265625, -0.01428985595703125, -0.004161834716796875, 0.0059661865234375, 0.016094207763671875, 0.02622222900390625, 0.036350250244140625, 0.046478271484375, 0.056606292724609375, 0.06673431396484375, 0.07686233520507812, 0.0869903564453125, 0.09711837768554688, 0.10724639892578125, 0.11737442016601562, 0.12750244140625, 0.13763046264648438, 0.14775848388671875, 0.15788650512695312, 0.1680145263671875, 0.17814254760742188, 0.18827056884765625, 0.19839859008789062, 0.208526611328125, 0.21865463256835938, 0.22878265380859375, 0.23891067504882812, 0.2490386962890625, 0.2591667175292969, 0.26929473876953125, 0.2794227600097656, 0.28955078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 11.0, 5.0, 8.0, 5.0, 8.0, 10.0, 13.0, 9.0, 18.0, 18.0, 27.0, 19.0, 31.0, 35.0, 35.0, 35.0, 29.0, 52.0, 31.0, 33.0, 46.0, 38.0, 42.0, 42.0, 45.0, 38.0, 40.0, 38.0, 26.0, 26.0, 32.0, 22.0, 31.0, 13.0, 18.0, 14.0, 10.0, 13.0, 7.0, 6.0, 6.0, 7.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0423736572265625, -1.005645751953125, -0.9689178466796875, -0.93218994140625, -0.8954620361328125, -0.858734130859375, -0.8220062255859375, -0.7852783203125, -0.7485504150390625, -0.711822509765625, -0.6750946044921875, -0.63836669921875, -0.6016387939453125, -0.564910888671875, -0.5281829833984375, -0.491455078125, -0.4547271728515625, -0.417999267578125, -0.3812713623046875, -0.34454345703125, -0.3078155517578125, -0.271087646484375, -0.2343597412109375, -0.1976318359375, -0.1609039306640625, -0.124176025390625, -0.0874481201171875, -0.05072021484375, -0.0139923095703125, 0.022735595703125, 0.0594635009765625, 0.09619140625, 0.1329193115234375, 0.169647216796875, 0.2063751220703125, 0.24310302734375, 0.2798309326171875, 0.316558837890625, 0.3532867431640625, 0.3900146484375, 0.4267425537109375, 0.463470458984375, 0.5001983642578125, 0.53692626953125, 0.5736541748046875, 0.610382080078125, 0.6471099853515625, 0.683837890625, 0.7205657958984375, 0.757293701171875, 0.7940216064453125, 0.83074951171875, 0.8674774169921875, 0.904205322265625, 0.9409332275390625, 0.9776611328125, 1.0143890380859375, 1.051116943359375, 1.0878448486328125, 1.12457275390625, 1.1613006591796875, 1.198028564453125, 1.2347564697265625, 1.271484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 20.0, 13.0, 23.0, 29.0, 55.0, 75.0, 119.0, 169.0, 306.0, 486.0, 820.0, 1418.0, 2535.0, 4501.0, 8335.0, 16166.0, 31751.0, 62708.0, 120147.0, 204119.0, 236822.0, 167482.0, 92455.0, 47155.0, 23902.0, 12360.0, 6375.0, 3495.0, 1908.0, 1073.0, 645.0, 373.0, 215.0, 137.0, 120.0, 68.0, 51.0, 33.0, 17.0, 12.0, 14.0, 5.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.50390625, -0.48876953125, -0.4736328125, -0.45849609375, -0.443359375, -0.42822265625, -0.4130859375, -0.39794921875, -0.3828125, -0.36767578125, -0.3525390625, -0.33740234375, -0.322265625, -0.30712890625, -0.2919921875, -0.27685546875, -0.26171875, -0.24658203125, -0.2314453125, -0.21630859375, -0.201171875, -0.18603515625, -0.1708984375, -0.15576171875, -0.140625, -0.12548828125, -0.1103515625, -0.09521484375, -0.080078125, -0.06494140625, -0.0498046875, -0.03466796875, -0.01953125, -0.00439453125, 0.0107421875, 0.02587890625, 0.041015625, 0.05615234375, 0.0712890625, 0.08642578125, 0.1015625, 0.11669921875, 0.1318359375, 0.14697265625, 0.162109375, 0.17724609375, 0.1923828125, 0.20751953125, 0.22265625, 0.23779296875, 0.2529296875, 0.26806640625, 0.283203125, 0.29833984375, 0.3134765625, 0.32861328125, 0.34375, 0.35888671875, 0.3740234375, 0.38916015625, 0.404296875, 0.41943359375, 0.4345703125, 0.44970703125, 0.46484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 7.0, 7.0, 13.0, 13.0, 25.0, 18.0, 19.0, 25.0, 24.0, 26.0, 45.0, 29.0, 31.0, 34.0, 42.0, 34.0, 33.0, 38.0, 32.0, 39.0, 35.0, 33.0, 28.0, 29.0, 28.0, 31.0, 28.0, 29.0, 23.0, 29.0, 19.0, 23.0, 21.0, 14.0, 14.0, 16.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72216796875, -0.6994247436523438, -0.6766815185546875, -0.6539382934570312, -0.631195068359375, -0.6084518432617188, -0.5857086181640625, -0.5629653930664062, -0.54022216796875, -0.5174789428710938, -0.4947357177734375, -0.47199249267578125, -0.449249267578125, -0.42650604248046875, -0.4037628173828125, -0.38101959228515625, -0.3582763671875, -0.33553314208984375, -0.3127899169921875, -0.29004669189453125, -0.267303466796875, -0.24456024169921875, -0.2218170166015625, -0.19907379150390625, -0.17633056640625, -0.15358734130859375, -0.1308441162109375, -0.10810089111328125, -0.085357666015625, -0.06261444091796875, -0.0398712158203125, -0.01712799072265625, 0.005615234375, 0.02835845947265625, 0.0511016845703125, 0.07384490966796875, 0.096588134765625, 0.11933135986328125, 0.1420745849609375, 0.16481781005859375, 0.18756103515625, 0.21030426025390625, 0.2330474853515625, 0.25579071044921875, 0.278533935546875, 0.30127716064453125, 0.3240203857421875, 0.34676361083984375, 0.3695068359375, 0.39225006103515625, 0.4149932861328125, 0.43773651123046875, 0.460479736328125, 0.48322296142578125, 0.5059661865234375, 0.5287094116210938, 0.55145263671875, 0.5741958618164062, 0.5969390869140625, 0.6196823120117188, 0.642425537109375, 0.6651687622070312, 0.6879119873046875, 0.7106552124023438, 0.7333984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 19.0, 26.0, 30.0, 53.0, 92.0, 94.0, 129.0, 178.0, 271.0, 372.0, 490.0, 724.0, 1016.0, 1391.0, 2200.0, 3264.0, 5237.0, 8778.0, 16545.0, 32888.0, 73867.0, 178310.0, 335355.0, 214488.0, 88057.0, 38656.0, 18903.0, 9985.0, 5853.0, 3593.0, 2335.0, 1601.0, 1055.0, 700.0, 542.0, 389.0, 279.0, 215.0, 158.0, 110.0, 77.0, 58.0, 36.0, 25.0, 26.0, 14.0, 15.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.19970703125, -0.1933879852294922, -0.18706893920898438, -0.18074989318847656, -0.17443084716796875, -0.16811180114746094, -0.16179275512695312, -0.1554737091064453, -0.1491546630859375, -0.1428356170654297, -0.13651657104492188, -0.13019752502441406, -0.12387847900390625, -0.11755943298339844, -0.11124038696289062, -0.10492134094238281, -0.098602294921875, -0.09228324890136719, -0.08596420288085938, -0.07964515686035156, -0.07332611083984375, -0.06700706481933594, -0.060688018798828125, -0.05436897277832031, -0.0480499267578125, -0.04173088073730469, -0.035411834716796875, -0.029092788696289062, -0.02277374267578125, -0.016454696655273438, -0.010135650634765625, -0.0038166046142578125, 0.00250244140625, 0.008821487426757812, 0.015140533447265625, 0.021459579467773438, 0.02777862548828125, 0.03409767150878906, 0.040416717529296875, 0.04673576354980469, 0.0530548095703125, 0.05937385559082031, 0.06569290161132812, 0.07201194763183594, 0.07833099365234375, 0.08465003967285156, 0.09096908569335938, 0.09728813171386719, 0.103607177734375, 0.10992622375488281, 0.11624526977539062, 0.12256431579589844, 0.12888336181640625, 0.13520240783691406, 0.14152145385742188, 0.1478404998779297, 0.1541595458984375, 0.1604785919189453, 0.16679763793945312, 0.17311668395996094, 0.17943572998046875, 0.18575477600097656, 0.19207382202148438, 0.1983928680419922, 0.2047119140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 10.0, 2.0, 7.0, 17.0, 15.0, 16.0, 17.0, 30.0, 33.0, 58.0, 68.0, 59.0, 72.0, 71.0, 74.0, 83.0, 72.0, 62.0, 52.0, 38.0, 43.0, 20.0, 23.0, 12.0, 16.0, 9.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.3930723071098328e-05, -1.3377517461776733e-05, -1.282431185245514e-05, -1.2271106243133545e-05, -1.171790063381195e-05, -1.1164695024490356e-05, -1.0611489415168762e-05, -1.0058283805847168e-05, -9.505078196525574e-06, -8.95187258720398e-06, -8.398666977882385e-06, -7.845461368560791e-06, -7.292255759239197e-06, -6.7390501499176025e-06, -6.185844540596008e-06, -5.632638931274414e-06, -5.07943332195282e-06, -4.526227712631226e-06, -3.973022103309631e-06, -3.419816493988037e-06, -2.866610884666443e-06, -2.3134052753448486e-06, -1.7601996660232544e-06, -1.2069940567016602e-06, -6.537884473800659e-07, -1.0058283805847168e-07, 4.5262277126312256e-07, 1.0058283805847168e-06, 1.559033989906311e-06, 2.1122395992279053e-06, 2.6654452085494995e-06, 3.2186508178710938e-06, 3.771856427192688e-06, 4.325062036514282e-06, 4.8782676458358765e-06, 5.431473255157471e-06, 5.984678864479065e-06, 6.537884473800659e-06, 7.091090083122253e-06, 7.644295692443848e-06, 8.197501301765442e-06, 8.750706911087036e-06, 9.30391252040863e-06, 9.857118129730225e-06, 1.0410323739051819e-05, 1.0963529348373413e-05, 1.1516734957695007e-05, 1.2069940567016602e-05, 1.2623146176338196e-05, 1.317635178565979e-05, 1.3729557394981384e-05, 1.4282763004302979e-05, 1.4835968613624573e-05, 1.5389174222946167e-05, 1.594237983226776e-05, 1.6495585441589355e-05, 1.704879105091095e-05, 1.7601996660232544e-05, 1.8155202269554138e-05, 1.8708407878875732e-05, 1.9261613488197327e-05, 1.981481909751892e-05, 2.0368024706840515e-05, 2.092123031616211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 4.0, 15.0, 24.0, 26.0, 34.0, 50.0, 94.0, 146.0, 233.0, 368.0, 577.0, 898.0, 1420.0, 2468.0, 3811.0, 6526.0, 11684.0, 21027.0, 39899.0, 75922.0, 139346.0, 220519.0, 220420.0, 138690.0, 75217.0, 39763.0, 20831.0, 11654.0, 6795.0, 3905.0, 2368.0, 1410.0, 832.0, 564.0, 334.0, 217.0, 133.0, 123.0, 55.0, 35.0, 43.0, 23.0, 15.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1708984375, -0.16500473022460938, -0.15911102294921875, -0.15321731567382812, -0.1473236083984375, -0.14142990112304688, -0.13553619384765625, -0.12964248657226562, -0.123748779296875, -0.11785507202148438, -0.11196136474609375, -0.10606765747070312, -0.1001739501953125, -0.09428024291992188, -0.08838653564453125, -0.08249282836914062, -0.07659912109375, -0.07070541381835938, -0.06481170654296875, -0.058917999267578125, -0.0530242919921875, -0.047130584716796875, -0.04123687744140625, -0.035343170166015625, -0.029449462890625, -0.023555755615234375, -0.01766204833984375, -0.011768341064453125, -0.0058746337890625, 1.9073486328125e-05, 0.00591278076171875, 0.011806488037109375, 0.0177001953125, 0.023593902587890625, 0.02948760986328125, 0.035381317138671875, 0.0412750244140625, 0.047168731689453125, 0.05306243896484375, 0.058956146240234375, 0.064849853515625, 0.07074356079101562, 0.07663726806640625, 0.08253097534179688, 0.0884246826171875, 0.09431838989257812, 0.10021209716796875, 0.10610580444335938, 0.11199951171875, 0.11789321899414062, 0.12378692626953125, 0.12968063354492188, 0.1355743408203125, 0.14146804809570312, 0.14736175537109375, 0.15325546264648438, 0.159149169921875, 0.16504287719726562, 0.17093658447265625, 0.17683029174804688, 0.1827239990234375, 0.18861770629882812, 0.19451141357421875, 0.20040512084960938, 0.206298828125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 18.0, 15.0, 20.0, 21.0, 20.0, 21.0, 30.0, 32.0, 31.0, 49.0, 52.0, 58.0, 52.0, 51.0, 58.0, 55.0, 56.0, 43.0, 37.0, 33.0, 40.0, 26.0, 34.0, 22.0, 19.0, 14.0, 6.0, 15.0, 3.0, 11.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03614616394042969, -0.034938812255859375, -0.03373146057128906, -0.03252410888671875, -0.03131675720214844, -0.030109405517578125, -0.028902053833007812, -0.0276947021484375, -0.026487350463867188, -0.025279998779296875, -0.024072647094726562, -0.02286529541015625, -0.021657943725585938, -0.020450592041015625, -0.019243240356445312, -0.018035888671875, -0.016828536987304688, -0.015621185302734375, -0.014413833618164062, -0.01320648193359375, -0.011999130249023438, -0.010791778564453125, -0.009584426879882812, -0.0083770751953125, -0.0071697235107421875, -0.005962371826171875, -0.0047550201416015625, -0.00354766845703125, -0.0023403167724609375, -0.001132965087890625, 7.43865966796875e-05, 0.00128173828125, 0.0024890899658203125, 0.003696441650390625, 0.0049037933349609375, 0.00611114501953125, 0.0073184967041015625, 0.008525848388671875, 0.009733200073242188, 0.0109405517578125, 0.012147903442382812, 0.013355255126953125, 0.014562606811523438, 0.01576995849609375, 0.016977310180664062, 0.018184661865234375, 0.019392013549804688, 0.020599365234375, 0.021806716918945312, 0.023014068603515625, 0.024221420288085938, 0.02542877197265625, 0.026636123657226562, 0.027843475341796875, 0.029050827026367188, 0.0302581787109375, 0.03146553039550781, 0.032672882080078125, 0.03388023376464844, 0.03508758544921875, 0.03629493713378906, 0.037502288818359375, 0.03870964050292969, 0.0399169921875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 8.0, 16.0, 19.0, 25.0, 28.0, 39.0, 41.0, 36.0, 45.0, 47.0, 68.0, 58.0, 65.0, 56.0, 54.0, 53.0, 37.0, 33.0, 34.0, 24.0, 37.0, 28.0, 29.0, 18.0, 18.0, 10.0, 4.0, 8.0, 8.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8160393238067627, -1.7665389776229858, -1.717038631439209, -1.6675382852554321, -1.6180379390716553, -1.5685375928878784, -1.5190372467041016, -1.4695369005203247, -1.4200365543365479, -1.370536208152771, -1.3210358619689941, -1.2715355157852173, -1.2220351696014404, -1.1725348234176636, -1.1230344772338867, -1.0735341310501099, -1.024033784866333, -0.9745334386825562, -0.9250330924987793, -0.8755327463150024, -0.8260324001312256, -0.7765320539474487, -0.7270317077636719, -0.677531361579895, -0.6280310153961182, -0.5785306692123413, -0.5290303230285645, -0.4795299768447876, -0.43002963066101074, -0.3805292844772339, -0.33102893829345703, -0.2815285921096802, -0.23202836513519287, -0.18252801895141602, -0.13302767276763916, -0.0835273265838623, -0.03402698040008545, 0.015473365783691406, 0.06497371196746826, 0.11447405815124512, 0.16397440433502197, 0.21347475051879883, 0.2629750967025757, 0.31247544288635254, 0.3619757890701294, 0.41147613525390625, 0.4609764814376831, 0.51047682762146, 0.5599771738052368, 0.6094775199890137, 0.6589778661727905, 0.7084782123565674, 0.7579785585403442, 0.8074789047241211, 0.856979250907898, 0.9064795970916748, 0.9559799432754517, 1.0054802894592285, 1.0549806356430054, 1.1044809818267822, 1.153981328010559, 1.203481674194336, 1.2529820203781128, 1.3024823665618896, 1.3519827127456665]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 7.0, 9.0, 15.0, 18.0, 16.0, 24.0, 37.0, 28.0, 43.0, 36.0, 39.0, 40.0, 34.0, 42.0, 44.0, 35.0, 42.0, 51.0, 42.0, 36.0, 42.0, 31.0, 41.0, 35.0, 26.0, 28.0, 22.0, 20.0, 20.0, 21.0, 14.0, 10.0, 14.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1101436614990234, -1.0721240043640137, -1.0341042280197144, -0.9960845112800598, -0.9580647945404053, -0.9200450778007507, -0.8820253610610962, -0.8440056443214417, -0.8059859275817871, -0.7679662108421326, -0.729946494102478, -0.6919267773628235, -0.653907060623169, -0.6158873438835144, -0.5778676271438599, -0.5398479104042053, -0.5018281936645508, -0.46380847692489624, -0.4257887601852417, -0.38776904344558716, -0.3497493267059326, -0.3117296099662781, -0.27370989322662354, -0.235690176486969, -0.19767045974731445, -0.1596507430076599, -0.12163102626800537, -0.08361130952835083, -0.04559159278869629, -0.007571876049041748, 0.030447840690612793, 0.06846755743026733, 0.10648727416992188, 0.14450699090957642, 0.18252670764923096, 0.2205464243888855, 0.25856614112854004, 0.2965858578681946, 0.3346055746078491, 0.37262529134750366, 0.4106450080871582, 0.44866472482681274, 0.4866844415664673, 0.5247041583061218, 0.5627238750457764, 0.6007435917854309, 0.6387633085250854, 0.67678302526474, 0.7148027420043945, 0.7528224587440491, 0.7908421754837036, 0.8288618922233582, 0.8668816089630127, 0.9049013257026672, 0.9429210424423218, 0.9809407591819763, 1.0189604759216309, 1.0569801330566406, 1.09499990940094, 1.1330196857452393, 1.171039342880249, 1.2090590000152588, 1.247078776359558, 1.2850985527038574, 1.3231182098388672]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 26.0, 32.0, 50.0, 89.0, 123.0, 213.0, 307.0, 545.0, 957.0, 1324.0, 2135.0, 3391.0, 5303.0, 8356.0, 12820.0, 19623.0, 28643.0, 41411.0, 56893.0, 74877.0, 91945.0, 104753.0, 111172.0, 106640.0, 95520.0, 79605.0, 61970.0, 45297.0, 32077.0, 21696.0, 14627.0, 9602.0, 6132.0, 3790.0, 2364.0, 1580.0, 979.0, 593.0, 399.0, 286.0, 143.0, 86.0, 69.0, 29.0, 27.0, 21.0, 11.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.94384765625, -0.9149322509765625, -0.886016845703125, -0.8571014404296875, -0.82818603515625, -0.7992706298828125, -0.770355224609375, -0.7414398193359375, -0.7125244140625, -0.6836090087890625, -0.654693603515625, -0.6257781982421875, -0.59686279296875, -0.5679473876953125, -0.539031982421875, -0.5101165771484375, -0.481201171875, -0.4522857666015625, -0.423370361328125, -0.3944549560546875, -0.36553955078125, -0.3366241455078125, -0.307708740234375, -0.2787933349609375, -0.2498779296875, -0.2209625244140625, -0.192047119140625, -0.1631317138671875, -0.13421630859375, -0.1053009033203125, -0.076385498046875, -0.0474700927734375, -0.0185546875, 0.0103607177734375, 0.039276123046875, 0.0681915283203125, 0.09710693359375, 0.1260223388671875, 0.154937744140625, 0.1838531494140625, 0.2127685546875, 0.2416839599609375, 0.270599365234375, 0.2995147705078125, 0.32843017578125, 0.3573455810546875, 0.386260986328125, 0.4151763916015625, 0.444091796875, 0.4730072021484375, 0.501922607421875, 0.5308380126953125, 0.55975341796875, 0.5886688232421875, 0.617584228515625, 0.6464996337890625, 0.6754150390625, 0.7043304443359375, 0.733245849609375, 0.7621612548828125, 0.79107666015625, 0.8199920654296875, 0.848907470703125, 0.8778228759765625, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 9.0, 16.0, 11.0, 19.0, 17.0, 34.0, 24.0, 28.0, 44.0, 40.0, 36.0, 35.0, 45.0, 46.0, 40.0, 49.0, 59.0, 46.0, 45.0, 35.0, 36.0, 32.0, 34.0, 42.0, 31.0, 20.0, 20.0, 15.0, 20.0, 15.0, 14.0, 6.0, 12.0, 8.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0507049560546875, -1.008636474609375, -0.9665679931640625, -0.92449951171875, -0.8824310302734375, -0.840362548828125, -0.7982940673828125, -0.7562255859375, -0.7141571044921875, -0.672088623046875, -0.6300201416015625, -0.58795166015625, -0.5458831787109375, -0.503814697265625, -0.4617462158203125, -0.419677734375, -0.3776092529296875, -0.335540771484375, -0.2934722900390625, -0.25140380859375, -0.2093353271484375, -0.167266845703125, -0.1251983642578125, -0.0831298828125, -0.0410614013671875, 0.001007080078125, 0.0430755615234375, 0.08514404296875, 0.1272125244140625, 0.169281005859375, 0.2113494873046875, 0.25341796875, 0.2954864501953125, 0.337554931640625, 0.3796234130859375, 0.42169189453125, 0.4637603759765625, 0.505828857421875, 0.5478973388671875, 0.5899658203125, 0.6320343017578125, 0.674102783203125, 0.7161712646484375, 0.75823974609375, 0.8003082275390625, 0.842376708984375, 0.8844451904296875, 0.926513671875, 0.9685821533203125, 1.010650634765625, 1.0527191162109375, 1.09478759765625, 1.1368560791015625, 1.178924560546875, 1.2209930419921875, 1.2630615234375, 1.3051300048828125, 1.347198486328125, 1.3892669677734375, 1.43133544921875, 1.4734039306640625, 1.515472412109375, 1.5575408935546875, 1.599609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 11.0, 20.0, 30.0, 46.0, 59.0, 118.0, 220.0, 298.0, 528.0, 846.0, 1370.0, 2109.0, 3427.0, 5542.0, 8731.0, 13722.0, 20852.0, 31190.0, 44331.0, 61992.0, 80846.0, 97880.0, 110067.0, 113781.0, 106870.0, 93017.0, 74861.0, 56971.0, 40357.0, 27822.0, 18451.0, 12064.0, 7561.0, 4733.0, 2944.0, 1789.0, 1118.0, 739.0, 457.0, 305.0, 193.0, 100.0, 69.0, 30.0, 30.0, 15.0, 14.0, 8.0, 6.0, 3.0, 7.0, 0.0, 0.0, 2.0], "bins": [-0.994140625, -0.9643325805664062, -0.9345245361328125, -0.9047164916992188, -0.874908447265625, -0.8451004028320312, -0.8152923583984375, -0.7854843139648438, -0.75567626953125, -0.7258682250976562, -0.6960601806640625, -0.6662521362304688, -0.636444091796875, -0.6066360473632812, -0.5768280029296875, -0.5470199584960938, -0.5172119140625, -0.48740386962890625, -0.4575958251953125, -0.42778778076171875, -0.397979736328125, -0.36817169189453125, -0.3383636474609375, -0.30855560302734375, -0.27874755859375, -0.24893951416015625, -0.2191314697265625, -0.18932342529296875, -0.159515380859375, -0.12970733642578125, -0.0998992919921875, -0.07009124755859375, -0.040283203125, -0.01047515869140625, 0.0193328857421875, 0.04914093017578125, 0.078948974609375, 0.10875701904296875, 0.1385650634765625, 0.16837310791015625, 0.19818115234375, 0.22798919677734375, 0.2577972412109375, 0.28760528564453125, 0.317413330078125, 0.34722137451171875, 0.3770294189453125, 0.40683746337890625, 0.4366455078125, 0.46645355224609375, 0.4962615966796875, 0.5260696411132812, 0.555877685546875, 0.5856857299804688, 0.6154937744140625, 0.6453018188476562, 0.67510986328125, 0.7049179077148438, 0.7347259521484375, 0.7645339965820312, 0.794342041015625, 0.8241500854492188, 0.8539581298828125, 0.8837661743164062, 0.91357421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 7.0, 15.0, 15.0, 13.0, 21.0, 20.0, 18.0, 36.0, 26.0, 24.0, 36.0, 28.0, 25.0, 32.0, 38.0, 37.0, 47.0, 38.0, 49.0, 39.0, 31.0, 40.0, 36.0, 32.0, 33.0, 33.0, 20.0, 23.0, 31.0, 22.0, 14.0, 22.0, 16.0, 18.0, 8.0, 7.0, 10.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64013671875, -0.6192398071289062, -0.5983428955078125, -0.5774459838867188, -0.556549072265625, -0.5356521606445312, -0.5147552490234375, -0.49385833740234375, -0.47296142578125, -0.45206451416015625, -0.4311676025390625, -0.41027069091796875, -0.389373779296875, -0.36847686767578125, -0.3475799560546875, -0.32668304443359375, -0.3057861328125, -0.28488922119140625, -0.2639923095703125, -0.24309539794921875, -0.222198486328125, -0.20130157470703125, -0.1804046630859375, -0.15950775146484375, -0.13861083984375, -0.11771392822265625, -0.0968170166015625, -0.07592010498046875, -0.055023193359375, -0.03412628173828125, -0.0132293701171875, 0.00766754150390625, 0.028564453125, 0.04946136474609375, 0.0703582763671875, 0.09125518798828125, 0.112152099609375, 0.13304901123046875, 0.1539459228515625, 0.17484283447265625, 0.19573974609375, 0.21663665771484375, 0.2375335693359375, 0.25843048095703125, 0.279327392578125, 0.30022430419921875, 0.3211212158203125, 0.34201812744140625, 0.3629150390625, 0.38381195068359375, 0.4047088623046875, 0.42560577392578125, 0.446502685546875, 0.46739959716796875, 0.4882965087890625, 0.5091934204101562, 0.53009033203125, 0.5509872436523438, 0.5718841552734375, 0.5927810668945312, 0.613677978515625, 0.6345748901367188, 0.6554718017578125, 0.6763687133789062, 0.697265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 1.0, 7.0, 9.0, 13.0, 28.0, 39.0, 57.0, 80.0, 105.0, 176.0, 293.0, 362.0, 572.0, 869.0, 1393.0, 2049.0, 3130.0, 4786.0, 7342.0, 11471.0, 17431.0, 26727.0, 40727.0, 60185.0, 85102.0, 109918.0, 128765.0, 131837.0, 117383.0, 93379.0, 68122.0, 46839.0, 31012.0, 20376.0, 13225.0, 8566.0, 5604.0, 3639.0, 2322.0, 1581.0, 1031.0, 674.0, 448.0, 314.0, 190.0, 130.0, 89.0, 53.0, 45.0, 26.0, 14.0, 9.0, 8.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4667091369628906, -0.45124053955078125, -0.4357719421386719, -0.4203033447265625, -0.4048347473144531, -0.38936614990234375, -0.3738975524902344, -0.358428955078125, -0.3429603576660156, -0.32749176025390625, -0.3120231628417969, -0.2965545654296875, -0.2810859680175781, -0.26561737060546875, -0.2501487731933594, -0.23468017578125, -0.21921157836914062, -0.20374298095703125, -0.18827438354492188, -0.1728057861328125, -0.15733718872070312, -0.14186859130859375, -0.12639999389648438, -0.110931396484375, -0.09546279907226562, -0.07999420166015625, -0.06452560424804688, -0.0490570068359375, -0.033588409423828125, -0.01811981201171875, -0.002651214599609375, 0.0128173828125, 0.028285980224609375, 0.04375457763671875, 0.059223175048828125, 0.0746917724609375, 0.09016036987304688, 0.10562896728515625, 0.12109756469726562, 0.136566162109375, 0.15203475952148438, 0.16750335693359375, 0.18297195434570312, 0.1984405517578125, 0.21390914916992188, 0.22937774658203125, 0.24484634399414062, 0.26031494140625, 0.2757835388183594, 0.29125213623046875, 0.3067207336425781, 0.3221893310546875, 0.3376579284667969, 0.35312652587890625, 0.3685951232910156, 0.384063720703125, 0.3995323181152344, 0.41500091552734375, 0.4304695129394531, 0.4459381103515625, 0.4614067077636719, 0.47687530517578125, 0.4923439025878906, 0.5078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 2.0, 9.0, 12.0, 16.0, 12.0, 15.0, 31.0, 29.0, 23.0, 29.0, 22.0, 39.0, 46.0, 54.0, 41.0, 65.0, 65.0, 37.0, 56.0, 56.0, 42.0, 33.0, 39.0, 30.0, 32.0, 28.0, 24.0, 16.0, 13.0, 20.0, 7.0, 5.0, 7.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.251169204711914e-05, -5.0866976380348206e-05, -4.922226071357727e-05, -4.7577545046806335e-05, -4.59328293800354e-05, -4.4288113713264465e-05, -4.264339804649353e-05, -4.0998682379722595e-05, -3.935396671295166e-05, -3.7709251046180725e-05, -3.606453537940979e-05, -3.4419819712638855e-05, -3.277510404586792e-05, -3.1130388379096985e-05, -2.948567271232605e-05, -2.7840957045555115e-05, -2.619624137878418e-05, -2.4551525712013245e-05, -2.290681004524231e-05, -2.1262094378471375e-05, -1.961737871170044e-05, -1.7972663044929504e-05, -1.632794737815857e-05, -1.4683231711387634e-05, -1.30385160446167e-05, -1.1393800377845764e-05, -9.749084711074829e-06, -8.104369044303894e-06, -6.459653377532959e-06, -4.814937710762024e-06, -3.170222043991089e-06, -1.5255063772201538e-06, 1.1920928955078125e-07, 1.7639249563217163e-06, 3.4086406230926514e-06, 5.0533562898635864e-06, 6.6980719566345215e-06, 8.342787623405457e-06, 9.987503290176392e-06, 1.1632218956947327e-05, 1.3276934623718262e-05, 1.4921650290489197e-05, 1.6566365957260132e-05, 1.8211081624031067e-05, 1.9855797290802002e-05, 2.1500512957572937e-05, 2.3145228624343872e-05, 2.4789944291114807e-05, 2.6434659957885742e-05, 2.8079375624656677e-05, 2.9724091291427612e-05, 3.136880695819855e-05, 3.301352262496948e-05, 3.465823829174042e-05, 3.630295395851135e-05, 3.794766962528229e-05, 3.959238529205322e-05, 4.123710095882416e-05, 4.288181662559509e-05, 4.452653229236603e-05, 4.617124795913696e-05, 4.78159636259079e-05, 4.946067929267883e-05, 5.110539495944977e-05, 5.27501106262207e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 16.0, 39.0, 50.0, 65.0, 134.0, 187.0, 283.0, 476.0, 726.0, 1181.0, 1872.0, 2903.0, 4727.0, 7476.0, 11813.0, 18170.0, 29183.0, 44470.0, 66653.0, 92804.0, 118968.0, 135421.0, 133745.0, 115551.0, 86846.0, 61254.0, 40689.0, 26670.0, 17076.0, 10621.0, 6882.0, 4290.0, 2694.0, 1713.0, 1105.0, 652.0, 429.0, 271.0, 167.0, 97.0, 64.0, 44.0, 27.0, 12.0, 11.0, 7.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.490478515625, -0.4746055603027344, -0.45873260498046875, -0.4428596496582031, -0.4269866943359375, -0.4111137390136719, -0.39524078369140625, -0.3793678283691406, -0.363494873046875, -0.3476219177246094, -0.33174896240234375, -0.3158760070800781, -0.3000030517578125, -0.2841300964355469, -0.26825714111328125, -0.2523841857910156, -0.23651123046875, -0.22063827514648438, -0.20476531982421875, -0.18889236450195312, -0.1730194091796875, -0.15714645385742188, -0.14127349853515625, -0.12540054321289062, -0.109527587890625, -0.09365463256835938, -0.07778167724609375, -0.061908721923828125, -0.0460357666015625, -0.030162811279296875, -0.01428985595703125, 0.001583099365234375, 0.0174560546875, 0.033329010009765625, 0.04920196533203125, 0.06507492065429688, 0.0809478759765625, 0.09682083129882812, 0.11269378662109375, 0.12856674194335938, 0.144439697265625, 0.16031265258789062, 0.17618560791015625, 0.19205856323242188, 0.2079315185546875, 0.22380447387695312, 0.23967742919921875, 0.2555503845214844, 0.27142333984375, 0.2872962951660156, 0.30316925048828125, 0.3190422058105469, 0.3349151611328125, 0.3507881164550781, 0.36666107177734375, 0.3825340270996094, 0.398406982421875, 0.4142799377441406, 0.43015289306640625, 0.4460258483886719, 0.4618988037109375, 0.4777717590332031, 0.49364471435546875, 0.5095176696777344, 0.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 2.0, 14.0, 13.0, 24.0, 11.0, 17.0, 27.0, 24.0, 21.0, 28.0, 42.0, 51.0, 46.0, 50.0, 50.0, 59.0, 42.0, 53.0, 42.0, 57.0, 41.0, 32.0, 41.0, 28.0, 20.0, 30.0, 23.0, 22.0, 15.0, 10.0, 11.0, 11.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16259765625, -0.15713119506835938, -0.15166473388671875, -0.14619827270507812, -0.1407318115234375, -0.13526535034179688, -0.12979888916015625, -0.12433242797851562, -0.118865966796875, -0.11339950561523438, -0.10793304443359375, -0.10246658325195312, -0.0970001220703125, -0.09153366088867188, -0.08606719970703125, -0.08060073852539062, -0.07513427734375, -0.06966781616210938, -0.06420135498046875, -0.058734893798828125, -0.0532684326171875, -0.047801971435546875, -0.04233551025390625, -0.036869049072265625, -0.031402587890625, -0.025936126708984375, -0.02046966552734375, -0.015003204345703125, -0.0095367431640625, -0.004070281982421875, 0.00139617919921875, 0.006862640380859375, 0.0123291015625, 0.017795562744140625, 0.02326202392578125, 0.028728485107421875, 0.0341949462890625, 0.039661407470703125, 0.04512786865234375, 0.050594329833984375, 0.056060791015625, 0.061527252197265625, 0.06699371337890625, 0.07246017456054688, 0.0779266357421875, 0.08339309692382812, 0.08885955810546875, 0.09432601928710938, 0.09979248046875, 0.10525894165039062, 0.11072540283203125, 0.11619186401367188, 0.1216583251953125, 0.12712478637695312, 0.13259124755859375, 0.13805770874023438, 0.143524169921875, 0.14899063110351562, 0.15445709228515625, 0.15992355346679688, 0.1653900146484375, 0.17085647583007812, 0.17632293701171875, 0.18178939819335938, 0.187255859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 16.0, 14.0, 26.0, 29.0, 39.0, 40.0, 32.0, 54.0, 54.0, 50.0, 51.0, 63.0, 69.0, 47.0, 55.0, 34.0, 36.0, 35.0, 30.0, 34.0, 20.0, 19.0, 16.0, 15.0, 16.0, 10.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.7850890159606934, -1.737668514251709, -1.6902481317520142, -1.6428276300430298, -1.5954071283340454, -1.5479867458343506, -1.5005662441253662, -1.4531457424163818, -1.4057252407073975, -1.358304738998413, -1.3108843564987183, -1.2634638547897339, -1.2160433530807495, -1.1686229705810547, -1.1212024688720703, -1.073781967163086, -1.0263615846633911, -0.9789411425590515, -0.9315206408500671, -0.8841001987457275, -0.8366796970367432, -0.7892592549324036, -0.741838812828064, -0.6944183111190796, -0.64699786901474, -0.5995774269104004, -0.552156925201416, -0.5047364830970764, -0.45731601119041443, -0.40989553928375244, -0.36247509717941284, -0.31505462527275085, -0.2676340341567993, -0.22021356225013733, -0.17279310524463654, -0.12537264823913574, -0.07795217633247375, -0.030531704425811768, 0.016888737678527832, 0.06430920958518982, 0.1117296814918518, 0.1591501533985138, 0.2065706104040146, 0.2539910674095154, 0.30141153931617737, 0.34883201122283936, 0.39625245332717896, 0.44367292523384094, 0.49109339714050293, 0.5385138392448425, 0.5859343409538269, 0.6333547830581665, 0.6807752847671509, 0.7281957268714905, 0.7756161689758301, 0.8230366706848145, 0.870457112789154, 0.9178775548934937, 0.965298056602478, 1.0127184391021729, 1.0601389408111572, 1.1075594425201416, 1.154979944229126, 1.2024003267288208, 1.2498208284378052]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 4.0, 13.0, 13.0, 15.0, 23.0, 22.0, 22.0, 45.0, 25.0, 33.0, 36.0, 41.0, 47.0, 27.0, 28.0, 49.0, 44.0, 39.0, 46.0, 38.0, 50.0, 39.0, 27.0, 35.0, 34.0, 28.0, 18.0, 20.0, 23.0, 17.0, 17.0, 21.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1418660879135132, -1.1035720109939575, -1.0652778148651123, -1.0269837379455566, -0.988689661026001, -0.9503955841064453, -0.9121014475822449, -0.8738073110580444, -0.8355132341384888, -0.7972191572189331, -0.7589250206947327, -0.7206308841705322, -0.6823368072509766, -0.6440427303314209, -0.6057485938072205, -0.56745445728302, -0.5291603803634644, -0.4908662736415863, -0.45257216691970825, -0.4142780601978302, -0.37598395347595215, -0.3376898467540741, -0.29939574003219604, -0.261101633310318, -0.22280752658843994, -0.1845134198665619, -0.14621931314468384, -0.10792520642280579, -0.06963109970092773, -0.03133699297904968, 0.006957113742828369, 0.04525122046470642, 0.08354544639587402, 0.12183955311775208, 0.16013365983963013, 0.19842776656150818, 0.23672187328338623, 0.2750159800052643, 0.31331008672714233, 0.3516041934490204, 0.38989830017089844, 0.4281924068927765, 0.46648651361465454, 0.504780650138855, 0.5430747270584106, 0.5813688039779663, 0.6196629405021667, 0.6579570770263672, 0.6962511539459229, 0.7345452308654785, 0.772839367389679, 0.8111335039138794, 0.8494275808334351, 0.8877216577529907, 0.9260157942771912, 0.9643099308013916, 1.0026040077209473, 1.040898084640503, 1.0791921615600586, 1.1174863576889038, 1.1557804346084595, 1.1940745115280151, 1.2323687076568604, 1.270662784576416, 1.3089568614959717]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 12.0, 19.0, 27.0, 56.0, 92.0, 177.0, 259.0, 522.0, 890.0, 1499.0, 2833.0, 5345.0, 9825.0, 18294.0, 34720.0, 65267.0, 122446.0, 224053.0, 385772.0, 589798.0, 738902.0, 710247.0, 533755.0, 335285.0, 191041.0, 104108.0, 55782.0, 29337.0, 15295.0, 8283.0, 4550.0, 2502.0, 1361.0, 812.0, 426.0, 246.0, 168.0, 84.0, 74.0, 40.0, 26.0, 17.0, 20.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.4482421875, -1.405487060546875, -1.36273193359375, -1.319976806640625, -1.2772216796875, -1.234466552734375, -1.19171142578125, -1.148956298828125, -1.106201171875, -1.063446044921875, -1.02069091796875, -0.977935791015625, -0.9351806640625, -0.892425537109375, -0.84967041015625, -0.806915283203125, -0.76416015625, -0.721405029296875, -0.67864990234375, -0.635894775390625, -0.5931396484375, -0.550384521484375, -0.50762939453125, -0.464874267578125, -0.422119140625, -0.379364013671875, -0.33660888671875, -0.293853759765625, -0.2510986328125, -0.208343505859375, -0.16558837890625, -0.122833251953125, -0.080078125, -0.037322998046875, 0.00543212890625, 0.048187255859375, 0.0909423828125, 0.133697509765625, 0.17645263671875, 0.219207763671875, 0.261962890625, 0.304718017578125, 0.34747314453125, 0.390228271484375, 0.4329833984375, 0.475738525390625, 0.51849365234375, 0.561248779296875, 0.60400390625, 0.646759033203125, 0.68951416015625, 0.732269287109375, 0.7750244140625, 0.817779541015625, 0.86053466796875, 0.903289794921875, 0.946044921875, 0.988800048828125, 1.03155517578125, 1.074310302734375, 1.1170654296875, 1.159820556640625, 1.20257568359375, 1.245330810546875, 1.2880859375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 15.0, 17.0, 25.0, 27.0, 21.0, 19.0, 21.0, 32.0, 40.0, 38.0, 42.0, 29.0, 26.0, 51.0, 42.0, 52.0, 33.0, 46.0, 47.0, 39.0, 43.0, 25.0, 31.0, 29.0, 31.0, 20.0, 20.0, 29.0, 21.0, 7.0, 18.0, 10.0, 10.0, 5.0, 1.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.8899612426757812, -0.8619537353515625, -0.8339462280273438, -0.805938720703125, -0.7779312133789062, -0.7499237060546875, -0.7219161987304688, -0.69390869140625, -0.6659011840820312, -0.6378936767578125, -0.6098861694335938, -0.581878662109375, -0.5538711547851562, -0.5258636474609375, -0.49785614013671875, -0.4698486328125, -0.44184112548828125, -0.4138336181640625, -0.38582611083984375, -0.357818603515625, -0.32981109619140625, -0.3018035888671875, -0.27379608154296875, -0.24578857421875, -0.21778106689453125, -0.1897735595703125, -0.16176605224609375, -0.133758544921875, -0.10575103759765625, -0.0777435302734375, -0.04973602294921875, -0.021728515625, 0.00627899169921875, 0.0342864990234375, 0.06229400634765625, 0.090301513671875, 0.11830902099609375, 0.1463165283203125, 0.17432403564453125, 0.20233154296875, 0.23033905029296875, 0.2583465576171875, 0.28635406494140625, 0.314361572265625, 0.34236907958984375, 0.3703765869140625, 0.39838409423828125, 0.4263916015625, 0.45439910888671875, 0.4824066162109375, 0.5104141235351562, 0.538421630859375, 0.5664291381835938, 0.5944366455078125, 0.6224441528320312, 0.65045166015625, 0.6784591674804688, 0.7064666748046875, 0.7344741821289062, 0.762481689453125, 0.7904891967773438, 0.8184967041015625, 0.8465042114257812, 0.87451171875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 4.0, 7.0, 18.0, 25.0, 51.0, 72.0, 67.0, 141.0, 243.0, 335.0, 561.0, 1030.0, 1663.0, 2766.0, 4650.0, 8010.0, 13360.0, 22186.0, 37924.0, 62782.0, 101553.0, 160775.0, 241775.0, 344058.0, 448981.0, 525655.0, 539371.0, 487189.0, 392118.0, 285105.0, 193315.0, 124145.0, 77481.0, 47066.0, 28337.0, 16965.0, 9878.0, 5880.0, 3423.0, 2081.0, 1253.0, 748.0, 466.0, 281.0, 191.0, 98.0, 94.0, 32.0, 29.0, 17.0, 9.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0810546875, -1.0475006103515625, -1.013946533203125, -0.9803924560546875, -0.94683837890625, -0.9132843017578125, -0.879730224609375, -0.8461761474609375, -0.8126220703125, -0.7790679931640625, -0.745513916015625, -0.7119598388671875, -0.67840576171875, -0.6448516845703125, -0.611297607421875, -0.5777435302734375, -0.544189453125, -0.5106353759765625, -0.477081298828125, -0.4435272216796875, -0.40997314453125, -0.3764190673828125, -0.342864990234375, -0.3093109130859375, -0.2757568359375, -0.2422027587890625, -0.208648681640625, -0.1750946044921875, -0.14154052734375, -0.1079864501953125, -0.074432373046875, -0.0408782958984375, -0.00732421875, 0.0262298583984375, 0.059783935546875, 0.0933380126953125, 0.12689208984375, 0.1604461669921875, 0.194000244140625, 0.2275543212890625, 0.2611083984375, 0.2946624755859375, 0.328216552734375, 0.3617706298828125, 0.39532470703125, 0.4288787841796875, 0.462432861328125, 0.4959869384765625, 0.529541015625, 0.5630950927734375, 0.596649169921875, 0.6302032470703125, 0.66375732421875, 0.6973114013671875, 0.730865478515625, 0.7644195556640625, 0.7979736328125, 0.8315277099609375, 0.865081787109375, 0.8986358642578125, 0.93218994140625, 0.9657440185546875, 0.999298095703125, 1.0328521728515625, 1.06640625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 24.0, 41.0, 53.0, 59.0, 85.0, 88.0, 123.0, 118.0, 134.0, 151.0, 188.0, 166.0, 209.0, 222.0, 229.0, 237.0, 239.0, 211.0, 209.0, 209.0, 158.0, 149.0, 123.0, 124.0, 94.0, 85.0, 55.0, 47.0, 40.0, 32.0, 26.0, 10.0, 19.0, 13.0, 7.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42724609375, -0.4130363464355469, -0.39882659912109375, -0.3846168518066406, -0.3704071044921875, -0.3561973571777344, -0.34198760986328125, -0.3277778625488281, -0.313568115234375, -0.2993583679199219, -0.28514862060546875, -0.2709388732910156, -0.2567291259765625, -0.24251937866210938, -0.22830963134765625, -0.21409988403320312, -0.19989013671875, -0.18568038940429688, -0.17147064208984375, -0.15726089477539062, -0.1430511474609375, -0.12884140014648438, -0.11463165283203125, -0.10042190551757812, -0.086212158203125, -0.07200241088867188, -0.05779266357421875, -0.043582916259765625, -0.0293731689453125, -0.015163421630859375, -0.00095367431640625, 0.013256072998046875, 0.0274658203125, 0.041675567626953125, 0.05588531494140625, 0.07009506225585938, 0.0843048095703125, 0.09851455688476562, 0.11272430419921875, 0.12693405151367188, 0.141143798828125, 0.15535354614257812, 0.16956329345703125, 0.18377304077148438, 0.1979827880859375, 0.21219253540039062, 0.22640228271484375, 0.24061203002929688, 0.25482177734375, 0.2690315246582031, 0.28324127197265625, 0.2974510192871094, 0.3116607666015625, 0.3258705139160156, 0.34008026123046875, 0.3542900085449219, 0.368499755859375, 0.3827095031738281, 0.39691925048828125, 0.4111289978027344, 0.4253387451171875, 0.4395484924316406, 0.45375823974609375, 0.4679679870605469, 0.482177734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 11.0, 9.0, 14.0, 20.0, 25.0, 24.0, 28.0, 39.0, 43.0, 30.0, 36.0, 57.0, 52.0, 59.0, 59.0, 58.0, 53.0, 52.0, 48.0, 29.0, 37.0, 35.0, 20.0, 32.0, 22.0, 15.0, 15.0, 14.0, 7.0, 9.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.469054102897644, -1.4224615097045898, -1.3758689165115356, -1.3292763233184814, -1.2826837301254272, -1.236091136932373, -1.1894984245300293, -1.1429059505462646, -1.096313238143921, -1.0497206449508667, -1.0031280517578125, -0.9565354585647583, -0.9099428653717041, -0.8633502721786499, -0.8167576193809509, -0.7701650261878967, -0.7235724925994873, -0.6769798994064331, -0.6303873062133789, -0.5837947130203247, -0.5372021198272705, -0.4906094968318939, -0.44401687383651733, -0.39742428064346313, -0.35083168745040894, -0.30423909425735474, -0.25764650106430054, -0.21105387806892395, -0.16446128487586975, -0.11786869168281555, -0.07127606868743896, -0.024683475494384766, 0.021908998489379883, 0.06850159913301468, 0.11509419977664948, 0.16168680787086487, 0.20827940106391907, 0.25487199425697327, 0.30146461725234985, 0.34805721044540405, 0.39464980363845825, 0.44124239683151245, 0.48783499002456665, 0.5344276428222656, 0.5810202360153198, 0.627612829208374, 0.6742054224014282, 0.7207980155944824, 0.7673906087875366, 0.8139832019805908, 0.860575795173645, 0.9071683883666992, 0.9537609815597534, 1.0003535747528076, 1.0469462871551514, 1.093538761138916, 1.1401314735412598, 1.186724066734314, 1.2333166599273682, 1.2799092531204224, 1.3265018463134766, 1.3730944395065308, 1.419687032699585, 1.4662797451019287, 1.5128722190856934]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 3.0, 4.0, 7.0, 10.0, 17.0, 10.0, 19.0, 20.0, 32.0, 23.0, 33.0, 33.0, 26.0, 35.0, 41.0, 45.0, 48.0, 43.0, 38.0, 35.0, 42.0, 29.0, 45.0, 32.0, 40.0, 36.0, 29.0, 24.0, 29.0, 20.0, 24.0, 19.0, 24.0, 12.0, 9.0, 11.0, 8.0, 13.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.993068277835846, -0.9603825807571411, -0.927696943283081, -0.8950112462043762, -0.8623255491256714, -0.8296399116516113, -0.7969542145729065, -0.7642685174942017, -0.7315828800201416, -0.6988971829414368, -0.6662115454673767, -0.6335258483886719, -0.6008402109146118, -0.568154513835907, -0.5354688167572021, -0.5027831792831421, -0.47009748220443726, -0.4374118149280548, -0.40472614765167236, -0.37204045057296753, -0.3393547832965851, -0.30666911602020264, -0.2739834189414978, -0.24129775166511536, -0.2086120843887329, -0.17592641711235046, -0.14324073493480682, -0.11055506020784378, -0.07786938548088074, -0.04518371820449829, -0.012498036026954651, 0.02018764615058899, 0.05287337303161621, 0.08555904775857925, 0.1182447224855423, 0.15093040466308594, 0.18361607193946838, 0.21630173921585083, 0.24898742139339447, 0.2816731035709381, 0.31435877084732056, 0.347044438123703, 0.37973010540008545, 0.4124158024787903, 0.44510146975517273, 0.4777871370315552, 0.51047283411026, 0.5431585311889648, 0.5758441686630249, 0.6085298657417297, 0.6412155032157898, 0.6739012002944946, 0.7065868377685547, 0.7392725348472595, 0.7719582319259644, 0.8046438694000244, 0.8373295664787292, 0.8700152635574341, 0.9027009010314941, 0.935386598110199, 0.9680722951889038, 1.0007579326629639, 1.033443570137024, 1.0661293268203735, 1.0988149642944336]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 8.0, 12.0, 21.0, 21.0, 49.0, 48.0, 90.0, 155.0, 191.0, 355.0, 591.0, 955.0, 1472.0, 2410.0, 4068.0, 6547.0, 10696.0, 17770.0, 29482.0, 48878.0, 79344.0, 122158.0, 168576.0, 177988.0, 138252.0, 91985.0, 57556.0, 34994.0, 21108.0, 12825.0, 7760.0, 4588.0, 2954.0, 1733.0, 1023.0, 651.0, 440.0, 287.0, 167.0, 119.0, 69.0, 50.0, 25.0, 24.0, 16.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.315673828125, -0.3061561584472656, -0.29663848876953125, -0.2871208190917969, -0.2776031494140625, -0.2680854797363281, -0.25856781005859375, -0.24905014038085938, -0.239532470703125, -0.23001480102539062, -0.22049713134765625, -0.21097946166992188, -0.2014617919921875, -0.19194412231445312, -0.18242645263671875, -0.17290878295898438, -0.16339111328125, -0.15387344360351562, -0.14435577392578125, -0.13483810424804688, -0.1253204345703125, -0.11580276489257812, -0.10628509521484375, -0.09676742553710938, -0.087249755859375, -0.07773208618164062, -0.06821441650390625, -0.058696746826171875, -0.0491790771484375, -0.039661407470703125, -0.03014373779296875, -0.020626068115234375, -0.0111083984375, -0.001590728759765625, 0.00792694091796875, 0.017444610595703125, 0.0269622802734375, 0.036479949951171875, 0.04599761962890625, 0.055515289306640625, 0.065032958984375, 0.07455062866210938, 0.08406829833984375, 0.09358596801757812, 0.1031036376953125, 0.11262130737304688, 0.12213897705078125, 0.13165664672851562, 0.14117431640625, 0.15069198608398438, 0.16020965576171875, 0.16972732543945312, 0.1792449951171875, 0.18876266479492188, 0.19828033447265625, 0.20779800415039062, 0.217315673828125, 0.22683334350585938, 0.23635101318359375, 0.24586868286132812, 0.2553863525390625, 0.2649040222167969, 0.27442169189453125, 0.2839393615722656, 0.29345703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 11.0, 23.0, 14.0, 18.0, 18.0, 30.0, 24.0, 38.0, 27.0, 50.0, 61.0, 48.0, 46.0, 41.0, 48.0, 55.0, 45.0, 42.0, 39.0, 41.0, 37.0, 36.0, 32.0, 21.0, 23.0, 19.0, 19.0, 11.0, 11.0, 15.0, 5.0, 8.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.23504638671875, -1.1947021484375, -1.15435791015625, -1.114013671875, -1.07366943359375, -1.0333251953125, -0.99298095703125, -0.95263671875, -0.91229248046875, -0.8719482421875, -0.83160400390625, -0.791259765625, -0.75091552734375, -0.7105712890625, -0.67022705078125, -0.6298828125, -0.58953857421875, -0.5491943359375, -0.50885009765625, -0.468505859375, -0.42816162109375, -0.3878173828125, -0.34747314453125, -0.30712890625, -0.26678466796875, -0.2264404296875, -0.18609619140625, -0.145751953125, -0.10540771484375, -0.0650634765625, -0.02471923828125, 0.015625, 0.05596923828125, 0.0963134765625, 0.13665771484375, 0.177001953125, 0.21734619140625, 0.2576904296875, 0.29803466796875, 0.33837890625, 0.37872314453125, 0.4190673828125, 0.45941162109375, 0.499755859375, 0.54010009765625, 0.5804443359375, 0.62078857421875, 0.6611328125, 0.70147705078125, 0.7418212890625, 0.78216552734375, 0.822509765625, 0.86285400390625, 0.9031982421875, 0.94354248046875, 0.98388671875, 1.02423095703125, 1.0645751953125, 1.10491943359375, 1.145263671875, 1.18560791015625, 1.2259521484375, 1.26629638671875, 1.306640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 6.0, 6.0, 20.0, 21.0, 41.0, 53.0, 90.0, 135.0, 224.0, 344.0, 597.0, 1046.0, 1847.0, 3292.0, 6116.0, 11655.0, 22439.0, 44921.0, 88282.0, 165038.0, 245352.0, 209021.0, 120249.0, 62166.0, 31260.0, 15929.0, 8079.0, 4618.0, 2368.0, 1313.0, 770.0, 460.0, 283.0, 157.0, 109.0, 81.0, 48.0, 30.0, 17.0, 10.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.4267578125, -0.4141082763671875, -0.401458740234375, -0.3888092041015625, -0.37615966796875, -0.3635101318359375, -0.350860595703125, -0.3382110595703125, -0.3255615234375, -0.3129119873046875, -0.300262451171875, -0.2876129150390625, -0.27496337890625, -0.2623138427734375, -0.249664306640625, -0.2370147705078125, -0.224365234375, -0.2117156982421875, -0.199066162109375, -0.1864166259765625, -0.17376708984375, -0.1611175537109375, -0.148468017578125, -0.1358184814453125, -0.1231689453125, -0.1105194091796875, -0.097869873046875, -0.0852203369140625, -0.07257080078125, -0.0599212646484375, -0.047271728515625, -0.0346221923828125, -0.02197265625, -0.0093231201171875, 0.003326416015625, 0.0159759521484375, 0.02862548828125, 0.0412750244140625, 0.053924560546875, 0.0665740966796875, 0.0792236328125, 0.0918731689453125, 0.104522705078125, 0.1171722412109375, 0.12982177734375, 0.1424713134765625, 0.155120849609375, 0.1677703857421875, 0.180419921875, 0.1930694580078125, 0.205718994140625, 0.2183685302734375, 0.23101806640625, 0.2436676025390625, 0.256317138671875, 0.2689666748046875, 0.2816162109375, 0.2942657470703125, 0.306915283203125, 0.3195648193359375, 0.33221435546875, 0.3448638916015625, 0.357513427734375, 0.3701629638671875, 0.3828125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 11.0, 10.0, 10.0, 14.0, 23.0, 16.0, 19.0, 23.0, 21.0, 26.0, 28.0, 26.0, 37.0, 38.0, 40.0, 47.0, 38.0, 41.0, 49.0, 32.0, 43.0, 33.0, 35.0, 32.0, 42.0, 35.0, 23.0, 25.0, 19.0, 16.0, 30.0, 10.0, 18.0, 12.0, 14.0, 7.0, 5.0, 5.0, 3.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6044921875, -0.5842742919921875, -0.564056396484375, -0.5438385009765625, -0.52362060546875, -0.5034027099609375, -0.483184814453125, -0.4629669189453125, -0.4427490234375, -0.4225311279296875, -0.402313232421875, -0.3820953369140625, -0.36187744140625, -0.3416595458984375, -0.321441650390625, -0.3012237548828125, -0.281005859375, -0.2607879638671875, -0.240570068359375, -0.2203521728515625, -0.20013427734375, -0.1799163818359375, -0.159698486328125, -0.1394805908203125, -0.1192626953125, -0.0990447998046875, -0.078826904296875, -0.0586090087890625, -0.03839111328125, -0.0181732177734375, 0.002044677734375, 0.0222625732421875, 0.04248046875, 0.0626983642578125, 0.082916259765625, 0.1031341552734375, 0.12335205078125, 0.1435699462890625, 0.163787841796875, 0.1840057373046875, 0.2042236328125, 0.2244415283203125, 0.244659423828125, 0.2648773193359375, 0.28509521484375, 0.3053131103515625, 0.325531005859375, 0.3457489013671875, 0.365966796875, 0.3861846923828125, 0.406402587890625, 0.4266204833984375, 0.44683837890625, 0.4670562744140625, 0.487274169921875, 0.5074920654296875, 0.5277099609375, 0.5479278564453125, 0.568145751953125, 0.5883636474609375, 0.60858154296875, 0.6287994384765625, 0.649017333984375, 0.6692352294921875, 0.689453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 19.0, 18.0, 40.0, 40.0, 82.0, 99.0, 191.0, 249.0, 411.0, 609.0, 887.0, 1549.0, 2450.0, 4303.0, 7593.0, 15093.0, 32191.0, 78715.0, 214299.0, 377292.0, 185032.0, 67972.0, 28689.0, 13487.0, 7011.0, 3928.0, 2280.0, 1451.0, 886.0, 561.0, 391.0, 219.0, 154.0, 104.0, 63.0, 66.0, 41.0, 14.0, 18.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.19189453125, -0.18615341186523438, -0.18041229248046875, -0.17467117309570312, -0.1689300537109375, -0.16318893432617188, -0.15744781494140625, -0.15170669555664062, -0.145965576171875, -0.14022445678710938, -0.13448333740234375, -0.12874221801757812, -0.1230010986328125, -0.11725997924804688, -0.11151885986328125, -0.10577774047851562, -0.10003662109375, -0.09429550170898438, -0.08855438232421875, -0.08281326293945312, -0.0770721435546875, -0.07133102416992188, -0.06558990478515625, -0.059848785400390625, -0.054107666015625, -0.048366546630859375, -0.04262542724609375, -0.036884307861328125, -0.0311431884765625, -0.025402069091796875, -0.01966094970703125, -0.013919830322265625, -0.0081787109375, -0.002437591552734375, 0.00330352783203125, 0.009044647216796875, 0.0147857666015625, 0.020526885986328125, 0.02626800537109375, 0.032009124755859375, 0.037750244140625, 0.043491363525390625, 0.04923248291015625, 0.054973602294921875, 0.0607147216796875, 0.06645584106445312, 0.07219696044921875, 0.07793807983398438, 0.08367919921875, 0.08942031860351562, 0.09516143798828125, 0.10090255737304688, 0.1066436767578125, 0.11238479614257812, 0.11812591552734375, 0.12386703491210938, 0.129608154296875, 0.13534927368164062, 0.14109039306640625, 0.14683151245117188, 0.1525726318359375, 0.15831375122070312, 0.16405487060546875, 0.16979598999023438, 0.175537109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 6.0, 3.0, 14.0, 12.0, 21.0, 24.0, 33.0, 28.0, 30.0, 38.0, 42.0, 46.0, 45.0, 51.0, 39.0, 55.0, 46.0, 45.0, 64.0, 40.0, 55.0, 32.0, 24.0, 25.0, 22.0, 18.0, 19.0, 23.0, 17.0, 13.0, 12.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -8.977949619293213e-06, -8.657574653625488e-06, -8.337199687957764e-06, -8.016824722290039e-06, -7.696449756622314e-06, -7.37607479095459e-06, -7.055699825286865e-06, -6.735324859619141e-06, -6.414949893951416e-06, -6.094574928283691e-06, -5.774199962615967e-06, -5.453824996948242e-06, -5.133450031280518e-06, -4.813075065612793e-06, -4.492700099945068e-06, -4.172325134277344e-06, -3.851950168609619e-06, -3.5315752029418945e-06, -3.21120023727417e-06, -2.8908252716064453e-06, -2.5704503059387207e-06, -2.250075340270996e-06, -1.9297003746032715e-06, -1.6093254089355469e-06, -1.2889504432678223e-06, -9.685754776000977e-07, -6.48200511932373e-07, -3.2782554626464844e-07, -7.450580596923828e-09, 3.129243850708008e-07, 6.332993507385254e-07, 9.5367431640625e-07, 1.2740492820739746e-06, 1.5944242477416992e-06, 1.914799213409424e-06, 2.2351741790771484e-06, 2.555549144744873e-06, 2.8759241104125977e-06, 3.1962990760803223e-06, 3.516674041748047e-06, 3.8370490074157715e-06, 4.157423973083496e-06, 4.477798938751221e-06, 4.798173904418945e-06, 5.11854887008667e-06, 5.4389238357543945e-06, 5.759298801422119e-06, 6.079673767089844e-06, 6.400048732757568e-06, 6.720423698425293e-06, 7.040798664093018e-06, 7.361173629760742e-06, 7.681548595428467e-06, 8.001923561096191e-06, 8.322298526763916e-06, 8.64267349243164e-06, 8.963048458099365e-06, 9.28342342376709e-06, 9.603798389434814e-06, 9.924173355102539e-06, 1.0244548320770264e-05, 1.0564923286437988e-05, 1.0885298252105713e-05, 1.1205673217773438e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 10.0, 15.0, 33.0, 26.0, 45.0, 79.0, 95.0, 147.0, 187.0, 331.0, 554.0, 788.0, 1247.0, 2113.0, 3588.0, 6208.0, 10415.0, 18253.0, 31186.0, 56630.0, 100991.0, 169169.0, 219709.0, 177462.0, 108321.0, 60437.0, 34049.0, 19150.0, 11045.0, 6387.0, 3707.0, 2269.0, 1410.0, 887.0, 534.0, 371.0, 254.0, 142.0, 105.0, 65.0, 45.0, 22.0, 23.0, 24.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12136077880859375, -0.1171112060546875, -0.11286163330078125, -0.108612060546875, -0.10436248779296875, -0.1001129150390625, -0.09586334228515625, -0.09161376953125, -0.08736419677734375, -0.0831146240234375, -0.07886505126953125, -0.074615478515625, -0.07036590576171875, -0.0661163330078125, -0.06186676025390625, -0.0576171875, -0.05336761474609375, -0.0491180419921875, -0.04486846923828125, -0.040618896484375, -0.03636932373046875, -0.0321197509765625, -0.02787017822265625, -0.02362060546875, -0.01937103271484375, -0.0151214599609375, -0.01087188720703125, -0.006622314453125, -0.00237274169921875, 0.0018768310546875, 0.00612640380859375, 0.0103759765625, 0.01462554931640625, 0.0188751220703125, 0.02312469482421875, 0.027374267578125, 0.03162384033203125, 0.0358734130859375, 0.04012298583984375, 0.04437255859375, 0.04862213134765625, 0.0528717041015625, 0.05712127685546875, 0.061370849609375, 0.06562042236328125, 0.0698699951171875, 0.07411956787109375, 0.078369140625, 0.08261871337890625, 0.0868682861328125, 0.09111785888671875, 0.095367431640625, 0.09961700439453125, 0.1038665771484375, 0.10811614990234375, 0.11236572265625, 0.11661529541015625, 0.1208648681640625, 0.12511444091796875, 0.129364013671875, 0.13361358642578125, 0.1378631591796875, 0.14211273193359375, 0.1463623046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 6.0, 13.0, 4.0, 16.0, 12.0, 15.0, 17.0, 14.0, 14.0, 24.0, 30.0, 33.0, 31.0, 36.0, 45.0, 53.0, 70.0, 78.0, 55.0, 48.0, 44.0, 42.0, 44.0, 35.0, 35.0, 30.0, 31.0, 8.0, 21.0, 16.0, 11.0, 11.0, 5.0, 6.0, 2.0, 8.0, 5.0, 5.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0284576416015625, -0.027442216873168945, -0.02642679214477539, -0.025411367416381836, -0.02439594268798828, -0.023380517959594727, -0.022365093231201172, -0.021349668502807617, -0.020334243774414062, -0.019318819046020508, -0.018303394317626953, -0.0172879695892334, -0.016272544860839844, -0.015257120132446289, -0.014241695404052734, -0.01322627067565918, -0.012210845947265625, -0.01119542121887207, -0.010179996490478516, -0.009164571762084961, -0.008149147033691406, -0.0071337223052978516, -0.006118297576904297, -0.005102872848510742, -0.0040874481201171875, -0.003072023391723633, -0.002056598663330078, -0.0010411739349365234, -2.574920654296875e-05, 0.000989675521850586, 0.0020051002502441406, 0.0030205249786376953, 0.00403594970703125, 0.005051374435424805, 0.006066799163818359, 0.007082223892211914, 0.008097648620605469, 0.009113073348999023, 0.010128498077392578, 0.011143922805786133, 0.012159347534179688, 0.013174772262573242, 0.014190196990966797, 0.015205621719360352, 0.016221046447753906, 0.01723647117614746, 0.018251895904541016, 0.01926732063293457, 0.020282745361328125, 0.02129817008972168, 0.022313594818115234, 0.02332901954650879, 0.024344444274902344, 0.0253598690032959, 0.026375293731689453, 0.027390718460083008, 0.028406143188476562, 0.029421567916870117, 0.030436992645263672, 0.03145241737365723, 0.03246784210205078, 0.033483266830444336, 0.03449869155883789, 0.035514116287231445, 0.036529541015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 15.0, 8.0, 9.0, 23.0, 11.0, 28.0, 19.0, 31.0, 46.0, 32.0, 34.0, 35.0, 60.0, 57.0, 57.0, 56.0, 55.0, 57.0, 46.0, 49.0, 28.0, 33.0, 34.0, 23.0, 26.0, 28.0, 16.0, 17.0, 11.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.437822937965393, -1.3920657634735107, -1.3463085889816284, -1.300551414489746, -1.2547943592071533, -1.209037184715271, -1.1632800102233887, -1.1175228357315063, -1.071765661239624, -1.0260084867477417, -0.9802513718605042, -0.9344941973686218, -0.8887370824813843, -0.842979907989502, -0.7972227334976196, -0.7514655590057373, -0.7057085037231445, -0.6599513292312622, -0.6141942143440247, -0.5684370398521423, -0.5226799249649048, -0.47692275047302246, -0.43116557598114014, -0.3854084312915802, -0.33965128660202026, -0.2938941419124603, -0.2481369823217392, -0.20237982273101807, -0.15662267804145813, -0.1108655333518982, -0.06510835886001587, -0.019351214170455933, 0.026405811309814453, 0.07216296344995499, 0.11792011559009552, 0.16367727518081665, 0.2094344198703766, 0.2551915645599365, 0.30094873905181885, 0.3467058837413788, 0.3924630284309387, 0.43822017312049866, 0.4839773178100586, 0.5297344923019409, 0.5754916667938232, 0.6212487816810608, 0.6670059561729431, 0.7127630710601807, 0.758520245552063, 0.8042774200439453, 0.8500345349311829, 0.8957917094230652, 0.9415488243103027, 0.9873059988021851, 1.0330631732940674, 1.0788203477859497, 1.124577522277832, 1.1703346967697144, 1.2160918712615967, 1.2618489265441895, 1.3076061010360718, 1.353363275527954, 1.3991204500198364, 1.4448776245117188, 1.4906346797943115]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 1.0, 5.0, 3.0, 8.0, 13.0, 13.0, 14.0, 16.0, 22.0, 29.0, 23.0, 38.0, 32.0, 24.0, 34.0, 47.0, 47.0, 46.0, 38.0, 39.0, 40.0, 38.0, 26.0, 45.0, 36.0, 36.0, 41.0, 28.0, 27.0, 22.0, 21.0, 28.0, 21.0, 19.0, 9.0, 13.0, 12.0, 5.0, 12.0, 11.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9932097792625427, -0.960573136806488, -0.9279365539550781, -0.8952999114990234, -0.8626633286476135, -0.8300266861915588, -0.7973901033401489, -0.7647534608840942, -0.7321168184280396, -0.6994801759719849, -0.666843593120575, -0.6342069506645203, -0.6015703678131104, -0.5689337253570557, -0.536297082901001, -0.5036605000495911, -0.47102391719818115, -0.43838730454444885, -0.40575069189071655, -0.37311404943466187, -0.34047746658325195, -0.30784082412719727, -0.27520421147346497, -0.24256759881973267, -0.20993098616600037, -0.17729437351226807, -0.14465776085853577, -0.11202113330364227, -0.07938452064990997, -0.04674790799617767, -0.01411128044128418, 0.01852533221244812, 0.051161885261535645, 0.08379849791526794, 0.11643511801958084, 0.14907173812389374, 0.18170835077762604, 0.21434496343135834, 0.24698159098625183, 0.27961820363998413, 0.31225481629371643, 0.34489142894744873, 0.37752804160118103, 0.41016465425491333, 0.442801296710968, 0.47543787956237793, 0.5080745220184326, 0.5407111644744873, 0.5733477473258972, 0.6059843897819519, 0.6386209726333618, 0.6712576150894165, 0.7038941979408264, 0.7365308403968811, 0.769167423248291, 0.8018040657043457, 0.8344407081604004, 0.8670773506164551, 0.899713933467865, 0.9323505759239197, 0.9649871587753296, 0.9976238012313843, 1.030260443687439, 1.062896966934204, 1.0955336093902588]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 15.0, 25.0, 37.0, 39.0, 78.0, 130.0, 287.0, 484.0, 746.0, 1330.0, 2261.0, 3887.0, 6577.0, 11004.0, 18470.0, 30062.0, 46316.0, 69047.0, 95066.0, 118543.0, 132622.0, 130941.0, 114651.0, 89790.0, 64373.0, 42822.0, 27180.0, 17338.0, 9994.0, 6031.0, 3485.0, 2028.0, 1248.0, 667.0, 382.0, 222.0, 145.0, 84.0, 57.0, 37.0, 17.0, 11.0, 9.0, 4.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0747604370117188, -1.0420989990234375, -1.0094375610351562, -0.976776123046875, -0.9441146850585938, -0.9114532470703125, -0.8787918090820312, -0.84613037109375, -0.8134689331054688, -0.7808074951171875, -0.7481460571289062, -0.715484619140625, -0.6828231811523438, -0.6501617431640625, -0.6175003051757812, -0.5848388671875, -0.5521774291992188, -0.5195159912109375, -0.48685455322265625, -0.454193115234375, -0.42153167724609375, -0.3888702392578125, -0.35620880126953125, -0.32354736328125, -0.29088592529296875, -0.2582244873046875, -0.22556304931640625, -0.192901611328125, -0.16024017333984375, -0.1275787353515625, -0.09491729736328125, -0.062255859375, -0.02959442138671875, 0.0030670166015625, 0.03572845458984375, 0.068389892578125, 0.10105133056640625, 0.1337127685546875, 0.16637420654296875, 0.19903564453125, 0.23169708251953125, 0.2643585205078125, 0.29701995849609375, 0.329681396484375, 0.36234283447265625, 0.3950042724609375, 0.42766571044921875, 0.4603271484375, 0.49298858642578125, 0.5256500244140625, 0.5583114624023438, 0.590972900390625, 0.6236343383789062, 0.6562957763671875, 0.6889572143554688, 0.72161865234375, 0.7542800903320312, 0.7869415283203125, 0.8196029663085938, 0.852264404296875, 0.8849258422851562, 0.9175872802734375, 0.9502487182617188, 0.98291015625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 7.0, 11.0, 12.0, 12.0, 32.0, 19.0, 39.0, 37.0, 38.0, 31.0, 39.0, 42.0, 59.0, 56.0, 54.0, 39.0, 58.0, 41.0, 41.0, 33.0, 47.0, 28.0, 29.0, 27.0, 28.0, 25.0, 15.0, 17.0, 14.0, 19.0, 6.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.11480712890625, -1.0753173828125, -1.03582763671875, -0.996337890625, -0.95684814453125, -0.9173583984375, -0.87786865234375, -0.83837890625, -0.79888916015625, -0.7593994140625, -0.71990966796875, -0.680419921875, -0.64093017578125, -0.6014404296875, -0.56195068359375, -0.5224609375, -0.48297119140625, -0.4434814453125, -0.40399169921875, -0.364501953125, -0.32501220703125, -0.2855224609375, -0.24603271484375, -0.20654296875, -0.16705322265625, -0.1275634765625, -0.08807373046875, -0.048583984375, -0.00909423828125, 0.0303955078125, 0.06988525390625, 0.109375, 0.14886474609375, 0.1883544921875, 0.22784423828125, 0.267333984375, 0.30682373046875, 0.3463134765625, 0.38580322265625, 0.42529296875, 0.46478271484375, 0.5042724609375, 0.54376220703125, 0.583251953125, 0.62274169921875, 0.6622314453125, 0.70172119140625, 0.7412109375, 0.78070068359375, 0.8201904296875, 0.85968017578125, 0.899169921875, 0.93865966796875, 0.9781494140625, 1.01763916015625, 1.05712890625, 1.09661865234375, 1.1361083984375, 1.17559814453125, 1.215087890625, 1.25457763671875, 1.2940673828125, 1.33355712890625, 1.373046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 15.0, 15.0, 25.0, 46.0, 61.0, 101.0, 151.0, 245.0, 404.0, 648.0, 984.0, 1589.0, 2513.0, 3897.0, 6072.0, 9312.0, 14391.0, 21976.0, 31910.0, 45404.0, 61562.0, 79713.0, 96118.0, 107680.0, 111343.0, 105211.0, 91511.0, 74286.0, 56345.0, 41036.0, 28749.0, 19406.0, 12786.0, 8361.0, 5350.0, 3397.0, 2147.0, 1382.0, 871.0, 543.0, 364.0, 248.0, 153.0, 76.0, 62.0, 38.0, 17.0, 13.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.847564697265625, -0.81964111328125, -0.791717529296875, -0.7637939453125, -0.735870361328125, -0.70794677734375, -0.680023193359375, -0.652099609375, -0.624176025390625, -0.59625244140625, -0.568328857421875, -0.5404052734375, -0.512481689453125, -0.48455810546875, -0.456634521484375, -0.4287109375, -0.400787353515625, -0.37286376953125, -0.344940185546875, -0.3170166015625, -0.289093017578125, -0.26116943359375, -0.233245849609375, -0.205322265625, -0.177398681640625, -0.14947509765625, -0.121551513671875, -0.0936279296875, -0.065704345703125, -0.03778076171875, -0.009857177734375, 0.01806640625, 0.045989990234375, 0.07391357421875, 0.101837158203125, 0.1297607421875, 0.157684326171875, 0.18560791015625, 0.213531494140625, 0.241455078125, 0.269378662109375, 0.29730224609375, 0.325225830078125, 0.3531494140625, 0.381072998046875, 0.40899658203125, 0.436920166015625, 0.46484375, 0.492767333984375, 0.52069091796875, 0.548614501953125, 0.5765380859375, 0.604461669921875, 0.63238525390625, 0.660308837890625, 0.688232421875, 0.716156005859375, 0.74407958984375, 0.772003173828125, 0.7999267578125, 0.827850341796875, 0.85577392578125, 0.883697509765625, 0.91162109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 12.0, 16.0, 20.0, 13.0, 32.0, 40.0, 31.0, 24.0, 45.0, 52.0, 52.0, 51.0, 56.0, 42.0, 44.0, 47.0, 48.0, 56.0, 41.0, 33.0, 50.0, 33.0, 26.0, 29.0, 24.0, 13.0, 11.0, 11.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6833038330078125, -0.657623291015625, -0.6319427490234375, -0.60626220703125, -0.5805816650390625, -0.554901123046875, -0.5292205810546875, -0.5035400390625, -0.4778594970703125, -0.452178955078125, -0.4264984130859375, -0.40081787109375, -0.3751373291015625, -0.349456787109375, -0.3237762451171875, -0.298095703125, -0.2724151611328125, -0.246734619140625, -0.2210540771484375, -0.19537353515625, -0.1696929931640625, -0.144012451171875, -0.1183319091796875, -0.0926513671875, -0.0669708251953125, -0.041290283203125, -0.0156097412109375, 0.01007080078125, 0.0357513427734375, 0.061431884765625, 0.0871124267578125, 0.11279296875, 0.1384735107421875, 0.164154052734375, 0.1898345947265625, 0.21551513671875, 0.2411956787109375, 0.266876220703125, 0.2925567626953125, 0.3182373046875, 0.3439178466796875, 0.369598388671875, 0.3952789306640625, 0.42095947265625, 0.4466400146484375, 0.472320556640625, 0.4980010986328125, 0.523681640625, 0.5493621826171875, 0.575042724609375, 0.6007232666015625, 0.62640380859375, 0.6520843505859375, 0.677764892578125, 0.7034454345703125, 0.7291259765625, 0.7548065185546875, 0.780487060546875, 0.8061676025390625, 0.83184814453125, 0.8575286865234375, 0.883209228515625, 0.9088897705078125, 0.9345703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 9.0, 4.0, 9.0, 19.0, 29.0, 30.0, 37.0, 56.0, 82.0, 124.0, 215.0, 246.0, 403.0, 587.0, 869.0, 1309.0, 1976.0, 3057.0, 4616.0, 7145.0, 11384.0, 17593.0, 27230.0, 42210.0, 62524.0, 88929.0, 116502.0, 134577.0, 136402.0, 116924.0, 89630.0, 63299.0, 42319.0, 27685.0, 17843.0, 11367.0, 7256.0, 4924.0, 3130.0, 1965.0, 1289.0, 882.0, 565.0, 374.0, 276.0, 205.0, 132.0, 97.0, 66.0, 48.0, 39.0, 23.0, 21.0, 8.0, 11.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.46142578125, -0.44605255126953125, -0.4306793212890625, -0.41530609130859375, -0.399932861328125, -0.38455963134765625, -0.3691864013671875, -0.35381317138671875, -0.33843994140625, -0.32306671142578125, -0.3076934814453125, -0.29232025146484375, -0.276947021484375, -0.26157379150390625, -0.2462005615234375, -0.23082733154296875, -0.2154541015625, -0.20008087158203125, -0.1847076416015625, -0.16933441162109375, -0.153961181640625, -0.13858795166015625, -0.1232147216796875, -0.10784149169921875, -0.09246826171875, -0.07709503173828125, -0.0617218017578125, -0.04634857177734375, -0.030975341796875, -0.01560211181640625, -0.0002288818359375, 0.01514434814453125, 0.030517578125, 0.04589080810546875, 0.0612640380859375, 0.07663726806640625, 0.092010498046875, 0.10738372802734375, 0.1227569580078125, 0.13813018798828125, 0.15350341796875, 0.16887664794921875, 0.1842498779296875, 0.19962310791015625, 0.214996337890625, 0.23036956787109375, 0.2457427978515625, 0.26111602783203125, 0.2764892578125, 0.29186248779296875, 0.3072357177734375, 0.32260894775390625, 0.337982177734375, 0.35335540771484375, 0.3687286376953125, 0.38410186767578125, 0.39947509765625, 0.41484832763671875, 0.4302215576171875, 0.44559478759765625, 0.460968017578125, 0.47634124755859375, 0.4917144775390625, 0.5070877075195312, 0.5224609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 9.0, 16.0, 22.0, 25.0, 28.0, 40.0, 35.0, 52.0, 48.0, 61.0, 59.0, 68.0, 65.0, 69.0, 50.0, 56.0, 50.0, 29.0, 46.0, 27.0, 16.0, 21.0, 16.0, 16.0, 13.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.340576171875e-05, -5.150400102138519e-05, -4.9602240324020386e-05, -4.770047962665558e-05, -4.579871892929077e-05, -4.3896958231925964e-05, -4.199519753456116e-05, -4.009343683719635e-05, -3.819167613983154e-05, -3.6289915442466736e-05, -3.438815474510193e-05, -3.248639404773712e-05, -3.0584633350372314e-05, -2.8682872653007507e-05, -2.67811119556427e-05, -2.4879351258277893e-05, -2.2977590560913086e-05, -2.107582986354828e-05, -1.917406916618347e-05, -1.7272308468818665e-05, -1.5370547771453857e-05, -1.346878707408905e-05, -1.1567026376724243e-05, -9.665265679359436e-06, -7.763504981994629e-06, -5.861744284629822e-06, -3.959983587265015e-06, -2.0582228899002075e-06, -1.564621925354004e-07, 1.7452985048294067e-06, 3.647059202194214e-06, 5.548819899559021e-06, 7.450580596923828e-06, 9.352341294288635e-06, 1.1254101991653442e-05, 1.315586268901825e-05, 1.5057623386383057e-05, 1.6959384083747864e-05, 1.886114478111267e-05, 2.0762905478477478e-05, 2.2664666175842285e-05, 2.4566426873207092e-05, 2.64681875705719e-05, 2.8369948267936707e-05, 3.0271708965301514e-05, 3.217346966266632e-05, 3.407523036003113e-05, 3.5976991057395935e-05, 3.787875175476074e-05, 3.978051245212555e-05, 4.1682273149490356e-05, 4.3584033846855164e-05, 4.548579454421997e-05, 4.738755524158478e-05, 4.9289315938949585e-05, 5.119107663631439e-05, 5.30928373336792e-05, 5.4994598031044006e-05, 5.6896358728408813e-05, 5.879811942577362e-05, 6.069988012313843e-05, 6.260164082050323e-05, 6.450340151786804e-05, 6.640516221523285e-05, 6.830692291259766e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 12.0, 8.0, 18.0, 28.0, 35.0, 41.0, 74.0, 106.0, 182.0, 280.0, 517.0, 771.0, 1402.0, 2447.0, 4601.0, 8304.0, 15893.0, 30309.0, 56366.0, 98206.0, 150535.0, 190416.0, 179239.0, 131875.0, 80131.0, 45044.0, 24030.0, 12518.0, 6665.0, 3629.0, 2037.0, 1047.0, 704.0, 403.0, 240.0, 147.0, 87.0, 85.0, 35.0, 31.0, 17.0, 20.0, 6.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5986328125, -0.5778579711914062, -0.5570831298828125, -0.5363082885742188, -0.515533447265625, -0.49475860595703125, -0.4739837646484375, -0.45320892333984375, -0.43243408203125, -0.41165924072265625, -0.3908843994140625, -0.37010955810546875, -0.349334716796875, -0.32855987548828125, -0.3077850341796875, -0.28701019287109375, -0.2662353515625, -0.24546051025390625, -0.2246856689453125, -0.20391082763671875, -0.183135986328125, -0.16236114501953125, -0.1415863037109375, -0.12081146240234375, -0.10003662109375, -0.07926177978515625, -0.0584869384765625, -0.03771209716796875, -0.016937255859375, 0.00383758544921875, 0.0246124267578125, 0.04538726806640625, 0.066162109375, 0.08693695068359375, 0.1077117919921875, 0.12848663330078125, 0.149261474609375, 0.17003631591796875, 0.1908111572265625, 0.21158599853515625, 0.23236083984375, 0.25313568115234375, 0.2739105224609375, 0.29468536376953125, 0.315460205078125, 0.33623504638671875, 0.3570098876953125, 0.37778472900390625, 0.3985595703125, 0.41933441162109375, 0.4401092529296875, 0.46088409423828125, 0.481658935546875, 0.5024337768554688, 0.5232086181640625, 0.5439834594726562, 0.56475830078125, 0.5855331420898438, 0.6063079833984375, 0.6270828247070312, 0.647857666015625, 0.6686325073242188, 0.6894073486328125, 0.7101821899414062, 0.73095703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 15.0, 8.0, 13.0, 12.0, 20.0, 18.0, 25.0, 31.0, 37.0, 31.0, 28.0, 35.0, 34.0, 39.0, 44.0, 48.0, 59.0, 45.0, 46.0, 36.0, 47.0, 43.0, 39.0, 35.0, 25.0, 24.0, 28.0, 15.0, 16.0, 15.0, 14.0, 7.0, 13.0, 11.0, 8.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.154296875, -0.14919281005859375, -0.1440887451171875, -0.13898468017578125, -0.133880615234375, -0.12877655029296875, -0.1236724853515625, -0.11856842041015625, -0.11346435546875, -0.10836029052734375, -0.1032562255859375, -0.09815216064453125, -0.093048095703125, -0.08794403076171875, -0.0828399658203125, -0.07773590087890625, -0.0726318359375, -0.06752777099609375, -0.0624237060546875, -0.05731964111328125, -0.052215576171875, -0.04711151123046875, -0.0420074462890625, -0.03690338134765625, -0.03179931640625, -0.02669525146484375, -0.0215911865234375, -0.01648712158203125, -0.011383056640625, -0.00627899169921875, -0.0011749267578125, 0.00392913818359375, 0.009033203125, 0.01413726806640625, 0.0192413330078125, 0.02434539794921875, 0.029449462890625, 0.03455352783203125, 0.0396575927734375, 0.04476165771484375, 0.04986572265625, 0.05496978759765625, 0.0600738525390625, 0.06517791748046875, 0.070281982421875, 0.07538604736328125, 0.0804901123046875, 0.08559417724609375, 0.0906982421875, 0.09580230712890625, 0.1009063720703125, 0.10601043701171875, 0.111114501953125, 0.11621856689453125, 0.1213226318359375, 0.12642669677734375, 0.13153076171875, 0.13663482666015625, 0.1417388916015625, 0.14684295654296875, 0.151947021484375, 0.15705108642578125, 0.1621551513671875, 0.16725921630859375, 0.17236328125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 16.0, 6.0, 15.0, 20.0, 18.0, 33.0, 39.0, 30.0, 43.0, 39.0, 54.0, 55.0, 60.0, 48.0, 60.0, 65.0, 46.0, 48.0, 45.0, 50.0, 34.0, 18.0, 22.0, 22.0, 19.0, 14.0, 14.0, 21.0, 7.0, 4.0, 6.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.6769119501113892, -1.6277453899383545, -1.5785787105560303, -1.5294121503829956, -1.4802454710006714, -1.4310789108276367, -1.3819122314453125, -1.3327456712722778, -1.2835791110992432, -1.2344125509262085, -1.1852458715438843, -1.1360793113708496, -1.0869126319885254, -1.0377460718154907, -0.9885794520378113, -0.9394128322601318, -0.8902461528778076, -0.8410795331001282, -0.7919129133224487, -0.7427463531494141, -0.6935796737670898, -0.6444131135940552, -0.5952464938163757, -0.5460798740386963, -0.49691325426101685, -0.4477466344833374, -0.39858001470565796, -0.3494134247303009, -0.30024680495262146, -0.251080185174942, -0.20191359519958496, -0.15274697542190552, -0.10358047485351562, -0.05441386252641678, -0.005247250199317932, 0.04391935467720032, 0.09308597445487976, 0.1422525942325592, 0.19141918420791626, 0.2405858039855957, 0.28975242376327515, 0.3389190435409546, 0.38808566331863403, 0.4372522532939911, 0.48641887307167053, 0.5355855226516724, 0.584752082824707, 0.6339187026023865, 0.6830853223800659, 0.7322519421577454, 0.7814185619354248, 0.8305851221084595, 0.8797518014907837, 0.9289183616638184, 0.9780849814414978, 1.0272516012191772, 1.076418161392212, 1.1255847215652466, 1.1747514009475708, 1.2239179611206055, 1.2730846405029297, 1.3222512006759644, 1.371417760848999, 1.4205844402313232, 1.4697511196136475]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 14.0, 9.0, 22.0, 16.0, 26.0, 21.0, 23.0, 30.0, 30.0, 41.0, 38.0, 37.0, 39.0, 51.0, 48.0, 35.0, 56.0, 37.0, 38.0, 33.0, 31.0, 28.0, 35.0, 27.0, 34.0, 31.0, 28.0, 27.0, 19.0, 11.0, 7.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.144634485244751, -1.109297513961792, -1.073960542678833, -1.0386236906051636, -1.0032867193222046, -0.9679497480392456, -0.9326127767562866, -0.8972758054733276, -0.8619388937950134, -0.8266019225120544, -0.7912650108337402, -0.7559280395507812, -0.7205910682678223, -0.6852541565895081, -0.6499171853065491, -0.6145802736282349, -0.5792433023452759, -0.5439063310623169, -0.5085694193840027, -0.4732324481010437, -0.4378955066204071, -0.4025585651397705, -0.3672215938568115, -0.3318846523761749, -0.29654771089553833, -0.26121076941490173, -0.22587381303310394, -0.19053685665130615, -0.15519991517066956, -0.11986297369003296, -0.08452601730823517, -0.04918906092643738, -0.013852119445800781, 0.021484829485416412, 0.056821778416633606, 0.0921587273478508, 0.127495676279068, 0.1628326177597046, 0.19816957414150238, 0.23350653052330017, 0.26884347200393677, 0.30418041348457336, 0.33951735496520996, 0.37485432624816895, 0.41019126772880554, 0.44552820920944214, 0.4808651804924011, 0.5162020921707153, 0.5515390634536743, 0.5868760347366333, 0.6222129464149475, 0.6575499176979065, 0.6928868293762207, 0.7282238006591797, 0.7635607719421387, 0.7988977432250977, 0.8342346549034119, 0.8695716261863708, 0.9049085378646851, 0.940245509147644, 0.975582480430603, 1.0109193325042725, 1.0462563037872314, 1.0815932750701904, 1.1169302463531494]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 13.0, 11.0, 15.0, 41.0, 46.0, 109.0, 174.0, 333.0, 568.0, 1207.0, 2272.0, 4708.0, 9716.0, 20627.0, 44025.0, 95672.0, 203285.0, 409970.0, 706146.0, 909909.0, 798348.0, 501046.0, 258374.0, 121932.0, 55986.0, 25905.0, 12256.0, 5804.0, 2836.0, 1409.0, 723.0, 384.0, 184.0, 94.0, 64.0, 39.0, 19.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.755859375, -1.7052001953125, -1.654541015625, -1.6038818359375, -1.55322265625, -1.5025634765625, -1.451904296875, -1.4012451171875, -1.3505859375, -1.2999267578125, -1.249267578125, -1.1986083984375, -1.14794921875, -1.0972900390625, -1.046630859375, -0.9959716796875, -0.9453125, -0.8946533203125, -0.843994140625, -0.7933349609375, -0.74267578125, -0.6920166015625, -0.641357421875, -0.5906982421875, -0.5400390625, -0.4893798828125, -0.438720703125, -0.3880615234375, -0.33740234375, -0.2867431640625, -0.236083984375, -0.1854248046875, -0.134765625, -0.0841064453125, -0.033447265625, 0.0172119140625, 0.06787109375, 0.1185302734375, 0.169189453125, 0.2198486328125, 0.2705078125, 0.3211669921875, 0.371826171875, 0.4224853515625, 0.47314453125, 0.5238037109375, 0.574462890625, 0.6251220703125, 0.67578125, 0.7264404296875, 0.777099609375, 0.8277587890625, 0.87841796875, 0.9290771484375, 0.979736328125, 1.0303955078125, 1.0810546875, 1.1317138671875, 1.182373046875, 1.2330322265625, 1.28369140625, 1.3343505859375, 1.385009765625, 1.4356689453125, 1.486328125]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 13.0, 9.0, 12.0, 10.0, 19.0, 31.0, 30.0, 29.0, 26.0, 49.0, 33.0, 41.0, 45.0, 49.0, 38.0, 35.0, 40.0, 45.0, 37.0, 43.0, 29.0, 45.0, 33.0, 27.0, 30.0, 25.0, 16.0, 29.0, 25.0, 18.0, 17.0, 10.0, 7.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.787078857421875, -0.76019287109375, -0.733306884765625, -0.7064208984375, -0.679534912109375, -0.65264892578125, -0.625762939453125, -0.598876953125, -0.571990966796875, -0.54510498046875, -0.518218994140625, -0.4913330078125, -0.464447021484375, -0.43756103515625, -0.410675048828125, -0.3837890625, -0.356903076171875, -0.33001708984375, -0.303131103515625, -0.2762451171875, -0.249359130859375, -0.22247314453125, -0.195587158203125, -0.168701171875, -0.141815185546875, -0.11492919921875, -0.088043212890625, -0.0611572265625, -0.034271240234375, -0.00738525390625, 0.019500732421875, 0.04638671875, 0.073272705078125, 0.10015869140625, 0.127044677734375, 0.1539306640625, 0.180816650390625, 0.20770263671875, 0.234588623046875, 0.261474609375, 0.288360595703125, 0.31524658203125, 0.342132568359375, 0.3690185546875, 0.395904541015625, 0.42279052734375, 0.449676513671875, 0.4765625, 0.503448486328125, 0.53033447265625, 0.557220458984375, 0.5841064453125, 0.610992431640625, 0.63787841796875, 0.664764404296875, 0.691650390625, 0.718536376953125, 0.74542236328125, 0.772308349609375, 0.7991943359375, 0.826080322265625, 0.85296630859375, 0.879852294921875, 0.90673828125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 13.0, 15.0, 24.0, 32.0, 52.0, 98.0, 134.0, 218.0, 400.0, 645.0, 1104.0, 1712.0, 2976.0, 4915.0, 8323.0, 14300.0, 23989.0, 40635.0, 68420.0, 112730.0, 179049.0, 273481.0, 385726.0, 496175.0, 562167.0, 549921.0, 468452.0, 354587.0, 243655.0, 158411.0, 97473.0, 59054.0, 34842.0, 20728.0, 12034.0, 7288.0, 4193.0, 2548.0, 1474.0, 897.0, 544.0, 323.0, 208.0, 126.0, 71.0, 49.0, 17.0, 19.0, 16.0, 3.0, 3.0, 2.0, 5.0], "bins": [-1.2412109375, -1.2065963745117188, -1.1719818115234375, -1.1373672485351562, -1.102752685546875, -1.0681381225585938, -1.0335235595703125, -0.9989089965820312, -0.96429443359375, -0.9296798706054688, -0.8950653076171875, -0.8604507446289062, -0.825836181640625, -0.7912216186523438, -0.7566070556640625, -0.7219924926757812, -0.6873779296875, -0.6527633666992188, -0.6181488037109375, -0.5835342407226562, -0.548919677734375, -0.5143051147460938, -0.4796905517578125, -0.44507598876953125, -0.41046142578125, -0.37584686279296875, -0.3412322998046875, -0.30661773681640625, -0.272003173828125, -0.23738861083984375, -0.2027740478515625, -0.16815948486328125, -0.133544921875, -0.09893035888671875, -0.0643157958984375, -0.02970123291015625, 0.004913330078125, 0.03952789306640625, 0.0741424560546875, 0.10875701904296875, 0.14337158203125, 0.17798614501953125, 0.2126007080078125, 0.24721527099609375, 0.281829833984375, 0.31644439697265625, 0.3510589599609375, 0.38567352294921875, 0.4202880859375, 0.45490264892578125, 0.4895172119140625, 0.5241317749023438, 0.558746337890625, 0.5933609008789062, 0.6279754638671875, 0.6625900268554688, 0.69720458984375, 0.7318191528320312, 0.7664337158203125, 0.8010482788085938, 0.835662841796875, 0.8702774047851562, 0.9048919677734375, 0.9395065307617188, 0.97412109375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 13.0, 10.0, 15.0, 11.0, 25.0, 26.0, 24.0, 32.0, 44.0, 62.0, 72.0, 77.0, 112.0, 123.0, 109.0, 142.0, 148.0, 164.0, 194.0, 216.0, 214.0, 193.0, 221.0, 194.0, 202.0, 178.0, 155.0, 176.0, 144.0, 127.0, 103.0, 82.0, 92.0, 73.0, 59.0, 41.0, 50.0, 29.0, 26.0, 17.0, 14.0, 13.0, 8.0, 10.0, 3.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 2.0], "bins": [-0.425048828125, -0.4124870300292969, -0.39992523193359375, -0.3873634338378906, -0.3748016357421875, -0.3622398376464844, -0.34967803955078125, -0.3371162414550781, -0.324554443359375, -0.3119926452636719, -0.29943084716796875, -0.2868690490722656, -0.2743072509765625, -0.2617454528808594, -0.24918365478515625, -0.23662185668945312, -0.22406005859375, -0.21149826049804688, -0.19893646240234375, -0.18637466430664062, -0.1738128662109375, -0.16125106811523438, -0.14868927001953125, -0.13612747192382812, -0.123565673828125, -0.11100387573242188, -0.09844207763671875, -0.08588027954101562, -0.0733184814453125, -0.060756683349609375, -0.04819488525390625, -0.035633087158203125, -0.0230712890625, -0.010509490966796875, 0.00205230712890625, 0.014614105224609375, 0.0271759033203125, 0.039737701416015625, 0.05229949951171875, 0.06486129760742188, 0.077423095703125, 0.08998489379882812, 0.10254669189453125, 0.11510848999023438, 0.1276702880859375, 0.14023208618164062, 0.15279388427734375, 0.16535568237304688, 0.17791748046875, 0.19047927856445312, 0.20304107666015625, 0.21560287475585938, 0.2281646728515625, 0.24072647094726562, 0.25328826904296875, 0.2658500671386719, 0.278411865234375, 0.2909736633300781, 0.30353546142578125, 0.3160972595214844, 0.3286590576171875, 0.3412208557128906, 0.35378265380859375, 0.3663444519042969, 0.37890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 14.0, 20.0, 21.0, 23.0, 32.0, 42.0, 41.0, 47.0, 55.0, 63.0, 73.0, 64.0, 59.0, 70.0, 55.0, 55.0, 47.0, 50.0, 23.0, 22.0, 22.0, 17.0, 15.0, 12.0, 9.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7150763273239136, -1.6594101190567017, -1.6037440299987793, -1.5480778217315674, -1.4924116134643555, -1.4367454051971436, -1.3810791969299316, -1.3254131078720093, -1.2697468996047974, -1.2140806913375854, -1.158414602279663, -1.1027483940124512, -1.0470821857452393, -0.9914159774780273, -0.9357498288154602, -0.8800836801528931, -0.8244174718856812, -0.7687512636184692, -0.7130851149559021, -0.657418966293335, -0.601752758026123, -0.5460865497589111, -0.490420401096344, -0.43475422263145447, -0.37908804416656494, -0.3234218657016754, -0.2677556872367859, -0.21208950877189636, -0.15642333030700684, -0.10075715184211731, -0.04509097337722778, 0.010575205087661743, 0.06624150276184082, 0.12190768122673035, 0.17757385969161987, 0.2332400381565094, 0.2889062166213989, 0.34457239508628845, 0.400238573551178, 0.4559047520160675, 0.511570930480957, 0.567237138748169, 0.6229032874107361, 0.6785694360733032, 0.7342356443405151, 0.789901852607727, 0.8455680012702942, 0.9012341499328613, 0.9569003582000732, 1.0125665664672852, 1.068232774734497, 1.1238988637924194, 1.1795650720596313, 1.2352312803268433, 1.2908973693847656, 1.3465635776519775, 1.4022297859191895, 1.4578959941864014, 1.5135622024536133, 1.5692282915115356, 1.6248944997787476, 1.6805607080459595, 1.7362267971038818, 1.7918930053710938, 1.8475592136383057]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 12.0, 9.0, 17.0, 12.0, 14.0, 25.0, 23.0, 24.0, 23.0, 38.0, 36.0, 38.0, 33.0, 33.0, 38.0, 52.0, 30.0, 51.0, 30.0, 50.0, 43.0, 42.0, 31.0, 35.0, 34.0, 33.0, 28.0, 11.0, 27.0, 16.0, 11.0, 14.0, 10.0, 5.0, 9.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0477453470230103, -1.0165857076644897, -0.9854260087013245, -0.9542663097381592, -0.9231066703796387, -0.8919470310211182, -0.8607873320579529, -0.8296276330947876, -0.7984679937362671, -0.7673083543777466, -0.7361486554145813, -0.704988956451416, -0.6738293170928955, -0.642669677734375, -0.6115099787712097, -0.5803502798080444, -0.5491906404495239, -0.5180310010910034, -0.48687130212783813, -0.45571163296699524, -0.42455196380615234, -0.39339229464530945, -0.36223262548446655, -0.33107295632362366, -0.29991328716278076, -0.26875361800193787, -0.23759394884109497, -0.20643427968025208, -0.17527461051940918, -0.14411494135856628, -0.11295527219772339, -0.0817956030368805, -0.0506359338760376, -0.019476264715194702, 0.011683404445648193, 0.04284307360649109, 0.07400274276733398, 0.10516241192817688, 0.13632208108901978, 0.16748175024986267, 0.19864141941070557, 0.22980108857154846, 0.26096075773239136, 0.29212042689323425, 0.32328009605407715, 0.35443976521492004, 0.38559943437576294, 0.41675910353660583, 0.44791877269744873, 0.4790784418582916, 0.5102381110191345, 0.5413978099822998, 0.5725574493408203, 0.6037170886993408, 0.6348767876625061, 0.6660364866256714, 0.6971961259841919, 0.7283557653427124, 0.7595154643058777, 0.790675163269043, 0.8218348026275635, 0.852994441986084, 0.8841541409492493, 0.9153138399124146, 0.9464734792709351]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 7.0, 8.0, 17.0, 33.0, 33.0, 74.0, 89.0, 155.0, 243.0, 405.0, 644.0, 1115.0, 1781.0, 2826.0, 4627.0, 7473.0, 12351.0, 20138.0, 33082.0, 53694.0, 83657.0, 124547.0, 163936.0, 168373.0, 130924.0, 89435.0, 57114.0, 35471.0, 22043.0, 13466.0, 8199.0, 4824.0, 2978.0, 1825.0, 1112.0, 689.0, 447.0, 265.0, 164.0, 106.0, 72.0, 49.0, 38.0, 14.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21484375, -0.20660400390625, -0.1983642578125, -0.19012451171875, -0.181884765625, -0.17364501953125, -0.1654052734375, -0.15716552734375, -0.14892578125, -0.14068603515625, -0.1324462890625, -0.12420654296875, -0.115966796875, -0.10772705078125, -0.0994873046875, -0.09124755859375, -0.0830078125, -0.07476806640625, -0.0665283203125, -0.05828857421875, -0.050048828125, -0.04180908203125, -0.0335693359375, -0.02532958984375, -0.01708984375, -0.00885009765625, -0.0006103515625, 0.00762939453125, 0.015869140625, 0.02410888671875, 0.0323486328125, 0.04058837890625, 0.048828125, 0.05706787109375, 0.0653076171875, 0.07354736328125, 0.081787109375, 0.09002685546875, 0.0982666015625, 0.10650634765625, 0.11474609375, 0.12298583984375, 0.1312255859375, 0.13946533203125, 0.147705078125, 0.15594482421875, 0.1641845703125, 0.17242431640625, 0.1806640625, 0.18890380859375, 0.1971435546875, 0.20538330078125, 0.213623046875, 0.22186279296875, 0.2301025390625, 0.23834228515625, 0.24658203125, 0.25482177734375, 0.2630615234375, 0.27130126953125, 0.279541015625, 0.28778076171875, 0.2960205078125, 0.30426025390625, 0.3125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 5.0, 7.0, 16.0, 18.0, 14.0, 16.0, 22.0, 27.0, 31.0, 33.0, 41.0, 35.0, 36.0, 30.0, 44.0, 47.0, 42.0, 51.0, 44.0, 45.0, 31.0, 40.0, 37.0, 31.0, 27.0, 35.0, 14.0, 32.0, 27.0, 26.0, 8.0, 12.0, 15.0, 8.0, 5.0, 6.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.09375, -1.0586395263671875, -1.023529052734375, -0.9884185791015625, -0.95330810546875, -0.9181976318359375, -0.883087158203125, -0.8479766845703125, -0.8128662109375, -0.7777557373046875, -0.742645263671875, -0.7075347900390625, -0.67242431640625, -0.6373138427734375, -0.602203369140625, -0.5670928955078125, -0.531982421875, -0.4968719482421875, -0.461761474609375, -0.4266510009765625, -0.39154052734375, -0.3564300537109375, -0.321319580078125, -0.2862091064453125, -0.2510986328125, -0.2159881591796875, -0.180877685546875, -0.1457672119140625, -0.11065673828125, -0.0755462646484375, -0.040435791015625, -0.0053253173828125, 0.02978515625, 0.0648956298828125, 0.100006103515625, 0.1351165771484375, 0.17022705078125, 0.2053375244140625, 0.240447998046875, 0.2755584716796875, 0.3106689453125, 0.3457794189453125, 0.380889892578125, 0.4160003662109375, 0.45111083984375, 0.4862213134765625, 0.521331787109375, 0.5564422607421875, 0.591552734375, 0.6266632080078125, 0.661773681640625, 0.6968841552734375, 0.73199462890625, 0.7671051025390625, 0.802215576171875, 0.8373260498046875, 0.8724365234375, 0.9075469970703125, 0.942657470703125, 0.9777679443359375, 1.01287841796875, 1.0479888916015625, 1.083099365234375, 1.1182098388671875, 1.1533203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 16.0, 21.0, 26.0, 44.0, 65.0, 100.0, 151.0, 321.0, 527.0, 1001.0, 1953.0, 3783.0, 7899.0, 16429.0, 34407.0, 72623.0, 143544.0, 232116.0, 237087.0, 149841.0, 76474.0, 36324.0, 17294.0, 8163.0, 4082.0, 1903.0, 1014.0, 571.0, 291.0, 193.0, 83.0, 63.0, 48.0, 22.0, 25.0, 14.0, 8.0, 7.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.437255859375, -0.424407958984375, -0.41156005859375, -0.398712158203125, -0.3858642578125, -0.373016357421875, -0.36016845703125, -0.347320556640625, -0.33447265625, -0.321624755859375, -0.30877685546875, -0.295928955078125, -0.2830810546875, -0.270233154296875, -0.25738525390625, -0.244537353515625, -0.231689453125, -0.218841552734375, -0.20599365234375, -0.193145751953125, -0.1802978515625, -0.167449951171875, -0.15460205078125, -0.141754150390625, -0.12890625, -0.116058349609375, -0.10321044921875, -0.090362548828125, -0.0775146484375, -0.064666748046875, -0.05181884765625, -0.038970947265625, -0.026123046875, -0.013275146484375, -0.00042724609375, 0.012420654296875, 0.0252685546875, 0.038116455078125, 0.05096435546875, 0.063812255859375, 0.07666015625, 0.089508056640625, 0.10235595703125, 0.115203857421875, 0.1280517578125, 0.140899658203125, 0.15374755859375, 0.166595458984375, 0.179443359375, 0.192291259765625, 0.20513916015625, 0.217987060546875, 0.2308349609375, 0.243682861328125, 0.25653076171875, 0.269378662109375, 0.2822265625, 0.295074462890625, 0.30792236328125, 0.320770263671875, 0.3336181640625, 0.346466064453125, 0.35931396484375, 0.372161865234375, 0.385009765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 10.0, 22.0, 23.0, 25.0, 25.0, 32.0, 25.0, 40.0, 36.0, 36.0, 37.0, 44.0, 35.0, 36.0, 34.0, 47.0, 40.0, 39.0, 47.0, 42.0, 43.0, 25.0, 43.0, 29.0, 27.0, 31.0, 15.0, 14.0, 13.0, 12.0, 8.0, 8.0, 6.0, 4.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.748046875, -0.7252426147460938, -0.7024383544921875, -0.6796340942382812, -0.656829833984375, -0.6340255737304688, -0.6112213134765625, -0.5884170532226562, -0.56561279296875, -0.5428085327148438, -0.5200042724609375, -0.49720001220703125, -0.474395751953125, -0.45159149169921875, -0.4287872314453125, -0.40598297119140625, -0.3831787109375, -0.36037445068359375, -0.3375701904296875, -0.31476593017578125, -0.291961669921875, -0.26915740966796875, -0.2463531494140625, -0.22354888916015625, -0.20074462890625, -0.17794036865234375, -0.1551361083984375, -0.13233184814453125, -0.109527587890625, -0.08672332763671875, -0.0639190673828125, -0.04111480712890625, -0.018310546875, 0.00449371337890625, 0.0272979736328125, 0.05010223388671875, 0.072906494140625, 0.09571075439453125, 0.1185150146484375, 0.14131927490234375, 0.16412353515625, 0.18692779541015625, 0.2097320556640625, 0.23253631591796875, 0.255340576171875, 0.27814483642578125, 0.3009490966796875, 0.32375335693359375, 0.3465576171875, 0.36936187744140625, 0.3921661376953125, 0.41497039794921875, 0.437774658203125, 0.46057891845703125, 0.4833831787109375, 0.5061874389648438, 0.52899169921875, 0.5517959594726562, 0.5746002197265625, 0.5974044799804688, 0.620208740234375, 0.6430130004882812, 0.6658172607421875, 0.6886215209960938, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 7.0, 15.0, 20.0, 30.0, 33.0, 39.0, 80.0, 106.0, 159.0, 253.0, 363.0, 540.0, 882.0, 1338.0, 2145.0, 3523.0, 5848.0, 10449.0, 19765.0, 42676.0, 104117.0, 275394.0, 334154.0, 138400.0, 53669.0, 24343.0, 12486.0, 6746.0, 4049.0, 2498.0, 1514.0, 985.0, 650.0, 397.0, 284.0, 186.0, 112.0, 71.0, 69.0, 46.0, 28.0, 23.0, 22.0, 12.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1417236328125, -0.13717269897460938, -0.13262176513671875, -0.12807083129882812, -0.1235198974609375, -0.11896896362304688, -0.11441802978515625, -0.10986709594726562, -0.105316162109375, -0.10076522827148438, -0.09621429443359375, -0.09166336059570312, -0.0871124267578125, -0.08256149291992188, -0.07801055908203125, -0.07345962524414062, -0.06890869140625, -0.06435775756835938, -0.05980682373046875, -0.055255889892578125, -0.0507049560546875, -0.046154022216796875, -0.04160308837890625, -0.037052154541015625, -0.032501220703125, -0.027950286865234375, -0.02339935302734375, -0.018848419189453125, -0.0142974853515625, -0.009746551513671875, -0.00519561767578125, -0.000644683837890625, 0.00390625, 0.008457183837890625, 0.01300811767578125, 0.017559051513671875, 0.0221099853515625, 0.026660919189453125, 0.03121185302734375, 0.035762786865234375, 0.040313720703125, 0.044864654541015625, 0.04941558837890625, 0.053966522216796875, 0.0585174560546875, 0.06306838989257812, 0.06761932373046875, 0.07217025756835938, 0.07672119140625, 0.08127212524414062, 0.08582305908203125, 0.09037399291992188, 0.0949249267578125, 0.09947586059570312, 0.10402679443359375, 0.10857772827148438, 0.113128662109375, 0.11767959594726562, 0.12223052978515625, 0.12678146362304688, 0.1313323974609375, 0.13588333129882812, 0.14043426513671875, 0.14498519897460938, 0.1495361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 12.0, 15.0, 12.0, 30.0, 30.0, 31.0, 34.0, 43.0, 42.0, 46.0, 42.0, 64.0, 59.0, 59.0, 50.0, 56.0, 43.0, 51.0, 38.0, 39.0, 29.0, 30.0, 27.0, 21.0, 10.0, 9.0, 11.0, 10.0, 7.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0132789611816406e-05, -9.812414646148682e-06, -9.492039680480957e-06, -9.171664714813232e-06, -8.851289749145508e-06, -8.530914783477783e-06, -8.210539817810059e-06, -7.890164852142334e-06, -7.569789886474609e-06, -7.249414920806885e-06, -6.92903995513916e-06, -6.6086649894714355e-06, -6.288290023803711e-06, -5.967915058135986e-06, -5.647540092468262e-06, -5.327165126800537e-06, -5.0067901611328125e-06, -4.686415195465088e-06, -4.366040229797363e-06, -4.045665264129639e-06, -3.725290298461914e-06, -3.4049153327941895e-06, -3.084540367126465e-06, -2.7641654014587402e-06, -2.4437904357910156e-06, -2.123415470123291e-06, -1.8030405044555664e-06, -1.4826655387878418e-06, -1.1622905731201172e-06, -8.419156074523926e-07, -5.21540641784668e-07, -2.0116567611694336e-07, 1.1920928955078125e-07, 4.3958425521850586e-07, 7.599592208862305e-07, 1.080334186553955e-06, 1.4007091522216797e-06, 1.7210841178894043e-06, 2.041459083557129e-06, 2.3618340492248535e-06, 2.682209014892578e-06, 3.0025839805603027e-06, 3.3229589462280273e-06, 3.643333911895752e-06, 3.9637088775634766e-06, 4.284083843231201e-06, 4.604458808898926e-06, 4.92483377456665e-06, 5.245208740234375e-06, 5.5655837059021e-06, 5.885958671569824e-06, 6.206333637237549e-06, 6.5267086029052734e-06, 6.847083568572998e-06, 7.167458534240723e-06, 7.487833499908447e-06, 7.808208465576172e-06, 8.128583431243896e-06, 8.448958396911621e-06, 8.769333362579346e-06, 9.08970832824707e-06, 9.410083293914795e-06, 9.73045825958252e-06, 1.0050833225250244e-05, 1.0371208190917969e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 0.0, 7.0, 18.0, 19.0, 27.0, 53.0, 80.0, 119.0, 212.0, 291.0, 476.0, 824.0, 1382.0, 2432.0, 4030.0, 7078.0, 12623.0, 23080.0, 43206.0, 84580.0, 157625.0, 234993.0, 210404.0, 124752.0, 64491.0, 33679.0, 18115.0, 10100.0, 5688.0, 3372.0, 1835.0, 1180.0, 700.0, 384.0, 259.0, 164.0, 100.0, 64.0, 42.0, 20.0, 19.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111572265625, -0.1075592041015625, -0.103546142578125, -0.0995330810546875, -0.09552001953125, -0.0915069580078125, -0.087493896484375, -0.0834808349609375, -0.0794677734375, -0.0754547119140625, -0.071441650390625, -0.0674285888671875, -0.06341552734375, -0.0594024658203125, -0.055389404296875, -0.0513763427734375, -0.04736328125, -0.0433502197265625, -0.039337158203125, -0.0353240966796875, -0.03131103515625, -0.0272979736328125, -0.023284912109375, -0.0192718505859375, -0.0152587890625, -0.0112457275390625, -0.007232666015625, -0.0032196044921875, 0.00079345703125, 0.0048065185546875, 0.008819580078125, 0.0128326416015625, 0.016845703125, 0.0208587646484375, 0.024871826171875, 0.0288848876953125, 0.03289794921875, 0.0369110107421875, 0.040924072265625, 0.0449371337890625, 0.0489501953125, 0.0529632568359375, 0.056976318359375, 0.0609893798828125, 0.06500244140625, 0.0690155029296875, 0.073028564453125, 0.0770416259765625, 0.0810546875, 0.0850677490234375, 0.089080810546875, 0.0930938720703125, 0.09710693359375, 0.1011199951171875, 0.105133056640625, 0.1091461181640625, 0.1131591796875, 0.1171722412109375, 0.121185302734375, 0.1251983642578125, 0.12921142578125, 0.1332244873046875, 0.137237548828125, 0.1412506103515625, 0.145263671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 6.0, 8.0, 6.0, 9.0, 17.0, 23.0, 31.0, 40.0, 47.0, 59.0, 60.0, 76.0, 96.0, 70.0, 84.0, 81.0, 55.0, 50.0, 42.0, 27.0, 22.0, 19.0, 7.0, 9.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.028400421142578125, -0.02716827392578125, -0.025936126708984375, -0.0247039794921875, -0.023471832275390625, -0.02223968505859375, -0.021007537841796875, -0.019775390625, -0.018543243408203125, -0.01731109619140625, -0.016078948974609375, -0.0148468017578125, -0.013614654541015625, -0.01238250732421875, -0.011150360107421875, -0.009918212890625, -0.008686065673828125, -0.00745391845703125, -0.006221771240234375, -0.0049896240234375, -0.003757476806640625, -0.00252532958984375, -0.001293182373046875, -6.103515625e-05, 0.001171112060546875, 0.00240325927734375, 0.003635406494140625, 0.0048675537109375, 0.006099700927734375, 0.00733184814453125, 0.008563995361328125, 0.009796142578125, 0.011028289794921875, 0.01226043701171875, 0.013492584228515625, 0.0147247314453125, 0.015956878662109375, 0.01718902587890625, 0.018421173095703125, 0.0196533203125, 0.020885467529296875, 0.02211761474609375, 0.023349761962890625, 0.0245819091796875, 0.025814056396484375, 0.02704620361328125, 0.028278350830078125, 0.029510498046875, 0.030742645263671875, 0.03197479248046875, 0.033206939697265625, 0.0344390869140625, 0.035671234130859375, 0.03690338134765625, 0.038135528564453125, 0.03936767578125, 0.040599822998046875, 0.04183197021484375, 0.043064117431640625, 0.0442962646484375, 0.045528411865234375, 0.04676055908203125, 0.047992706298828125, 0.049224853515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 7.0, 6.0, 6.0, 9.0, 10.0, 16.0, 19.0, 20.0, 28.0, 48.0, 30.0, 45.0, 46.0, 66.0, 55.0, 71.0, 69.0, 54.0, 70.0, 52.0, 47.0, 43.0, 45.0, 25.0, 23.0, 18.0, 18.0, 15.0, 9.0, 10.0, 10.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.644814133644104, -1.5906760692596436, -1.5365378856658936, -1.482399821281433, -1.428261637687683, -1.3741235733032227, -1.3199853897094727, -1.2658473253250122, -1.2117092609405518, -1.1575711965560913, -1.1034330129623413, -1.0492949485778809, -0.9951568245887756, -0.9410187005996704, -0.8868805766105652, -0.83274245262146, -0.7786043286323547, -0.7244662046432495, -0.6703280806541443, -0.6161899566650391, -0.5620518922805786, -0.5079137682914734, -0.45377564430236816, -0.3996375501155853, -0.3454994261264801, -0.2913613021373749, -0.23722320795059204, -0.18308508396148682, -0.12894697487354279, -0.07480886578559875, -0.02067074179649353, 0.03346735239028931, 0.08760547637939453, 0.14174358546733856, 0.1958816945552826, 0.2500198185443878, 0.30415791273117065, 0.3582960367202759, 0.4124341607093811, 0.46657225489616394, 0.5207103490829468, 0.574848473072052, 0.6289865970611572, 0.6831246614456177, 0.7372627854347229, 0.7914009094238281, 0.8455390334129333, 0.8996771574020386, 0.9538152813911438, 1.007953405380249, 1.0620914697647095, 1.1162296533584595, 1.17036771774292, 1.22450590133667, 1.2786439657211304, 1.3327820301055908, 1.3869202136993408, 1.4410582780838013, 1.4951964616775513, 1.5493345260620117, 1.6034727096557617, 1.6576107740402222, 1.7117488384246826, 1.7658870220184326, 1.820025086402893]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 16.0, 11.0, 14.0, 17.0, 27.0, 20.0, 24.0, 28.0, 41.0, 36.0, 33.0, 33.0, 37.0, 41.0, 44.0, 40.0, 41.0, 35.0, 49.0, 46.0, 33.0, 39.0, 36.0, 29.0, 29.0, 26.0, 14.0, 24.0, 15.0, 13.0, 12.0, 8.0, 7.0, 10.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0365345478057861, -1.0054458379745483, -0.9743571877479553, -0.9432684779167175, -0.9121797680854797, -0.8810911178588867, -0.8500024080276489, -0.8189136981964111, -0.7878249883651733, -0.7567362785339355, -0.7256476283073425, -0.6945589184761047, -0.6634702086448669, -0.6323815584182739, -0.6012928485870361, -0.5702041387557983, -0.5391154289245605, -0.5080267190933228, -0.47693803906440735, -0.44584935903549194, -0.41476064920425415, -0.38367196917533875, -0.35258328914642334, -0.32149457931518555, -0.29040592908859253, -0.2593172490596771, -0.22822853922843933, -0.19713985919952393, -0.16605114936828613, -0.13496246933937073, -0.10387377440929413, -0.07278507947921753, -0.041696369647979736, -0.010607676580548286, 0.020481016486883163, 0.051569707691669464, 0.08265840262174606, 0.11374709010124207, 0.14483578503131866, 0.17592447996139526, 0.20701317489147186, 0.23810186982154846, 0.26919054985046387, 0.30027925968170166, 0.33136793971061707, 0.36245661973953247, 0.39354532957077026, 0.42463403940200806, 0.45572271943092346, 0.48681139945983887, 0.5179001092910767, 0.5489888191223145, 0.5800774693489075, 0.6111661791801453, 0.6422548890113831, 0.6733435392379761, 0.7044322490692139, 0.7355209589004517, 0.7666096091270447, 0.7976983189582825, 0.8287870287895203, 0.8598756790161133, 0.8909643888473511, 0.9220530986785889, 0.9531418085098267]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 15.0, 13.0, 24.0, 35.0, 67.0, 98.0, 133.0, 251.0, 436.0, 672.0, 1159.0, 2024.0, 3361.0, 5546.0, 9478.0, 15526.0, 24875.0, 38559.0, 57642.0, 80537.0, 104299.0, 122948.0, 129396.0, 121257.0, 101697.0, 77271.0, 54921.0, 37020.0, 23107.0, 14401.0, 8788.0, 5247.0, 3018.0, 1896.0, 1153.0, 637.0, 369.0, 241.0, 147.0, 106.0, 59.0, 37.0, 27.0, 21.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 6.0], "bins": [-1.0537109375, -1.0231094360351562, -0.9925079345703125, -0.9619064331054688, -0.931304931640625, -0.9007034301757812, -0.8701019287109375, -0.8395004272460938, -0.80889892578125, -0.7782974243164062, -0.7476959228515625, -0.7170944213867188, -0.686492919921875, -0.6558914184570312, -0.6252899169921875, -0.5946884155273438, -0.5640869140625, -0.5334854125976562, -0.5028839111328125, -0.47228240966796875, -0.441680908203125, -0.41107940673828125, -0.3804779052734375, -0.34987640380859375, -0.31927490234375, -0.28867340087890625, -0.2580718994140625, -0.22747039794921875, -0.196868896484375, -0.16626739501953125, -0.1356658935546875, -0.10506439208984375, -0.074462890625, -0.04386138916015625, -0.0132598876953125, 0.01734161376953125, 0.047943115234375, 0.07854461669921875, 0.1091461181640625, 0.13974761962890625, 0.17034912109375, 0.20095062255859375, 0.2315521240234375, 0.26215362548828125, 0.292755126953125, 0.32335662841796875, 0.3539581298828125, 0.38455963134765625, 0.4151611328125, 0.44576263427734375, 0.4763641357421875, 0.5069656372070312, 0.537567138671875, 0.5681686401367188, 0.5987701416015625, 0.6293716430664062, 0.65997314453125, 0.6905746459960938, 0.7211761474609375, 0.7517776489257812, 0.782379150390625, 0.8129806518554688, 0.8435821533203125, 0.8741836547851562, 0.90478515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 12.0, 5.0, 14.0, 16.0, 11.0, 23.0, 35.0, 22.0, 33.0, 31.0, 30.0, 44.0, 49.0, 44.0, 60.0, 49.0, 53.0, 52.0, 37.0, 45.0, 44.0, 43.0, 30.0, 25.0, 28.0, 29.0, 25.0, 8.0, 16.0, 11.0, 15.0, 16.0, 9.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.22607421875, -1.1884765625, -1.15087890625, -1.11328125, -1.07568359375, -1.0380859375, -1.00048828125, -0.962890625, -0.92529296875, -0.8876953125, -0.85009765625, -0.8125, -0.77490234375, -0.7373046875, -0.69970703125, -0.662109375, -0.62451171875, -0.5869140625, -0.54931640625, -0.51171875, -0.47412109375, -0.4365234375, -0.39892578125, -0.361328125, -0.32373046875, -0.2861328125, -0.24853515625, -0.2109375, -0.17333984375, -0.1357421875, -0.09814453125, -0.060546875, -0.02294921875, 0.0146484375, 0.05224609375, 0.08984375, 0.12744140625, 0.1650390625, 0.20263671875, 0.240234375, 0.27783203125, 0.3154296875, 0.35302734375, 0.390625, 0.42822265625, 0.4658203125, 0.50341796875, 0.541015625, 0.57861328125, 0.6162109375, 0.65380859375, 0.69140625, 0.72900390625, 0.7666015625, 0.80419921875, 0.841796875, 0.87939453125, 0.9169921875, 0.95458984375, 0.9921875, 1.02978515625, 1.0673828125, 1.10498046875, 1.142578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 5.0, 13.0, 18.0, 27.0, 37.0, 68.0, 94.0, 179.0, 303.0, 486.0, 819.0, 1395.0, 2398.0, 3926.0, 6242.0, 10014.0, 16372.0, 25509.0, 38498.0, 55605.0, 75921.0, 97229.0, 114464.0, 121588.0, 117499.0, 101670.0, 80640.0, 59727.0, 42282.0, 27995.0, 18212.0, 11424.0, 6979.0, 4390.0, 2663.0, 1530.0, 971.0, 557.0, 339.0, 179.0, 129.0, 59.0, 41.0, 23.0, 12.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.97216796875, -0.9423599243164062, -0.9125518798828125, -0.8827438354492188, -0.852935791015625, -0.8231277465820312, -0.7933197021484375, -0.7635116577148438, -0.73370361328125, -0.7038955688476562, -0.6740875244140625, -0.6442794799804688, -0.614471435546875, -0.5846633911132812, -0.5548553466796875, -0.5250473022460938, -0.4952392578125, -0.46543121337890625, -0.4356231689453125, -0.40581512451171875, -0.376007080078125, -0.34619903564453125, -0.3163909912109375, -0.28658294677734375, -0.25677490234375, -0.22696685791015625, -0.1971588134765625, -0.16735076904296875, -0.137542724609375, -0.10773468017578125, -0.0779266357421875, -0.04811859130859375, -0.018310546875, 0.01149749755859375, 0.0413055419921875, 0.07111358642578125, 0.100921630859375, 0.13072967529296875, 0.1605377197265625, 0.19034576416015625, 0.22015380859375, 0.24996185302734375, 0.2797698974609375, 0.30957794189453125, 0.339385986328125, 0.36919403076171875, 0.3990020751953125, 0.42881011962890625, 0.4586181640625, 0.48842620849609375, 0.5182342529296875, 0.5480422973632812, 0.577850341796875, 0.6076583862304688, 0.6374664306640625, 0.6672744750976562, 0.69708251953125, 0.7268905639648438, 0.7566986083984375, 0.7865066528320312, 0.816314697265625, 0.8461227416992188, 0.8759307861328125, 0.9057388305664062, 0.935546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 10.0, 6.0, 7.0, 16.0, 12.0, 29.0, 22.0, 21.0, 28.0, 25.0, 44.0, 31.0, 42.0, 53.0, 47.0, 40.0, 41.0, 30.0, 41.0, 34.0, 44.0, 47.0, 38.0, 46.0, 28.0, 32.0, 26.0, 22.0, 23.0, 26.0, 18.0, 23.0, 10.0, 9.0, 8.0, 2.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5962295532226562, -0.5747833251953125, -0.5533370971679688, -0.531890869140625, -0.5104446411132812, -0.4889984130859375, -0.46755218505859375, -0.44610595703125, -0.42465972900390625, -0.4032135009765625, -0.38176727294921875, -0.360321044921875, -0.33887481689453125, -0.3174285888671875, -0.29598236083984375, -0.2745361328125, -0.25308990478515625, -0.2316436767578125, -0.21019744873046875, -0.188751220703125, -0.16730499267578125, -0.1458587646484375, -0.12441253662109375, -0.10296630859375, -0.08152008056640625, -0.0600738525390625, -0.03862762451171875, -0.017181396484375, 0.00426483154296875, 0.0257110595703125, 0.04715728759765625, 0.068603515625, 0.09004974365234375, 0.1114959716796875, 0.13294219970703125, 0.154388427734375, 0.17583465576171875, 0.1972808837890625, 0.21872711181640625, 0.24017333984375, 0.26161956787109375, 0.2830657958984375, 0.30451202392578125, 0.325958251953125, 0.34740447998046875, 0.3688507080078125, 0.39029693603515625, 0.4117431640625, 0.43318939208984375, 0.4546356201171875, 0.47608184814453125, 0.497528076171875, 0.5189743041992188, 0.5404205322265625, 0.5618667602539062, 0.58331298828125, 0.6047592163085938, 0.6262054443359375, 0.6476516723632812, 0.669097900390625, 0.6905441284179688, 0.7119903564453125, 0.7334365844726562, 0.7548828125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 21.0, 26.0, 52.0, 71.0, 107.0, 147.0, 193.0, 351.0, 498.0, 812.0, 1331.0, 2348.0, 4114.0, 7777.0, 14953.0, 29138.0, 56813.0, 104569.0, 168142.0, 209219.0, 184407.0, 121519.0, 67684.0, 35248.0, 17903.0, 9201.0, 4971.0, 2733.0, 1586.0, 945.0, 573.0, 352.0, 242.0, 158.0, 103.0, 59.0, 48.0, 39.0, 21.0, 18.0, 15.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.70123291015625, -0.6783447265625, -0.65545654296875, -0.632568359375, -0.60968017578125, -0.5867919921875, -0.56390380859375, -0.541015625, -0.51812744140625, -0.4952392578125, -0.47235107421875, -0.449462890625, -0.42657470703125, -0.4036865234375, -0.38079833984375, -0.35791015625, -0.33502197265625, -0.3121337890625, -0.28924560546875, -0.266357421875, -0.24346923828125, -0.2205810546875, -0.19769287109375, -0.1748046875, -0.15191650390625, -0.1290283203125, -0.10614013671875, -0.083251953125, -0.06036376953125, -0.0374755859375, -0.01458740234375, 0.00830078125, 0.03118896484375, 0.0540771484375, 0.07696533203125, 0.099853515625, 0.12274169921875, 0.1456298828125, 0.16851806640625, 0.19140625, 0.21429443359375, 0.2371826171875, 0.26007080078125, 0.282958984375, 0.30584716796875, 0.3287353515625, 0.35162353515625, 0.37451171875, 0.39739990234375, 0.4202880859375, 0.44317626953125, 0.466064453125, 0.48895263671875, 0.5118408203125, 0.53472900390625, 0.5576171875, 0.58050537109375, 0.6033935546875, 0.62628173828125, 0.649169921875, 0.67205810546875, 0.6949462890625, 0.71783447265625, 0.74072265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 1.0, 5.0, 11.0, 7.0, 11.0, 15.0, 17.0, 24.0, 22.0, 23.0, 27.0, 45.0, 39.0, 34.0, 52.0, 51.0, 62.0, 47.0, 40.0, 69.0, 48.0, 53.0, 48.0, 52.0, 32.0, 32.0, 36.0, 17.0, 11.0, 18.0, 8.0, 8.0, 5.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.357099533081055e-05, -4.1943974792957306e-05, -4.0316954255104065e-05, -3.8689933717250824e-05, -3.706291317939758e-05, -3.543589264154434e-05, -3.38088721036911e-05, -3.218185156583786e-05, -3.055483102798462e-05, -2.8927810490131378e-05, -2.7300789952278137e-05, -2.5673769414424896e-05, -2.4046748876571655e-05, -2.2419728338718414e-05, -2.0792707800865173e-05, -1.9165687263011932e-05, -1.753866672515869e-05, -1.591164618730545e-05, -1.428462564945221e-05, -1.2657605111598969e-05, -1.1030584573745728e-05, -9.403564035892487e-06, -7.776543498039246e-06, -6.149522960186005e-06, -4.522502422332764e-06, -2.8954818844795227e-06, -1.2684613466262817e-06, 3.5855919122695923e-07, 1.9855797290802e-06, 3.612600266933441e-06, 5.239620804786682e-06, 6.866641342639923e-06, 8.493661880493164e-06, 1.0120682418346405e-05, 1.1747702956199646e-05, 1.3374723494052887e-05, 1.5001744031906128e-05, 1.662876456975937e-05, 1.825578510761261e-05, 1.988280564546585e-05, 2.1509826183319092e-05, 2.3136846721172333e-05, 2.4763867259025574e-05, 2.6390887796878815e-05, 2.8017908334732056e-05, 2.9644928872585297e-05, 3.127194941043854e-05, 3.289896994829178e-05, 3.452599048614502e-05, 3.615301102399826e-05, 3.77800315618515e-05, 3.940705209970474e-05, 4.1034072637557983e-05, 4.2661093175411224e-05, 4.4288113713264465e-05, 4.5915134251117706e-05, 4.754215478897095e-05, 4.916917532682419e-05, 5.079619586467743e-05, 5.242321640253067e-05, 5.405023694038391e-05, 5.567725747823715e-05, 5.730427801609039e-05, 5.8931298553943634e-05, 6.0558319091796875e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 3.0, 11.0, 9.0, 17.0, 30.0, 54.0, 70.0, 127.0, 189.0, 283.0, 545.0, 880.0, 1416.0, 2431.0, 3994.0, 6661.0, 11224.0, 19066.0, 31131.0, 49666.0, 75383.0, 106676.0, 134235.0, 147185.0, 136659.0, 108893.0, 78643.0, 51342.0, 32335.0, 19917.0, 11936.0, 7034.0, 4096.0, 2517.0, 1515.0, 903.0, 569.0, 323.0, 218.0, 131.0, 84.0, 63.0, 30.0, 29.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.580078125, -0.5642051696777344, -0.5483322143554688, -0.5324592590332031, -0.5165863037109375, -0.5007133483886719, -0.48484039306640625, -0.4689674377441406, -0.453094482421875, -0.4372215270996094, -0.42134857177734375, -0.4054756164550781, -0.3896026611328125, -0.3737297058105469, -0.35785675048828125, -0.3419837951660156, -0.32611083984375, -0.3102378845214844, -0.29436492919921875, -0.2784919738769531, -0.2626190185546875, -0.24674606323242188, -0.23087310791015625, -0.21500015258789062, -0.199127197265625, -0.18325424194335938, -0.16738128662109375, -0.15150833129882812, -0.1356353759765625, -0.11976242065429688, -0.10388946533203125, -0.08801651000976562, -0.0721435546875, -0.056270599365234375, -0.04039764404296875, -0.024524688720703125, -0.0086517333984375, 0.007221221923828125, 0.02309417724609375, 0.038967132568359375, 0.054840087890625, 0.07071304321289062, 0.08658599853515625, 0.10245895385742188, 0.1183319091796875, 0.13420486450195312, 0.15007781982421875, 0.16595077514648438, 0.18182373046875, 0.19769668579101562, 0.21356964111328125, 0.22944259643554688, 0.2453155517578125, 0.2611885070800781, 0.27706146240234375, 0.2929344177246094, 0.308807373046875, 0.3246803283691406, 0.34055328369140625, 0.3564262390136719, 0.3722991943359375, 0.3881721496582031, 0.40404510498046875, 0.4199180603027344, 0.435791015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 3.0, 6.0, 10.0, 10.0, 8.0, 13.0, 10.0, 17.0, 22.0, 15.0, 29.0, 32.0, 36.0, 39.0, 46.0, 40.0, 43.0, 30.0, 46.0, 46.0, 45.0, 40.0, 42.0, 40.0, 37.0, 33.0, 33.0, 30.0, 23.0, 21.0, 27.0, 21.0, 19.0, 20.0, 9.0, 10.0, 9.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12152099609375, -0.11739253997802734, -0.11326408386230469, -0.10913562774658203, -0.10500717163085938, -0.10087871551513672, -0.09675025939941406, -0.0926218032836914, -0.08849334716796875, -0.0843648910522461, -0.08023643493652344, -0.07610797882080078, -0.07197952270507812, -0.06785106658935547, -0.06372261047363281, -0.059594154357910156, -0.0554656982421875, -0.051337242126464844, -0.04720878601074219, -0.04308032989501953, -0.038951873779296875, -0.03482341766357422, -0.030694961547851562, -0.026566505432128906, -0.02243804931640625, -0.018309593200683594, -0.014181137084960938, -0.010052680969238281, -0.005924224853515625, -0.0017957687377929688, 0.0023326873779296875, 0.006461143493652344, 0.010589599609375, 0.014718055725097656, 0.018846511840820312, 0.02297496795654297, 0.027103424072265625, 0.03123188018798828, 0.03536033630371094, 0.039488792419433594, 0.04361724853515625, 0.047745704650878906, 0.05187416076660156, 0.05600261688232422, 0.060131072998046875, 0.06425952911376953, 0.06838798522949219, 0.07251644134521484, 0.0766448974609375, 0.08077335357666016, 0.08490180969238281, 0.08903026580810547, 0.09315872192382812, 0.09728717803955078, 0.10141563415527344, 0.1055440902709961, 0.10967254638671875, 0.1138010025024414, 0.11792945861816406, 0.12205791473388672, 0.12618637084960938, 0.13031482696533203, 0.1344432830810547, 0.13857173919677734, 0.1427001953125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 16.0, 22.0, 26.0, 35.0, 49.0, 46.0, 52.0, 66.0, 55.0, 63.0, 78.0, 63.0, 65.0, 57.0, 39.0, 32.0, 34.0, 38.0, 17.0, 22.0, 22.0, 15.0, 10.0, 5.0, 6.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5396769046783447, -1.4855743646621704, -1.4314717054367065, -1.3773691654205322, -1.3232665061950684, -1.269163966178894, -1.2150613069534302, -1.1609587669372559, -1.106856107711792, -1.0527535676956177, -0.9986509084701538, -0.9445483088493347, -0.8904457092285156, -0.8363431692123413, -0.7822405099868774, -0.7281379699707031, -0.674035370349884, -0.6199327707290649, -0.5658301711082458, -0.5117275714874268, -0.45762497186660767, -0.40352240204811096, -0.34941980242729187, -0.2953172028064728, -0.2412146031856537, -0.1871120035648346, -0.1330094039440155, -0.0789068192243576, -0.024804219603538513, 0.029298365116119385, 0.08340096473693848, 0.13750356435775757, 0.19160616397857666, 0.24570876359939575, 0.29981136322021484, 0.35391396284103394, 0.408016562461853, 0.46211913228034973, 0.5162217617034912, 0.5703243017196655, 0.6244269609451294, 0.6785295605659485, 0.7326321601867676, 0.7867347598075867, 0.8408373594284058, 0.8949398994445801, 0.949042558670044, 1.0031450986862183, 1.0572476387023926, 1.111350178718567, 1.1654528379440308, 1.219555377960205, 1.273658037185669, 1.3277605772018433, 1.3818632364273071, 1.4359657764434814, 1.4900684356689453, 1.5441709756851196, 1.5982736349105835, 1.6523761749267578, 1.7064788341522217, 1.760581374168396, 1.8146840333938599, 1.8687865734100342, 1.922889232635498]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 14.0, 19.0, 21.0, 19.0, 30.0, 30.0, 31.0, 31.0, 48.0, 46.0, 24.0, 34.0, 41.0, 45.0, 34.0, 45.0, 47.0, 44.0, 46.0, 36.0, 42.0, 37.0, 23.0, 16.0, 24.0, 22.0, 16.0, 13.0, 15.0, 11.0, 7.0, 12.0, 6.0, 10.0, 10.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0716361999511719, -1.0388997793197632, -1.006163239479065, -0.9734268188476562, -0.9406903386116028, -0.9079538583755493, -0.8752174377441406, -0.8424809575080872, -0.8097444772720337, -0.7770079970359802, -0.7442715167999268, -0.7115350961685181, -0.6787986159324646, -0.6460621356964111, -0.6133257150650024, -0.580589234828949, -0.5478527545928955, -0.515116274356842, -0.48237982392311096, -0.4496433734893799, -0.4169068932533264, -0.38417041301727295, -0.35143396258354187, -0.3186975121498108, -0.2859610319137573, -0.25322455167770386, -0.22048810124397278, -0.1877516359090805, -0.15501517057418823, -0.12227870523929596, -0.08954223990440369, -0.056805774569511414, -0.02406930923461914, 0.008667156100273132, 0.041403621435165405, 0.07414008677005768, 0.10687655210494995, 0.13961301743984222, 0.1723494827747345, 0.20508594810962677, 0.23782241344451904, 0.2705588936805725, 0.3032953441143036, 0.33603179454803467, 0.36876827478408813, 0.4015047550201416, 0.4342412054538727, 0.46697765588760376, 0.4997141361236572, 0.5324506163597107, 0.5651870965957642, 0.5979235172271729, 0.6306599974632263, 0.6633964776992798, 0.6961328983306885, 0.7288693785667419, 0.7616058588027954, 0.7943423390388489, 0.8270788192749023, 0.859815239906311, 0.8925517201423645, 0.925288200378418, 0.9580246210098267, 0.9907611012458801, 1.0234975814819336]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 17.0, 36.0, 48.0, 96.0, 103.0, 175.0, 266.0, 446.0, 790.0, 1303.0, 2120.0, 3750.0, 6345.0, 11120.0, 19382.0, 34501.0, 62484.0, 111686.0, 196831.0, 326758.0, 499138.0, 653865.0, 691305.0, 579542.0, 404078.0, 250541.0, 146391.0, 82448.0, 46626.0, 26247.0, 14894.0, 8594.0, 4901.0, 2963.0, 1765.0, 1074.0, 615.0, 380.0, 226.0, 160.0, 99.0, 52.0, 43.0, 27.0, 11.0, 7.0, 3.0, 10.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1010284423828125, -1.063385009765625, -1.0257415771484375, -0.98809814453125, -0.9504547119140625, -0.912811279296875, -0.8751678466796875, -0.8375244140625, -0.7998809814453125, -0.762237548828125, -0.7245941162109375, -0.68695068359375, -0.6493072509765625, -0.611663818359375, -0.5740203857421875, -0.536376953125, -0.4987335205078125, -0.461090087890625, -0.4234466552734375, -0.38580322265625, -0.3481597900390625, -0.310516357421875, -0.2728729248046875, -0.2352294921875, -0.1975860595703125, -0.159942626953125, -0.1222991943359375, -0.08465576171875, -0.0470123291015625, -0.009368896484375, 0.0282745361328125, 0.06591796875, 0.1035614013671875, 0.141204833984375, 0.1788482666015625, 0.21649169921875, 0.2541351318359375, 0.291778564453125, 0.3294219970703125, 0.3670654296875, 0.4047088623046875, 0.442352294921875, 0.4799957275390625, 0.51763916015625, 0.5552825927734375, 0.592926025390625, 0.6305694580078125, 0.668212890625, 0.7058563232421875, 0.743499755859375, 0.7811431884765625, 0.81878662109375, 0.8564300537109375, 0.894073486328125, 0.9317169189453125, 0.9693603515625, 1.0070037841796875, 1.044647216796875, 1.0822906494140625, 1.11993408203125, 1.1575775146484375, 1.195220947265625, 1.2328643798828125, 1.2705078125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 10.0, 15.0, 15.0, 9.0, 16.0, 29.0, 29.0, 26.0, 34.0, 27.0, 38.0, 44.0, 47.0, 34.0, 48.0, 49.0, 42.0, 40.0, 39.0, 43.0, 32.0, 32.0, 36.0, 33.0, 28.0, 23.0, 21.0, 21.0, 23.0, 18.0, 11.0, 15.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.806640625, -0.7824478149414062, -0.7582550048828125, -0.7340621948242188, -0.709869384765625, -0.6856765747070312, -0.6614837646484375, -0.6372909545898438, -0.61309814453125, -0.5889053344726562, -0.5647125244140625, -0.5405197143554688, -0.516326904296875, -0.49213409423828125, -0.4679412841796875, -0.44374847412109375, -0.4195556640625, -0.39536285400390625, -0.3711700439453125, -0.34697723388671875, -0.322784423828125, -0.29859161376953125, -0.2743988037109375, -0.25020599365234375, -0.22601318359375, -0.20182037353515625, -0.1776275634765625, -0.15343475341796875, -0.129241943359375, -0.10504913330078125, -0.0808563232421875, -0.05666351318359375, -0.032470703125, -0.00827789306640625, 0.0159149169921875, 0.04010772705078125, 0.064300537109375, 0.08849334716796875, 0.1126861572265625, 0.13687896728515625, 0.16107177734375, 0.18526458740234375, 0.2094573974609375, 0.23365020751953125, 0.257843017578125, 0.28203582763671875, 0.3062286376953125, 0.33042144775390625, 0.3546142578125, 0.37880706787109375, 0.4029998779296875, 0.42719268798828125, 0.451385498046875, 0.47557830810546875, 0.4997711181640625, 0.5239639282226562, 0.54815673828125, 0.5723495483398438, 0.5965423583984375, 0.6207351684570312, 0.644927978515625, 0.6691207885742188, 0.6933135986328125, 0.7175064086914062, 0.74169921875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [6.0, 3.0, 7.0, 13.0, 11.0, 26.0, 38.0, 66.0, 103.0, 191.0, 282.0, 464.0, 703.0, 1231.0, 1892.0, 3184.0, 5404.0, 8628.0, 14278.0, 23079.0, 38163.0, 62887.0, 99300.0, 157117.0, 236270.0, 334758.0, 440439.0, 517329.0, 536276.0, 490242.0, 395143.0, 289910.0, 198909.0, 128821.0, 81100.0, 50081.0, 30506.0, 18710.0, 11388.0, 6685.0, 4119.0, 2481.0, 1566.0, 985.0, 567.0, 362.0, 205.0, 140.0, 78.0, 60.0, 40.0, 20.0, 16.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92919921875, -0.8963394165039062, -0.8634796142578125, -0.8306198120117188, -0.797760009765625, -0.7649002075195312, -0.7320404052734375, -0.6991806030273438, -0.66632080078125, -0.6334609985351562, -0.6006011962890625, -0.5677413940429688, -0.534881591796875, -0.5020217895507812, -0.4691619873046875, -0.43630218505859375, -0.4034423828125, -0.37058258056640625, -0.3377227783203125, -0.30486297607421875, -0.272003173828125, -0.23914337158203125, -0.2062835693359375, -0.17342376708984375, -0.14056396484375, -0.10770416259765625, -0.0748443603515625, -0.04198455810546875, -0.009124755859375, 0.02373504638671875, 0.0565948486328125, 0.08945465087890625, 0.122314453125, 0.15517425537109375, 0.1880340576171875, 0.22089385986328125, 0.253753662109375, 0.28661346435546875, 0.3194732666015625, 0.35233306884765625, 0.38519287109375, 0.41805267333984375, 0.4509124755859375, 0.48377227783203125, 0.516632080078125, 0.5494918823242188, 0.5823516845703125, 0.6152114868164062, 0.6480712890625, 0.6809310913085938, 0.7137908935546875, 0.7466506958007812, 0.779510498046875, 0.8123703002929688, 0.8452301025390625, 0.8780899047851562, 0.91094970703125, 0.9438095092773438, 0.9766693115234375, 1.0095291137695312, 1.042388916015625, 1.0752487182617188, 1.1081085205078125, 1.1409683227539062, 1.173828125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 6.0, 6.0, 15.0, 13.0, 14.0, 22.0, 28.0, 33.0, 45.0, 52.0, 67.0, 71.0, 84.0, 81.0, 112.0, 126.0, 145.0, 147.0, 154.0, 193.0, 200.0, 202.0, 189.0, 207.0, 213.0, 185.0, 194.0, 183.0, 155.0, 141.0, 136.0, 101.0, 89.0, 79.0, 82.0, 57.0, 49.0, 28.0, 42.0, 23.0, 22.0, 10.0, 15.0, 13.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.38671875, -0.374908447265625, -0.36309814453125, -0.351287841796875, -0.3394775390625, -0.327667236328125, -0.31585693359375, -0.304046630859375, -0.292236328125, -0.280426025390625, -0.26861572265625, -0.256805419921875, -0.2449951171875, -0.233184814453125, -0.22137451171875, -0.209564208984375, -0.19775390625, -0.185943603515625, -0.17413330078125, -0.162322998046875, -0.1505126953125, -0.138702392578125, -0.12689208984375, -0.115081787109375, -0.103271484375, -0.091461181640625, -0.07965087890625, -0.067840576171875, -0.0560302734375, -0.044219970703125, -0.03240966796875, -0.020599365234375, -0.0087890625, 0.003021240234375, 0.01483154296875, 0.026641845703125, 0.0384521484375, 0.050262451171875, 0.06207275390625, 0.073883056640625, 0.085693359375, 0.097503662109375, 0.10931396484375, 0.121124267578125, 0.1329345703125, 0.144744873046875, 0.15655517578125, 0.168365478515625, 0.18017578125, 0.191986083984375, 0.20379638671875, 0.215606689453125, 0.2274169921875, 0.239227294921875, 0.25103759765625, 0.262847900390625, 0.274658203125, 0.286468505859375, 0.29827880859375, 0.310089111328125, 0.3218994140625, 0.333709716796875, 0.34552001953125, 0.357330322265625, 0.369140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 13.0, 10.0, 20.0, 14.0, 20.0, 19.0, 37.0, 42.0, 42.0, 52.0, 44.0, 60.0, 63.0, 63.0, 52.0, 53.0, 43.0, 56.0, 47.0, 41.0, 34.0, 29.0, 22.0, 25.0, 24.0, 10.0, 7.0, 12.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6071772575378418, -1.5585997104644775, -1.5100221633911133, -1.461444616317749, -1.4128670692443848, -1.3642895221710205, -1.3157119750976562, -1.267134428024292, -1.2185568809509277, -1.1699793338775635, -1.1214017868041992, -1.072824239730835, -1.0242466926574707, -0.9756691455841064, -0.927091658115387, -0.8785141110420227, -0.8299366235733032, -0.781359076499939, -0.7327815294265747, -0.6842039823532104, -0.6356264352798462, -0.5870488882064819, -0.5384714007377625, -0.4898938536643982, -0.44131630659103394, -0.3927387595176697, -0.3441612124443054, -0.29558369517326355, -0.2470061480998993, -0.19842860102653503, -0.14985108375549316, -0.1012735366821289, -0.0526958703994751, -0.004118330776691437, 0.044459208846092224, 0.09303674101829529, 0.14161428809165955, 0.1901918351650238, 0.23876935243606567, 0.28734689950942993, 0.3359244465827942, 0.38450199365615845, 0.4330795407295227, 0.4816570580005646, 0.5302345752716064, 0.5788121223449707, 0.627389669418335, 0.6759672164916992, 0.7245447635650635, 0.7731223106384277, 0.821699857711792, 0.8702774047851562, 0.9188549518585205, 0.9674324989318848, 1.016010046005249, 1.0645875930786133, 1.1131651401519775, 1.1617426872253418, 1.210320234298706, 1.2588977813720703, 1.3074753284454346, 1.3560528755187988, 1.404630422592163, 1.4532079696655273, 1.501785397529602]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 11.0, 14.0, 18.0, 20.0, 20.0, 26.0, 32.0, 26.0, 32.0, 43.0, 39.0, 31.0, 38.0, 31.0, 41.0, 42.0, 40.0, 43.0, 40.0, 42.0, 36.0, 47.0, 33.0, 29.0, 16.0, 34.0, 27.0, 15.0, 19.0, 10.0, 16.0, 12.0, 11.0, 10.0, 3.0, 10.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.025536060333252, -0.9957210421562195, -0.9659060835838318, -0.9360910654067993, -0.9062761068344116, -0.8764610886573792, -0.8466460704803467, -0.816831111907959, -0.7870160937309265, -0.757201075553894, -0.7273861169815063, -0.6975710988044739, -0.6677560806274414, -0.6379411220550537, -0.6081261038780212, -0.5783110857009888, -0.5484961271286011, -0.5186811089515686, -0.4888661503791809, -0.45905113220214844, -0.42923614382743835, -0.39942115545272827, -0.3696061372756958, -0.3397911489009857, -0.30997616052627563, -0.28016117215156555, -0.25034618377685547, -0.220531165599823, -0.19071617722511292, -0.16090118885040283, -0.13108618557453156, -0.10127118229866028, -0.0714561939239502, -0.041641198098659515, -0.011826202273368835, 0.017988793551921844, 0.047803789377212524, 0.07761877775192261, 0.10743378102779388, 0.13724878430366516, 0.16706377267837524, 0.19687876105308533, 0.2266937643289566, 0.2565087676048279, 0.28632375597953796, 0.31613874435424805, 0.3459537625312805, 0.3757687509059906, 0.4055837392807007, 0.43539872765541077, 0.46521371603012085, 0.4950287342071533, 0.524843692779541, 0.5546587109565735, 0.584473729133606, 0.6142886877059937, 0.6441037058830261, 0.6739187240600586, 0.7037336826324463, 0.7335487008094788, 0.7633637189865112, 0.7931786775588989, 0.8229936957359314, 0.8528087139129639, 0.8826236724853516]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 15.0, 21.0, 27.0, 36.0, 40.0, 75.0, 102.0, 178.0, 234.0, 318.0, 522.0, 750.0, 1180.0, 1866.0, 2999.0, 4865.0, 8342.0, 14639.0, 26880.0, 50211.0, 94159.0, 166844.0, 231184.0, 192673.0, 114023.0, 60994.0, 32664.0, 17614.0, 9820.0, 5576.0, 3467.0, 2112.0, 1335.0, 899.0, 600.0, 390.0, 272.0, 192.0, 129.0, 86.0, 59.0, 41.0, 35.0, 23.0, 18.0, 13.0, 9.0, 7.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.390869140625, -0.3785209655761719, -0.36617279052734375, -0.3538246154785156, -0.3414764404296875, -0.3291282653808594, -0.31678009033203125, -0.3044319152832031, -0.292083740234375, -0.2797355651855469, -0.26738739013671875, -0.2550392150878906, -0.2426910400390625, -0.23034286499023438, -0.21799468994140625, -0.20564651489257812, -0.19329833984375, -0.18095016479492188, -0.16860198974609375, -0.15625381469726562, -0.1439056396484375, -0.13155746459960938, -0.11920928955078125, -0.10686111450195312, -0.094512939453125, -0.08216476440429688, -0.06981658935546875, -0.057468414306640625, -0.0451202392578125, -0.032772064208984375, -0.02042388916015625, -0.008075714111328125, 0.0042724609375, 0.016620635986328125, 0.02896881103515625, 0.041316986083984375, 0.0536651611328125, 0.06601333618164062, 0.07836151123046875, 0.09070968627929688, 0.103057861328125, 0.11540603637695312, 0.12775421142578125, 0.14010238647460938, 0.1524505615234375, 0.16479873657226562, 0.17714691162109375, 0.18949508666992188, 0.20184326171875, 0.21419143676757812, 0.22653961181640625, 0.23888778686523438, 0.2512359619140625, 0.2635841369628906, 0.27593231201171875, 0.2882804870605469, 0.300628662109375, 0.3129768371582031, 0.32532501220703125, 0.3376731872558594, 0.3500213623046875, 0.3623695373535156, 0.37471771240234375, 0.3870658874511719, 0.3994140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 7.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 18.0, 15.0, 26.0, 19.0, 22.0, 19.0, 26.0, 39.0, 41.0, 37.0, 38.0, 48.0, 30.0, 41.0, 48.0, 40.0, 34.0, 30.0, 38.0, 36.0, 41.0, 29.0, 31.0, 20.0, 25.0, 23.0, 25.0, 18.0, 12.0, 5.0, 12.0, 12.0, 11.0, 5.0, 4.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0360031127929688, -1.0046234130859375, -0.9732437133789062, -0.941864013671875, -0.9104843139648438, -0.8791046142578125, -0.8477249145507812, -0.81634521484375, -0.7849655151367188, -0.7535858154296875, -0.7222061157226562, -0.690826416015625, -0.6594467163085938, -0.6280670166015625, -0.5966873168945312, -0.5653076171875, -0.5339279174804688, -0.5025482177734375, -0.47116851806640625, -0.439788818359375, -0.40840911865234375, -0.3770294189453125, -0.34564971923828125, -0.31427001953125, -0.28289031982421875, -0.2515106201171875, -0.22013092041015625, -0.188751220703125, -0.15737152099609375, -0.1259918212890625, -0.09461212158203125, -0.063232421875, -0.03185272216796875, -0.0004730224609375, 0.03090667724609375, 0.062286376953125, 0.09366607666015625, 0.1250457763671875, 0.15642547607421875, 0.18780517578125, 0.21918487548828125, 0.2505645751953125, 0.28194427490234375, 0.313323974609375, 0.34470367431640625, 0.3760833740234375, 0.40746307373046875, 0.4388427734375, 0.47022247314453125, 0.5016021728515625, 0.5329818725585938, 0.564361572265625, 0.5957412719726562, 0.6271209716796875, 0.6585006713867188, 0.68988037109375, 0.7212600708007812, 0.7526397705078125, 0.7840194702148438, 0.815399169921875, 0.8467788696289062, 0.8781585693359375, 0.9095382690429688, 0.94091796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 12.0, 16.0, 27.0, 53.0, 40.0, 76.0, 128.0, 191.0, 313.0, 408.0, 645.0, 1009.0, 1678.0, 3093.0, 6303.0, 13032.0, 30344.0, 75614.0, 189844.0, 330399.0, 231462.0, 94277.0, 37567.0, 15860.0, 7191.0, 3695.0, 2024.0, 1168.0, 682.0, 465.0, 307.0, 181.0, 135.0, 108.0, 64.0, 31.0, 36.0, 13.0, 9.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5599822998046875, -0.542816162109375, -0.5256500244140625, -0.50848388671875, -0.4913177490234375, -0.474151611328125, -0.4569854736328125, -0.4398193359375, -0.4226531982421875, -0.405487060546875, -0.3883209228515625, -0.37115478515625, -0.3539886474609375, -0.336822509765625, -0.3196563720703125, -0.302490234375, -0.2853240966796875, -0.268157958984375, -0.2509918212890625, -0.23382568359375, -0.2166595458984375, -0.199493408203125, -0.1823272705078125, -0.1651611328125, -0.1479949951171875, -0.130828857421875, -0.1136627197265625, -0.09649658203125, -0.0793304443359375, -0.062164306640625, -0.0449981689453125, -0.02783203125, -0.0106658935546875, 0.006500244140625, 0.0236663818359375, 0.04083251953125, 0.0579986572265625, 0.075164794921875, 0.0923309326171875, 0.1094970703125, 0.1266632080078125, 0.143829345703125, 0.1609954833984375, 0.17816162109375, 0.1953277587890625, 0.212493896484375, 0.2296600341796875, 0.246826171875, 0.2639923095703125, 0.281158447265625, 0.2983245849609375, 0.31549072265625, 0.3326568603515625, 0.349822998046875, 0.3669891357421875, 0.3841552734375, 0.4013214111328125, 0.418487548828125, 0.4356536865234375, 0.45281982421875, 0.4699859619140625, 0.487152099609375, 0.5043182373046875, 0.521484375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 8.0, 6.0, 10.0, 11.0, 11.0, 16.0, 14.0, 19.0, 20.0, 26.0, 30.0, 29.0, 39.0, 47.0, 46.0, 39.0, 42.0, 38.0, 37.0, 45.0, 46.0, 38.0, 40.0, 40.0, 42.0, 45.0, 31.0, 39.0, 14.0, 19.0, 17.0, 24.0, 14.0, 6.0, 10.0, 7.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.66143798828125, -0.6402587890625, -0.61907958984375, -0.597900390625, -0.57672119140625, -0.5555419921875, -0.53436279296875, -0.51318359375, -0.49200439453125, -0.4708251953125, -0.44964599609375, -0.428466796875, -0.40728759765625, -0.3861083984375, -0.36492919921875, -0.34375, -0.32257080078125, -0.3013916015625, -0.28021240234375, -0.259033203125, -0.23785400390625, -0.2166748046875, -0.19549560546875, -0.17431640625, -0.15313720703125, -0.1319580078125, -0.11077880859375, -0.089599609375, -0.06842041015625, -0.0472412109375, -0.02606201171875, -0.0048828125, 0.01629638671875, 0.0374755859375, 0.05865478515625, 0.079833984375, 0.10101318359375, 0.1221923828125, 0.14337158203125, 0.16455078125, 0.18572998046875, 0.2069091796875, 0.22808837890625, 0.249267578125, 0.27044677734375, 0.2916259765625, 0.31280517578125, 0.333984375, 0.35516357421875, 0.3763427734375, 0.39752197265625, 0.418701171875, 0.43988037109375, 0.4610595703125, 0.48223876953125, 0.50341796875, 0.52459716796875, 0.5457763671875, 0.56695556640625, 0.588134765625, 0.60931396484375, 0.6304931640625, 0.65167236328125, 0.6728515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 8.0, 13.0, 7.0, 14.0, 19.0, 19.0, 42.0, 45.0, 62.0, 102.0, 152.0, 202.0, 311.0, 483.0, 709.0, 1112.0, 2138.0, 3962.0, 9292.0, 33561.0, 534818.0, 414011.0, 29973.0, 8666.0, 3581.0, 1907.0, 1158.0, 675.0, 459.0, 317.0, 209.0, 165.0, 94.0, 73.0, 51.0, 48.0, 31.0, 18.0, 14.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5329666137695312, -0.5131988525390625, -0.49343109130859375, -0.473663330078125, -0.45389556884765625, -0.4341278076171875, -0.41436004638671875, -0.39459228515625, -0.37482452392578125, -0.3550567626953125, -0.33528900146484375, -0.315521240234375, -0.29575347900390625, -0.2759857177734375, -0.25621795654296875, -0.2364501953125, -0.21668243408203125, -0.1969146728515625, -0.17714691162109375, -0.157379150390625, -0.13761138916015625, -0.1178436279296875, -0.09807586669921875, -0.07830810546875, -0.05854034423828125, -0.0387725830078125, -0.01900482177734375, 0.000762939453125, 0.02053070068359375, 0.0402984619140625, 0.06006622314453125, 0.079833984375, 0.09960174560546875, 0.1193695068359375, 0.13913726806640625, 0.158905029296875, 0.17867279052734375, 0.1984405517578125, 0.21820831298828125, 0.23797607421875, 0.25774383544921875, 0.2775115966796875, 0.29727935791015625, 0.317047119140625, 0.33681488037109375, 0.3565826416015625, 0.37635040283203125, 0.3961181640625, 0.41588592529296875, 0.4356536865234375, 0.45542144775390625, 0.475189208984375, 0.49495697021484375, 0.5147247314453125, 0.5344924926757812, 0.55426025390625, 0.5740280151367188, 0.5937957763671875, 0.6135635375976562, 0.633331298828125, 0.6530990600585938, 0.6728668212890625, 0.6926345825195312, 0.71240234375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 7.0, 6.0, 11.0, 17.0, 37.0, 71.0, 66.0, 130.0, 157.0, 140.0, 105.0, 87.0, 61.0, 30.0, 18.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.946518361568451e-05, -2.841278910636902e-05, -2.7360394597053528e-05, -2.6308000087738037e-05, -2.5255605578422546e-05, -2.4203211069107056e-05, -2.3150816559791565e-05, -2.2098422050476074e-05, -2.1046027541160583e-05, -1.9993633031845093e-05, -1.8941238522529602e-05, -1.788884401321411e-05, -1.683644950389862e-05, -1.578405499458313e-05, -1.473166048526764e-05, -1.3679265975952148e-05, -1.2626871466636658e-05, -1.1574476957321167e-05, -1.0522082448005676e-05, -9.469687938690186e-06, -8.417293429374695e-06, -7.364898920059204e-06, -6.312504410743713e-06, -5.260109901428223e-06, -4.207715392112732e-06, -3.155320882797241e-06, -2.1029263734817505e-06, -1.0505318641662598e-06, 1.862645149230957e-09, 1.0542571544647217e-06, 2.1066516637802124e-06, 3.159046173095703e-06, 4.211440682411194e-06, 5.2638351917266846e-06, 6.316229701042175e-06, 7.368624210357666e-06, 8.421018719673157e-06, 9.473413228988647e-06, 1.0525807738304138e-05, 1.1578202247619629e-05, 1.263059675693512e-05, 1.368299126625061e-05, 1.4735385775566101e-05, 1.5787780284881592e-05, 1.6840174794197083e-05, 1.7892569303512573e-05, 1.8944963812828064e-05, 1.9997358322143555e-05, 2.1049752831459045e-05, 2.2102147340774536e-05, 2.3154541850090027e-05, 2.4206936359405518e-05, 2.5259330868721008e-05, 2.63117253780365e-05, 2.736411988735199e-05, 2.841651439666748e-05, 2.946890890598297e-05, 3.052130341529846e-05, 3.157369792461395e-05, 3.262609243392944e-05, 3.3678486943244934e-05, 3.4730881452560425e-05, 3.5783275961875916e-05, 3.6835670471191406e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 17.0, 14.0, 18.0, 39.0, 40.0, 62.0, 55.0, 96.0, 145.0, 179.0, 267.0, 332.0, 432.0, 644.0, 936.0, 1340.0, 2043.0, 3175.0, 4984.0, 8638.0, 16254.0, 38430.0, 140454.0, 507221.0, 222042.0, 53205.0, 20443.0, 10299.0, 5884.0, 3522.0, 2204.0, 1464.0, 1079.0, 701.0, 518.0, 394.0, 233.0, 200.0, 126.0, 96.0, 81.0, 64.0, 50.0, 30.0, 26.0, 18.0, 15.0, 10.0, 7.0, 10.0, 7.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.35888671875, -0.34789276123046875, -0.3368988037109375, -0.32590484619140625, -0.314910888671875, -0.30391693115234375, -0.2929229736328125, -0.28192901611328125, -0.27093505859375, -0.25994110107421875, -0.2489471435546875, -0.23795318603515625, -0.226959228515625, -0.21596527099609375, -0.2049713134765625, -0.19397735595703125, -0.1829833984375, -0.17198944091796875, -0.1609954833984375, -0.15000152587890625, -0.139007568359375, -0.12801361083984375, -0.1170196533203125, -0.10602569580078125, -0.09503173828125, -0.08403778076171875, -0.0730438232421875, -0.06204986572265625, -0.051055908203125, -0.04006195068359375, -0.0290679931640625, -0.01807403564453125, -0.007080078125, 0.00391387939453125, 0.0149078369140625, 0.02590179443359375, 0.036895751953125, 0.04788970947265625, 0.0588836669921875, 0.06987762451171875, 0.08087158203125, 0.09186553955078125, 0.1028594970703125, 0.11385345458984375, 0.124847412109375, 0.13584136962890625, 0.1468353271484375, 0.15782928466796875, 0.1688232421875, 0.17981719970703125, 0.1908111572265625, 0.20180511474609375, 0.212799072265625, 0.22379302978515625, 0.2347869873046875, 0.24578094482421875, 0.25677490234375, 0.26776885986328125, 0.2787628173828125, 0.28975677490234375, 0.300750732421875, 0.31174468994140625, 0.3227386474609375, 0.33373260498046875, 0.3447265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 9.0, 9.0, 18.0, 20.0, 34.0, 45.0, 97.0, 220.0, 235.0, 124.0, 65.0, 31.0, 28.0, 16.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.14694595336914062, -0.14264678955078125, -0.13834762573242188, -0.1340484619140625, -0.12974929809570312, -0.12545013427734375, -0.12115097045898438, -0.116851806640625, -0.11255264282226562, -0.10825347900390625, -0.10395431518554688, -0.0996551513671875, -0.09535598754882812, -0.09105682373046875, -0.08675765991210938, -0.08245849609375, -0.07815933227539062, -0.07386016845703125, -0.06956100463867188, -0.0652618408203125, -0.060962677001953125, -0.05666351318359375, -0.052364349365234375, -0.048065185546875, -0.043766021728515625, -0.03946685791015625, -0.035167694091796875, -0.0308685302734375, -0.026569366455078125, -0.02227020263671875, -0.017971038818359375, -0.013671875, -0.009372711181640625, -0.00507354736328125, -0.000774383544921875, 0.0035247802734375, 0.007823944091796875, 0.01212310791015625, 0.016422271728515625, 0.020721435546875, 0.025020599365234375, 0.02931976318359375, 0.033618927001953125, 0.0379180908203125, 0.042217254638671875, 0.04651641845703125, 0.050815582275390625, 0.05511474609375, 0.059413909912109375, 0.06371307373046875, 0.06801223754882812, 0.0723114013671875, 0.07661056518554688, 0.08090972900390625, 0.08520889282226562, 0.089508056640625, 0.09380722045898438, 0.09810638427734375, 0.10240554809570312, 0.1067047119140625, 0.11100387573242188, 0.11530303955078125, 0.11960220336914062, 0.1239013671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 21.0, 10.0, 20.0, 22.0, 33.0, 29.0, 44.0, 48.0, 51.0, 52.0, 64.0, 59.0, 46.0, 58.0, 54.0, 46.0, 49.0, 41.0, 42.0, 37.0, 21.0, 23.0, 23.0, 18.0, 10.0, 12.0, 10.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5663504600524902, -1.518341064453125, -1.4703317880630493, -1.422322392463684, -1.3743131160736084, -1.3263037204742432, -1.2782944440841675, -1.2302850484848022, -1.1822757720947266, -1.1342663764953613, -1.0862571001052856, -1.0382477045059204, -0.9902384281158447, -0.9422290921211243, -0.8942197561264038, -0.8462103605270386, -0.7982010245323181, -0.7501916885375977, -0.7021823525428772, -0.6541730165481567, -0.6061636805534363, -0.5581543445587158, -0.5101449489593506, -0.4621356427669525, -0.41412630677223206, -0.3661169707775116, -0.31810763478279114, -0.2700982689857483, -0.22208894789218903, -0.17407961189746857, -0.12607026100158691, -0.07806092500686646, -0.030051589012145996, 0.01795775070786476, 0.06596709042787552, 0.11397643387317657, 0.16198576986789703, 0.2099951058626175, 0.25800445675849915, 0.3060137927532196, 0.35402312874794006, 0.4020324647426605, 0.450041800737381, 0.49805116653442383, 0.5460605025291443, 0.5940698385238647, 0.6420791745185852, 0.6900885105133057, 0.7380978465080261, 0.7861071825027466, 0.834116518497467, 0.8821258544921875, 0.930135190486908, 0.9781445264816284, 1.0261539220809937, 1.0741631984710693, 1.1221725940704346, 1.1701819896697998, 1.2181912660598755, 1.2662006616592407, 1.3142099380493164, 1.3622193336486816, 1.4102286100387573, 1.4582380056381226, 1.5062472820281982]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 12.0, 5.0, 12.0, 14.0, 18.0, 22.0, 23.0, 23.0, 29.0, 28.0, 34.0, 39.0, 43.0, 34.0, 30.0, 35.0, 38.0, 45.0, 41.0, 39.0, 34.0, 40.0, 43.0, 40.0, 36.0, 28.0, 18.0, 34.0, 23.0, 12.0, 23.0, 14.0, 10.0, 14.0, 15.0, 8.0, 4.0, 7.0, 11.0, 7.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.999873161315918, -0.9706754088401794, -0.9414777159690857, -0.9122799634933472, -0.8830822706222534, -0.8538845181465149, -0.8246867656707764, -0.7954890727996826, -0.7662913799285889, -0.7370936274528503, -0.7078959345817566, -0.6786981821060181, -0.6495004892349243, -0.6203027367591858, -0.5911049842834473, -0.5619072914123535, -0.532709538936615, -0.5035117864608765, -0.4743140935897827, -0.4451163411140442, -0.41591864824295044, -0.3867208957672119, -0.3575231730937958, -0.32832545042037964, -0.2991277277469635, -0.26993000507354736, -0.24073228240013123, -0.2115345448255539, -0.18233682215213776, -0.15313909947872162, -0.12394136190414429, -0.09474363923072815, -0.06554597616195679, -0.03634824976325035, -0.007150523364543915, 0.02204720675945282, 0.05124492943286896, 0.0804426521062851, 0.10964038968086243, 0.13883811235427856, 0.1680358350276947, 0.19723355770111084, 0.22643128037452698, 0.2556290030479431, 0.28482675552368164, 0.3140244483947754, 0.3432222008705139, 0.37241992354393005, 0.4016176462173462, 0.43081536889076233, 0.46001309156417847, 0.489210844039917, 0.5184085369110107, 0.5476062893867493, 0.5768040418624878, 0.6060017347335815, 0.6351994276046753, 0.6643971800804138, 0.6935948729515076, 0.7227926254272461, 0.7519903182983398, 0.7811880707740784, 0.8103858232498169, 0.8395835161209106, 0.8687812685966492]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 10.0, 11.0, 23.0, 48.0, 76.0, 86.0, 154.0, 228.0, 424.0, 616.0, 877.0, 1482.0, 2232.0, 3495.0, 5394.0, 8185.0, 12522.0, 18719.0, 26972.0, 38317.0, 52104.0, 68538.0, 84633.0, 98160.0, 105484.0, 106325.0, 97266.0, 83393.0, 66853.0, 50854.0, 37206.0, 25735.0, 17828.0, 11861.0, 7833.0, 5104.0, 3333.0, 2149.0, 1460.0, 932.0, 580.0, 362.0, 280.0, 153.0, 89.0, 65.0, 35.0, 29.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.81005859375, -0.7847061157226562, -0.7593536376953125, -0.7340011596679688, -0.708648681640625, -0.6832962036132812, -0.6579437255859375, -0.6325912475585938, -0.60723876953125, -0.5818862915039062, -0.5565338134765625, -0.5311813354492188, -0.505828857421875, -0.48047637939453125, -0.4551239013671875, -0.42977142333984375, -0.4044189453125, -0.37906646728515625, -0.3537139892578125, -0.32836151123046875, -0.303009033203125, -0.27765655517578125, -0.2523040771484375, -0.22695159912109375, -0.20159912109375, -0.17624664306640625, -0.1508941650390625, -0.12554168701171875, -0.100189208984375, -0.07483673095703125, -0.0494842529296875, -0.02413177490234375, 0.001220703125, 0.02657318115234375, 0.0519256591796875, 0.07727813720703125, 0.102630615234375, 0.12798309326171875, 0.1533355712890625, 0.17868804931640625, 0.20404052734375, 0.22939300537109375, 0.2547454833984375, 0.28009796142578125, 0.305450439453125, 0.33080291748046875, 0.3561553955078125, 0.38150787353515625, 0.4068603515625, 0.43221282958984375, 0.4575653076171875, 0.48291778564453125, 0.508270263671875, 0.5336227416992188, 0.5589752197265625, 0.5843276977539062, 0.60968017578125, 0.6350326538085938, 0.6603851318359375, 0.6857376098632812, 0.711090087890625, 0.7364425659179688, 0.7617950439453125, 0.7871475219726562, 0.8125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 14.0, 11.0, 13.0, 17.0, 17.0, 22.0, 19.0, 26.0, 24.0, 36.0, 34.0, 36.0, 34.0, 41.0, 37.0, 41.0, 41.0, 28.0, 54.0, 39.0, 34.0, 39.0, 49.0, 29.0, 28.0, 27.0, 20.0, 22.0, 24.0, 23.0, 15.0, 16.0, 10.0, 13.0, 14.0, 10.0, 8.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0791015625, -1.04779052734375, -1.0164794921875, -0.98516845703125, -0.953857421875, -0.92254638671875, -0.8912353515625, -0.85992431640625, -0.82861328125, -0.79730224609375, -0.7659912109375, -0.73468017578125, -0.703369140625, -0.67205810546875, -0.6407470703125, -0.60943603515625, -0.578125, -0.54681396484375, -0.5155029296875, -0.48419189453125, -0.452880859375, -0.42156982421875, -0.3902587890625, -0.35894775390625, -0.32763671875, -0.29632568359375, -0.2650146484375, -0.23370361328125, -0.202392578125, -0.17108154296875, -0.1397705078125, -0.10845947265625, -0.0771484375, -0.04583740234375, -0.0145263671875, 0.01678466796875, 0.048095703125, 0.07940673828125, 0.1107177734375, 0.14202880859375, 0.17333984375, 0.20465087890625, 0.2359619140625, 0.26727294921875, 0.298583984375, 0.32989501953125, 0.3612060546875, 0.39251708984375, 0.423828125, 0.45513916015625, 0.4864501953125, 0.51776123046875, 0.549072265625, 0.58038330078125, 0.6116943359375, 0.64300537109375, 0.67431640625, 0.70562744140625, 0.7369384765625, 0.76824951171875, 0.799560546875, 0.83087158203125, 0.8621826171875, 0.89349365234375, 0.9248046875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 13.0, 20.0, 29.0, 44.0, 67.0, 101.0, 148.0, 276.0, 357.0, 662.0, 1004.0, 1583.0, 2454.0, 4004.0, 6099.0, 9600.0, 15093.0, 22473.0, 32911.0, 46223.0, 62955.0, 80810.0, 97359.0, 108282.0, 110793.0, 103765.0, 90898.0, 73331.0, 55579.0, 40128.0, 28018.0, 18925.0, 12409.0, 8120.0, 5110.0, 3319.0, 2035.0, 1259.0, 846.0, 519.0, 318.0, 219.0, 143.0, 86.0, 58.0, 45.0, 18.0, 13.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8521575927734375, -0.824920654296875, -0.7976837158203125, -0.77044677734375, -0.7432098388671875, -0.715972900390625, -0.6887359619140625, -0.6614990234375, -0.6342620849609375, -0.607025146484375, -0.5797882080078125, -0.55255126953125, -0.5253143310546875, -0.498077392578125, -0.4708404541015625, -0.443603515625, -0.4163665771484375, -0.389129638671875, -0.3618927001953125, -0.33465576171875, -0.3074188232421875, -0.280181884765625, -0.2529449462890625, -0.2257080078125, -0.1984710693359375, -0.171234130859375, -0.1439971923828125, -0.11676025390625, -0.0895233154296875, -0.062286376953125, -0.0350494384765625, -0.0078125, 0.0194244384765625, 0.046661376953125, 0.0738983154296875, 0.10113525390625, 0.1283721923828125, 0.155609130859375, 0.1828460693359375, 0.2100830078125, 0.2373199462890625, 0.264556884765625, 0.2917938232421875, 0.31903076171875, 0.3462677001953125, 0.373504638671875, 0.4007415771484375, 0.427978515625, 0.4552154541015625, 0.482452392578125, 0.5096893310546875, 0.53692626953125, 0.5641632080078125, 0.591400146484375, 0.6186370849609375, 0.6458740234375, 0.6731109619140625, 0.700347900390625, 0.7275848388671875, 0.75482177734375, 0.7820587158203125, 0.809295654296875, 0.8365325927734375, 0.86376953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 17.0, 12.0, 17.0, 18.0, 12.0, 18.0, 21.0, 23.0, 33.0, 25.0, 30.0, 18.0, 29.0, 42.0, 31.0, 35.0, 46.0, 48.0, 29.0, 45.0, 41.0, 33.0, 28.0, 36.0, 31.0, 30.0, 30.0, 33.0, 26.0, 22.0, 17.0, 19.0, 15.0, 9.0, 12.0, 4.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.546875, -0.5294418334960938, -0.5120086669921875, -0.49457550048828125, -0.477142333984375, -0.45970916748046875, -0.4422760009765625, -0.42484283447265625, -0.40740966796875, -0.38997650146484375, -0.3725433349609375, -0.35511016845703125, -0.337677001953125, -0.32024383544921875, -0.3028106689453125, -0.28537750244140625, -0.2679443359375, -0.25051116943359375, -0.2330780029296875, -0.21564483642578125, -0.198211669921875, -0.18077850341796875, -0.1633453369140625, -0.14591217041015625, -0.12847900390625, -0.11104583740234375, -0.0936126708984375, -0.07617950439453125, -0.058746337890625, -0.04131317138671875, -0.0238800048828125, -0.00644683837890625, 0.010986328125, 0.02841949462890625, 0.0458526611328125, 0.06328582763671875, 0.080718994140625, 0.09815216064453125, 0.1155853271484375, 0.13301849365234375, 0.15045166015625, 0.16788482666015625, 0.1853179931640625, 0.20275115966796875, 0.220184326171875, 0.23761749267578125, 0.2550506591796875, 0.27248382568359375, 0.2899169921875, 0.30735015869140625, 0.3247833251953125, 0.34221649169921875, 0.359649658203125, 0.37708282470703125, 0.3945159912109375, 0.41194915771484375, 0.42938232421875, 0.44681549072265625, 0.4642486572265625, 0.48168182373046875, 0.499114990234375, 0.5165481567382812, 0.5339813232421875, 0.5514144897460938, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 12.0, 23.0, 47.0, 69.0, 102.0, 148.0, 236.0, 362.0, 641.0, 980.0, 1418.0, 2274.0, 3591.0, 5607.0, 8773.0, 13739.0, 21428.0, 32919.0, 49663.0, 71792.0, 96924.0, 120999.0, 132617.0, 127312.0, 107304.0, 81767.0, 57413.0, 38751.0, 25680.0, 16575.0, 10579.0, 6772.0, 4415.0, 2838.0, 1642.0, 1159.0, 706.0, 486.0, 295.0, 164.0, 128.0, 68.0, 59.0, 26.0, 19.0, 11.0, 11.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45325469970703125, -0.4384918212890625, -0.42372894287109375, -0.408966064453125, -0.39420318603515625, -0.3794403076171875, -0.36467742919921875, -0.34991455078125, -0.33515167236328125, -0.3203887939453125, -0.30562591552734375, -0.290863037109375, -0.27610015869140625, -0.2613372802734375, -0.24657440185546875, -0.2318115234375, -0.21704864501953125, -0.2022857666015625, -0.18752288818359375, -0.172760009765625, -0.15799713134765625, -0.1432342529296875, -0.12847137451171875, -0.11370849609375, -0.09894561767578125, -0.0841827392578125, -0.06941986083984375, -0.054656982421875, -0.03989410400390625, -0.0251312255859375, -0.01036834716796875, 0.00439453125, 0.01915740966796875, 0.0339202880859375, 0.04868316650390625, 0.063446044921875, 0.07820892333984375, 0.0929718017578125, 0.10773468017578125, 0.12249755859375, 0.13726043701171875, 0.1520233154296875, 0.16678619384765625, 0.181549072265625, 0.19631195068359375, 0.2110748291015625, 0.22583770751953125, 0.2406005859375, 0.25536346435546875, 0.2701263427734375, 0.28488922119140625, 0.299652099609375, 0.31441497802734375, 0.3291778564453125, 0.34394073486328125, 0.35870361328125, 0.37346649169921875, 0.3882293701171875, 0.40299224853515625, 0.417755126953125, 0.43251800537109375, 0.4472808837890625, 0.46204376220703125, 0.476806640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 12.0, 7.0, 8.0, 3.0, 14.0, 16.0, 24.0, 21.0, 35.0, 26.0, 43.0, 54.0, 50.0, 47.0, 54.0, 48.0, 53.0, 57.0, 50.0, 47.0, 45.0, 49.0, 34.0, 37.0, 35.0, 26.0, 25.0, 18.0, 17.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.739927291870117e-05, -5.577225238084793e-05, -5.414523184299469e-05, -5.251821130514145e-05, -5.089119076728821e-05, -4.926417022943497e-05, -4.7637149691581726e-05, -4.6010129153728485e-05, -4.4383108615875244e-05, -4.2756088078022e-05, -4.112906754016876e-05, -3.950204700231552e-05, -3.787502646446228e-05, -3.624800592660904e-05, -3.46209853887558e-05, -3.299396485090256e-05, -3.1366944313049316e-05, -2.9739923775196075e-05, -2.8112903237342834e-05, -2.6485882699489594e-05, -2.4858862161636353e-05, -2.323184162378311e-05, -2.160482108592987e-05, -1.997780054807663e-05, -1.835078001022339e-05, -1.6723759472370148e-05, -1.5096738934516907e-05, -1.3469718396663666e-05, -1.1842697858810425e-05, -1.0215677320957184e-05, -8.588656783103943e-06, -6.961636245250702e-06, -5.334615707397461e-06, -3.70759516954422e-06, -2.080574631690979e-06, -4.5355409383773804e-07, 1.173466444015503e-06, 2.800486981868744e-06, 4.427507519721985e-06, 6.054528057575226e-06, 7.681548595428467e-06, 9.308569133281708e-06, 1.0935589671134949e-05, 1.256261020898819e-05, 1.418963074684143e-05, 1.581665128469467e-05, 1.7443671822547913e-05, 1.9070692360401154e-05, 2.0697712898254395e-05, 2.2324733436107635e-05, 2.3951753973960876e-05, 2.5578774511814117e-05, 2.720579504966736e-05, 2.88328155875206e-05, 3.045983612537384e-05, 3.208685666322708e-05, 3.371387720108032e-05, 3.534089773893356e-05, 3.6967918276786804e-05, 3.8594938814640045e-05, 4.0221959352493286e-05, 4.184897989034653e-05, 4.347600042819977e-05, 4.510302096605301e-05, 4.673004150390625e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 14.0, 27.0, 46.0, 61.0, 116.0, 195.0, 314.0, 435.0, 773.0, 1214.0, 2107.0, 3487.0, 5866.0, 9935.0, 16769.0, 27183.0, 43301.0, 66628.0, 94840.0, 123548.0, 142199.0, 140680.0, 118615.0, 88658.0, 60800.0, 39430.0, 24270.0, 14941.0, 8973.0, 5110.0, 3178.0, 1855.0, 1107.0, 713.0, 447.0, 244.0, 173.0, 109.0, 62.0, 42.0, 34.0, 17.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49330902099609375, -0.4773406982421875, -0.46137237548828125, -0.445404052734375, -0.42943572998046875, -0.4134674072265625, -0.39749908447265625, -0.38153076171875, -0.36556243896484375, -0.3495941162109375, -0.33362579345703125, -0.317657470703125, -0.30168914794921875, -0.2857208251953125, -0.26975250244140625, -0.2537841796875, -0.23781585693359375, -0.2218475341796875, -0.20587921142578125, -0.189910888671875, -0.17394256591796875, -0.1579742431640625, -0.14200592041015625, -0.12603759765625, -0.11006927490234375, -0.0941009521484375, -0.07813262939453125, -0.062164306640625, -0.04619598388671875, -0.0302276611328125, -0.01425933837890625, 0.001708984375, 0.01767730712890625, 0.0336456298828125, 0.04961395263671875, 0.065582275390625, 0.08155059814453125, 0.0975189208984375, 0.11348724365234375, 0.12945556640625, 0.14542388916015625, 0.1613922119140625, 0.17736053466796875, 0.193328857421875, 0.20929718017578125, 0.2252655029296875, 0.24123382568359375, 0.2572021484375, 0.27317047119140625, 0.2891387939453125, 0.30510711669921875, 0.321075439453125, 0.33704376220703125, 0.3530120849609375, 0.36898040771484375, 0.38494873046875, 0.40091705322265625, 0.4168853759765625, 0.43285369873046875, 0.448822021484375, 0.46479034423828125, 0.4807586669921875, 0.49672698974609375, 0.5126953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 17.0, 9.0, 11.0, 12.0, 19.0, 17.0, 23.0, 29.0, 24.0, 37.0, 37.0, 33.0, 32.0, 41.0, 34.0, 43.0, 53.0, 50.0, 48.0, 50.0, 45.0, 54.0, 36.0, 32.0, 28.0, 24.0, 26.0, 17.0, 20.0, 15.0, 11.0, 13.0, 14.0, 6.0, 7.0, 8.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.1547374725341797, -0.15017318725585938, -0.14560890197753906, -0.14104461669921875, -0.13648033142089844, -0.13191604614257812, -0.1273517608642578, -0.1227874755859375, -0.11822319030761719, -0.11365890502929688, -0.10909461975097656, -0.10453033447265625, -0.09996604919433594, -0.09540176391601562, -0.09083747863769531, -0.086273193359375, -0.08170890808105469, -0.07714462280273438, -0.07258033752441406, -0.06801605224609375, -0.06345176696777344, -0.058887481689453125, -0.05432319641113281, -0.0497589111328125, -0.04519462585449219, -0.040630340576171875, -0.03606605529785156, -0.03150177001953125, -0.026937484741210938, -0.022373199462890625, -0.017808914184570312, -0.01324462890625, -0.008680343627929688, -0.004116058349609375, 0.0004482269287109375, 0.00501251220703125, 0.009576797485351562, 0.014141082763671875, 0.018705368041992188, 0.0232696533203125, 0.027833938598632812, 0.032398223876953125, 0.03696250915527344, 0.04152679443359375, 0.04609107971191406, 0.050655364990234375, 0.05521965026855469, 0.059783935546875, 0.06434822082519531, 0.06891250610351562, 0.07347679138183594, 0.07804107666015625, 0.08260536193847656, 0.08716964721679688, 0.09173393249511719, 0.0962982177734375, 0.10086250305175781, 0.10542678833007812, 0.10999107360839844, 0.11455535888671875, 0.11911964416503906, 0.12368392944335938, 0.1282482147216797, 0.1328125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 7.0, 8.0, 6.0, 11.0, 11.0, 18.0, 17.0, 22.0, 28.0, 35.0, 44.0, 45.0, 47.0, 43.0, 42.0, 49.0, 56.0, 61.0, 54.0, 46.0, 47.0, 38.0, 41.0, 40.0, 34.0, 27.0, 24.0, 23.0, 13.0, 15.0, 10.0, 6.0, 9.0, 5.0, 5.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.5691479444503784, -1.5247411727905273, -1.4803344011306763, -1.4359276294708252, -1.3915208578109741, -1.347114086151123, -1.302707314491272, -1.258300542831421, -1.2138937711715698, -1.1694869995117188, -1.1250802278518677, -1.0806734561920166, -1.0362666845321655, -0.9918599128723145, -0.9474531412124634, -0.9030463695526123, -0.858639657497406, -0.8142328858375549, -0.7698261141777039, -0.7254193425178528, -0.6810125708580017, -0.6366057991981506, -0.5921990871429443, -0.5477923154830933, -0.5033855438232422, -0.4589787721633911, -0.41457200050354004, -0.37016522884368896, -0.3257584571838379, -0.2813516855239868, -0.23694494366645813, -0.19253817200660706, -0.1481313705444336, -0.10372459888458252, -0.05931783467531204, -0.014911070466041565, 0.02949570119380951, 0.07390247285366058, 0.11830922961235046, 0.16271600127220154, 0.2071227729320526, 0.2515295445919037, 0.29593631625175476, 0.34034305810928345, 0.3847498297691345, 0.4291566014289856, 0.47356337308883667, 0.5179701447486877, 0.5623769164085388, 0.6067836880683899, 0.651190459728241, 0.695597231388092, 0.7400040030479431, 0.7844107747077942, 0.8288174867630005, 0.8732242584228516, 0.9176310300827026, 0.9620378017425537, 1.0064445734024048, 1.0508513450622559, 1.095258116722107, 1.139664888381958, 1.184071660041809, 1.2284784317016602, 1.2728852033615112]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 3.0, 1.0, 11.0, 7.0, 14.0, 14.0, 17.0, 23.0, 14.0, 32.0, 18.0, 27.0, 26.0, 38.0, 34.0, 32.0, 37.0, 31.0, 40.0, 43.0, 31.0, 47.0, 36.0, 26.0, 32.0, 33.0, 23.0, 25.0, 33.0, 29.0, 31.0, 23.0, 21.0, 28.0, 21.0, 19.0, 6.0, 7.0, 6.0, 10.0, 5.0, 9.0, 8.0, 8.0, 5.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8512454032897949, -0.823173463344574, -0.795101523399353, -0.7670295834541321, -0.7389576435089111, -0.7108856439590454, -0.6828137040138245, -0.6547417640686035, -0.6266698241233826, -0.5985978841781616, -0.5705259442329407, -0.5424540042877197, -0.514382004737854, -0.48631009459495544, -0.4582381248474121, -0.43016618490219116, -0.4020942449569702, -0.37402230501174927, -0.3459503650665283, -0.317878395318985, -0.28980645537376404, -0.2617345154285431, -0.23366256058216095, -0.2055906057357788, -0.17751866579055786, -0.14944672584533691, -0.12137477099895477, -0.09330282360315323, -0.06523087620735168, -0.03715893626213074, -0.009086981415748596, 0.018984973430633545, 0.04705685377120972, 0.07512880116701126, 0.1032007485628128, 0.13127270340919495, 0.1593446433544159, 0.18741658329963684, 0.21548853814601898, 0.24356049299240112, 0.27163243293762207, 0.299704372882843, 0.32777631282806396, 0.3558482825756073, 0.38392022252082825, 0.4119921624660492, 0.44006413221359253, 0.4681360721588135, 0.4962080121040344, 0.5242799520492554, 0.5523518919944763, 0.5804238319396973, 0.608495831489563, 0.6365677118301392, 0.6646397113800049, 0.6927116513252258, 0.7207835912704468, 0.7488555312156677, 0.7769274711608887, 0.8049994111061096, 0.8330713510513306, 0.8611433506011963, 0.8892152905464172, 0.9172872304916382, 0.9453591704368591]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 14.0, 13.0, 21.0, 48.0, 64.0, 116.0, 182.0, 321.0, 636.0, 1056.0, 1945.0, 3825.0, 7265.0, 14544.0, 28719.0, 57960.0, 116626.0, 230718.0, 419027.0, 664369.0, 820548.0, 738583.0, 502134.0, 286032.0, 149223.0, 74702.0, 37259.0, 18699.0, 9440.0, 4701.0, 2513.0, 1301.0, 746.0, 417.0, 191.0, 134.0, 85.0, 44.0, 21.0, 17.0, 7.0, 6.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5625, -1.5160980224609375, -1.469696044921875, -1.4232940673828125, -1.37689208984375, -1.3304901123046875, -1.284088134765625, -1.2376861572265625, -1.1912841796875, -1.1448822021484375, -1.098480224609375, -1.0520782470703125, -1.00567626953125, -0.9592742919921875, -0.912872314453125, -0.8664703369140625, -0.820068359375, -0.7736663818359375, -0.727264404296875, -0.6808624267578125, -0.63446044921875, -0.5880584716796875, -0.541656494140625, -0.4952545166015625, -0.4488525390625, -0.4024505615234375, -0.356048583984375, -0.3096466064453125, -0.26324462890625, -0.2168426513671875, -0.170440673828125, -0.1240386962890625, -0.07763671875, -0.0312347412109375, 0.015167236328125, 0.0615692138671875, 0.10797119140625, 0.1543731689453125, 0.200775146484375, 0.2471771240234375, 0.2935791015625, 0.3399810791015625, 0.386383056640625, 0.4327850341796875, 0.47918701171875, 0.5255889892578125, 0.571990966796875, 0.6183929443359375, 0.664794921875, 0.7111968994140625, 0.757598876953125, 0.8040008544921875, 0.85040283203125, 0.8968048095703125, 0.943206787109375, 0.9896087646484375, 1.0360107421875, 1.0824127197265625, 1.128814697265625, 1.1752166748046875, 1.22161865234375, 1.2680206298828125, 1.314422607421875, 1.3608245849609375, 1.4072265625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 14.0, 13.0, 15.0, 18.0, 37.0, 25.0, 29.0, 32.0, 29.0, 33.0, 33.0, 42.0, 39.0, 47.0, 38.0, 48.0, 35.0, 49.0, 52.0, 39.0, 34.0, 36.0, 28.0, 29.0, 32.0, 18.0, 22.0, 17.0, 14.0, 12.0, 8.0, 12.0, 14.0, 4.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.75732421875, -0.73187255859375, -0.7064208984375, -0.68096923828125, -0.655517578125, -0.63006591796875, -0.6046142578125, -0.57916259765625, -0.5537109375, -0.52825927734375, -0.5028076171875, -0.47735595703125, -0.451904296875, -0.42645263671875, -0.4010009765625, -0.37554931640625, -0.35009765625, -0.32464599609375, -0.2991943359375, -0.27374267578125, -0.248291015625, -0.22283935546875, -0.1973876953125, -0.17193603515625, -0.146484375, -0.12103271484375, -0.0955810546875, -0.07012939453125, -0.044677734375, -0.01922607421875, 0.0062255859375, 0.03167724609375, 0.05712890625, 0.08258056640625, 0.1080322265625, 0.13348388671875, 0.158935546875, 0.18438720703125, 0.2098388671875, 0.23529052734375, 0.2607421875, 0.28619384765625, 0.3116455078125, 0.33709716796875, 0.362548828125, 0.38800048828125, 0.4134521484375, 0.43890380859375, 0.46435546875, 0.48980712890625, 0.5152587890625, 0.54071044921875, 0.566162109375, 0.59161376953125, 0.6170654296875, 0.64251708984375, 0.66796875, 0.69342041015625, 0.7188720703125, 0.74432373046875, 0.769775390625, 0.79522705078125, 0.8206787109375, 0.84613037109375, 0.87158203125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 10.0, 15.0, 29.0, 49.0, 59.0, 101.0, 147.0, 208.0, 345.0, 565.0, 924.0, 1485.0, 2386.0, 3765.0, 5901.0, 9598.0, 15752.0, 25186.0, 39861.0, 63095.0, 98882.0, 148523.0, 217341.0, 302422.0, 391982.0, 468376.0, 502358.0, 479228.0, 411582.0, 320062.0, 232448.0, 160558.0, 105881.0, 69419.0, 43298.0, 27452.0, 16920.0, 10505.0, 6654.0, 4075.0, 2620.0, 1543.0, 991.0, 646.0, 381.0, 258.0, 134.0, 80.0, 75.0, 29.0, 29.0, 21.0, 10.0, 7.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.97314453125, -0.9413375854492188, -0.9095306396484375, -0.8777236938476562, -0.845916748046875, -0.8141098022460938, -0.7823028564453125, -0.7504959106445312, -0.71868896484375, -0.6868820190429688, -0.6550750732421875, -0.6232681274414062, -0.591461181640625, -0.5596542358398438, -0.5278472900390625, -0.49604034423828125, -0.4642333984375, -0.43242645263671875, -0.4006195068359375, -0.36881256103515625, -0.337005615234375, -0.30519866943359375, -0.2733917236328125, -0.24158477783203125, -0.20977783203125, -0.17797088623046875, -0.1461639404296875, -0.11435699462890625, -0.082550048828125, -0.05074310302734375, -0.0189361572265625, 0.01287078857421875, 0.044677734375, 0.07648468017578125, 0.1082916259765625, 0.14009857177734375, 0.171905517578125, 0.20371246337890625, 0.2355194091796875, 0.26732635498046875, 0.29913330078125, 0.33094024658203125, 0.3627471923828125, 0.39455413818359375, 0.426361083984375, 0.45816802978515625, 0.4899749755859375, 0.5217819213867188, 0.5535888671875, 0.5853958129882812, 0.6172027587890625, 0.6490097045898438, 0.680816650390625, 0.7126235961914062, 0.7444305419921875, 0.7762374877929688, 0.80804443359375, 0.8398513793945312, 0.8716583251953125, 0.9034652709960938, 0.935272216796875, 0.9670791625976562, 0.9988861083984375, 1.0306930541992188, 1.0625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 24.0, 16.0, 21.0, 33.0, 30.0, 47.0, 66.0, 62.0, 90.0, 85.0, 91.0, 122.0, 112.0, 157.0, 172.0, 160.0, 202.0, 196.0, 209.0, 175.0, 189.0, 207.0, 182.0, 204.0, 166.0, 154.0, 135.0, 126.0, 108.0, 84.0, 69.0, 65.0, 54.0, 41.0, 54.0, 28.0, 40.0, 20.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.392578125, -0.3801116943359375, -0.367645263671875, -0.3551788330078125, -0.34271240234375, -0.3302459716796875, -0.317779541015625, -0.3053131103515625, -0.2928466796875, -0.2803802490234375, -0.267913818359375, -0.2554473876953125, -0.24298095703125, -0.2305145263671875, -0.218048095703125, -0.2055816650390625, -0.193115234375, -0.1806488037109375, -0.168182373046875, -0.1557159423828125, -0.14324951171875, -0.1307830810546875, -0.118316650390625, -0.1058502197265625, -0.0933837890625, -0.0809173583984375, -0.068450927734375, -0.0559844970703125, -0.04351806640625, -0.0310516357421875, -0.018585205078125, -0.0061187744140625, 0.00634765625, 0.0188140869140625, 0.031280517578125, 0.0437469482421875, 0.05621337890625, 0.0686798095703125, 0.081146240234375, 0.0936126708984375, 0.1060791015625, 0.1185455322265625, 0.131011962890625, 0.1434783935546875, 0.15594482421875, 0.1684112548828125, 0.180877685546875, 0.1933441162109375, 0.205810546875, 0.2182769775390625, 0.230743408203125, 0.2432098388671875, 0.25567626953125, 0.2681427001953125, 0.280609130859375, 0.2930755615234375, 0.3055419921875, 0.3180084228515625, 0.330474853515625, 0.3429412841796875, 0.35540771484375, 0.3678741455078125, 0.380340576171875, 0.3928070068359375, 0.4052734375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 17.0, 32.0, 32.0, 19.0, 50.0, 41.0, 49.0, 57.0, 63.0, 61.0, 41.0, 55.0, 33.0, 43.0, 47.0, 27.0, 34.0, 34.0, 30.0, 18.0, 13.0, 19.0, 16.0, 10.0, 15.0, 13.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.5239067077636719, -1.4816919565200806, -1.4394772052764893, -1.397262454032898, -1.3550477027893066, -1.3128328323364258, -1.2706180810928345, -1.2284033298492432, -1.1861885786056519, -1.1439738273620605, -1.1017590761184692, -1.059544324874878, -1.017329454421997, -0.9751147627830505, -0.9328999519348145, -0.8906852006912231, -0.8484704494476318, -0.8062556982040405, -0.7640409469604492, -0.7218261361122131, -0.6796113848686218, -0.6373966336250305, -0.5951818227767944, -0.5529670715332031, -0.5107523202896118, -0.4685375690460205, -0.4263227880001068, -0.3841080069541931, -0.3418932557106018, -0.2996785044670105, -0.2574637234210968, -0.2152489423751831, -0.17303407192230225, -0.13081930577754974, -0.08860453963279724, -0.04638977348804474, -0.004175007343292236, 0.038039758801460266, 0.08025452494621277, 0.12246930599212646, 0.16468405723571777, 0.20689882338047028, 0.24911358952522278, 0.2913283705711365, 0.3335431218147278, 0.3757578730583191, 0.4179726541042328, 0.4601874351501465, 0.5024021863937378, 0.5446169376373291, 0.5868316888809204, 0.6290464997291565, 0.6712612509727478, 0.7134760022163391, 0.7556908130645752, 0.7979055643081665, 0.8401203155517578, 0.8823350667953491, 0.9245498180389404, 0.9667646288871765, 1.008979320526123, 1.051194190979004, 1.0934089422225952, 1.1356236934661865, 1.1778384447097778]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 15.0, 12.0, 22.0, 14.0, 18.0, 17.0, 24.0, 38.0, 25.0, 29.0, 32.0, 31.0, 44.0, 37.0, 43.0, 28.0, 41.0, 32.0, 44.0, 34.0, 46.0, 40.0, 34.0, 33.0, 35.0, 27.0, 32.0, 27.0, 20.0, 15.0, 16.0, 9.0, 15.0, 12.0, 8.0, 7.0, 9.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8927128911018372, -0.8629211783409119, -0.8331294655799866, -0.8033376932144165, -0.7735459804534912, -0.7437542676925659, -0.7139625549316406, -0.6841708421707153, -0.65437912940979, -0.6245874166488647, -0.5947957038879395, -0.5650039911270142, -0.5352122187614441, -0.5054205060005188, -0.4756287932395935, -0.4458370804786682, -0.41604530811309814, -0.38625359535217285, -0.35646185278892517, -0.3266701400279999, -0.2968783974647522, -0.2670866847038269, -0.2372949719429016, -0.20750324428081512, -0.17771151661872864, -0.14791978895664215, -0.11812806874513626, -0.08833634853363037, -0.058544620871543884, -0.028752893209457397, 0.0010388195514678955, 0.030830547213554382, 0.060622334480285645, 0.09041406214237213, 0.12020578235387802, 0.1499975025653839, 0.1797892302274704, 0.20958095788955688, 0.23937267065048218, 0.26916438341140747, 0.29895612597465515, 0.32874783873558044, 0.3585395812988281, 0.3883312940597534, 0.4181230068206787, 0.4479147493839264, 0.4777064621448517, 0.5074982047080994, 0.5372899174690247, 0.56708163022995, 0.5968733429908752, 0.6266651153564453, 0.6564568281173706, 0.6862485408782959, 0.7160402536392212, 0.7458319664001465, 0.7756236791610718, 0.8054153919219971, 0.8352071046829224, 0.8649988174438477, 0.8947905898094177, 0.924582302570343, 0.9543740153312683, 0.9841657280921936, 1.0139575004577637]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 17.0, 36.0, 47.0, 64.0, 99.0, 135.0, 252.0, 363.0, 579.0, 888.0, 1426.0, 2285.0, 3651.0, 5875.0, 9740.0, 16518.0, 27680.0, 46405.0, 75989.0, 122123.0, 171544.0, 184211.0, 142336.0, 93330.0, 57356.0, 34168.0, 20107.0, 12079.0, 7463.0, 4430.0, 2690.0, 1632.0, 1083.0, 690.0, 426.0, 295.0, 154.0, 122.0, 75.0, 57.0, 37.0, 25.0, 16.0, 15.0, 5.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.287109375, -0.2779083251953125, -0.268707275390625, -0.2595062255859375, -0.25030517578125, -0.2411041259765625, -0.231903076171875, -0.2227020263671875, -0.2135009765625, -0.2042999267578125, -0.195098876953125, -0.1858978271484375, -0.17669677734375, -0.1674957275390625, -0.158294677734375, -0.1490936279296875, -0.139892578125, -0.1306915283203125, -0.121490478515625, -0.1122894287109375, -0.10308837890625, -0.0938873291015625, -0.084686279296875, -0.0754852294921875, -0.0662841796875, -0.0570831298828125, -0.047882080078125, -0.0386810302734375, -0.02947998046875, -0.0202789306640625, -0.011077880859375, -0.0018768310546875, 0.00732421875, 0.0165252685546875, 0.025726318359375, 0.0349273681640625, 0.04412841796875, 0.0533294677734375, 0.062530517578125, 0.0717315673828125, 0.0809326171875, 0.0901336669921875, 0.099334716796875, 0.1085357666015625, 0.11773681640625, 0.1269378662109375, 0.136138916015625, 0.1453399658203125, 0.154541015625, 0.1637420654296875, 0.172943115234375, 0.1821441650390625, 0.19134521484375, 0.2005462646484375, 0.209747314453125, 0.2189483642578125, 0.2281494140625, 0.2373504638671875, 0.246551513671875, 0.2557525634765625, 0.26495361328125, 0.2741546630859375, 0.283355712890625, 0.2925567626953125, 0.3017578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 5.0, 10.0, 8.0, 10.0, 15.0, 17.0, 18.0, 29.0, 31.0, 34.0, 31.0, 39.0, 38.0, 55.0, 50.0, 34.0, 43.0, 34.0, 47.0, 49.0, 50.0, 48.0, 47.0, 50.0, 32.0, 38.0, 18.0, 24.0, 28.0, 17.0, 9.0, 5.0, 10.0, 11.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0746002197265625, -1.036895751953125, -0.9991912841796875, -0.96148681640625, -0.9237823486328125, -0.886077880859375, -0.8483734130859375, -0.8106689453125, -0.7729644775390625, -0.735260009765625, -0.6975555419921875, -0.65985107421875, -0.6221466064453125, -0.584442138671875, -0.5467376708984375, -0.509033203125, -0.4713287353515625, -0.433624267578125, -0.3959197998046875, -0.35821533203125, -0.3205108642578125, -0.282806396484375, -0.2451019287109375, -0.2073974609375, -0.1696929931640625, -0.131988525390625, -0.0942840576171875, -0.05657958984375, -0.0188751220703125, 0.018829345703125, 0.0565338134765625, 0.09423828125, 0.1319427490234375, 0.169647216796875, 0.2073516845703125, 0.24505615234375, 0.2827606201171875, 0.320465087890625, 0.3581695556640625, 0.3958740234375, 0.4335784912109375, 0.471282958984375, 0.5089874267578125, 0.54669189453125, 0.5843963623046875, 0.622100830078125, 0.6598052978515625, 0.697509765625, 0.7352142333984375, 0.772918701171875, 0.8106231689453125, 0.84832763671875, 0.8860321044921875, 0.923736572265625, 0.9614410400390625, 0.9991455078125, 1.0368499755859375, 1.074554443359375, 1.1122589111328125, 1.14996337890625, 1.1876678466796875, 1.225372314453125, 1.2630767822265625, 1.30078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 10.0, 6.0, 10.0, 19.0, 26.0, 31.0, 48.0, 78.0, 92.0, 183.0, 287.0, 428.0, 713.0, 1215.0, 2119.0, 3675.0, 6701.0, 12524.0, 24172.0, 47481.0, 92232.0, 167658.0, 238107.0, 202878.0, 118327.0, 62149.0, 31329.0, 16273.0, 8631.0, 4754.0, 2584.0, 1481.0, 870.0, 511.0, 345.0, 192.0, 136.0, 91.0, 63.0, 40.0, 21.0, 21.0, 16.0, 8.0, 11.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.39501953125, -0.3829383850097656, -0.37085723876953125, -0.3587760925292969, -0.3466949462890625, -0.3346138000488281, -0.32253265380859375, -0.3104515075683594, -0.298370361328125, -0.2862892150878906, -0.27420806884765625, -0.2621269226074219, -0.2500457763671875, -0.23796463012695312, -0.22588348388671875, -0.21380233764648438, -0.20172119140625, -0.18964004516601562, -0.17755889892578125, -0.16547775268554688, -0.1533966064453125, -0.14131546020507812, -0.12923431396484375, -0.11715316772460938, -0.105072021484375, -0.09299087524414062, -0.08090972900390625, -0.06882858276367188, -0.0567474365234375, -0.044666290283203125, -0.03258514404296875, -0.020503997802734375, -0.0084228515625, 0.003658294677734375, 0.01573944091796875, 0.027820587158203125, 0.0399017333984375, 0.051982879638671875, 0.06406402587890625, 0.07614517211914062, 0.088226318359375, 0.10030746459960938, 0.11238861083984375, 0.12446975708007812, 0.1365509033203125, 0.14863204956054688, 0.16071319580078125, 0.17279434204101562, 0.18487548828125, 0.19695663452148438, 0.20903778076171875, 0.22111892700195312, 0.2332000732421875, 0.24528121948242188, 0.25736236572265625, 0.2694435119628906, 0.281524658203125, 0.2936058044433594, 0.30568695068359375, 0.3177680969238281, 0.3298492431640625, 0.3419303894042969, 0.35401153564453125, 0.3660926818847656, 0.378173828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 6.0, 4.0, 6.0, 1.0, 10.0, 11.0, 15.0, 17.0, 23.0, 20.0, 11.0, 32.0, 27.0, 31.0, 29.0, 39.0, 31.0, 37.0, 23.0, 50.0, 35.0, 32.0, 39.0, 45.0, 44.0, 27.0, 36.0, 28.0, 33.0, 29.0, 37.0, 25.0, 18.0, 22.0, 16.0, 13.0, 13.0, 10.0, 12.0, 11.0, 16.0, 5.0, 4.0, 9.0, 1.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.5888671875, -0.5704879760742188, -0.5521087646484375, -0.5337295532226562, -0.515350341796875, -0.49697113037109375, -0.4785919189453125, -0.46021270751953125, -0.44183349609375, -0.42345428466796875, -0.4050750732421875, -0.38669586181640625, -0.368316650390625, -0.34993743896484375, -0.3315582275390625, -0.31317901611328125, -0.2947998046875, -0.27642059326171875, -0.2580413818359375, -0.23966217041015625, -0.221282958984375, -0.20290374755859375, -0.1845245361328125, -0.16614532470703125, -0.14776611328125, -0.12938690185546875, -0.1110076904296875, -0.09262847900390625, -0.074249267578125, -0.05587005615234375, -0.0374908447265625, -0.01911163330078125, -0.000732421875, 0.01764678955078125, 0.0360260009765625, 0.05440521240234375, 0.072784423828125, 0.09116363525390625, 0.1095428466796875, 0.12792205810546875, 0.14630126953125, 0.16468048095703125, 0.1830596923828125, 0.20143890380859375, 0.219818115234375, 0.23819732666015625, 0.2565765380859375, 0.27495574951171875, 0.2933349609375, 0.31171417236328125, 0.3300933837890625, 0.34847259521484375, 0.366851806640625, 0.38523101806640625, 0.4036102294921875, 0.42198944091796875, 0.44036865234375, 0.45874786376953125, 0.4771270751953125, 0.49550628662109375, 0.513885498046875, 0.5322647094726562, 0.5506439208984375, 0.5690231323242188, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 16.0, 33.0, 24.0, 29.0, 84.0, 87.0, 135.0, 177.0, 268.0, 419.0, 613.0, 960.0, 1519.0, 2474.0, 4525.0, 8841.0, 21741.0, 72438.0, 375292.0, 430020.0, 83585.0, 23599.0, 9634.0, 4815.0, 2649.0, 1516.0, 1006.0, 651.0, 446.0, 278.0, 229.0, 142.0, 88.0, 57.0, 41.0, 30.0, 24.0, 14.0, 11.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2736091613769531, -0.26450347900390625, -0.2553977966308594, -0.2462921142578125, -0.23718643188476562, -0.22808074951171875, -0.21897506713867188, -0.209869384765625, -0.20076370239257812, -0.19165802001953125, -0.18255233764648438, -0.1734466552734375, -0.16434097290039062, -0.15523529052734375, -0.14612960815429688, -0.13702392578125, -0.12791824340820312, -0.11881256103515625, -0.10970687866210938, -0.1006011962890625, -0.09149551391601562, -0.08238983154296875, -0.07328414916992188, -0.064178466796875, -0.055072784423828125, -0.04596710205078125, -0.036861419677734375, -0.0277557373046875, -0.018650054931640625, -0.00954437255859375, -0.000438690185546875, 0.0086669921875, 0.017772674560546875, 0.02687835693359375, 0.035984039306640625, 0.0450897216796875, 0.054195404052734375, 0.06330108642578125, 0.07240676879882812, 0.081512451171875, 0.09061813354492188, 0.09972381591796875, 0.10882949829101562, 0.1179351806640625, 0.12704086303710938, 0.13614654541015625, 0.14525222778320312, 0.15435791015625, 0.16346359252929688, 0.17256927490234375, 0.18167495727539062, 0.1907806396484375, 0.19988632202148438, 0.20899200439453125, 0.21809768676757812, 0.227203369140625, 0.23630905151367188, 0.24541473388671875, 0.2545204162597656, 0.2636260986328125, 0.2727317810058594, 0.28183746337890625, 0.2909431457519531, 0.300048828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 16.0, 29.0, 65.0, 64.0, 88.0, 110.0, 125.0, 124.0, 115.0, 89.0, 52.0, 29.0, 26.0, 15.0, 10.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1655112504959106e-05, -2.0839273929595947e-05, -2.0023435354232788e-05, -1.920759677886963e-05, -1.839175820350647e-05, -1.757591962814331e-05, -1.676008105278015e-05, -1.5944242477416992e-05, -1.5128403902053833e-05, -1.4312565326690674e-05, -1.3496726751327515e-05, -1.2680888175964355e-05, -1.1865049600601196e-05, -1.1049211025238037e-05, -1.0233372449874878e-05, -9.417533874511719e-06, -8.60169529914856e-06, -7.7858567237854e-06, -6.970018148422241e-06, -6.154179573059082e-06, -5.338340997695923e-06, -4.522502422332764e-06, -3.7066638469696045e-06, -2.8908252716064453e-06, -2.074986696243286e-06, -1.259148120880127e-06, -4.4330954551696777e-07, 3.725290298461914e-07, 1.1883676052093506e-06, 2.0042061805725098e-06, 2.820044755935669e-06, 3.635883331298828e-06, 4.451721906661987e-06, 5.2675604820251465e-06, 6.083399057388306e-06, 6.899237632751465e-06, 7.715076208114624e-06, 8.530914783477783e-06, 9.346753358840942e-06, 1.0162591934204102e-05, 1.097843050956726e-05, 1.179426908493042e-05, 1.2610107660293579e-05, 1.3425946235656738e-05, 1.4241784811019897e-05, 1.5057623386383057e-05, 1.5873461961746216e-05, 1.6689300537109375e-05, 1.7505139112472534e-05, 1.8320977687835693e-05, 1.9136816263198853e-05, 1.9952654838562012e-05, 2.076849341392517e-05, 2.158433198928833e-05, 2.240017056465149e-05, 2.321600914001465e-05, 2.4031847715377808e-05, 2.4847686290740967e-05, 2.5663524866104126e-05, 2.6479363441467285e-05, 2.7295202016830444e-05, 2.8111040592193604e-05, 2.8926879167556763e-05, 2.9742717742919922e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 6.0, 16.0, 15.0, 9.0, 28.0, 42.0, 49.0, 69.0, 102.0, 174.0, 244.0, 368.0, 621.0, 935.0, 1592.0, 2658.0, 4724.0, 9444.0, 22645.0, 73713.0, 302116.0, 442906.0, 124475.0, 34270.0, 12918.0, 6156.0, 3245.0, 1832.0, 1072.0, 689.0, 449.0, 282.0, 209.0, 130.0, 93.0, 61.0, 50.0, 28.0, 25.0, 14.0, 15.0, 13.0, 11.0, 6.0, 3.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3310546875, -0.320770263671875, -0.31048583984375, -0.300201416015625, -0.2899169921875, -0.279632568359375, -0.26934814453125, -0.259063720703125, -0.248779296875, -0.238494873046875, -0.22821044921875, -0.217926025390625, -0.2076416015625, -0.197357177734375, -0.18707275390625, -0.176788330078125, -0.16650390625, -0.156219482421875, -0.14593505859375, -0.135650634765625, -0.1253662109375, -0.115081787109375, -0.10479736328125, -0.094512939453125, -0.084228515625, -0.073944091796875, -0.06365966796875, -0.053375244140625, -0.0430908203125, -0.032806396484375, -0.02252197265625, -0.012237548828125, -0.001953125, 0.008331298828125, 0.01861572265625, 0.028900146484375, 0.0391845703125, 0.049468994140625, 0.05975341796875, 0.070037841796875, 0.080322265625, 0.090606689453125, 0.10089111328125, 0.111175537109375, 0.1214599609375, 0.131744384765625, 0.14202880859375, 0.152313232421875, 0.16259765625, 0.172882080078125, 0.18316650390625, 0.193450927734375, 0.2037353515625, 0.214019775390625, 0.22430419921875, 0.234588623046875, 0.244873046875, 0.255157470703125, 0.26544189453125, 0.275726318359375, 0.2860107421875, 0.296295166015625, 0.30657958984375, 0.316864013671875, 0.3271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 8.0, 3.0, 3.0, 10.0, 4.0, 3.0, 7.0, 12.0, 10.0, 13.0, 18.0, 17.0, 21.0, 31.0, 44.0, 54.0, 74.0, 100.0, 93.0, 76.0, 80.0, 62.0, 42.0, 45.0, 26.0, 27.0, 19.0, 18.0, 14.0, 11.0, 7.0, 7.0, 7.0, 9.0, 3.0, 7.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048370361328125, -0.04680013656616211, -0.04522991180419922, -0.04365968704223633, -0.04208946228027344, -0.04051923751831055, -0.038949012756347656, -0.037378787994384766, -0.035808563232421875, -0.034238338470458984, -0.032668113708496094, -0.031097888946533203, -0.029527664184570312, -0.027957439422607422, -0.02638721466064453, -0.02481698989868164, -0.02324676513671875, -0.02167654037475586, -0.02010631561279297, -0.018536090850830078, -0.016965866088867188, -0.015395641326904297, -0.013825416564941406, -0.012255191802978516, -0.010684967041015625, -0.009114742279052734, -0.007544517517089844, -0.005974292755126953, -0.0044040679931640625, -0.002833843231201172, -0.0012636184692382812, 0.0003066062927246094, 0.0018768310546875, 0.0034470558166503906, 0.005017280578613281, 0.006587505340576172, 0.008157730102539062, 0.009727954864501953, 0.011298179626464844, 0.012868404388427734, 0.014438629150390625, 0.016008853912353516, 0.017579078674316406, 0.019149303436279297, 0.020719528198242188, 0.022289752960205078, 0.02385997772216797, 0.02543020248413086, 0.02700042724609375, 0.02857065200805664, 0.03014087677001953, 0.03171110153198242, 0.03328132629394531, 0.0348515510559082, 0.036421775817871094, 0.037992000579833984, 0.039562225341796875, 0.041132450103759766, 0.042702674865722656, 0.04427289962768555, 0.04584312438964844, 0.04741334915161133, 0.04898357391357422, 0.05055379867553711, 0.0521240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 9.0, 13.0, 19.0, 19.0, 17.0, 22.0, 21.0, 40.0, 24.0, 44.0, 43.0, 57.0, 52.0, 66.0, 56.0, 51.0, 45.0, 36.0, 50.0, 37.0, 30.0, 37.0, 36.0, 26.0, 18.0, 17.0, 13.0, 15.0, 14.0, 16.0, 6.0, 11.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0], "bins": [-1.584175705909729, -1.5413509607315063, -1.4985262155532837, -1.455701470375061, -1.412876844406128, -1.3700520992279053, -1.3272273540496826, -1.28440260887146, -1.2415778636932373, -1.1987531185150146, -1.155928373336792, -1.1131036281585693, -1.0702788829803467, -1.0274542570114136, -0.9846295118331909, -0.9418047666549683, -0.8989800214767456, -0.856155276298523, -0.8133305311203003, -0.7705058455467224, -0.7276811003684998, -0.6848563551902771, -0.6420316696166992, -0.5992069244384766, -0.5563821792602539, -0.5135574340820312, -0.470732718706131, -0.4279080033302307, -0.38508325815200806, -0.3422585129737854, -0.29943379759788513, -0.25660908222198486, -0.21378445625305176, -0.1709597259759903, -0.12813499569892883, -0.08531026542186737, -0.04248553514480591, 0.0003391951322555542, 0.04316392540931702, 0.08598864078521729, 0.12881338596343994, 0.1716381162405014, 0.21446284651756287, 0.25728756189346313, 0.3001123070716858, 0.34293705224990845, 0.3857617676258087, 0.428586483001709, 0.47141122817993164, 0.5142359733581543, 0.557060718536377, 0.5998854041099548, 0.6427101492881775, 0.6855348944664001, 0.728359580039978, 0.7711843252182007, 0.8140090703964233, 0.856833815574646, 0.8996585607528687, 0.9424832463264465, 0.9853079915046692, 1.028132677078247, 1.0709574222564697, 1.1137821674346924, 1.156606912612915]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 18.0, 15.0, 15.0, 19.0, 20.0, 16.0, 30.0, 32.0, 25.0, 26.0, 39.0, 32.0, 42.0, 36.0, 43.0, 35.0, 38.0, 31.0, 44.0, 46.0, 34.0, 38.0, 38.0, 29.0, 32.0, 35.0, 30.0, 25.0, 16.0, 14.0, 14.0, 11.0, 18.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8862427473068237, -0.8564247488975525, -0.8266066908836365, -0.7967886924743652, -0.766970694065094, -0.7371526956558228, -0.7073346376419067, -0.6775166392326355, -0.6476986408233643, -0.617880642414093, -0.588062584400177, -0.5582445859909058, -0.5284265875816345, -0.4986085593700409, -0.46879053115844727, -0.438972532749176, -0.40915447473526, -0.3793364465236664, -0.34951844811439514, -0.3197004199028015, -0.2898824214935303, -0.26006439328193665, -0.23024636507034302, -0.20042835175991058, -0.17061033844947815, -0.14079232513904572, -0.11097430437803268, -0.08115628361701965, -0.05133827030658722, -0.021520256996154785, 0.008297771215438843, 0.03811578452587128, 0.06793379783630371, 0.09775181114673615, 0.12756982445716858, 0.1573878526687622, 0.18720586597919464, 0.21702387928962708, 0.2468419075012207, 0.27665990591049194, 0.30647793412208557, 0.3362959623336792, 0.36611396074295044, 0.39593198895454407, 0.4257500171661377, 0.45556801557540894, 0.48538604378700256, 0.5152040719985962, 0.5450220704078674, 0.5748400688171387, 0.6046581268310547, 0.6344761252403259, 0.6642941236495972, 0.6941121816635132, 0.7239301800727844, 0.7537481784820557, 0.7835662364959717, 0.8133842349052429, 0.8432022929191589, 0.8730202913284302, 0.9028382897377014, 0.9326562881469727, 0.9624743461608887, 0.9922923445701599, 1.0221103429794312]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 13.0, 18.0, 34.0, 43.0, 58.0, 99.0, 186.0, 260.0, 451.0, 641.0, 1063.0, 1744.0, 2757.0, 4522.0, 7418.0, 11858.0, 18801.0, 29105.0, 43605.0, 62628.0, 84486.0, 104622.0, 119193.0, 122436.0, 113746.0, 95058.0, 73044.0, 52177.0, 35877.0, 23411.0, 14931.0, 9292.0, 5736.0, 3542.0, 2141.0, 1317.0, 812.0, 582.0, 305.0, 192.0, 133.0, 86.0, 49.0, 22.0, 24.0, 21.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.984375, -0.9538497924804688, -0.9233245849609375, -0.8927993774414062, -0.862274169921875, -0.8317489624023438, -0.8012237548828125, -0.7706985473632812, -0.74017333984375, -0.7096481323242188, -0.6791229248046875, -0.6485977172851562, -0.618072509765625, -0.5875473022460938, -0.5570220947265625, -0.5264968872070312, -0.4959716796875, -0.46544647216796875, -0.4349212646484375, -0.40439605712890625, -0.373870849609375, -0.34334564208984375, -0.3128204345703125, -0.28229522705078125, -0.25177001953125, -0.22124481201171875, -0.1907196044921875, -0.16019439697265625, -0.129669189453125, -0.09914398193359375, -0.0686187744140625, -0.03809356689453125, -0.007568359375, 0.02295684814453125, 0.0534820556640625, 0.08400726318359375, 0.114532470703125, 0.14505767822265625, 0.1755828857421875, 0.20610809326171875, 0.23663330078125, 0.26715850830078125, 0.2976837158203125, 0.32820892333984375, 0.358734130859375, 0.38925933837890625, 0.4197845458984375, 0.45030975341796875, 0.4808349609375, 0.5113601684570312, 0.5418853759765625, 0.5724105834960938, 0.602935791015625, 0.6334609985351562, 0.6639862060546875, 0.6945114135742188, 0.72503662109375, 0.7555618286132812, 0.7860870361328125, 0.8166122436523438, 0.847137451171875, 0.8776626586914062, 0.9081878662109375, 0.9387130737304688, 0.96923828125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 11.0, 10.0, 16.0, 15.0, 24.0, 25.0, 24.0, 18.0, 29.0, 29.0, 33.0, 36.0, 35.0, 46.0, 43.0, 40.0, 48.0, 40.0, 42.0, 32.0, 59.0, 37.0, 30.0, 39.0, 28.0, 30.0, 31.0, 22.0, 22.0, 20.0, 8.0, 21.0, 12.0, 7.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0275115966796875, -0.993499755859375, -0.9594879150390625, -0.92547607421875, -0.8914642333984375, -0.857452392578125, -0.8234405517578125, -0.7894287109375, -0.7554168701171875, -0.721405029296875, -0.6873931884765625, -0.65338134765625, -0.6193695068359375, -0.585357666015625, -0.5513458251953125, -0.517333984375, -0.4833221435546875, -0.449310302734375, -0.4152984619140625, -0.38128662109375, -0.3472747802734375, -0.313262939453125, -0.2792510986328125, -0.2452392578125, -0.2112274169921875, -0.177215576171875, -0.1432037353515625, -0.10919189453125, -0.0751800537109375, -0.041168212890625, -0.0071563720703125, 0.02685546875, 0.0608673095703125, 0.094879150390625, 0.1288909912109375, 0.16290283203125, 0.1969146728515625, 0.230926513671875, 0.2649383544921875, 0.2989501953125, 0.3329620361328125, 0.366973876953125, 0.4009857177734375, 0.43499755859375, 0.4690093994140625, 0.503021240234375, 0.5370330810546875, 0.571044921875, 0.6050567626953125, 0.639068603515625, 0.6730804443359375, 0.70709228515625, 0.7411041259765625, 0.775115966796875, 0.8091278076171875, 0.8431396484375, 0.8771514892578125, 0.911163330078125, 0.9451751708984375, 0.97918701171875, 1.0131988525390625, 1.047210693359375, 1.0812225341796875, 1.115234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 25.0, 32.0, 48.0, 76.0, 93.0, 169.0, 258.0, 371.0, 583.0, 909.0, 1389.0, 2217.0, 3487.0, 5229.0, 7921.0, 11858.0, 17735.0, 25076.0, 35306.0, 48511.0, 62575.0, 77501.0, 91774.0, 99311.0, 101884.0, 97625.0, 86166.0, 72361.0, 57289.0, 42784.0, 31079.0, 22028.0, 15110.0, 10146.0, 6871.0, 4430.0, 2935.0, 1878.0, 1200.0, 805.0, 515.0, 330.0, 209.0, 163.0, 97.0, 74.0, 39.0, 26.0, 16.0, 4.0, 7.0, 9.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.83984375, -0.8138504028320312, -0.7878570556640625, -0.7618637084960938, -0.735870361328125, -0.7098770141601562, -0.6838836669921875, -0.6578903198242188, -0.63189697265625, -0.6059036254882812, -0.5799102783203125, -0.5539169311523438, -0.527923583984375, -0.5019302368164062, -0.4759368896484375, -0.44994354248046875, -0.4239501953125, -0.39795684814453125, -0.3719635009765625, -0.34597015380859375, -0.319976806640625, -0.29398345947265625, -0.2679901123046875, -0.24199676513671875, -0.21600341796875, -0.19001007080078125, -0.1640167236328125, -0.13802337646484375, -0.112030029296875, -0.08603668212890625, -0.0600433349609375, -0.03404998779296875, -0.008056640625, 0.01793670654296875, 0.0439300537109375, 0.06992340087890625, 0.095916748046875, 0.12191009521484375, 0.1479034423828125, 0.17389678955078125, 0.19989013671875, 0.22588348388671875, 0.2518768310546875, 0.27787017822265625, 0.303863525390625, 0.32985687255859375, 0.3558502197265625, 0.38184356689453125, 0.4078369140625, 0.43383026123046875, 0.4598236083984375, 0.48581695556640625, 0.511810302734375, 0.5378036499023438, 0.5637969970703125, 0.5897903442382812, 0.61578369140625, 0.6417770385742188, 0.6677703857421875, 0.6937637329101562, 0.719757080078125, 0.7457504272460938, 0.7717437744140625, 0.7977371215820312, 0.82373046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 8.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 17.0, 8.0, 18.0, 20.0, 24.0, 21.0, 18.0, 28.0, 24.0, 37.0, 41.0, 42.0, 35.0, 34.0, 35.0, 39.0, 45.0, 25.0, 37.0, 31.0, 17.0, 29.0, 31.0, 35.0, 16.0, 30.0, 22.0, 25.0, 18.0, 18.0, 11.0, 8.0, 11.0, 13.0, 5.0, 10.0, 12.0, 9.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.50830078125, -0.49228668212890625, -0.4762725830078125, -0.46025848388671875, -0.444244384765625, -0.42823028564453125, -0.4122161865234375, -0.39620208740234375, -0.38018798828125, -0.36417388916015625, -0.3481597900390625, -0.33214569091796875, -0.316131591796875, -0.30011749267578125, -0.2841033935546875, -0.26808929443359375, -0.2520751953125, -0.23606109619140625, -0.2200469970703125, -0.20403289794921875, -0.188018798828125, -0.17200469970703125, -0.1559906005859375, -0.13997650146484375, -0.12396240234375, -0.10794830322265625, -0.0919342041015625, -0.07592010498046875, -0.059906005859375, -0.04389190673828125, -0.0278778076171875, -0.01186370849609375, 0.004150390625, 0.02016448974609375, 0.0361785888671875, 0.05219268798828125, 0.068206787109375, 0.08422088623046875, 0.1002349853515625, 0.11624908447265625, 0.13226318359375, 0.14827728271484375, 0.1642913818359375, 0.18030548095703125, 0.196319580078125, 0.21233367919921875, 0.2283477783203125, 0.24436187744140625, 0.2603759765625, 0.27639007568359375, 0.2924041748046875, 0.30841827392578125, 0.324432373046875, 0.34044647216796875, 0.3564605712890625, 0.37247467041015625, 0.38848876953125, 0.40450286865234375, 0.4205169677734375, 0.43653106689453125, 0.452545166015625, 0.46855926513671875, 0.4845733642578125, 0.5005874633789062, 0.5166015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 17.0, 7.0, 26.0, 25.0, 39.0, 47.0, 53.0, 87.0, 127.0, 155.0, 224.0, 259.0, 396.0, 487.0, 733.0, 993.0, 1545.0, 2065.0, 3362.0, 5792.0, 14319.0, 62424.0, 326381.0, 465670.0, 120042.0, 23139.0, 7778.0, 3985.0, 2439.0, 1718.0, 1154.0, 826.0, 591.0, 425.0, 306.0, 235.0, 167.0, 123.0, 91.0, 74.0, 55.0, 41.0, 30.0, 23.0, 21.0, 16.0, 14.0, 7.0, 3.0, 5.0, 3.0], "bins": [-2.533203125, -2.46319580078125, -2.3931884765625, -2.32318115234375, -2.253173828125, -2.18316650390625, -2.1131591796875, -2.04315185546875, -1.97314453125, -1.90313720703125, -1.8331298828125, -1.76312255859375, -1.693115234375, -1.62310791015625, -1.5531005859375, -1.48309326171875, -1.4130859375, -1.34307861328125, -1.2730712890625, -1.20306396484375, -1.133056640625, -1.06304931640625, -0.9930419921875, -0.92303466796875, -0.85302734375, -0.78302001953125, -0.7130126953125, -0.64300537109375, -0.572998046875, -0.50299072265625, -0.4329833984375, -0.36297607421875, -0.29296875, -0.22296142578125, -0.1529541015625, -0.08294677734375, -0.012939453125, 0.05706787109375, 0.1270751953125, 0.19708251953125, 0.26708984375, 0.33709716796875, 0.4071044921875, 0.47711181640625, 0.547119140625, 0.61712646484375, 0.6871337890625, 0.75714111328125, 0.8271484375, 0.89715576171875, 0.9671630859375, 1.03717041015625, 1.107177734375, 1.17718505859375, 1.2471923828125, 1.31719970703125, 1.38720703125, 1.45721435546875, 1.5272216796875, 1.59722900390625, 1.667236328125, 1.73724365234375, 1.8072509765625, 1.87725830078125, 1.947265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 15.0, 28.0, 52.0, 81.0, 166.0, 194.0, 164.0, 116.0, 82.0, 34.0, 20.0, 11.0, 7.0, 6.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021147727966308594, -0.0002046283334493637, -0.00019777938723564148, -0.00019093044102191925, -0.00018408149480819702, -0.0001772325485944748, -0.00017038360238075256, -0.00016353465616703033, -0.0001566857099533081, -0.00014983676373958588, -0.00014298781752586365, -0.00013613887131214142, -0.0001292899250984192, -0.00012244097888469696, -0.00011559203267097473, -0.0001087430864572525, -0.00010189414024353027, -9.504519402980804e-05, -8.819624781608582e-05, -8.134730160236359e-05, -7.449835538864136e-05, -6.764940917491913e-05, -6.08004629611969e-05, -5.395151674747467e-05, -4.710257053375244e-05, -4.025362432003021e-05, -3.3404678106307983e-05, -2.6555731892585754e-05, -1.9706785678863525e-05, -1.2857839465141296e-05, -6.008893251419067e-06, 8.400529623031616e-07, 7.68899917602539e-06, 1.453794538974762e-05, 2.138689160346985e-05, 2.8235837817192078e-05, 3.508478403091431e-05, 4.1933730244636536e-05, 4.8782676458358765e-05, 5.5631622672080994e-05, 6.248056888580322e-05, 6.932951509952545e-05, 7.617846131324768e-05, 8.302740752696991e-05, 8.987635374069214e-05, 9.672529995441437e-05, 0.0001035742461681366, 0.00011042319238185883, 0.00011727213859558105, 0.00012412108480930328, 0.0001309700310230255, 0.00013781897723674774, 0.00014466792345046997, 0.0001515168696641922, 0.00015836581587791443, 0.00016521476209163666, 0.0001720637083053589, 0.00017891265451908112, 0.00018576160073280334, 0.00019261054694652557, 0.0001994594931602478, 0.00020630843937397003, 0.00021315738558769226, 0.0002200063318014145, 0.00022685527801513672]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 9.0, 8.0, 8.0, 20.0, 22.0, 34.0, 45.0, 82.0, 109.0, 167.0, 227.0, 401.0, 532.0, 804.0, 1270.0, 2045.0, 3555.0, 8269.0, 31062.0, 166683.0, 480473.0, 274360.0, 54881.0, 12088.0, 4607.0, 2537.0, 1476.0, 958.0, 593.0, 424.0, 236.0, 181.0, 107.0, 79.0, 47.0, 43.0, 32.0, 26.0, 19.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.306640625, -2.241973876953125, -2.17730712890625, -2.112640380859375, -2.0479736328125, -1.983306884765625, -1.91864013671875, -1.853973388671875, -1.789306640625, -1.724639892578125, -1.65997314453125, -1.595306396484375, -1.5306396484375, -1.465972900390625, -1.40130615234375, -1.336639404296875, -1.27197265625, -1.207305908203125, -1.14263916015625, -1.077972412109375, -1.0133056640625, -0.948638916015625, -0.88397216796875, -0.819305419921875, -0.754638671875, -0.689971923828125, -0.62530517578125, -0.560638427734375, -0.4959716796875, -0.431304931640625, -0.36663818359375, -0.301971435546875, -0.2373046875, -0.172637939453125, -0.10797119140625, -0.043304443359375, 0.0213623046875, 0.086029052734375, 0.15069580078125, 0.215362548828125, 0.280029296875, 0.344696044921875, 0.40936279296875, 0.474029541015625, 0.5386962890625, 0.603363037109375, 0.66802978515625, 0.732696533203125, 0.79736328125, 0.862030029296875, 0.92669677734375, 0.991363525390625, 1.0560302734375, 1.120697021484375, 1.18536376953125, 1.250030517578125, 1.314697265625, 1.379364013671875, 1.44403076171875, 1.508697509765625, 1.5733642578125, 1.638031005859375, 1.70269775390625, 1.767364501953125, 1.83203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 10.0, 7.0, 12.0, 16.0, 17.0, 26.0, 34.0, 42.0, 59.0, 56.0, 73.0, 74.0, 65.0, 84.0, 84.0, 82.0, 69.0, 46.0, 39.0, 21.0, 25.0, 14.0, 11.0, 9.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212646484375, -0.20475387573242188, -0.19686126708984375, -0.18896865844726562, -0.1810760498046875, -0.17318344116210938, -0.16529083251953125, -0.15739822387695312, -0.149505615234375, -0.14161300659179688, -0.13372039794921875, -0.12582778930664062, -0.1179351806640625, -0.11004257202148438, -0.10214996337890625, -0.09425735473632812, -0.08636474609375, -0.07847213745117188, -0.07057952880859375, -0.06268692016601562, -0.0547943115234375, -0.046901702880859375, -0.03900909423828125, -0.031116485595703125, -0.023223876953125, -0.015331268310546875, -0.00743865966796875, 0.000453948974609375, 0.0083465576171875, 0.016239166259765625, 0.02413177490234375, 0.032024383544921875, 0.0399169921875, 0.047809600830078125, 0.05570220947265625, 0.06359481811523438, 0.0714874267578125, 0.07938003540039062, 0.08727264404296875, 0.09516525268554688, 0.103057861328125, 0.11095046997070312, 0.11884307861328125, 0.12673568725585938, 0.1346282958984375, 0.14252090454101562, 0.15041351318359375, 0.15830612182617188, 0.16619873046875, 0.17409133911132812, 0.18198394775390625, 0.18987655639648438, 0.1977691650390625, 0.20566177368164062, 0.21355438232421875, 0.22144699096679688, 0.229339599609375, 0.23723220825195312, 0.24512481689453125, 0.2530174255371094, 0.2609100341796875, 0.2688026428222656, 0.27669525146484375, 0.2845878601074219, 0.29248046875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 8.0, 10.0, 12.0, 13.0, 14.0, 29.0, 28.0, 28.0, 33.0, 39.0, 41.0, 51.0, 48.0, 54.0, 55.0, 65.0, 56.0, 51.0, 36.0, 51.0, 37.0, 39.0, 32.0, 22.0, 26.0, 21.0, 23.0, 17.0, 10.0, 8.0, 3.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.5890384912490845, -1.5426957607269287, -1.496353030204773, -1.4500102996826172, -1.4036675691604614, -1.3573248386383057, -1.3109819889068604, -1.2646393775939941, -1.2182965278625488, -1.171953797340393, -1.1256110668182373, -1.0792683362960815, -1.0329256057739258, -0.98658287525177, -0.9402400851249695, -0.8938973546028137, -0.8475546836853027, -0.801211953163147, -0.7548692226409912, -0.7085264921188354, -0.6621837615966797, -0.6158410310745239, -0.5694982409477234, -0.5231555104255676, -0.47681277990341187, -0.4304700493812561, -0.38412731885910034, -0.3377845585346222, -0.29144182801246643, -0.24509909749031067, -0.19875633716583252, -0.15241360664367676, -0.10607099533081055, -0.05972825735807419, -0.01338551938533783, 0.032957226037979126, 0.07929995656013489, 0.12564268708229065, 0.1719854474067688, 0.21832817792892456, 0.2646709084510803, 0.3110136389732361, 0.35735636949539185, 0.40369912981987, 0.45004186034202576, 0.4963845908641815, 0.5427273511886597, 0.5890700817108154, 0.6354128122329712, 0.681755542755127, 0.7280982732772827, 0.7744410037994385, 0.8207837343215942, 0.86712646484375, 0.9134692549705505, 0.9598119854927063, 1.0061547756195068, 1.0524975061416626, 1.0988402366638184, 1.1451829671859741, 1.1915256977081299, 1.2378684282302856, 1.2842111587524414, 1.3305540084838867, 1.376896619796753]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 7.0, 10.0, 8.0, 18.0, 8.0, 20.0, 21.0, 15.0, 34.0, 37.0, 23.0, 34.0, 48.0, 26.0, 46.0, 38.0, 27.0, 58.0, 38.0, 42.0, 47.0, 46.0, 47.0, 28.0, 34.0, 40.0, 38.0, 18.0, 27.0, 20.0, 19.0, 15.0, 14.0, 10.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.153900146484375, -1.1200770139694214, -1.0862538814544678, -1.0524308681488037, -1.01860773563385, -0.9847846031188965, -0.9509614706039429, -0.9171383380889893, -0.8833152651786804, -0.8494921326637268, -0.815669059753418, -0.7818459272384644, -0.7480227947235107, -0.7141997218132019, -0.6803765892982483, -0.6465535163879395, -0.6127303838729858, -0.5789072513580322, -0.5450841784477234, -0.5112610459327698, -0.47743794322013855, -0.4436148405075073, -0.4097917079925537, -0.3759686052799225, -0.34214550256729126, -0.30832239985466003, -0.2744992971420288, -0.2406761646270752, -0.20685306191444397, -0.17302995920181274, -0.13920684158802032, -0.1053837239742279, -0.07156062126159668, -0.03773751109838486, -0.003914400935173035, 0.029908709228038788, 0.06373181939125061, 0.09755492210388184, 0.13137803971767426, 0.16520115733146667, 0.1990242600440979, 0.23284736275672913, 0.26667046546936035, 0.30049359798431396, 0.3343167006969452, 0.3681398034095764, 0.40196293592453003, 0.43578603863716125, 0.4696091413497925, 0.5034322738647461, 0.5372553467750549, 0.5710784792900085, 0.6049015522003174, 0.638724684715271, 0.6725478172302246, 0.7063709497451782, 0.7401940226554871, 0.7740171551704407, 0.8078402280807495, 0.8416633605957031, 0.8754864931106567, 0.9093095660209656, 0.9431326985359192, 0.976955771446228, 1.0107789039611816]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 6.0, 12.0, 18.0, 34.0, 53.0, 88.0, 133.0, 229.0, 338.0, 530.0, 858.0, 1469.0, 2435.0, 4044.0, 6904.0, 11900.0, 20216.0, 35296.0, 61153.0, 104817.0, 176564.0, 285254.0, 423747.0, 563860.0, 633579.0, 591438.0, 462193.0, 318973.0, 200328.0, 120198.0, 69911.0, 40563.0, 23435.0, 13945.0, 7871.0, 4776.0, 2818.0, 1682.0, 1052.0, 608.0, 375.0, 231.0, 136.0, 88.0, 45.0, 27.0, 16.0, 14.0, 10.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.265625, -1.2279815673828125, -1.190338134765625, -1.1526947021484375, -1.11505126953125, -1.0774078369140625, -1.039764404296875, -1.0021209716796875, -0.9644775390625, -0.9268341064453125, -0.889190673828125, -0.8515472412109375, -0.81390380859375, -0.7762603759765625, -0.738616943359375, -0.7009735107421875, -0.663330078125, -0.6256866455078125, -0.588043212890625, -0.5503997802734375, -0.51275634765625, -0.4751129150390625, -0.437469482421875, -0.3998260498046875, -0.3621826171875, -0.3245391845703125, -0.286895751953125, -0.2492523193359375, -0.21160888671875, -0.1739654541015625, -0.136322021484375, -0.0986785888671875, -0.06103515625, -0.0233917236328125, 0.014251708984375, 0.0518951416015625, 0.08953857421875, 0.1271820068359375, 0.164825439453125, 0.2024688720703125, 0.2401123046875, 0.2777557373046875, 0.315399169921875, 0.3530426025390625, 0.39068603515625, 0.4283294677734375, 0.465972900390625, 0.5036163330078125, 0.541259765625, 0.5789031982421875, 0.616546630859375, 0.6541900634765625, 0.69183349609375, 0.7294769287109375, 0.767120361328125, 0.8047637939453125, 0.8424072265625, 0.8800506591796875, 0.917694091796875, 0.9553375244140625, 0.99298095703125, 1.0306243896484375, 1.068267822265625, 1.1059112548828125, 1.1435546875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 10.0, 15.0, 21.0, 19.0, 30.0, 28.0, 25.0, 26.0, 30.0, 28.0, 37.0, 45.0, 45.0, 44.0, 43.0, 47.0, 57.0, 51.0, 58.0, 36.0, 33.0, 30.0, 30.0, 23.0, 32.0, 25.0, 26.0, 13.0, 6.0, 17.0, 14.0, 8.0, 10.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9123153686523438, -0.8842010498046875, -0.8560867309570312, -0.827972412109375, -0.7998580932617188, -0.7717437744140625, -0.7436294555664062, -0.71551513671875, -0.6874008178710938, -0.6592864990234375, -0.6311721801757812, -0.603057861328125, -0.5749435424804688, -0.5468292236328125, -0.5187149047851562, -0.4906005859375, -0.46248626708984375, -0.4343719482421875, -0.40625762939453125, -0.378143310546875, -0.35002899169921875, -0.3219146728515625, -0.29380035400390625, -0.26568603515625, -0.23757171630859375, -0.2094573974609375, -0.18134307861328125, -0.153228759765625, -0.12511444091796875, -0.0970001220703125, -0.06888580322265625, -0.040771484375, -0.01265716552734375, 0.0154571533203125, 0.04357147216796875, 0.071685791015625, 0.09980010986328125, 0.1279144287109375, 0.15602874755859375, 0.18414306640625, 0.21225738525390625, 0.2403717041015625, 0.26848602294921875, 0.296600341796875, 0.32471466064453125, 0.3528289794921875, 0.38094329833984375, 0.4090576171875, 0.43717193603515625, 0.4652862548828125, 0.49340057373046875, 0.521514892578125, 0.5496292114257812, 0.5777435302734375, 0.6058578491210938, 0.63397216796875, 0.6620864868164062, 0.6902008056640625, 0.7183151245117188, 0.746429443359375, 0.7745437622070312, 0.8026580810546875, 0.8307723999023438, 0.85888671875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 21.0, 27.0, 57.0, 73.0, 166.0, 238.0, 393.0, 785.0, 1107.0, 2026.0, 3309.0, 5889.0, 10196.0, 17635.0, 30827.0, 53391.0, 91300.0, 149651.0, 236105.0, 349679.0, 470769.0, 561428.0, 579443.0, 510425.0, 397337.0, 277121.0, 179294.0, 110597.0, 64992.0, 38232.0, 22053.0, 12648.0, 7146.0, 4113.0, 2403.0, 1389.0, 786.0, 492.0, 306.0, 164.0, 119.0, 69.0, 31.0, 21.0, 10.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1825103759765625, -1.143341064453125, -1.1041717529296875, -1.06500244140625, -1.0258331298828125, -0.986663818359375, -0.9474945068359375, -0.9083251953125, -0.8691558837890625, -0.829986572265625, -0.7908172607421875, -0.75164794921875, -0.7124786376953125, -0.673309326171875, -0.6341400146484375, -0.594970703125, -0.5558013916015625, -0.516632080078125, -0.4774627685546875, -0.43829345703125, -0.3991241455078125, -0.359954833984375, -0.3207855224609375, -0.2816162109375, -0.2424468994140625, -0.203277587890625, -0.1641082763671875, -0.12493896484375, -0.0857696533203125, -0.046600341796875, -0.0074310302734375, 0.03173828125, 0.0709075927734375, 0.110076904296875, 0.1492462158203125, 0.18841552734375, 0.2275848388671875, 0.266754150390625, 0.3059234619140625, 0.3450927734375, 0.3842620849609375, 0.423431396484375, 0.4626007080078125, 0.50177001953125, 0.5409393310546875, 0.580108642578125, 0.6192779541015625, 0.658447265625, 0.6976165771484375, 0.736785888671875, 0.7759552001953125, 0.81512451171875, 0.8542938232421875, 0.893463134765625, 0.9326324462890625, 0.9718017578125, 1.0109710693359375, 1.050140380859375, 1.0893096923828125, 1.12847900390625, 1.1676483154296875, 1.206817626953125, 1.2459869384765625, 1.28515625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 9.0, 17.0, 16.0, 21.0, 36.0, 44.0, 40.0, 53.0, 71.0, 92.0, 107.0, 91.0, 145.0, 128.0, 168.0, 178.0, 196.0, 188.0, 209.0, 218.0, 199.0, 219.0, 220.0, 196.0, 173.0, 160.0, 141.0, 143.0, 105.0, 82.0, 75.0, 77.0, 69.0, 31.0, 26.0, 20.0, 26.0, 17.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.400146484375, -0.3865547180175781, -0.37296295166015625, -0.3593711853027344, -0.3457794189453125, -0.3321876525878906, -0.31859588623046875, -0.3050041198730469, -0.291412353515625, -0.2778205871582031, -0.26422882080078125, -0.2506370544433594, -0.2370452880859375, -0.22345352172851562, -0.20986175537109375, -0.19626998901367188, -0.18267822265625, -0.16908645629882812, -0.15549468994140625, -0.14190292358398438, -0.1283111572265625, -0.11471939086914062, -0.10112762451171875, -0.08753585815429688, -0.073944091796875, -0.060352325439453125, -0.04676055908203125, -0.033168792724609375, -0.0195770263671875, -0.005985260009765625, 0.00760650634765625, 0.021198272705078125, 0.0347900390625, 0.048381805419921875, 0.06197357177734375, 0.07556533813476562, 0.0891571044921875, 0.10274887084960938, 0.11634063720703125, 0.12993240356445312, 0.143524169921875, 0.15711593627929688, 0.17070770263671875, 0.18429946899414062, 0.1978912353515625, 0.21148300170898438, 0.22507476806640625, 0.23866653442382812, 0.25225830078125, 0.2658500671386719, 0.27944183349609375, 0.2930335998535156, 0.3066253662109375, 0.3202171325683594, 0.33380889892578125, 0.3474006652832031, 0.360992431640625, 0.3745841979980469, 0.38817596435546875, 0.4017677307128906, 0.4153594970703125, 0.4289512634277344, 0.44254302978515625, 0.4561347961425781, 0.4697265625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 3.0, 1.0, 8.0, 13.0, 13.0, 14.0, 21.0, 20.0, 29.0, 31.0, 34.0, 49.0, 51.0, 42.0, 44.0, 43.0, 55.0, 61.0, 64.0, 59.0, 60.0, 48.0, 42.0, 34.0, 24.0, 24.0, 23.0, 15.0, 12.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5419496297836304, -1.49064040184021, -1.4393311738967896, -1.3880219459533691, -1.3367127180099487, -1.2854034900665283, -1.234094262123108, -1.1827850341796875, -1.131475806236267, -1.0801665782928467, -1.0288573503494263, -0.9775481224060059, -0.9262388944625854, -0.874929666519165, -0.8236204385757446, -0.7723112106323242, -0.721001923084259, -0.6696926951408386, -0.6183834671974182, -0.5670742392539978, -0.5157650113105774, -0.4644557535648346, -0.4131465256214142, -0.3618372976779938, -0.31052806973457336, -0.25921884179115295, -0.20790961384773254, -0.15660037100315094, -0.10529114305973053, -0.053981900215148926, -0.0026726722717285156, 0.048636555671691895, 0.0999457836151123, 0.15125501155853271, 0.20256423950195312, 0.25387346744537354, 0.30518269538879395, 0.35649195313453674, 0.40780118107795715, 0.45911040902137756, 0.5104196071624756, 0.561728835105896, 0.6130380630493164, 0.6643472909927368, 0.7156565189361572, 0.7669657468795776, 0.818274974822998, 0.8695842027664185, 0.9208934903144836, 0.972202718257904, 1.0235120058059692, 1.0748212337493896, 1.12613046169281, 1.1774396896362305, 1.2287489175796509, 1.2800581455230713, 1.3313673734664917, 1.382676601409912, 1.4339858293533325, 1.485295057296753, 1.5366042852401733, 1.5879135131835938, 1.6392227411270142, 1.6905319690704346, 1.741841197013855]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 0.0, 10.0, 7.0, 9.0, 7.0, 13.0, 8.0, 16.0, 18.0, 18.0, 23.0, 32.0, 38.0, 37.0, 31.0, 34.0, 29.0, 39.0, 33.0, 41.0, 39.0, 38.0, 24.0, 37.0, 25.0, 48.0, 47.0, 40.0, 33.0, 36.0, 22.0, 22.0, 16.0, 19.0, 16.0, 22.0, 15.0, 12.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.0659161806106567, -1.0348045825958252, -1.0036929845809937, -0.9725813865661621, -0.9414697885513306, -0.910358190536499, -0.8792465329170227, -0.8481349349021912, -0.8170233368873596, -0.7859117388725281, -0.7548001408576965, -0.723688542842865, -0.6925768852233887, -0.6614652872085571, -0.6303536891937256, -0.599242091178894, -0.5681304931640625, -0.537018895149231, -0.5059072971343994, -0.4747956693172455, -0.44368407130241394, -0.4125724732875824, -0.38146084547042847, -0.3503492474555969, -0.3192376494407654, -0.28812605142593384, -0.2570144534111023, -0.22590282559394836, -0.19479122757911682, -0.16367962956428528, -0.13256801664829254, -0.1014564037322998, -0.07034474611282349, -0.039233140647411346, -0.008121535181999207, 0.022990070283412933, 0.05410167574882507, 0.08521327376365662, 0.11632488667964935, 0.1474364995956421, 0.17854809761047363, 0.20965969562530518, 0.2407713085412979, 0.27188292145729065, 0.3029945194721222, 0.33410611748695374, 0.36521774530410767, 0.3963293433189392, 0.42744094133377075, 0.4585525393486023, 0.48966413736343384, 0.5207757353782654, 0.5518873929977417, 0.5829989910125732, 0.6141105890274048, 0.6452221870422363, 0.6763337850570679, 0.7074453830718994, 0.738556981086731, 0.7696685791015625, 0.800780177116394, 0.8318917751312256, 0.8630034327507019, 0.8941150307655334, 0.925226628780365]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 5.0, 10.0, 21.0, 20.0, 36.0, 48.0, 81.0, 101.0, 197.0, 289.0, 464.0, 776.0, 1383.0, 2312.0, 4198.0, 7676.0, 14496.0, 28443.0, 54446.0, 105623.0, 185868.0, 241308.0, 183822.0, 104303.0, 53288.0, 27486.0, 14362.0, 7641.0, 4094.0, 2366.0, 1313.0, 816.0, 455.0, 271.0, 176.0, 127.0, 64.0, 51.0, 27.0, 23.0, 19.0, 13.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.404052734375, -0.3912200927734375, -0.378387451171875, -0.3655548095703125, -0.35272216796875, -0.3398895263671875, -0.327056884765625, -0.3142242431640625, -0.3013916015625, -0.2885589599609375, -0.275726318359375, -0.2628936767578125, -0.25006103515625, -0.2372283935546875, -0.224395751953125, -0.2115631103515625, -0.19873046875, -0.1858978271484375, -0.173065185546875, -0.1602325439453125, -0.14739990234375, -0.1345672607421875, -0.121734619140625, -0.1089019775390625, -0.0960693359375, -0.0832366943359375, -0.070404052734375, -0.0575714111328125, -0.04473876953125, -0.0319061279296875, -0.019073486328125, -0.0062408447265625, 0.006591796875, 0.0194244384765625, 0.032257080078125, 0.0450897216796875, 0.05792236328125, 0.0707550048828125, 0.083587646484375, 0.0964202880859375, 0.1092529296875, 0.1220855712890625, 0.134918212890625, 0.1477508544921875, 0.16058349609375, 0.1734161376953125, 0.186248779296875, 0.1990814208984375, 0.2119140625, 0.2247467041015625, 0.237579345703125, 0.2504119873046875, 0.26324462890625, 0.2760772705078125, 0.288909912109375, 0.3017425537109375, 0.3145751953125, 0.3274078369140625, 0.340240478515625, 0.3530731201171875, 0.36590576171875, 0.3787384033203125, 0.391571044921875, 0.4044036865234375, 0.417236328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 10.0, 8.0, 24.0, 25.0, 19.0, 31.0, 25.0, 32.0, 52.0, 36.0, 36.0, 43.0, 41.0, 42.0, 46.0, 41.0, 43.0, 44.0, 43.0, 44.0, 42.0, 41.0, 36.0, 38.0, 21.0, 19.0, 18.0, 19.0, 25.0, 8.0, 9.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.277587890625, -1.23681640625, -1.196044921875, -1.1552734375, -1.114501953125, -1.07373046875, -1.032958984375, -0.9921875, -0.951416015625, -0.91064453125, -0.869873046875, -0.8291015625, -0.788330078125, -0.74755859375, -0.706787109375, -0.666015625, -0.625244140625, -0.58447265625, -0.543701171875, -0.5029296875, -0.462158203125, -0.42138671875, -0.380615234375, -0.33984375, -0.299072265625, -0.25830078125, -0.217529296875, -0.1767578125, -0.135986328125, -0.09521484375, -0.054443359375, -0.013671875, 0.027099609375, 0.06787109375, 0.108642578125, 0.1494140625, 0.190185546875, 0.23095703125, 0.271728515625, 0.3125, 0.353271484375, 0.39404296875, 0.434814453125, 0.4755859375, 0.516357421875, 0.55712890625, 0.597900390625, 0.638671875, 0.679443359375, 0.72021484375, 0.760986328125, 0.8017578125, 0.842529296875, 0.88330078125, 0.924072265625, 0.96484375, 1.005615234375, 1.04638671875, 1.087158203125, 1.1279296875, 1.168701171875, 1.20947265625, 1.250244140625, 1.291015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 12.0, 24.0, 25.0, 58.0, 77.0, 111.0, 167.0, 244.0, 331.0, 498.0, 861.0, 1489.0, 2551.0, 5101.0, 9958.0, 21089.0, 45580.0, 99574.0, 198390.0, 276317.0, 197932.0, 99271.0, 46143.0, 21146.0, 10069.0, 4889.0, 2702.0, 1481.0, 866.0, 529.0, 335.0, 214.0, 157.0, 94.0, 70.0, 51.0, 31.0, 31.0, 20.0, 14.0, 5.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.53369140625, -0.5190696716308594, -0.5044479370117188, -0.4898262023925781, -0.4752044677734375, -0.4605827331542969, -0.44596099853515625, -0.4313392639160156, -0.416717529296875, -0.4020957946777344, -0.38747406005859375, -0.3728523254394531, -0.3582305908203125, -0.3436088562011719, -0.32898712158203125, -0.3143653869628906, -0.29974365234375, -0.2851219177246094, -0.27050018310546875, -0.2558784484863281, -0.2412567138671875, -0.22663497924804688, -0.21201324462890625, -0.19739151000976562, -0.182769775390625, -0.16814804077148438, -0.15352630615234375, -0.13890457153320312, -0.1242828369140625, -0.10966110229492188, -0.09503936767578125, -0.08041763305664062, -0.0657958984375, -0.051174163818359375, -0.03655242919921875, -0.021930694580078125, -0.0073089599609375, 0.007312774658203125, 0.02193450927734375, 0.036556243896484375, 0.051177978515625, 0.06579971313476562, 0.08042144775390625, 0.09504318237304688, 0.1096649169921875, 0.12428665161132812, 0.13890838623046875, 0.15353012084960938, 0.16815185546875, 0.18277359008789062, 0.19739532470703125, 0.21201705932617188, 0.2266387939453125, 0.24126052856445312, 0.25588226318359375, 0.2705039978027344, 0.285125732421875, 0.2997474670410156, 0.31436920166015625, 0.3289909362792969, 0.3436126708984375, 0.3582344055175781, 0.37285614013671875, 0.3874778747558594, 0.402099609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 2.0, 9.0, 7.0, 13.0, 7.0, 20.0, 13.0, 31.0, 22.0, 28.0, 24.0, 21.0, 31.0, 22.0, 16.0, 33.0, 33.0, 33.0, 44.0, 38.0, 37.0, 46.0, 37.0, 39.0, 47.0, 31.0, 28.0, 27.0, 24.0, 25.0, 21.0, 26.0, 23.0, 18.0, 23.0, 12.0, 12.0, 14.0, 10.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.56787109375, -0.5485000610351562, -0.5291290283203125, -0.5097579956054688, -0.490386962890625, -0.47101593017578125, -0.4516448974609375, -0.43227386474609375, -0.41290283203125, -0.39353179931640625, -0.3741607666015625, -0.35478973388671875, -0.335418701171875, -0.31604766845703125, -0.2966766357421875, -0.27730560302734375, -0.2579345703125, -0.23856353759765625, -0.2191925048828125, -0.19982147216796875, -0.180450439453125, -0.16107940673828125, -0.1417083740234375, -0.12233734130859375, -0.10296630859375, -0.08359527587890625, -0.0642242431640625, -0.04485321044921875, -0.025482177734375, -0.00611114501953125, 0.0132598876953125, 0.03263092041015625, 0.052001953125, 0.07137298583984375, 0.0907440185546875, 0.11011505126953125, 0.129486083984375, 0.14885711669921875, 0.1682281494140625, 0.18759918212890625, 0.20697021484375, 0.22634124755859375, 0.2457122802734375, 0.26508331298828125, 0.284454345703125, 0.30382537841796875, 0.3231964111328125, 0.34256744384765625, 0.3619384765625, 0.38130950927734375, 0.4006805419921875, 0.42005157470703125, 0.439422607421875, 0.45879364013671875, 0.4781646728515625, 0.49753570556640625, 0.51690673828125, 0.5362777709960938, 0.5556488037109375, 0.5750198364257812, 0.594390869140625, 0.6137619018554688, 0.6331329345703125, 0.6525039672851562, 0.671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 2.0, 16.0, 14.0, 34.0, 35.0, 45.0, 63.0, 93.0, 155.0, 224.0, 306.0, 520.0, 867.0, 1549.0, 3290.0, 8701.0, 36064.0, 429811.0, 509021.0, 40619.0, 9380.0, 3567.0, 1655.0, 952.0, 524.0, 364.0, 206.0, 135.0, 108.0, 70.0, 43.0, 32.0, 21.0, 13.0, 10.0, 9.0, 11.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.59375, -0.5768013000488281, -0.5598526000976562, -0.5429039001464844, -0.5259552001953125, -0.5090065002441406, -0.49205780029296875, -0.4751091003417969, -0.458160400390625, -0.4412117004394531, -0.42426300048828125, -0.4073143005371094, -0.3903656005859375, -0.3734169006347656, -0.35646820068359375, -0.3395195007324219, -0.32257080078125, -0.3056221008300781, -0.28867340087890625, -0.2717247009277344, -0.2547760009765625, -0.23782730102539062, -0.22087860107421875, -0.20392990112304688, -0.186981201171875, -0.17003250122070312, -0.15308380126953125, -0.13613510131835938, -0.1191864013671875, -0.10223770141601562, -0.08528900146484375, -0.06834030151367188, -0.0513916015625, -0.034442901611328125, -0.01749420166015625, -0.000545501708984375, 0.0164031982421875, 0.033351898193359375, 0.05030059814453125, 0.06724929809570312, 0.084197998046875, 0.10114669799804688, 0.11809539794921875, 0.13504409790039062, 0.1519927978515625, 0.16894149780273438, 0.18589019775390625, 0.20283889770507812, 0.21978759765625, 0.23673629760742188, 0.25368499755859375, 0.2706336975097656, 0.2875823974609375, 0.3045310974121094, 0.32147979736328125, 0.3384284973144531, 0.355377197265625, 0.3723258972167969, 0.38927459716796875, 0.4062232971191406, 0.4231719970703125, 0.4401206970214844, 0.45706939697265625, 0.4740180969238281, 0.490966796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 11.0, 12.0, 20.0, 54.0, 67.0, 94.0, 115.0, 132.0, 110.0, 125.0, 87.0, 68.0, 33.0, 26.0, 21.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7060508728027344e-05, -2.623721957206726e-05, -2.5413930416107178e-05, -2.4590641260147095e-05, -2.3767352104187012e-05, -2.294406294822693e-05, -2.2120773792266846e-05, -2.1297484636306763e-05, -2.047419548034668e-05, -1.9650906324386597e-05, -1.8827617168426514e-05, -1.800432801246643e-05, -1.7181038856506348e-05, -1.6357749700546265e-05, -1.553446054458618e-05, -1.4711171388626099e-05, -1.3887882232666016e-05, -1.3064593076705933e-05, -1.224130392074585e-05, -1.1418014764785767e-05, -1.0594725608825684e-05, -9.7714364528656e-06, -8.948147296905518e-06, -8.124858140945435e-06, -7.3015689849853516e-06, -6.4782798290252686e-06, -5.6549906730651855e-06, -4.8317015171051025e-06, -4.0084123611450195e-06, -3.1851232051849365e-06, -2.3618340492248535e-06, -1.5385448932647705e-06, -7.152557373046875e-07, 1.0803341865539551e-07, 9.313225746154785e-07, 1.7546117305755615e-06, 2.5779008865356445e-06, 3.4011900424957275e-06, 4.2244791984558105e-06, 5.0477683544158936e-06, 5.8710575103759766e-06, 6.6943466663360596e-06, 7.517635822296143e-06, 8.340924978256226e-06, 9.164214134216309e-06, 9.987503290176392e-06, 1.0810792446136475e-05, 1.1634081602096558e-05, 1.245737075805664e-05, 1.3280659914016724e-05, 1.4103949069976807e-05, 1.492723822593689e-05, 1.5750527381896973e-05, 1.6573816537857056e-05, 1.739710569381714e-05, 1.822039484977722e-05, 1.9043684005737305e-05, 1.9866973161697388e-05, 2.069026231765747e-05, 2.1513551473617554e-05, 2.2336840629577637e-05, 2.316012978553772e-05, 2.3983418941497803e-05, 2.4806708097457886e-05, 2.562999725341797e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 10.0, 7.0, 14.0, 26.0, 21.0, 38.0, 59.0, 56.0, 104.0, 129.0, 162.0, 249.0, 270.0, 353.0, 460.0, 659.0, 885.0, 1273.0, 1744.0, 2701.0, 4083.0, 7419.0, 15063.0, 36196.0, 98868.0, 284753.0, 360898.0, 139700.0, 48294.0, 19614.0, 9155.0, 5025.0, 3056.0, 1934.0, 1379.0, 998.0, 696.0, 548.0, 439.0, 302.0, 224.0, 178.0, 109.0, 118.0, 72.0, 68.0, 41.0, 34.0, 25.0, 19.0, 12.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2734375, -0.2649345397949219, -0.25643157958984375, -0.24792861938476562, -0.2394256591796875, -0.23092269897460938, -0.22241973876953125, -0.21391677856445312, -0.205413818359375, -0.19691085815429688, -0.18840789794921875, -0.17990493774414062, -0.1714019775390625, -0.16289901733398438, -0.15439605712890625, -0.14589309692382812, -0.13739013671875, -0.12888717651367188, -0.12038421630859375, -0.11188125610351562, -0.1033782958984375, -0.09487533569335938, -0.08637237548828125, -0.07786941528320312, -0.069366455078125, -0.060863494873046875, -0.05236053466796875, -0.043857574462890625, -0.0353546142578125, -0.026851654052734375, -0.01834869384765625, -0.009845733642578125, -0.0013427734375, 0.007160186767578125, 0.01566314697265625, 0.024166107177734375, 0.0326690673828125, 0.041172027587890625, 0.04967498779296875, 0.058177947998046875, 0.066680908203125, 0.07518386840820312, 0.08368682861328125, 0.09218978881835938, 0.1006927490234375, 0.10919570922851562, 0.11769866943359375, 0.12620162963867188, 0.13470458984375, 0.14320755004882812, 0.15171051025390625, 0.16021347045898438, 0.1687164306640625, 0.17721939086914062, 0.18572235107421875, 0.19422531127929688, 0.202728271484375, 0.21123123168945312, 0.21973419189453125, 0.22823715209960938, 0.2367401123046875, 0.24524307250976562, 0.25374603271484375, 0.2622489929199219, 0.270751953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 12.0, 16.0, 25.0, 65.0, 80.0, 151.0, 188.0, 150.0, 119.0, 59.0, 40.0, 23.0, 15.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11114501953125, -0.10774517059326172, -0.10434532165527344, -0.10094547271728516, -0.09754562377929688, -0.0941457748413086, -0.09074592590332031, -0.08734607696533203, -0.08394622802734375, -0.08054637908935547, -0.07714653015136719, -0.0737466812133789, -0.07034683227539062, -0.06694698333740234, -0.06354713439941406, -0.06014728546142578, -0.0567474365234375, -0.05334758758544922, -0.04994773864746094, -0.046547889709472656, -0.043148040771484375, -0.039748191833496094, -0.03634834289550781, -0.03294849395751953, -0.02954864501953125, -0.02614879608154297, -0.022748947143554688, -0.019349098205566406, -0.015949249267578125, -0.012549400329589844, -0.009149551391601562, -0.005749702453613281, -0.002349853515625, 0.0010499954223632812, 0.0044498443603515625, 0.007849693298339844, 0.011249542236328125, 0.014649391174316406, 0.018049240112304688, 0.02144908905029297, 0.02484893798828125, 0.02824878692626953, 0.03164863586425781, 0.035048484802246094, 0.038448333740234375, 0.041848182678222656, 0.04524803161621094, 0.04864788055419922, 0.0520477294921875, 0.05544757843017578, 0.05884742736816406, 0.062247276306152344, 0.06564712524414062, 0.0690469741821289, 0.07244682312011719, 0.07584667205810547, 0.07924652099609375, 0.08264636993408203, 0.08604621887207031, 0.0894460678100586, 0.09284591674804688, 0.09624576568603516, 0.09964561462402344, 0.10304546356201172, 0.1064453125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 3.0, 9.0, 10.0, 17.0, 13.0, 16.0, 27.0, 27.0, 23.0, 40.0, 51.0, 56.0, 40.0, 43.0, 40.0, 57.0, 57.0, 69.0, 62.0, 64.0, 47.0, 32.0, 33.0, 28.0, 18.0, 27.0, 16.0, 11.0, 12.0, 11.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5451518297195435, -1.4936035871505737, -1.442055344581604, -1.3905071020126343, -1.3389588594436646, -1.2874106168746948, -1.2358622550964355, -1.1843140125274658, -1.132765769958496, -1.0812175273895264, -1.0296692848205566, -0.9781210422515869, -0.9265727996826172, -0.8750245571136475, -0.823476254940033, -0.7719280123710632, -0.7203798294067383, -0.6688315868377686, -0.6172833442687988, -0.5657351016998291, -0.5141868591308594, -0.46263858675956726, -0.41109031438827515, -0.3595420718193054, -0.3079938292503357, -0.25644558668136597, -0.20489732921123505, -0.15334907174110413, -0.1018008291721344, -0.05025258660316467, 0.0012956857681274414, 0.05284392833709717, 0.10439229011535645, 0.15594053268432617, 0.2074887901544571, 0.259037047624588, 0.31058529019355774, 0.36213353276252747, 0.4136818051338196, 0.4652300477027893, 0.516778290271759, 0.5683265328407288, 0.6198747754096985, 0.671423077583313, 0.7229713201522827, 0.7745195627212524, 0.8260678052902222, 0.8776160478591919, 0.9291642904281616, 0.9807125329971313, 1.032260775566101, 1.0838090181350708, 1.1353572607040405, 1.1869055032730103, 1.2384538650512695, 1.2900021076202393, 1.341550350189209, 1.3930985927581787, 1.4446468353271484, 1.4961950778961182, 1.547743320465088, 1.5992915630340576, 1.6508398056030273, 1.702388048171997, 1.7539362907409668]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 9.0, 5.0, 8.0, 8.0, 9.0, 10.0, 15.0, 23.0, 14.0, 26.0, 29.0, 34.0, 39.0, 35.0, 38.0, 22.0, 40.0, 37.0, 42.0, 35.0, 41.0, 28.0, 32.0, 28.0, 50.0, 43.0, 40.0, 39.0, 31.0, 30.0, 14.0, 25.0, 14.0, 17.0, 19.0, 15.0, 14.0, 5.0, 6.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.084733486175537, -1.0531185865402222, -1.0215036869049072, -0.9898887872695923, -0.9582739472389221, -0.9266590476036072, -0.8950441479682922, -0.8634292483329773, -0.8318144083023071, -0.8001995086669922, -0.7685846090316772, -0.7369697093963623, -0.7053548693656921, -0.6737399697303772, -0.6421250700950623, -0.6105101704597473, -0.5788952708244324, -0.5472803711891174, -0.5156654715538025, -0.48405060172080994, -0.4524357318878174, -0.42082083225250244, -0.3892059326171875, -0.35759103298187256, -0.32597616314888, -0.29436126351356506, -0.2627463936805725, -0.23113149404525757, -0.19951660931110382, -0.16790172457695007, -0.13628682494163513, -0.10467194020748138, -0.07305705547332764, -0.04144216701388359, -0.009827278554439545, 0.0217876136302948, 0.05340249836444855, 0.0850173830986023, 0.11663228273391724, 0.14824716746807098, 0.17986205220222473, 0.21147693693637848, 0.24309182167053223, 0.27470672130584717, 0.3063216209411621, 0.33793649077415466, 0.3695513904094696, 0.40116626024246216, 0.4327811598777771, 0.46439605951309204, 0.4960109293460846, 0.5276257991790771, 0.5592406988143921, 0.590855598449707, 0.622470498085022, 0.6540853977203369, 0.6857002973556519, 0.7173151969909668, 0.7489300966262817, 0.7805449962615967, 0.8121598362922668, 0.8437747359275818, 0.8753896355628967, 0.9070045351982117, 0.9386193752288818]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 6.0, 5.0, 12.0, 13.0, 12.0, 23.0, 36.0, 49.0, 92.0, 137.0, 210.0, 384.0, 712.0, 1241.0, 2273.0, 4014.0, 7296.0, 13048.0, 22807.0, 38352.0, 61084.0, 91232.0, 122152.0, 143329.0, 145623.0, 127589.0, 97427.0, 67908.0, 42830.0, 25478.0, 14627.0, 8248.0, 4399.0, 2518.0, 1425.0, 834.0, 477.0, 242.0, 149.0, 97.0, 50.0, 38.0, 25.0, 15.0, 15.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.015777587890625, -0.97686767578125, -0.937957763671875, -0.8990478515625, -0.860137939453125, -0.82122802734375, -0.782318115234375, -0.743408203125, -0.704498291015625, -0.66558837890625, -0.626678466796875, -0.5877685546875, -0.548858642578125, -0.50994873046875, -0.471038818359375, -0.43212890625, -0.393218994140625, -0.35430908203125, -0.315399169921875, -0.2764892578125, -0.237579345703125, -0.19866943359375, -0.159759521484375, -0.120849609375, -0.081939697265625, -0.04302978515625, -0.004119873046875, 0.0347900390625, 0.073699951171875, 0.11260986328125, 0.151519775390625, 0.1904296875, 0.229339599609375, 0.26824951171875, 0.307159423828125, 0.3460693359375, 0.384979248046875, 0.42388916015625, 0.462799072265625, 0.501708984375, 0.540618896484375, 0.57952880859375, 0.618438720703125, 0.6573486328125, 0.696258544921875, 0.73516845703125, 0.774078369140625, 0.81298828125, 0.851898193359375, 0.89080810546875, 0.929718017578125, 0.9686279296875, 1.007537841796875, 1.04644775390625, 1.085357666015625, 1.124267578125, 1.163177490234375, 1.20208740234375, 1.240997314453125, 1.2799072265625, 1.318817138671875, 1.35772705078125, 1.396636962890625, 1.435546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 3.0, 6.0, 10.0, 8.0, 9.0, 18.0, 15.0, 17.0, 14.0, 27.0, 23.0, 34.0, 29.0, 28.0, 26.0, 28.0, 35.0, 37.0, 33.0, 25.0, 34.0, 42.0, 36.0, 34.0, 34.0, 35.0, 40.0, 35.0, 22.0, 28.0, 32.0, 28.0, 21.0, 27.0, 15.0, 18.0, 13.0, 14.0, 11.0, 11.0, 7.0, 4.0, 8.0, 4.0, 10.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.99609375, -0.9644775390625, -0.932861328125, -0.9012451171875, -0.86962890625, -0.8380126953125, -0.806396484375, -0.7747802734375, -0.7431640625, -0.7115478515625, -0.679931640625, -0.6483154296875, -0.61669921875, -0.5850830078125, -0.553466796875, -0.5218505859375, -0.490234375, -0.4586181640625, -0.427001953125, -0.3953857421875, -0.36376953125, -0.3321533203125, -0.300537109375, -0.2689208984375, -0.2373046875, -0.2056884765625, -0.174072265625, -0.1424560546875, -0.11083984375, -0.0792236328125, -0.047607421875, -0.0159912109375, 0.015625, 0.0472412109375, 0.078857421875, 0.1104736328125, 0.14208984375, 0.1737060546875, 0.205322265625, 0.2369384765625, 0.2685546875, 0.3001708984375, 0.331787109375, 0.3634033203125, 0.39501953125, 0.4266357421875, 0.458251953125, 0.4898681640625, 0.521484375, 0.5531005859375, 0.584716796875, 0.6163330078125, 0.64794921875, 0.6795654296875, 0.711181640625, 0.7427978515625, 0.7744140625, 0.8060302734375, 0.837646484375, 0.8692626953125, 0.90087890625, 0.9324951171875, 0.964111328125, 0.9957275390625, 1.02734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 15.0, 26.0, 34.0, 56.0, 75.0, 121.0, 226.0, 399.0, 700.0, 1088.0, 1722.0, 3012.0, 4984.0, 8379.0, 13891.0, 21694.0, 33191.0, 48950.0, 69343.0, 91114.0, 110539.0, 121366.0, 120343.0, 108176.0, 88922.0, 67483.0, 47664.0, 31834.0, 20388.0, 12991.0, 7889.0, 4780.0, 2863.0, 1694.0, 1065.0, 628.0, 358.0, 208.0, 124.0, 84.0, 46.0, 31.0, 21.0, 14.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0368804931640625, -1.004425048828125, -0.9719696044921875, -0.93951416015625, -0.9070587158203125, -0.874603271484375, -0.8421478271484375, -0.8096923828125, -0.7772369384765625, -0.744781494140625, -0.7123260498046875, -0.67987060546875, -0.6474151611328125, -0.614959716796875, -0.5825042724609375, -0.550048828125, -0.5175933837890625, -0.485137939453125, -0.4526824951171875, -0.42022705078125, -0.3877716064453125, -0.355316162109375, -0.3228607177734375, -0.2904052734375, -0.2579498291015625, -0.225494384765625, -0.1930389404296875, -0.16058349609375, -0.1281280517578125, -0.095672607421875, -0.0632171630859375, -0.03076171875, 0.0016937255859375, 0.034149169921875, 0.0666046142578125, 0.09906005859375, 0.1315155029296875, 0.163970947265625, 0.1964263916015625, 0.2288818359375, 0.2613372802734375, 0.293792724609375, 0.3262481689453125, 0.35870361328125, 0.3911590576171875, 0.423614501953125, 0.4560699462890625, 0.488525390625, 0.5209808349609375, 0.553436279296875, 0.5858917236328125, 0.61834716796875, 0.6508026123046875, 0.683258056640625, 0.7157135009765625, 0.7481689453125, 0.7806243896484375, 0.813079833984375, 0.8455352783203125, 0.87799072265625, 0.9104461669921875, 0.942901611328125, 0.9753570556640625, 1.0078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 8.0, 6.0, 13.0, 16.0, 15.0, 15.0, 26.0, 22.0, 22.0, 28.0, 28.0, 39.0, 39.0, 32.0, 32.0, 38.0, 41.0, 40.0, 29.0, 44.0, 42.0, 56.0, 37.0, 22.0, 32.0, 32.0, 33.0, 31.0, 17.0, 22.0, 17.0, 21.0, 20.0, 15.0, 9.0, 8.0, 5.0, 5.0, 11.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.6943359375, -0.6731109619140625, -0.651885986328125, -0.6306610107421875, -0.60943603515625, -0.5882110595703125, -0.566986083984375, -0.5457611083984375, -0.5245361328125, -0.5033111572265625, -0.482086181640625, -0.4608612060546875, -0.43963623046875, -0.4184112548828125, -0.397186279296875, -0.3759613037109375, -0.354736328125, -0.3335113525390625, -0.312286376953125, -0.2910614013671875, -0.26983642578125, -0.2486114501953125, -0.227386474609375, -0.2061614990234375, -0.1849365234375, -0.1637115478515625, -0.142486572265625, -0.1212615966796875, -0.10003662109375, -0.0788116455078125, -0.057586669921875, -0.0363616943359375, -0.01513671875, 0.0060882568359375, 0.027313232421875, 0.0485382080078125, 0.06976318359375, 0.0909881591796875, 0.112213134765625, 0.1334381103515625, 0.1546630859375, 0.1758880615234375, 0.197113037109375, 0.2183380126953125, 0.23956298828125, 0.2607879638671875, 0.282012939453125, 0.3032379150390625, 0.324462890625, 0.3456878662109375, 0.366912841796875, 0.3881378173828125, 0.40936279296875, 0.4305877685546875, 0.451812744140625, 0.4730377197265625, 0.4942626953125, 0.5154876708984375, 0.536712646484375, 0.5579376220703125, 0.57916259765625, 0.6003875732421875, 0.621612548828125, 0.6428375244140625, 0.6640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 10.0, 12.0, 11.0, 9.0, 20.0, 23.0, 46.0, 50.0, 88.0, 131.0, 161.0, 282.0, 387.0, 716.0, 940.0, 1534.0, 2416.0, 3875.0, 7295.0, 22962.0, 200420.0, 637312.0, 135941.0, 17513.0, 6396.0, 3667.0, 2365.0, 1340.0, 876.0, 574.0, 380.0, 252.0, 153.0, 110.0, 93.0, 56.0, 47.0, 20.0, 23.0, 13.0, 13.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.880859375, -2.77947998046875, -2.6781005859375, -2.57672119140625, -2.475341796875, -2.37396240234375, -2.2725830078125, -2.17120361328125, -2.06982421875, -1.96844482421875, -1.8670654296875, -1.76568603515625, -1.664306640625, -1.56292724609375, -1.4615478515625, -1.36016845703125, -1.2587890625, -1.15740966796875, -1.0560302734375, -0.95465087890625, -0.853271484375, -0.75189208984375, -0.6505126953125, -0.54913330078125, -0.44775390625, -0.34637451171875, -0.2449951171875, -0.14361572265625, -0.042236328125, 0.05914306640625, 0.1605224609375, 0.26190185546875, 0.36328125, 0.46466064453125, 0.5660400390625, 0.66741943359375, 0.768798828125, 0.87017822265625, 0.9715576171875, 1.07293701171875, 1.17431640625, 1.27569580078125, 1.3770751953125, 1.47845458984375, 1.579833984375, 1.68121337890625, 1.7825927734375, 1.88397216796875, 1.9853515625, 2.08673095703125, 2.1881103515625, 2.28948974609375, 2.390869140625, 2.49224853515625, 2.5936279296875, 2.69500732421875, 2.79638671875, 2.89776611328125, 2.9991455078125, 3.10052490234375, 3.201904296875, 3.30328369140625, 3.4046630859375, 3.50604248046875, 3.607421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 10.0, 27.0, 57.0, 98.0, 146.0, 205.0, 173.0, 135.0, 59.0, 35.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002510547637939453, -0.0002442058175802231, -0.00023735687136650085, -0.00023050792515277863, -0.0002236589789390564, -0.00021681003272533417, -0.00020996108651161194, -0.0002031121402978897, -0.00019626319408416748, -0.00018941424787044525, -0.00018256530165672302, -0.0001757163554430008, -0.00016886740922927856, -0.00016201846301555634, -0.0001551695168018341, -0.00014832057058811188, -0.00014147162437438965, -0.00013462267816066742, -0.0001277737319469452, -0.00012092478573322296, -0.00011407583951950073, -0.0001072268933057785, -0.00010037794709205627, -9.352900087833405e-05, -8.668005466461182e-05, -7.983110845088959e-05, -7.298216223716736e-05, -6.613321602344513e-05, -5.92842698097229e-05, -5.243532359600067e-05, -4.558637738227844e-05, -3.873743116855621e-05, -3.1888484954833984e-05, -2.5039538741111755e-05, -1.8190592527389526e-05, -1.1341646313667297e-05, -4.492700099945068e-06, 2.3562461137771606e-06, 9.20519232749939e-06, 1.605413854122162e-05, 2.2903084754943848e-05, 2.9752030968666077e-05, 3.6600977182388306e-05, 4.3449923396110535e-05, 5.0298869609832764e-05, 5.714781582355499e-05, 6.399676203727722e-05, 7.084570825099945e-05, 7.769465446472168e-05, 8.454360067844391e-05, 9.139254689216614e-05, 9.824149310588837e-05, 0.0001050904393196106, 0.00011193938553333282, 0.00011878833174705505, 0.00012563727796077728, 0.0001324862241744995, 0.00013933517038822174, 0.00014618411660194397, 0.0001530330628156662, 0.00015988200902938843, 0.00016673095524311066, 0.00017357990145683289, 0.00018042884767055511, 0.00018727779388427734]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 32.0, 38.0, 53.0, 65.0, 93.0, 137.0, 170.0, 295.0, 415.0, 596.0, 920.0, 1494.0, 2164.0, 3684.0, 7856.0, 29919.0, 198674.0, 553854.0, 199567.0, 30264.0, 7896.0, 3835.0, 2164.0, 1463.0, 918.0, 602.0, 404.0, 274.0, 185.0, 139.0, 95.0, 63.0, 55.0, 39.0, 23.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.76171875, -2.681671142578125, -2.60162353515625, -2.521575927734375, -2.4415283203125, -2.361480712890625, -2.28143310546875, -2.201385498046875, -2.121337890625, -2.041290283203125, -1.96124267578125, -1.881195068359375, -1.8011474609375, -1.721099853515625, -1.64105224609375, -1.561004638671875, -1.48095703125, -1.400909423828125, -1.32086181640625, -1.240814208984375, -1.1607666015625, -1.080718994140625, -1.00067138671875, -0.920623779296875, -0.840576171875, -0.760528564453125, -0.68048095703125, -0.600433349609375, -0.5203857421875, -0.440338134765625, -0.36029052734375, -0.280242919921875, -0.2001953125, -0.120147705078125, -0.04010009765625, 0.039947509765625, 0.1199951171875, 0.200042724609375, 0.28009033203125, 0.360137939453125, 0.440185546875, 0.520233154296875, 0.60028076171875, 0.680328369140625, 0.7603759765625, 0.840423583984375, 0.92047119140625, 1.000518798828125, 1.08056640625, 1.160614013671875, 1.24066162109375, 1.320709228515625, 1.4007568359375, 1.480804443359375, 1.56085205078125, 1.640899658203125, 1.720947265625, 1.800994873046875, 1.88104248046875, 1.961090087890625, 2.0411376953125, 2.121185302734375, 2.20123291015625, 2.281280517578125, 2.361328125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 9.0, 10.0, 13.0, 28.0, 25.0, 44.0, 32.0, 60.0, 69.0, 74.0, 74.0, 81.0, 88.0, 66.0, 70.0, 57.0, 37.0, 42.0, 23.0, 21.0, 10.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.292724609375, -0.28343963623046875, -0.2741546630859375, -0.26486968994140625, -0.255584716796875, -0.24629974365234375, -0.2370147705078125, -0.22772979736328125, -0.21844482421875, -0.20915985107421875, -0.1998748779296875, -0.19058990478515625, -0.181304931640625, -0.17201995849609375, -0.1627349853515625, -0.15345001220703125, -0.1441650390625, -0.13488006591796875, -0.1255950927734375, -0.11631011962890625, -0.107025146484375, -0.09774017333984375, -0.0884552001953125, -0.07917022705078125, -0.06988525390625, -0.06060028076171875, -0.0513153076171875, -0.04203033447265625, -0.032745361328125, -0.02346038818359375, -0.0141754150390625, -0.00489044189453125, 0.00439453125, 0.01367950439453125, 0.0229644775390625, 0.03224945068359375, 0.041534423828125, 0.05081939697265625, 0.0601043701171875, 0.06938934326171875, 0.07867431640625, 0.08795928955078125, 0.0972442626953125, 0.10652923583984375, 0.115814208984375, 0.12509918212890625, 0.1343841552734375, 0.14366912841796875, 0.1529541015625, 0.16223907470703125, 0.1715240478515625, 0.18080902099609375, 0.190093994140625, 0.19937896728515625, 0.2086639404296875, 0.21794891357421875, 0.22723388671875, 0.23651885986328125, 0.2458038330078125, 0.25508880615234375, 0.264373779296875, 0.27365875244140625, 0.2829437255859375, 0.29222869873046875, 0.301513671875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 8.0, 7.0, 11.0, 10.0, 12.0, 16.0, 20.0, 31.0, 26.0, 29.0, 44.0, 40.0, 45.0, 46.0, 50.0, 49.0, 54.0, 76.0, 60.0, 41.0, 48.0, 51.0, 37.0, 35.0, 26.0, 20.0, 13.0, 12.0, 15.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4523892402648926, -1.4023908376693726, -1.352392554283142, -1.302394151687622, -1.2523958683013916, -1.2023974657058716, -1.1523990631103516, -1.102400779724121, -1.0524024963378906, -1.0024040937423706, -0.9524058103561401, -0.9024074077606201, -0.8524091243743896, -0.8024107217788696, -0.7524123787879944, -0.7024140357971191, -0.6524156332015991, -0.6024172902107239, -0.5524189472198486, -0.5024205446243286, -0.45242223143577576, -0.4024238884449005, -0.3524255156517029, -0.30242717266082764, -0.2524288296699524, -0.20243048667907715, -0.1524321287870407, -0.10243377089500427, -0.05243542790412903, -0.002437084913253784, 0.04756128787994385, 0.09755963087081909, 0.1475580930709839, 0.19755643606185913, 0.24755479395389557, 0.297553151845932, 0.34755149483680725, 0.3975498378276825, 0.4475482106208801, 0.49754655361175537, 0.5475448966026306, 0.5975432395935059, 0.6475415825843811, 0.6975399255752563, 0.7475383281707764, 0.7975366115570068, 0.8475350141525269, 0.8975333571434021, 0.9475317001342773, 0.9975300431251526, 1.0475283861160278, 1.0975267887115479, 1.1475250720977783, 1.1975234746932983, 1.2475218772888184, 1.2975201606750488, 1.3475184440612793, 1.3975168466567993, 1.4475151300430298, 1.4975135326385498, 1.5475118160247803, 1.5975102186203003, 1.6475086212158203, 1.6975069046020508, 1.7475053071975708]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 10.0, 14.0, 14.0, 15.0, 12.0, 11.0, 27.0, 39.0, 29.0, 22.0, 31.0, 40.0, 30.0, 48.0, 40.0, 41.0, 37.0, 46.0, 35.0, 38.0, 40.0, 37.0, 41.0, 46.0, 31.0, 30.0, 30.0, 19.0, 18.0, 16.0, 11.0, 18.0, 13.0, 10.0, 9.0, 9.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9461370706558228, -0.9124075770378113, -0.8786780834197998, -0.8449485898017883, -0.8112190961837769, -0.7774896025657654, -0.7437601089477539, -0.7100306153297424, -0.676301121711731, -0.6425716280937195, -0.608842134475708, -0.5751126408576965, -0.5413831472396851, -0.5076536536216736, -0.4739241600036621, -0.44019466638565063, -0.40646517276763916, -0.3727356791496277, -0.3390061855316162, -0.30527669191360474, -0.27154719829559326, -0.2378177046775818, -0.2040882110595703, -0.17035871744155884, -0.13662922382354736, -0.10289973020553589, -0.06917023658752441, -0.03544074296951294, -0.0017112493515014648, 0.03201824426651001, 0.06574773788452148, 0.09947723150253296, 0.13320660591125488, 0.16693609952926636, 0.20066559314727783, 0.2343950867652893, 0.2681245803833008, 0.30185407400131226, 0.33558356761932373, 0.3693130612373352, 0.4030425548553467, 0.43677204847335815, 0.47050154209136963, 0.5042310357093811, 0.5379605293273926, 0.571690022945404, 0.6054195165634155, 0.639149010181427, 0.6728785037994385, 0.70660799741745, 0.7403374910354614, 0.7740669846534729, 0.8077964782714844, 0.8415259718894958, 0.8752554655075073, 0.9089849591255188, 0.9427144527435303, 0.9764439463615417, 1.0101734399795532, 1.04390287399292, 1.0776324272155762, 1.1113619804382324, 1.1450914144515991, 1.1788208484649658, 1.212550401687622]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 10.0, 14.0, 20.0, 47.0, 74.0, 134.0, 214.0, 368.0, 632.0, 1061.0, 1799.0, 3203.0, 6021.0, 11090.0, 20479.0, 39249.0, 72928.0, 136052.0, 243458.0, 407757.0, 595266.0, 715323.0, 678755.0, 515434.0, 330522.0, 191268.0, 104274.0, 55907.0, 29351.0, 15477.0, 8022.0, 4434.0, 2479.0, 1335.0, 711.0, 462.0, 249.0, 154.0, 102.0, 50.0, 36.0, 21.0, 9.0, 7.0, 11.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2646484375, -1.2174224853515625, -1.170196533203125, -1.1229705810546875, -1.07574462890625, -1.0285186767578125, -0.981292724609375, -0.9340667724609375, -0.8868408203125, -0.8396148681640625, -0.792388916015625, -0.7451629638671875, -0.69793701171875, -0.6507110595703125, -0.603485107421875, -0.5562591552734375, -0.509033203125, -0.4618072509765625, -0.414581298828125, -0.3673553466796875, -0.32012939453125, -0.2729034423828125, -0.225677490234375, -0.1784515380859375, -0.1312255859375, -0.0839996337890625, -0.036773681640625, 0.0104522705078125, 0.05767822265625, 0.1049041748046875, 0.152130126953125, 0.1993560791015625, 0.24658203125, 0.2938079833984375, 0.341033935546875, 0.3882598876953125, 0.43548583984375, 0.4827117919921875, 0.529937744140625, 0.5771636962890625, 0.6243896484375, 0.6716156005859375, 0.718841552734375, 0.7660675048828125, 0.81329345703125, 0.8605194091796875, 0.907745361328125, 0.9549713134765625, 1.002197265625, 1.0494232177734375, 1.096649169921875, 1.1438751220703125, 1.19110107421875, 1.2383270263671875, 1.285552978515625, 1.3327789306640625, 1.3800048828125, 1.4272308349609375, 1.474456787109375, 1.5216827392578125, 1.56890869140625, 1.6161346435546875, 1.663360595703125, 1.7105865478515625, 1.7578125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 7.0, 10.0, 16.0, 14.0, 18.0, 17.0, 29.0, 27.0, 28.0, 41.0, 35.0, 49.0, 53.0, 46.0, 53.0, 54.0, 63.0, 47.0, 58.0, 40.0, 52.0, 32.0, 32.0, 36.0, 23.0, 28.0, 15.0, 17.0, 10.0, 19.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9773101806640625, -0.941925048828125, -0.9065399169921875, -0.87115478515625, -0.8357696533203125, -0.800384521484375, -0.7649993896484375, -0.7296142578125, -0.6942291259765625, -0.658843994140625, -0.6234588623046875, -0.58807373046875, -0.5526885986328125, -0.517303466796875, -0.4819183349609375, -0.446533203125, -0.4111480712890625, -0.375762939453125, -0.3403778076171875, -0.30499267578125, -0.2696075439453125, -0.234222412109375, -0.1988372802734375, -0.1634521484375, -0.1280670166015625, -0.092681884765625, -0.0572967529296875, -0.02191162109375, 0.0134735107421875, 0.048858642578125, 0.0842437744140625, 0.11962890625, 0.1550140380859375, 0.190399169921875, 0.2257843017578125, 0.26116943359375, 0.2965545654296875, 0.331939697265625, 0.3673248291015625, 0.4027099609375, 0.4380950927734375, 0.473480224609375, 0.5088653564453125, 0.54425048828125, 0.5796356201171875, 0.615020751953125, 0.6504058837890625, 0.685791015625, 0.7211761474609375, 0.756561279296875, 0.7919464111328125, 0.82733154296875, 0.8627166748046875, 0.898101806640625, 0.9334869384765625, 0.9688720703125, 1.0042572021484375, 1.039642333984375, 1.0750274658203125, 1.11041259765625, 1.1457977294921875, 1.181182861328125, 1.2165679931640625, 1.251953125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 15.0, 23.0, 38.0, 61.0, 103.0, 157.0, 284.0, 415.0, 661.0, 1177.0, 1817.0, 2773.0, 4503.0, 7114.0, 11331.0, 18261.0, 28860.0, 45113.0, 70205.0, 107095.0, 160165.0, 228873.0, 312064.0, 395004.0, 460143.0, 484807.0, 459232.0, 394357.0, 311583.0, 228009.0, 160185.0, 107599.0, 70442.0, 45002.0, 28526.0, 17976.0, 11296.0, 7058.0, 4404.0, 2856.0, 1727.0, 1111.0, 717.0, 424.0, 251.0, 182.0, 110.0, 59.0, 37.0, 30.0, 21.0, 11.0, 4.0, 4.0, 7.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0959014892578125, -1.059967041015625, -1.0240325927734375, -0.98809814453125, -0.9521636962890625, -0.916229248046875, -0.8802947998046875, -0.8443603515625, -0.8084259033203125, -0.772491455078125, -0.7365570068359375, -0.70062255859375, -0.6646881103515625, -0.628753662109375, -0.5928192138671875, -0.556884765625, -0.5209503173828125, -0.485015869140625, -0.4490814208984375, -0.41314697265625, -0.3772125244140625, -0.341278076171875, -0.3053436279296875, -0.2694091796875, -0.2334747314453125, -0.197540283203125, -0.1616058349609375, -0.12567138671875, -0.0897369384765625, -0.053802490234375, -0.0178680419921875, 0.01806640625, 0.0540008544921875, 0.089935302734375, 0.1258697509765625, 0.16180419921875, 0.1977386474609375, 0.233673095703125, 0.2696075439453125, 0.3055419921875, 0.3414764404296875, 0.377410888671875, 0.4133453369140625, 0.44927978515625, 0.4852142333984375, 0.521148681640625, 0.5570831298828125, 0.593017578125, 0.6289520263671875, 0.664886474609375, 0.7008209228515625, 0.73675537109375, 0.7726898193359375, 0.808624267578125, 0.8445587158203125, 0.8804931640625, 0.9164276123046875, 0.952362060546875, 0.9882965087890625, 1.02423095703125, 1.0601654052734375, 1.096099853515625, 1.1320343017578125, 1.16796875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 5.0, 15.0, 21.0, 19.0, 24.0, 41.0, 49.0, 56.0, 66.0, 72.0, 89.0, 86.0, 92.0, 140.0, 127.0, 155.0, 179.0, 191.0, 192.0, 222.0, 184.0, 216.0, 211.0, 202.0, 184.0, 167.0, 148.0, 143.0, 144.0, 97.0, 100.0, 61.0, 80.0, 69.0, 53.0, 36.0, 28.0, 25.0, 23.0, 9.0, 13.0, 6.0, 3.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.4287147521972656, -0.41431427001953125, -0.3999137878417969, -0.3855133056640625, -0.3711128234863281, -0.35671234130859375, -0.3423118591308594, -0.327911376953125, -0.3135108947753906, -0.29911041259765625, -0.2847099304199219, -0.2703094482421875, -0.2559089660644531, -0.24150848388671875, -0.22710800170898438, -0.21270751953125, -0.19830703735351562, -0.18390655517578125, -0.16950607299804688, -0.1551055908203125, -0.14070510864257812, -0.12630462646484375, -0.11190414428710938, -0.097503662109375, -0.08310317993164062, -0.06870269775390625, -0.054302215576171875, -0.0399017333984375, -0.025501251220703125, -0.01110076904296875, 0.003299713134765625, 0.0177001953125, 0.032100677490234375, 0.04650115966796875, 0.060901641845703125, 0.0753021240234375, 0.08970260620117188, 0.10410308837890625, 0.11850357055664062, 0.132904052734375, 0.14730453491210938, 0.16170501708984375, 0.17610549926757812, 0.1905059814453125, 0.20490646362304688, 0.21930694580078125, 0.23370742797851562, 0.24810791015625, 0.2625083923339844, 0.27690887451171875, 0.2913093566894531, 0.3057098388671875, 0.3201103210449219, 0.33451080322265625, 0.3489112854003906, 0.363311767578125, 0.3777122497558594, 0.39211273193359375, 0.4065132141113281, 0.4209136962890625, 0.4353141784667969, 0.44971466064453125, 0.4641151428222656, 0.478515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 7.0, 1.0, 3.0, 8.0, 9.0, 21.0, 4.0, 24.0, 27.0, 17.0, 29.0, 37.0, 31.0, 35.0, 49.0, 47.0, 49.0, 40.0, 48.0, 54.0, 40.0, 61.0, 48.0, 45.0, 51.0, 39.0, 34.0, 10.0, 22.0, 22.0, 11.0, 7.0, 11.0, 12.0, 9.0, 4.0, 2.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.58762526512146, -1.5393799543380737, -1.491134524345398, -1.4428892135620117, -1.394643783569336, -1.3463984727859497, -1.2981531620025635, -1.2499077320098877, -1.2016624212265015, -1.1534171104431152, -1.1051716804504395, -1.0569263696670532, -1.008681058883667, -0.9604356288909912, -0.912190318107605, -0.863944947719574, -0.815699577331543, -0.767454206943512, -0.719208836555481, -0.6709635257720947, -0.6227181553840637, -0.5744727849960327, -0.5262274742126465, -0.4779821038246155, -0.4297367334365845, -0.38149136304855347, -0.33324602246284485, -0.28500068187713623, -0.23675531148910522, -0.1885099560022354, -0.1402646005153656, -0.09201925992965698, -0.04377400875091553, 0.004471346735954285, 0.0527167022228241, 0.10096205770969391, 0.14920741319656372, 0.19745276868343353, 0.24569812417030334, 0.29394346475601196, 0.34218883514404297, 0.390434205532074, 0.4386795461177826, 0.4869248867034912, 0.5351702570915222, 0.5834156274795532, 0.6316609382629395, 0.6799063086509705, 0.7281516790390015, 0.7763970494270325, 0.8246424198150635, 0.8728877305984497, 0.9211331009864807, 0.9693784713745117, 1.017623782157898, 1.0658690929412842, 1.11411452293396, 1.1623598337173462, 1.210605263710022, 1.2588505744934082, 1.307096004486084, 1.3553413152694702, 1.4035866260528564, 1.4518320560455322, 1.5000773668289185]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 6.0, 8.0, 5.0, 8.0, 10.0, 14.0, 7.0, 19.0, 25.0, 15.0, 23.0, 26.0, 29.0, 31.0, 33.0, 30.0, 26.0, 41.0, 44.0, 38.0, 39.0, 40.0, 44.0, 33.0, 41.0, 34.0, 41.0, 33.0, 22.0, 33.0, 37.0, 34.0, 19.0, 18.0, 18.0, 15.0, 13.0, 7.0, 7.0, 13.0, 7.0, 3.0, 7.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9469460844993591, -0.91257643699646, -0.878206729888916, -0.8438370823860168, -0.8094674348831177, -0.7750977873802185, -0.7407281398773193, -0.7063584327697754, -0.6719887852668762, -0.637619137763977, -0.6032494306564331, -0.5688797831535339, -0.5345101356506348, -0.5001404881477356, -0.46577081084251404, -0.4314011335372925, -0.3970314860343933, -0.36266183853149414, -0.3282921612262726, -0.293922483921051, -0.25955283641815186, -0.2251831740140915, -0.19081351161003113, -0.15644384920597076, -0.1220741868019104, -0.08770452439785004, -0.05333486199378967, -0.01896519958972931, 0.015404462814331055, 0.04977412521839142, 0.08414378762245178, 0.11851345002651215, 0.15288305282592773, 0.1872527152299881, 0.22162237763404846, 0.25599205493927, 0.2903617024421692, 0.32473134994506836, 0.3591010272502899, 0.3934707045555115, 0.42784035205841064, 0.4622099995613098, 0.49657967686653137, 0.5309493541717529, 0.5653190016746521, 0.5996886491775513, 0.6340583562850952, 0.6684280037879944, 0.7027976512908936, 0.7371672987937927, 0.7715369462966919, 0.8059066534042358, 0.840276300907135, 0.8746459484100342, 0.9090156555175781, 0.9433853030204773, 0.9777549505233765, 1.0121246576309204, 1.0464942455291748, 1.0808639526367188, 1.1152336597442627, 1.149603247642517, 1.183972954750061, 1.2183425426483154, 1.2527122497558594]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 13.0, 17.0, 29.0, 58.0, 80.0, 132.0, 217.0, 323.0, 509.0, 782.0, 1239.0, 1847.0, 2890.0, 4691.0, 7261.0, 11411.0, 17941.0, 28141.0, 44028.0, 66459.0, 97515.0, 131501.0, 153763.0, 144211.0, 110781.0, 78027.0, 51626.0, 33684.0, 21337.0, 13813.0, 8786.0, 5674.0, 3549.0, 2228.0, 1407.0, 933.0, 575.0, 392.0, 260.0, 143.0, 96.0, 64.0, 41.0, 31.0, 17.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22998046875, -0.22223663330078125, -0.2144927978515625, -0.20674896240234375, -0.199005126953125, -0.19126129150390625, -0.1835174560546875, -0.17577362060546875, -0.16802978515625, -0.16028594970703125, -0.1525421142578125, -0.14479827880859375, -0.137054443359375, -0.12931060791015625, -0.1215667724609375, -0.11382293701171875, -0.1060791015625, -0.09833526611328125, -0.0905914306640625, -0.08284759521484375, -0.075103759765625, -0.06735992431640625, -0.0596160888671875, -0.05187225341796875, -0.04412841796875, -0.03638458251953125, -0.0286407470703125, -0.02089691162109375, -0.013153076171875, -0.00540924072265625, 0.0023345947265625, 0.01007843017578125, 0.017822265625, 0.02556610107421875, 0.0333099365234375, 0.04105377197265625, 0.048797607421875, 0.05654144287109375, 0.0642852783203125, 0.07202911376953125, 0.07977294921875, 0.08751678466796875, 0.0952606201171875, 0.10300445556640625, 0.110748291015625, 0.11849212646484375, 0.1262359619140625, 0.13397979736328125, 0.1417236328125, 0.14946746826171875, 0.1572113037109375, 0.16495513916015625, 0.172698974609375, 0.18044281005859375, 0.1881866455078125, 0.19593048095703125, 0.20367431640625, 0.21141815185546875, 0.2191619873046875, 0.22690582275390625, 0.234649658203125, 0.24239349365234375, 0.2501373291015625, 0.25788116455078125, 0.265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 7.0, 4.0, 6.0, 3.0, 8.0, 10.0, 17.0, 16.0, 21.0, 29.0, 18.0, 30.0, 41.0, 39.0, 35.0, 35.0, 39.0, 43.0, 35.0, 40.0, 37.0, 54.0, 32.0, 39.0, 43.0, 32.0, 45.0, 27.0, 31.0, 37.0, 25.0, 23.0, 18.0, 12.0, 11.0, 12.0, 7.0, 9.0, 2.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2645416259765625, -1.225372314453125, -1.1862030029296875, -1.14703369140625, -1.1078643798828125, -1.068695068359375, -1.0295257568359375, -0.9903564453125, -0.9511871337890625, -0.912017822265625, -0.8728485107421875, -0.83367919921875, -0.7945098876953125, -0.755340576171875, -0.7161712646484375, -0.677001953125, -0.6378326416015625, -0.598663330078125, -0.5594940185546875, -0.52032470703125, -0.4811553955078125, -0.441986083984375, -0.4028167724609375, -0.3636474609375, -0.3244781494140625, -0.285308837890625, -0.2461395263671875, -0.20697021484375, -0.1678009033203125, -0.128631591796875, -0.0894622802734375, -0.05029296875, -0.0111236572265625, 0.028045654296875, 0.0672149658203125, 0.10638427734375, 0.1455535888671875, 0.184722900390625, 0.2238922119140625, 0.2630615234375, 0.3022308349609375, 0.341400146484375, 0.3805694580078125, 0.41973876953125, 0.4589080810546875, 0.498077392578125, 0.5372467041015625, 0.576416015625, 0.6155853271484375, 0.654754638671875, 0.6939239501953125, 0.73309326171875, 0.7722625732421875, 0.811431884765625, 0.8506011962890625, 0.8897705078125, 0.9289398193359375, 0.968109130859375, 1.0072784423828125, 1.04644775390625, 1.0856170654296875, 1.124786376953125, 1.1639556884765625, 1.203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 4.0, 13.0, 17.0, 16.0, 32.0, 70.0, 63.0, 132.0, 169.0, 250.0, 485.0, 729.0, 1315.0, 2065.0, 3783.0, 6854.0, 12615.0, 24199.0, 45849.0, 87053.0, 153431.0, 218223.0, 203564.0, 132397.0, 72529.0, 38114.0, 20149.0, 10826.0, 5734.0, 3248.0, 1827.0, 1050.0, 654.0, 389.0, 238.0, 164.0, 95.0, 54.0, 45.0, 30.0, 21.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3344306945800781, -0.32242584228515625, -0.3104209899902344, -0.2984161376953125, -0.2864112854003906, -0.27440643310546875, -0.2624015808105469, -0.250396728515625, -0.23839187622070312, -0.22638702392578125, -0.21438217163085938, -0.2023773193359375, -0.19037246704101562, -0.17836761474609375, -0.16636276245117188, -0.15435791015625, -0.14235305786132812, -0.13034820556640625, -0.11834335327148438, -0.1063385009765625, -0.09433364868164062, -0.08232879638671875, -0.07032394409179688, -0.058319091796875, -0.046314239501953125, -0.03430938720703125, -0.022304534912109375, -0.0102996826171875, 0.001705169677734375, 0.01371002197265625, 0.025714874267578125, 0.0377197265625, 0.049724578857421875, 0.06172943115234375, 0.07373428344726562, 0.0857391357421875, 0.09774398803710938, 0.10974884033203125, 0.12175369262695312, 0.133758544921875, 0.14576339721679688, 0.15776824951171875, 0.16977310180664062, 0.1817779541015625, 0.19378280639648438, 0.20578765869140625, 0.21779251098632812, 0.22979736328125, 0.24180221557617188, 0.25380706787109375, 0.2658119201660156, 0.2778167724609375, 0.2898216247558594, 0.30182647705078125, 0.3138313293457031, 0.325836181640625, 0.3378410339355469, 0.34984588623046875, 0.3618507385253906, 0.3738555908203125, 0.3858604431152344, 0.39786529541015625, 0.4098701477050781, 0.421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 15.0, 9.0, 12.0, 15.0, 18.0, 14.0, 20.0, 30.0, 21.0, 22.0, 25.0, 30.0, 25.0, 37.0, 48.0, 44.0, 34.0, 40.0, 42.0, 50.0, 34.0, 42.0, 43.0, 37.0, 32.0, 32.0, 43.0, 18.0, 36.0, 14.0, 14.0, 13.0, 11.0, 11.0, 8.0, 12.0, 9.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72607421875, -0.7030868530273438, -0.6800994873046875, -0.6571121215820312, -0.634124755859375, -0.6111373901367188, -0.5881500244140625, -0.5651626586914062, -0.54217529296875, -0.5191879272460938, -0.4962005615234375, -0.47321319580078125, -0.450225830078125, -0.42723846435546875, -0.4042510986328125, -0.38126373291015625, -0.3582763671875, -0.33528900146484375, -0.3123016357421875, -0.28931427001953125, -0.266326904296875, -0.24333953857421875, -0.2203521728515625, -0.19736480712890625, -0.17437744140625, -0.15139007568359375, -0.1284027099609375, -0.10541534423828125, -0.082427978515625, -0.05944061279296875, -0.0364532470703125, -0.01346588134765625, 0.009521484375, 0.03250885009765625, 0.0554962158203125, 0.07848358154296875, 0.101470947265625, 0.12445831298828125, 0.1474456787109375, 0.17043304443359375, 0.19342041015625, 0.21640777587890625, 0.2393951416015625, 0.26238250732421875, 0.285369873046875, 0.30835723876953125, 0.3313446044921875, 0.35433197021484375, 0.3773193359375, 0.40030670166015625, 0.4232940673828125, 0.44628143310546875, 0.469268798828125, 0.49225616455078125, 0.5152435302734375, 0.5382308959960938, 0.56121826171875, 0.5842056274414062, 0.6071929931640625, 0.6301803588867188, 0.653167724609375, 0.6761550903320312, 0.6991424560546875, 0.7221298217773438, 0.7451171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 32.0, 23.0, 46.0, 54.0, 102.0, 160.0, 184.0, 321.0, 511.0, 749.0, 1195.0, 1951.0, 3226.0, 5470.0, 10192.0, 20521.0, 47821.0, 132885.0, 374830.0, 283790.0, 92254.0, 35682.0, 16228.0, 8277.0, 4553.0, 2758.0, 1689.0, 1065.0, 693.0, 423.0, 242.0, 169.0, 99.0, 105.0, 70.0, 36.0, 26.0, 27.0, 15.0, 13.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.199462890625, -0.19373703002929688, -0.18801116943359375, -0.18228530883789062, -0.1765594482421875, -0.17083358764648438, -0.16510772705078125, -0.15938186645507812, -0.153656005859375, -0.14793014526367188, -0.14220428466796875, -0.13647842407226562, -0.1307525634765625, -0.12502670288085938, -0.11930084228515625, -0.11357498168945312, -0.10784912109375, -0.10212326049804688, -0.09639739990234375, -0.09067153930664062, -0.0849456787109375, -0.07921981811523438, -0.07349395751953125, -0.06776809692382812, -0.062042236328125, -0.056316375732421875, -0.05059051513671875, -0.044864654541015625, -0.0391387939453125, -0.033412933349609375, -0.02768707275390625, -0.021961212158203125, -0.0162353515625, -0.010509490966796875, -0.00478363037109375, 0.000942230224609375, 0.0066680908203125, 0.012393951416015625, 0.01811981201171875, 0.023845672607421875, 0.029571533203125, 0.035297393798828125, 0.04102325439453125, 0.046749114990234375, 0.0524749755859375, 0.058200836181640625, 0.06392669677734375, 0.06965255737304688, 0.07537841796875, 0.08110427856445312, 0.08683013916015625, 0.09255599975585938, 0.0982818603515625, 0.10400772094726562, 0.10973358154296875, 0.11545944213867188, 0.121185302734375, 0.12691116333007812, 0.13263702392578125, 0.13836288452148438, 0.1440887451171875, 0.14981460571289062, 0.15554046630859375, 0.16126632690429688, 0.1669921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 8.0, 12.0, 6.0, 12.0, 11.0, 6.0, 14.0, 20.0, 10.0, 15.0, 18.0, 15.0, 26.0, 30.0, 46.0, 36.0, 36.0, 37.0, 46.0, 37.0, 43.0, 44.0, 41.0, 32.0, 30.0, 40.0, 50.0, 46.0, 29.0, 26.0, 29.0, 27.0, 15.0, 21.0, 16.0, 15.0, 7.0, 15.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.445923984050751e-06, -7.202848792076111e-06, -6.959773600101471e-06, -6.716698408126831e-06, -6.473623216152191e-06, -6.230548024177551e-06, -5.987472832202911e-06, -5.7443976402282715e-06, -5.501322448253632e-06, -5.258247256278992e-06, -5.015172064304352e-06, -4.772096872329712e-06, -4.529021680355072e-06, -4.285946488380432e-06, -4.042871296405792e-06, -3.7997961044311523e-06, -3.5567209124565125e-06, -3.3136457204818726e-06, -3.0705705285072327e-06, -2.8274953365325928e-06, -2.584420144557953e-06, -2.341344952583313e-06, -2.098269760608673e-06, -1.8551945686340332e-06, -1.6121193766593933e-06, -1.3690441846847534e-06, -1.1259689927101135e-06, -8.828938007354736e-07, -6.398186087608337e-07, -3.9674341678619385e-07, -1.5366822481155396e-07, 8.940696716308594e-08, 3.3248215913772583e-07, 5.755573511123657e-07, 8.186325430870056e-07, 1.0617077350616455e-06, 1.3047829270362854e-06, 1.5478581190109253e-06, 1.7909333109855652e-06, 2.034008502960205e-06, 2.277083694934845e-06, 2.520158886909485e-06, 2.7632340788841248e-06, 3.0063092708587646e-06, 3.2493844628334045e-06, 3.4924596548080444e-06, 3.7355348467826843e-06, 3.978610038757324e-06, 4.221685230731964e-06, 4.464760422706604e-06, 4.707835614681244e-06, 4.950910806655884e-06, 5.193985998630524e-06, 5.4370611906051636e-06, 5.6801363825798035e-06, 5.923211574554443e-06, 6.166286766529083e-06, 6.409361958503723e-06, 6.652437150478363e-06, 6.895512342453003e-06, 7.138587534427643e-06, 7.381662726402283e-06, 7.624737918376923e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 12.0, 23.0, 30.0, 36.0, 62.0, 116.0, 164.0, 239.0, 424.0, 666.0, 1065.0, 1836.0, 3230.0, 5851.0, 11140.0, 22446.0, 46314.0, 101049.0, 209933.0, 286311.0, 186535.0, 88597.0, 40421.0, 19503.0, 10092.0, 5292.0, 2853.0, 1686.0, 985.0, 625.0, 366.0, 221.0, 153.0, 120.0, 59.0, 43.0, 16.0, 16.0, 7.0, 1.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.197998046875, -0.19256019592285156, -0.18712234497070312, -0.1816844940185547, -0.17624664306640625, -0.1708087921142578, -0.16537094116210938, -0.15993309020996094, -0.1544952392578125, -0.14905738830566406, -0.14361953735351562, -0.1381816864013672, -0.13274383544921875, -0.1273059844970703, -0.12186813354492188, -0.11643028259277344, -0.110992431640625, -0.10555458068847656, -0.10011672973632812, -0.09467887878417969, -0.08924102783203125, -0.08380317687988281, -0.07836532592773438, -0.07292747497558594, -0.0674896240234375, -0.06205177307128906, -0.056613922119140625, -0.05117607116699219, -0.04573822021484375, -0.04030036926269531, -0.034862518310546875, -0.029424667358398438, -0.02398681640625, -0.018548965454101562, -0.013111114501953125, -0.0076732635498046875, -0.00223541259765625, 0.0032024383544921875, 0.008640289306640625, 0.014078140258789062, 0.0195159912109375, 0.024953842163085938, 0.030391693115234375, 0.03582954406738281, 0.04126739501953125, 0.04670524597167969, 0.052143096923828125, 0.05758094787597656, 0.063018798828125, 0.06845664978027344, 0.07389450073242188, 0.07933235168457031, 0.08477020263671875, 0.09020805358886719, 0.09564590454101562, 0.10108375549316406, 0.1065216064453125, 0.11195945739746094, 0.11739730834960938, 0.12283515930175781, 0.12827301025390625, 0.1337108612060547, 0.13914871215820312, 0.14458656311035156, 0.1500244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 8.0, 5.0, 11.0, 14.0, 20.0, 12.0, 13.0, 18.0, 36.0, 37.0, 40.0, 36.0, 49.0, 58.0, 58.0, 65.0, 49.0, 57.0, 44.0, 44.0, 40.0, 41.0, 34.0, 31.0, 25.0, 25.0, 19.0, 17.0, 10.0, 7.0, 9.0, 13.0, 6.0, 8.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.036956787109375, -0.0358738899230957, -0.034790992736816406, -0.03370809555053711, -0.03262519836425781, -0.031542301177978516, -0.03045940399169922, -0.029376506805419922, -0.028293609619140625, -0.027210712432861328, -0.02612781524658203, -0.025044918060302734, -0.023962020874023438, -0.02287912368774414, -0.021796226501464844, -0.020713329315185547, -0.01963043212890625, -0.018547534942626953, -0.017464637756347656, -0.01638174057006836, -0.015298843383789062, -0.014215946197509766, -0.013133049011230469, -0.012050151824951172, -0.010967254638671875, -0.009884357452392578, -0.008801460266113281, -0.007718563079833984, -0.0066356658935546875, -0.005552768707275391, -0.004469871520996094, -0.003386974334716797, -0.0023040771484375, -0.0012211799621582031, -0.00013828277587890625, 0.0009446144104003906, 0.0020275115966796875, 0.0031104087829589844, 0.004193305969238281, 0.005276203155517578, 0.006359100341796875, 0.007441997528076172, 0.008524894714355469, 0.009607791900634766, 0.010690689086914062, 0.01177358627319336, 0.012856483459472656, 0.013939380645751953, 0.01502227783203125, 0.016105175018310547, 0.017188072204589844, 0.01827096939086914, 0.019353866577148438, 0.020436763763427734, 0.02151966094970703, 0.022602558135986328, 0.023685455322265625, 0.024768352508544922, 0.02585124969482422, 0.026934146881103516, 0.028017044067382812, 0.02909994125366211, 0.030182838439941406, 0.0312657356262207, 0.0323486328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 1.0, 1.0, 9.0, 8.0, 15.0, 14.0, 18.0, 26.0, 26.0, 23.0, 32.0, 25.0, 36.0, 49.0, 51.0, 45.0, 37.0, 51.0, 54.0, 48.0, 56.0, 47.0, 41.0, 46.0, 47.0, 32.0, 20.0, 21.0, 17.0, 16.0, 11.0, 9.0, 10.0, 11.0, 5.0, 3.0, 7.0, 3.0, 6.0, 5.0, 0.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.542368769645691, -1.4943792819976807, -1.44638991355896, -1.3984004259109497, -1.3504109382629395, -1.3024214506149292, -1.254431962966919, -1.2064425945281982, -1.158453106880188, -1.1104636192321777, -1.062474250793457, -1.0144847631454468, -0.9664952754974365, -0.9185057878494263, -0.8705163598060608, -0.8225269317626953, -0.7745374441146851, -0.7265479564666748, -0.6785585284233093, -0.6305691003799438, -0.5825796127319336, -0.5345901250839233, -0.48660069704055786, -0.43861123919487, -0.39062178134918213, -0.34263232350349426, -0.2946428656578064, -0.24665340781211853, -0.19866394996643066, -0.1506744921207428, -0.10268503427505493, -0.054695576429367065, -0.0067059993743896484, 0.04128345847129822, 0.08927291631698608, 0.13726237416267395, 0.18525183200836182, 0.23324128985404968, 0.28123074769973755, 0.3292202055454254, 0.3772096633911133, 0.42519912123680115, 0.473188579082489, 0.5211780071258545, 0.5691674947738647, 0.617156982421875, 0.6651464104652405, 0.713135838508606, 0.7611253261566162, 0.8091148138046265, 0.8571042418479919, 0.9050936698913574, 0.9530831575393677, 1.001072645187378, 1.0490620136260986, 1.0970515012741089, 1.1450409889221191, 1.1930304765701294, 1.2410199642181396, 1.2890093326568604, 1.3369988203048706, 1.3849883079528809, 1.4329776763916016, 1.4809671640396118, 1.528956651687622]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 10.0, 6.0, 7.0, 9.0, 8.0, 13.0, 8.0, 19.0, 25.0, 16.0, 24.0, 26.0, 27.0, 30.0, 31.0, 34.0, 26.0, 38.0, 40.0, 36.0, 50.0, 38.0, 41.0, 36.0, 34.0, 34.0, 42.0, 34.0, 27.0, 29.0, 35.0, 34.0, 25.0, 17.0, 18.0, 15.0, 13.0, 6.0, 8.0, 12.0, 7.0, 4.0, 7.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9426308274269104, -0.908301591873169, -0.8739722967147827, -0.8396430611610413, -0.8053138256072998, -0.7709845900535583, -0.7366553544998169, -0.7023260593414307, -0.6679968237876892, -0.6336675882339478, -0.5993382930755615, -0.5650090575218201, -0.5306798219680786, -0.49635058641433716, -0.4620213210582733, -0.4276920557022095, -0.393362820148468, -0.35903358459472656, -0.3247043192386627, -0.2903750538825989, -0.2560458183288574, -0.22171656787395477, -0.18738731741905212, -0.15305806696414948, -0.11872881650924683, -0.08439956605434418, -0.05007031559944153, -0.01574106514453888, 0.01858818531036377, 0.05291743576526642, 0.08724668622016907, 0.12157593667507172, 0.1559051275253296, 0.19023437798023224, 0.2245636284351349, 0.25889289379119873, 0.2932221293449402, 0.32755136489868164, 0.3618806302547455, 0.3962098956108093, 0.4305391311645508, 0.46486836671829224, 0.4991976320743561, 0.5335268974304199, 0.5678561329841614, 0.6021853685379028, 0.6365146636962891, 0.6708438992500305, 0.705173134803772, 0.7395023703575134, 0.7738316059112549, 0.8081609010696411, 0.8424901366233826, 0.876819372177124, 0.9111486673355103, 0.9454779028892517, 0.9798071384429932, 1.0141364336013794, 1.048465609550476, 1.0827949047088623, 1.117124080657959, 1.1514533758163452, 1.1857826709747314, 1.2201118469238281, 1.2544411420822144]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 18.0, 10.0, 23.0, 45.0, 56.0, 101.0, 196.0, 313.0, 462.0, 797.0, 1301.0, 2144.0, 3470.0, 5554.0, 9074.0, 14025.0, 21432.0, 31929.0, 46236.0, 62590.0, 81074.0, 98146.0, 109613.0, 112145.0, 106358.0, 92312.0, 74645.0, 56736.0, 40207.0, 27881.0, 18387.0, 11884.0, 7364.0, 4746.0, 2857.0, 1695.0, 1077.0, 691.0, 396.0, 217.0, 130.0, 94.0, 48.0, 28.0, 21.0, 16.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.0693359375, -1.0381698608398438, -1.0070037841796875, -0.9758377075195312, -0.944671630859375, -0.9135055541992188, -0.8823394775390625, -0.8511734008789062, -0.82000732421875, -0.7888412475585938, -0.7576751708984375, -0.7265090942382812, -0.695343017578125, -0.6641769409179688, -0.6330108642578125, -0.6018447875976562, -0.5706787109375, -0.5395126342773438, -0.5083465576171875, -0.47718048095703125, -0.446014404296875, -0.41484832763671875, -0.3836822509765625, -0.35251617431640625, -0.32135009765625, -0.29018402099609375, -0.2590179443359375, -0.22785186767578125, -0.196685791015625, -0.16551971435546875, -0.1343536376953125, -0.10318756103515625, -0.072021484375, -0.04085540771484375, -0.0096893310546875, 0.02147674560546875, 0.052642822265625, 0.08380889892578125, 0.1149749755859375, 0.14614105224609375, 0.17730712890625, 0.20847320556640625, 0.2396392822265625, 0.27080535888671875, 0.301971435546875, 0.33313751220703125, 0.3643035888671875, 0.39546966552734375, 0.4266357421875, 0.45780181884765625, 0.4889678955078125, 0.5201339721679688, 0.551300048828125, 0.5824661254882812, 0.6136322021484375, 0.6447982788085938, 0.67596435546875, 0.7071304321289062, 0.7382965087890625, 0.7694625854492188, 0.800628662109375, 0.8317947387695312, 0.8629608154296875, 0.8941268920898438, 0.92529296875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 3.0, 9.0, 7.0, 13.0, 10.0, 19.0, 14.0, 21.0, 14.0, 16.0, 20.0, 20.0, 23.0, 25.0, 37.0, 24.0, 39.0, 31.0, 36.0, 32.0, 36.0, 47.0, 38.0, 40.0, 34.0, 45.0, 32.0, 35.0, 29.0, 18.0, 35.0, 30.0, 14.0, 26.0, 17.0, 14.0, 10.0, 19.0, 12.0, 5.0, 6.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.00390625, -0.969512939453125, -0.93511962890625, -0.900726318359375, -0.8663330078125, -0.831939697265625, -0.79754638671875, -0.763153076171875, -0.728759765625, -0.694366455078125, -0.65997314453125, -0.625579833984375, -0.5911865234375, -0.556793212890625, -0.52239990234375, -0.488006591796875, -0.45361328125, -0.419219970703125, -0.38482666015625, -0.350433349609375, -0.3160400390625, -0.281646728515625, -0.24725341796875, -0.212860107421875, -0.178466796875, -0.144073486328125, -0.10968017578125, -0.075286865234375, -0.0408935546875, -0.006500244140625, 0.02789306640625, 0.062286376953125, 0.0966796875, 0.131072998046875, 0.16546630859375, 0.199859619140625, 0.2342529296875, 0.268646240234375, 0.30303955078125, 0.337432861328125, 0.371826171875, 0.406219482421875, 0.44061279296875, 0.475006103515625, 0.5093994140625, 0.543792724609375, 0.57818603515625, 0.612579345703125, 0.64697265625, 0.681365966796875, 0.71575927734375, 0.750152587890625, 0.7845458984375, 0.818939208984375, 0.85333251953125, 0.887725830078125, 0.922119140625, 0.956512451171875, 0.99090576171875, 1.025299072265625, 1.0596923828125, 1.094085693359375, 1.12847900390625, 1.162872314453125, 1.197265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 9.0, 4.0, 9.0, 13.0, 26.0, 39.0, 72.0, 82.0, 121.0, 177.0, 266.0, 477.0, 676.0, 978.0, 1503.0, 2389.0, 3548.0, 5526.0, 8398.0, 12473.0, 18010.0, 26113.0, 36334.0, 48920.0, 63210.0, 77698.0, 89308.0, 97870.0, 99361.0, 95435.0, 84868.0, 71558.0, 57634.0, 43627.0, 32365.0, 22577.0, 15850.0, 10575.0, 7127.0, 4665.0, 2954.0, 2017.0, 1277.0, 825.0, 554.0, 376.0, 219.0, 164.0, 90.0, 83.0, 33.0, 30.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0], "bins": [-0.88916015625, -0.86163330078125, -0.8341064453125, -0.80657958984375, -0.779052734375, -0.75152587890625, -0.7239990234375, -0.69647216796875, -0.6689453125, -0.64141845703125, -0.6138916015625, -0.58636474609375, -0.558837890625, -0.53131103515625, -0.5037841796875, -0.47625732421875, -0.44873046875, -0.42120361328125, -0.3936767578125, -0.36614990234375, -0.338623046875, -0.31109619140625, -0.2835693359375, -0.25604248046875, -0.228515625, -0.20098876953125, -0.1734619140625, -0.14593505859375, -0.118408203125, -0.09088134765625, -0.0633544921875, -0.03582763671875, -0.00830078125, 0.01922607421875, 0.0467529296875, 0.07427978515625, 0.101806640625, 0.12933349609375, 0.1568603515625, 0.18438720703125, 0.2119140625, 0.23944091796875, 0.2669677734375, 0.29449462890625, 0.322021484375, 0.34954833984375, 0.3770751953125, 0.40460205078125, 0.43212890625, 0.45965576171875, 0.4871826171875, 0.51470947265625, 0.542236328125, 0.56976318359375, 0.5972900390625, 0.62481689453125, 0.65234375, 0.67987060546875, 0.7073974609375, 0.73492431640625, 0.762451171875, 0.78997802734375, 0.8175048828125, 0.84503173828125, 0.87255859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 5.0, 8.0, 9.0, 6.0, 10.0, 15.0, 18.0, 18.0, 26.0, 32.0, 27.0, 33.0, 34.0, 35.0, 38.0, 47.0, 41.0, 43.0, 39.0, 51.0, 46.0, 33.0, 35.0, 25.0, 42.0, 33.0, 27.0, 24.0, 31.0, 25.0, 22.0, 24.0, 21.0, 9.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7119598388671875, -0.688568115234375, -0.6651763916015625, -0.64178466796875, -0.6183929443359375, -0.595001220703125, -0.5716094970703125, -0.5482177734375, -0.5248260498046875, -0.501434326171875, -0.4780426025390625, -0.45465087890625, -0.4312591552734375, -0.407867431640625, -0.3844757080078125, -0.361083984375, -0.3376922607421875, -0.314300537109375, -0.2909088134765625, -0.26751708984375, -0.2441253662109375, -0.220733642578125, -0.1973419189453125, -0.1739501953125, -0.1505584716796875, -0.127166748046875, -0.1037750244140625, -0.08038330078125, -0.0569915771484375, -0.033599853515625, -0.0102081298828125, 0.01318359375, 0.0365753173828125, 0.059967041015625, 0.0833587646484375, 0.10675048828125, 0.1301422119140625, 0.153533935546875, 0.1769256591796875, 0.2003173828125, 0.2237091064453125, 0.247100830078125, 0.2704925537109375, 0.29388427734375, 0.3172760009765625, 0.340667724609375, 0.3640594482421875, 0.387451171875, 0.4108428955078125, 0.434234619140625, 0.4576263427734375, 0.48101806640625, 0.5044097900390625, 0.527801513671875, 0.5511932373046875, 0.5745849609375, 0.5979766845703125, 0.621368408203125, 0.6447601318359375, 0.66815185546875, 0.6915435791015625, 0.714935302734375, 0.7383270263671875, 0.76171875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 11.0, 26.0, 23.0, 34.0, 67.0, 91.0, 140.0, 204.0, 316.0, 442.0, 720.0, 1123.0, 1711.0, 2578.0, 4119.0, 6639.0, 10492.0, 16850.0, 27204.0, 43180.0, 67381.0, 97196.0, 128152.0, 145784.0, 140292.0, 115908.0, 84659.0, 56949.0, 36088.0, 22574.0, 13903.0, 8576.0, 5370.0, 3394.0, 2155.0, 1455.0, 917.0, 654.0, 435.0, 239.0, 160.0, 125.0, 72.0, 58.0, 33.0, 16.0, 18.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65234375, -0.6318283081054688, -0.6113128662109375, -0.5907974243164062, -0.570281982421875, -0.5497665405273438, -0.5292510986328125, -0.5087356567382812, -0.48822021484375, -0.46770477294921875, -0.4471893310546875, -0.42667388916015625, -0.406158447265625, -0.38564300537109375, -0.3651275634765625, -0.34461212158203125, -0.3240966796875, -0.30358123779296875, -0.2830657958984375, -0.26255035400390625, -0.242034912109375, -0.22151947021484375, -0.2010040283203125, -0.18048858642578125, -0.15997314453125, -0.13945770263671875, -0.1189422607421875, -0.09842681884765625, -0.077911376953125, -0.05739593505859375, -0.0368804931640625, -0.01636505126953125, 0.004150390625, 0.02466583251953125, 0.0451812744140625, 0.06569671630859375, 0.086212158203125, 0.10672760009765625, 0.1272430419921875, 0.14775848388671875, 0.16827392578125, 0.18878936767578125, 0.2093048095703125, 0.22982025146484375, 0.250335693359375, 0.27085113525390625, 0.2913665771484375, 0.31188201904296875, 0.3323974609375, 0.35291290283203125, 0.3734283447265625, 0.39394378662109375, 0.414459228515625, 0.43497467041015625, 0.4554901123046875, 0.47600555419921875, 0.49652099609375, 0.5170364379882812, 0.5375518798828125, 0.5580673217773438, 0.578582763671875, 0.5990982055664062, 0.6196136474609375, 0.6401290893554688, 0.66064453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 7.0, 9.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 30.0, 35.0, 46.0, 53.0, 49.0, 44.0, 57.0, 58.0, 58.0, 58.0, 49.0, 57.0, 52.0, 35.0, 46.0, 29.0, 26.0, 18.0, 16.0, 14.0, 11.0, 15.0, 11.0, 4.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.069110870361328e-05, -6.841868162155151e-05, -6.614625453948975e-05, -6.387382745742798e-05, -6.160140037536621e-05, -5.932897329330444e-05, -5.7056546211242676e-05, -5.478411912918091e-05, -5.251169204711914e-05, -5.023926496505737e-05, -4.7966837882995605e-05, -4.569441080093384e-05, -4.342198371887207e-05, -4.11495566368103e-05, -3.8877129554748535e-05, -3.660470247268677e-05, -3.4332275390625e-05, -3.205984830856323e-05, -2.9787421226501465e-05, -2.7514994144439697e-05, -2.524256706237793e-05, -2.2970139980316162e-05, -2.0697712898254395e-05, -1.8425285816192627e-05, -1.615285873413086e-05, -1.3880431652069092e-05, -1.1608004570007324e-05, -9.335577487945557e-06, -7.063150405883789e-06, -4.7907233238220215e-06, -2.518296241760254e-06, -2.4586915969848633e-07, 2.0265579223632812e-06, 4.298985004425049e-06, 6.571412086486816e-06, 8.843839168548584e-06, 1.1116266250610352e-05, 1.3388693332672119e-05, 1.5661120414733887e-05, 1.7933547496795654e-05, 2.0205974578857422e-05, 2.247840166091919e-05, 2.4750828742980957e-05, 2.7023255825042725e-05, 2.9295682907104492e-05, 3.156810998916626e-05, 3.384053707122803e-05, 3.6112964153289795e-05, 3.838539123535156e-05, 4.065781831741333e-05, 4.29302453994751e-05, 4.5202672481536865e-05, 4.747509956359863e-05, 4.97475266456604e-05, 5.201995372772217e-05, 5.4292380809783936e-05, 5.65648078918457e-05, 5.883723497390747e-05, 6.110966205596924e-05, 6.3382089138031e-05, 6.565451622009277e-05, 6.792694330215454e-05, 7.019937038421631e-05, 7.247179746627808e-05, 7.474422454833984e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 3.0, 15.0, 19.0, 29.0, 46.0, 42.0, 90.0, 113.0, 141.0, 227.0, 312.0, 487.0, 711.0, 1077.0, 1674.0, 2668.0, 4250.0, 6433.0, 10284.0, 16137.0, 24976.0, 38845.0, 57677.0, 81109.0, 107378.0, 127329.0, 132846.0, 120742.0, 98360.0, 72531.0, 49906.0, 32907.0, 21387.0, 13490.0, 8662.0, 5562.0, 3464.0, 2240.0, 1455.0, 980.0, 598.0, 416.0, 283.0, 193.0, 122.0, 95.0, 65.0, 56.0, 35.0, 22.0, 21.0, 10.0, 10.0, 10.0, 4.0, 4.0, 2.0, 5.0], "bins": [-0.60009765625, -0.5815277099609375, -0.562957763671875, -0.5443878173828125, -0.52581787109375, -0.5072479248046875, -0.488677978515625, -0.4701080322265625, -0.4515380859375, -0.4329681396484375, -0.414398193359375, -0.3958282470703125, -0.37725830078125, -0.3586883544921875, -0.340118408203125, -0.3215484619140625, -0.302978515625, -0.2844085693359375, -0.265838623046875, -0.2472686767578125, -0.22869873046875, -0.2101287841796875, -0.191558837890625, -0.1729888916015625, -0.1544189453125, -0.1358489990234375, -0.117279052734375, -0.0987091064453125, -0.08013916015625, -0.0615692138671875, -0.042999267578125, -0.0244293212890625, -0.005859375, 0.0127105712890625, 0.031280517578125, 0.0498504638671875, 0.06842041015625, 0.0869903564453125, 0.105560302734375, 0.1241302490234375, 0.1427001953125, 0.1612701416015625, 0.179840087890625, 0.1984100341796875, 0.21697998046875, 0.2355499267578125, 0.254119873046875, 0.2726898193359375, 0.291259765625, 0.3098297119140625, 0.328399658203125, 0.3469696044921875, 0.36553955078125, 0.3841094970703125, 0.402679443359375, 0.4212493896484375, 0.4398193359375, 0.4583892822265625, 0.476959228515625, 0.4955291748046875, 0.51409912109375, 0.5326690673828125, 0.551239013671875, 0.5698089599609375, 0.58837890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 18.0, 18.0, 21.0, 19.0, 27.0, 23.0, 30.0, 37.0, 37.0, 47.0, 44.0, 58.0, 50.0, 42.0, 56.0, 39.0, 45.0, 51.0, 28.0, 35.0, 42.0, 40.0, 33.0, 28.0, 15.0, 19.0, 15.0, 13.0, 17.0, 12.0, 4.0, 5.0, 3.0, 1.0, 0.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2127685546875, -0.20659637451171875, -0.2004241943359375, -0.19425201416015625, -0.188079833984375, -0.18190765380859375, -0.1757354736328125, -0.16956329345703125, -0.16339111328125, -0.15721893310546875, -0.1510467529296875, -0.14487457275390625, -0.138702392578125, -0.13253021240234375, -0.1263580322265625, -0.12018585205078125, -0.114013671875, -0.10784149169921875, -0.1016693115234375, -0.09549713134765625, -0.089324951171875, -0.08315277099609375, -0.0769805908203125, -0.07080841064453125, -0.06463623046875, -0.05846405029296875, -0.0522918701171875, -0.04611968994140625, -0.039947509765625, -0.03377532958984375, -0.0276031494140625, -0.02143096923828125, -0.0152587890625, -0.00908660888671875, -0.0029144287109375, 0.00325775146484375, 0.009429931640625, 0.01560211181640625, 0.0217742919921875, 0.02794647216796875, 0.03411865234375, 0.04029083251953125, 0.0464630126953125, 0.05263519287109375, 0.058807373046875, 0.06497955322265625, 0.0711517333984375, 0.07732391357421875, 0.08349609375, 0.08966827392578125, 0.0958404541015625, 0.10201263427734375, 0.108184814453125, 0.11435699462890625, 0.1205291748046875, 0.12670135498046875, 0.13287353515625, 0.13904571533203125, 0.1452178955078125, 0.15139007568359375, 0.157562255859375, 0.16373443603515625, 0.1699066162109375, 0.17607879638671875, 0.1822509765625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 5.0, 10.0, 22.0, 28.0, 24.0, 28.0, 32.0, 47.0, 38.0, 48.0, 46.0, 44.0, 66.0, 51.0, 47.0, 59.0, 63.0, 50.0, 51.0, 39.0, 27.0, 36.0, 18.0, 14.0, 20.0, 11.0, 7.0, 13.0, 7.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67812180519104, -1.6232253313064575, -1.568328857421875, -1.513432264328003, -1.4585357904434204, -1.403639316558838, -1.3487428426742554, -1.2938463687896729, -1.2389497756958008, -1.1840533018112183, -1.1291568279266357, -1.0742602348327637, -1.0193637609481812, -0.9644672870635986, -0.9095708131790161, -0.8546743392944336, -0.7997778654098511, -0.7448813915252686, -0.6899848580360413, -0.6350883841514587, -0.5801918506622314, -0.5252953767776489, -0.4703989028930664, -0.4155023992061615, -0.3606058955192566, -0.3057093918323517, -0.2508128881454468, -0.19591641426086426, -0.14101991057395935, -0.08612340688705444, -0.031226933002471924, 0.023669570684432983, 0.07856607437133789, 0.1334625780582428, 0.1883590668439865, 0.24325555562973022, 0.29815205931663513, 0.35304856300354004, 0.40794503688812256, 0.46284154057502747, 0.5177380442619324, 0.5726345181465149, 0.6275310516357422, 0.6824275255203247, 0.7373239994049072, 0.7922205328941345, 0.847117006778717, 0.9020135402679443, 0.9569100141525269, 1.0118064880371094, 1.066702961921692, 1.1215994358062744, 1.1764960289001465, 1.231392502784729, 1.2862889766693115, 1.341185450553894, 1.3960819244384766, 1.450978398323059, 1.5058748722076416, 1.5607714653015137, 1.6156679391860962, 1.6705644130706787, 1.7254608869552612, 1.7803573608398438, 1.8352539539337158]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 9.0, 8.0, 8.0, 19.0, 20.0, 25.0, 13.0, 19.0, 25.0, 33.0, 29.0, 29.0, 41.0, 40.0, 35.0, 44.0, 31.0, 44.0, 44.0, 41.0, 44.0, 41.0, 37.0, 31.0, 44.0, 33.0, 25.0, 40.0, 22.0, 26.0, 19.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1000877618789673, -1.062829852104187, -1.0255720615386963, -0.988314151763916, -0.9510563015937805, -0.913798451423645, -0.8765405416488647, -0.8392826914787292, -0.8020248413085938, -0.7647669911384583, -0.7275091409683228, -0.6902512311935425, -0.652993381023407, -0.6157355308532715, -0.5784776210784912, -0.5412197709083557, -0.5039619207382202, -0.4667040705680847, -0.42944619059562683, -0.39218831062316895, -0.35493046045303345, -0.31767261028289795, -0.28041473031044006, -0.24315685033798218, -0.20589900016784668, -0.16864113509655, -0.1313832700252533, -0.0941254049539566, -0.05686753988265991, -0.01960967481136322, 0.01764819025993347, 0.05490607023239136, 0.0921638011932373, 0.129421666264534, 0.1666795313358307, 0.20393739640712738, 0.24119526147842407, 0.27845311164855957, 0.31571099162101746, 0.35296887159347534, 0.39022672176361084, 0.42748457193374634, 0.4647424519062042, 0.5020003318786621, 0.5392581820487976, 0.5765160322189331, 0.6137739419937134, 0.6510317921638489, 0.6882896423339844, 0.7255474925041199, 0.7628053426742554, 0.8000632524490356, 0.8373211026191711, 0.8745789527893066, 0.9118368625640869, 0.9490947127342224, 0.9863525629043579, 1.0236104726791382, 1.060868263244629, 1.0981261730194092, 1.1353840827941895, 1.1726418733596802, 1.2098997831344604, 1.2471575736999512, 1.2844154834747314]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 5.0, 13.0, 14.0, 29.0, 27.0, 59.0, 82.0, 137.0, 238.0, 369.0, 606.0, 1014.0, 1689.0, 2746.0, 4712.0, 7934.0, 13483.0, 23605.0, 40828.0, 69666.0, 118268.0, 195329.0, 304290.0, 438709.0, 559336.0, 611423.0, 561969.0, 443387.0, 306077.0, 197396.0, 120363.0, 71279.0, 41336.0, 24236.0, 13786.0, 8127.0, 4683.0, 2835.0, 1607.0, 979.0, 621.0, 346.0, 234.0, 141.0, 97.0, 76.0, 37.0, 18.0, 17.0, 16.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1665802001953125, -1.124176025390625, -1.0817718505859375, -1.03936767578125, -0.9969635009765625, -0.954559326171875, -0.9121551513671875, -0.8697509765625, -0.8273468017578125, -0.784942626953125, -0.7425384521484375, -0.70013427734375, -0.6577301025390625, -0.615325927734375, -0.5729217529296875, -0.530517578125, -0.4881134033203125, -0.445709228515625, -0.4033050537109375, -0.36090087890625, -0.3184967041015625, -0.276092529296875, -0.2336883544921875, -0.1912841796875, -0.1488800048828125, -0.106475830078125, -0.0640716552734375, -0.02166748046875, 0.0207366943359375, 0.063140869140625, 0.1055450439453125, 0.14794921875, 0.1903533935546875, 0.232757568359375, 0.2751617431640625, 0.31756591796875, 0.3599700927734375, 0.402374267578125, 0.4447784423828125, 0.4871826171875, 0.5295867919921875, 0.571990966796875, 0.6143951416015625, 0.65679931640625, 0.6992034912109375, 0.741607666015625, 0.7840118408203125, 0.826416015625, 0.8688201904296875, 0.911224365234375, 0.9536285400390625, 0.99603271484375, 1.0384368896484375, 1.080841064453125, 1.1232452392578125, 1.1656494140625, 1.2080535888671875, 1.250457763671875, 1.2928619384765625, 1.33526611328125, 1.3776702880859375, 1.420074462890625, 1.4624786376953125, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 6.0, 3.0, 6.0, 5.0, 15.0, 11.0, 7.0, 11.0, 12.0, 10.0, 17.0, 20.0, 25.0, 16.0, 25.0, 26.0, 22.0, 30.0, 37.0, 35.0, 34.0, 41.0, 30.0, 39.0, 36.0, 40.0, 40.0, 32.0, 42.0, 40.0, 38.0, 29.0, 31.0, 32.0, 26.0, 19.0, 24.0, 14.0, 11.0, 13.0, 14.0, 12.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8059539794921875, -0.777923583984375, -0.7498931884765625, -0.72186279296875, -0.6938323974609375, -0.665802001953125, -0.6377716064453125, -0.6097412109375, -0.5817108154296875, -0.553680419921875, -0.5256500244140625, -0.49761962890625, -0.4695892333984375, -0.441558837890625, -0.4135284423828125, -0.385498046875, -0.3574676513671875, -0.329437255859375, -0.3014068603515625, -0.27337646484375, -0.2453460693359375, -0.217315673828125, -0.1892852783203125, -0.1612548828125, -0.1332244873046875, -0.105194091796875, -0.0771636962890625, -0.04913330078125, -0.0211029052734375, 0.006927490234375, 0.0349578857421875, 0.06298828125, 0.0910186767578125, 0.119049072265625, 0.1470794677734375, 0.17510986328125, 0.2031402587890625, 0.231170654296875, 0.2592010498046875, 0.2872314453125, 0.3152618408203125, 0.343292236328125, 0.3713226318359375, 0.39935302734375, 0.4273834228515625, 0.455413818359375, 0.4834442138671875, 0.511474609375, 0.5395050048828125, 0.567535400390625, 0.5955657958984375, 0.62359619140625, 0.6516265869140625, 0.679656982421875, 0.7076873779296875, 0.7357177734375, 0.7637481689453125, 0.791778564453125, 0.8198089599609375, 0.84783935546875, 0.8758697509765625, 0.903900146484375, 0.9319305419921875, 0.9599609375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 0.0, 3.0, 9.0, 13.0, 14.0, 22.0, 28.0, 48.0, 107.0, 162.0, 224.0, 382.0, 589.0, 933.0, 1483.0, 2336.0, 3826.0, 6323.0, 10166.0, 16238.0, 26151.0, 41231.0, 65015.0, 100398.0, 149506.0, 216368.0, 296933.0, 380937.0, 449834.0, 482505.0, 464970.0, 409577.0, 326725.0, 244496.0, 173521.0, 116501.0, 75851.0, 49122.0, 30594.0, 19613.0, 11908.0, 7454.0, 4564.0, 2829.0, 1779.0, 1123.0, 702.0, 443.0, 246.0, 170.0, 119.0, 77.0, 40.0, 32.0, 24.0, 17.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1.263671875, -1.225006103515625, -1.18634033203125, -1.147674560546875, -1.1090087890625, -1.070343017578125, -1.03167724609375, -0.993011474609375, -0.954345703125, -0.915679931640625, -0.87701416015625, -0.838348388671875, -0.7996826171875, -0.761016845703125, -0.72235107421875, -0.683685302734375, -0.64501953125, -0.606353759765625, -0.56768798828125, -0.529022216796875, -0.4903564453125, -0.451690673828125, -0.41302490234375, -0.374359130859375, -0.335693359375, -0.297027587890625, -0.25836181640625, -0.219696044921875, -0.1810302734375, -0.142364501953125, -0.10369873046875, -0.065032958984375, -0.0263671875, 0.012298583984375, 0.05096435546875, 0.089630126953125, 0.1282958984375, 0.166961669921875, 0.20562744140625, 0.244293212890625, 0.282958984375, 0.321624755859375, 0.36029052734375, 0.398956298828125, 0.4376220703125, 0.476287841796875, 0.51495361328125, 0.553619384765625, 0.59228515625, 0.630950927734375, 0.66961669921875, 0.708282470703125, 0.7469482421875, 0.785614013671875, 0.82427978515625, 0.862945556640625, 0.901611328125, 0.940277099609375, 0.97894287109375, 1.017608642578125, 1.0562744140625, 1.094940185546875, 1.13360595703125, 1.172271728515625, 1.2109375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 9.0, 7.0, 12.0, 15.0, 10.0, 16.0, 27.0, 26.0, 39.0, 36.0, 45.0, 64.0, 79.0, 91.0, 106.0, 135.0, 119.0, 128.0, 166.0, 171.0, 160.0, 187.0, 192.0, 185.0, 195.0, 188.0, 213.0, 169.0, 189.0, 167.0, 148.0, 126.0, 105.0, 91.0, 82.0, 72.0, 68.0, 40.0, 35.0, 32.0, 25.0, 17.0, 18.0, 20.0, 11.0, 4.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.50634765625, -0.4912910461425781, -0.47623443603515625, -0.4611778259277344, -0.4461212158203125, -0.4310646057128906, -0.41600799560546875, -0.4009513854980469, -0.385894775390625, -0.3708381652832031, -0.35578155517578125, -0.3407249450683594, -0.3256683349609375, -0.3106117248535156, -0.29555511474609375, -0.2804985046386719, -0.26544189453125, -0.2503852844238281, -0.23532867431640625, -0.22027206420898438, -0.2052154541015625, -0.19015884399414062, -0.17510223388671875, -0.16004562377929688, -0.144989013671875, -0.12993240356445312, -0.11487579345703125, -0.09981918334960938, -0.0847625732421875, -0.06970596313476562, -0.05464935302734375, -0.039592742919921875, -0.0245361328125, -0.009479522705078125, 0.00557708740234375, 0.020633697509765625, 0.0356903076171875, 0.050746917724609375, 0.06580352783203125, 0.08086013793945312, 0.095916748046875, 0.11097335815429688, 0.12602996826171875, 0.14108657836914062, 0.1561431884765625, 0.17119979858398438, 0.18625640869140625, 0.20131301879882812, 0.21636962890625, 0.23142623901367188, 0.24648284912109375, 0.2615394592285156, 0.2765960693359375, 0.2916526794433594, 0.30670928955078125, 0.3217658996582031, 0.336822509765625, 0.3518791198730469, 0.36693572998046875, 0.3819923400878906, 0.3970489501953125, 0.4121055603027344, 0.42716217041015625, 0.4422187805175781, 0.457275390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 7.0, 5.0, 18.0, 17.0, 16.0, 16.0, 23.0, 26.0, 44.0, 34.0, 49.0, 50.0, 45.0, 51.0, 60.0, 58.0, 46.0, 55.0, 57.0, 40.0, 46.0, 46.0, 31.0, 22.0, 35.0, 25.0, 19.0, 8.0, 10.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8614811897277832, -1.8005732297897339, -1.7396652698516846, -1.6787573099136353, -1.617849349975586, -1.5569415092468262, -1.4960334300994873, -1.4351255893707275, -1.3742176294326782, -1.313309669494629, -1.2524017095565796, -1.1914937496185303, -1.130585789680481, -1.0696778297424316, -1.0087699890136719, -0.9478620290756226, -0.8869540095329285, -0.8260460495948792, -0.7651380896568298, -0.7042301893234253, -0.643322229385376, -0.5824142694473267, -0.5215063095092773, -0.4605983793735504, -0.3996904194355011, -0.3387824594974518, -0.27787452936172485, -0.21696656942367554, -0.15605862438678741, -0.09515067934989929, -0.034242719411849976, 0.026665210723876953, 0.08757317066192627, 0.1484811156988144, 0.20938906073570251, 0.27029702067375183, 0.33120495080947876, 0.3921129107475281, 0.4530208706855774, 0.5139287710189819, 0.5748367309570312, 0.6357446908950806, 0.6966526508331299, 0.7575606107711792, 0.8184685111045837, 0.8793764710426331, 0.9402844309806824, 1.001192331314087, 1.0621004104614258, 1.123008370399475, 1.1839163303375244, 1.2448242902755737, 1.305732250213623, 1.3666400909423828, 1.4275481700897217, 1.4884560108184814, 1.5493639707565308, 1.61027193069458, 1.6711798906326294, 1.7320878505706787, 1.792995810508728, 1.8539037704467773, 1.914811611175537, 1.9757195711135864, 2.0366275310516357]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 11.0, 9.0, 7.0, 10.0, 12.0, 13.0, 19.0, 27.0, 17.0, 26.0, 37.0, 43.0, 49.0, 52.0, 42.0, 40.0, 48.0, 55.0, 45.0, 52.0, 41.0, 47.0, 39.0, 44.0, 46.0, 25.0, 23.0, 27.0, 16.0, 24.0, 17.0, 8.0, 7.0, 6.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4232420921325684, -1.3767975568771362, -1.3303531408309937, -1.2839086055755615, -1.237464189529419, -1.1910196542739868, -1.1445751190185547, -1.098130702972412, -1.0516862869262695, -1.0052417516708374, -0.9587973356246948, -0.9123528003692627, -0.8659083843231201, -0.819463849067688, -0.7730193734169006, -0.7265748977661133, -0.6801303625106812, -0.6336858868598938, -0.5872414112091064, -0.5407968759536743, -0.49435243010520935, -0.447907954454422, -0.40146344900131226, -0.3550189733505249, -0.30857449769973755, -0.2621300220489502, -0.21568553149700165, -0.1692410409450531, -0.12279656529426575, -0.0763520896434784, -0.029907584190368652, 0.0165368914604187, 0.06298136711120605, 0.109425850212574, 0.15587033331394196, 0.2023148238658905, 0.24875929951667786, 0.2952037751674652, 0.34164828062057495, 0.3880927562713623, 0.43453723192214966, 0.480981707572937, 0.5274261832237244, 0.5738706588745117, 0.6203151941299438, 0.6667596101760864, 0.7132041454315186, 0.7596486210823059, 0.8060930967330933, 0.8525375723838806, 0.898982048034668, 0.9454265832901001, 0.9918709993362427, 1.0383155345916748, 1.0847599506378174, 1.1312044858932495, 1.1776490211486816, 1.2240935564041138, 1.2705379724502563, 1.3169825077056885, 1.363426923751831, 1.4098714590072632, 1.4563159942626953, 1.502760410308838, 1.5492048263549805]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 12.0, 19.0, 29.0, 50.0, 48.0, 107.0, 147.0, 221.0, 325.0, 534.0, 786.0, 1106.0, 1828.0, 3008.0, 4740.0, 7689.0, 12914.0, 21252.0, 35628.0, 58930.0, 94956.0, 143121.0, 179111.0, 166344.0, 120305.0, 76739.0, 46917.0, 27907.0, 16792.0, 10252.0, 6125.0, 3879.0, 2443.0, 1487.0, 926.0, 641.0, 441.0, 263.0, 177.0, 102.0, 81.0, 55.0, 31.0, 19.0, 21.0, 11.0, 2.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.35888671875, -0.3479347229003906, -0.33698272705078125, -0.3260307312011719, -0.3150787353515625, -0.3041267395019531, -0.29317474365234375, -0.2822227478027344, -0.271270751953125, -0.2603187561035156, -0.24936676025390625, -0.23841476440429688, -0.2274627685546875, -0.21651077270507812, -0.20555877685546875, -0.19460678100585938, -0.18365478515625, -0.17270278930664062, -0.16175079345703125, -0.15079879760742188, -0.1398468017578125, -0.12889480590820312, -0.11794281005859375, -0.10699081420898438, -0.096038818359375, -0.08508682250976562, -0.07413482666015625, -0.06318283081054688, -0.0522308349609375, -0.041278839111328125, -0.03032684326171875, -0.019374847412109375, -0.0084228515625, 0.002529144287109375, 0.01348114013671875, 0.024433135986328125, 0.0353851318359375, 0.046337127685546875, 0.05728912353515625, 0.06824111938476562, 0.079193115234375, 0.09014511108398438, 0.10109710693359375, 0.11204910278320312, 0.1230010986328125, 0.13395309448242188, 0.14490509033203125, 0.15585708618164062, 0.16680908203125, 0.17776107788085938, 0.18871307373046875, 0.19966506958007812, 0.2106170654296875, 0.22156906127929688, 0.23252105712890625, 0.24347305297851562, 0.254425048828125, 0.2653770446777344, 0.27632904052734375, 0.2872810363769531, 0.2982330322265625, 0.3091850280761719, 0.32013702392578125, 0.3310890197753906, 0.342041015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 4.0, 10.0, 9.0, 12.0, 13.0, 14.0, 15.0, 33.0, 17.0, 29.0, 49.0, 27.0, 40.0, 44.0, 51.0, 38.0, 33.0, 51.0, 46.0, 45.0, 47.0, 44.0, 52.0, 43.0, 42.0, 35.0, 27.0, 23.0, 16.0, 15.0, 17.0, 11.0, 7.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4326171875, -1.384765625, -1.3369140625, -1.2890625, -1.2412109375, -1.193359375, -1.1455078125, -1.09765625, -1.0498046875, -1.001953125, -0.9541015625, -0.90625, -0.8583984375, -0.810546875, -0.7626953125, -0.71484375, -0.6669921875, -0.619140625, -0.5712890625, -0.5234375, -0.4755859375, -0.427734375, -0.3798828125, -0.33203125, -0.2841796875, -0.236328125, -0.1884765625, -0.140625, -0.0927734375, -0.044921875, 0.0029296875, 0.05078125, 0.0986328125, 0.146484375, 0.1943359375, 0.2421875, 0.2900390625, 0.337890625, 0.3857421875, 0.43359375, 0.4814453125, 0.529296875, 0.5771484375, 0.625, 0.6728515625, 0.720703125, 0.7685546875, 0.81640625, 0.8642578125, 0.912109375, 0.9599609375, 1.0078125, 1.0556640625, 1.103515625, 1.1513671875, 1.19921875, 1.2470703125, 1.294921875, 1.3427734375, 1.390625, 1.4384765625, 1.486328125, 1.5341796875, 1.58203125, 1.6298828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 12.0, 8.0, 7.0, 12.0, 13.0, 19.0, 25.0, 48.0, 63.0, 100.0, 141.0, 213.0, 288.0, 442.0, 691.0, 1057.0, 1655.0, 2696.0, 4574.0, 8210.0, 14611.0, 27187.0, 50959.0, 95104.0, 166356.0, 227233.0, 192001.0, 115673.0, 63178.0, 33557.0, 18064.0, 9982.0, 5562.0, 3213.0, 2044.0, 1256.0, 772.0, 470.0, 340.0, 213.0, 144.0, 103.0, 66.0, 62.0, 44.0, 18.0, 19.0, 14.0, 12.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-0.45361328125, -0.439727783203125, -0.42584228515625, -0.411956787109375, -0.3980712890625, -0.384185791015625, -0.37030029296875, -0.356414794921875, -0.342529296875, -0.328643798828125, -0.31475830078125, -0.300872802734375, -0.2869873046875, -0.273101806640625, -0.25921630859375, -0.245330810546875, -0.2314453125, -0.217559814453125, -0.20367431640625, -0.189788818359375, -0.1759033203125, -0.162017822265625, -0.14813232421875, -0.134246826171875, -0.120361328125, -0.106475830078125, -0.09259033203125, -0.078704833984375, -0.0648193359375, -0.050933837890625, -0.03704833984375, -0.023162841796875, -0.00927734375, 0.004608154296875, 0.01849365234375, 0.032379150390625, 0.0462646484375, 0.060150146484375, 0.07403564453125, 0.087921142578125, 0.101806640625, 0.115692138671875, 0.12957763671875, 0.143463134765625, 0.1573486328125, 0.171234130859375, 0.18511962890625, 0.199005126953125, 0.212890625, 0.226776123046875, 0.24066162109375, 0.254547119140625, 0.2684326171875, 0.282318115234375, 0.29620361328125, 0.310089111328125, 0.323974609375, 0.337860107421875, 0.35174560546875, 0.365631103515625, 0.3795166015625, 0.393402099609375, 0.40728759765625, 0.421173095703125, 0.43505859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 7.0, 8.0, 8.0, 18.0, 25.0, 29.0, 26.0, 26.0, 29.0, 33.0, 32.0, 40.0, 38.0, 35.0, 37.0, 50.0, 53.0, 40.0, 53.0, 28.0, 35.0, 29.0, 38.0, 34.0, 29.0, 26.0, 19.0, 29.0, 19.0, 26.0, 13.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8212203979492188, -0.7942962646484375, -0.7673721313476562, -0.740447998046875, -0.7135238647460938, -0.6865997314453125, -0.6596755981445312, -0.63275146484375, -0.6058273315429688, -0.5789031982421875, -0.5519790649414062, -0.525054931640625, -0.49813079833984375, -0.4712066650390625, -0.44428253173828125, -0.4173583984375, -0.39043426513671875, -0.3635101318359375, -0.33658599853515625, -0.309661865234375, -0.28273773193359375, -0.2558135986328125, -0.22888946533203125, -0.20196533203125, -0.17504119873046875, -0.1481170654296875, -0.12119293212890625, -0.094268798828125, -0.06734466552734375, -0.0404205322265625, -0.01349639892578125, 0.013427734375, 0.04035186767578125, 0.0672760009765625, 0.09420013427734375, 0.121124267578125, 0.14804840087890625, 0.1749725341796875, 0.20189666748046875, 0.22882080078125, 0.25574493408203125, 0.2826690673828125, 0.30959320068359375, 0.336517333984375, 0.36344146728515625, 0.3903656005859375, 0.41728973388671875, 0.4442138671875, 0.47113800048828125, 0.4980621337890625, 0.5249862670898438, 0.551910400390625, 0.5788345336914062, 0.6057586669921875, 0.6326828002929688, 0.65960693359375, 0.6865310668945312, 0.7134552001953125, 0.7403793334960938, 0.767303466796875, 0.7942276000976562, 0.8211517333984375, 0.8480758666992188, 0.875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 10.0, 11.0, 13.0, 21.0, 18.0, 24.0, 37.0, 43.0, 63.0, 79.0, 85.0, 175.0, 235.0, 393.0, 629.0, 959.0, 1778.0, 3458.0, 7204.0, 18633.0, 66772.0, 420814.0, 425475.0, 67459.0, 18764.0, 7329.0, 3400.0, 1820.0, 1036.0, 588.0, 393.0, 236.0, 185.0, 97.0, 80.0, 62.0, 34.0, 28.0, 24.0, 18.0, 20.0, 10.0, 9.0, 7.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3502845764160156, -0.33777618408203125, -0.3252677917480469, -0.3127593994140625, -0.3002510070800781, -0.28774261474609375, -0.2752342224121094, -0.262725830078125, -0.2502174377441406, -0.23770904541015625, -0.22520065307617188, -0.2126922607421875, -0.20018386840820312, -0.18767547607421875, -0.17516708374023438, -0.16265869140625, -0.15015029907226562, -0.13764190673828125, -0.12513351440429688, -0.1126251220703125, -0.10011672973632812, -0.08760833740234375, -0.07509994506835938, -0.062591552734375, -0.050083160400390625, -0.03757476806640625, -0.025066375732421875, -0.0125579833984375, -4.9591064453125e-05, 0.01245880126953125, 0.024967193603515625, 0.0374755859375, 0.049983978271484375, 0.06249237060546875, 0.07500076293945312, 0.0875091552734375, 0.10001754760742188, 0.11252593994140625, 0.12503433227539062, 0.137542724609375, 0.15005111694335938, 0.16255950927734375, 0.17506790161132812, 0.1875762939453125, 0.20008468627929688, 0.21259307861328125, 0.22510147094726562, 0.23760986328125, 0.2501182556152344, 0.26262664794921875, 0.2751350402832031, 0.2876434326171875, 0.3001518249511719, 0.31266021728515625, 0.3251686096191406, 0.337677001953125, 0.3501853942871094, 0.36269378662109375, 0.3752021789550781, 0.3877105712890625, 0.4002189636230469, 0.41272735595703125, 0.4252357482910156, 0.437744140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 14.0, 15.0, 18.0, 22.0, 41.0, 39.0, 47.0, 44.0, 61.0, 72.0, 62.0, 76.0, 60.0, 67.0, 48.0, 63.0, 47.0, 38.0, 33.0, 19.0, 24.0, 18.0, 17.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.5463680028915405e-05, -1.5012919902801514e-05, -1.4562159776687622e-05, -1.411139965057373e-05, -1.3660639524459839e-05, -1.3209879398345947e-05, -1.2759119272232056e-05, -1.2308359146118164e-05, -1.1857599020004272e-05, -1.1406838893890381e-05, -1.095607876777649e-05, -1.0505318641662598e-05, -1.0054558515548706e-05, -9.603798389434814e-06, -9.153038263320923e-06, -8.702278137207031e-06, -8.25151801109314e-06, -7.800757884979248e-06, -7.3499977588653564e-06, -6.899237632751465e-06, -6.448477506637573e-06, -5.997717380523682e-06, -5.54695725440979e-06, -5.0961971282958984e-06, -4.645437002182007e-06, -4.194676876068115e-06, -3.7439167499542236e-06, -3.293156623840332e-06, -2.8423964977264404e-06, -2.391636371612549e-06, -1.9408762454986572e-06, -1.4901161193847656e-06, -1.039355993270874e-06, -5.885958671569824e-07, -1.3783574104309082e-07, 3.129243850708008e-07, 7.636845111846924e-07, 1.214444637298584e-06, 1.6652047634124756e-06, 2.115964889526367e-06, 2.566725015640259e-06, 3.0174851417541504e-06, 3.468245267868042e-06, 3.919005393981934e-06, 4.369765520095825e-06, 4.820525646209717e-06, 5.271285772323608e-06, 5.7220458984375e-06, 6.172806024551392e-06, 6.623566150665283e-06, 7.074326276779175e-06, 7.525086402893066e-06, 7.975846529006958e-06, 8.42660665512085e-06, 8.877366781234741e-06, 9.328126907348633e-06, 9.778887033462524e-06, 1.0229647159576416e-05, 1.0680407285690308e-05, 1.11311674118042e-05, 1.158192753791809e-05, 1.2032687664031982e-05, 1.2483447790145874e-05, 1.2934207916259766e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 6.0, 14.0, 10.0, 24.0, 30.0, 29.0, 39.0, 42.0, 60.0, 89.0, 146.0, 195.0, 269.0, 371.0, 540.0, 776.0, 1207.0, 1838.0, 2898.0, 4977.0, 8937.0, 17829.0, 40222.0, 100456.0, 249803.0, 332979.0, 164280.0, 63700.0, 26940.0, 12380.0, 6590.0, 3778.0, 2273.0, 1515.0, 1034.0, 663.0, 449.0, 341.0, 241.0, 177.0, 114.0, 95.0, 60.0, 43.0, 29.0, 18.0, 16.0, 9.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28271484375, -0.2736701965332031, -0.26462554931640625, -0.2555809020996094, -0.2465362548828125, -0.23749160766601562, -0.22844696044921875, -0.21940231323242188, -0.210357666015625, -0.20131301879882812, -0.19226837158203125, -0.18322372436523438, -0.1741790771484375, -0.16513442993164062, -0.15608978271484375, -0.14704513549804688, -0.13800048828125, -0.12895584106445312, -0.11991119384765625, -0.11086654663085938, -0.1018218994140625, -0.09277725219726562, -0.08373260498046875, -0.07468795776367188, -0.065643310546875, -0.056598663330078125, -0.04755401611328125, -0.038509368896484375, -0.0294647216796875, -0.020420074462890625, -0.01137542724609375, -0.002330780029296875, 0.0067138671875, 0.015758514404296875, 0.02480316162109375, 0.033847808837890625, 0.0428924560546875, 0.051937103271484375, 0.06098175048828125, 0.07002639770507812, 0.079071044921875, 0.08811569213867188, 0.09716033935546875, 0.10620498657226562, 0.1152496337890625, 0.12429428100585938, 0.13333892822265625, 0.14238357543945312, 0.15142822265625, 0.16047286987304688, 0.16951751708984375, 0.17856216430664062, 0.1876068115234375, 0.19665145874023438, 0.20569610595703125, 0.21474075317382812, 0.223785400390625, 0.23283004760742188, 0.24187469482421875, 0.2509193420410156, 0.2599639892578125, 0.2690086364746094, 0.27805328369140625, 0.2870979309082031, 0.296142578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 10.0, 14.0, 24.0, 33.0, 49.0, 69.0, 109.0, 129.0, 151.0, 145.0, 98.0, 52.0, 37.0, 18.0, 12.0, 7.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08376884460449219, -0.08056259155273438, -0.07735633850097656, -0.07415008544921875, -0.07094383239746094, -0.06773757934570312, -0.06453132629394531, -0.0613250732421875, -0.05811882019042969, -0.054912567138671875, -0.05170631408691406, -0.04850006103515625, -0.04529380798339844, -0.042087554931640625, -0.03888130187988281, -0.035675048828125, -0.03246879577636719, -0.029262542724609375, -0.026056289672851562, -0.02285003662109375, -0.019643783569335938, -0.016437530517578125, -0.013231277465820312, -0.0100250244140625, -0.0068187713623046875, -0.003612518310546875, -0.0004062652587890625, 0.00279998779296875, 0.0060062408447265625, 0.009212493896484375, 0.012418746948242188, 0.015625, 0.018831253051757812, 0.022037506103515625, 0.025243759155273438, 0.02845001220703125, 0.03165626525878906, 0.034862518310546875, 0.03806877136230469, 0.0412750244140625, 0.04448127746582031, 0.047687530517578125, 0.05089378356933594, 0.05410003662109375, 0.05730628967285156, 0.060512542724609375, 0.06371879577636719, 0.066925048828125, 0.07013130187988281, 0.07333755493164062, 0.07654380798339844, 0.07975006103515625, 0.08295631408691406, 0.08616256713867188, 0.08936882019042969, 0.0925750732421875, 0.09578132629394531, 0.09898757934570312, 0.10219383239746094, 0.10540008544921875, 0.10860633850097656, 0.11181259155273438, 0.11501884460449219, 0.11822509765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 1.0, 9.0, 3.0, 12.0, 12.0, 19.0, 14.0, 21.0, 27.0, 29.0, 42.0, 43.0, 47.0, 41.0, 52.0, 60.0, 60.0, 50.0, 56.0, 53.0, 54.0, 41.0, 49.0, 42.0, 23.0, 34.0, 24.0, 17.0, 16.0, 13.0, 8.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9357694387435913, -1.8736472129821777, -1.8115248680114746, -1.7494025230407715, -1.687280297279358, -1.6251580715179443, -1.5630357265472412, -1.500913381576538, -1.4387911558151245, -1.376668930053711, -1.3145465850830078, -1.2524242401123047, -1.1903020143508911, -1.1281797885894775, -1.0660574436187744, -1.0039350986480713, -0.9418128728866577, -0.8796905875205994, -0.817568302154541, -0.7554460167884827, -0.6933237314224243, -0.631201446056366, -0.5690791606903076, -0.5069568753242493, -0.4448345899581909, -0.38271230459213257, -0.3205900192260742, -0.25846773386001587, -0.19634544849395752, -0.13422316312789917, -0.07210087776184082, -0.00997859239578247, 0.05214381217956543, 0.11426609754562378, 0.17638838291168213, 0.23851066827774048, 0.30063295364379883, 0.3627552390098572, 0.4248775243759155, 0.4869998097419739, 0.5491220951080322, 0.6112443804740906, 0.6733666658401489, 0.7354889512062073, 0.7976112365722656, 0.859733521938324, 0.9218558073043823, 0.9839780926704407, 1.046100378036499, 1.1082227230072021, 1.1703449487686157, 1.2324671745300293, 1.2945895195007324, 1.3567118644714355, 1.4188340902328491, 1.4809563159942627, 1.5430786609649658, 1.605201005935669, 1.6673232316970825, 1.729445457458496, 1.7915678024291992, 1.8536901473999023, 1.915812373161316, 1.9779345989227295, 2.0400569438934326]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 9.0, 13.0, 5.0, 9.0, 9.0, 13.0, 12.0, 18.0, 29.0, 18.0, 27.0, 41.0, 40.0, 51.0, 52.0, 37.0, 46.0, 52.0, 50.0, 46.0, 47.0, 45.0, 48.0, 35.0, 46.0, 46.0, 25.0, 21.0, 31.0, 14.0, 19.0, 16.0, 10.0, 6.0, 6.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4187204837799072, -1.3720732927322388, -1.3254261016845703, -1.2787789106369019, -1.2321317195892334, -1.1854846477508545, -1.1388373374938965, -1.0921902656555176, -1.0455430746078491, -0.9988958835601807, -0.9522486925125122, -0.9056015014648438, -0.8589543700218201, -0.8123071789741516, -0.7656599879264832, -0.7190128564834595, -0.6723656058311462, -0.6257184147834778, -0.5790712237358093, -0.5324240922927856, -0.4857769012451172, -0.43912971019744873, -0.3924825191497803, -0.3458353579044342, -0.29918816685676575, -0.2525409758090973, -0.20589381456375122, -0.15924662351608276, -0.1125994473695755, -0.06595227122306824, -0.01930508017539978, 0.02734208106994629, 0.07398927211761475, 0.12063644826412201, 0.16728362441062927, 0.21393081545829773, 0.2605779767036438, 0.30722516775131226, 0.3538723587989807, 0.4005195200443268, 0.44716671109199524, 0.4938139021396637, 0.5404610633850098, 0.5871082544326782, 0.6337554454803467, 0.6804026365280151, 0.7270498275756836, 0.7736969590187073, 0.8203441500663757, 0.8669913411140442, 0.9136385321617126, 0.9602856636047363, 1.0069328546524048, 1.0535800457000732, 1.1002272367477417, 1.1468744277954102, 1.1935216188430786, 1.240168809890747, 1.2868160009384155, 1.333463191986084, 1.3801103830337524, 1.426757574081421, 1.4734046459197998, 1.5200518369674683, 1.5666990280151367]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 21.0, 29.0, 59.0, 93.0, 115.0, 215.0, 357.0, 556.0, 914.0, 1436.0, 2456.0, 3962.0, 6272.0, 9967.0, 15798.0, 23710.0, 35374.0, 50109.0, 67737.0, 86839.0, 102476.0, 112177.0, 112537.0, 103339.0, 87901.0, 69103.0, 51012.0, 36121.0, 24443.0, 16034.0, 10233.0, 6615.0, 4023.0, 2534.0, 1472.0, 913.0, 580.0, 382.0, 253.0, 143.0, 83.0, 54.0, 30.0, 26.0, 7.0, 16.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.033203125, -0.999908447265625, -0.96661376953125, -0.933319091796875, -0.9000244140625, -0.866729736328125, -0.83343505859375, -0.800140380859375, -0.766845703125, -0.733551025390625, -0.70025634765625, -0.666961669921875, -0.6336669921875, -0.600372314453125, -0.56707763671875, -0.533782958984375, -0.50048828125, -0.467193603515625, -0.43389892578125, -0.400604248046875, -0.3673095703125, -0.334014892578125, -0.30072021484375, -0.267425537109375, -0.234130859375, -0.200836181640625, -0.16754150390625, -0.134246826171875, -0.1009521484375, -0.067657470703125, -0.03436279296875, -0.001068115234375, 0.0322265625, 0.065521240234375, 0.09881591796875, 0.132110595703125, 0.1654052734375, 0.198699951171875, 0.23199462890625, 0.265289306640625, 0.298583984375, 0.331878662109375, 0.36517333984375, 0.398468017578125, 0.4317626953125, 0.465057373046875, 0.49835205078125, 0.531646728515625, 0.56494140625, 0.598236083984375, 0.63153076171875, 0.664825439453125, 0.6981201171875, 0.731414794921875, 0.76470947265625, 0.798004150390625, 0.831298828125, 0.864593505859375, 0.89788818359375, 0.931182861328125, 0.9644775390625, 0.997772216796875, 1.03106689453125, 1.064361572265625, 1.09765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 9.0, 9.0, 25.0, 8.0, 13.0, 27.0, 31.0, 25.0, 28.0, 30.0, 48.0, 50.0, 44.0, 47.0, 55.0, 59.0, 42.0, 49.0, 54.0, 43.0, 54.0, 38.0, 31.0, 30.0, 31.0, 19.0, 16.0, 20.0, 20.0, 8.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7255859375, -1.6743927001953125, -1.623199462890625, -1.5720062255859375, -1.52081298828125, -1.4696197509765625, -1.418426513671875, -1.3672332763671875, -1.3160400390625, -1.2648468017578125, -1.213653564453125, -1.1624603271484375, -1.11126708984375, -1.0600738525390625, -1.008880615234375, -0.9576873779296875, -0.906494140625, -0.8553009033203125, -0.804107666015625, -0.7529144287109375, -0.70172119140625, -0.6505279541015625, -0.599334716796875, -0.5481414794921875, -0.4969482421875, -0.4457550048828125, -0.394561767578125, -0.3433685302734375, -0.29217529296875, -0.2409820556640625, -0.189788818359375, -0.1385955810546875, -0.08740234375, -0.0362091064453125, 0.014984130859375, 0.0661773681640625, 0.11737060546875, 0.1685638427734375, 0.219757080078125, 0.2709503173828125, 0.3221435546875, 0.3733367919921875, 0.424530029296875, 0.4757232666015625, 0.52691650390625, 0.5781097412109375, 0.629302978515625, 0.6804962158203125, 0.731689453125, 0.7828826904296875, 0.834075927734375, 0.8852691650390625, 0.93646240234375, 0.9876556396484375, 1.038848876953125, 1.0900421142578125, 1.1412353515625, 1.1924285888671875, 1.243621826171875, 1.2948150634765625, 1.34600830078125, 1.3972015380859375, 1.448394775390625, 1.4995880126953125, 1.55078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 14.0, 17.0, 24.0, 37.0, 47.0, 80.0, 149.0, 207.0, 298.0, 477.0, 771.0, 1205.0, 1883.0, 2874.0, 4354.0, 6469.0, 9581.0, 14008.0, 20079.0, 28277.0, 38270.0, 49942.0, 63771.0, 76515.0, 86947.0, 94432.0, 95371.0, 91425.0, 82589.0, 70116.0, 56284.0, 44099.0, 33042.0, 23600.0, 16956.0, 11675.0, 7698.0, 5212.0, 3450.0, 2238.0, 1459.0, 972.0, 607.0, 346.0, 238.0, 160.0, 110.0, 68.0, 41.0, 24.0, 27.0, 14.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8673171997070312, -0.8386383056640625, -0.8099594116210938, -0.781280517578125, -0.7526016235351562, -0.7239227294921875, -0.6952438354492188, -0.66656494140625, -0.6378860473632812, -0.6092071533203125, -0.5805282592773438, -0.551849365234375, -0.5231704711914062, -0.4944915771484375, -0.46581268310546875, -0.4371337890625, -0.40845489501953125, -0.3797760009765625, -0.35109710693359375, -0.322418212890625, -0.29373931884765625, -0.2650604248046875, -0.23638153076171875, -0.20770263671875, -0.17902374267578125, -0.1503448486328125, -0.12166595458984375, -0.092987060546875, -0.06430816650390625, -0.0356292724609375, -0.00695037841796875, 0.021728515625, 0.05040740966796875, 0.0790863037109375, 0.10776519775390625, 0.136444091796875, 0.16512298583984375, 0.1938018798828125, 0.22248077392578125, 0.25115966796875, 0.27983856201171875, 0.3085174560546875, 0.33719635009765625, 0.365875244140625, 0.39455413818359375, 0.4232330322265625, 0.45191192626953125, 0.4805908203125, 0.5092697143554688, 0.5379486083984375, 0.5666275024414062, 0.595306396484375, 0.6239852905273438, 0.6526641845703125, 0.6813430786132812, 0.71002197265625, 0.7387008666992188, 0.7673797607421875, 0.7960586547851562, 0.824737548828125, 0.8534164428710938, 0.8820953369140625, 0.9107742309570312, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 4.0, 13.0, 5.0, 14.0, 15.0, 11.0, 19.0, 19.0, 22.0, 21.0, 22.0, 34.0, 38.0, 25.0, 30.0, 36.0, 39.0, 37.0, 39.0, 28.0, 30.0, 40.0, 36.0, 29.0, 42.0, 38.0, 32.0, 33.0, 30.0, 26.0, 26.0, 26.0, 16.0, 20.0, 9.0, 19.0, 15.0, 10.0, 8.0, 7.0, 5.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.8330078125, -0.8095779418945312, -0.7861480712890625, -0.7627182006835938, -0.739288330078125, -0.7158584594726562, -0.6924285888671875, -0.6689987182617188, -0.64556884765625, -0.6221389770507812, -0.5987091064453125, -0.5752792358398438, -0.551849365234375, -0.5284194946289062, -0.5049896240234375, -0.48155975341796875, -0.4581298828125, -0.43470001220703125, -0.4112701416015625, -0.38784027099609375, -0.364410400390625, -0.34098052978515625, -0.3175506591796875, -0.29412078857421875, -0.27069091796875, -0.24726104736328125, -0.2238311767578125, -0.20040130615234375, -0.176971435546875, -0.15354156494140625, -0.1301116943359375, -0.10668182373046875, -0.083251953125, -0.05982208251953125, -0.0363922119140625, -0.01296234130859375, 0.010467529296875, 0.03389739990234375, 0.0573272705078125, 0.08075714111328125, 0.10418701171875, 0.12761688232421875, 0.1510467529296875, 0.17447662353515625, 0.197906494140625, 0.22133636474609375, 0.2447662353515625, 0.26819610595703125, 0.2916259765625, 0.31505584716796875, 0.3384857177734375, 0.36191558837890625, 0.385345458984375, 0.40877532958984375, 0.4322052001953125, 0.45563507080078125, 0.47906494140625, 0.5024948120117188, 0.5259246826171875, 0.5493545532226562, 0.572784423828125, 0.5962142944335938, 0.6196441650390625, 0.6430740356445312, 0.66650390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 13.0, 27.0, 30.0, 53.0, 72.0, 89.0, 119.0, 186.0, 221.0, 362.0, 500.0, 748.0, 1130.0, 1782.0, 2819.0, 5074.0, 9421.0, 18078.0, 34812.0, 65433.0, 114540.0, 168930.0, 195492.0, 170623.0, 115426.0, 65912.0, 35101.0, 18451.0, 9577.0, 5133.0, 2947.0, 1789.0, 1155.0, 753.0, 505.0, 362.0, 243.0, 165.0, 114.0, 116.0, 55.0, 62.0, 33.0, 22.0, 17.0, 8.0, 5.0, 11.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.9111328125, -0.8822174072265625, -0.853302001953125, -0.8243865966796875, -0.79547119140625, -0.7665557861328125, -0.737640380859375, -0.7087249755859375, -0.6798095703125, -0.6508941650390625, -0.621978759765625, -0.5930633544921875, -0.56414794921875, -0.5352325439453125, -0.506317138671875, -0.4774017333984375, -0.448486328125, -0.4195709228515625, -0.390655517578125, -0.3617401123046875, -0.33282470703125, -0.3039093017578125, -0.274993896484375, -0.2460784912109375, -0.2171630859375, -0.1882476806640625, -0.159332275390625, -0.1304168701171875, -0.10150146484375, -0.0725860595703125, -0.043670654296875, -0.0147552490234375, 0.01416015625, 0.0430755615234375, 0.071990966796875, 0.1009063720703125, 0.12982177734375, 0.1587371826171875, 0.187652587890625, 0.2165679931640625, 0.2454833984375, 0.2743988037109375, 0.303314208984375, 0.3322296142578125, 0.36114501953125, 0.3900604248046875, 0.418975830078125, 0.4478912353515625, 0.476806640625, 0.5057220458984375, 0.534637451171875, 0.5635528564453125, 0.59246826171875, 0.6213836669921875, 0.650299072265625, 0.6792144775390625, 0.7081298828125, 0.7370452880859375, 0.765960693359375, 0.7948760986328125, 0.82379150390625, 0.8527069091796875, 0.881622314453125, 0.9105377197265625, 0.939453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 7.0, 15.0, 32.0, 34.0, 52.0, 69.0, 104.0, 114.0, 99.0, 115.0, 98.0, 70.0, 53.0, 46.0, 29.0, 16.0, 12.0, 8.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010120868682861328, -9.655021131038666e-05, -9.189173579216003e-05, -8.723326027393341e-05, -8.257478475570679e-05, -7.791630923748016e-05, -7.325783371925354e-05, -6.859935820102692e-05, -6.394088268280029e-05, -5.928240716457367e-05, -5.4623931646347046e-05, -4.996545612812042e-05, -4.53069806098938e-05, -4.0648505091667175e-05, -3.599002957344055e-05, -3.133155405521393e-05, -2.6673078536987305e-05, -2.201460301876068e-05, -1.7356127500534058e-05, -1.2697651982307434e-05, -8.03917646408081e-06, -3.380700945854187e-06, 1.2777745723724365e-06, 5.93625009059906e-06, 1.0594725608825684e-05, 1.5253201127052307e-05, 1.991167664527893e-05, 2.4570152163505554e-05, 2.9228627681732178e-05, 3.38871031999588e-05, 3.8545578718185425e-05, 4.320405423641205e-05, 4.786252975463867e-05, 5.2521005272865295e-05, 5.717948079109192e-05, 6.183795630931854e-05, 6.649643182754517e-05, 7.115490734577179e-05, 7.581338286399841e-05, 8.047185838222504e-05, 8.513033390045166e-05, 8.978880941867828e-05, 9.444728493690491e-05, 9.910576045513153e-05, 0.00010376423597335815, 0.00010842271149158478, 0.0001130811870098114, 0.00011773966252803802, 0.00012239813804626465, 0.00012705661356449127, 0.0001317150890827179, 0.00013637356460094452, 0.00014103204011917114, 0.00014569051563739777, 0.0001503489911556244, 0.000155007466673851, 0.00015966594219207764, 0.00016432441771030426, 0.00016898289322853088, 0.0001736413687467575, 0.00017829984426498413, 0.00018295831978321075, 0.00018761679530143738, 0.000192275270819664, 0.00019693374633789062]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 8.0, 5.0, 7.0, 17.0, 10.0, 26.0, 35.0, 40.0, 62.0, 87.0, 135.0, 178.0, 259.0, 351.0, 536.0, 766.0, 1161.0, 1730.0, 2595.0, 4006.0, 6300.0, 10164.0, 17278.0, 28996.0, 49312.0, 79210.0, 115121.0, 147790.0, 158166.0, 139796.0, 105500.0, 69976.0, 42988.0, 25683.0, 14877.0, 9033.0, 5630.0, 3598.0, 2328.0, 1536.0, 975.0, 685.0, 483.0, 327.0, 240.0, 169.0, 111.0, 83.0, 58.0, 35.0, 36.0, 24.0, 13.0, 7.0, 11.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.73828125, -0.7147445678710938, -0.6912078857421875, -0.6676712036132812, -0.644134521484375, -0.6205978393554688, -0.5970611572265625, -0.5735244750976562, -0.54998779296875, -0.5264511108398438, -0.5029144287109375, -0.47937774658203125, -0.455841064453125, -0.43230438232421875, -0.4087677001953125, -0.38523101806640625, -0.3616943359375, -0.33815765380859375, -0.3146209716796875, -0.29108428955078125, -0.267547607421875, -0.24401092529296875, -0.2204742431640625, -0.19693756103515625, -0.17340087890625, -0.14986419677734375, -0.1263275146484375, -0.10279083251953125, -0.079254150390625, -0.05571746826171875, -0.0321807861328125, -0.00864410400390625, 0.014892578125, 0.03842926025390625, 0.0619659423828125, 0.08550262451171875, 0.109039306640625, 0.13257598876953125, 0.1561126708984375, 0.17964935302734375, 0.20318603515625, 0.22672271728515625, 0.2502593994140625, 0.27379608154296875, 0.297332763671875, 0.32086944580078125, 0.3444061279296875, 0.36794281005859375, 0.3914794921875, 0.41501617431640625, 0.4385528564453125, 0.46208953857421875, 0.485626220703125, 0.5091629028320312, 0.5326995849609375, 0.5562362670898438, 0.57977294921875, 0.6033096313476562, 0.6268463134765625, 0.6503829956054688, 0.673919677734375, 0.6974563598632812, 0.7209930419921875, 0.7445297241210938, 0.76806640625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 2.0, 8.0, 12.0, 6.0, 11.0, 25.0, 22.0, 31.0, 34.0, 34.0, 39.0, 50.0, 43.0, 52.0, 66.0, 65.0, 69.0, 64.0, 56.0, 43.0, 44.0, 43.0, 27.0, 25.0, 29.0, 20.0, 8.0, 6.0, 12.0, 17.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.234619140625, -0.22672653198242188, -0.21883392333984375, -0.21094131469726562, -0.2030487060546875, -0.19515609741210938, -0.18726348876953125, -0.17937088012695312, -0.171478271484375, -0.16358566284179688, -0.15569305419921875, -0.14780044555664062, -0.1399078369140625, -0.13201522827148438, -0.12412261962890625, -0.11623001098632812, -0.10833740234375, -0.10044479370117188, -0.09255218505859375, -0.08465957641601562, -0.0767669677734375, -0.06887435913085938, -0.06098175048828125, -0.053089141845703125, -0.045196533203125, -0.037303924560546875, -0.02941131591796875, -0.021518707275390625, -0.0136260986328125, -0.005733489990234375, 0.00215911865234375, 0.010051727294921875, 0.0179443359375, 0.025836944580078125, 0.03372955322265625, 0.041622161865234375, 0.0495147705078125, 0.057407379150390625, 0.06529998779296875, 0.07319259643554688, 0.081085205078125, 0.08897781372070312, 0.09687042236328125, 0.10476303100585938, 0.1126556396484375, 0.12054824829101562, 0.12844085693359375, 0.13633346557617188, 0.14422607421875, 0.15211868286132812, 0.16001129150390625, 0.16790390014648438, 0.1757965087890625, 0.18368911743164062, 0.19158172607421875, 0.19947433471679688, 0.207366943359375, 0.21525955200195312, 0.22315216064453125, 0.23104476928710938, 0.2389373779296875, 0.24682998657226562, 0.25472259521484375, 0.2626152038574219, 0.2705078125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 2.0, 11.0, 10.0, 14.0, 4.0, 14.0, 14.0, 15.0, 23.0, 26.0, 42.0, 51.0, 41.0, 34.0, 42.0, 54.0, 45.0, 47.0, 48.0, 51.0, 48.0, 40.0, 40.0, 44.0, 42.0, 32.0, 33.0, 23.0, 21.0, 16.0, 10.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6329678297042847, -1.5764333009719849, -1.519898772239685, -1.4633642435073853, -1.4068297147750854, -1.3502951860427856, -1.2937607765197754, -1.2372262477874756, -1.1806917190551758, -1.124157190322876, -1.0676226615905762, -1.0110881328582764, -0.9545536041259766, -0.8980190753936768, -0.8414846062660217, -0.7849500775337219, -0.7284154891967773, -0.6718809604644775, -0.6153464317321777, -0.5588119029998779, -0.5022773742675781, -0.4457428753376007, -0.3892083764076233, -0.3326738476753235, -0.2761393189430237, -0.21960479021072388, -0.16307027637958527, -0.10653576254844666, -0.05000123381614685, 0.006533294916152954, 0.06306779384613037, 0.11960232257843018, 0.17613673210144043, 0.23267126083374023, 0.28920578956604004, 0.34574028849601746, 0.40227481722831726, 0.45880934596061707, 0.5153438448905945, 0.5718783736228943, 0.6284129023551941, 0.6849474310874939, 0.7414819598197937, 0.7980164289474487, 0.8545509576797485, 0.9110854864120483, 0.9676200151443481, 1.024154543876648, 1.0806890726089478, 1.1372236013412476, 1.1937581300735474, 1.2502926588058472, 1.306827187538147, 1.3633617162704468, 1.419896125793457, 1.4764306545257568, 1.5329651832580566, 1.5894997119903564, 1.6460342407226562, 1.702568769454956, 1.7591032981872559, 1.8156378269195557, 1.8721723556518555, 1.9287068843841553, 1.985241413116455]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 16.0, 6.0, 16.0, 16.0, 18.0, 22.0, 23.0, 22.0, 32.0, 30.0, 46.0, 34.0, 39.0, 52.0, 40.0, 35.0, 49.0, 42.0, 42.0, 46.0, 38.0, 35.0, 38.0, 32.0, 35.0, 30.0, 28.0, 21.0, 19.0, 17.0, 14.0, 15.0, 5.0, 6.0, 12.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3978337049484253, -1.353912115097046, -1.309990406036377, -1.2660688161849976, -1.2221472263336182, -1.1782256364822388, -1.1343040466308594, -1.0903823375701904, -1.046460747718811, -1.0025391578674316, -0.9586175084114075, -0.9146958589553833, -0.8707742691040039, -0.8268526792526245, -0.7829310297966003, -0.7390093803405762, -0.6950877904891968, -0.6511662006378174, -0.6072445511817932, -0.563322901725769, -0.5194013118743896, -0.47547969222068787, -0.4315580725669861, -0.3876364529132843, -0.3437148332595825, -0.29979321360588074, -0.25587159395217896, -0.21194997429847717, -0.1680283546447754, -0.12410673499107361, -0.08018511533737183, -0.036263495683670044, 0.007658123970031738, 0.05157974362373352, 0.0955013632774353, 0.13942298293113708, 0.18334460258483887, 0.22726622223854065, 0.27118784189224243, 0.3151094615459442, 0.359031081199646, 0.4029527008533478, 0.44687432050704956, 0.49079594016075134, 0.5347175598144531, 0.5786391496658325, 0.6225607991218567, 0.6664824485778809, 0.7104040384292603, 0.7543256282806396, 0.7982472777366638, 0.842168927192688, 0.8860905170440674, 0.9300121068954468, 0.973933756351471, 1.0178554058074951, 1.0617769956588745, 1.105698585510254, 1.1496202945709229, 1.1935418844223022, 1.2374634742736816, 1.281385064125061, 1.3253066539764404, 1.3692283630371094, 1.4131499528884888]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 6.0, 13.0, 25.0, 33.0, 57.0, 92.0, 168.0, 263.0, 480.0, 773.0, 1243.0, 2205.0, 3993.0, 7227.0, 12803.0, 23414.0, 42565.0, 76368.0, 134845.0, 227770.0, 360197.0, 510090.0, 622073.0, 637597.0, 540215.0, 391226.0, 252904.0, 151390.0, 86177.0, 48244.0, 26735.0, 14644.0, 8074.0, 4462.0, 2513.0, 1424.0, 809.0, 477.0, 285.0, 168.0, 93.0, 50.0, 41.0, 21.0, 16.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4785308837890625, -1.427764892578125, -1.3769989013671875, -1.32623291015625, -1.2754669189453125, -1.224700927734375, -1.1739349365234375, -1.1231689453125, -1.0724029541015625, -1.021636962890625, -0.9708709716796875, -0.92010498046875, -0.8693389892578125, -0.818572998046875, -0.7678070068359375, -0.717041015625, -0.6662750244140625, -0.615509033203125, -0.5647430419921875, -0.51397705078125, -0.4632110595703125, -0.412445068359375, -0.3616790771484375, -0.3109130859375, -0.2601470947265625, -0.209381103515625, -0.1586151123046875, -0.10784912109375, -0.0570831298828125, -0.006317138671875, 0.0444488525390625, 0.09521484375, 0.1459808349609375, 0.196746826171875, 0.2475128173828125, 0.29827880859375, 0.3490447998046875, 0.399810791015625, 0.4505767822265625, 0.5013427734375, 0.5521087646484375, 0.602874755859375, 0.6536407470703125, 0.70440673828125, 0.7551727294921875, 0.805938720703125, 0.8567047119140625, 0.907470703125, 0.9582366943359375, 1.009002685546875, 1.0597686767578125, 1.11053466796875, 1.1613006591796875, 1.212066650390625, 1.2628326416015625, 1.3135986328125, 1.3643646240234375, 1.415130615234375, 1.4658966064453125, 1.51666259765625, 1.5674285888671875, 1.618194580078125, 1.6689605712890625, 1.7197265625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 8.0, 13.0, 13.0, 15.0, 18.0, 29.0, 25.0, 27.0, 19.0, 30.0, 26.0, 43.0, 40.0, 52.0, 27.0, 33.0, 51.0, 43.0, 37.0, 45.0, 37.0, 31.0, 34.0, 41.0, 40.0, 34.0, 31.0, 27.0, 13.0, 22.0, 14.0, 19.0, 11.0, 10.0, 4.0, 11.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1434173583984375, -1.108123779296875, -1.0728302001953125, -1.03753662109375, -1.0022430419921875, -0.966949462890625, -0.9316558837890625, -0.8963623046875, -0.8610687255859375, -0.825775146484375, -0.7904815673828125, -0.75518798828125, -0.7198944091796875, -0.684600830078125, -0.6493072509765625, -0.614013671875, -0.5787200927734375, -0.543426513671875, -0.5081329345703125, -0.47283935546875, -0.4375457763671875, -0.402252197265625, -0.3669586181640625, -0.3316650390625, -0.2963714599609375, -0.261077880859375, -0.2257843017578125, -0.19049072265625, -0.1551971435546875, -0.119903564453125, -0.0846099853515625, -0.04931640625, -0.0140228271484375, 0.021270751953125, 0.0565643310546875, 0.09185791015625, 0.1271514892578125, 0.162445068359375, 0.1977386474609375, 0.2330322265625, 0.2683258056640625, 0.303619384765625, 0.3389129638671875, 0.37420654296875, 0.4095001220703125, 0.444793701171875, 0.4800872802734375, 0.515380859375, 0.5506744384765625, 0.585968017578125, 0.6212615966796875, 0.65655517578125, 0.6918487548828125, 0.727142333984375, 0.7624359130859375, 0.7977294921875, 0.8330230712890625, 0.868316650390625, 0.9036102294921875, 0.93890380859375, 0.9741973876953125, 1.009490966796875, 1.0447845458984375, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 18.0, 18.0, 42.0, 58.0, 88.0, 126.0, 195.0, 327.0, 564.0, 890.0, 1364.0, 2316.0, 3681.0, 5795.0, 9585.0, 15446.0, 25553.0, 40369.0, 63993.0, 98149.0, 146268.0, 212878.0, 290699.0, 372180.0, 438707.0, 474247.0, 462564.0, 411738.0, 337848.0, 254038.0, 181491.0, 123446.0, 81500.0, 52030.0, 32834.0, 20388.0, 12460.0, 7816.0, 4756.0, 2940.0, 1811.0, 1181.0, 682.0, 464.0, 255.0, 188.0, 111.0, 65.0, 49.0, 28.0, 17.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.388671875, -1.344970703125, -1.30126953125, -1.257568359375, -1.2138671875, -1.170166015625, -1.12646484375, -1.082763671875, -1.0390625, -0.995361328125, -0.95166015625, -0.907958984375, -0.8642578125, -0.820556640625, -0.77685546875, -0.733154296875, -0.689453125, -0.645751953125, -0.60205078125, -0.558349609375, -0.5146484375, -0.470947265625, -0.42724609375, -0.383544921875, -0.33984375, -0.296142578125, -0.25244140625, -0.208740234375, -0.1650390625, -0.121337890625, -0.07763671875, -0.033935546875, 0.009765625, 0.053466796875, 0.09716796875, 0.140869140625, 0.1845703125, 0.228271484375, 0.27197265625, 0.315673828125, 0.359375, 0.403076171875, 0.44677734375, 0.490478515625, 0.5341796875, 0.577880859375, 0.62158203125, 0.665283203125, 0.708984375, 0.752685546875, 0.79638671875, 0.840087890625, 0.8837890625, 0.927490234375, 0.97119140625, 1.014892578125, 1.05859375, 1.102294921875, 1.14599609375, 1.189697265625, 1.2333984375, 1.277099609375, 1.32080078125, 1.364501953125, 1.408203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 7.0, 14.0, 16.0, 19.0, 20.0, 32.0, 30.0, 31.0, 39.0, 49.0, 58.0, 71.0, 74.0, 109.0, 119.0, 122.0, 127.0, 154.0, 171.0, 174.0, 193.0, 206.0, 210.0, 168.0, 207.0, 190.0, 159.0, 157.0, 140.0, 148.0, 126.0, 119.0, 113.0, 82.0, 79.0, 68.0, 42.0, 45.0, 45.0, 30.0, 27.0, 20.0, 15.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.54931640625, -0.5322036743164062, -0.5150909423828125, -0.49797821044921875, -0.480865478515625, -0.46375274658203125, -0.4466400146484375, -0.42952728271484375, -0.41241455078125, -0.39530181884765625, -0.3781890869140625, -0.36107635498046875, -0.343963623046875, -0.32685089111328125, -0.3097381591796875, -0.29262542724609375, -0.2755126953125, -0.25839996337890625, -0.2412872314453125, -0.22417449951171875, -0.207061767578125, -0.18994903564453125, -0.1728363037109375, -0.15572357177734375, -0.13861083984375, -0.12149810791015625, -0.1043853759765625, -0.08727264404296875, -0.070159912109375, -0.05304718017578125, -0.0359344482421875, -0.01882171630859375, -0.001708984375, 0.01540374755859375, 0.0325164794921875, 0.04962921142578125, 0.066741943359375, 0.08385467529296875, 0.1009674072265625, 0.11808013916015625, 0.13519287109375, 0.15230560302734375, 0.1694183349609375, 0.18653106689453125, 0.203643798828125, 0.22075653076171875, 0.2378692626953125, 0.25498199462890625, 0.2720947265625, 0.28920745849609375, 0.3063201904296875, 0.32343292236328125, 0.340545654296875, 0.35765838623046875, 0.3747711181640625, 0.39188385009765625, 0.40899658203125, 0.42610931396484375, 0.4432220458984375, 0.46033477783203125, 0.477447509765625, 0.49456024169921875, 0.5116729736328125, 0.5287857055664062, 0.5458984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 4.0, 7.0, 14.0, 15.0, 9.0, 17.0, 16.0, 26.0, 27.0, 28.0, 41.0, 41.0, 48.0, 55.0, 64.0, 52.0, 57.0, 49.0, 62.0, 42.0, 48.0, 49.0, 30.0, 28.0, 28.0, 23.0, 22.0, 24.0, 12.0, 17.0, 11.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.348088264465332, -2.280186176300049, -2.2122840881347656, -2.1443819999694824, -2.0764801502227783, -2.008578062057495, -1.940675973892212, -1.8727738857269287, -1.8048717975616455, -1.7369697093963623, -1.6690677404403687, -1.6011656522750854, -1.5332635641098022, -1.4653615951538086, -1.3974595069885254, -1.3295574188232422, -1.2616554498672485, -1.1937533617019653, -1.1258513927459717, -1.0579493045806885, -0.9900472164154053, -0.9221451878547668, -0.8542431592941284, -0.7863410711288452, -0.7184390425682068, -0.6505370140075684, -0.5826349258422852, -0.5147328972816467, -0.4468308389186859, -0.3789287805557251, -0.31102675199508667, -0.24312469363212585, -0.17522263526916504, -0.10732058435678482, -0.0394185334444046, 0.02848351001739502, 0.09638556838035583, 0.16428762674331665, 0.23218965530395508, 0.3000917136669159, 0.3679937720298767, 0.4358958303928375, 0.5037978887557983, 0.5716999173164368, 0.6396019458770752, 0.7075040340423584, 0.7754060626029968, 0.8433080911636353, 0.9112101793289185, 0.9791122078895569, 1.0470142364501953, 1.1149163246154785, 1.1828184127807617, 1.250720500946045, 1.3186224699020386, 1.3865245580673218, 1.4544265270233154, 1.5223286151885986, 1.5902305841445923, 1.6581326723098755, 1.7260347604751587, 1.7939367294311523, 1.8618388175964355, 1.9297409057617188, 1.997642993927002]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 12.0, 9.0, 12.0, 18.0, 15.0, 23.0, 14.0, 24.0, 18.0, 29.0, 36.0, 47.0, 40.0, 33.0, 39.0, 46.0, 42.0, 39.0, 41.0, 51.0, 44.0, 42.0, 49.0, 30.0, 27.0, 26.0, 26.0, 31.0, 19.0, 19.0, 16.0, 17.0, 11.0, 12.0, 8.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.7488301992416382, -1.7021123170852661, -1.6553945541381836, -1.6086766719818115, -1.561958909034729, -1.515241026878357, -1.4685232639312744, -1.4218053817749023, -1.3750876188278198, -1.3283697366714478, -1.2816519737243652, -1.2349340915679932, -1.1882163286209106, -1.1414984464645386, -1.094780683517456, -1.048062801361084, -1.001344919204712, -0.9546270966529846, -0.9079092741012573, -0.86119145154953, -0.8144736289978027, -0.7677558064460754, -0.7210379838943481, -0.6743201017379761, -0.6276023387908936, -0.5808845162391663, -0.534166693687439, -0.48744887113571167, -0.4407310485839844, -0.3940132260322571, -0.3472953736782074, -0.3005775511264801, -0.2538597583770752, -0.2071419358253479, -0.1604241132736206, -0.11370627582073212, -0.06698845326900482, -0.020270630717277527, 0.026447206735610962, 0.07316502928733826, 0.11988285183906555, 0.16660067439079285, 0.21331849694252014, 0.2600363492965698, 0.3067541718482971, 0.3534719944000244, 0.4001898169517517, 0.446907639503479, 0.4936254620552063, 0.5403432846069336, 0.5870611071586609, 0.6337789297103882, 0.6804967522621155, 0.7272145748138428, 0.7739324569702148, 0.8206502199172974, 0.8673681020736694, 0.9140859246253967, 0.960803747177124, 1.007521629333496, 1.0542393922805786, 1.1009572744369507, 1.1476750373840332, 1.1943929195404053, 1.2411106824874878]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 11.0, 23.0, 20.0, 47.0, 77.0, 111.0, 146.0, 239.0, 363.0, 558.0, 883.0, 1192.0, 2080.0, 3223.0, 4981.0, 8184.0, 13213.0, 21773.0, 36158.0, 58197.0, 92153.0, 137461.0, 174055.0, 164789.0, 121882.0, 78916.0, 49423.0, 30329.0, 18173.0, 11106.0, 6880.0, 4364.0, 2661.0, 1746.0, 1066.0, 699.0, 425.0, 289.0, 197.0, 147.0, 114.0, 68.0, 41.0, 25.0, 22.0, 12.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.343505859375, -0.3323631286621094, -0.32122039794921875, -0.3100776672363281, -0.2989349365234375, -0.2877922058105469, -0.27664947509765625, -0.2655067443847656, -0.254364013671875, -0.24322128295898438, -0.23207855224609375, -0.22093582153320312, -0.2097930908203125, -0.19865036010742188, -0.18750762939453125, -0.17636489868164062, -0.16522216796875, -0.15407943725585938, -0.14293670654296875, -0.13179397583007812, -0.1206512451171875, -0.10950851440429688, -0.09836578369140625, -0.08722305297851562, -0.076080322265625, -0.06493759155273438, -0.05379486083984375, -0.042652130126953125, -0.0315093994140625, -0.020366668701171875, -0.00922393798828125, 0.001918792724609375, 0.0130615234375, 0.024204254150390625, 0.03534698486328125, 0.046489715576171875, 0.0576324462890625, 0.06877517700195312, 0.07991790771484375, 0.09106063842773438, 0.102203369140625, 0.11334609985351562, 0.12448883056640625, 0.13563156127929688, 0.1467742919921875, 0.15791702270507812, 0.16905975341796875, 0.18020248413085938, 0.19134521484375, 0.20248794555664062, 0.21363067626953125, 0.22477340698242188, 0.2359161376953125, 0.24705886840820312, 0.25820159912109375, 0.2693443298339844, 0.280487060546875, 0.2916297912597656, 0.30277252197265625, 0.3139152526855469, 0.3250579833984375, 0.3362007141113281, 0.34734344482421875, 0.3584861755371094, 0.36962890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 8.0, 12.0, 12.0, 21.0, 19.0, 21.0, 30.0, 28.0, 34.0, 27.0, 26.0, 35.0, 42.0, 40.0, 52.0, 40.0, 38.0, 34.0, 51.0, 34.0, 43.0, 51.0, 43.0, 37.0, 28.0, 16.0, 30.0, 23.0, 16.0, 27.0, 10.0, 12.0, 12.0, 7.0, 6.0, 8.0, 1.0, 6.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7933349609375, -1.741943359375, -1.6905517578125, -1.63916015625, -1.5877685546875, -1.536376953125, -1.4849853515625, -1.43359375, -1.3822021484375, -1.330810546875, -1.2794189453125, -1.22802734375, -1.1766357421875, -1.125244140625, -1.0738525390625, -1.0224609375, -0.9710693359375, -0.919677734375, -0.8682861328125, -0.81689453125, -0.7655029296875, -0.714111328125, -0.6627197265625, -0.611328125, -0.5599365234375, -0.508544921875, -0.4571533203125, -0.40576171875, -0.3543701171875, -0.302978515625, -0.2515869140625, -0.2001953125, -0.1488037109375, -0.097412109375, -0.0460205078125, 0.00537109375, 0.0567626953125, 0.108154296875, 0.1595458984375, 0.2109375, 0.2623291015625, 0.313720703125, 0.3651123046875, 0.41650390625, 0.4678955078125, 0.519287109375, 0.5706787109375, 0.6220703125, 0.6734619140625, 0.724853515625, 0.7762451171875, 0.82763671875, 0.8790283203125, 0.930419921875, 0.9818115234375, 1.033203125, 1.0845947265625, 1.135986328125, 1.1873779296875, 1.23876953125, 1.2901611328125, 1.341552734375, 1.3929443359375, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 9.0, 20.0, 31.0, 26.0, 39.0, 78.0, 102.0, 152.0, 248.0, 371.0, 628.0, 1072.0, 1912.0, 3275.0, 5853.0, 11076.0, 20867.0, 40352.0, 77504.0, 140286.0, 212390.0, 215760.0, 146346.0, 80335.0, 42153.0, 21871.0, 11529.0, 6166.0, 3297.0, 1877.0, 1071.0, 650.0, 395.0, 272.0, 172.0, 89.0, 75.0, 47.0, 47.0, 23.0, 10.0, 18.0, 11.0, 9.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49560546875, -0.4806022644042969, -0.46559906005859375, -0.4505958557128906, -0.4355926513671875, -0.4205894470214844, -0.40558624267578125, -0.3905830383300781, -0.375579833984375, -0.3605766296386719, -0.34557342529296875, -0.3305702209472656, -0.3155670166015625, -0.3005638122558594, -0.28556060791015625, -0.2705574035644531, -0.25555419921875, -0.24055099487304688, -0.22554779052734375, -0.21054458618164062, -0.1955413818359375, -0.18053817749023438, -0.16553497314453125, -0.15053176879882812, -0.135528564453125, -0.12052536010742188, -0.10552215576171875, -0.09051895141601562, -0.0755157470703125, -0.060512542724609375, -0.04550933837890625, -0.030506134033203125, -0.0155029296875, -0.000499725341796875, 0.01450347900390625, 0.029506683349609375, 0.0445098876953125, 0.059513092041015625, 0.07451629638671875, 0.08951950073242188, 0.104522705078125, 0.11952590942382812, 0.13452911376953125, 0.14953231811523438, 0.1645355224609375, 0.17953872680664062, 0.19454193115234375, 0.20954513549804688, 0.22454833984375, 0.23955154418945312, 0.25455474853515625, 0.2695579528808594, 0.2845611572265625, 0.2995643615722656, 0.31456756591796875, 0.3295707702636719, 0.344573974609375, 0.3595771789550781, 0.37458038330078125, 0.3895835876464844, 0.4045867919921875, 0.4195899963378906, 0.43459320068359375, 0.4495964050292969, 0.464599609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 9.0, 3.0, 15.0, 12.0, 10.0, 17.0, 16.0, 23.0, 12.0, 32.0, 34.0, 40.0, 34.0, 51.0, 44.0, 53.0, 38.0, 37.0, 48.0, 40.0, 50.0, 42.0, 34.0, 39.0, 35.0, 36.0, 32.0, 29.0, 26.0, 22.0, 17.0, 21.0, 11.0, 8.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9091796875, -0.8769073486328125, -0.844635009765625, -0.8123626708984375, -0.78009033203125, -0.7478179931640625, -0.715545654296875, -0.6832733154296875, -0.6510009765625, -0.6187286376953125, -0.586456298828125, -0.5541839599609375, -0.52191162109375, -0.4896392822265625, -0.457366943359375, -0.4250946044921875, -0.392822265625, -0.3605499267578125, -0.328277587890625, -0.2960052490234375, -0.26373291015625, -0.2314605712890625, -0.199188232421875, -0.1669158935546875, -0.1346435546875, -0.1023712158203125, -0.070098876953125, -0.0378265380859375, -0.00555419921875, 0.0267181396484375, 0.058990478515625, 0.0912628173828125, 0.12353515625, 0.1558074951171875, 0.188079833984375, 0.2203521728515625, 0.25262451171875, 0.2848968505859375, 0.317169189453125, 0.3494415283203125, 0.3817138671875, 0.4139862060546875, 0.446258544921875, 0.4785308837890625, 0.51080322265625, 0.5430755615234375, 0.575347900390625, 0.6076202392578125, 0.639892578125, 0.6721649169921875, 0.704437255859375, 0.7367095947265625, 0.76898193359375, 0.8012542724609375, 0.833526611328125, 0.8657989501953125, 0.8980712890625, 0.9303436279296875, 0.962615966796875, 0.9948883056640625, 1.02716064453125, 1.0594329833984375, 1.091705322265625, 1.1239776611328125, 1.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 4.0, 9.0, 6.0, 17.0, 19.0, 29.0, 34.0, 51.0, 65.0, 86.0, 133.0, 175.0, 242.0, 401.0, 768.0, 1356.0, 2700.0, 6069.0, 16988.0, 70262.0, 511066.0, 363189.0, 50721.0, 13666.0, 5096.0, 2273.0, 1161.0, 669.0, 425.0, 267.0, 157.0, 124.0, 79.0, 57.0, 33.0, 30.0, 23.0, 18.0, 17.0, 14.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.47998046875, -0.4662284851074219, -0.45247650146484375, -0.4387245178222656, -0.4249725341796875, -0.4112205505371094, -0.39746856689453125, -0.3837165832519531, -0.369964599609375, -0.3562126159667969, -0.34246063232421875, -0.3287086486816406, -0.3149566650390625, -0.3012046813964844, -0.28745269775390625, -0.2737007141113281, -0.25994873046875, -0.24619674682617188, -0.23244476318359375, -0.21869277954101562, -0.2049407958984375, -0.19118881225585938, -0.17743682861328125, -0.16368484497070312, -0.149932861328125, -0.13618087768554688, -0.12242889404296875, -0.10867691040039062, -0.0949249267578125, -0.08117294311523438, -0.06742095947265625, -0.053668975830078125, -0.0399169921875, -0.026165008544921875, -0.01241302490234375, 0.001338958740234375, 0.0150909423828125, 0.028842926025390625, 0.04259490966796875, 0.056346893310546875, 0.070098876953125, 0.08385086059570312, 0.09760284423828125, 0.11135482788085938, 0.1251068115234375, 0.13885879516601562, 0.15261077880859375, 0.16636276245117188, 0.18011474609375, 0.19386672973632812, 0.20761871337890625, 0.22137069702148438, 0.2351226806640625, 0.24887466430664062, 0.26262664794921875, 0.2763786315917969, 0.290130615234375, 0.3038825988769531, 0.31763458251953125, 0.3313865661621094, 0.3451385498046875, 0.3588905334472656, 0.37264251708984375, 0.3863945007324219, 0.400146484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 20.0, 21.0, 21.0, 43.0, 45.0, 60.0, 68.0, 90.0, 97.0, 97.0, 79.0, 96.0, 56.0, 61.0, 38.0, 34.0, 21.0, 8.0, 13.0, 5.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.907162368297577e-05, -1.841410994529724e-05, -1.7756596207618713e-05, -1.7099082469940186e-05, -1.6441568732261658e-05, -1.578405499458313e-05, -1.5126541256904602e-05, -1.4469027519226074e-05, -1.3811513781547546e-05, -1.3154000043869019e-05, -1.249648630619049e-05, -1.1838972568511963e-05, -1.1181458830833435e-05, -1.0523945093154907e-05, -9.86643135547638e-06, -9.208917617797852e-06, -8.551403880119324e-06, -7.893890142440796e-06, -7.236376404762268e-06, -6.57886266708374e-06, -5.921348929405212e-06, -5.2638351917266846e-06, -4.606321454048157e-06, -3.948807716369629e-06, -3.291293978691101e-06, -2.6337802410125732e-06, -1.9762665033340454e-06, -1.3187527656555176e-06, -6.612390279769897e-07, -3.725290298461914e-09, 6.537884473800659e-07, 1.3113021850585938e-06, 1.9688159227371216e-06, 2.6263296604156494e-06, 3.2838433980941772e-06, 3.941357135772705e-06, 4.598870873451233e-06, 5.256384611129761e-06, 5.9138983488082886e-06, 6.571412086486816e-06, 7.228925824165344e-06, 7.886439561843872e-06, 8.5439532995224e-06, 9.201467037200928e-06, 9.858980774879456e-06, 1.0516494512557983e-05, 1.1174008250236511e-05, 1.1831521987915039e-05, 1.2489035725593567e-05, 1.3146549463272095e-05, 1.3804063200950623e-05, 1.446157693862915e-05, 1.5119090676307678e-05, 1.5776604413986206e-05, 1.6434118151664734e-05, 1.7091631889343262e-05, 1.774914562702179e-05, 1.8406659364700317e-05, 1.9064173102378845e-05, 1.9721686840057373e-05, 2.03792005777359e-05, 2.103671431541443e-05, 2.1694228053092957e-05, 2.2351741790771484e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 19.0, 19.0, 34.0, 47.0, 37.0, 83.0, 87.0, 142.0, 181.0, 217.0, 326.0, 407.0, 591.0, 808.0, 1166.0, 1744.0, 3056.0, 6147.0, 14618.0, 44795.0, 169416.0, 469661.0, 238226.0, 60446.0, 18656.0, 7510.0, 3536.0, 2064.0, 1343.0, 893.0, 569.0, 415.0, 330.0, 246.0, 163.0, 148.0, 97.0, 81.0, 60.0, 39.0, 23.0, 28.0, 16.0, 17.0, 8.0, 6.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.372314453125, -0.35930633544921875, -0.3462982177734375, -0.33329010009765625, -0.320281982421875, -0.30727386474609375, -0.2942657470703125, -0.28125762939453125, -0.26824951171875, -0.25524139404296875, -0.2422332763671875, -0.22922515869140625, -0.216217041015625, -0.20320892333984375, -0.1902008056640625, -0.17719268798828125, -0.1641845703125, -0.15117645263671875, -0.1381683349609375, -0.12516021728515625, -0.112152099609375, -0.09914398193359375, -0.0861358642578125, -0.07312774658203125, -0.06011962890625, -0.04711151123046875, -0.0341033935546875, -0.02109527587890625, -0.008087158203125, 0.00492095947265625, 0.0179290771484375, 0.03093719482421875, 0.0439453125, 0.05695343017578125, 0.0699615478515625, 0.08296966552734375, 0.095977783203125, 0.10898590087890625, 0.1219940185546875, 0.13500213623046875, 0.14801025390625, 0.16101837158203125, 0.1740264892578125, 0.18703460693359375, 0.200042724609375, 0.21305084228515625, 0.2260589599609375, 0.23906707763671875, 0.2520751953125, 0.26508331298828125, 0.2780914306640625, 0.29109954833984375, 0.304107666015625, 0.31711578369140625, 0.3301239013671875, 0.34313201904296875, 0.35614013671875, 0.36914825439453125, 0.3821563720703125, 0.39516448974609375, 0.408172607421875, 0.42118072509765625, 0.4341888427734375, 0.44719696044921875, 0.460205078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 10.0, 4.0, 10.0, 17.0, 22.0, 34.0, 32.0, 49.0, 59.0, 91.0, 123.0, 127.0, 113.0, 66.0, 53.0, 51.0, 26.0, 22.0, 16.0, 15.0, 9.0, 3.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07037353515625, -0.06778240203857422, -0.06519126892089844, -0.06260013580322266, -0.060009002685546875, -0.057417869567871094, -0.05482673645019531, -0.05223560333251953, -0.04964447021484375, -0.04705333709716797, -0.04446220397949219, -0.041871070861816406, -0.039279937744140625, -0.036688804626464844, -0.03409767150878906, -0.03150653839111328, -0.0289154052734375, -0.02632427215576172, -0.023733139038085938, -0.021142005920410156, -0.018550872802734375, -0.015959739685058594, -0.013368606567382812, -0.010777473449707031, -0.00818634033203125, -0.005595207214355469, -0.0030040740966796875, -0.00041294097900390625, 0.002178192138671875, 0.004769325256347656, 0.0073604583740234375, 0.009951591491699219, 0.012542724609375, 0.015133857727050781, 0.017724990844726562, 0.020316123962402344, 0.022907257080078125, 0.025498390197753906, 0.028089523315429688, 0.03068065643310547, 0.03327178955078125, 0.03586292266845703, 0.03845405578613281, 0.041045188903808594, 0.043636322021484375, 0.046227455139160156, 0.04881858825683594, 0.05140972137451172, 0.0540008544921875, 0.05659198760986328, 0.05918312072753906, 0.061774253845214844, 0.06436538696289062, 0.0669565200805664, 0.06954765319824219, 0.07213878631591797, 0.07472991943359375, 0.07732105255126953, 0.07991218566894531, 0.0825033187866211, 0.08509445190429688, 0.08768558502197266, 0.09027671813964844, 0.09286785125732422, 0.095458984375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 8.0, 8.0, 12.0, 18.0, 11.0, 19.0, 15.0, 33.0, 24.0, 36.0, 47.0, 32.0, 59.0, 61.0, 55.0, 60.0, 58.0, 49.0, 56.0, 40.0, 53.0, 39.0, 26.0, 28.0, 24.0, 22.0, 28.0, 12.0, 12.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4011058807373047, -2.3326547145843506, -2.2642035484313965, -2.1957523822784424, -2.1273012161254883, -2.058850049972534, -1.9903987646102905, -1.9219475984573364, -1.8534964323043823, -1.7850452661514282, -1.7165940999984741, -1.64814293384552, -1.5796916484832764, -1.5112404823303223, -1.4427893161773682, -1.374338150024414, -1.30588698387146, -1.2374358177185059, -1.1689846515655518, -1.1005334854125977, -1.0320823192596436, -0.9636310935020447, -0.8951798677444458, -0.8267287015914917, -0.7582775354385376, -0.6898263692855835, -0.6213752031326294, -0.5529239773750305, -0.4844728112220764, -0.4160216450691223, -0.3475704491138458, -0.27911925315856934, -0.21066796779632568, -0.1422167867422104, -0.07376560568809509, -0.005314424633979797, 0.0631367564201355, 0.1315879225730896, 0.2000391185283661, 0.2684903144836426, 0.3369414806365967, 0.4053926467895508, 0.47384384274482727, 0.5422950387001038, 0.6107462048530579, 0.679197371006012, 0.7476485967636108, 0.8160997629165649, 0.884550929069519, 0.9530020952224731, 1.0214532613754272, 1.0899044275283813, 1.158355712890625, 1.226806879043579, 1.2952580451965332, 1.3637092113494873, 1.4321603775024414, 1.5006115436553955, 1.5690627098083496, 1.6375138759613037, 1.7059650421142578, 1.774416208267212, 1.8428674936294556, 1.9113186597824097, 1.9797698259353638]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 23.0, 15.0, 22.0, 15.0, 22.0, 19.0, 31.0, 35.0, 46.0, 43.0, 30.0, 41.0, 52.0, 41.0, 38.0, 51.0, 41.0, 44.0, 44.0, 47.0, 27.0, 26.0, 29.0, 31.0, 25.0, 17.0, 20.0, 18.0, 12.0, 14.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.7654094696044922, -1.7181633710861206, -1.6709171533584595, -1.623671054840088, -1.5764248371124268, -1.5291787385940552, -1.4819326400756836, -1.4346864223480225, -1.3874403238296509, -1.3401942253112793, -1.2929480075836182, -1.2457019090652466, -1.198455810546875, -1.1512095928192139, -1.1039634943008423, -1.0567173957824707, -1.0094711780548096, -0.9622250199317932, -0.9149788618087769, -0.8677327632904053, -0.8204866051673889, -0.7732404470443726, -0.725994348526001, -0.6787481904029846, -0.6315020322799683, -0.5842558741569519, -0.5370097160339355, -0.48976361751556396, -0.4425174593925476, -0.39527130126953125, -0.3480251729488373, -0.3007790446281433, -0.25353288650512695, -0.2062867432832718, -0.15904060006141663, -0.11179445683956146, -0.0645483136177063, -0.017302170395851135, 0.02994397282600403, 0.077190101146698, 0.12443625926971436, 0.17168240249156952, 0.21892854571342468, 0.26617467403411865, 0.313420832157135, 0.36066699028015137, 0.40791311860084534, 0.4551592469215393, 0.5024054050445557, 0.549651563167572, 0.5968977212905884, 0.64414381980896, 0.6913899779319763, 0.7386361360549927, 0.7858822345733643, 0.8331283926963806, 0.880374550819397, 0.9276207089424133, 0.9748668670654297, 1.0221129655838013, 1.0693590641021729, 1.116605281829834, 1.1638513803482056, 1.2110974788665771, 1.2583436965942383]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 8.0, 15.0, 14.0, 25.0, 55.0, 81.0, 128.0, 197.0, 338.0, 544.0, 797.0, 1232.0, 1752.0, 2857.0, 4235.0, 6360.0, 9471.0, 13672.0, 19373.0, 27283.0, 36458.0, 47943.0, 60727.0, 72949.0, 84306.0, 91300.0, 93304.0, 90939.0, 83174.0, 71981.0, 59448.0, 46977.0, 35271.0, 26278.0, 18658.0, 13315.0, 9156.0, 6069.0, 4165.0, 2670.0, 1849.0, 1127.0, 762.0, 437.0, 297.0, 231.0, 133.0, 78.0, 47.0, 33.0, 19.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89794921875, -0.8684616088867188, -0.8389739990234375, -0.8094863891601562, -0.779998779296875, -0.7505111694335938, -0.7210235595703125, -0.6915359497070312, -0.66204833984375, -0.6325607299804688, -0.6030731201171875, -0.5735855102539062, -0.544097900390625, -0.5146102905273438, -0.4851226806640625, -0.45563507080078125, -0.4261474609375, -0.39665985107421875, -0.3671722412109375, -0.33768463134765625, -0.308197021484375, -0.27870941162109375, -0.2492218017578125, -0.21973419189453125, -0.19024658203125, -0.16075897216796875, -0.1312713623046875, -0.10178375244140625, -0.072296142578125, -0.04280853271484375, -0.0133209228515625, 0.01616668701171875, 0.045654296875, 0.07514190673828125, 0.1046295166015625, 0.13411712646484375, 0.163604736328125, 0.19309234619140625, 0.2225799560546875, 0.25206756591796875, 0.28155517578125, 0.31104278564453125, 0.3405303955078125, 0.37001800537109375, 0.399505615234375, 0.42899322509765625, 0.4584808349609375, 0.48796844482421875, 0.5174560546875, 0.5469436645507812, 0.5764312744140625, 0.6059188842773438, 0.635406494140625, 0.6648941040039062, 0.6943817138671875, 0.7238693237304688, 0.75335693359375, 0.7828445434570312, 0.8123321533203125, 0.8418197631835938, 0.871307373046875, 0.9007949829101562, 0.9302825927734375, 0.9597702026367188, 0.9892578125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 9.0, 10.0, 6.0, 6.0, 5.0, 15.0, 15.0, 20.0, 16.0, 21.0, 26.0, 43.0, 33.0, 31.0, 40.0, 37.0, 50.0, 41.0, 45.0, 42.0, 37.0, 36.0, 48.0, 45.0, 41.0, 46.0, 32.0, 26.0, 29.0, 22.0, 16.0, 32.0, 9.0, 19.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.822265625, -1.7723846435546875, -1.722503662109375, -1.6726226806640625, -1.62274169921875, -1.5728607177734375, -1.522979736328125, -1.4730987548828125, -1.4232177734375, -1.3733367919921875, -1.323455810546875, -1.2735748291015625, -1.22369384765625, -1.1738128662109375, -1.123931884765625, -1.0740509033203125, -1.024169921875, -0.9742889404296875, -0.924407958984375, -0.8745269775390625, -0.82464599609375, -0.7747650146484375, -0.724884033203125, -0.6750030517578125, -0.6251220703125, -0.5752410888671875, -0.525360107421875, -0.4754791259765625, -0.42559814453125, -0.3757171630859375, -0.325836181640625, -0.2759552001953125, -0.22607421875, -0.1761932373046875, -0.126312255859375, -0.0764312744140625, -0.02655029296875, 0.0233306884765625, 0.073211669921875, 0.1230926513671875, 0.1729736328125, 0.2228546142578125, 0.272735595703125, 0.3226165771484375, 0.37249755859375, 0.4223785400390625, 0.472259521484375, 0.5221405029296875, 0.572021484375, 0.6219024658203125, 0.671783447265625, 0.7216644287109375, 0.77154541015625, 0.8214263916015625, 0.871307373046875, 0.9211883544921875, 0.9710693359375, 1.0209503173828125, 1.070831298828125, 1.1207122802734375, 1.17059326171875, 1.2204742431640625, 1.270355224609375, 1.3202362060546875, 1.3701171875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 29.0, 34.0, 61.0, 110.0, 157.0, 240.0, 434.0, 709.0, 1150.0, 1840.0, 3092.0, 4683.0, 7584.0, 11518.0, 17911.0, 26462.0, 37853.0, 52354.0, 68496.0, 84795.0, 98785.0, 105512.0, 105893.0, 98562.0, 84539.0, 68253.0, 52906.0, 38203.0, 26530.0, 17758.0, 11975.0, 7527.0, 4816.0, 3004.0, 1841.0, 1144.0, 702.0, 449.0, 256.0, 144.0, 82.0, 57.0, 32.0, 23.0, 24.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9619140625, -0.9275665283203125, -0.893218994140625, -0.8588714599609375, -0.82452392578125, -0.7901763916015625, -0.755828857421875, -0.7214813232421875, -0.6871337890625, -0.6527862548828125, -0.618438720703125, -0.5840911865234375, -0.54974365234375, -0.5153961181640625, -0.481048583984375, -0.4467010498046875, -0.412353515625, -0.3780059814453125, -0.343658447265625, -0.3093109130859375, -0.27496337890625, -0.2406158447265625, -0.206268310546875, -0.1719207763671875, -0.1375732421875, -0.1032257080078125, -0.068878173828125, -0.0345306396484375, -0.00018310546875, 0.0341644287109375, 0.068511962890625, 0.1028594970703125, 0.13720703125, 0.1715545654296875, 0.205902099609375, 0.2402496337890625, 0.27459716796875, 0.3089447021484375, 0.343292236328125, 0.3776397705078125, 0.4119873046875, 0.4463348388671875, 0.480682373046875, 0.5150299072265625, 0.54937744140625, 0.5837249755859375, 0.618072509765625, 0.6524200439453125, 0.686767578125, 0.7211151123046875, 0.755462646484375, 0.7898101806640625, 0.82415771484375, 0.8585052490234375, 0.892852783203125, 0.9272003173828125, 0.9615478515625, 0.9958953857421875, 1.030242919921875, 1.0645904541015625, 1.09893798828125, 1.1332855224609375, 1.167633056640625, 1.2019805908203125, 1.236328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 8.0, 13.0, 11.0, 23.0, 25.0, 24.0, 21.0, 35.0, 26.0, 33.0, 36.0, 44.0, 45.0, 40.0, 41.0, 44.0, 53.0, 36.0, 49.0, 40.0, 42.0, 31.0, 28.0, 26.0, 30.0, 31.0, 24.0, 22.0, 18.0, 16.0, 13.0, 11.0, 9.0, 7.0, 5.0, 1.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94677734375, -0.9163818359375, -0.885986328125, -0.8555908203125, -0.8251953125, -0.7947998046875, -0.764404296875, -0.7340087890625, -0.70361328125, -0.6732177734375, -0.642822265625, -0.6124267578125, -0.58203125, -0.5516357421875, -0.521240234375, -0.4908447265625, -0.46044921875, -0.4300537109375, -0.399658203125, -0.3692626953125, -0.3388671875, -0.3084716796875, -0.278076171875, -0.2476806640625, -0.21728515625, -0.1868896484375, -0.156494140625, -0.1260986328125, -0.095703125, -0.0653076171875, -0.034912109375, -0.0045166015625, 0.02587890625, 0.0562744140625, 0.086669921875, 0.1170654296875, 0.1474609375, 0.1778564453125, 0.208251953125, 0.2386474609375, 0.26904296875, 0.2994384765625, 0.329833984375, 0.3602294921875, 0.390625, 0.4210205078125, 0.451416015625, 0.4818115234375, 0.51220703125, 0.5426025390625, 0.572998046875, 0.6033935546875, 0.6337890625, 0.6641845703125, 0.694580078125, 0.7249755859375, 0.75537109375, 0.7857666015625, 0.816162109375, 0.8465576171875, 0.876953125, 0.9073486328125, 0.937744140625, 0.9681396484375, 0.99853515625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 7.0, 13.0, 20.0, 28.0, 53.0, 79.0, 105.0, 174.0, 261.0, 406.0, 630.0, 997.0, 1690.0, 2523.0, 4260.0, 6978.0, 11316.0, 17798.0, 28071.0, 42237.0, 61801.0, 84552.0, 106911.0, 122931.0, 126065.0, 115297.0, 96278.0, 72106.0, 51564.0, 34392.0, 22055.0, 14036.0, 8641.0, 5505.0, 3283.0, 1967.0, 1261.0, 832.0, 511.0, 333.0, 210.0, 130.0, 85.0, 53.0, 46.0, 24.0, 17.0, 6.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.654296875, -0.634613037109375, -0.61492919921875, -0.595245361328125, -0.5755615234375, -0.555877685546875, -0.53619384765625, -0.516510009765625, -0.496826171875, -0.477142333984375, -0.45745849609375, -0.437774658203125, -0.4180908203125, -0.398406982421875, -0.37872314453125, -0.359039306640625, -0.33935546875, -0.319671630859375, -0.29998779296875, -0.280303955078125, -0.2606201171875, -0.240936279296875, -0.22125244140625, -0.201568603515625, -0.181884765625, -0.162200927734375, -0.14251708984375, -0.122833251953125, -0.1031494140625, -0.083465576171875, -0.06378173828125, -0.044097900390625, -0.0244140625, -0.004730224609375, 0.01495361328125, 0.034637451171875, 0.0543212890625, 0.074005126953125, 0.09368896484375, 0.113372802734375, 0.133056640625, 0.152740478515625, 0.17242431640625, 0.192108154296875, 0.2117919921875, 0.231475830078125, 0.25115966796875, 0.270843505859375, 0.29052734375, 0.310211181640625, 0.32989501953125, 0.349578857421875, 0.3692626953125, 0.388946533203125, 0.40863037109375, 0.428314208984375, 0.447998046875, 0.467681884765625, 0.48736572265625, 0.507049560546875, 0.5267333984375, 0.546417236328125, 0.56610107421875, 0.585784912109375, 0.60546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0, 9.0, 2.0, 10.0, 11.0, 16.0, 7.0, 16.0, 16.0, 21.0, 24.0, 36.0, 43.0, 44.0, 47.0, 47.0, 43.0, 38.0, 31.0, 49.0, 54.0, 54.0, 47.0, 47.0, 45.0, 33.0, 37.0, 34.0, 20.0, 22.0, 21.0, 16.0, 18.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.736682891845703e-05, -7.528718560934067e-05, -7.32075423002243e-05, -7.112789899110794e-05, -6.904825568199158e-05, -6.696861237287521e-05, -6.488896906375885e-05, -6.280932575464249e-05, -6.072968244552612e-05, -5.865003913640976e-05, -5.6570395827293396e-05, -5.449075251817703e-05, -5.241110920906067e-05, -5.0331465899944305e-05, -4.825182259082794e-05, -4.617217928171158e-05, -4.4092535972595215e-05, -4.201289266347885e-05, -3.993324935436249e-05, -3.7853606045246124e-05, -3.577396273612976e-05, -3.36943194270134e-05, -3.1614676117897034e-05, -2.953503280878067e-05, -2.7455389499664307e-05, -2.5375746190547943e-05, -2.329610288143158e-05, -2.1216459572315216e-05, -1.9136816263198853e-05, -1.705717295408249e-05, -1.4977529644966125e-05, -1.2897886335849762e-05, -1.0818243026733398e-05, -8.738599717617035e-06, -6.658956408500671e-06, -4.579313099384308e-06, -2.4996697902679443e-06, -4.200264811515808e-07, 1.6596168279647827e-06, 3.7392601370811462e-06, 5.81890344619751e-06, 7.898546755313873e-06, 9.978190064430237e-06, 1.20578333735466e-05, 1.4137476682662964e-05, 1.6217119991779327e-05, 1.829676330089569e-05, 2.0376406610012054e-05, 2.2456049919128418e-05, 2.453569322824478e-05, 2.6615336537361145e-05, 2.869497984647751e-05, 3.077462315559387e-05, 3.2854266464710236e-05, 3.49339097738266e-05, 3.701355308294296e-05, 3.9093196392059326e-05, 4.117283970117569e-05, 4.325248301029205e-05, 4.533212631940842e-05, 4.741176962852478e-05, 4.9491412937641144e-05, 5.157105624675751e-05, 5.365069955587387e-05, 5.5730342864990234e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 7.0, 17.0, 30.0, 34.0, 49.0, 73.0, 124.0, 189.0, 261.0, 408.0, 609.0, 955.0, 1427.0, 2153.0, 3295.0, 4967.0, 7789.0, 11594.0, 17740.0, 25976.0, 37427.0, 52088.0, 69389.0, 87052.0, 102017.0, 110650.0, 109008.0, 99364.0, 83872.0, 65065.0, 49103.0, 34702.0, 24081.0, 16095.0, 10594.0, 7042.0, 4707.0, 2985.0, 1938.0, 1269.0, 880.0, 544.0, 339.0, 236.0, 130.0, 91.0, 70.0, 41.0, 22.0, 20.0, 16.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.57080078125, -0.5529022216796875, -0.535003662109375, -0.5171051025390625, -0.49920654296875, -0.4813079833984375, -0.463409423828125, -0.4455108642578125, -0.4276123046875, -0.4097137451171875, -0.391815185546875, -0.3739166259765625, -0.35601806640625, -0.3381195068359375, -0.320220947265625, -0.3023223876953125, -0.284423828125, -0.2665252685546875, -0.248626708984375, -0.2307281494140625, -0.21282958984375, -0.1949310302734375, -0.177032470703125, -0.1591339111328125, -0.1412353515625, -0.1233367919921875, -0.105438232421875, -0.0875396728515625, -0.06964111328125, -0.0517425537109375, -0.033843994140625, -0.0159454345703125, 0.001953125, 0.0198516845703125, 0.037750244140625, 0.0556488037109375, 0.07354736328125, 0.0914459228515625, 0.109344482421875, 0.1272430419921875, 0.1451416015625, 0.1630401611328125, 0.180938720703125, 0.1988372802734375, 0.21673583984375, 0.2346343994140625, 0.252532958984375, 0.2704315185546875, 0.288330078125, 0.3062286376953125, 0.324127197265625, 0.3420257568359375, 0.35992431640625, 0.3778228759765625, 0.395721435546875, 0.4136199951171875, 0.4315185546875, 0.4494171142578125, 0.467315673828125, 0.4852142333984375, 0.50311279296875, 0.5210113525390625, 0.538909912109375, 0.5568084716796875, 0.57470703125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 10.0, 19.0, 16.0, 18.0, 22.0, 29.0, 20.0, 31.0, 34.0, 35.0, 39.0, 40.0, 50.0, 38.0, 51.0, 52.0, 52.0, 55.0, 34.0, 49.0, 38.0, 42.0, 39.0, 38.0, 28.0, 21.0, 20.0, 8.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1801280975341797, -0.17263412475585938, -0.16514015197753906, -0.15764617919921875, -0.15015220642089844, -0.14265823364257812, -0.1351642608642578, -0.1276702880859375, -0.12017631530761719, -0.11268234252929688, -0.10518836975097656, -0.09769439697265625, -0.09020042419433594, -0.08270645141601562, -0.07521247863769531, -0.067718505859375, -0.06022453308105469, -0.052730560302734375, -0.04523658752441406, -0.03774261474609375, -0.030248641967773438, -0.022754669189453125, -0.015260696411132812, -0.0077667236328125, -0.0002727508544921875, 0.007221221923828125, 0.014715194702148438, 0.02220916748046875, 0.029703140258789062, 0.037197113037109375, 0.04469108581542969, 0.05218505859375, 0.05967903137207031, 0.06717300415039062, 0.07466697692871094, 0.08216094970703125, 0.08965492248535156, 0.09714889526367188, 0.10464286804199219, 0.1121368408203125, 0.11963081359863281, 0.12712478637695312, 0.13461875915527344, 0.14211273193359375, 0.14960670471191406, 0.15710067749023438, 0.1645946502685547, 0.172088623046875, 0.1795825958251953, 0.18707656860351562, 0.19457054138183594, 0.20206451416015625, 0.20955848693847656, 0.21705245971679688, 0.2245464324951172, 0.2320404052734375, 0.2395343780517578, 0.24702835083007812, 0.25452232360839844, 0.26201629638671875, 0.26951026916503906, 0.2770042419433594, 0.2844982147216797, 0.2919921875]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 18.0, 17.0, 27.0, 16.0, 23.0, 25.0, 41.0, 26.0, 50.0, 58.0, 47.0, 53.0, 62.0, 71.0, 58.0, 40.0, 45.0, 51.0, 34.0, 36.0, 31.0, 28.0, 23.0, 20.0, 24.0, 18.0, 12.0, 10.0, 5.0, 3.0, 5.0, 0.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.052737236022949, -1.9824645519256592, -1.9121919870376587, -1.8419193029403687, -1.7716466188430786, -1.7013740539550781, -1.631101369857788, -1.560828685760498, -1.490556001663208, -1.420283317565918, -1.3500107526779175, -1.2797380685806274, -1.2094653844833374, -1.139192819595337, -1.0689201354980469, -0.9986474514007568, -0.9283748865127563, -0.8581022620201111, -0.787829577922821, -0.7175569534301758, -0.6472842693328857, -0.5770116448402405, -0.5067390203475952, -0.43646636605262756, -0.3661937117576599, -0.29592105746269226, -0.2256484180688858, -0.15537577867507935, -0.0851031243801117, -0.014830470085144043, 0.05544215440750122, 0.12571480870246887, 0.19598746299743652, 0.2662601172924042, 0.3365327715873718, 0.4068053960800171, 0.47707805037498474, 0.5473507046699524, 0.6176233291625977, 0.6878960132598877, 0.758168637752533, 0.8284412622451782, 0.8987139463424683, 0.9689865708351135, 1.0392591953277588, 1.1095318794250488, 1.1798045635223389, 1.2500771284103394, 1.3203498125076294, 1.3906224966049194, 1.46089506149292, 1.53116774559021, 1.6014404296875, 1.67171311378479, 1.7419856786727905, 1.8122583627700806, 1.882530927658081, 1.952803611755371, 2.023076295852661, 2.093348979949951, 2.163621425628662, 2.233894109725952, 2.304166793823242, 2.3744394779205322, 2.4447121620178223]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 10.0, 8.0, 7.0, 18.0, 9.0, 21.0, 15.0, 27.0, 24.0, 26.0, 31.0, 35.0, 28.0, 39.0, 49.0, 44.0, 54.0, 34.0, 40.0, 41.0, 37.0, 48.0, 31.0, 43.0, 36.0, 32.0, 33.0, 25.0, 25.0, 21.0, 19.0, 11.0, 16.0, 7.0, 10.0, 10.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6441646814346313, -1.5958521366119385, -1.547539472579956, -1.4992269277572632, -1.4509143829345703, -1.4026018381118774, -1.3542892932891846, -1.3059766292572021, -1.2576640844345093, -1.2093515396118164, -1.161038875579834, -1.1127263307571411, -1.0644137859344482, -1.0161012411117554, -0.9677886366844177, -0.9194760322570801, -0.8711634874343872, -0.8228509426116943, -0.7745383381843567, -0.726225733757019, -0.6779131889343262, -0.6296006441116333, -0.5812880396842957, -0.532975435256958, -0.48466289043426514, -0.4363503158092499, -0.3880377411842346, -0.33972516655921936, -0.2914125919342041, -0.24310001730918884, -0.19478744268417358, -0.14647486805915833, -0.09816241264343262, -0.04984983801841736, -0.0015372633934020996, 0.04677531123161316, 0.09508788585662842, 0.14340046048164368, 0.19171303510665894, 0.2400256097316742, 0.28833818435668945, 0.3366507589817047, 0.38496333360671997, 0.43327590823173523, 0.4815884828567505, 0.5299010276794434, 0.578213632106781, 0.6265262365341187, 0.6748387813568115, 0.7231513261795044, 0.771463930606842, 0.8197765350341797, 0.8680890798568726, 0.9164016246795654, 0.9647142291069031, 1.0130268335342407, 1.0613393783569336, 1.1096519231796265, 1.1579644680023193, 1.2062771320343018, 1.2545896768569946, 1.3029022216796875, 1.35121488571167, 1.3995274305343628, 1.4478399753570557]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 16.0, 31.0, 52.0, 80.0, 104.0, 179.0, 311.0, 472.0, 780.0, 1244.0, 2147.0, 3646.0, 6049.0, 10341.0, 17374.0, 29901.0, 51538.0, 86344.0, 140587.0, 222680.0, 327754.0, 445322.0, 538683.0, 567637.0, 519751.0, 415012.0, 299586.0, 199195.0, 124863.0, 75576.0, 44861.0, 26159.0, 15083.0, 8728.0, 5065.0, 2967.0, 1662.0, 995.0, 599.0, 335.0, 211.0, 132.0, 92.0, 46.0, 30.0, 17.0, 17.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003570556640625, -1.549346923828125, -1.4983367919921875, -1.44732666015625, -1.3963165283203125, -1.345306396484375, -1.2942962646484375, -1.2432861328125, -1.1922760009765625, -1.141265869140625, -1.0902557373046875, -1.03924560546875, -0.9882354736328125, -0.937225341796875, -0.8862152099609375, -0.835205078125, -0.7841949462890625, -0.733184814453125, -0.6821746826171875, -0.63116455078125, -0.5801544189453125, -0.529144287109375, -0.4781341552734375, -0.4271240234375, -0.3761138916015625, -0.325103759765625, -0.2740936279296875, -0.22308349609375, -0.1720733642578125, -0.121063232421875, -0.0700531005859375, -0.01904296875, 0.0319671630859375, 0.082977294921875, 0.1339874267578125, 0.18499755859375, 0.2360076904296875, 0.287017822265625, 0.3380279541015625, 0.3890380859375, 0.4400482177734375, 0.491058349609375, 0.5420684814453125, 0.59307861328125, 0.6440887451171875, 0.695098876953125, 0.7461090087890625, 0.797119140625, 0.8481292724609375, 0.899139404296875, 0.9501495361328125, 1.00115966796875, 1.0521697998046875, 1.103179931640625, 1.1541900634765625, 1.2052001953125, 1.2562103271484375, 1.307220458984375, 1.3582305908203125, 1.40924072265625, 1.4602508544921875, 1.511260986328125, 1.5622711181640625, 1.61328125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 9.0, 11.0, 6.0, 15.0, 13.0, 16.0, 15.0, 27.0, 22.0, 28.0, 35.0, 32.0, 37.0, 40.0, 41.0, 39.0, 31.0, 37.0, 44.0, 42.0, 40.0, 37.0, 38.0, 35.0, 44.0, 25.0, 24.0, 23.0, 26.0, 25.0, 13.0, 12.0, 17.0, 18.0, 14.0, 5.0, 7.0, 5.0, 4.0, 8.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3056640625, -1.2673187255859375, -1.228973388671875, -1.1906280517578125, -1.15228271484375, -1.1139373779296875, -1.075592041015625, -1.0372467041015625, -0.9989013671875, -0.9605560302734375, -0.922210693359375, -0.8838653564453125, -0.84552001953125, -0.8071746826171875, -0.768829345703125, -0.7304840087890625, -0.692138671875, -0.6537933349609375, -0.615447998046875, -0.5771026611328125, -0.53875732421875, -0.5004119873046875, -0.462066650390625, -0.4237213134765625, -0.3853759765625, -0.3470306396484375, -0.308685302734375, -0.2703399658203125, -0.23199462890625, -0.1936492919921875, -0.155303955078125, -0.1169586181640625, -0.07861328125, -0.0402679443359375, -0.001922607421875, 0.0364227294921875, 0.07476806640625, 0.1131134033203125, 0.151458740234375, 0.1898040771484375, 0.2281494140625, 0.2664947509765625, 0.304840087890625, 0.3431854248046875, 0.38153076171875, 0.4198760986328125, 0.458221435546875, 0.4965667724609375, 0.534912109375, 0.5732574462890625, 0.611602783203125, 0.6499481201171875, 0.68829345703125, 0.7266387939453125, 0.764984130859375, 0.8033294677734375, 0.8416748046875, 0.8800201416015625, 0.918365478515625, 0.9567108154296875, 0.99505615234375, 1.0334014892578125, 1.071746826171875, 1.1100921630859375, 1.1484375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 17.0, 29.0, 42.0, 73.0, 120.0, 215.0, 351.0, 556.0, 932.0, 1594.0, 2777.0, 4568.0, 8097.0, 13402.0, 22683.0, 38392.0, 62227.0, 100217.0, 154234.0, 226711.0, 314267.0, 402179.0, 472768.0, 500720.0, 478665.0, 410040.0, 321211.0, 232322.0, 158581.0, 103429.0, 64824.0, 39677.0, 24078.0, 14092.0, 8348.0, 4799.0, 2918.0, 1680.0, 1009.0, 549.0, 338.0, 224.0, 133.0, 85.0, 49.0, 17.0, 13.0, 13.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6858062744140625, -1.632354736328125, -1.5789031982421875, -1.52545166015625, -1.4720001220703125, -1.418548583984375, -1.3650970458984375, -1.3116455078125, -1.2581939697265625, -1.204742431640625, -1.1512908935546875, -1.09783935546875, -1.0443878173828125, -0.990936279296875, -0.9374847412109375, -0.884033203125, -0.8305816650390625, -0.777130126953125, -0.7236785888671875, -0.67022705078125, -0.6167755126953125, -0.563323974609375, -0.5098724365234375, -0.4564208984375, -0.4029693603515625, -0.349517822265625, -0.2960662841796875, -0.24261474609375, -0.1891632080078125, -0.135711669921875, -0.0822601318359375, -0.02880859375, 0.0246429443359375, 0.078094482421875, 0.1315460205078125, 0.18499755859375, 0.2384490966796875, 0.291900634765625, 0.3453521728515625, 0.3988037109375, 0.4522552490234375, 0.505706787109375, 0.5591583251953125, 0.61260986328125, 0.6660614013671875, 0.719512939453125, 0.7729644775390625, 0.826416015625, 0.8798675537109375, 0.933319091796875, 0.9867706298828125, 1.04022216796875, 1.0936737060546875, 1.147125244140625, 1.2005767822265625, 1.2540283203125, 1.3074798583984375, 1.360931396484375, 1.4143829345703125, 1.46783447265625, 1.5212860107421875, 1.574737548828125, 1.6281890869140625, 1.681640625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 12.0, 10.0, 6.0, 27.0, 34.0, 30.0, 34.0, 60.0, 67.0, 84.0, 118.0, 136.0, 149.0, 142.0, 168.0, 206.0, 203.0, 215.0, 216.0, 240.0, 238.0, 212.0, 217.0, 170.0, 155.0, 151.0, 142.0, 147.0, 105.0, 80.0, 63.0, 57.0, 44.0, 42.0, 29.0, 12.0, 17.0, 5.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7265853881835938, -0.7026824951171875, -0.6787796020507812, -0.654876708984375, -0.6309738159179688, -0.6070709228515625, -0.5831680297851562, -0.55926513671875, -0.5353622436523438, -0.5114593505859375, -0.48755645751953125, -0.463653564453125, -0.43975067138671875, -0.4158477783203125, -0.39194488525390625, -0.3680419921875, -0.34413909912109375, -0.3202362060546875, -0.29633331298828125, -0.272430419921875, -0.24852752685546875, -0.2246246337890625, -0.20072174072265625, -0.17681884765625, -0.15291595458984375, -0.1290130615234375, -0.10511016845703125, -0.081207275390625, -0.05730438232421875, -0.0334014892578125, -0.00949859619140625, 0.014404296875, 0.03830718994140625, 0.0622100830078125, 0.08611297607421875, 0.110015869140625, 0.13391876220703125, 0.1578216552734375, 0.18172454833984375, 0.20562744140625, 0.22953033447265625, 0.2534332275390625, 0.27733612060546875, 0.301239013671875, 0.32514190673828125, 0.3490447998046875, 0.37294769287109375, 0.3968505859375, 0.42075347900390625, 0.4446563720703125, 0.46855926513671875, 0.492462158203125, 0.5163650512695312, 0.5402679443359375, 0.5641708374023438, 0.58807373046875, 0.6119766235351562, 0.6358795166015625, 0.6597824096679688, 0.683685302734375, 0.7075881958007812, 0.7314910888671875, 0.7553939819335938, 0.779296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 13.0, 17.0, 9.0, 28.0, 33.0, 22.0, 31.0, 34.0, 48.0, 62.0, 64.0, 61.0, 71.0, 49.0, 55.0, 50.0, 66.0, 49.0, 39.0, 40.0, 28.0, 27.0, 23.0, 13.0, 15.0, 13.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.804446220397949, -2.719447135925293, -2.6344478130340576, -2.5494487285614014, -2.464449644088745, -2.3794503211975098, -2.2944512367248535, -2.2094521522521973, -2.124453067779541, -2.0394539833068848, -1.954454779624939, -1.8694555759429932, -1.784456491470337, -1.6994572877883911, -1.6144580841064453, -1.529458999633789, -1.4444596767425537, -1.359460473060608, -1.2744613885879517, -1.1894621849060059, -1.1044631004333496, -1.0194638967514038, -0.934464693069458, -0.849465548992157, -0.764466404914856, -0.6794672608375549, -0.5944681167602539, -0.5094689130783081, -0.4244697690010071, -0.33947062492370605, -0.25447142124176025, -0.16947227716445923, -0.0844733715057373, 0.0005257874727249146, 0.08552494645118713, 0.17052412033081055, 0.2555232644081116, 0.3405224084854126, 0.4255216121673584, 0.5105207562446594, 0.5955199003219604, 0.6805190443992615, 0.7655181884765625, 0.8505173921585083, 0.9355165362358093, 1.0205156803131104, 1.1055148839950562, 1.190514087677002, 1.2755131721496582, 1.360512375831604, 1.4455114603042603, 1.530510663986206, 1.6155097484588623, 1.700508952140808, 1.785508155822754, 1.8705072402954102, 1.955506443977356, 2.0405056476593018, 2.125504732131958, 2.2105040550231934, 2.2955031394958496, 2.380502223968506, 2.465501308441162, 2.5505006313323975, 2.6354997158050537]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 12.0, 9.0, 10.0, 15.0, 18.0, 14.0, 23.0, 21.0, 30.0, 21.0, 36.0, 36.0, 27.0, 31.0, 42.0, 49.0, 43.0, 33.0, 42.0, 44.0, 42.0, 34.0, 46.0, 35.0, 35.0, 28.0, 24.0, 29.0, 25.0, 21.0, 18.0, 19.0, 14.0, 6.0, 8.0, 8.0, 3.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6612660884857178, -1.6119011640548706, -1.5625362396240234, -1.5131713151931763, -1.463806390762329, -1.414441466331482, -1.3650765419006348, -1.3157117366790771, -1.2663466930389404, -1.2169817686080933, -1.167616844177246, -1.118251919746399, -1.0688869953155518, -1.0195220708847046, -0.9701572060585022, -0.920792281627655, -0.8714274168014526, -0.8220624923706055, -0.7726975679397583, -0.7233326435089111, -0.673967719078064, -0.6246027946472168, -0.5752379298210144, -0.5258730053901672, -0.47650808095932007, -0.4271431565284729, -0.37777823209762573, -0.32841333746910095, -0.2790484130382538, -0.22968348860740662, -0.18031859397888184, -0.13095366954803467, -0.08158862590789795, -0.03222370892763138, 0.017141208052635193, 0.06650611758232117, 0.11587104201316833, 0.1652359664440155, 0.21460086107254028, 0.26396578550338745, 0.3133307099342346, 0.3626956343650818, 0.41206055879592896, 0.46142545342445374, 0.5107903480529785, 0.5601552724838257, 0.6095201969146729, 0.65888512134552, 0.7082500457763672, 0.7576149702072144, 0.8069798946380615, 0.8563448190689087, 0.9057097434997559, 0.955074667930603, 1.0044395923614502, 1.0538043975830078, 1.1031694412231445, 1.1525343656539917, 1.2018992900848389, 1.251264214515686, 1.3006291389465332, 1.3499940633773804, 1.3993589878082275, 1.4487237930297852, 1.4980887174606323]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 14.0, 12.0, 23.0, 38.0, 53.0, 72.0, 121.0, 181.0, 308.0, 468.0, 734.0, 1318.0, 2311.0, 4126.0, 7945.0, 15267.0, 29808.0, 56438.0, 105028.0, 179337.0, 231757.0, 182776.0, 108068.0, 57877.0, 30468.0, 15650.0, 8120.0, 4429.0, 2416.0, 1325.0, 769.0, 482.0, 291.0, 173.0, 97.0, 68.0, 58.0, 43.0, 17.0, 19.0, 15.0, 10.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5322265625, -0.5141983032226562, -0.4961700439453125, -0.47814178466796875, -0.460113525390625, -0.44208526611328125, -0.4240570068359375, -0.40602874755859375, -0.38800048828125, -0.36997222900390625, -0.3519439697265625, -0.33391571044921875, -0.315887451171875, -0.29785919189453125, -0.2798309326171875, -0.26180267333984375, -0.2437744140625, -0.22574615478515625, -0.2077178955078125, -0.18968963623046875, -0.171661376953125, -0.15363311767578125, -0.1356048583984375, -0.11757659912109375, -0.09954833984375, -0.08152008056640625, -0.0634918212890625, -0.04546356201171875, -0.027435302734375, -0.00940704345703125, 0.0086212158203125, 0.02664947509765625, 0.044677734375, 0.06270599365234375, 0.0807342529296875, 0.09876251220703125, 0.116790771484375, 0.13481903076171875, 0.1528472900390625, 0.17087554931640625, 0.18890380859375, 0.20693206787109375, 0.2249603271484375, 0.24298858642578125, 0.261016845703125, 0.27904510498046875, 0.2970733642578125, 0.31510162353515625, 0.3331298828125, 0.35115814208984375, 0.3691864013671875, 0.38721466064453125, 0.405242919921875, 0.42327117919921875, 0.4412994384765625, 0.45932769775390625, 0.47735595703125, 0.49538421630859375, 0.5134124755859375, 0.5314407348632812, 0.549468994140625, 0.5674972534179688, 0.5855255126953125, 0.6035537719726562, 0.62158203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 9.0, 20.0, 15.0, 19.0, 23.0, 22.0, 34.0, 30.0, 34.0, 26.0, 32.0, 35.0, 37.0, 37.0, 40.0, 47.0, 39.0, 45.0, 38.0, 40.0, 30.0, 33.0, 33.0, 29.0, 26.0, 20.0, 30.0, 14.0, 19.0, 26.0, 14.0, 5.0, 12.0, 10.0, 7.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.587890625, -1.536163330078125, -1.48443603515625, -1.432708740234375, -1.3809814453125, -1.329254150390625, -1.27752685546875, -1.225799560546875, -1.174072265625, -1.122344970703125, -1.07061767578125, -1.018890380859375, -0.9671630859375, -0.915435791015625, -0.86370849609375, -0.811981201171875, -0.76025390625, -0.708526611328125, -0.65679931640625, -0.605072021484375, -0.5533447265625, -0.501617431640625, -0.44989013671875, -0.398162841796875, -0.346435546875, -0.294708251953125, -0.24298095703125, -0.191253662109375, -0.1395263671875, -0.087799072265625, -0.03607177734375, 0.015655517578125, 0.0673828125, 0.119110107421875, 0.17083740234375, 0.222564697265625, 0.2742919921875, 0.326019287109375, 0.37774658203125, 0.429473876953125, 0.481201171875, 0.532928466796875, 0.58465576171875, 0.636383056640625, 0.6881103515625, 0.739837646484375, 0.79156494140625, 0.843292236328125, 0.89501953125, 0.946746826171875, 0.99847412109375, 1.050201416015625, 1.1019287109375, 1.153656005859375, 1.20538330078125, 1.257110595703125, 1.308837890625, 1.360565185546875, 1.41229248046875, 1.464019775390625, 1.5157470703125, 1.567474365234375, 1.61920166015625, 1.670928955078125, 1.72265625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 9.0, 11.0, 11.0, 25.0, 28.0, 34.0, 53.0, 74.0, 120.0, 184.0, 246.0, 363.0, 602.0, 935.0, 1483.0, 2676.0, 4663.0, 9102.0, 17957.0, 36978.0, 79615.0, 163223.0, 261603.0, 228074.0, 124296.0, 58646.0, 27684.0, 13572.0, 6828.0, 3792.0, 2123.0, 1329.0, 766.0, 462.0, 319.0, 200.0, 126.0, 87.0, 61.0, 55.0, 46.0, 34.0, 18.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5990371704101562, -0.5789337158203125, -0.5588302612304688, -0.538726806640625, -0.5186233520507812, -0.4985198974609375, -0.47841644287109375, -0.45831298828125, -0.43820953369140625, -0.4181060791015625, -0.39800262451171875, -0.377899169921875, -0.35779571533203125, -0.3376922607421875, -0.31758880615234375, -0.2974853515625, -0.27738189697265625, -0.2572784423828125, -0.23717498779296875, -0.217071533203125, -0.19696807861328125, -0.1768646240234375, -0.15676116943359375, -0.13665771484375, -0.11655426025390625, -0.0964508056640625, -0.07634735107421875, -0.056243896484375, -0.03614044189453125, -0.0160369873046875, 0.00406646728515625, 0.024169921875, 0.04427337646484375, 0.0643768310546875, 0.08448028564453125, 0.104583740234375, 0.12468719482421875, 0.1447906494140625, 0.16489410400390625, 0.18499755859375, 0.20510101318359375, 0.2252044677734375, 0.24530792236328125, 0.265411376953125, 0.28551483154296875, 0.3056182861328125, 0.32572174072265625, 0.3458251953125, 0.36592864990234375, 0.3860321044921875, 0.40613555908203125, 0.426239013671875, 0.44634246826171875, 0.4664459228515625, 0.48654937744140625, 0.50665283203125, 0.5267562866210938, 0.5468597412109375, 0.5669631958007812, 0.587066650390625, 0.6071701049804688, 0.6272735595703125, 0.6473770141601562, 0.66748046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 0.0, 0.0, 5.0, 6.0, 2.0, 4.0, 5.0, 2.0, 11.0, 8.0, 16.0, 14.0, 15.0, 22.0, 28.0, 22.0, 23.0, 30.0, 28.0, 35.0, 35.0, 62.0, 38.0, 39.0, 52.0, 42.0, 52.0, 42.0, 41.0, 39.0, 41.0, 34.0, 24.0, 33.0, 23.0, 21.0, 23.0, 14.0, 19.0, 16.0, 7.0, 14.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0341796875, -0.99884033203125, -0.9635009765625, -0.92816162109375, -0.892822265625, -0.85748291015625, -0.8221435546875, -0.78680419921875, -0.75146484375, -0.71612548828125, -0.6807861328125, -0.64544677734375, -0.610107421875, -0.57476806640625, -0.5394287109375, -0.50408935546875, -0.46875, -0.43341064453125, -0.3980712890625, -0.36273193359375, -0.327392578125, -0.29205322265625, -0.2567138671875, -0.22137451171875, -0.18603515625, -0.15069580078125, -0.1153564453125, -0.08001708984375, -0.044677734375, -0.00933837890625, 0.0260009765625, 0.06134033203125, 0.0966796875, 0.13201904296875, 0.1673583984375, 0.20269775390625, 0.238037109375, 0.27337646484375, 0.3087158203125, 0.34405517578125, 0.37939453125, 0.41473388671875, 0.4500732421875, 0.48541259765625, 0.520751953125, 0.55609130859375, 0.5914306640625, 0.62677001953125, 0.662109375, 0.69744873046875, 0.7327880859375, 0.76812744140625, 0.803466796875, 0.83880615234375, 0.8741455078125, 0.90948486328125, 0.94482421875, 0.98016357421875, 1.0155029296875, 1.05084228515625, 1.086181640625, 1.12152099609375, 1.1568603515625, 1.19219970703125, 1.2275390625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 7.0, 7.0, 6.0, 6.0, 13.0, 16.0, 19.0, 22.0, 49.0, 57.0, 61.0, 68.0, 98.0, 142.0, 179.0, 253.0, 331.0, 470.0, 718.0, 1055.0, 1608.0, 2597.0, 4691.0, 8932.0, 19480.0, 54137.0, 201674.0, 482523.0, 181015.0, 49612.0, 18402.0, 8207.0, 4572.0, 2545.0, 1480.0, 1001.0, 698.0, 479.0, 363.0, 221.0, 176.0, 157.0, 118.0, 77.0, 53.0, 48.0, 22.0, 27.0, 17.0, 14.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.33349609375, -0.32254791259765625, -0.3115997314453125, -0.30065155029296875, -0.289703369140625, -0.27875518798828125, -0.2678070068359375, -0.25685882568359375, -0.24591064453125, -0.23496246337890625, -0.2240142822265625, -0.21306610107421875, -0.202117919921875, -0.19116973876953125, -0.1802215576171875, -0.16927337646484375, -0.1583251953125, -0.14737701416015625, -0.1364288330078125, -0.12548065185546875, -0.114532470703125, -0.10358428955078125, -0.0926361083984375, -0.08168792724609375, -0.07073974609375, -0.05979156494140625, -0.0488433837890625, -0.03789520263671875, -0.026947021484375, -0.01599884033203125, -0.0050506591796875, 0.00589752197265625, 0.016845703125, 0.02779388427734375, 0.0387420654296875, 0.04969024658203125, 0.060638427734375, 0.07158660888671875, 0.0825347900390625, 0.09348297119140625, 0.10443115234375, 0.11537933349609375, 0.1263275146484375, 0.13727569580078125, 0.148223876953125, 0.15917205810546875, 0.1701202392578125, 0.18106842041015625, 0.1920166015625, 0.20296478271484375, 0.2139129638671875, 0.22486114501953125, 0.235809326171875, 0.24675750732421875, 0.2577056884765625, 0.26865386962890625, 0.27960205078125, 0.29055023193359375, 0.3014984130859375, 0.31244659423828125, 0.323394775390625, 0.33434295654296875, 0.3452911376953125, 0.35623931884765625, 0.3671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 10.0, 6.0, 9.0, 11.0, 9.0, 14.0, 14.0, 15.0, 35.0, 35.0, 32.0, 35.0, 42.0, 36.0, 56.0, 34.0, 48.0, 43.0, 43.0, 57.0, 41.0, 41.0, 35.0, 42.0, 40.0, 37.0, 23.0, 23.0, 15.0, 21.0, 14.0, 11.0, 9.0, 10.0, 13.0, 7.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.049041748046875e-05, -1.0143034160137177e-05, -9.795650839805603e-06, -9.44826751947403e-06, -9.100884199142456e-06, -8.753500878810883e-06, -8.406117558479309e-06, -8.058734238147736e-06, -7.711350917816162e-06, -7.363967597484589e-06, -7.016584277153015e-06, -6.669200956821442e-06, -6.321817636489868e-06, -5.974434316158295e-06, -5.627050995826721e-06, -5.279667675495148e-06, -4.932284355163574e-06, -4.584901034832001e-06, -4.237517714500427e-06, -3.890134394168854e-06, -3.5427510738372803e-06, -3.1953677535057068e-06, -2.8479844331741333e-06, -2.50060111284256e-06, -2.1532177925109863e-06, -1.8058344721794128e-06, -1.4584511518478394e-06, -1.1110678315162659e-06, -7.636845111846924e-07, -4.163011908531189e-07, -6.891787052154541e-08, 2.784654498100281e-07, 6.258487701416016e-07, 9.73232090473175e-07, 1.3206154108047485e-06, 1.667998731136322e-06, 2.0153820514678955e-06, 2.362765371799469e-06, 2.7101486921310425e-06, 3.057532012462616e-06, 3.4049153327941895e-06, 3.752298653125763e-06, 4.0996819734573364e-06, 4.44706529378891e-06, 4.794448614120483e-06, 5.141831934452057e-06, 5.48921525478363e-06, 5.836598575115204e-06, 6.183981895446777e-06, 6.531365215778351e-06, 6.878748536109924e-06, 7.226131856441498e-06, 7.573515176773071e-06, 7.920898497104645e-06, 8.268281817436218e-06, 8.615665137767792e-06, 8.963048458099365e-06, 9.310431778430939e-06, 9.657815098762512e-06, 1.0005198419094086e-05, 1.035258173942566e-05, 1.0699965059757233e-05, 1.1047348380088806e-05, 1.139473170042038e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 27.0, 18.0, 42.0, 53.0, 85.0, 121.0, 199.0, 227.0, 386.0, 571.0, 860.0, 1284.0, 2241.0, 4135.0, 8937.0, 22001.0, 67106.0, 226908.0, 433895.0, 188161.0, 55375.0, 18818.0, 7780.0, 3694.0, 1961.0, 1204.0, 713.0, 552.0, 357.0, 253.0, 169.0, 126.0, 68.0, 61.0, 48.0, 24.0, 17.0, 11.0, 10.0, 10.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5, -0.48503875732421875, -0.4700775146484375, -0.45511627197265625, -0.440155029296875, -0.42519378662109375, -0.4102325439453125, -0.39527130126953125, -0.38031005859375, -0.36534881591796875, -0.3503875732421875, -0.33542633056640625, -0.320465087890625, -0.30550384521484375, -0.2905426025390625, -0.27558135986328125, -0.2606201171875, -0.24565887451171875, -0.2306976318359375, -0.21573638916015625, -0.200775146484375, -0.18581390380859375, -0.1708526611328125, -0.15589141845703125, -0.14093017578125, -0.12596893310546875, -0.1110076904296875, -0.09604644775390625, -0.081085205078125, -0.06612396240234375, -0.0511627197265625, -0.03620147705078125, -0.021240234375, -0.00627899169921875, 0.0086822509765625, 0.02364349365234375, 0.038604736328125, 0.05356597900390625, 0.0685272216796875, 0.08348846435546875, 0.09844970703125, 0.11341094970703125, 0.1283721923828125, 0.14333343505859375, 0.158294677734375, 0.17325592041015625, 0.1882171630859375, 0.20317840576171875, 0.2181396484375, 0.23310089111328125, 0.2480621337890625, 0.26302337646484375, 0.277984619140625, 0.29294586181640625, 0.3079071044921875, 0.32286834716796875, 0.33782958984375, 0.35279083251953125, 0.3677520751953125, 0.38271331787109375, 0.397674560546875, 0.41263580322265625, 0.4275970458984375, 0.44255828857421875, 0.45751953125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 6.0, 13.0, 7.0, 19.0, 29.0, 37.0, 70.0, 85.0, 147.0, 130.0, 124.0, 95.0, 69.0, 41.0, 33.0, 21.0, 17.0, 21.0, 4.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1312255859375, -0.12743854522705078, -0.12365150451660156, -0.11986446380615234, -0.11607742309570312, -0.1122903823852539, -0.10850334167480469, -0.10471630096435547, -0.10092926025390625, -0.09714221954345703, -0.09335517883300781, -0.0895681381225586, -0.08578109741210938, -0.08199405670166016, -0.07820701599121094, -0.07441997528076172, -0.0706329345703125, -0.06684589385986328, -0.06305885314941406, -0.059271812438964844, -0.055484771728515625, -0.051697731018066406, -0.04791069030761719, -0.04412364959716797, -0.04033660888671875, -0.03654956817626953, -0.03276252746582031, -0.028975486755371094, -0.025188446044921875, -0.021401405334472656, -0.017614364624023438, -0.013827323913574219, -0.010040283203125, -0.006253242492675781, -0.0024662017822265625, 0.0013208389282226562, 0.005107879638671875, 0.008894920349121094, 0.012681961059570312, 0.01646900177001953, 0.02025604248046875, 0.02404308319091797, 0.027830123901367188, 0.031617164611816406, 0.035404205322265625, 0.039191246032714844, 0.04297828674316406, 0.04676532745361328, 0.0505523681640625, 0.05433940887451172, 0.05812644958496094, 0.061913490295410156, 0.06570053100585938, 0.0694875717163086, 0.07327461242675781, 0.07706165313720703, 0.08084869384765625, 0.08463573455810547, 0.08842277526855469, 0.0922098159790039, 0.09599685668945312, 0.09978389739990234, 0.10357093811035156, 0.10735797882080078, 0.11114501953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 15.0, 15.0, 26.0, 32.0, 17.0, 39.0, 36.0, 53.0, 71.0, 64.0, 69.0, 63.0, 46.0, 53.0, 58.0, 55.0, 50.0, 39.0, 35.0, 33.0, 21.0, 21.0, 11.0, 13.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8028035163879395, -2.7170827388763428, -2.631361961364746, -2.5456411838531494, -2.4599204063415527, -2.374199628829956, -2.2884788513183594, -2.202758312225342, -2.117037296295166, -2.0313165187835693, -1.9455957412719727, -1.859874963760376, -1.7741541862487793, -1.6884334087371826, -1.6027127504348755, -1.5169919729232788, -1.4312713146209717, -1.345550537109375, -1.2598297595977783, -1.1741089820861816, -1.088388204574585, -1.0026674270629883, -0.9169467687606812, -0.8312259912490845, -0.7455052137374878, -0.6597844362258911, -0.5740636587142944, -0.48834294080734253, -0.40262216329574585, -0.31690138578414917, -0.23118066787719727, -0.14545989036560059, -0.059739112854003906, 0.02598164975643158, 0.11170241236686707, 0.19742316007614136, 0.28314393758773804, 0.3688647150993347, 0.4545854330062866, 0.5403062105178833, 0.62602698802948, 0.7117477655410767, 0.7974685430526733, 0.8831892609596252, 0.9689100384712219, 1.0546307563781738, 1.1403515338897705, 1.2260723114013672, 1.3117930889129639, 1.3975138664245605, 1.4832346439361572, 1.568955421447754, 1.6546761989593506, 1.7403969764709473, 1.8261176347732544, 1.911838412284851, 1.9975591897964478, 2.083279848098755, 2.1690006256103516, 2.2547214031219482, 2.340442180633545, 2.4261629581451416, 2.5118837356567383, 2.597604513168335, 2.6833252906799316]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 14.0, 8.0, 13.0, 13.0, 15.0, 18.0, 21.0, 23.0, 23.0, 28.0, 29.0, 42.0, 27.0, 33.0, 39.0, 48.0, 47.0, 29.0, 47.0, 48.0, 28.0, 41.0, 49.0, 36.0, 32.0, 34.0, 17.0, 34.0, 21.0, 20.0, 21.0, 19.0, 10.0, 8.0, 9.0, 6.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.6686097383499146, -1.6190205812454224, -1.5694313049316406, -1.5198421478271484, -1.4702529907226562, -1.4206637144088745, -1.3710745573043823, -1.3214852809906006, -1.2718961238861084, -1.2223069667816162, -1.1727176904678345, -1.1231285333633423, -1.0735392570495605, -1.0239500999450684, -0.9743609428405762, -0.9247717261314392, -0.8751825094223022, -0.8255932927131653, -0.7760040760040283, -0.7264149188995361, -0.6768257021903992, -0.6272364854812622, -0.57764732837677, -0.5280581116676331, -0.4784688949584961, -0.42887967824935913, -0.37929049134254456, -0.32970130443573, -0.280112087726593, -0.23052288591861725, -0.18093368411064148, -0.1313444972038269, -0.08175528049468994, -0.03216607868671417, 0.017423123121261597, 0.06701232492923737, 0.11660152673721313, 0.1661907285451889, 0.21577993035316467, 0.26536911725997925, 0.3149583339691162, 0.3645475506782532, 0.41413673758506775, 0.4637259244918823, 0.5133151412010193, 0.5629043579101562, 0.6124935150146484, 0.6620827317237854, 0.7116719484329224, 0.7612611651420593, 0.8108503818511963, 0.8604395389556885, 0.9100287556648254, 0.9596179723739624, 1.0092071294784546, 1.0587964057922363, 1.1083855628967285, 1.1579747200012207, 1.2075639963150024, 1.2571531534194946, 1.3067424297332764, 1.3563315868377686, 1.4059207439422607, 1.455509901046753, 1.5050991773605347]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 16.0, 25.0, 37.0, 70.0, 107.0, 142.0, 226.0, 396.0, 625.0, 1031.0, 1565.0, 2541.0, 3896.0, 6096.0, 9060.0, 13846.0, 20351.0, 29148.0, 39452.0, 52889.0, 66788.0, 80266.0, 91485.0, 98529.0, 98322.0, 92410.0, 82139.0, 68646.0, 54180.0, 40819.0, 29955.0, 21244.0, 14587.0, 9797.0, 6427.0, 4045.0, 2712.0, 1763.0, 1078.0, 691.0, 433.0, 243.0, 172.0, 116.0, 77.0, 39.0, 25.0, 22.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0188446044921875, -0.984954833984375, -0.9510650634765625, -0.91717529296875, -0.8832855224609375, -0.849395751953125, -0.8155059814453125, -0.7816162109375, -0.7477264404296875, -0.713836669921875, -0.6799468994140625, -0.64605712890625, -0.6121673583984375, -0.578277587890625, -0.5443878173828125, -0.510498046875, -0.4766082763671875, -0.442718505859375, -0.4088287353515625, -0.37493896484375, -0.3410491943359375, -0.307159423828125, -0.2732696533203125, -0.2393798828125, -0.2054901123046875, -0.171600341796875, -0.1377105712890625, -0.10382080078125, -0.0699310302734375, -0.036041259765625, -0.0021514892578125, 0.03173828125, 0.0656280517578125, 0.099517822265625, 0.1334075927734375, 0.16729736328125, 0.2011871337890625, 0.235076904296875, 0.2689666748046875, 0.3028564453125, 0.3367462158203125, 0.370635986328125, 0.4045257568359375, 0.43841552734375, 0.4723052978515625, 0.506195068359375, 0.5400848388671875, 0.573974609375, 0.6078643798828125, 0.641754150390625, 0.6756439208984375, 0.70953369140625, 0.7434234619140625, 0.777313232421875, 0.8112030029296875, 0.8450927734375, 0.8789825439453125, 0.912872314453125, 0.9467620849609375, 0.98065185546875, 1.0145416259765625, 1.048431396484375, 1.0823211669921875, 1.1162109375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 8.0, 10.0, 10.0, 14.0, 20.0, 23.0, 19.0, 22.0, 31.0, 34.0, 27.0, 40.0, 48.0, 38.0, 50.0, 43.0, 44.0, 55.0, 43.0, 44.0, 37.0, 42.0, 32.0, 31.0, 28.0, 34.0, 24.0, 24.0, 14.0, 15.0, 19.0, 17.0, 9.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9345703125, -1.8772125244140625, -1.819854736328125, -1.7624969482421875, -1.70513916015625, -1.6477813720703125, -1.590423583984375, -1.5330657958984375, -1.4757080078125, -1.4183502197265625, -1.360992431640625, -1.3036346435546875, -1.24627685546875, -1.1889190673828125, -1.131561279296875, -1.0742034912109375, -1.016845703125, -0.9594879150390625, -0.902130126953125, -0.8447723388671875, -0.78741455078125, -0.7300567626953125, -0.672698974609375, -0.6153411865234375, -0.5579833984375, -0.5006256103515625, -0.443267822265625, -0.3859100341796875, -0.32855224609375, -0.2711944580078125, -0.213836669921875, -0.1564788818359375, -0.09912109375, -0.0417633056640625, 0.015594482421875, 0.0729522705078125, 0.13031005859375, 0.1876678466796875, 0.245025634765625, 0.3023834228515625, 0.3597412109375, 0.4170989990234375, 0.474456787109375, 0.5318145751953125, 0.58917236328125, 0.6465301513671875, 0.703887939453125, 0.7612457275390625, 0.818603515625, 0.8759613037109375, 0.933319091796875, 0.9906768798828125, 1.04803466796875, 1.1053924560546875, 1.162750244140625, 1.2201080322265625, 1.2774658203125, 1.3348236083984375, 1.392181396484375, 1.4495391845703125, 1.50689697265625, 1.5642547607421875, 1.621612548828125, 1.6789703369140625, 1.736328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 10.0, 26.0, 31.0, 64.0, 89.0, 140.0, 188.0, 310.0, 489.0, 766.0, 1134.0, 1903.0, 2869.0, 4493.0, 6856.0, 10342.0, 15388.0, 22428.0, 31941.0, 43266.0, 57743.0, 72693.0, 86664.0, 96855.0, 101445.0, 98873.0, 90408.0, 76969.0, 63033.0, 48504.0, 35833.0, 24916.0, 17667.0, 11958.0, 7671.0, 5072.0, 3315.0, 2268.0, 1367.0, 953.0, 630.0, 353.0, 239.0, 149.0, 86.0, 54.0, 32.0, 21.0, 20.0, 9.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0], "bins": [-1.1435546875, -1.108551025390625, -1.07354736328125, -1.038543701171875, -1.0035400390625, -0.968536376953125, -0.93353271484375, -0.898529052734375, -0.863525390625, -0.828521728515625, -0.79351806640625, -0.758514404296875, -0.7235107421875, -0.688507080078125, -0.65350341796875, -0.618499755859375, -0.58349609375, -0.548492431640625, -0.51348876953125, -0.478485107421875, -0.4434814453125, -0.408477783203125, -0.37347412109375, -0.338470458984375, -0.303466796875, -0.268463134765625, -0.23345947265625, -0.198455810546875, -0.1634521484375, -0.128448486328125, -0.09344482421875, -0.058441162109375, -0.0234375, 0.011566162109375, 0.04656982421875, 0.081573486328125, 0.1165771484375, 0.151580810546875, 0.18658447265625, 0.221588134765625, 0.256591796875, 0.291595458984375, 0.32659912109375, 0.361602783203125, 0.3966064453125, 0.431610107421875, 0.46661376953125, 0.501617431640625, 0.53662109375, 0.571624755859375, 0.60662841796875, 0.641632080078125, 0.6766357421875, 0.711639404296875, 0.74664306640625, 0.781646728515625, 0.816650390625, 0.851654052734375, 0.88665771484375, 0.921661376953125, 0.9566650390625, 0.991668701171875, 1.02667236328125, 1.061676025390625, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 9.0, 15.0, 15.0, 14.0, 25.0, 24.0, 29.0, 30.0, 20.0, 26.0, 40.0, 48.0, 33.0, 40.0, 36.0, 39.0, 45.0, 58.0, 36.0, 41.0, 45.0, 37.0, 49.0, 46.0, 31.0, 30.0, 19.0, 20.0, 28.0, 13.0, 13.0, 9.0, 8.0, 6.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1130523681640625, -1.076690673828125, -1.0403289794921875, -1.00396728515625, -0.9676055908203125, -0.931243896484375, -0.8948822021484375, -0.8585205078125, -0.8221588134765625, -0.785797119140625, -0.7494354248046875, -0.71307373046875, -0.6767120361328125, -0.640350341796875, -0.6039886474609375, -0.567626953125, -0.5312652587890625, -0.494903564453125, -0.4585418701171875, -0.42218017578125, -0.3858184814453125, -0.349456787109375, -0.3130950927734375, -0.2767333984375, -0.2403717041015625, -0.204010009765625, -0.1676483154296875, -0.13128662109375, -0.0949249267578125, -0.058563232421875, -0.0222015380859375, 0.01416015625, 0.0505218505859375, 0.086883544921875, 0.1232452392578125, 0.15960693359375, 0.1959686279296875, 0.232330322265625, 0.2686920166015625, 0.3050537109375, 0.3414154052734375, 0.377777099609375, 0.4141387939453125, 0.45050048828125, 0.4868621826171875, 0.523223876953125, 0.5595855712890625, 0.595947265625, 0.6323089599609375, 0.668670654296875, 0.7050323486328125, 0.74139404296875, 0.7777557373046875, 0.814117431640625, 0.8504791259765625, 0.8868408203125, 0.9232025146484375, 0.959564208984375, 0.9959259033203125, 1.03228759765625, 1.0686492919921875, 1.105010986328125, 1.1413726806640625, 1.177734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 9.0, 26.0, 14.0, 18.0, 29.0, 40.0, 55.0, 84.0, 155.0, 195.0, 365.0, 556.0, 951.0, 1644.0, 3090.0, 5693.0, 10394.0, 19512.0, 35968.0, 64015.0, 104060.0, 149177.0, 175861.0, 165834.0, 126548.0, 80438.0, 47252.0, 25694.0, 14114.0, 7355.0, 3912.0, 2306.0, 1224.0, 716.0, 423.0, 240.0, 181.0, 126.0, 75.0, 52.0, 35.0, 35.0, 16.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.91845703125, -0.8895111083984375, -0.860565185546875, -0.8316192626953125, -0.80267333984375, -0.7737274169921875, -0.744781494140625, -0.7158355712890625, -0.6868896484375, -0.6579437255859375, -0.628997802734375, -0.6000518798828125, -0.57110595703125, -0.5421600341796875, -0.513214111328125, -0.4842681884765625, -0.455322265625, -0.4263763427734375, -0.397430419921875, -0.3684844970703125, -0.33953857421875, -0.3105926513671875, -0.281646728515625, -0.2527008056640625, -0.2237548828125, -0.1948089599609375, -0.165863037109375, -0.1369171142578125, -0.10797119140625, -0.0790252685546875, -0.050079345703125, -0.0211334228515625, 0.0078125, 0.0367584228515625, 0.065704345703125, 0.0946502685546875, 0.12359619140625, 0.1525421142578125, 0.181488037109375, 0.2104339599609375, 0.2393798828125, 0.2683258056640625, 0.297271728515625, 0.3262176513671875, 0.35516357421875, 0.3841094970703125, 0.413055419921875, 0.4420013427734375, 0.470947265625, 0.4998931884765625, 0.528839111328125, 0.5577850341796875, 0.58673095703125, 0.6156768798828125, 0.644622802734375, 0.6735687255859375, 0.7025146484375, 0.7314605712890625, 0.760406494140625, 0.7893524169921875, 0.81829833984375, 0.8472442626953125, 0.876190185546875, 0.9051361083984375, 0.93408203125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 9.0, 4.0, 5.0, 3.0, 12.0, 16.0, 13.0, 24.0, 30.0, 39.0, 30.0, 42.0, 49.0, 52.0, 62.0, 66.0, 63.0, 75.0, 50.0, 67.0, 58.0, 51.0, 35.0, 39.0, 26.0, 20.0, 17.0, 15.0, 7.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.512901306152344e-05, -9.219907224178314e-05, -8.926913142204285e-05, -8.633919060230255e-05, -8.340924978256226e-05, -8.047930896282196e-05, -7.754936814308167e-05, -7.461942732334137e-05, -7.168948650360107e-05, -6.875954568386078e-05, -6.582960486412048e-05, -6.289966404438019e-05, -5.996972322463989e-05, -5.70397824048996e-05, -5.41098415851593e-05, -5.1179900765419006e-05, -4.824995994567871e-05, -4.5320019125938416e-05, -4.239007830619812e-05, -3.9460137486457825e-05, -3.653019666671753e-05, -3.3600255846977234e-05, -3.067031502723694e-05, -2.7740374207496643e-05, -2.4810433387756348e-05, -2.1880492568016052e-05, -1.8950551748275757e-05, -1.602061092853546e-05, -1.3090670108795166e-05, -1.016072928905487e-05, -7.230788469314575e-06, -4.30084764957428e-06, -1.3709068298339844e-06, 1.559033989906311e-06, 4.4889748096466064e-06, 7.418915629386902e-06, 1.0348856449127197e-05, 1.3278797268867493e-05, 1.6208738088607788e-05, 1.9138678908348083e-05, 2.206861972808838e-05, 2.4998560547828674e-05, 2.792850136756897e-05, 3.0858442187309265e-05, 3.378838300704956e-05, 3.6718323826789856e-05, 3.964826464653015e-05, 4.257820546627045e-05, 4.550814628601074e-05, 4.843808710575104e-05, 5.136802792549133e-05, 5.429796874523163e-05, 5.7227909564971924e-05, 6.015785038471222e-05, 6.308779120445251e-05, 6.601773202419281e-05, 6.89476728439331e-05, 7.18776136636734e-05, 7.48075544834137e-05, 7.773749530315399e-05, 8.066743612289429e-05, 8.359737694263458e-05, 8.652731776237488e-05, 8.945725858211517e-05, 9.238719940185547e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 5.0, 14.0, 18.0, 34.0, 54.0, 56.0, 102.0, 127.0, 160.0, 267.0, 471.0, 735.0, 1167.0, 2161.0, 3877.0, 7541.0, 14839.0, 29396.0, 56962.0, 103039.0, 159489.0, 196257.0, 182200.0, 129725.0, 76541.0, 40230.0, 20638.0, 10244.0, 5273.0, 2858.0, 1562.0, 887.0, 555.0, 350.0, 223.0, 157.0, 118.0, 71.0, 52.0, 35.0, 22.0, 15.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1484375, -1.1143951416015625, -1.080352783203125, -1.0463104248046875, -1.01226806640625, -0.9782257080078125, -0.944183349609375, -0.9101409912109375, -0.8760986328125, -0.8420562744140625, -0.808013916015625, -0.7739715576171875, -0.73992919921875, -0.7058868408203125, -0.671844482421875, -0.6378021240234375, -0.603759765625, -0.5697174072265625, -0.535675048828125, -0.5016326904296875, -0.46759033203125, -0.4335479736328125, -0.399505615234375, -0.3654632568359375, -0.3314208984375, -0.2973785400390625, -0.263336181640625, -0.2292938232421875, -0.19525146484375, -0.1612091064453125, -0.127166748046875, -0.0931243896484375, -0.05908203125, -0.0250396728515625, 0.009002685546875, 0.0430450439453125, 0.07708740234375, 0.1111297607421875, 0.145172119140625, 0.1792144775390625, 0.2132568359375, 0.2472991943359375, 0.281341552734375, 0.3153839111328125, 0.34942626953125, 0.3834686279296875, 0.417510986328125, 0.4515533447265625, 0.485595703125, 0.5196380615234375, 0.553680419921875, 0.5877227783203125, 0.62176513671875, 0.6558074951171875, 0.689849853515625, 0.7238922119140625, 0.7579345703125, 0.7919769287109375, 0.826019287109375, 0.8600616455078125, 0.89410400390625, 0.9281463623046875, 0.962188720703125, 0.9962310791015625, 1.0302734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 11.0, 14.0, 15.0, 23.0, 31.0, 32.0, 42.0, 44.0, 64.0, 61.0, 85.0, 73.0, 75.0, 72.0, 47.0, 50.0, 39.0, 57.0, 35.0, 25.0, 20.0, 19.0, 19.0, 9.0, 5.0, 10.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.344482421875, -0.3343162536621094, -0.32415008544921875, -0.3139839172363281, -0.3038177490234375, -0.2936515808105469, -0.28348541259765625, -0.2733192443847656, -0.263153076171875, -0.2529869079589844, -0.24282073974609375, -0.23265457153320312, -0.2224884033203125, -0.21232223510742188, -0.20215606689453125, -0.19198989868164062, -0.18182373046875, -0.17165756225585938, -0.16149139404296875, -0.15132522583007812, -0.1411590576171875, -0.13099288940429688, -0.12082672119140625, -0.11066055297851562, -0.100494384765625, -0.09032821655273438, -0.08016204833984375, -0.06999588012695312, -0.0598297119140625, -0.049663543701171875, -0.03949737548828125, -0.029331207275390625, -0.0191650390625, -0.008998870849609375, 0.00116729736328125, 0.011333465576171875, 0.0214996337890625, 0.031665802001953125, 0.04183197021484375, 0.051998138427734375, 0.062164306640625, 0.07233047485351562, 0.08249664306640625, 0.09266281127929688, 0.1028289794921875, 0.11299514770507812, 0.12316131591796875, 0.13332748413085938, 0.14349365234375, 0.15365982055664062, 0.16382598876953125, 0.17399215698242188, 0.1841583251953125, 0.19432449340820312, 0.20449066162109375, 0.21465682983398438, 0.224822998046875, 0.23498916625976562, 0.24515533447265625, 0.2553215026855469, 0.2654876708984375, 0.2756538391113281, 0.28582000732421875, 0.2959861755371094, 0.30615234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 9.0, 10.0, 6.0, 4.0, 27.0, 21.0, 21.0, 22.0, 32.0, 40.0, 40.0, 51.0, 54.0, 64.0, 65.0, 55.0, 51.0, 53.0, 50.0, 61.0, 34.0, 46.0, 37.0, 36.0, 23.0, 19.0, 19.0, 13.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6378824710845947, -2.55696964263916, -2.4760570526123047, -2.39514422416687, -2.3142313957214355, -2.233318567276001, -2.1524057388305664, -2.071493148803711, -1.9905803203582764, -1.9096674919128418, -1.8287547826766968, -1.7478420734405518, -1.6669292449951172, -1.5860164165496826, -1.5051037073135376, -1.4241909980773926, -1.343278169631958, -1.2623653411865234, -1.1814526319503784, -1.1005399227142334, -1.0196270942687988, -0.938714325428009, -0.8578015565872192, -0.7768887877464294, -0.6959760189056396, -0.6150632500648499, -0.5341504812240601, -0.45323771238327026, -0.37232494354248047, -0.2914121747016907, -0.21049940586090088, -0.12958663702011108, -0.04867410659790039, 0.032238662242889404, 0.1131514310836792, 0.194064199924469, 0.2749769687652588, 0.3558897376060486, 0.4368025064468384, 0.5177152752876282, 0.598628044128418, 0.6795408129692078, 0.7604535818099976, 0.8413663506507874, 0.9222791194915771, 1.0031919479370117, 1.0841046571731567, 1.1650173664093018, 1.2459301948547363, 1.326843023300171, 1.407755732536316, 1.488668441772461, 1.5695812702178955, 1.65049409866333, 1.731406807899475, 1.8123195171356201, 1.8932323455810547, 1.9741451740264893, 2.055058002471924, 2.1359705924987793, 2.216883420944214, 2.2977962493896484, 2.378708839416504, 2.4596216678619385, 2.540534496307373]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 3.0, 9.0, 12.0, 15.0, 6.0, 17.0, 16.0, 8.0, 24.0, 22.0, 28.0, 30.0, 26.0, 32.0, 40.0, 32.0, 43.0, 37.0, 35.0, 43.0, 46.0, 31.0, 46.0, 38.0, 22.0, 40.0, 34.0, 42.0, 29.0, 30.0, 29.0, 23.0, 25.0, 15.0, 12.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7800862789154053, -1.7279075384140015, -1.6757287979125977, -1.6235501766204834, -1.5713714361190796, -1.5191926956176758, -1.4670140743255615, -1.4148353338241577, -1.362656593322754, -1.31047785282135, -1.2582991123199463, -1.206120491027832, -1.1539417505264282, -1.1017630100250244, -1.0495843887329102, -0.9974056482315063, -0.9452269077301025, -0.8930481672286987, -0.8408694863319397, -0.7886908054351807, -0.7365120649337769, -0.684333324432373, -0.632154643535614, -0.579975962638855, -0.5277972221374512, -0.47561851143836975, -0.42343980073928833, -0.3712610900402069, -0.3190823793411255, -0.26690366864204407, -0.21472495794296265, -0.16254624724388123, -0.11036765575408936, -0.058188945055007935, -0.006010234355926514, 0.04616847634315491, 0.09834718704223633, 0.15052589774131775, 0.20270460844039917, 0.2548833191394806, 0.307062029838562, 0.35924074053764343, 0.41141945123672485, 0.4635981619358063, 0.5157768726348877, 0.5679556131362915, 0.6201342940330505, 0.6723129749298096, 0.7244917154312134, 0.7766704559326172, 0.8288491368293762, 0.8810278177261353, 0.9332065582275391, 0.9853852987289429, 1.0375640392303467, 1.089742660522461, 1.1419214010238647, 1.1941001415252686, 1.2462787628173828, 1.2984575033187866, 1.3506362438201904, 1.4028149843215942, 1.454993724822998, 1.5071723461151123, 1.5593510866165161]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 9.0, 18.0, 27.0, 35.0, 54.0, 83.0, 121.0, 187.0, 340.0, 522.0, 886.0, 1481.0, 2412.0, 4237.0, 7285.0, 12654.0, 21566.0, 36922.0, 62354.0, 104771.0, 166104.0, 252475.0, 357782.0, 462754.0, 534085.0, 543572.0, 487063.0, 385959.0, 277514.0, 184558.0, 116806.0, 70856.0, 41709.0, 24144.0, 13981.0, 7839.0, 4576.0, 2691.0, 1488.0, 938.0, 586.0, 295.0, 212.0, 128.0, 87.0, 43.0, 35.0, 13.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8046875, -1.7467193603515625, -1.688751220703125, -1.6307830810546875, -1.57281494140625, -1.5148468017578125, -1.456878662109375, -1.3989105224609375, -1.3409423828125, -1.2829742431640625, -1.225006103515625, -1.1670379638671875, -1.10906982421875, -1.0511016845703125, -0.993133544921875, -0.9351654052734375, -0.877197265625, -0.8192291259765625, -0.761260986328125, -0.7032928466796875, -0.64532470703125, -0.5873565673828125, -0.529388427734375, -0.4714202880859375, -0.4134521484375, -0.3554840087890625, -0.297515869140625, -0.2395477294921875, -0.18157958984375, -0.1236114501953125, -0.065643310546875, -0.0076751708984375, 0.05029296875, 0.1082611083984375, 0.166229248046875, 0.2241973876953125, 0.28216552734375, 0.3401336669921875, 0.398101806640625, 0.4560699462890625, 0.5140380859375, 0.5720062255859375, 0.629974365234375, 0.6879425048828125, 0.74591064453125, 0.8038787841796875, 0.861846923828125, 0.9198150634765625, 0.977783203125, 1.0357513427734375, 1.093719482421875, 1.1516876220703125, 1.20965576171875, 1.2676239013671875, 1.325592041015625, 1.3835601806640625, 1.4415283203125, 1.4994964599609375, 1.557464599609375, 1.6154327392578125, 1.67340087890625, 1.7313690185546875, 1.789337158203125, 1.8473052978515625, 1.9052734375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 3.0, 3.0, 5.0, 10.0, 11.0, 12.0, 12.0, 9.0, 17.0, 14.0, 12.0, 16.0, 20.0, 26.0, 27.0, 40.0, 33.0, 30.0, 39.0, 42.0, 31.0, 44.0, 48.0, 40.0, 35.0, 36.0, 47.0, 34.0, 32.0, 30.0, 34.0, 35.0, 29.0, 21.0, 26.0, 18.0, 10.0, 13.0, 10.0, 8.0, 5.0, 2.0, 4.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0], "bins": [-1.611328125, -1.5662841796875, -1.521240234375, -1.4761962890625, -1.43115234375, -1.3861083984375, -1.341064453125, -1.2960205078125, -1.2509765625, -1.2059326171875, -1.160888671875, -1.1158447265625, -1.07080078125, -1.0257568359375, -0.980712890625, -0.9356689453125, -0.890625, -0.8455810546875, -0.800537109375, -0.7554931640625, -0.71044921875, -0.6654052734375, -0.620361328125, -0.5753173828125, -0.5302734375, -0.4852294921875, -0.440185546875, -0.3951416015625, -0.35009765625, -0.3050537109375, -0.260009765625, -0.2149658203125, -0.169921875, -0.1248779296875, -0.079833984375, -0.0347900390625, 0.01025390625, 0.0552978515625, 0.100341796875, 0.1453857421875, 0.1904296875, 0.2354736328125, 0.280517578125, 0.3255615234375, 0.37060546875, 0.4156494140625, 0.460693359375, 0.5057373046875, 0.55078125, 0.5958251953125, 0.640869140625, 0.6859130859375, 0.73095703125, 0.7760009765625, 0.821044921875, 0.8660888671875, 0.9111328125, 0.9561767578125, 1.001220703125, 1.0462646484375, 1.09130859375, 1.1363525390625, 1.181396484375, 1.2264404296875, 1.271484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 8.0, 13.0, 15.0, 37.0, 48.0, 85.0, 127.0, 245.0, 460.0, 784.0, 1379.0, 2343.0, 4176.0, 7597.0, 13104.0, 22841.0, 39031.0, 65387.0, 106857.0, 166479.0, 247792.0, 340674.0, 431886.0, 497237.0, 511027.0, 474096.0, 395133.0, 300736.0, 211483.0, 138844.0, 87820.0, 53205.0, 31266.0, 18204.0, 10393.0, 5901.0, 3267.0, 1893.0, 1020.0, 568.0, 372.0, 186.0, 103.0, 66.0, 39.0, 19.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.890533447265625, -1.82598876953125, -1.761444091796875, -1.6968994140625, -1.632354736328125, -1.56781005859375, -1.503265380859375, -1.438720703125, -1.374176025390625, -1.30963134765625, -1.245086669921875, -1.1805419921875, -1.115997314453125, -1.05145263671875, -0.986907958984375, -0.92236328125, -0.857818603515625, -0.79327392578125, -0.728729248046875, -0.6641845703125, -0.599639892578125, -0.53509521484375, -0.470550537109375, -0.406005859375, -0.341461181640625, -0.27691650390625, -0.212371826171875, -0.1478271484375, -0.083282470703125, -0.01873779296875, 0.045806884765625, 0.1103515625, 0.174896240234375, 0.23944091796875, 0.303985595703125, 0.3685302734375, 0.433074951171875, 0.49761962890625, 0.562164306640625, 0.626708984375, 0.691253662109375, 0.75579833984375, 0.820343017578125, 0.8848876953125, 0.949432373046875, 1.01397705078125, 1.078521728515625, 1.14306640625, 1.207611083984375, 1.27215576171875, 1.336700439453125, 1.4012451171875, 1.465789794921875, 1.53033447265625, 1.594879150390625, 1.659423828125, 1.723968505859375, 1.78851318359375, 1.853057861328125, 1.9176025390625, 1.982147216796875, 2.04669189453125, 2.111236572265625, 2.17578125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 3.0, 5.0, 9.0, 10.0, 9.0, 12.0, 24.0, 16.0, 20.0, 33.0, 40.0, 54.0, 63.0, 68.0, 90.0, 95.0, 98.0, 117.0, 140.0, 147.0, 162.0, 183.0, 193.0, 188.0, 219.0, 235.0, 223.0, 207.0, 172.0, 175.0, 147.0, 146.0, 110.0, 122.0, 111.0, 78.0, 80.0, 60.0, 51.0, 39.0, 21.0, 25.0, 28.0, 10.0, 12.0, 10.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83203125, -0.8075332641601562, -0.7830352783203125, -0.7585372924804688, -0.734039306640625, -0.7095413208007812, -0.6850433349609375, -0.6605453491210938, -0.63604736328125, -0.6115493774414062, -0.5870513916015625, -0.5625534057617188, -0.538055419921875, -0.5135574340820312, -0.4890594482421875, -0.46456146240234375, -0.4400634765625, -0.41556549072265625, -0.3910675048828125, -0.36656951904296875, -0.342071533203125, -0.31757354736328125, -0.2930755615234375, -0.26857757568359375, -0.24407958984375, -0.21958160400390625, -0.1950836181640625, -0.17058563232421875, -0.146087646484375, -0.12158966064453125, -0.0970916748046875, -0.07259368896484375, -0.048095703125, -0.02359771728515625, 0.0009002685546875, 0.02539825439453125, 0.049896240234375, 0.07439422607421875, 0.0988922119140625, 0.12339019775390625, 0.14788818359375, 0.17238616943359375, 0.1968841552734375, 0.22138214111328125, 0.245880126953125, 0.27037811279296875, 0.2948760986328125, 0.31937408447265625, 0.3438720703125, 0.36837005615234375, 0.3928680419921875, 0.41736602783203125, 0.441864013671875, 0.46636199951171875, 0.4908599853515625, 0.5153579711914062, 0.53985595703125, 0.5643539428710938, 0.5888519287109375, 0.6133499145507812, 0.637847900390625, 0.6623458862304688, 0.6868438720703125, 0.7113418579101562, 0.73583984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 7.0, 7.0, 4.0, 13.0, 13.0, 21.0, 14.0, 28.0, 33.0, 40.0, 54.0, 44.0, 39.0, 58.0, 60.0, 70.0, 74.0, 50.0, 57.0, 55.0, 43.0, 45.0, 42.0, 34.0, 22.0, 22.0, 12.0, 17.0, 6.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2938148975372314, -3.1929543018341064, -3.0920934677124023, -2.9912328720092773, -2.8903722763061523, -2.7895114421844482, -2.6886508464813232, -2.587790012359619, -2.486929416656494, -2.386068820953369, -2.285207986831665, -2.18434739112854, -2.083486557006836, -1.982625961303711, -1.881765365600586, -1.7809046506881714, -1.6800439357757568, -1.5791832208633423, -1.4783225059509277, -1.3774619102478027, -1.2766011953353882, -1.1757404804229736, -1.0748798847198486, -0.9740191698074341, -0.8731584548950195, -0.772297739982605, -0.6714370846748352, -0.5705764293670654, -0.4697157144546509, -0.36885499954223633, -0.26799434423446655, -0.16713368892669678, -0.06627321243286133, 0.034587472677230835, 0.135448157787323, 0.23630884289741516, 0.3371695280075073, 0.4380302429199219, 0.5388908982276917, 0.6397515535354614, 0.740612268447876, 0.8414729833602905, 0.9423336386680603, 1.04319429397583, 1.1440550088882446, 1.2449157238006592, 1.3457763195037842, 1.4466370344161987, 1.5474977493286133, 1.6483584642410278, 1.7492191791534424, 1.8500797748565674, 1.950940489768982, 2.0518012046813965, 2.1526618003845215, 2.2535223960876465, 2.3543832302093506, 2.4552438259124756, 2.5561046600341797, 2.6569652557373047, 2.7578258514404297, 2.858686685562134, 2.959547281265259, 3.060408115386963, 3.161268711090088]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 12.0, 4.0, 6.0, 9.0, 13.0, 13.0, 23.0, 17.0, 14.0, 13.0, 28.0, 24.0, 20.0, 27.0, 28.0, 34.0, 43.0, 36.0, 44.0, 32.0, 45.0, 36.0, 46.0, 39.0, 36.0, 37.0, 32.0, 23.0, 38.0, 35.0, 33.0, 29.0, 21.0, 22.0, 11.0, 15.0, 17.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8168824911117554, -1.7598389387130737, -1.7027955055236816, -1.645751953125, -1.5887084007263184, -1.5316649675369263, -1.4746214151382446, -1.4175779819488525, -1.360534429550171, -1.3034908771514893, -1.2464474439620972, -1.1894038915634155, -1.1323603391647339, -1.0753169059753418, -1.0182733535766602, -0.9612298607826233, -0.9041863083839417, -0.8471428155899048, -0.7900992631912231, -0.7330557703971863, -0.6760122776031494, -0.6189687252044678, -0.5619252324104309, -0.504881739616394, -0.4478382170200348, -0.39079469442367554, -0.33375120162963867, -0.2767076790332794, -0.21966417133808136, -0.1626206636428833, -0.10557714104652405, -0.04853364825248718, 0.00850987434387207, 0.06555338203907013, 0.12259689718484879, 0.17964041233062744, 0.2366839200258255, 0.29372742772102356, 0.3507709503173828, 0.4078144431114197, 0.46485796570777893, 0.5219014883041382, 0.578944981098175, 0.6359884738922119, 0.6930320262908936, 0.7500755190849304, 0.8071190118789673, 0.8641625642776489, 0.9212060570716858, 0.9782495498657227, 1.0352931022644043, 1.092336654663086, 1.149380087852478, 1.2064236402511597, 1.2634670734405518, 1.3205106258392334, 1.377554178237915, 1.4345977306365967, 1.4916411638259888, 1.5486847162246704, 1.605728268623352, 1.6627717018127441, 1.7198152542114258, 1.7768588066101074, 1.8339022397994995]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 12.0, 23.0, 24.0, 46.0, 58.0, 106.0, 145.0, 224.0, 279.0, 439.0, 660.0, 1019.0, 1419.0, 2146.0, 3322.0, 4931.0, 7488.0, 11555.0, 17962.0, 28246.0, 42907.0, 65004.0, 94734.0, 128331.0, 149902.0, 141480.0, 112387.0, 80042.0, 53264.0, 34856.0, 22861.0, 14528.0, 9563.0, 6222.0, 4150.0, 2714.0, 1820.0, 1166.0, 818.0, 557.0, 362.0, 244.0, 181.0, 119.0, 71.0, 55.0, 47.0, 21.0, 14.0, 8.0, 7.0, 3.0, 1.0, 5.0], "bins": [-0.473388671875, -0.45977020263671875, -0.4461517333984375, -0.43253326416015625, -0.418914794921875, -0.40529632568359375, -0.3916778564453125, -0.37805938720703125, -0.36444091796875, -0.35082244873046875, -0.3372039794921875, -0.32358551025390625, -0.309967041015625, -0.29634857177734375, -0.2827301025390625, -0.26911163330078125, -0.2554931640625, -0.24187469482421875, -0.2282562255859375, -0.21463775634765625, -0.201019287109375, -0.18740081787109375, -0.1737823486328125, -0.16016387939453125, -0.14654541015625, -0.13292694091796875, -0.1193084716796875, -0.10569000244140625, -0.092071533203125, -0.07845306396484375, -0.0648345947265625, -0.05121612548828125, -0.03759765625, -0.02397918701171875, -0.0103607177734375, 0.00325775146484375, 0.016876220703125, 0.03049468994140625, 0.0441131591796875, 0.05773162841796875, 0.07135009765625, 0.08496856689453125, 0.0985870361328125, 0.11220550537109375, 0.125823974609375, 0.13944244384765625, 0.1530609130859375, 0.16667938232421875, 0.1802978515625, 0.19391632080078125, 0.2075347900390625, 0.22115325927734375, 0.234771728515625, 0.24839019775390625, 0.2620086669921875, 0.27562713623046875, 0.28924560546875, 0.30286407470703125, 0.3164825439453125, 0.33010101318359375, 0.343719482421875, 0.35733795166015625, 0.3709564208984375, 0.38457489013671875, 0.398193359375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 14.0, 13.0, 19.0, 17.0, 22.0, 18.0, 16.0, 21.0, 19.0, 27.0, 19.0, 29.0, 33.0, 41.0, 32.0, 43.0, 44.0, 52.0, 45.0, 28.0, 50.0, 42.0, 41.0, 26.0, 40.0, 28.0, 34.0, 30.0, 26.0, 19.0, 12.0, 10.0, 18.0, 14.0, 2.0, 7.0, 4.0, 5.0, 8.0, 6.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9150390625, -1.8527374267578125, -1.790435791015625, -1.7281341552734375, -1.66583251953125, -1.6035308837890625, -1.541229248046875, -1.4789276123046875, -1.4166259765625, -1.3543243408203125, -1.292022705078125, -1.2297210693359375, -1.16741943359375, -1.1051177978515625, -1.042816162109375, -0.9805145263671875, -0.918212890625, -0.8559112548828125, -0.793609619140625, -0.7313079833984375, -0.66900634765625, -0.6067047119140625, -0.544403076171875, -0.4821014404296875, -0.4197998046875, -0.3574981689453125, -0.295196533203125, -0.2328948974609375, -0.17059326171875, -0.1082916259765625, -0.045989990234375, 0.0163116455078125, 0.07861328125, 0.1409149169921875, 0.203216552734375, 0.2655181884765625, 0.32781982421875, 0.3901214599609375, 0.452423095703125, 0.5147247314453125, 0.5770263671875, 0.6393280029296875, 0.701629638671875, 0.7639312744140625, 0.82623291015625, 0.8885345458984375, 0.950836181640625, 1.0131378173828125, 1.075439453125, 1.1377410888671875, 1.200042724609375, 1.2623443603515625, 1.32464599609375, 1.3869476318359375, 1.449249267578125, 1.5115509033203125, 1.5738525390625, 1.6361541748046875, 1.698455810546875, 1.7607574462890625, 1.82305908203125, 1.8853607177734375, 1.947662353515625, 2.0099639892578125, 2.072265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 10.0, 19.0, 26.0, 35.0, 45.0, 76.0, 117.0, 174.0, 238.0, 412.0, 608.0, 1016.0, 1660.0, 2632.0, 4724.0, 8713.0, 16049.0, 30628.0, 59733.0, 114975.0, 198380.0, 239234.0, 171293.0, 93696.0, 48393.0, 25064.0, 13174.0, 7166.0, 3990.0, 2397.0, 1403.0, 875.0, 563.0, 345.0, 227.0, 139.0, 105.0, 60.0, 52.0, 26.0, 26.0, 13.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0], "bins": [-0.669921875, -0.6492080688476562, -0.6284942626953125, -0.6077804565429688, -0.587066650390625, -0.5663528442382812, -0.5456390380859375, -0.5249252319335938, -0.50421142578125, -0.48349761962890625, -0.4627838134765625, -0.44207000732421875, -0.421356201171875, -0.40064239501953125, -0.3799285888671875, -0.35921478271484375, -0.3385009765625, -0.31778717041015625, -0.2970733642578125, -0.27635955810546875, -0.255645751953125, -0.23493194580078125, -0.2142181396484375, -0.19350433349609375, -0.17279052734375, -0.15207672119140625, -0.1313629150390625, -0.11064910888671875, -0.089935302734375, -0.06922149658203125, -0.0485076904296875, -0.02779388427734375, -0.007080078125, 0.01363372802734375, 0.0343475341796875, 0.05506134033203125, 0.075775146484375, 0.09648895263671875, 0.1172027587890625, 0.13791656494140625, 0.15863037109375, 0.17934417724609375, 0.2000579833984375, 0.22077178955078125, 0.241485595703125, 0.26219940185546875, 0.2829132080078125, 0.30362701416015625, 0.3243408203125, 0.34505462646484375, 0.3657684326171875, 0.38648223876953125, 0.407196044921875, 0.42790985107421875, 0.4486236572265625, 0.46933746337890625, 0.49005126953125, 0.5107650756835938, 0.5314788818359375, 0.5521926879882812, 0.572906494140625, 0.5936203002929688, 0.6143341064453125, 0.6350479125976562, 0.65576171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 10.0, 9.0, 7.0, 11.0, 9.0, 15.0, 14.0, 27.0, 26.0, 25.0, 31.0, 31.0, 43.0, 32.0, 32.0, 38.0, 51.0, 60.0, 45.0, 40.0, 37.0, 34.0, 56.0, 36.0, 31.0, 28.0, 50.0, 21.0, 33.0, 23.0, 14.0, 12.0, 13.0, 18.0, 12.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1943359375, -1.1537017822265625, -1.113067626953125, -1.0724334716796875, -1.03179931640625, -0.9911651611328125, -0.950531005859375, -0.9098968505859375, -0.8692626953125, -0.8286285400390625, -0.787994384765625, -0.7473602294921875, -0.70672607421875, -0.6660919189453125, -0.625457763671875, -0.5848236083984375, -0.544189453125, -0.5035552978515625, -0.462921142578125, -0.4222869873046875, -0.38165283203125, -0.3410186767578125, -0.300384521484375, -0.2597503662109375, -0.2191162109375, -0.1784820556640625, -0.137847900390625, -0.0972137451171875, -0.05657958984375, -0.0159454345703125, 0.024688720703125, 0.0653228759765625, 0.10595703125, 0.1465911865234375, 0.187225341796875, 0.2278594970703125, 0.26849365234375, 0.3091278076171875, 0.349761962890625, 0.3903961181640625, 0.4310302734375, 0.4716644287109375, 0.512298583984375, 0.5529327392578125, 0.59356689453125, 0.6342010498046875, 0.674835205078125, 0.7154693603515625, 0.756103515625, 0.7967376708984375, 0.837371826171875, 0.8780059814453125, 0.91864013671875, 0.9592742919921875, 0.999908447265625, 1.0405426025390625, 1.0811767578125, 1.1218109130859375, 1.162445068359375, 1.2030792236328125, 1.24371337890625, 1.2843475341796875, 1.324981689453125, 1.3656158447265625, 1.40625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 14.0, 7.0, 28.0, 31.0, 29.0, 44.0, 53.0, 65.0, 86.0, 141.0, 183.0, 244.0, 351.0, 505.0, 727.0, 1222.0, 1885.0, 3160.0, 5712.0, 11583.0, 27475.0, 88541.0, 393989.0, 375300.0, 84834.0, 26569.0, 11473.0, 5771.0, 3045.0, 1827.0, 1134.0, 736.0, 498.0, 344.0, 238.0, 162.0, 130.0, 118.0, 88.0, 63.0, 39.0, 30.0, 18.0, 11.0, 9.0, 7.0, 6.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4084968566894531, -0.39389801025390625, -0.3792991638183594, -0.3647003173828125, -0.3501014709472656, -0.33550262451171875, -0.3209037780761719, -0.306304931640625, -0.2917060852050781, -0.27710723876953125, -0.2625083923339844, -0.2479095458984375, -0.23331069946289062, -0.21871185302734375, -0.20411300659179688, -0.18951416015625, -0.17491531372070312, -0.16031646728515625, -0.14571762084960938, -0.1311187744140625, -0.11651992797851562, -0.10192108154296875, -0.08732223510742188, -0.072723388671875, -0.058124542236328125, -0.04352569580078125, -0.028926849365234375, -0.0143280029296875, 0.000270843505859375, 0.01486968994140625, 0.029468536376953125, 0.0440673828125, 0.058666229248046875, 0.07326507568359375, 0.08786392211914062, 0.1024627685546875, 0.11706161499023438, 0.13166046142578125, 0.14625930786132812, 0.160858154296875, 0.17545700073242188, 0.19005584716796875, 0.20465469360351562, 0.2192535400390625, 0.23385238647460938, 0.24845123291015625, 0.2630500793457031, 0.27764892578125, 0.2922477722167969, 0.30684661865234375, 0.3214454650878906, 0.3360443115234375, 0.3506431579589844, 0.36524200439453125, 0.3798408508300781, 0.394439697265625, 0.4090385437011719, 0.42363739013671875, 0.4382362365722656, 0.4528350830078125, 0.4674339294433594, 0.48203277587890625, 0.4966316223144531, 0.51123046875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 6.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 4.0, 5.0, 7.0, 9.0, 12.0, 16.0, 12.0, 27.0, 15.0, 44.0, 45.0, 35.0, 40.0, 53.0, 57.0, 57.0, 62.0, 59.0, 51.0, 50.0, 36.0, 44.0, 36.0, 37.0, 22.0, 25.0, 23.0, 13.0, 20.0, 9.0, 7.0, 5.0, 9.0, 16.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.328345388174057e-05, -1.2798234820365906e-05, -1.2313015758991241e-05, -1.1827796697616577e-05, -1.1342577636241913e-05, -1.0857358574867249e-05, -1.0372139513492584e-05, -9.88692045211792e-06, -9.401701390743256e-06, -8.916482329368591e-06, -8.431263267993927e-06, -7.946044206619263e-06, -7.460825145244598e-06, -6.975606083869934e-06, -6.49038702249527e-06, -6.0051679611206055e-06, -5.519948899745941e-06, -5.034729838371277e-06, -4.5495107769966125e-06, -4.064291715621948e-06, -3.579072654247284e-06, -3.0938535928726196e-06, -2.6086345314979553e-06, -2.123415470123291e-06, -1.6381964087486267e-06, -1.1529773473739624e-06, -6.677582859992981e-07, -1.825392246246338e-07, 3.026798367500305e-07, 7.878988981246948e-07, 1.2731179594993591e-06, 1.7583370208740234e-06, 2.2435560822486877e-06, 2.728775143623352e-06, 3.2139942049980164e-06, 3.6992132663726807e-06, 4.184432327747345e-06, 4.669651389122009e-06, 5.154870450496674e-06, 5.640089511871338e-06, 6.125308573246002e-06, 6.6105276346206665e-06, 7.095746695995331e-06, 7.580965757369995e-06, 8.06618481874466e-06, 8.551403880119324e-06, 9.036622941493988e-06, 9.521842002868652e-06, 1.0007061064243317e-05, 1.0492280125617981e-05, 1.0977499186992645e-05, 1.146271824836731e-05, 1.1947937309741974e-05, 1.2433156371116638e-05, 1.2918375432491302e-05, 1.3403594493865967e-05, 1.3888813555240631e-05, 1.4374032616615295e-05, 1.485925167798996e-05, 1.5344470739364624e-05, 1.582968980073929e-05, 1.6314908862113953e-05, 1.6800127923488617e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 19.0, 18.0, 40.0, 34.0, 47.0, 96.0, 113.0, 158.0, 223.0, 314.0, 446.0, 686.0, 974.0, 1476.0, 2254.0, 3524.0, 5962.0, 10912.0, 23249.0, 58464.0, 172586.0, 384852.0, 238732.0, 80543.0, 30208.0, 13690.0, 7018.0, 4096.0, 2522.0, 1621.0, 1121.0, 772.0, 552.0, 369.0, 269.0, 181.0, 131.0, 95.0, 59.0, 37.0, 24.0, 15.0, 19.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5106124877929688, -0.4933929443359375, -0.47617340087890625, -0.458953857421875, -0.44173431396484375, -0.4245147705078125, -0.40729522705078125, -0.39007568359375, -0.37285614013671875, -0.3556365966796875, -0.33841705322265625, -0.321197509765625, -0.30397796630859375, -0.2867584228515625, -0.26953887939453125, -0.2523193359375, -0.23509979248046875, -0.2178802490234375, -0.20066070556640625, -0.183441162109375, -0.16622161865234375, -0.1490020751953125, -0.13178253173828125, -0.11456298828125, -0.09734344482421875, -0.0801239013671875, -0.06290435791015625, -0.045684814453125, -0.02846527099609375, -0.0112457275390625, 0.00597381591796875, 0.023193359375, 0.04041290283203125, 0.0576324462890625, 0.07485198974609375, 0.092071533203125, 0.10929107666015625, 0.1265106201171875, 0.14373016357421875, 0.16094970703125, 0.17816925048828125, 0.1953887939453125, 0.21260833740234375, 0.229827880859375, 0.24704742431640625, 0.2642669677734375, 0.28148651123046875, 0.2987060546875, 0.31592559814453125, 0.3331451416015625, 0.35036468505859375, 0.367584228515625, 0.38480377197265625, 0.4020233154296875, 0.41924285888671875, 0.43646240234375, 0.45368194580078125, 0.4709014892578125, 0.48812103271484375, 0.505340576171875, 0.5225601196289062, 0.5397796630859375, 0.5569992065429688, 0.57421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 10.0, 16.0, 11.0, 19.0, 23.0, 31.0, 40.0, 44.0, 71.0, 73.0, 73.0, 90.0, 70.0, 86.0, 59.0, 45.0, 40.0, 23.0, 27.0, 18.0, 22.0, 8.0, 9.0, 9.0, 14.0, 3.0, 3.0, 4.0, 4.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.11407470703125, -0.11100006103515625, -0.1079254150390625, -0.10485076904296875, -0.101776123046875, -0.09870147705078125, -0.0956268310546875, -0.09255218505859375, -0.0894775390625, -0.08640289306640625, -0.0833282470703125, -0.08025360107421875, -0.077178955078125, -0.07410430908203125, -0.0710296630859375, -0.06795501708984375, -0.06488037109375, -0.06180572509765625, -0.0587310791015625, -0.05565643310546875, -0.052581787109375, -0.04950714111328125, -0.0464324951171875, -0.04335784912109375, -0.040283203125, -0.03720855712890625, -0.0341339111328125, -0.03105926513671875, -0.027984619140625, -0.02490997314453125, -0.0218353271484375, -0.01876068115234375, -0.01568603515625, -0.01261138916015625, -0.0095367431640625, -0.00646209716796875, -0.003387451171875, -0.00031280517578125, 0.0027618408203125, 0.00583648681640625, 0.0089111328125, 0.01198577880859375, 0.0150604248046875, 0.01813507080078125, 0.021209716796875, 0.02428436279296875, 0.0273590087890625, 0.03043365478515625, 0.03350830078125, 0.03658294677734375, 0.0396575927734375, 0.04273223876953125, 0.045806884765625, 0.04888153076171875, 0.0519561767578125, 0.05503082275390625, 0.05810546875, 0.06118011474609375, 0.0642547607421875, 0.06732940673828125, 0.070404052734375, 0.07347869873046875, 0.0765533447265625, 0.07962799072265625, 0.08270263671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 6.0, 5.0, 6.0, 8.0, 10.0, 16.0, 17.0, 15.0, 29.0, 36.0, 37.0, 45.0, 46.0, 47.0, 52.0, 63.0, 68.0, 78.0, 50.0, 57.0, 51.0, 43.0, 48.0, 36.0, 35.0, 28.0, 20.0, 18.0, 10.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2994351387023926, -3.1985461711883545, -3.0976574420928955, -2.9967684745788574, -2.8958797454833984, -2.7949907779693604, -2.6941020488739014, -2.5932130813598633, -2.4923243522644043, -2.391435384750366, -2.2905466556549072, -2.189657688140869, -2.08876895904541, -1.987879991531372, -1.886991262435913, -1.786102294921875, -1.6852134466171265, -1.584324598312378, -1.4834357500076294, -1.3825469017028809, -1.2816580533981323, -1.1807692050933838, -1.0798802375793457, -0.9789914488792419, -0.8781026005744934, -0.7772137522697449, -0.6763249039649963, -0.575435996055603, -0.4745471775531769, -0.37365829944610596, -0.2727694511413574, -0.1718806028366089, -0.07099175453186035, 0.02989710122346878, 0.1307859569787979, 0.23167482018470764, 0.3325636684894562, 0.4334525465965271, 0.5343413949012756, 0.6352302432060242, 0.7361190915107727, 0.8370079398155212, 0.9378967881202698, 1.038785696029663, 1.1396745443344116, 1.2405633926391602, 1.3414522409439087, 1.4423410892486572, 1.5432299375534058, 1.6441187858581543, 1.7450076341629028, 1.8458964824676514, 1.9467853307724, 2.0476741790771484, 2.1485631465911865, 2.2494518756866455, 2.3503408432006836, 2.4512298107147217, 2.5521185398101807, 2.6530075073242188, 2.7538962364196777, 2.854785203933716, 2.955673933029175, 3.056562900543213, 3.157451629638672]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 4.0, 7.0, 10.0, 10.0, 18.0, 18.0, 21.0, 13.0, 16.0, 35.0, 17.0, 23.0, 29.0, 31.0, 37.0, 37.0, 41.0, 34.0, 41.0, 45.0, 40.0, 40.0, 39.0, 34.0, 42.0, 29.0, 26.0, 39.0, 36.0, 27.0, 24.0, 20.0, 17.0, 16.0, 15.0, 15.0, 6.0, 6.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7987110614776611, -1.7415999174118042, -1.6844886541366577, -1.6273775100708008, -1.5702662467956543, -1.5131551027297974, -1.4560439586639404, -1.398932695388794, -1.3418214321136475, -1.2847102880477905, -1.227599024772644, -1.170487880706787, -1.1133766174316406, -1.0562654733657837, -0.999154269695282, -0.9420430660247803, -0.8849319219589233, -0.8278207182884216, -0.7707095146179199, -0.713598370552063, -0.6564871072769165, -0.5993759632110596, -0.5422647595405579, -0.48515355587005615, -0.42804235219955444, -0.37093114852905273, -0.313819944858551, -0.2567087709903717, -0.19959756731987, -0.1424863636493683, -0.08537518978118896, -0.028263986110687256, 0.028847098350524902, 0.08595829457044601, 0.14306949079036713, 0.20018067955970764, 0.25729188323020935, 0.31440308690071106, 0.3715142607688904, 0.4286254644393921, 0.4857366681098938, 0.5428478717803955, 0.5999590754508972, 0.6570702791213989, 0.7141814231872559, 0.7712926864624023, 0.8284038305282593, 0.885515034198761, 0.9426262378692627, 0.9997374415397644, 1.0568486452102661, 1.113959789276123, 1.1710710525512695, 1.2281821966171265, 1.2852933406829834, 1.3424046039581299, 1.3995158672332764, 1.4566270112991333, 1.5137382745742798, 1.5708494186401367, 1.6279606819152832, 1.6850718259811401, 1.742182970046997, 1.7992942333221436, 1.8564053773880005]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 12.0, 11.0, 15.0, 33.0, 44.0, 73.0, 122.0, 205.0, 321.0, 533.0, 811.0, 1353.0, 2180.0, 3316.0, 5119.0, 7668.0, 11589.0, 16934.0, 24338.0, 34025.0, 45224.0, 58397.0, 72075.0, 83815.0, 92661.0, 96235.0, 94346.0, 87113.0, 76141.0, 62501.0, 49458.0, 37534.0, 27068.0, 18914.0, 13310.0, 8831.0, 5919.0, 3782.0, 2428.0, 1487.0, 963.0, 614.0, 393.0, 233.0, 172.0, 97.0, 64.0, 32.0, 26.0, 10.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0713043212890625, -1.035186767578125, -0.9990692138671875, -0.96295166015625, -0.9268341064453125, -0.890716552734375, -0.8545989990234375, -0.8184814453125, -0.7823638916015625, -0.746246337890625, -0.7101287841796875, -0.67401123046875, -0.6378936767578125, -0.601776123046875, -0.5656585693359375, -0.529541015625, -0.4934234619140625, -0.457305908203125, -0.4211883544921875, -0.38507080078125, -0.3489532470703125, -0.312835693359375, -0.2767181396484375, -0.2406005859375, -0.2044830322265625, -0.168365478515625, -0.1322479248046875, -0.09613037109375, -0.0600128173828125, -0.023895263671875, 0.0122222900390625, 0.04833984375, 0.0844573974609375, 0.120574951171875, 0.1566925048828125, 0.19281005859375, 0.2289276123046875, 0.265045166015625, 0.3011627197265625, 0.3372802734375, 0.3733978271484375, 0.409515380859375, 0.4456329345703125, 0.48175048828125, 0.5178680419921875, 0.553985595703125, 0.5901031494140625, 0.626220703125, 0.6623382568359375, 0.698455810546875, 0.7345733642578125, 0.77069091796875, 0.8068084716796875, 0.842926025390625, 0.8790435791015625, 0.9151611328125, 0.9512786865234375, 0.987396240234375, 1.0235137939453125, 1.05963134765625, 1.0957489013671875, 1.131866455078125, 1.1679840087890625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 4.0, 7.0, 15.0, 20.0, 14.0, 21.0, 19.0, 14.0, 30.0, 24.0, 32.0, 19.0, 38.0, 39.0, 38.0, 41.0, 38.0, 45.0, 49.0, 42.0, 47.0, 36.0, 43.0, 34.0, 31.0, 40.0, 32.0, 22.0, 19.0, 23.0, 15.0, 12.0, 19.0, 17.0, 10.0, 11.0, 5.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7926788330078125, -1.728912353515625, -1.6651458740234375, -1.60137939453125, -1.5376129150390625, -1.473846435546875, -1.4100799560546875, -1.3463134765625, -1.2825469970703125, -1.218780517578125, -1.1550140380859375, -1.09124755859375, -1.0274810791015625, -0.963714599609375, -0.8999481201171875, -0.836181640625, -0.7724151611328125, -0.708648681640625, -0.6448822021484375, -0.58111572265625, -0.5173492431640625, -0.453582763671875, -0.3898162841796875, -0.3260498046875, -0.2622833251953125, -0.198516845703125, -0.1347503662109375, -0.07098388671875, -0.0072174072265625, 0.056549072265625, 0.1203155517578125, 0.18408203125, 0.2478485107421875, 0.311614990234375, 0.3753814697265625, 0.43914794921875, 0.5029144287109375, 0.566680908203125, 0.6304473876953125, 0.6942138671875, 0.7579803466796875, 0.821746826171875, 0.8855133056640625, 0.94927978515625, 1.0130462646484375, 1.076812744140625, 1.1405792236328125, 1.204345703125, 1.2681121826171875, 1.331878662109375, 1.3956451416015625, 1.45941162109375, 1.5231781005859375, 1.586944580078125, 1.6507110595703125, 1.7144775390625, 1.7782440185546875, 1.842010498046875, 1.9057769775390625, 1.96954345703125, 2.0333099365234375, 2.097076416015625, 2.1608428955078125, 2.224609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 15.0, 21.0, 33.0, 60.0, 73.0, 135.0, 171.0, 295.0, 467.0, 771.0, 1237.0, 1877.0, 2916.0, 4384.0, 6577.0, 10310.0, 14945.0, 21212.0, 30042.0, 40877.0, 53925.0, 67250.0, 80181.0, 90402.0, 95305.0, 95868.0, 90125.0, 79853.0, 67319.0, 53853.0, 41463.0, 30134.0, 21714.0, 15144.0, 10312.0, 6724.0, 4518.0, 2883.0, 1893.0, 1218.0, 728.0, 460.0, 314.0, 203.0, 144.0, 80.0, 35.0, 37.0, 29.0, 10.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0953369140625, -1.058837890625, -1.0223388671875, -0.98583984375, -0.9493408203125, -0.912841796875, -0.8763427734375, -0.83984375, -0.8033447265625, -0.766845703125, -0.7303466796875, -0.69384765625, -0.6573486328125, -0.620849609375, -0.5843505859375, -0.5478515625, -0.5113525390625, -0.474853515625, -0.4383544921875, -0.40185546875, -0.3653564453125, -0.328857421875, -0.2923583984375, -0.255859375, -0.2193603515625, -0.182861328125, -0.1463623046875, -0.10986328125, -0.0733642578125, -0.036865234375, -0.0003662109375, 0.0361328125, 0.0726318359375, 0.109130859375, 0.1456298828125, 0.18212890625, 0.2186279296875, 0.255126953125, 0.2916259765625, 0.328125, 0.3646240234375, 0.401123046875, 0.4376220703125, 0.47412109375, 0.5106201171875, 0.547119140625, 0.5836181640625, 0.6201171875, 0.6566162109375, 0.693115234375, 0.7296142578125, 0.76611328125, 0.8026123046875, 0.839111328125, 0.8756103515625, 0.912109375, 0.9486083984375, 0.985107421875, 1.0216064453125, 1.05810546875, 1.0946044921875, 1.131103515625, 1.1676025390625, 1.2041015625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 14.0, 14.0, 17.0, 17.0, 20.0, 23.0, 16.0, 32.0, 27.0, 33.0, 44.0, 26.0, 59.0, 38.0, 42.0, 43.0, 43.0, 44.0, 42.0, 38.0, 44.0, 40.0, 40.0, 26.0, 27.0, 21.0, 34.0, 18.0, 16.0, 16.0, 15.0, 9.0, 9.0, 5.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3603515625, -1.3197479248046875, -1.279144287109375, -1.2385406494140625, -1.19793701171875, -1.1573333740234375, -1.116729736328125, -1.0761260986328125, -1.0355224609375, -0.9949188232421875, -0.954315185546875, -0.9137115478515625, -0.87310791015625, -0.8325042724609375, -0.791900634765625, -0.7512969970703125, -0.710693359375, -0.6700897216796875, -0.629486083984375, -0.5888824462890625, -0.54827880859375, -0.5076751708984375, -0.467071533203125, -0.4264678955078125, -0.3858642578125, -0.3452606201171875, -0.304656982421875, -0.2640533447265625, -0.22344970703125, -0.1828460693359375, -0.142242431640625, -0.1016387939453125, -0.06103515625, -0.0204315185546875, 0.020172119140625, 0.0607757568359375, 0.10137939453125, 0.1419830322265625, 0.182586669921875, 0.2231903076171875, 0.2637939453125, 0.3043975830078125, 0.345001220703125, 0.3856048583984375, 0.42620849609375, 0.4668121337890625, 0.507415771484375, 0.5480194091796875, 0.588623046875, 0.6292266845703125, 0.669830322265625, 0.7104339599609375, 0.75103759765625, 0.7916412353515625, 0.832244873046875, 0.8728485107421875, 0.9134521484375, 0.9540557861328125, 0.994659423828125, 1.0352630615234375, 1.07586669921875, 1.1164703369140625, 1.157073974609375, 1.1976776123046875, 1.23828125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 19.0, 32.0, 61.0, 77.0, 131.0, 188.0, 313.0, 555.0, 697.0, 1216.0, 1949.0, 2962.0, 4571.0, 7234.0, 11177.0, 17053.0, 25180.0, 37040.0, 51644.0, 68870.0, 85769.0, 101227.0, 109306.0, 109602.0, 100557.0, 85509.0, 67554.0, 50302.0, 35657.0, 24786.0, 16555.0, 11197.0, 7003.0, 4657.0, 2830.0, 1828.0, 1165.0, 746.0, 481.0, 308.0, 197.0, 124.0, 76.0, 59.0, 28.0, 19.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.57110595703125, -0.5513916015625, -0.53167724609375, -0.511962890625, -0.49224853515625, -0.4725341796875, -0.45281982421875, -0.43310546875, -0.41339111328125, -0.3936767578125, -0.37396240234375, -0.354248046875, -0.33453369140625, -0.3148193359375, -0.29510498046875, -0.275390625, -0.25567626953125, -0.2359619140625, -0.21624755859375, -0.196533203125, -0.17681884765625, -0.1571044921875, -0.13739013671875, -0.11767578125, -0.09796142578125, -0.0782470703125, -0.05853271484375, -0.038818359375, -0.01910400390625, 0.0006103515625, 0.02032470703125, 0.0400390625, 0.05975341796875, 0.0794677734375, 0.09918212890625, 0.118896484375, 0.13861083984375, 0.1583251953125, 0.17803955078125, 0.19775390625, 0.21746826171875, 0.2371826171875, 0.25689697265625, 0.276611328125, 0.29632568359375, 0.3160400390625, 0.33575439453125, 0.35546875, 0.37518310546875, 0.3948974609375, 0.41461181640625, 0.434326171875, 0.45404052734375, 0.4737548828125, 0.49346923828125, 0.51318359375, 0.53289794921875, 0.5526123046875, 0.57232666015625, 0.592041015625, 0.61175537109375, 0.6314697265625, 0.65118408203125, 0.6708984375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 16.0, 9.0, 19.0, 24.0, 21.0, 31.0, 32.0, 34.0, 43.0, 43.0, 37.0, 52.0, 66.0, 58.0, 51.0, 47.0, 58.0, 44.0, 42.0, 43.0, 35.0, 38.0, 24.0, 21.0, 20.0, 18.0, 11.0, 10.0, 11.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.399652481079102e-05, -9.12155956029892e-05, -8.843466639518738e-05, -8.565373718738556e-05, -8.287280797958374e-05, -8.009187877178192e-05, -7.73109495639801e-05, -7.453002035617828e-05, -7.174909114837646e-05, -6.896816194057465e-05, -6.618723273277283e-05, -6.340630352497101e-05, -6.062537431716919e-05, -5.784444510936737e-05, -5.506351590156555e-05, -5.228258669376373e-05, -4.9501657485961914e-05, -4.6720728278160095e-05, -4.3939799070358276e-05, -4.115886986255646e-05, -3.837794065475464e-05, -3.559701144695282e-05, -3.2816082239151e-05, -3.0035153031349182e-05, -2.7254223823547363e-05, -2.4473294615745544e-05, -2.1692365407943726e-05, -1.8911436200141907e-05, -1.6130506992340088e-05, -1.3349577784538269e-05, -1.056864857673645e-05, -7.787719368934631e-06, -5.0067901611328125e-06, -2.2258609533309937e-06, 5.550682544708252e-07, 3.335997462272644e-06, 6.116926670074463e-06, 8.897855877876282e-06, 1.16787850856781e-05, 1.445971429347992e-05, 1.7240643501281738e-05, 2.0021572709083557e-05, 2.2802501916885376e-05, 2.5583431124687195e-05, 2.8364360332489014e-05, 3.114528954029083e-05, 3.392621874809265e-05, 3.670714795589447e-05, 3.948807716369629e-05, 4.226900637149811e-05, 4.504993557929993e-05, 4.7830864787101746e-05, 5.0611793994903564e-05, 5.339272320270538e-05, 5.61736524105072e-05, 5.895458161830902e-05, 6.173551082611084e-05, 6.451644003391266e-05, 6.729736924171448e-05, 7.00782984495163e-05, 7.285922765731812e-05, 7.564015686511993e-05, 7.842108607292175e-05, 8.120201528072357e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 5.0, 7.0, 15.0, 24.0, 34.0, 70.0, 86.0, 129.0, 211.0, 299.0, 504.0, 748.0, 1220.0, 1941.0, 3099.0, 4886.0, 7731.0, 11867.0, 18267.0, 27525.0, 40138.0, 56625.0, 75412.0, 94927.0, 109401.0, 115207.0, 111321.0, 97903.0, 79672.0, 60504.0, 43184.0, 29808.0, 19820.0, 12948.0, 8397.0, 5274.0, 3350.0, 2224.0, 1393.0, 888.0, 555.0, 367.0, 214.0, 122.0, 88.0, 45.0, 41.0, 23.0, 19.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.59466552734375, -0.5731201171875, -0.55157470703125, -0.530029296875, -0.50848388671875, -0.4869384765625, -0.46539306640625, -0.44384765625, -0.42230224609375, -0.4007568359375, -0.37921142578125, -0.357666015625, -0.33612060546875, -0.3145751953125, -0.29302978515625, -0.271484375, -0.24993896484375, -0.2283935546875, -0.20684814453125, -0.185302734375, -0.16375732421875, -0.1422119140625, -0.12066650390625, -0.09912109375, -0.07757568359375, -0.0560302734375, -0.03448486328125, -0.012939453125, 0.00860595703125, 0.0301513671875, 0.05169677734375, 0.0732421875, 0.09478759765625, 0.1163330078125, 0.13787841796875, 0.159423828125, 0.18096923828125, 0.2025146484375, 0.22406005859375, 0.24560546875, 0.26715087890625, 0.2886962890625, 0.31024169921875, 0.331787109375, 0.35333251953125, 0.3748779296875, 0.39642333984375, 0.41796875, 0.43951416015625, 0.4610595703125, 0.48260498046875, 0.504150390625, 0.52569580078125, 0.5472412109375, 0.56878662109375, 0.59033203125, 0.61187744140625, 0.6334228515625, 0.65496826171875, 0.676513671875, 0.69805908203125, 0.7196044921875, 0.74114990234375, 0.7626953125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 7.0, 6.0, 11.0, 14.0, 11.0, 17.0, 17.0, 20.0, 29.0, 31.0, 41.0, 42.0, 31.0, 46.0, 41.0, 57.0, 38.0, 51.0, 53.0, 54.0, 38.0, 30.0, 35.0, 36.0, 32.0, 31.0, 24.0, 23.0, 19.0, 27.0, 14.0, 14.0, 11.0, 9.0, 4.0, 7.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2149658203125, -0.20800018310546875, -0.2010345458984375, -0.19406890869140625, -0.187103271484375, -0.18013763427734375, -0.1731719970703125, -0.16620635986328125, -0.15924072265625, -0.15227508544921875, -0.1453094482421875, -0.13834381103515625, -0.131378173828125, -0.12441253662109375, -0.1174468994140625, -0.11048126220703125, -0.103515625, -0.09654998779296875, -0.0895843505859375, -0.08261871337890625, -0.075653076171875, -0.06868743896484375, -0.0617218017578125, -0.05475616455078125, -0.04779052734375, -0.04082489013671875, -0.0338592529296875, -0.02689361572265625, -0.019927978515625, -0.01296234130859375, -0.0059967041015625, 0.00096893310546875, 0.0079345703125, 0.01490020751953125, 0.0218658447265625, 0.02883148193359375, 0.035797119140625, 0.04276275634765625, 0.0497283935546875, 0.05669403076171875, 0.06365966796875, 0.07062530517578125, 0.0775909423828125, 0.08455657958984375, 0.091522216796875, 0.09848785400390625, 0.1054534912109375, 0.11241912841796875, 0.119384765625, 0.12635040283203125, 0.1333160400390625, 0.14028167724609375, 0.147247314453125, 0.15421295166015625, 0.1611785888671875, 0.16814422607421875, 0.17510986328125, 0.18207550048828125, 0.1890411376953125, 0.19600677490234375, 0.202972412109375, 0.20993804931640625, 0.2169036865234375, 0.22386932373046875, 0.2308349609375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 4.0, 7.0, 6.0, 5.0, 14.0, 16.0, 14.0, 17.0, 24.0, 28.0, 29.0, 51.0, 41.0, 52.0, 48.0, 78.0, 62.0, 54.0, 57.0, 50.0, 53.0, 43.0, 48.0, 37.0, 43.0, 25.0, 23.0, 13.0, 21.0, 13.0, 15.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.274965286254883, -3.179086208343506, -3.083207130432129, -2.987328052520752, -2.891448974609375, -2.795569896697998, -2.699690818786621, -2.603811740875244, -2.507932662963867, -2.4120535850524902, -2.3161745071411133, -2.2202954292297363, -2.1244163513183594, -2.0285372734069824, -1.932658076286316, -1.836778998374939, -1.7408998012542725, -1.6450207233428955, -1.5491416454315186, -1.4532625675201416, -1.3573834896087646, -1.2615044116973877, -1.1656252145767212, -1.0697461366653442, -0.9738670587539673, -0.8779879808425903, -0.7821089029312134, -0.6862297654151917, -0.5903506875038147, -0.49447160959243774, -0.398592472076416, -0.30271339416503906, -0.2068345546722412, -0.11095546185970306, -0.015076369047164917, 0.08080273866653442, 0.17668181657791138, 0.27256089448928833, 0.36844003200531006, 0.464319109916687, 0.560198187828064, 0.6560772657394409, 0.7519563436508179, 0.8478354811668396, 0.9437145590782166, 1.0395936965942383, 1.1354727745056152, 1.2313518524169922, 1.3272309303283691, 1.423110008239746, 1.518989086151123, 1.6148681640625, 1.710747241973877, 1.806626319885254, 1.9025055170059204, 1.9983845949172974, 2.0942635536193848, 2.1901426315307617, 2.2860217094421387, 2.3819007873535156, 2.4777798652648926, 2.5736589431762695, 2.6695380210876465, 2.7654170989990234, 2.8612964153289795]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 4.0, 5.0, 5.0, 0.0, 8.0, 11.0, 7.0, 16.0, 7.0, 14.0, 12.0, 28.0, 19.0, 25.0, 27.0, 28.0, 32.0, 26.0, 32.0, 35.0, 42.0, 38.0, 34.0, 36.0, 49.0, 29.0, 36.0, 43.0, 41.0, 34.0, 34.0, 31.0, 35.0, 31.0, 28.0, 22.0, 16.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.041332721710205, -1.9815632104873657, -1.921793818473816, -1.8620243072509766, -1.8022549152374268, -1.7424854040145874, -1.682715892791748, -1.6229465007781982, -1.5631769895553589, -1.5034074783325195, -1.4436380863189697, -1.3838685750961304, -1.324099063873291, -1.2643296718597412, -1.2045601606369019, -1.1447906494140625, -1.0850212574005127, -1.0252517461776733, -0.9654823541641235, -0.9057128429412842, -0.8459433913230896, -0.786173939704895, -0.7264044284820557, -0.6666349768638611, -0.6068655252456665, -0.5470960736274719, -0.48732659220695496, -0.427557110786438, -0.3677876591682434, -0.30801820755004883, -0.24824872612953186, -0.1884792447090149, -0.12870991230010986, -0.06894044578075409, -0.009170979261398315, 0.05059848725795746, 0.11036795377731323, 0.1701374053955078, 0.22990688681602478, 0.28967636823654175, 0.34944581985473633, 0.4092152714729309, 0.4689847528934479, 0.5287542343139648, 0.5885236859321594, 0.648293137550354, 0.7080626487731934, 0.7678321003913879, 0.8276015520095825, 0.8873710036277771, 0.9471404552459717, 1.006909966468811, 1.0666794776916504, 1.1264488697052002, 1.1862183809280396, 1.245987892150879, 1.3057572841644287, 1.365526795387268, 1.4252961874008179, 1.4850656986236572, 1.544835090637207, 1.6046046018600464, 1.6643741130828857, 1.7241435050964355, 1.783913016319275]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 9.0, 17.0, 17.0, 25.0, 35.0, 63.0, 113.0, 176.0, 273.0, 428.0, 660.0, 1147.0, 1776.0, 2867.0, 4608.0, 7447.0, 12084.0, 19588.0, 31849.0, 50790.0, 79422.0, 121833.0, 179768.0, 252160.0, 335220.0, 414206.0, 465715.0, 478873.0, 443079.0, 374101.0, 291771.0, 212306.0, 146118.0, 97448.0, 62956.0, 40249.0, 24850.0, 15443.0, 9426.0, 5844.0, 3558.0, 2225.0, 1409.0, 835.0, 548.0, 340.0, 230.0, 139.0, 96.0, 62.0, 30.0, 24.0, 17.0, 8.0, 2.0, 2.0, 1.0], "bins": [-2.076171875, -2.015533447265625, -1.95489501953125, -1.894256591796875, -1.8336181640625, -1.772979736328125, -1.71234130859375, -1.651702880859375, -1.591064453125, -1.530426025390625, -1.46978759765625, -1.409149169921875, -1.3485107421875, -1.287872314453125, -1.22723388671875, -1.166595458984375, -1.10595703125, -1.045318603515625, -0.98468017578125, -0.924041748046875, -0.8634033203125, -0.802764892578125, -0.74212646484375, -0.681488037109375, -0.620849609375, -0.560211181640625, -0.49957275390625, -0.438934326171875, -0.3782958984375, -0.317657470703125, -0.25701904296875, -0.196380615234375, -0.1357421875, -0.075103759765625, -0.01446533203125, 0.046173095703125, 0.1068115234375, 0.167449951171875, 0.22808837890625, 0.288726806640625, 0.349365234375, 0.410003662109375, 0.47064208984375, 0.531280517578125, 0.5919189453125, 0.652557373046875, 0.71319580078125, 0.773834228515625, 0.83447265625, 0.895111083984375, 0.95574951171875, 1.016387939453125, 1.0770263671875, 1.137664794921875, 1.19830322265625, 1.258941650390625, 1.319580078125, 1.380218505859375, 1.44085693359375, 1.501495361328125, 1.5621337890625, 1.622772216796875, 1.68341064453125, 1.744049072265625, 1.8046875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 8.0, 11.0, 12.0, 16.0, 17.0, 18.0, 25.0, 12.0, 25.0, 41.0, 23.0, 24.0, 31.0, 39.0, 53.0, 31.0, 47.0, 40.0, 43.0, 41.0, 45.0, 36.0, 35.0, 29.0, 41.0, 33.0, 27.0, 25.0, 21.0, 28.0, 28.0, 15.0, 10.0, 16.0, 10.0, 5.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.0, -1.9428863525390625, -1.885772705078125, -1.8286590576171875, -1.77154541015625, -1.7144317626953125, -1.657318115234375, -1.6002044677734375, -1.5430908203125, -1.4859771728515625, -1.428863525390625, -1.3717498779296875, -1.31463623046875, -1.2575225830078125, -1.200408935546875, -1.1432952880859375, -1.086181640625, -1.0290679931640625, -0.971954345703125, -0.9148406982421875, -0.85772705078125, -0.8006134033203125, -0.743499755859375, -0.6863861083984375, -0.6292724609375, -0.5721588134765625, -0.515045166015625, -0.4579315185546875, -0.40081787109375, -0.3437042236328125, -0.286590576171875, -0.2294769287109375, -0.17236328125, -0.1152496337890625, -0.058135986328125, -0.0010223388671875, 0.05609130859375, 0.1132049560546875, 0.170318603515625, 0.2274322509765625, 0.2845458984375, 0.3416595458984375, 0.398773193359375, 0.4558868408203125, 0.51300048828125, 0.5701141357421875, 0.627227783203125, 0.6843414306640625, 0.741455078125, 0.7985687255859375, 0.855682373046875, 0.9127960205078125, 0.96990966796875, 1.0270233154296875, 1.084136962890625, 1.1412506103515625, 1.1983642578125, 1.2554779052734375, 1.312591552734375, 1.3697052001953125, 1.42681884765625, 1.4839324951171875, 1.541046142578125, 1.5981597900390625, 1.6552734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 6.0, 7.0, 13.0, 23.0, 25.0, 53.0, 66.0, 131.0, 243.0, 362.0, 605.0, 910.0, 1679.0, 2669.0, 4494.0, 7434.0, 12098.0, 19061.0, 31376.0, 49142.0, 75290.0, 113694.0, 164516.0, 227795.0, 299132.0, 368460.0, 422066.0, 445540.0, 434341.0, 388886.0, 322999.0, 250898.0, 183483.0, 128823.0, 86431.0, 56921.0, 36118.0, 22885.0, 13929.0, 8472.0, 5158.0, 3149.0, 1984.0, 1168.0, 644.0, 447.0, 231.0, 168.0, 106.0, 58.0, 41.0, 23.0, 18.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9755859375, -1.9066619873046875, -1.837738037109375, -1.7688140869140625, -1.69989013671875, -1.6309661865234375, -1.562042236328125, -1.4931182861328125, -1.4241943359375, -1.3552703857421875, -1.286346435546875, -1.2174224853515625, -1.14849853515625, -1.0795745849609375, -1.010650634765625, -0.9417266845703125, -0.872802734375, -0.8038787841796875, -0.734954833984375, -0.6660308837890625, -0.59710693359375, -0.5281829833984375, -0.459259033203125, -0.3903350830078125, -0.3214111328125, -0.2524871826171875, -0.183563232421875, -0.1146392822265625, -0.04571533203125, 0.0232086181640625, 0.092132568359375, 0.1610565185546875, 0.22998046875, 0.2989044189453125, 0.367828369140625, 0.4367523193359375, 0.50567626953125, 0.5746002197265625, 0.643524169921875, 0.7124481201171875, 0.7813720703125, 0.8502960205078125, 0.919219970703125, 0.9881439208984375, 1.05706787109375, 1.1259918212890625, 1.194915771484375, 1.2638397216796875, 1.332763671875, 1.4016876220703125, 1.470611572265625, 1.5395355224609375, 1.60845947265625, 1.6773834228515625, 1.746307373046875, 1.8152313232421875, 1.8841552734375, 1.9530792236328125, 2.022003173828125, 2.0909271240234375, 2.15985107421875, 2.2287750244140625, 2.297698974609375, 2.3666229248046875, 2.435546875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 3.0, 8.0, 7.0, 12.0, 17.0, 16.0, 24.0, 29.0, 37.0, 38.0, 56.0, 64.0, 80.0, 90.0, 107.0, 155.0, 161.0, 179.0, 207.0, 213.0, 211.0, 219.0, 251.0, 214.0, 212.0, 178.0, 201.0, 193.0, 167.0, 140.0, 129.0, 105.0, 65.0, 68.0, 40.0, 37.0, 38.0, 26.0, 14.0, 17.0, 10.0, 11.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.197265625, -1.16339111328125, -1.1295166015625, -1.09564208984375, -1.061767578125, -1.02789306640625, -0.9940185546875, -0.96014404296875, -0.92626953125, -0.89239501953125, -0.8585205078125, -0.82464599609375, -0.790771484375, -0.75689697265625, -0.7230224609375, -0.68914794921875, -0.6552734375, -0.62139892578125, -0.5875244140625, -0.55364990234375, -0.519775390625, -0.48590087890625, -0.4520263671875, -0.41815185546875, -0.38427734375, -0.35040283203125, -0.3165283203125, -0.28265380859375, -0.248779296875, -0.21490478515625, -0.1810302734375, -0.14715576171875, -0.11328125, -0.07940673828125, -0.0455322265625, -0.01165771484375, 0.022216796875, 0.05609130859375, 0.0899658203125, 0.12384033203125, 0.15771484375, 0.19158935546875, 0.2254638671875, 0.25933837890625, 0.293212890625, 0.32708740234375, 0.3609619140625, 0.39483642578125, 0.4287109375, 0.46258544921875, 0.4964599609375, 0.53033447265625, 0.564208984375, 0.59808349609375, 0.6319580078125, 0.66583251953125, 0.69970703125, 0.73358154296875, 0.7674560546875, 0.80133056640625, 0.835205078125, 0.86907958984375, 0.9029541015625, 0.93682861328125, 0.970703125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 12.0, 12.0, 9.0, 16.0, 18.0, 23.0, 17.0, 18.0, 34.0, 30.0, 27.0, 36.0, 52.0, 61.0, 46.0, 39.0, 48.0, 54.0, 46.0, 45.0, 55.0, 43.0, 36.0, 37.0, 35.0, 25.0, 18.0, 22.0, 18.0, 11.0, 10.0, 11.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.551114559173584, -3.4483602046966553, -3.3456058502197266, -3.242851495742798, -3.140097141265869, -3.0373425483703613, -2.9345881938934326, -2.831833839416504, -2.729079484939575, -2.6263251304626465, -2.5235707759857178, -2.420816421508789, -2.3180618286132812, -2.2153077125549316, -2.112553119659424, -2.009798765182495, -1.9070444107055664, -1.8042900562286377, -1.701535701751709, -1.5987812280654907, -1.496026873588562, -1.3932725191116333, -1.290518045425415, -1.1877636909484863, -1.0850093364715576, -0.9822549819946289, -0.8795005679130554, -0.7767461538314819, -0.6739917993545532, -0.5712374448776245, -0.468483030796051, -0.36572861671447754, -0.26297426223754883, -0.16021987795829773, -0.05746549367904663, 0.04528889060020447, 0.14804327487945557, 0.2507976293563843, 0.35355204343795776, 0.45630645751953125, 0.55906081199646, 0.6618151664733887, 0.7645695805549622, 0.8673239946365356, 0.9700783491134644, 1.072832703590393, 1.1755871772766113, 1.27834153175354, 1.3810958862304688, 1.4838502407073975, 1.5866045951843262, 1.6893590688705444, 1.7921134233474731, 1.8948677778244019, 1.9976222515106201, 2.100376605987549, 2.2031309604644775, 2.3058853149414062, 2.408639669418335, 2.5113940238952637, 2.6141486167907715, 2.716902732849121, 2.819657325744629, 2.9224116802215576, 3.0251660346984863]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 13.0, 9.0, 14.0, 18.0, 25.0, 16.0, 21.0, 27.0, 22.0, 29.0, 23.0, 33.0, 31.0, 36.0, 45.0, 43.0, 35.0, 45.0, 33.0, 56.0, 37.0, 30.0, 45.0, 37.0, 31.0, 30.0, 31.0, 18.0, 23.0, 22.0, 15.0, 17.0, 12.0, 21.0, 9.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2918717861175537, -2.2207958698272705, -2.149719715118408, -2.078643798828125, -2.007567882537842, -1.936491847038269, -1.8654158115386963, -1.794339895248413, -1.7232638597488403, -1.6521878242492676, -1.5811119079589844, -1.5100358724594116, -1.4389598369598389, -1.3678839206695557, -1.296807885169983, -1.2257318496704102, -1.154655933380127, -1.0835798978805542, -1.012503981590271, -0.9414279460906982, -0.8703519701957703, -0.7992759943008423, -0.7281999588012695, -0.6571239829063416, -0.5860480070114136, -0.5149720311164856, -0.44389602541923523, -0.37282001972198486, -0.3017440438270569, -0.2306680679321289, -0.15959206223487854, -0.08851605653762817, -0.017440319061279297, 0.053635671734809875, 0.12471166253089905, 0.19578765332698822, 0.2668636441230774, 0.33793962001800537, 0.40901562571525574, 0.4800916314125061, 0.5511676073074341, 0.6222435832023621, 0.69331955909729, 0.7643955945968628, 0.8354715704917908, 0.9065475463867188, 0.9776235818862915, 1.0486996173858643, 1.1197755336761475, 1.1908515691757202, 1.2619274854660034, 1.3330035209655762, 1.4040794372558594, 1.4751554727554321, 1.5462315082550049, 1.617307424545288, 1.6883834600448608, 1.7594594955444336, 1.8305354118347168, 1.9016114473342896, 1.9726874828338623, 2.0437633991241455, 2.1148393154144287, 2.185915470123291, 2.256991386413574]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 8.0, 12.0, 16.0, 18.0, 46.0, 68.0, 113.0, 166.0, 259.0, 476.0, 764.0, 1189.0, 2090.0, 3248.0, 5497.0, 9269.0, 15074.0, 25590.0, 41840.0, 68155.0, 105195.0, 150384.0, 176266.0, 152980.0, 108877.0, 70472.0, 43816.0, 26700.0, 16060.0, 9500.0, 5573.0, 3500.0, 2055.0, 1265.0, 785.0, 473.0, 300.0, 158.0, 94.0, 79.0, 42.0, 27.0, 10.0, 17.0, 7.0, 11.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5694046020507812, -0.5494537353515625, -0.5295028686523438, -0.509552001953125, -0.48960113525390625, -0.4696502685546875, -0.44969940185546875, -0.42974853515625, -0.40979766845703125, -0.3898468017578125, -0.36989593505859375, -0.349945068359375, -0.32999420166015625, -0.3100433349609375, -0.29009246826171875, -0.2701416015625, -0.25019073486328125, -0.2302398681640625, -0.21028900146484375, -0.190338134765625, -0.17038726806640625, -0.1504364013671875, -0.13048553466796875, -0.11053466796875, -0.09058380126953125, -0.0706329345703125, -0.05068206787109375, -0.030731201171875, -0.01078033447265625, 0.0091705322265625, 0.02912139892578125, 0.049072265625, 0.06902313232421875, 0.0889739990234375, 0.10892486572265625, 0.128875732421875, 0.14882659912109375, 0.1687774658203125, 0.18872833251953125, 0.20867919921875, 0.22863006591796875, 0.2485809326171875, 0.26853179931640625, 0.288482666015625, 0.30843353271484375, 0.3283843994140625, 0.34833526611328125, 0.3682861328125, 0.38823699951171875, 0.4081878662109375, 0.42813873291015625, 0.448089599609375, 0.46804046630859375, 0.4879913330078125, 0.5079421997070312, 0.52789306640625, 0.5478439331054688, 0.5677947998046875, 0.5877456665039062, 0.607696533203125, 0.6276473999023438, 0.6475982666015625, 0.6675491333007812, 0.6875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 12.0, 21.0, 18.0, 13.0, 14.0, 31.0, 22.0, 33.0, 27.0, 31.0, 24.0, 35.0, 32.0, 38.0, 38.0, 40.0, 37.0, 41.0, 33.0, 28.0, 39.0, 25.0, 32.0, 32.0, 28.0, 27.0, 18.0, 22.0, 32.0, 23.0, 24.0, 14.0, 10.0, 12.0, 8.0, 9.0, 5.0, 8.0, 9.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-2.263671875, -2.193115234375, -2.12255859375, -2.052001953125, -1.9814453125, -1.910888671875, -1.84033203125, -1.769775390625, -1.69921875, -1.628662109375, -1.55810546875, -1.487548828125, -1.4169921875, -1.346435546875, -1.27587890625, -1.205322265625, -1.134765625, -1.064208984375, -0.99365234375, -0.923095703125, -0.8525390625, -0.781982421875, -0.71142578125, -0.640869140625, -0.5703125, -0.499755859375, -0.42919921875, -0.358642578125, -0.2880859375, -0.217529296875, -0.14697265625, -0.076416015625, -0.005859375, 0.064697265625, 0.13525390625, 0.205810546875, 0.2763671875, 0.346923828125, 0.41748046875, 0.488037109375, 0.55859375, 0.629150390625, 0.69970703125, 0.770263671875, 0.8408203125, 0.911376953125, 0.98193359375, 1.052490234375, 1.123046875, 1.193603515625, 1.26416015625, 1.334716796875, 1.4052734375, 1.475830078125, 1.54638671875, 1.616943359375, 1.6875, 1.758056640625, 1.82861328125, 1.899169921875, 1.9697265625, 2.040283203125, 2.11083984375, 2.181396484375, 2.251953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 11.0, 12.0, 13.0, 22.0, 28.0, 32.0, 43.0, 98.0, 127.0, 193.0, 317.0, 504.0, 742.0, 1140.0, 1819.0, 3116.0, 4966.0, 8508.0, 14459.0, 25566.0, 46035.0, 82897.0, 142215.0, 204576.0, 198779.0, 134398.0, 77006.0, 42954.0, 23990.0, 13607.0, 7939.0, 4697.0, 2896.0, 1741.0, 1103.0, 678.0, 459.0, 293.0, 180.0, 123.0, 76.0, 63.0, 34.0, 37.0, 19.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.75146484375, -0.7286529541015625, -0.705841064453125, -0.6830291748046875, -0.66021728515625, -0.6374053955078125, -0.614593505859375, -0.5917816162109375, -0.5689697265625, -0.5461578369140625, -0.523345947265625, -0.5005340576171875, -0.47772216796875, -0.4549102783203125, -0.432098388671875, -0.4092864990234375, -0.386474609375, -0.3636627197265625, -0.340850830078125, -0.3180389404296875, -0.29522705078125, -0.2724151611328125, -0.249603271484375, -0.2267913818359375, -0.2039794921875, -0.1811676025390625, -0.158355712890625, -0.1355438232421875, -0.11273193359375, -0.0899200439453125, -0.067108154296875, -0.0442962646484375, -0.021484375, 0.0013275146484375, 0.024139404296875, 0.0469512939453125, 0.06976318359375, 0.0925750732421875, 0.115386962890625, 0.1381988525390625, 0.1610107421875, 0.1838226318359375, 0.206634521484375, 0.2294464111328125, 0.25225830078125, 0.2750701904296875, 0.297882080078125, 0.3206939697265625, 0.343505859375, 0.3663177490234375, 0.389129638671875, 0.4119415283203125, 0.43475341796875, 0.4575653076171875, 0.480377197265625, 0.5031890869140625, 0.5260009765625, 0.5488128662109375, 0.571624755859375, 0.5944366455078125, 0.61724853515625, 0.6400604248046875, 0.662872314453125, 0.6856842041015625, 0.70849609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 5.0, 10.0, 8.0, 12.0, 16.0, 22.0, 21.0, 13.0, 30.0, 25.0, 33.0, 21.0, 19.0, 26.0, 26.0, 37.0, 31.0, 33.0, 37.0, 42.0, 26.0, 36.0, 21.0, 41.0, 37.0, 40.0, 35.0, 38.0, 30.0, 32.0, 25.0, 17.0, 18.0, 20.0, 15.0, 15.0, 12.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.267578125, -1.2251129150390625, -1.182647705078125, -1.1401824951171875, -1.09771728515625, -1.0552520751953125, -1.012786865234375, -0.9703216552734375, -0.9278564453125, -0.8853912353515625, -0.842926025390625, -0.8004608154296875, -0.75799560546875, -0.7155303955078125, -0.673065185546875, -0.6305999755859375, -0.588134765625, -0.5456695556640625, -0.503204345703125, -0.4607391357421875, -0.41827392578125, -0.3758087158203125, -0.333343505859375, -0.2908782958984375, -0.2484130859375, -0.2059478759765625, -0.163482666015625, -0.1210174560546875, -0.07855224609375, -0.0360870361328125, 0.006378173828125, 0.0488433837890625, 0.09130859375, 0.1337738037109375, 0.176239013671875, 0.2187042236328125, 0.26116943359375, 0.3036346435546875, 0.346099853515625, 0.3885650634765625, 0.4310302734375, 0.4734954833984375, 0.515960693359375, 0.5584259033203125, 0.60089111328125, 0.6433563232421875, 0.685821533203125, 0.7282867431640625, 0.770751953125, 0.8132171630859375, 0.855682373046875, 0.8981475830078125, 0.94061279296875, 0.9830780029296875, 1.025543212890625, 1.0680084228515625, 1.1104736328125, 1.1529388427734375, 1.195404052734375, 1.2378692626953125, 1.28033447265625, 1.3227996826171875, 1.365264892578125, 1.4077301025390625, 1.4501953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 9.0, 14.0, 24.0, 21.0, 33.0, 46.0, 57.0, 95.0, 125.0, 195.0, 272.0, 426.0, 648.0, 985.0, 1684.0, 2921.0, 5313.0, 10752.0, 24373.0, 73210.0, 327167.0, 440721.0, 101124.0, 30718.0, 12651.0, 6329.0, 3391.0, 1953.0, 1110.0, 659.0, 499.0, 304.0, 218.0, 152.0, 96.0, 61.0, 47.0, 40.0, 28.0, 16.0, 19.0, 16.0, 5.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58740234375, -0.5685272216796875, -0.549652099609375, -0.5307769775390625, -0.51190185546875, -0.4930267333984375, -0.474151611328125, -0.4552764892578125, -0.4364013671875, -0.4175262451171875, -0.398651123046875, -0.3797760009765625, -0.36090087890625, -0.3420257568359375, -0.323150634765625, -0.3042755126953125, -0.285400390625, -0.2665252685546875, -0.247650146484375, -0.2287750244140625, -0.20989990234375, -0.1910247802734375, -0.172149658203125, -0.1532745361328125, -0.1343994140625, -0.1155242919921875, -0.096649169921875, -0.0777740478515625, -0.05889892578125, -0.0400238037109375, -0.021148681640625, -0.0022735595703125, 0.0166015625, 0.0354766845703125, 0.054351806640625, 0.0732269287109375, 0.09210205078125, 0.1109771728515625, 0.129852294921875, 0.1487274169921875, 0.1676025390625, 0.1864776611328125, 0.205352783203125, 0.2242279052734375, 0.24310302734375, 0.2619781494140625, 0.280853271484375, 0.2997283935546875, 0.318603515625, 0.3374786376953125, 0.356353759765625, 0.3752288818359375, 0.39410400390625, 0.4129791259765625, 0.431854248046875, 0.4507293701171875, 0.4696044921875, 0.4884796142578125, 0.507354736328125, 0.5262298583984375, 0.54510498046875, 0.5639801025390625, 0.582855224609375, 0.6017303466796875, 0.62060546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 20.0, 14.0, 19.0, 32.0, 34.0, 47.0, 43.0, 50.0, 54.0, 69.0, 72.0, 66.0, 67.0, 67.0, 56.0, 56.0, 41.0, 37.0, 27.0, 24.0, 18.0, 13.0, 10.0, 4.0, 8.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.7286278307437897e-05, -1.6571953892707825e-05, -1.5857629477977753e-05, -1.514330506324768e-05, -1.4428980648517609e-05, -1.3714656233787537e-05, -1.3000331819057465e-05, -1.2286007404327393e-05, -1.157168298959732e-05, -1.0857358574867249e-05, -1.0143034160137177e-05, -9.428709745407104e-06, -8.714385330677032e-06, -8.00006091594696e-06, -7.2857365012168884e-06, -6.571412086486816e-06, -5.857087671756744e-06, -5.142763257026672e-06, -4.4284388422966e-06, -3.7141144275665283e-06, -2.9997900128364563e-06, -2.2854655981063843e-06, -1.5711411833763123e-06, -8.568167686462402e-07, -1.424923539161682e-07, 5.718320608139038e-07, 1.2861564755439758e-06, 2.000480890274048e-06, 2.71480530500412e-06, 3.429129719734192e-06, 4.143454134464264e-06, 4.857778549194336e-06, 5.572102963924408e-06, 6.28642737865448e-06, 7.000751793384552e-06, 7.715076208114624e-06, 8.429400622844696e-06, 9.143725037574768e-06, 9.85804945230484e-06, 1.0572373867034912e-05, 1.1286698281764984e-05, 1.2001022696495056e-05, 1.2715347111225128e-05, 1.34296715259552e-05, 1.4143995940685272e-05, 1.4858320355415344e-05, 1.5572644770145416e-05, 1.6286969184875488e-05, 1.700129359960556e-05, 1.7715618014335632e-05, 1.8429942429065704e-05, 1.9144266843795776e-05, 1.985859125852585e-05, 2.057291567325592e-05, 2.1287240087985992e-05, 2.2001564502716064e-05, 2.2715888917446136e-05, 2.343021333217621e-05, 2.414453774690628e-05, 2.4858862161636353e-05, 2.5573186576366425e-05, 2.6287510991096497e-05, 2.700183540582657e-05, 2.771615982055664e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 9.0, 18.0, 28.0, 55.0, 53.0, 79.0, 120.0, 173.0, 246.0, 332.0, 539.0, 810.0, 1210.0, 1789.0, 2973.0, 5186.0, 8758.0, 16601.0, 34334.0, 81535.0, 206398.0, 341909.0, 196609.0, 77668.0, 33355.0, 15950.0, 8483.0, 4859.0, 3007.0, 1874.0, 1177.0, 754.0, 537.0, 358.0, 219.0, 168.0, 106.0, 72.0, 57.0, 48.0, 26.0, 17.0, 12.0, 6.0, 13.0, 3.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.73046875, -0.7098770141601562, -0.6892852783203125, -0.6686935424804688, -0.648101806640625, -0.6275100708007812, -0.6069183349609375, -0.5863265991210938, -0.56573486328125, -0.5451431274414062, -0.5245513916015625, -0.5039596557617188, -0.483367919921875, -0.46277618408203125, -0.4421844482421875, -0.42159271240234375, -0.4010009765625, -0.38040924072265625, -0.3598175048828125, -0.33922576904296875, -0.318634033203125, -0.29804229736328125, -0.2774505615234375, -0.25685882568359375, -0.23626708984375, -0.21567535400390625, -0.1950836181640625, -0.17449188232421875, -0.153900146484375, -0.13330841064453125, -0.1127166748046875, -0.09212493896484375, -0.071533203125, -0.05094146728515625, -0.0303497314453125, -0.00975799560546875, 0.010833740234375, 0.03142547607421875, 0.0520172119140625, 0.07260894775390625, 0.09320068359375, 0.11379241943359375, 0.1343841552734375, 0.15497589111328125, 0.175567626953125, 0.19615936279296875, 0.2167510986328125, 0.23734283447265625, 0.2579345703125, 0.27852630615234375, 0.2991180419921875, 0.31970977783203125, 0.340301513671875, 0.36089324951171875, 0.3814849853515625, 0.40207672119140625, 0.42266845703125, 0.44326019287109375, 0.4638519287109375, 0.48444366455078125, 0.505035400390625, 0.5256271362304688, 0.5462188720703125, 0.5668106079101562, 0.58740234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 8.0, 6.0, 10.0, 12.0, 17.0, 13.0, 17.0, 34.0, 39.0, 71.0, 65.0, 88.0, 110.0, 108.0, 99.0, 68.0, 54.0, 23.0, 25.0, 23.0, 22.0, 15.0, 15.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.14951324462890625, -0.1443634033203125, -0.13921356201171875, -0.134063720703125, -0.12891387939453125, -0.1237640380859375, -0.11861419677734375, -0.11346435546875, -0.10831451416015625, -0.1031646728515625, -0.09801483154296875, -0.092864990234375, -0.08771514892578125, -0.0825653076171875, -0.07741546630859375, -0.072265625, -0.06711578369140625, -0.0619659423828125, -0.05681610107421875, -0.051666259765625, -0.04651641845703125, -0.0413665771484375, -0.03621673583984375, -0.03106689453125, -0.02591705322265625, -0.0207672119140625, -0.01561737060546875, -0.010467529296875, -0.00531768798828125, -0.0001678466796875, 0.00498199462890625, 0.0101318359375, 0.01528167724609375, 0.0204315185546875, 0.02558135986328125, 0.030731201171875, 0.03588104248046875, 0.0410308837890625, 0.04618072509765625, 0.05133056640625, 0.05648040771484375, 0.0616302490234375, 0.06678009033203125, 0.071929931640625, 0.07707977294921875, 0.0822296142578125, 0.08737945556640625, 0.092529296875, 0.09767913818359375, 0.1028289794921875, 0.10797882080078125, 0.113128662109375, 0.11827850341796875, 0.1234283447265625, 0.12857818603515625, 0.13372802734375, 0.13887786865234375, 0.1440277099609375, 0.14917755126953125, 0.154327392578125, 0.15947723388671875, 0.1646270751953125, 0.16977691650390625, 0.1749267578125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 0.0, 6.0, 4.0, 8.0, 11.0, 15.0, 17.0, 20.0, 17.0, 14.0, 30.0, 26.0, 34.0, 31.0, 35.0, 52.0, 56.0, 44.0, 46.0, 52.0, 46.0, 49.0, 51.0, 46.0, 45.0, 38.0, 36.0, 33.0, 16.0, 31.0, 16.0, 16.0, 11.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.535590648651123, -3.4327683448791504, -3.3299460411071777, -3.227123737335205, -3.1243014335632324, -3.0214791297912598, -2.918656826019287, -2.8158345222473145, -2.713012218475342, -2.610189914703369, -2.5073676109313965, -2.404545307159424, -2.301723003387451, -2.1989006996154785, -2.096078395843506, -1.9932562112808228, -1.8904340267181396, -1.787611722946167, -1.6847894191741943, -1.5819671154022217, -1.479144811630249, -1.3763225078582764, -1.2735003232955933, -1.1706780195236206, -1.067855715751648, -0.9650334119796753, -0.8622111082077026, -0.7593888640403748, -0.6565665602684021, -0.5537442564964294, -0.45092201232910156, -0.3480997085571289, -0.24527764320373535, -0.1424553543329239, -0.03963306546211243, 0.06318920850753784, 0.1660115122795105, 0.26883381605148315, 0.37165606021881104, 0.4744783639907837, 0.5773006677627563, 0.680122971534729, 0.7829452753067017, 0.8857675194740295, 0.9885898232460022, 1.09141206741333, 1.1942343711853027, 1.2970566749572754, 1.399878978729248, 1.5027012825012207, 1.6055235862731934, 1.708345890045166, 1.8111681938171387, 1.9139904975891113, 2.016812801361084, 2.1196351051330566, 2.2224574089050293, 2.325279712677002, 2.4281020164489746, 2.5309243202209473, 2.63374662399292, 2.7365689277648926, 2.8393912315368652, 2.942213535308838, 3.0450356006622314]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 14.0, 13.0, 20.0, 21.0, 17.0, 21.0, 27.0, 16.0, 35.0, 21.0, 36.0, 26.0, 38.0, 46.0, 46.0, 31.0, 47.0, 35.0, 48.0, 41.0, 34.0, 39.0, 42.0, 32.0, 27.0, 26.0, 24.0, 20.0, 23.0, 13.0, 20.0, 10.0, 17.0, 12.0, 8.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2628321647644043, -2.1919450759887695, -2.1210579872131348, -2.0501708984375, -1.9792838096618652, -1.9083967208862305, -1.8375095129013062, -1.7666224241256714, -1.6957353353500366, -1.6248482465744019, -1.553961157798767, -1.4830740690231323, -1.412186861038208, -1.3412997722625732, -1.2704126834869385, -1.1995255947113037, -1.128638505935669, -1.0577514171600342, -0.9868643283843994, -0.9159771800041199, -0.8450900912284851, -0.7742030024528503, -0.7033158540725708, -0.632428765296936, -0.5615416765213013, -0.4906545877456665, -0.41976746916770935, -0.3488803505897522, -0.27799326181411743, -0.20710617303848267, -0.1362190544605255, -0.06533193588256836, 0.005554914474487305, 0.07644201815128326, 0.14732912182807922, 0.21821622550487518, 0.28910332918167114, 0.3599904179573059, 0.43087753653526306, 0.5017646551132202, 0.572651743888855, 0.6435388326644897, 0.7144259214401245, 0.785313069820404, 0.8562001585960388, 0.9270872473716736, 0.9979743957519531, 1.068861484527588, 1.1397485733032227, 1.2106356620788574, 1.2815227508544922, 1.352409839630127, 1.4232969284057617, 1.4941840171813965, 1.5650712251663208, 1.6359583139419556, 1.7068454027175903, 1.777732491493225, 1.8486195802688599, 1.9195066690444946, 1.990393877029419, 2.0612809658050537, 2.1321680545806885, 2.2030551433563232, 2.273942232131958]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 9.0, 5.0, 24.0, 28.0, 58.0, 67.0, 137.0, 199.0, 332.0, 472.0, 767.0, 1159.0, 1739.0, 2823.0, 4318.0, 6322.0, 9443.0, 13741.0, 19412.0, 27325.0, 36716.0, 47635.0, 59910.0, 71428.0, 81431.0, 89062.0, 91416.0, 89418.0, 82300.0, 72935.0, 60789.0, 48772.0, 37208.0, 28021.0, 19952.0, 14287.0, 9767.0, 6516.0, 4361.0, 2902.0, 1954.0, 1210.0, 819.0, 497.0, 319.0, 208.0, 138.0, 73.0, 47.0, 36.0, 17.0, 13.0, 9.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2197265625, -1.1797943115234375, -1.139862060546875, -1.0999298095703125, -1.05999755859375, -1.0200653076171875, -0.980133056640625, -0.9402008056640625, -0.9002685546875, -0.8603363037109375, -0.820404052734375, -0.7804718017578125, -0.74053955078125, -0.7006072998046875, -0.660675048828125, -0.6207427978515625, -0.580810546875, -0.5408782958984375, -0.500946044921875, -0.4610137939453125, -0.42108154296875, -0.3811492919921875, -0.341217041015625, -0.3012847900390625, -0.2613525390625, -0.2214202880859375, -0.181488037109375, -0.1415557861328125, -0.10162353515625, -0.0616912841796875, -0.021759033203125, 0.0181732177734375, 0.05810546875, 0.0980377197265625, 0.137969970703125, 0.1779022216796875, 0.21783447265625, 0.2577667236328125, 0.297698974609375, 0.3376312255859375, 0.3775634765625, 0.4174957275390625, 0.457427978515625, 0.4973602294921875, 0.53729248046875, 0.5772247314453125, 0.617156982421875, 0.6570892333984375, 0.697021484375, 0.7369537353515625, 0.776885986328125, 0.8168182373046875, 0.85675048828125, 0.8966827392578125, 0.936614990234375, 0.9765472412109375, 1.0164794921875, 1.0564117431640625, 1.096343994140625, 1.1362762451171875, 1.17620849609375, 1.2161407470703125, 1.256072998046875, 1.2960052490234375, 1.3359375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 13.0, 11.0, 10.0, 21.0, 14.0, 13.0, 15.0, 21.0, 26.0, 29.0, 33.0, 35.0, 43.0, 31.0, 41.0, 30.0, 38.0, 45.0, 37.0, 45.0, 38.0, 40.0, 45.0, 39.0, 36.0, 24.0, 30.0, 29.0, 15.0, 24.0, 23.0, 13.0, 15.0, 11.0, 13.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.541015625, -2.4637451171875, -2.386474609375, -2.3092041015625, -2.23193359375, -2.1546630859375, -2.077392578125, -2.0001220703125, -1.9228515625, -1.8455810546875, -1.768310546875, -1.6910400390625, -1.61376953125, -1.5364990234375, -1.459228515625, -1.3819580078125, -1.3046875, -1.2274169921875, -1.150146484375, -1.0728759765625, -0.99560546875, -0.9183349609375, -0.841064453125, -0.7637939453125, -0.6865234375, -0.6092529296875, -0.531982421875, -0.4547119140625, -0.37744140625, -0.3001708984375, -0.222900390625, -0.1456298828125, -0.068359375, 0.0089111328125, 0.086181640625, 0.1634521484375, 0.24072265625, 0.3179931640625, 0.395263671875, 0.4725341796875, 0.5498046875, 0.6270751953125, 0.704345703125, 0.7816162109375, 0.85888671875, 0.9361572265625, 1.013427734375, 1.0906982421875, 1.16796875, 1.2452392578125, 1.322509765625, 1.3997802734375, 1.47705078125, 1.5543212890625, 1.631591796875, 1.7088623046875, 1.7861328125, 1.8634033203125, 1.940673828125, 2.0179443359375, 2.09521484375, 2.1724853515625, 2.249755859375, 2.3270263671875, 2.404296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 8.0, 9.0, 23.0, 24.0, 46.0, 82.0, 127.0, 164.0, 326.0, 501.0, 723.0, 1202.0, 1879.0, 2946.0, 4518.0, 6836.0, 10184.0, 15255.0, 21617.0, 29999.0, 41417.0, 53773.0, 66959.0, 79651.0, 89229.0, 95397.0, 94963.0, 89799.0, 79778.0, 67221.0, 54069.0, 41362.0, 30831.0, 22153.0, 15329.0, 10471.0, 6819.0, 4752.0, 2926.0, 1920.0, 1243.0, 717.0, 512.0, 298.0, 200.0, 114.0, 66.0, 49.0, 37.0, 12.0, 14.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-1.4267578125, -1.383544921875, -1.34033203125, -1.297119140625, -1.25390625, -1.210693359375, -1.16748046875, -1.124267578125, -1.0810546875, -1.037841796875, -0.99462890625, -0.951416015625, -0.908203125, -0.864990234375, -0.82177734375, -0.778564453125, -0.7353515625, -0.692138671875, -0.64892578125, -0.605712890625, -0.5625, -0.519287109375, -0.47607421875, -0.432861328125, -0.3896484375, -0.346435546875, -0.30322265625, -0.260009765625, -0.216796875, -0.173583984375, -0.13037109375, -0.087158203125, -0.0439453125, -0.000732421875, 0.04248046875, 0.085693359375, 0.12890625, 0.172119140625, 0.21533203125, 0.258544921875, 0.3017578125, 0.344970703125, 0.38818359375, 0.431396484375, 0.474609375, 0.517822265625, 0.56103515625, 0.604248046875, 0.6474609375, 0.690673828125, 0.73388671875, 0.777099609375, 0.8203125, 0.863525390625, 0.90673828125, 0.949951171875, 0.9931640625, 1.036376953125, 1.07958984375, 1.122802734375, 1.166015625, 1.209228515625, 1.25244140625, 1.295654296875, 1.3388671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 4.0, 16.0, 16.0, 24.0, 31.0, 23.0, 21.0, 35.0, 23.0, 31.0, 36.0, 24.0, 30.0, 45.0, 36.0, 36.0, 43.0, 41.0, 42.0, 40.0, 42.0, 38.0, 46.0, 30.0, 25.0, 30.0, 22.0, 17.0, 20.0, 19.0, 14.0, 17.0, 10.0, 15.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 4.0], "bins": [-1.6552734375, -1.6083831787109375, -1.561492919921875, -1.5146026611328125, -1.46771240234375, -1.4208221435546875, -1.373931884765625, -1.3270416259765625, -1.2801513671875, -1.2332611083984375, -1.186370849609375, -1.1394805908203125, -1.09259033203125, -1.0457000732421875, -0.998809814453125, -0.9519195556640625, -0.905029296875, -0.8581390380859375, -0.811248779296875, -0.7643585205078125, -0.71746826171875, -0.6705780029296875, -0.623687744140625, -0.5767974853515625, -0.5299072265625, -0.4830169677734375, -0.436126708984375, -0.3892364501953125, -0.34234619140625, -0.2954559326171875, -0.248565673828125, -0.2016754150390625, -0.15478515625, -0.1078948974609375, -0.061004638671875, -0.0141143798828125, 0.03277587890625, 0.0796661376953125, 0.126556396484375, 0.1734466552734375, 0.2203369140625, 0.2672271728515625, 0.314117431640625, 0.3610076904296875, 0.40789794921875, 0.4547882080078125, 0.501678466796875, 0.5485687255859375, 0.595458984375, 0.6423492431640625, 0.689239501953125, 0.7361297607421875, 0.78302001953125, 0.8299102783203125, 0.876800537109375, 0.9236907958984375, 0.9705810546875, 1.0174713134765625, 1.064361572265625, 1.1112518310546875, 1.15814208984375, 1.2050323486328125, 1.251922607421875, 1.2988128662109375, 1.345703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 16.0, 18.0, 35.0, 56.0, 67.0, 136.0, 195.0, 277.0, 441.0, 752.0, 1171.0, 1809.0, 3073.0, 4911.0, 7819.0, 12768.0, 20684.0, 31294.0, 46198.0, 65024.0, 85707.0, 104289.0, 116774.0, 117972.0, 109350.0, 92306.0, 72120.0, 53091.0, 36384.0, 23633.0, 15138.0, 9616.0, 5870.0, 3600.0, 2229.0, 1348.0, 852.0, 524.0, 344.0, 220.0, 153.0, 95.0, 65.0, 45.0, 24.0, 18.0, 13.0, 9.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.76220703125, -0.7392349243164062, -0.7162628173828125, -0.6932907104492188, -0.670318603515625, -0.6473464965820312, -0.6243743896484375, -0.6014022827148438, -0.57843017578125, -0.5554580688476562, -0.5324859619140625, -0.5095138549804688, -0.486541748046875, -0.46356964111328125, -0.4405975341796875, -0.41762542724609375, -0.3946533203125, -0.37168121337890625, -0.3487091064453125, -0.32573699951171875, -0.302764892578125, -0.27979278564453125, -0.2568206787109375, -0.23384857177734375, -0.21087646484375, -0.18790435791015625, -0.1649322509765625, -0.14196014404296875, -0.118988037109375, -0.09601593017578125, -0.0730438232421875, -0.05007171630859375, -0.027099609375, -0.00412750244140625, 0.0188446044921875, 0.04181671142578125, 0.064788818359375, 0.08776092529296875, 0.1107330322265625, 0.13370513916015625, 0.15667724609375, 0.17964935302734375, 0.2026214599609375, 0.22559356689453125, 0.248565673828125, 0.27153778076171875, 0.2945098876953125, 0.31748199462890625, 0.3404541015625, 0.36342620849609375, 0.3863983154296875, 0.40937042236328125, 0.432342529296875, 0.45531463623046875, 0.4782867431640625, 0.5012588500976562, 0.52423095703125, 0.5472030639648438, 0.5701751708984375, 0.5931472778320312, 0.616119384765625, 0.6390914916992188, 0.6620635986328125, 0.6850357055664062, 0.7080078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 10.0, 14.0, 12.0, 15.0, 14.0, 19.0, 23.0, 19.0, 27.0, 31.0, 31.0, 47.0, 36.0, 35.0, 40.0, 39.0, 47.0, 57.0, 54.0, 39.0, 42.0, 50.0, 49.0, 30.0, 29.0, 29.0, 24.0, 22.0, 19.0, 18.0, 16.0, 8.0, 13.0, 5.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.502920925617218e-05, -7.22743570804596e-05, -6.951950490474701e-05, -6.676465272903442e-05, -6.400980055332184e-05, -6.125494837760925e-05, -5.850009620189667e-05, -5.574524402618408e-05, -5.2990391850471497e-05, -5.023553967475891e-05, -4.7480687499046326e-05, -4.472583532333374e-05, -4.1970983147621155e-05, -3.921613097190857e-05, -3.6461278796195984e-05, -3.37064266204834e-05, -3.095157444477081e-05, -2.8196722269058228e-05, -2.5441870093345642e-05, -2.2687017917633057e-05, -1.993216574192047e-05, -1.7177313566207886e-05, -1.44224613904953e-05, -1.1667609214782715e-05, -8.91275703907013e-06, -6.157904863357544e-06, -3.4030526876449585e-06, -6.48200511932373e-07, 2.1066516637802124e-06, 4.861503839492798e-06, 7.616356015205383e-06, 1.0371208190917969e-05, 1.3126060366630554e-05, 1.588091254234314e-05, 1.8635764718055725e-05, 2.139061689376831e-05, 2.4145469069480896e-05, 2.690032124519348e-05, 2.9655173420906067e-05, 3.241002559661865e-05, 3.516487777233124e-05, 3.791972994804382e-05, 4.067458212375641e-05, 4.3429434299468994e-05, 4.618428647518158e-05, 4.8939138650894165e-05, 5.169399082660675e-05, 5.4448843002319336e-05, 5.720369517803192e-05, 5.995854735374451e-05, 6.271339952945709e-05, 6.546825170516968e-05, 6.822310388088226e-05, 7.097795605659485e-05, 7.373280823230743e-05, 7.648766040802002e-05, 7.92425125837326e-05, 8.199736475944519e-05, 8.475221693515778e-05, 8.750706911087036e-05, 9.026192128658295e-05, 9.301677346229553e-05, 9.577162563800812e-05, 9.85264778137207e-05]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 16.0, 21.0, 30.0, 37.0, 61.0, 100.0, 138.0, 212.0, 378.0, 548.0, 957.0, 1466.0, 2512.0, 4045.0, 7152.0, 12209.0, 21844.0, 36953.0, 59736.0, 89391.0, 119891.0, 142460.0, 145242.0, 129061.0, 99974.0, 68303.0, 43575.0, 26191.0, 15054.0, 8518.0, 4930.0, 2922.0, 1726.0, 1023.0, 686.0, 409.0, 280.0, 151.0, 139.0, 85.0, 39.0, 30.0, 22.0, 17.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9258499145507812, -0.8951568603515625, -0.8644638061523438, -0.833770751953125, -0.8030776977539062, -0.7723846435546875, -0.7416915893554688, -0.71099853515625, -0.6803054809570312, -0.6496124267578125, -0.6189193725585938, -0.588226318359375, -0.5575332641601562, -0.5268402099609375, -0.49614715576171875, -0.4654541015625, -0.43476104736328125, -0.4040679931640625, -0.37337493896484375, -0.342681884765625, -0.31198883056640625, -0.2812957763671875, -0.25060272216796875, -0.21990966796875, -0.18921661376953125, -0.1585235595703125, -0.12783050537109375, -0.097137451171875, -0.06644439697265625, -0.0357513427734375, -0.00505828857421875, 0.025634765625, 0.05632781982421875, 0.0870208740234375, 0.11771392822265625, 0.148406982421875, 0.17910003662109375, 0.2097930908203125, 0.24048614501953125, 0.27117919921875, 0.30187225341796875, 0.3325653076171875, 0.36325836181640625, 0.393951416015625, 0.42464447021484375, 0.4553375244140625, 0.48603057861328125, 0.5167236328125, 0.5474166870117188, 0.5781097412109375, 0.6088027954101562, 0.639495849609375, 0.6701889038085938, 0.7008819580078125, 0.7315750122070312, 0.76226806640625, 0.7929611206054688, 0.8236541748046875, 0.8543472290039062, 0.885040283203125, 0.9157333374023438, 0.9464263916015625, 0.9771194458007812, 1.0078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 9.0, 5.0, 11.0, 6.0, 15.0, 14.0, 13.0, 24.0, 20.0, 33.0, 21.0, 31.0, 47.0, 48.0, 45.0, 39.0, 50.0, 38.0, 40.0, 41.0, 56.0, 27.0, 27.0, 41.0, 29.0, 32.0, 30.0, 23.0, 30.0, 19.0, 23.0, 13.0, 14.0, 10.0, 14.0, 3.0, 12.0, 10.0, 2.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2605476379394531, -0.25205230712890625, -0.24355697631835938, -0.2350616455078125, -0.22656631469726562, -0.21807098388671875, -0.20957565307617188, -0.201080322265625, -0.19258499145507812, -0.18408966064453125, -0.17559432983398438, -0.1670989990234375, -0.15860366821289062, -0.15010833740234375, -0.14161300659179688, -0.13311767578125, -0.12462234497070312, -0.11612701416015625, -0.10763168334960938, -0.0991363525390625, -0.09064102172851562, -0.08214569091796875, -0.07365036010742188, -0.065155029296875, -0.056659698486328125, -0.04816436767578125, -0.039669036865234375, -0.0311737060546875, -0.022678375244140625, -0.01418304443359375, -0.005687713623046875, 0.0028076171875, 0.011302947998046875, 0.01979827880859375, 0.028293609619140625, 0.0367889404296875, 0.045284271240234375, 0.05377960205078125, 0.062274932861328125, 0.070770263671875, 0.07926559448242188, 0.08776092529296875, 0.09625625610351562, 0.1047515869140625, 0.11324691772460938, 0.12174224853515625, 0.13023757934570312, 0.13873291015625, 0.14722824096679688, 0.15572357177734375, 0.16421890258789062, 0.1727142333984375, 0.18120956420898438, 0.18970489501953125, 0.19820022583007812, 0.206695556640625, 0.21519088745117188, 0.22368621826171875, 0.23218154907226562, 0.2406768798828125, 0.24917221069335938, 0.25766754150390625, 0.2661628723144531, 0.274658203125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 9.0, 9.0, 9.0, 10.0, 11.0, 14.0, 18.0, 20.0, 23.0, 29.0, 27.0, 40.0, 44.0, 37.0, 40.0, 45.0, 58.0, 58.0, 43.0, 41.0, 37.0, 58.0, 36.0, 41.0, 35.0, 38.0, 29.0, 30.0, 19.0, 20.0, 8.0, 11.0, 10.0, 5.0, 9.0, 6.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.380751848220825, -3.2809531688690186, -3.181154727935791, -3.0813560485839844, -2.981557607650757, -2.88175892829895, -2.7819604873657227, -2.682161808013916, -2.5823631286621094, -2.4825644493103027, -2.382766008377075, -2.2829673290252686, -2.183168888092041, -2.0833702087402344, -1.9835716485977173, -1.8837730884552002, -1.7839746475219727, -1.6841760873794556, -1.5843775272369385, -1.4845788478851318, -1.3847804069519043, -1.2849817276000977, -1.1851831674575806, -1.0853846073150635, -0.9855860471725464, -0.8857874870300293, -0.7859889268875122, -0.6861903071403503, -0.5863917469978333, -0.48659318685531616, -0.3867945671081543, -0.2869960069656372, -0.18719744682312012, -0.08739887177944183, 0.01239970326423645, 0.11219829320907593, 0.21199685335159302, 0.3117954134941101, 0.411594033241272, 0.5113925933837891, 0.6111911535263062, 0.7109897136688232, 0.8107882738113403, 0.9105868935585022, 1.010385513305664, 1.1101839542388916, 1.2099826335906982, 1.3097811937332153, 1.4095797538757324, 1.5093783140182495, 1.6091768741607666, 1.7089755535125732, 1.8087739944458008, 1.9085726737976074, 2.008371353149414, 2.1081697940826416, 2.207968235015869, 2.307766914367676, 2.4075653553009033, 2.50736403465271, 2.6071624755859375, 2.706961154937744, 2.806759834289551, 2.9065582752227783, 3.006356954574585]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 14.0, 9.0, 15.0, 18.0, 31.0, 28.0, 22.0, 22.0, 38.0, 47.0, 47.0, 39.0, 44.0, 48.0, 46.0, 47.0, 44.0, 50.0, 53.0, 43.0, 31.0, 37.0, 26.0, 35.0, 28.0, 23.0, 22.0, 13.0, 11.0, 12.0, 8.0, 12.0, 7.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2223832607269287, -3.131322145462036, -3.0402612686157227, -2.94920015335083, -2.8581392765045166, -2.767078161239624, -2.6760172843933105, -2.584956169128418, -2.4938952922821045, -2.402834177017212, -2.3117733001708984, -2.220712184906006, -2.1296513080596924, -2.0385901927948, -1.9475293159484863, -1.8564682006835938, -1.7654072046279907, -1.6743462085723877, -1.5832852125167847, -1.4922242164611816, -1.4011632204055786, -1.3101022243499756, -1.219041109085083, -1.1279802322387695, -1.036919116973877, -0.9458581209182739, -0.8547971248626709, -0.7637361288070679, -0.6726751327514648, -0.5816141366958618, -0.490553081035614, -0.399492084980011, -0.30843114852905273, -0.2173701524734497, -0.12630914151668549, -0.035248130559921265, 0.05581286549568176, 0.1468738615512848, 0.2379348874092102, 0.32899588346481323, 0.42005687952041626, 0.5111178755760193, 0.6021788716316223, 0.6932399272918701, 0.7843009233474731, 0.8753619194030762, 0.9664229154586792, 1.0574839115142822, 1.1485449075698853, 1.2396059036254883, 1.3306668996810913, 1.4217278957366943, 1.5127888917922974, 1.6038498878479004, 1.694911003112793, 1.7859718799591064, 1.877032995223999, 1.968093991279602, 2.059154987335205, 2.1502161026000977, 2.241276979446411, 2.3323380947113037, 2.423398971557617, 2.5144600868225098, 2.6055209636688232]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 18.0, 30.0, 33.0, 53.0, 96.0, 139.0, 209.0, 383.0, 551.0, 872.0, 1520.0, 2234.0, 3653.0, 5774.0, 9396.0, 14681.0, 23514.0, 37424.0, 58179.0, 89889.0, 135010.0, 196010.0, 273121.0, 357394.0, 433796.0, 477430.0, 476084.0, 427041.0, 348518.0, 263653.0, 188259.0, 129091.0, 86045.0, 56027.0, 35856.0, 23139.0, 14330.0, 9097.0, 5802.0, 3781.0, 2313.0, 1376.0, 912.0, 588.0, 392.0, 203.0, 140.0, 85.0, 56.0, 37.0, 23.0, 10.0, 10.0, 4.0, 0.0, 1.0], "bins": [-2.603515625, -2.526824951171875, -2.45013427734375, -2.373443603515625, -2.2967529296875, -2.220062255859375, -2.14337158203125, -2.066680908203125, -1.989990234375, -1.913299560546875, -1.83660888671875, -1.759918212890625, -1.6832275390625, -1.606536865234375, -1.52984619140625, -1.453155517578125, -1.37646484375, -1.299774169921875, -1.22308349609375, -1.146392822265625, -1.0697021484375, -0.993011474609375, -0.91632080078125, -0.839630126953125, -0.762939453125, -0.686248779296875, -0.60955810546875, -0.532867431640625, -0.4561767578125, -0.379486083984375, -0.30279541015625, -0.226104736328125, -0.1494140625, -0.072723388671875, 0.00396728515625, 0.080657958984375, 0.1573486328125, 0.234039306640625, 0.31072998046875, 0.387420654296875, 0.464111328125, 0.540802001953125, 0.61749267578125, 0.694183349609375, 0.7708740234375, 0.847564697265625, 0.92425537109375, 1.000946044921875, 1.07763671875, 1.154327392578125, 1.23101806640625, 1.307708740234375, 1.3843994140625, 1.461090087890625, 1.53778076171875, 1.614471435546875, 1.691162109375, 1.767852783203125, 1.84454345703125, 1.921234130859375, 1.9979248046875, 2.074615478515625, 2.15130615234375, 2.227996826171875, 2.3046875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 8.0, 7.0, 15.0, 12.0, 20.0, 21.0, 21.0, 28.0, 31.0, 21.0, 38.0, 36.0, 35.0, 28.0, 43.0, 44.0, 42.0, 36.0, 41.0, 36.0, 35.0, 40.0, 39.0, 43.0, 34.0, 27.0, 29.0, 27.0, 21.0, 15.0, 16.0, 20.0, 13.0, 8.0, 12.0, 9.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.51953125, -2.44488525390625, -2.3702392578125, -2.29559326171875, -2.220947265625, -2.14630126953125, -2.0716552734375, -1.99700927734375, -1.92236328125, -1.84771728515625, -1.7730712890625, -1.69842529296875, -1.623779296875, -1.54913330078125, -1.4744873046875, -1.39984130859375, -1.3251953125, -1.25054931640625, -1.1759033203125, -1.10125732421875, -1.026611328125, -0.95196533203125, -0.8773193359375, -0.80267333984375, -0.72802734375, -0.65338134765625, -0.5787353515625, -0.50408935546875, -0.429443359375, -0.35479736328125, -0.2801513671875, -0.20550537109375, -0.130859375, -0.05621337890625, 0.0184326171875, 0.09307861328125, 0.167724609375, 0.24237060546875, 0.3170166015625, 0.39166259765625, 0.46630859375, 0.54095458984375, 0.6156005859375, 0.69024658203125, 0.764892578125, 0.83953857421875, 0.9141845703125, 0.98883056640625, 1.0634765625, 1.13812255859375, 1.2127685546875, 1.28741455078125, 1.362060546875, 1.43670654296875, 1.5113525390625, 1.58599853515625, 1.66064453125, 1.73529052734375, 1.8099365234375, 1.88458251953125, 1.959228515625, 2.03387451171875, 2.1085205078125, 2.18316650390625, 2.2578125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 17.0, 30.0, 37.0, 60.0, 150.0, 199.0, 343.0, 516.0, 971.0, 1584.0, 2661.0, 4390.0, 7488.0, 12211.0, 20286.0, 33354.0, 52782.0, 83153.0, 126253.0, 185615.0, 256432.0, 337553.0, 411129.0, 460870.0, 470288.0, 436930.0, 369702.0, 290521.0, 213802.0, 148934.0, 98340.0, 64092.0, 40372.0, 25074.0, 15222.0, 9164.0, 5486.0, 3356.0, 1996.0, 1157.0, 684.0, 459.0, 232.0, 145.0, 95.0, 57.0, 30.0, 19.0, 7.0, 10.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.923828125, -2.83013916015625, -2.7364501953125, -2.64276123046875, -2.549072265625, -2.45538330078125, -2.3616943359375, -2.26800537109375, -2.17431640625, -2.08062744140625, -1.9869384765625, -1.89324951171875, -1.799560546875, -1.70587158203125, -1.6121826171875, -1.51849365234375, -1.4248046875, -1.33111572265625, -1.2374267578125, -1.14373779296875, -1.050048828125, -0.95635986328125, -0.8626708984375, -0.76898193359375, -0.67529296875, -0.58160400390625, -0.4879150390625, -0.39422607421875, -0.300537109375, -0.20684814453125, -0.1131591796875, -0.01947021484375, 0.07421875, 0.16790771484375, 0.2615966796875, 0.35528564453125, 0.448974609375, 0.54266357421875, 0.6363525390625, 0.73004150390625, 0.82373046875, 0.91741943359375, 1.0111083984375, 1.10479736328125, 1.198486328125, 1.29217529296875, 1.3858642578125, 1.47955322265625, 1.5732421875, 1.66693115234375, 1.7606201171875, 1.85430908203125, 1.947998046875, 2.04168701171875, 2.1353759765625, 2.22906494140625, 2.32275390625, 2.41644287109375, 2.5101318359375, 2.60382080078125, 2.697509765625, 2.79119873046875, 2.8848876953125, 2.97857666015625, 3.072265625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 11.0, 10.0, 21.0, 25.0, 37.0, 37.0, 46.0, 67.0, 77.0, 105.0, 140.0, 169.0, 193.0, 221.0, 237.0, 236.0, 261.0, 271.0, 256.0, 265.0, 249.0, 212.0, 187.0, 153.0, 144.0, 109.0, 77.0, 70.0, 56.0, 37.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.857818603515625, -1.80548095703125, -1.753143310546875, -1.7008056640625, -1.648468017578125, -1.59613037109375, -1.543792724609375, -1.491455078125, -1.439117431640625, -1.38677978515625, -1.334442138671875, -1.2821044921875, -1.229766845703125, -1.17742919921875, -1.125091552734375, -1.07275390625, -1.020416259765625, -0.96807861328125, -0.915740966796875, -0.8634033203125, -0.811065673828125, -0.75872802734375, -0.706390380859375, -0.654052734375, -0.601715087890625, -0.54937744140625, -0.497039794921875, -0.4447021484375, -0.392364501953125, -0.34002685546875, -0.287689208984375, -0.2353515625, -0.183013916015625, -0.13067626953125, -0.078338623046875, -0.0260009765625, 0.026336669921875, 0.07867431640625, 0.131011962890625, 0.183349609375, 0.235687255859375, 0.28802490234375, 0.340362548828125, 0.3927001953125, 0.445037841796875, 0.49737548828125, 0.549713134765625, 0.60205078125, 0.654388427734375, 0.70672607421875, 0.759063720703125, 0.8114013671875, 0.863739013671875, 0.91607666015625, 0.968414306640625, 1.020751953125, 1.073089599609375, 1.12542724609375, 1.177764892578125, 1.2301025390625, 1.282440185546875, 1.33477783203125, 1.387115478515625, 1.439453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 0.0, 4.0, 7.0, 11.0, 13.0, 9.0, 26.0, 19.0, 23.0, 32.0, 36.0, 46.0, 33.0, 49.0, 54.0, 52.0, 53.0, 45.0, 43.0, 52.0, 35.0, 39.0, 44.0, 41.0, 38.0, 30.0, 21.0, 29.0, 27.0, 13.0, 17.0, 11.0, 14.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.072996139526367, -3.9328458309173584, -3.7926955223083496, -3.6525449752807617, -3.512394666671753, -3.372244358062744, -3.2320938110351562, -3.0919435024261475, -2.9517931938171387, -2.81164288520813, -2.671492576599121, -2.531342029571533, -2.3911917209625244, -2.2510414123535156, -2.1108908653259277, -1.970740556716919, -1.8305902481079102, -1.6904399394989014, -1.550289511680603, -1.4101390838623047, -1.269988775253296, -1.129838466644287, -0.9896880388259888, -0.8495376706123352, -0.7093873023986816, -0.5692369341850281, -0.4290865659713745, -0.28893619775772095, -0.14878582954406738, -0.008635461330413818, 0.13151490688323975, 0.2716652750968933, 0.4118156433105469, 0.5519660115242004, 0.692116379737854, 0.8322667479515076, 0.9724171161651611, 1.11256742477417, 1.2527178525924683, 1.3928682804107666, 1.5330185890197754, 1.6731688976287842, 1.8133193254470825, 1.9534697532653809, 2.0936200618743896, 2.2337703704833984, 2.3739209175109863, 2.514071226119995, 2.654221534729004, 2.7943718433380127, 2.9345221519470215, 3.0746726989746094, 3.214823007583618, 3.354973316192627, 3.495123863220215, 3.6352741718292236, 3.7754244804382324, 3.915574789047241, 4.05572509765625, 4.195875644683838, 4.336026191711426, 4.4761762619018555, 4.616326808929443, 4.756476879119873, 4.896627426147461]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 8.0, 6.0, 10.0, 7.0, 17.0, 19.0, 21.0, 27.0, 21.0, 23.0, 25.0, 35.0, 27.0, 33.0, 43.0, 38.0, 49.0, 49.0, 43.0, 33.0, 44.0, 41.0, 27.0, 42.0, 35.0, 33.0, 37.0, 23.0, 22.0, 23.0, 18.0, 16.0, 15.0, 16.0, 12.0, 13.0, 9.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5045316219329834, -3.404284715652466, -3.3040378093719482, -3.2037906646728516, -3.103543758392334, -3.0032968521118164, -2.903049945831299, -2.8028030395507812, -2.7025561332702637, -2.602309226989746, -2.5020623207092285, -2.401815414428711, -2.3015682697296143, -2.2013213634490967, -2.101074457168579, -2.0008275508880615, -1.9005804061889648, -1.8003334999084473, -1.7000864744186401, -1.5998395681381226, -1.4995925426483154, -1.3993456363677979, -1.2990987300872803, -1.1988518238067627, -1.0986047983169556, -0.9983578324317932, -0.8981108665466309, -0.7978639602661133, -0.6976169943809509, -0.5973700284957886, -0.497123122215271, -0.39687615633010864, -0.2966291904449463, -0.19638223946094513, -0.09613528847694397, 0.004111647605895996, 0.10435861349105835, 0.2046055793762207, 0.3048524856567383, 0.40509945154190063, 0.505346417427063, 0.6055933833122253, 0.7058403491973877, 0.8060872554779053, 0.9063342213630676, 1.00658118724823, 1.1068280935287476, 1.2070751190185547, 1.3073220252990723, 1.4075689315795898, 1.507815957069397, 1.6080628633499146, 1.7083098888397217, 1.8085567951202393, 1.9088037014007568, 2.0090506076812744, 2.109297752380371, 2.2095446586608887, 2.3097915649414062, 2.410038471221924, 2.5102856159210205, 2.610532522201538, 2.7107794284820557, 2.8110263347625732, 2.911273241043091]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 13.0, 9.0, 23.0, 22.0, 34.0, 55.0, 73.0, 90.0, 147.0, 235.0, 343.0, 439.0, 689.0, 1109.0, 1684.0, 2623.0, 3833.0, 6033.0, 9165.0, 13924.0, 21680.0, 33252.0, 50761.0, 75719.0, 108031.0, 142434.0, 154598.0, 132006.0, 96595.0, 65967.0, 44188.0, 28847.0, 18870.0, 12162.0, 7925.0, 5136.0, 3365.0, 2198.0, 1416.0, 935.0, 663.0, 417.0, 282.0, 195.0, 108.0, 90.0, 68.0, 36.0, 19.0, 17.0, 12.0, 7.0, 10.0, 5.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.71826171875, -0.696044921875, -0.673828125, -0.651611328125, -0.62939453125, -0.607177734375, -0.5849609375, -0.562744140625, -0.54052734375, -0.518310546875, -0.49609375, -0.473876953125, -0.45166015625, -0.429443359375, -0.4072265625, -0.385009765625, -0.36279296875, -0.340576171875, -0.318359375, -0.296142578125, -0.27392578125, -0.251708984375, -0.2294921875, -0.207275390625, -0.18505859375, -0.162841796875, -0.140625, -0.118408203125, -0.09619140625, -0.073974609375, -0.0517578125, -0.029541015625, -0.00732421875, 0.014892578125, 0.037109375, 0.059326171875, 0.08154296875, 0.103759765625, 0.1259765625, 0.148193359375, 0.17041015625, 0.192626953125, 0.21484375, 0.237060546875, 0.25927734375, 0.281494140625, 0.3037109375, 0.325927734375, 0.34814453125, 0.370361328125, 0.392578125, 0.414794921875, 0.43701171875, 0.459228515625, 0.4814453125, 0.503662109375, 0.52587890625, 0.548095703125, 0.5703125, 0.592529296875, 0.61474609375, 0.636962890625, 0.6591796875, 0.681396484375, 0.70361328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 11.0, 22.0, 18.0, 22.0, 27.0, 30.0, 30.0, 42.0, 39.0, 37.0, 29.0, 45.0, 74.0, 59.0, 51.0, 57.0, 44.0, 53.0, 34.0, 33.0, 26.0, 34.0, 30.0, 24.0, 20.0, 13.0, 12.0, 14.0, 11.0, 6.0, 7.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.96075439453125, -3.8316650390625, -3.70257568359375, -3.573486328125, -3.44439697265625, -3.3153076171875, -3.18621826171875, -3.05712890625, -2.92803955078125, -2.7989501953125, -2.66986083984375, -2.540771484375, -2.41168212890625, -2.2825927734375, -2.15350341796875, -2.0244140625, -1.89532470703125, -1.7662353515625, -1.63714599609375, -1.508056640625, -1.37896728515625, -1.2498779296875, -1.12078857421875, -0.99169921875, -0.86260986328125, -0.7335205078125, -0.60443115234375, -0.475341796875, -0.34625244140625, -0.2171630859375, -0.08807373046875, 0.041015625, 0.17010498046875, 0.2991943359375, 0.42828369140625, 0.557373046875, 0.68646240234375, 0.8155517578125, 0.94464111328125, 1.07373046875, 1.20281982421875, 1.3319091796875, 1.46099853515625, 1.590087890625, 1.71917724609375, 1.8482666015625, 1.97735595703125, 2.1064453125, 2.23553466796875, 2.3646240234375, 2.49371337890625, 2.622802734375, 2.75189208984375, 2.8809814453125, 3.01007080078125, 3.13916015625, 3.26824951171875, 3.3973388671875, 3.52642822265625, 3.655517578125, 3.78460693359375, 3.9136962890625, 4.04278564453125, 4.171875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 9.0, 4.0, 6.0, 5.0, 15.0, 20.0, 28.0, 26.0, 55.0, 47.0, 87.0, 128.0, 216.0, 266.0, 465.0, 709.0, 990.0, 1555.0, 2407.0, 3710.0, 6013.0, 9889.0, 16661.0, 28912.0, 50259.0, 86383.0, 141128.0, 196176.0, 187269.0, 128610.0, 77118.0, 44587.0, 25592.0, 15111.0, 8983.0, 5521.0, 3291.0, 2174.0, 1369.0, 935.0, 576.0, 389.0, 267.0, 177.0, 139.0, 87.0, 50.0, 45.0, 41.0, 18.0, 15.0, 10.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.87841796875, -0.8499832153320312, -0.8215484619140625, -0.7931137084960938, -0.764678955078125, -0.7362442016601562, -0.7078094482421875, -0.6793746948242188, -0.65093994140625, -0.6225051879882812, -0.5940704345703125, -0.5656356811523438, -0.537200927734375, -0.5087661743164062, -0.4803314208984375, -0.45189666748046875, -0.4234619140625, -0.39502716064453125, -0.3665924072265625, -0.33815765380859375, -0.309722900390625, -0.28128814697265625, -0.2528533935546875, -0.22441864013671875, -0.19598388671875, -0.16754913330078125, -0.1391143798828125, -0.11067962646484375, -0.082244873046875, -0.05381011962890625, -0.0253753662109375, 0.00305938720703125, 0.031494140625, 0.05992889404296875, 0.0883636474609375, 0.11679840087890625, 0.145233154296875, 0.17366790771484375, 0.2021026611328125, 0.23053741455078125, 0.25897216796875, 0.28740692138671875, 0.3158416748046875, 0.34427642822265625, 0.372711181640625, 0.40114593505859375, 0.4295806884765625, 0.45801544189453125, 0.4864501953125, 0.5148849487304688, 0.5433197021484375, 0.5717544555664062, 0.600189208984375, 0.6286239624023438, 0.6570587158203125, 0.6854934692382812, 0.71392822265625, 0.7423629760742188, 0.7707977294921875, 0.7992324829101562, 0.827667236328125, 0.8561019897460938, 0.8845367431640625, 0.9129714965820312, 0.94140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 11.0, 3.0, 9.0, 16.0, 14.0, 18.0, 23.0, 35.0, 20.0, 29.0, 43.0, 28.0, 37.0, 34.0, 44.0, 48.0, 46.0, 46.0, 43.0, 39.0, 39.0, 46.0, 35.0, 40.0, 39.0, 22.0, 31.0, 20.0, 18.0, 22.0, 15.0, 20.0, 10.0, 12.0, 8.0, 5.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.19921875, -2.129913330078125, -2.06060791015625, -1.991302490234375, -1.9219970703125, -1.852691650390625, -1.78338623046875, -1.714080810546875, -1.644775390625, -1.575469970703125, -1.50616455078125, -1.436859130859375, -1.3675537109375, -1.298248291015625, -1.22894287109375, -1.159637451171875, -1.09033203125, -1.021026611328125, -0.95172119140625, -0.882415771484375, -0.8131103515625, -0.743804931640625, -0.67449951171875, -0.605194091796875, -0.535888671875, -0.466583251953125, -0.39727783203125, -0.327972412109375, -0.2586669921875, -0.189361572265625, -0.12005615234375, -0.050750732421875, 0.0185546875, 0.087860107421875, 0.15716552734375, 0.226470947265625, 0.2957763671875, 0.365081787109375, 0.43438720703125, 0.503692626953125, 0.572998046875, 0.642303466796875, 0.71160888671875, 0.780914306640625, 0.8502197265625, 0.919525146484375, 0.98883056640625, 1.058135986328125, 1.12744140625, 1.196746826171875, 1.26605224609375, 1.335357666015625, 1.4046630859375, 1.473968505859375, 1.54327392578125, 1.612579345703125, 1.681884765625, 1.751190185546875, 1.82049560546875, 1.889801025390625, 1.9591064453125, 2.028411865234375, 2.09771728515625, 2.167022705078125, 2.236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 12.0, 14.0, 19.0, 30.0, 27.0, 53.0, 68.0, 86.0, 121.0, 183.0, 231.0, 312.0, 435.0, 664.0, 998.0, 1571.0, 2386.0, 3781.0, 6264.0, 10953.0, 20913.0, 45324.0, 118264.0, 341696.0, 305237.0, 103039.0, 40309.0, 19148.0, 10149.0, 5838.0, 3511.0, 2320.0, 1453.0, 948.0, 661.0, 456.0, 292.0, 191.0, 162.0, 121.0, 73.0, 59.0, 48.0, 36.0, 28.0, 23.0, 10.0, 11.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.517578125, -0.5008468627929688, -0.4841156005859375, -0.46738433837890625, -0.450653076171875, -0.43392181396484375, -0.4171905517578125, -0.40045928955078125, -0.38372802734375, -0.36699676513671875, -0.3502655029296875, -0.33353424072265625, -0.316802978515625, -0.30007171630859375, -0.2833404541015625, -0.26660919189453125, -0.2498779296875, -0.23314666748046875, -0.2164154052734375, -0.19968414306640625, -0.182952880859375, -0.16622161865234375, -0.1494903564453125, -0.13275909423828125, -0.11602783203125, -0.09929656982421875, -0.0825653076171875, -0.06583404541015625, -0.049102783203125, -0.03237152099609375, -0.0156402587890625, 0.00109100341796875, 0.017822265625, 0.03455352783203125, 0.0512847900390625, 0.06801605224609375, 0.084747314453125, 0.10147857666015625, 0.1182098388671875, 0.13494110107421875, 0.15167236328125, 0.16840362548828125, 0.1851348876953125, 0.20186614990234375, 0.218597412109375, 0.23532867431640625, 0.2520599365234375, 0.26879119873046875, 0.2855224609375, 0.30225372314453125, 0.3189849853515625, 0.33571624755859375, 0.352447509765625, 0.36917877197265625, 0.3859100341796875, 0.40264129638671875, 0.41937255859375, 0.43610382080078125, 0.4528350830078125, 0.46956634521484375, 0.486297607421875, 0.5030288696289062, 0.5197601318359375, 0.5364913940429688, 0.55322265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 8.0, 4.0, 4.0, 12.0, 14.0, 17.0, 29.0, 24.0, 34.0, 47.0, 42.0, 55.0, 57.0, 58.0, 49.0, 61.0, 48.0, 52.0, 54.0, 41.0, 52.0, 43.0, 25.0, 29.0, 21.0, 28.0, 13.0, 22.0, 13.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4259090423583984e-05, -2.3513101041316986e-05, -2.2767111659049988e-05, -2.202112227678299e-05, -2.127513289451599e-05, -2.0529143512248993e-05, -1.9783154129981995e-05, -1.9037164747714996e-05, -1.8291175365447998e-05, -1.7545185983181e-05, -1.6799196600914e-05, -1.6053207218647003e-05, -1.5307217836380005e-05, -1.4561228454113007e-05, -1.3815239071846008e-05, -1.306924968957901e-05, -1.2323260307312012e-05, -1.1577270925045013e-05, -1.0831281542778015e-05, -1.0085292160511017e-05, -9.339302778244019e-06, -8.59331339597702e-06, -7.847324013710022e-06, -7.101334631443024e-06, -6.355345249176025e-06, -5.609355866909027e-06, -4.863366484642029e-06, -4.1173771023750305e-06, -3.3713877201080322e-06, -2.625398337841034e-06, -1.8794089555740356e-06, -1.1334195733070374e-06, -3.8743019104003906e-07, 3.5855919122695923e-07, 1.1045485734939575e-06, 1.8505379557609558e-06, 2.596527338027954e-06, 3.3425167202949524e-06, 4.088506102561951e-06, 4.834495484828949e-06, 5.580484867095947e-06, 6.3264742493629456e-06, 7.072463631629944e-06, 7.818453013896942e-06, 8.56444239616394e-06, 9.310431778430939e-06, 1.0056421160697937e-05, 1.0802410542964935e-05, 1.1548399925231934e-05, 1.2294389307498932e-05, 1.304037868976593e-05, 1.3786368072032928e-05, 1.4532357454299927e-05, 1.5278346836566925e-05, 1.6024336218833923e-05, 1.677032560110092e-05, 1.751631498336792e-05, 1.8262304365634918e-05, 1.9008293747901917e-05, 1.9754283130168915e-05, 2.0500272512435913e-05, 2.124626189470291e-05, 2.199225127696991e-05, 2.2738240659236908e-05, 2.3484230041503906e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 7.0, 15.0, 21.0, 32.0, 38.0, 64.0, 67.0, 123.0, 146.0, 231.0, 309.0, 460.0, 692.0, 952.0, 1537.0, 2281.0, 3514.0, 5741.0, 9430.0, 16148.0, 29452.0, 55141.0, 109463.0, 207699.0, 257993.0, 164112.0, 83079.0, 42523.0, 22740.0, 13112.0, 7630.0, 4728.0, 3020.0, 1964.0, 1295.0, 843.0, 580.0, 406.0, 292.0, 217.0, 135.0, 97.0, 60.0, 47.0, 40.0, 23.0, 19.0, 8.0, 3.0, 11.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5765151977539062, -0.5568389892578125, -0.5371627807617188, -0.517486572265625, -0.49781036376953125, -0.4781341552734375, -0.45845794677734375, -0.43878173828125, -0.41910552978515625, -0.3994293212890625, -0.37975311279296875, -0.360076904296875, -0.34040069580078125, -0.3207244873046875, -0.30104827880859375, -0.2813720703125, -0.26169586181640625, -0.2420196533203125, -0.22234344482421875, -0.202667236328125, -0.18299102783203125, -0.1633148193359375, -0.14363861083984375, -0.12396240234375, -0.10428619384765625, -0.0846099853515625, -0.06493377685546875, -0.045257568359375, -0.02558135986328125, -0.0059051513671875, 0.01377105712890625, 0.033447265625, 0.05312347412109375, 0.0727996826171875, 0.09247589111328125, 0.112152099609375, 0.13182830810546875, 0.1515045166015625, 0.17118072509765625, 0.19085693359375, 0.21053314208984375, 0.2302093505859375, 0.24988555908203125, 0.269561767578125, 0.28923797607421875, 0.3089141845703125, 0.32859039306640625, 0.3482666015625, 0.36794281005859375, 0.3876190185546875, 0.40729522705078125, 0.426971435546875, 0.44664764404296875, 0.4663238525390625, 0.48600006103515625, 0.50567626953125, 0.5253524780273438, 0.5450286865234375, 0.5647048950195312, 0.584381103515625, 0.6040573120117188, 0.6237335205078125, 0.6434097290039062, 0.6630859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 9.0, 13.0, 19.0, 23.0, 29.0, 40.0, 41.0, 58.0, 89.0, 102.0, 103.0, 93.0, 94.0, 63.0, 39.0, 35.0, 25.0, 29.0, 19.0, 17.0, 10.0, 10.0, 7.0, 6.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2238025665283203, -0.21750259399414062, -0.21120262145996094, -0.20490264892578125, -0.19860267639160156, -0.19230270385742188, -0.1860027313232422, -0.1797027587890625, -0.1734027862548828, -0.16710281372070312, -0.16080284118652344, -0.15450286865234375, -0.14820289611816406, -0.14190292358398438, -0.1356029510498047, -0.129302978515625, -0.12300300598144531, -0.11670303344726562, -0.11040306091308594, -0.10410308837890625, -0.09780311584472656, -0.09150314331054688, -0.08520317077636719, -0.0789031982421875, -0.07260322570800781, -0.06630325317382812, -0.06000328063964844, -0.05370330810546875, -0.04740333557128906, -0.041103363037109375, -0.03480339050292969, -0.02850341796875, -0.022203445434570312, -0.015903472900390625, -0.009603500366210938, -0.00330352783203125, 0.0029964447021484375, 0.009296417236328125, 0.015596389770507812, 0.0218963623046875, 0.028196334838867188, 0.034496307373046875, 0.04079627990722656, 0.04709625244140625, 0.05339622497558594, 0.059696197509765625, 0.06599617004394531, 0.072296142578125, 0.07859611511230469, 0.08489608764648438, 0.09119606018066406, 0.09749603271484375, 0.10379600524902344, 0.11009597778320312, 0.11639595031738281, 0.1226959228515625, 0.1289958953857422, 0.13529586791992188, 0.14159584045410156, 0.14789581298828125, 0.15419578552246094, 0.16049575805664062, 0.1667957305908203, 0.173095703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 3.0, 7.0, 11.0, 14.0, 12.0, 23.0, 20.0, 20.0, 35.0, 42.0, 41.0, 43.0, 44.0, 53.0, 52.0, 54.0, 45.0, 53.0, 39.0, 37.0, 36.0, 49.0, 39.0, 34.0, 29.0, 26.0, 27.0, 24.0, 11.0, 15.0, 17.0, 12.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.080476760864258, -3.939161539077759, -3.797846555709839, -3.65653133392334, -3.51521635055542, -3.373901128768921, -3.232585906982422, -3.091270923614502, -2.949955940246582, -2.808640718460083, -2.667325735092163, -2.526010513305664, -2.384695529937744, -2.243380308151245, -2.102065086364746, -1.9607501029968262, -1.8194348812103271, -1.6781197786331177, -1.5368046760559082, -1.3954894542694092, -1.2541744709014893, -1.1128592491149902, -0.9715441465377808, -0.8302290439605713, -0.6889139413833618, -0.5475988388061523, -0.4062837064266205, -0.2649685740470886, -0.12365347146987915, 0.017661631107330322, 0.15897679328918457, 0.30029189586639404, 0.4416069984436035, 0.582922101020813, 0.7242372035980225, 0.8655523657798767, 1.0068674087524414, 1.1481826305389404, 1.28949773311615, 1.4308128356933594, 1.5721279382705688, 1.7134430408477783, 1.8547581434249878, 1.9960732460021973, 2.1373884677886963, 2.278703451156616, 2.4200186729431152, 2.561333656311035, 2.702648878097534, 2.843964099884033, 2.985279083251953, 3.126594305038452, 3.267909288406372, 3.409224510192871, 3.550539493560791, 3.69185471534729, 3.833169937133789, 3.974485158920288, 4.115800380706787, 4.257115364074707, 4.398430347442627, 4.539745330810547, 4.681060791015625, 4.822375774383545, 4.963690757751465]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 8.0, 10.0, 9.0, 14.0, 19.0, 25.0, 23.0, 21.0, 21.0, 28.0, 26.0, 33.0, 34.0, 37.0, 44.0, 53.0, 46.0, 44.0, 35.0, 39.0, 46.0, 31.0, 36.0, 36.0, 32.0, 39.0, 21.0, 23.0, 25.0, 16.0, 16.0, 17.0, 17.0, 8.0, 15.0, 8.0, 7.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.544121503829956, -3.4429636001586914, -3.341805934906006, -3.240648031234741, -3.1394901275634766, -3.038332223892212, -2.9371743202209473, -2.8360166549682617, -2.734858751296997, -2.6337008476257324, -2.532543182373047, -2.4313852787017822, -2.3302273750305176, -2.229069471359253, -2.1279115676879883, -2.0267539024353027, -1.925595998764038, -1.8244380950927734, -1.7232803106307983, -1.6221225261688232, -1.5209646224975586, -1.419806718826294, -1.3186489343643188, -1.2174911499023438, -1.116333246231079, -1.0151753425598145, -0.9140175580978394, -0.8128597140312195, -0.7117018699645996, -0.6105440258979797, -0.5093861818313599, -0.40822833776474, -0.3070704936981201, -0.20591264963150024, -0.10475480556488037, -0.003596961498260498, 0.09756088256835938, 0.19871872663497925, 0.2998765707015991, 0.401034414768219, 0.5021922588348389, 0.6033501029014587, 0.7045079469680786, 0.8056657910346985, 0.9068236351013184, 1.007981538772583, 1.109139323234558, 1.2102971076965332, 1.3114550113677979, 1.4126129150390625, 1.5137706995010376, 1.6149284839630127, 1.7160863876342773, 1.817244291305542, 1.918402075767517, 2.019559860229492, 2.120717763900757, 2.2218756675720215, 2.323033332824707, 2.4241912364959717, 2.5253491401672363, 2.626507043838501, 2.7276649475097656, 2.828822612762451, 2.929980516433716]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 11.0, 8.0, 18.0, 31.0, 49.0, 64.0, 105.0, 193.0, 297.0, 452.0, 777.0, 1245.0, 1996.0, 3214.0, 5219.0, 8187.0, 13202.0, 20357.0, 30115.0, 43785.0, 60437.0, 78977.0, 97139.0, 110044.0, 114605.0, 108107.0, 94781.0, 75695.0, 57701.0, 41740.0, 28295.0, 18724.0, 12187.0, 7927.0, 4833.0, 3035.0, 1904.0, 1158.0, 761.0, 446.0, 248.0, 180.0, 114.0, 69.0, 46.0, 35.0, 15.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-2.095703125, -2.03106689453125, -1.9664306640625, -1.90179443359375, -1.837158203125, -1.77252197265625, -1.7078857421875, -1.64324951171875, -1.57861328125, -1.51397705078125, -1.4493408203125, -1.38470458984375, -1.320068359375, -1.25543212890625, -1.1907958984375, -1.12615966796875, -1.0615234375, -0.99688720703125, -0.9322509765625, -0.86761474609375, -0.802978515625, -0.73834228515625, -0.6737060546875, -0.60906982421875, -0.54443359375, -0.47979736328125, -0.4151611328125, -0.35052490234375, -0.285888671875, -0.22125244140625, -0.1566162109375, -0.09197998046875, -0.02734375, 0.03729248046875, 0.1019287109375, 0.16656494140625, 0.231201171875, 0.29583740234375, 0.3604736328125, 0.42510986328125, 0.48974609375, 0.55438232421875, 0.6190185546875, 0.68365478515625, 0.748291015625, 0.81292724609375, 0.8775634765625, 0.94219970703125, 1.0068359375, 1.07147216796875, 1.1361083984375, 1.20074462890625, 1.265380859375, 1.33001708984375, 1.3946533203125, 1.45928955078125, 1.52392578125, 1.58856201171875, 1.6531982421875, 1.71783447265625, 1.782470703125, 1.84710693359375, 1.9117431640625, 1.97637939453125, 2.041015625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 7.0, 8.0, 12.0, 14.0, 22.0, 13.0, 14.0, 22.0, 31.0, 28.0, 22.0, 29.0, 33.0, 33.0, 42.0, 33.0, 40.0, 40.0, 52.0, 35.0, 34.0, 40.0, 32.0, 31.0, 41.0, 26.0, 30.0, 20.0, 28.0, 22.0, 30.0, 16.0, 20.0, 12.0, 15.0, 9.0, 8.0, 11.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.916015625, -2.81646728515625, -2.7169189453125, -2.61737060546875, -2.517822265625, -2.41827392578125, -2.3187255859375, -2.21917724609375, -2.11962890625, -2.02008056640625, -1.9205322265625, -1.82098388671875, -1.721435546875, -1.62188720703125, -1.5223388671875, -1.42279052734375, -1.3232421875, -1.22369384765625, -1.1241455078125, -1.02459716796875, -0.925048828125, -0.82550048828125, -0.7259521484375, -0.62640380859375, -0.52685546875, -0.42730712890625, -0.3277587890625, -0.22821044921875, -0.128662109375, -0.02911376953125, 0.0704345703125, 0.16998291015625, 0.26953125, 0.36907958984375, 0.4686279296875, 0.56817626953125, 0.667724609375, 0.76727294921875, 0.8668212890625, 0.96636962890625, 1.06591796875, 1.16546630859375, 1.2650146484375, 1.36456298828125, 1.464111328125, 1.56365966796875, 1.6632080078125, 1.76275634765625, 1.8623046875, 1.96185302734375, 2.0614013671875, 2.16094970703125, 2.260498046875, 2.36004638671875, 2.4595947265625, 2.55914306640625, 2.65869140625, 2.75823974609375, 2.8577880859375, 2.95733642578125, 3.056884765625, 3.15643310546875, 3.2559814453125, 3.35552978515625, 3.455078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 13.0, 20.0, 28.0, 34.0, 52.0, 76.0, 122.0, 169.0, 260.0, 371.0, 561.0, 795.0, 1264.0, 1997.0, 2851.0, 4440.0, 6644.0, 10105.0, 15290.0, 22611.0, 32520.0, 46036.0, 61666.0, 78470.0, 94495.0, 105444.0, 108590.0, 102895.0, 90152.0, 73564.0, 56844.0, 41166.0, 29131.0, 19815.0, 13519.0, 9128.0, 6006.0, 3930.0, 2503.0, 1688.0, 1076.0, 753.0, 487.0, 291.0, 232.0, 140.0, 96.0, 81.0, 41.0, 30.0, 17.0, 18.0, 11.0, 8.0, 2.0, 4.0, 2.0], "bins": [-2.224609375, -2.15789794921875, -2.0911865234375, -2.02447509765625, -1.957763671875, -1.89105224609375, -1.8243408203125, -1.75762939453125, -1.69091796875, -1.62420654296875, -1.5574951171875, -1.49078369140625, -1.424072265625, -1.35736083984375, -1.2906494140625, -1.22393798828125, -1.1572265625, -1.09051513671875, -1.0238037109375, -0.95709228515625, -0.890380859375, -0.82366943359375, -0.7569580078125, -0.69024658203125, -0.62353515625, -0.55682373046875, -0.4901123046875, -0.42340087890625, -0.356689453125, -0.28997802734375, -0.2232666015625, -0.15655517578125, -0.08984375, -0.02313232421875, 0.0435791015625, 0.11029052734375, 0.177001953125, 0.24371337890625, 0.3104248046875, 0.37713623046875, 0.44384765625, 0.51055908203125, 0.5772705078125, 0.64398193359375, 0.710693359375, 0.77740478515625, 0.8441162109375, 0.91082763671875, 0.9775390625, 1.04425048828125, 1.1109619140625, 1.17767333984375, 1.244384765625, 1.31109619140625, 1.3778076171875, 1.44451904296875, 1.51123046875, 1.57794189453125, 1.6446533203125, 1.71136474609375, 1.778076171875, 1.84478759765625, 1.9114990234375, 1.97821044921875, 2.044921875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 14.0, 10.0, 17.0, 9.0, 18.0, 23.0, 27.0, 21.0, 22.0, 24.0, 25.0, 35.0, 39.0, 38.0, 37.0, 34.0, 48.0, 25.0, 31.0, 50.0, 42.0, 35.0, 27.0, 42.0, 29.0, 34.0, 28.0, 17.0, 32.0, 19.0, 25.0, 19.0, 13.0, 12.0, 14.0, 4.0, 8.0, 3.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7529296875, -1.6934661865234375, -1.634002685546875, -1.5745391845703125, -1.51507568359375, -1.4556121826171875, -1.396148681640625, -1.3366851806640625, -1.2772216796875, -1.2177581787109375, -1.158294677734375, -1.0988311767578125, -1.03936767578125, -0.9799041748046875, -0.920440673828125, -0.8609771728515625, -0.801513671875, -0.7420501708984375, -0.682586669921875, -0.6231231689453125, -0.56365966796875, -0.5041961669921875, -0.444732666015625, -0.3852691650390625, -0.3258056640625, -0.2663421630859375, -0.206878662109375, -0.1474151611328125, -0.08795166015625, -0.0284881591796875, 0.030975341796875, 0.0904388427734375, 0.14990234375, 0.2093658447265625, 0.268829345703125, 0.3282928466796875, 0.38775634765625, 0.4472198486328125, 0.506683349609375, 0.5661468505859375, 0.6256103515625, 0.6850738525390625, 0.744537353515625, 0.8040008544921875, 0.86346435546875, 0.9229278564453125, 0.982391357421875, 1.0418548583984375, 1.101318359375, 1.1607818603515625, 1.220245361328125, 1.2797088623046875, 1.33917236328125, 1.3986358642578125, 1.458099365234375, 1.5175628662109375, 1.5770263671875, 1.6364898681640625, 1.695953369140625, 1.7554168701171875, 1.81488037109375, 1.8743438720703125, 1.933807373046875, 1.9932708740234375, 2.052734375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 16.0, 22.0, 30.0, 46.0, 76.0, 79.0, 131.0, 193.0, 255.0, 378.0, 536.0, 785.0, 1254.0, 1834.0, 2872.0, 4855.0, 8611.0, 16627.0, 33492.0, 67499.0, 124095.0, 183565.0, 206651.0, 170396.0, 107148.0, 56342.0, 27984.0, 13730.0, 7178.0, 4145.0, 2610.0, 1604.0, 1100.0, 774.0, 491.0, 324.0, 245.0, 167.0, 120.0, 82.0, 72.0, 46.0, 33.0, 13.0, 13.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7421875, -1.6866455078125, -1.631103515625, -1.5755615234375, -1.52001953125, -1.4644775390625, -1.408935546875, -1.3533935546875, -1.2978515625, -1.2423095703125, -1.186767578125, -1.1312255859375, -1.07568359375, -1.0201416015625, -0.964599609375, -0.9090576171875, -0.853515625, -0.7979736328125, -0.742431640625, -0.6868896484375, -0.63134765625, -0.5758056640625, -0.520263671875, -0.4647216796875, -0.4091796875, -0.3536376953125, -0.298095703125, -0.2425537109375, -0.18701171875, -0.1314697265625, -0.075927734375, -0.0203857421875, 0.03515625, 0.0906982421875, 0.146240234375, 0.2017822265625, 0.25732421875, 0.3128662109375, 0.368408203125, 0.4239501953125, 0.4794921875, 0.5350341796875, 0.590576171875, 0.6461181640625, 0.70166015625, 0.7572021484375, 0.812744140625, 0.8682861328125, 0.923828125, 0.9793701171875, 1.034912109375, 1.0904541015625, 1.14599609375, 1.2015380859375, 1.257080078125, 1.3126220703125, 1.3681640625, 1.4237060546875, 1.479248046875, 1.5347900390625, 1.59033203125, 1.6458740234375, 1.701416015625, 1.7569580078125, 1.8125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 4.0, 12.0, 10.0, 29.0, 29.0, 43.0, 40.0, 56.0, 83.0, 86.0, 82.0, 88.0, 71.0, 68.0, 81.0, 56.0, 31.0, 26.0, 28.0, 13.0, 10.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002448558807373047, -0.00023787468671798706, -0.00023089349269866943, -0.0002239122986793518, -0.00021693110466003418, -0.00020994991064071655, -0.00020296871662139893, -0.0001959875226020813, -0.00018900632858276367, -0.00018202513456344604, -0.00017504394054412842, -0.0001680627465248108, -0.00016108155250549316, -0.00015410035848617554, -0.0001471191644668579, -0.00014013797044754028, -0.00013315677642822266, -0.00012617558240890503, -0.0001191943883895874, -0.00011221319437026978, -0.00010523200035095215, -9.825080633163452e-05, -9.12696123123169e-05, -8.428841829299927e-05, -7.730722427368164e-05, -7.032603025436401e-05, -6.334483623504639e-05, -5.636364221572876e-05, -4.938244819641113e-05, -4.2401254177093506e-05, -3.542006015777588e-05, -2.8438866138458252e-05, -2.1457672119140625e-05, -1.4476478099822998e-05, -7.495284080505371e-06, -5.140900611877441e-07, 6.467103958129883e-06, 1.344829797744751e-05, 2.0429491996765137e-05, 2.7410686016082764e-05, 3.439188003540039e-05, 4.137307405471802e-05, 4.8354268074035645e-05, 5.533546209335327e-05, 6.23166561126709e-05, 6.929785013198853e-05, 7.627904415130615e-05, 8.326023817062378e-05, 9.02414321899414e-05, 9.722262620925903e-05, 0.00010420382022857666, 0.00011118501424789429, 0.00011816620826721191, 0.00012514740228652954, 0.00013212859630584717, 0.0001391097903251648, 0.00014609098434448242, 0.00015307217836380005, 0.00016005337238311768, 0.0001670345664024353, 0.00017401576042175293, 0.00018099695444107056, 0.00018797814846038818, 0.0001949593424797058, 0.00020194053649902344]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 8.0, 7.0, 14.0, 21.0, 30.0, 44.0, 72.0, 112.0, 151.0, 262.0, 368.0, 567.0, 883.0, 1384.0, 2350.0, 3866.0, 6887.0, 14517.0, 32230.0, 74050.0, 150913.0, 229577.0, 231993.0, 155453.0, 76619.0, 33579.0, 14847.0, 7327.0, 4049.0, 2236.0, 1453.0, 928.0, 612.0, 389.0, 279.0, 164.0, 96.0, 76.0, 40.0, 43.0, 17.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.205078125, -2.1383056640625, -2.071533203125, -2.0047607421875, -1.93798828125, -1.8712158203125, -1.804443359375, -1.7376708984375, -1.6708984375, -1.6041259765625, -1.537353515625, -1.4705810546875, -1.40380859375, -1.3370361328125, -1.270263671875, -1.2034912109375, -1.13671875, -1.0699462890625, -1.003173828125, -0.9364013671875, -0.86962890625, -0.8028564453125, -0.736083984375, -0.6693115234375, -0.6025390625, -0.5357666015625, -0.468994140625, -0.4022216796875, -0.33544921875, -0.2686767578125, -0.201904296875, -0.1351318359375, -0.068359375, -0.0015869140625, 0.065185546875, 0.1319580078125, 0.19873046875, 0.2655029296875, 0.332275390625, 0.3990478515625, 0.4658203125, 0.5325927734375, 0.599365234375, 0.6661376953125, 0.73291015625, 0.7996826171875, 0.866455078125, 0.9332275390625, 1.0, 1.0667724609375, 1.133544921875, 1.2003173828125, 1.26708984375, 1.3338623046875, 1.400634765625, 1.4674072265625, 1.5341796875, 1.6009521484375, 1.667724609375, 1.7344970703125, 1.80126953125, 1.8680419921875, 1.934814453125, 2.0015869140625, 2.068359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 14.0, 16.0, 25.0, 45.0, 51.0, 45.0, 62.0, 68.0, 67.0, 81.0, 90.0, 81.0, 70.0, 52.0, 44.0, 40.0, 39.0, 22.0, 22.0, 11.0, 10.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5912933349609375, -0.572235107421875, -0.5531768798828125, -0.53411865234375, -0.5150604248046875, -0.496002197265625, -0.4769439697265625, -0.4578857421875, -0.4388275146484375, -0.419769287109375, -0.4007110595703125, -0.38165283203125, -0.3625946044921875, -0.343536376953125, -0.3244781494140625, -0.305419921875, -0.2863616943359375, -0.267303466796875, -0.2482452392578125, -0.22918701171875, -0.2101287841796875, -0.191070556640625, -0.1720123291015625, -0.1529541015625, -0.1338958740234375, -0.114837646484375, -0.0957794189453125, -0.07672119140625, -0.0576629638671875, -0.038604736328125, -0.0195465087890625, -0.00048828125, 0.0185699462890625, 0.037628173828125, 0.0566864013671875, 0.07574462890625, 0.0948028564453125, 0.113861083984375, 0.1329193115234375, 0.1519775390625, 0.1710357666015625, 0.190093994140625, 0.2091522216796875, 0.22821044921875, 0.2472686767578125, 0.266326904296875, 0.2853851318359375, 0.304443359375, 0.3235015869140625, 0.342559814453125, 0.3616180419921875, 0.38067626953125, 0.3997344970703125, 0.418792724609375, 0.4378509521484375, 0.4569091796875, 0.4759674072265625, 0.495025634765625, 0.5140838623046875, 0.53314208984375, 0.5522003173828125, 0.571258544921875, 0.5903167724609375, 0.609375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 12.0, 11.0, 18.0, 23.0, 26.0, 28.0, 24.0, 38.0, 46.0, 50.0, 55.0, 48.0, 52.0, 54.0, 43.0, 38.0, 47.0, 36.0, 43.0, 43.0, 36.0, 25.0, 23.0, 23.0, 21.0, 21.0, 21.0, 12.0, 11.0, 12.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.149673938751221, -4.006742000579834, -3.8638100624084473, -3.7208781242370605, -3.577946186065674, -3.435014247894287, -3.2920825481414795, -3.1491506099700928, -3.006218671798706, -2.8632867336273193, -2.7203547954559326, -2.577422857284546, -2.4344911575317383, -2.2915592193603516, -2.148627281188965, -2.005695343017578, -1.8627634048461914, -1.7198314666748047, -1.576899528503418, -1.4339677095413208, -1.291035771369934, -1.1481038331985474, -1.0051720142364502, -0.8622400760650635, -0.7193081378936768, -0.57637619972229, -0.4334443211555481, -0.29051241278648376, -0.14758050441741943, -0.004648566246032715, 0.13828331232070923, 0.28121519088745117, 0.4241471290588379, 0.5670790672302246, 0.7100109457969666, 0.8529428243637085, 0.9958747625350952, 1.138806700706482, 1.281738519668579, 1.4246704578399658, 1.5676023960113525, 1.7105343341827393, 1.853466272354126, 1.9963980913162231, 2.1393299102783203, 2.282261848449707, 2.4251937866210938, 2.5681257247924805, 2.711057662963867, 2.853989601135254, 2.9969215393066406, 3.1398534774780273, 3.282785415649414, 3.425717353820801, 3.5686490535736084, 3.711580991744995, 3.854512929916382, 3.9974448680877686, 4.140376567840576, 4.283308506011963, 4.42624044418335, 4.569172382354736, 4.712104320526123, 4.85503625869751, 4.9979681968688965]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 4.0, 10.0, 11.0, 10.0, 11.0, 13.0, 18.0, 24.0, 18.0, 25.0, 27.0, 28.0, 26.0, 48.0, 37.0, 31.0, 48.0, 44.0, 43.0, 49.0, 37.0, 53.0, 33.0, 47.0, 47.0, 26.0, 26.0, 17.0, 23.0, 25.0, 17.0, 22.0, 20.0, 16.0, 8.0, 10.0, 10.0, 7.0, 5.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0], "bins": [-4.125625133514404, -4.008246421813965, -3.890867233276367, -3.7734885215759277, -3.656109571456909, -3.5387306213378906, -3.421351671218872, -3.3039727210998535, -3.186594009399414, -3.0692150592803955, -2.951836109161377, -2.8344573974609375, -2.717078447341919, -2.5996994972229004, -2.482320547103882, -2.3649415969848633, -2.2475626468658447, -2.130183696746826, -2.0128047466278076, -1.8954259157180786, -1.7780470848083496, -1.660668134689331, -1.5432891845703125, -1.425910234451294, -1.308531403541565, -1.1911524534225464, -1.0737736225128174, -0.9563946723937988, -0.839015781879425, -0.7216368913650513, -0.6042579412460327, -0.48687905073165894, -0.36950016021728516, -0.2521212697029114, -0.1347423493862152, -0.017363429069519043, 0.10001546144485474, 0.21739435195922852, 0.33477330207824707, 0.45215219259262085, 0.5695310831069946, 0.6869099736213684, 0.8042888641357422, 0.9216678142547607, 1.0390467643737793, 1.1564255952835083, 1.2738045454025269, 1.3911833763122559, 1.5085623264312744, 1.625941276550293, 1.743320107460022, 1.8606990575790405, 1.9780778884887695, 2.095456838607788, 2.2128357887268066, 2.330214738845825, 2.4475936889648438, 2.5649726390838623, 2.682351589202881, 2.7997303009033203, 2.917109251022339, 3.0344882011413574, 3.151867151260376, 3.2692461013793945, 3.386624813079834]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 12.0, 28.0, 34.0, 47.0, 92.0, 123.0, 166.0, 233.0, 398.0, 595.0, 981.0, 1544.0, 2363.0, 3999.0, 6436.0, 10950.0, 18336.0, 31499.0, 55303.0, 95817.0, 166694.0, 284017.0, 452038.0, 634462.0, 716733.0, 624006.0, 437497.0, 271210.0, 160114.0, 91545.0, 52437.0, 30475.0, 17779.0, 10376.0, 6279.0, 3676.0, 2255.0, 1442.0, 898.0, 526.0, 327.0, 211.0, 130.0, 71.0, 44.0, 24.0, 19.0, 13.0, 15.0, 3.0, 0.0, 2.0], "bins": [-5.26953125, -5.125030517578125, -4.98052978515625, -4.836029052734375, -4.6915283203125, -4.547027587890625, -4.40252685546875, -4.258026123046875, -4.113525390625, -3.969024658203125, -3.82452392578125, -3.680023193359375, -3.5355224609375, -3.391021728515625, -3.24652099609375, -3.102020263671875, -2.95751953125, -2.813018798828125, -2.66851806640625, -2.524017333984375, -2.3795166015625, -2.235015869140625, -2.09051513671875, -1.946014404296875, -1.801513671875, -1.657012939453125, -1.51251220703125, -1.368011474609375, -1.2235107421875, -1.079010009765625, -0.93450927734375, -0.790008544921875, -0.6455078125, -0.501007080078125, -0.35650634765625, -0.212005615234375, -0.0675048828125, 0.076995849609375, 0.22149658203125, 0.365997314453125, 0.510498046875, 0.654998779296875, 0.79949951171875, 0.944000244140625, 1.0885009765625, 1.233001708984375, 1.37750244140625, 1.522003173828125, 1.66650390625, 1.811004638671875, 1.95550537109375, 2.100006103515625, 2.2445068359375, 2.389007568359375, 2.53350830078125, 2.678009033203125, 2.822509765625, 2.967010498046875, 3.11151123046875, 3.256011962890625, 3.4005126953125, 3.545013427734375, 3.68951416015625, 3.834014892578125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 4.0, 6.0, 13.0, 12.0, 15.0, 17.0, 20.0, 17.0, 23.0, 28.0, 30.0, 35.0, 42.0, 32.0, 35.0, 38.0, 38.0, 47.0, 50.0, 37.0, 42.0, 37.0, 38.0, 45.0, 39.0, 32.0, 26.0, 29.0, 14.0, 18.0, 20.0, 12.0, 13.0, 17.0, 17.0, 9.0, 7.0, 7.0, 12.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.736328125, -3.61822509765625, -3.5001220703125, -3.38201904296875, -3.263916015625, -3.14581298828125, -3.0277099609375, -2.90960693359375, -2.79150390625, -2.67340087890625, -2.5552978515625, -2.43719482421875, -2.319091796875, -2.20098876953125, -2.0828857421875, -1.96478271484375, -1.8466796875, -1.72857666015625, -1.6104736328125, -1.49237060546875, -1.374267578125, -1.25616455078125, -1.1380615234375, -1.01995849609375, -0.90185546875, -0.78375244140625, -0.6656494140625, -0.54754638671875, -0.429443359375, -0.31134033203125, -0.1932373046875, -0.07513427734375, 0.04296875, 0.16107177734375, 0.2791748046875, 0.39727783203125, 0.515380859375, 0.63348388671875, 0.7515869140625, 0.86968994140625, 0.98779296875, 1.10589599609375, 1.2239990234375, 1.34210205078125, 1.460205078125, 1.57830810546875, 1.6964111328125, 1.81451416015625, 1.9326171875, 2.05072021484375, 2.1688232421875, 2.28692626953125, 2.405029296875, 2.52313232421875, 2.6412353515625, 2.75933837890625, 2.87744140625, 2.99554443359375, 3.1136474609375, 3.23175048828125, 3.349853515625, 3.46795654296875, 3.5860595703125, 3.70416259765625, 3.822265625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 12.0, 19.0, 23.0, 37.0, 65.0, 124.0, 204.0, 294.0, 531.0, 924.0, 1563.0, 2805.0, 4727.0, 8332.0, 14990.0, 27004.0, 48049.0, 86296.0, 150623.0, 250802.0, 395535.0, 558656.0, 673454.0, 642958.0, 499298.0, 337153.0, 208527.0, 123051.0, 69896.0, 38982.0, 21476.0, 11957.0, 6731.0, 3894.0, 2114.0, 1284.0, 774.0, 410.0, 256.0, 169.0, 112.0, 68.0, 48.0, 19.0, 7.0, 8.0, 11.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.4991455078125, -5.314697265625, -5.1302490234375, -4.94580078125, -4.7613525390625, -4.576904296875, -4.3924560546875, -4.2080078125, -4.0235595703125, -3.839111328125, -3.6546630859375, -3.47021484375, -3.2857666015625, -3.101318359375, -2.9168701171875, -2.732421875, -2.5479736328125, -2.363525390625, -2.1790771484375, -1.99462890625, -1.8101806640625, -1.625732421875, -1.4412841796875, -1.2568359375, -1.0723876953125, -0.887939453125, -0.7034912109375, -0.51904296875, -0.3345947265625, -0.150146484375, 0.0343017578125, 0.21875, 0.4031982421875, 0.587646484375, 0.7720947265625, 0.95654296875, 1.1409912109375, 1.325439453125, 1.5098876953125, 1.6943359375, 1.8787841796875, 2.063232421875, 2.2476806640625, 2.43212890625, 2.6165771484375, 2.801025390625, 2.9854736328125, 3.169921875, 3.3543701171875, 3.538818359375, 3.7232666015625, 3.90771484375, 4.0921630859375, 4.276611328125, 4.4610595703125, 4.6455078125, 4.8299560546875, 5.014404296875, 5.1988525390625, 5.38330078125, 5.5677490234375, 5.752197265625, 5.9366455078125, 6.12109375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 10.0, 3.0, 7.0, 9.0, 11.0, 11.0, 28.0, 32.0, 53.0, 57.0, 67.0, 74.0, 97.0, 110.0, 132.0, 141.0, 198.0, 189.0, 231.0, 230.0, 266.0, 244.0, 272.0, 229.0, 228.0, 191.0, 170.0, 145.0, 125.0, 83.0, 94.0, 79.0, 73.0, 48.0, 25.0, 35.0, 25.0, 12.0, 12.0, 4.0, 6.0, 11.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.406463623046875, -2.33441162109375, -2.262359619140625, -2.1903076171875, -2.118255615234375, -2.04620361328125, -1.974151611328125, -1.902099609375, -1.830047607421875, -1.75799560546875, -1.685943603515625, -1.6138916015625, -1.541839599609375, -1.46978759765625, -1.397735595703125, -1.32568359375, -1.253631591796875, -1.18157958984375, -1.109527587890625, -1.0374755859375, -0.965423583984375, -0.89337158203125, -0.821319580078125, -0.749267578125, -0.677215576171875, -0.60516357421875, -0.533111572265625, -0.4610595703125, -0.389007568359375, -0.31695556640625, -0.244903564453125, -0.1728515625, -0.100799560546875, -0.02874755859375, 0.043304443359375, 0.1153564453125, 0.187408447265625, 0.25946044921875, 0.331512451171875, 0.403564453125, 0.475616455078125, 0.54766845703125, 0.619720458984375, 0.6917724609375, 0.763824462890625, 0.83587646484375, 0.907928466796875, 0.97998046875, 1.052032470703125, 1.12408447265625, 1.196136474609375, 1.2681884765625, 1.340240478515625, 1.41229248046875, 1.484344482421875, 1.556396484375, 1.628448486328125, 1.70050048828125, 1.772552490234375, 1.8446044921875, 1.916656494140625, 1.98870849609375, 2.060760498046875, 2.1328125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 5.0, 7.0, 25.0, 11.0, 23.0, 32.0, 38.0, 38.0, 55.0, 56.0, 63.0, 85.0, 72.0, 57.0, 58.0, 45.0, 53.0, 67.0, 34.0, 32.0, 28.0, 21.0, 25.0, 17.0, 9.0, 8.0, 5.0, 10.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.030409812927246, -10.74123764038086, -10.452064514160156, -10.16289234161377, -9.873720169067383, -9.58454704284668, -9.295374870300293, -9.006202697753906, -8.717029571533203, -8.427857398986816, -8.138684272766113, -7.849512100219727, -7.560339450836182, -7.271166801452637, -6.98199462890625, -6.692821979522705, -6.403649806976318, -6.114477157592773, -5.825304985046387, -5.536132335662842, -5.246959686279297, -4.95778751373291, -4.668614864349365, -4.37944221496582, -4.090270042419434, -3.8010976314544678, -3.511924982070923, -3.222752571105957, -2.933579921722412, -2.6444075107574463, -2.3552350997924805, -2.0660624504089355, -1.7768893241882324, -1.487716794013977, -1.1985442638397217, -0.9093718528747559, -0.6201993227005005, -0.3310267925262451, -0.0418543815612793, 0.24731826782226562, 0.5364906787872314, 0.8256632089614868, 1.1148357391357422, 1.404008150100708, 1.6931806802749634, 1.9823532104492188, 2.2715256214141846, 2.5606982707977295, 2.8498706817626953, 3.139043092727661, 3.428215742111206, 3.717388153076172, 4.006560802459717, 4.295733451843262, 4.584905624389648, 4.874078273773193, 5.163250923156738, 5.452423572540283, 5.74159574508667, 6.030768394470215, 6.31994104385376, 6.609113693237305, 6.898285865783691, 7.187458515167236, 7.476630687713623]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 12.0, 20.0, 14.0, 20.0, 22.0, 30.0, 25.0, 25.0, 31.0, 39.0, 46.0, 37.0, 47.0, 54.0, 44.0, 36.0, 49.0, 37.0, 38.0, 39.0, 40.0, 33.0, 36.0, 31.0, 22.0, 14.0, 22.0, 13.0, 16.0, 10.0, 11.0, 10.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.184546947479248, -5.999026775360107, -5.813506603240967, -5.627986907958984, -5.442466735839844, -5.256946563720703, -5.0714263916015625, -4.885906219482422, -4.700386047363281, -4.514865875244141, -4.329345703125, -4.143825531005859, -3.958305835723877, -3.7727856636047363, -3.5872654914855957, -3.401745319366455, -3.2162256240844727, -3.030705451965332, -2.8451855182647705, -2.65966534614563, -2.4741454124450684, -2.2886252403259277, -2.103105068206787, -1.917585015296936, -1.732064962387085, -1.5465449094772339, -1.3610248565673828, -1.1755046844482422, -0.9899846315383911, -0.80446457862854, -0.6189444065093994, -0.43342435359954834, -0.24790382385253906, -0.0623837411403656, 0.12313634157180786, 0.3086564540863037, 0.4941765069961548, 0.6796965599060059, 0.8652167320251465, 1.0507367849349976, 1.2362568378448486, 1.4217768907546997, 1.6072969436645508, 1.7928171157836914, 1.9783371686935425, 2.1638572216033936, 2.349377393722534, 2.5348973274230957, 2.7204174995422363, 2.905937671661377, 3.0914576053619385, 3.276977777481079, 3.4624977111816406, 3.6480178833007812, 3.833538055419922, 4.0190582275390625, 4.204578399658203, 4.390098571777344, 4.575618743896484, 4.761138916015625, 4.946658611297607, 5.132178783416748, 5.317698955535889, 5.503219127655029, 5.688738822937012]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 4.0, 7.0, 13.0, 23.0, 30.0, 39.0, 59.0, 62.0, 120.0, 171.0, 259.0, 464.0, 696.0, 1098.0, 1675.0, 2780.0, 4663.0, 8072.0, 14588.0, 26524.0, 50066.0, 96183.0, 182020.0, 256498.0, 187294.0, 99854.0, 51825.0, 27559.0, 15058.0, 8389.0, 4847.0, 2877.0, 1716.0, 1052.0, 639.0, 432.0, 290.0, 185.0, 137.0, 93.0, 52.0, 33.0, 30.0, 25.0, 15.0, 11.0, 11.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.62890625, -1.577239990234375, -1.52557373046875, -1.473907470703125, -1.4222412109375, -1.370574951171875, -1.31890869140625, -1.267242431640625, -1.215576171875, -1.163909912109375, -1.11224365234375, -1.060577392578125, -1.0089111328125, -0.957244873046875, -0.90557861328125, -0.853912353515625, -0.80224609375, -0.750579833984375, -0.69891357421875, -0.647247314453125, -0.5955810546875, -0.543914794921875, -0.49224853515625, -0.440582275390625, -0.388916015625, -0.337249755859375, -0.28558349609375, -0.233917236328125, -0.1822509765625, -0.130584716796875, -0.07891845703125, -0.027252197265625, 0.0244140625, 0.076080322265625, 0.12774658203125, 0.179412841796875, 0.2310791015625, 0.282745361328125, 0.33441162109375, 0.386077880859375, 0.437744140625, 0.489410400390625, 0.54107666015625, 0.592742919921875, 0.6444091796875, 0.696075439453125, 0.74774169921875, 0.799407958984375, 0.85107421875, 0.902740478515625, 0.95440673828125, 1.006072998046875, 1.0577392578125, 1.109405517578125, 1.16107177734375, 1.212738037109375, 1.264404296875, 1.316070556640625, 1.36773681640625, 1.419403076171875, 1.4710693359375, 1.522735595703125, 1.57440185546875, 1.626068115234375, 1.677734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 7.0, 7.0, 5.0, 11.0, 9.0, 10.0, 17.0, 21.0, 29.0, 22.0, 26.0, 39.0, 27.0, 43.0, 49.0, 43.0, 47.0, 56.0, 33.0, 39.0, 51.0, 44.0, 45.0, 52.0, 32.0, 29.0, 35.0, 24.0, 18.0, 21.0, 21.0, 14.0, 11.0, 12.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.75, -6.53973388671875, -6.3294677734375, -6.11920166015625, -5.908935546875, -5.69866943359375, -5.4884033203125, -5.27813720703125, -5.06787109375, -4.85760498046875, -4.6473388671875, -4.43707275390625, -4.226806640625, -4.01654052734375, -3.8062744140625, -3.59600830078125, -3.3857421875, -3.17547607421875, -2.9652099609375, -2.75494384765625, -2.544677734375, -2.33441162109375, -2.1241455078125, -1.91387939453125, -1.70361328125, -1.49334716796875, -1.2830810546875, -1.07281494140625, -0.862548828125, -0.65228271484375, -0.4420166015625, -0.23175048828125, -0.021484375, 0.18878173828125, 0.3990478515625, 0.60931396484375, 0.819580078125, 1.02984619140625, 1.2401123046875, 1.45037841796875, 1.66064453125, 1.87091064453125, 2.0811767578125, 2.29144287109375, 2.501708984375, 2.71197509765625, 2.9222412109375, 3.13250732421875, 3.3427734375, 3.55303955078125, 3.7633056640625, 3.97357177734375, 4.183837890625, 4.39410400390625, 4.6043701171875, 4.81463623046875, 5.02490234375, 5.23516845703125, 5.4454345703125, 5.65570068359375, 5.865966796875, 6.07623291015625, 6.2864990234375, 6.49676513671875, 6.70703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 6.0, 8.0, 15.0, 27.0, 32.0, 60.0, 94.0, 137.0, 233.0, 357.0, 613.0, 1019.0, 1786.0, 3201.0, 6113.0, 11718.0, 23069.0, 46548.0, 95184.0, 186824.0, 272834.0, 196394.0, 101465.0, 49612.0, 24454.0, 12362.0, 6398.0, 3390.0, 1891.0, 1091.0, 624.0, 394.0, 209.0, 135.0, 93.0, 47.0, 45.0, 22.0, 22.0, 10.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5841522216796875, -1.528656005859375, -1.4731597900390625, -1.41766357421875, -1.3621673583984375, -1.306671142578125, -1.2511749267578125, -1.1956787109375, -1.1401824951171875, -1.084686279296875, -1.0291900634765625, -0.97369384765625, -0.9181976318359375, -0.862701416015625, -0.8072052001953125, -0.751708984375, -0.6962127685546875, -0.640716552734375, -0.5852203369140625, -0.52972412109375, -0.4742279052734375, -0.418731689453125, -0.3632354736328125, -0.3077392578125, -0.2522430419921875, -0.196746826171875, -0.1412506103515625, -0.08575439453125, -0.0302581787109375, 0.025238037109375, 0.0807342529296875, 0.13623046875, 0.1917266845703125, 0.247222900390625, 0.3027191162109375, 0.35821533203125, 0.4137115478515625, 0.469207763671875, 0.5247039794921875, 0.5802001953125, 0.6356964111328125, 0.691192626953125, 0.7466888427734375, 0.80218505859375, 0.8576812744140625, 0.913177490234375, 0.9686737060546875, 1.024169921875, 1.0796661376953125, 1.135162353515625, 1.1906585693359375, 1.24615478515625, 1.3016510009765625, 1.357147216796875, 1.4126434326171875, 1.4681396484375, 1.5236358642578125, 1.579132080078125, 1.6346282958984375, 1.69012451171875, 1.7456207275390625, 1.801116943359375, 1.8566131591796875, 1.912109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 3.0, 10.0, 15.0, 14.0, 11.0, 13.0, 16.0, 20.0, 23.0, 18.0, 22.0, 31.0, 35.0, 36.0, 49.0, 46.0, 42.0, 67.0, 41.0, 39.0, 45.0, 47.0, 50.0, 42.0, 41.0, 41.0, 23.0, 22.0, 24.0, 20.0, 16.0, 10.0, 11.0, 10.0, 14.0, 6.0, 4.0, 1.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.1484375, -4.0252685546875, -3.902099609375, -3.7789306640625, -3.65576171875, -3.5325927734375, -3.409423828125, -3.2862548828125, -3.1630859375, -3.0399169921875, -2.916748046875, -2.7935791015625, -2.67041015625, -2.5472412109375, -2.424072265625, -2.3009033203125, -2.177734375, -2.0545654296875, -1.931396484375, -1.8082275390625, -1.68505859375, -1.5618896484375, -1.438720703125, -1.3155517578125, -1.1923828125, -1.0692138671875, -0.946044921875, -0.8228759765625, -0.69970703125, -0.5765380859375, -0.453369140625, -0.3302001953125, -0.20703125, -0.0838623046875, 0.039306640625, 0.1624755859375, 0.28564453125, 0.4088134765625, 0.531982421875, 0.6551513671875, 0.7783203125, 0.9014892578125, 1.024658203125, 1.1478271484375, 1.27099609375, 1.3941650390625, 1.517333984375, 1.6405029296875, 1.763671875, 1.8868408203125, 2.010009765625, 2.1331787109375, 2.25634765625, 2.3795166015625, 2.502685546875, 2.6258544921875, 2.7490234375, 2.8721923828125, 2.995361328125, 3.1185302734375, 3.24169921875, 3.3648681640625, 3.488037109375, 3.6112060546875, 3.734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 13.0, 11.0, 20.0, 26.0, 52.0, 56.0, 79.0, 140.0, 209.0, 273.0, 449.0, 654.0, 1029.0, 1695.0, 2896.0, 5786.0, 14046.0, 44699.0, 204230.0, 546031.0, 163951.0, 37355.0, 12350.0, 5326.0, 2665.0, 1592.0, 1002.0, 644.0, 405.0, 274.0, 196.0, 134.0, 74.0, 72.0, 30.0, 24.0, 16.0, 13.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8901824951171875, -0.860931396484375, -0.8316802978515625, -0.80242919921875, -0.7731781005859375, -0.743927001953125, -0.7146759033203125, -0.6854248046875, -0.6561737060546875, -0.626922607421875, -0.5976715087890625, -0.56842041015625, -0.5391693115234375, -0.509918212890625, -0.4806671142578125, -0.451416015625, -0.4221649169921875, -0.392913818359375, -0.3636627197265625, -0.33441162109375, -0.3051605224609375, -0.275909423828125, -0.2466583251953125, -0.2174072265625, -0.1881561279296875, -0.158905029296875, -0.1296539306640625, -0.10040283203125, -0.0711517333984375, -0.041900634765625, -0.0126495361328125, 0.0166015625, 0.0458526611328125, 0.075103759765625, 0.1043548583984375, 0.13360595703125, 0.1628570556640625, 0.192108154296875, 0.2213592529296875, 0.2506103515625, 0.2798614501953125, 0.309112548828125, 0.3383636474609375, 0.36761474609375, 0.3968658447265625, 0.426116943359375, 0.4553680419921875, 0.484619140625, 0.5138702392578125, 0.543121337890625, 0.5723724365234375, 0.60162353515625, 0.6308746337890625, 0.660125732421875, 0.6893768310546875, 0.7186279296875, 0.7478790283203125, 0.777130126953125, 0.8063812255859375, 0.83563232421875, 0.8648834228515625, 0.894134521484375, 0.9233856201171875, 0.95263671875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 0.0, 6.0, 4.0, 6.0, 10.0, 8.0, 17.0, 28.0, 24.0, 28.0, 40.0, 39.0, 50.0, 64.0, 63.0, 66.0, 83.0, 91.0, 71.0, 60.0, 45.0, 41.0, 28.0, 27.0, 21.0, 24.0, 14.0, 20.0, 11.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8014183044433594e-05, -2.690032124519348e-05, -2.578645944595337e-05, -2.4672597646713257e-05, -2.3558735847473145e-05, -2.2444874048233032e-05, -2.133101224899292e-05, -2.0217150449752808e-05, -1.9103288650512695e-05, -1.7989426851272583e-05, -1.687556505203247e-05, -1.576170325279236e-05, -1.4647841453552246e-05, -1.3533979654312134e-05, -1.2420117855072021e-05, -1.130625605583191e-05, -1.0192394256591797e-05, -9.078532457351685e-06, -7.964670658111572e-06, -6.85080885887146e-06, -5.736947059631348e-06, -4.623085260391235e-06, -3.509223461151123e-06, -2.3953616619110107e-06, -1.2814998626708984e-06, -1.6763806343078613e-07, 9.462237358093262e-07, 2.0600855350494385e-06, 3.1739473342895508e-06, 4.287809133529663e-06, 5.401670932769775e-06, 6.515532732009888e-06, 7.62939453125e-06, 8.743256330490112e-06, 9.857118129730225e-06, 1.0970979928970337e-05, 1.208484172821045e-05, 1.3198703527450562e-05, 1.4312565326690674e-05, 1.5426427125930786e-05, 1.65402889251709e-05, 1.765415072441101e-05, 1.8768012523651123e-05, 1.9881874322891235e-05, 2.0995736122131348e-05, 2.210959792137146e-05, 2.3223459720611572e-05, 2.4337321519851685e-05, 2.5451183319091797e-05, 2.656504511833191e-05, 2.767890691757202e-05, 2.8792768716812134e-05, 2.9906630516052246e-05, 3.102049231529236e-05, 3.213435411453247e-05, 3.324821591377258e-05, 3.4362077713012695e-05, 3.547593951225281e-05, 3.658980131149292e-05, 3.770366311073303e-05, 3.8817524909973145e-05, 3.993138670921326e-05, 4.104524850845337e-05, 4.215911030769348e-05, 4.3272972106933594e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 10.0, 16.0, 26.0, 41.0, 45.0, 46.0, 88.0, 136.0, 192.0, 253.0, 363.0, 502.0, 707.0, 1031.0, 1625.0, 2540.0, 4288.0, 7792.0, 15232.0, 34280.0, 84491.0, 220237.0, 360009.0, 184037.0, 70444.0, 28963.0, 13379.0, 6794.0, 3890.0, 2383.0, 1496.0, 940.0, 709.0, 418.0, 313.0, 233.0, 164.0, 126.0, 83.0, 69.0, 53.0, 26.0, 20.0, 20.0, 4.0, 13.0, 8.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.87030029296875, -0.8416748046875, -0.81304931640625, -0.784423828125, -0.75579833984375, -0.7271728515625, -0.69854736328125, -0.669921875, -0.64129638671875, -0.6126708984375, -0.58404541015625, -0.555419921875, -0.52679443359375, -0.4981689453125, -0.46954345703125, -0.44091796875, -0.41229248046875, -0.3836669921875, -0.35504150390625, -0.326416015625, -0.29779052734375, -0.2691650390625, -0.24053955078125, -0.2119140625, -0.18328857421875, -0.1546630859375, -0.12603759765625, -0.097412109375, -0.06878662109375, -0.0401611328125, -0.01153564453125, 0.01708984375, 0.04571533203125, 0.0743408203125, 0.10296630859375, 0.131591796875, 0.16021728515625, 0.1888427734375, 0.21746826171875, 0.24609375, 0.27471923828125, 0.3033447265625, 0.33197021484375, 0.360595703125, 0.38922119140625, 0.4178466796875, 0.44647216796875, 0.47509765625, 0.50372314453125, 0.5323486328125, 0.56097412109375, 0.589599609375, 0.61822509765625, 0.6468505859375, 0.67547607421875, 0.7041015625, 0.73272705078125, 0.7613525390625, 0.78997802734375, 0.818603515625, 0.84722900390625, 0.8758544921875, 0.90447998046875, 0.93310546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 15.0, 18.0, 24.0, 26.0, 47.0, 91.0, 99.0, 127.0, 137.0, 110.0, 83.0, 62.0, 61.0, 19.0, 19.0, 16.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4033203125, -0.3915367126464844, -0.37975311279296875, -0.3679695129394531, -0.3561859130859375, -0.3444023132324219, -0.33261871337890625, -0.3208351135253906, -0.309051513671875, -0.2972679138183594, -0.28548431396484375, -0.2737007141113281, -0.2619171142578125, -0.2501335144042969, -0.23834991455078125, -0.22656631469726562, -0.21478271484375, -0.20299911499023438, -0.19121551513671875, -0.17943191528320312, -0.1676483154296875, -0.15586471557617188, -0.14408111572265625, -0.13229751586914062, -0.120513916015625, -0.10873031616210938, -0.09694671630859375, -0.08516311645507812, -0.0733795166015625, -0.061595916748046875, -0.04981231689453125, -0.038028717041015625, -0.0262451171875, -0.014461517333984375, -0.00267791748046875, 0.009105682373046875, 0.0208892822265625, 0.032672882080078125, 0.04445648193359375, 0.056240081787109375, 0.068023681640625, 0.07980728149414062, 0.09159088134765625, 0.10337448120117188, 0.1151580810546875, 0.12694168090820312, 0.13872528076171875, 0.15050888061523438, 0.16229248046875, 0.17407608032226562, 0.18585968017578125, 0.19764328002929688, 0.2094268798828125, 0.22121047973632812, 0.23299407958984375, 0.24477767944335938, 0.256561279296875, 0.2683448791503906, 0.28012847900390625, 0.2919120788574219, 0.3036956787109375, 0.3154792785644531, 0.32726287841796875, 0.3390464782714844, 0.350830078125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 5.0, 24.0, 10.0, 21.0, 32.0, 37.0, 38.0, 50.0, 58.0, 60.0, 72.0, 78.0, 65.0, 54.0, 52.0, 49.0, 63.0, 39.0, 36.0, 26.0, 21.0, 28.0, 21.0, 9.0, 5.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.094508171081543, -10.80483341217041, -10.515158653259277, -10.225483894348145, -9.935808181762695, -9.646133422851562, -9.35645866394043, -9.066783905029297, -8.777109146118164, -8.487434387207031, -8.197759628295898, -7.908084392547607, -7.618409633636475, -7.328734874725342, -7.039059638977051, -6.749384880065918, -6.459710121154785, -6.170035362243652, -5.8803606033325195, -5.5906853675842285, -5.301010608673096, -5.011335849761963, -4.721660614013672, -4.431985855102539, -4.142311096191406, -3.8526363372802734, -3.5629613399505615, -3.2732863426208496, -2.983611583709717, -2.693936824798584, -2.404261827468872, -2.11458683013916, -1.8249125480651855, -1.5352376699447632, -1.2455627918243408, -0.9558879137039185, -0.6662130355834961, -0.37653815746307373, -0.08686327934265137, 0.20281171798706055, 0.49248647689819336, 0.7821613550186157, 1.071836233139038, 1.3615111112594604, 1.6511859893798828, 1.9408608675003052, 2.2305357456207275, 2.5202107429504395, 2.8098855018615723, 3.099560260772705, 3.389235258102417, 3.678910255432129, 3.9685850143432617, 4.2582597732543945, 4.547934532165527, 4.837609767913818, 5.127284526824951, 5.416959285736084, 5.706634521484375, 5.996309280395508, 6.285984039306641, 6.575658798217773, 6.865333557128906, 7.155008792877197, 7.44468355178833]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 11.0, 8.0, 13.0, 8.0, 14.0, 19.0, 16.0, 16.0, 26.0, 30.0, 27.0, 23.0, 31.0, 37.0, 37.0, 47.0, 43.0, 58.0, 40.0, 46.0, 41.0, 37.0, 42.0, 41.0, 40.0, 36.0, 37.0, 26.0, 19.0, 16.0, 19.0, 13.0, 17.0, 12.0, 9.0, 9.0, 5.0, 3.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.316371440887451, -6.126894950866699, -5.937417984008789, -5.747941017150879, -5.558464527130127, -5.368988037109375, -5.179511070251465, -4.990034103393555, -4.800557613372803, -4.611081123352051, -4.421604156494141, -4.2321271896362305, -4.0426506996154785, -3.8531739711761475, -3.6636972427368164, -3.4742205142974854, -3.2847437858581543, -3.0952670574188232, -2.905790328979492, -2.716313600540161, -2.52683687210083, -2.337360143661499, -2.147883415222168, -1.958406686782837, -1.7689299583435059, -1.5794532299041748, -1.3899765014648438, -1.2004997730255127, -1.0110230445861816, -0.8215463161468506, -0.6320695877075195, -0.4425928592681885, -0.2531156539916992, -0.06363892555236816, 0.1258378028869629, 0.31531453132629395, 0.504791259765625, 0.694267988204956, 0.8837447166442871, 1.0732214450836182, 1.2626981735229492, 1.4521749019622803, 1.6416516304016113, 1.8311283588409424, 2.0206050872802734, 2.2100818157196045, 2.3995585441589355, 2.5890352725982666, 2.7785120010375977, 2.9679887294769287, 3.1574654579162598, 3.346942186355591, 3.536418914794922, 3.725895643234253, 3.915372371673584, 4.104848861694336, 4.294325828552246, 4.483802795410156, 4.673279285430908, 4.86275577545166, 5.05223274230957, 5.2417097091674805, 5.431186199188232, 5.620662689208984, 5.8101396560668945]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 27.0, 21.0, 49.0, 54.0, 114.0, 163.0, 171.0, 290.0, 458.0, 666.0, 975.0, 1629.0, 2531.0, 4060.0, 6616.0, 11381.0, 19757.0, 35304.0, 62042.0, 104007.0, 152196.0, 179576.0, 166154.0, 121463.0, 75861.0, 43701.0, 24282.0, 13994.0, 7868.0, 4834.0, 2899.0, 1894.0, 1222.0, 747.0, 511.0, 304.0, 257.0, 141.0, 102.0, 65.0, 57.0, 32.0, 22.0, 12.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3359375, -5.17266845703125, -5.0093994140625, -4.84613037109375, -4.682861328125, -4.51959228515625, -4.3563232421875, -4.19305419921875, -4.02978515625, -3.86651611328125, -3.7032470703125, -3.53997802734375, -3.376708984375, -3.21343994140625, -3.0501708984375, -2.88690185546875, -2.7236328125, -2.56036376953125, -2.3970947265625, -2.23382568359375, -2.070556640625, -1.90728759765625, -1.7440185546875, -1.58074951171875, -1.41748046875, -1.25421142578125, -1.0909423828125, -0.92767333984375, -0.764404296875, -0.60113525390625, -0.4378662109375, -0.27459716796875, -0.111328125, 0.05194091796875, 0.2152099609375, 0.37847900390625, 0.541748046875, 0.70501708984375, 0.8682861328125, 1.03155517578125, 1.19482421875, 1.35809326171875, 1.5213623046875, 1.68463134765625, 1.847900390625, 2.01116943359375, 2.1744384765625, 2.33770751953125, 2.5009765625, 2.66424560546875, 2.8275146484375, 2.99078369140625, 3.154052734375, 3.31732177734375, 3.4805908203125, 3.64385986328125, 3.80712890625, 3.97039794921875, 4.1336669921875, 4.29693603515625, 4.460205078125, 4.62347412109375, 4.7867431640625, 4.95001220703125, 5.11328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 8.0, 13.0, 12.0, 12.0, 22.0, 19.0, 24.0, 21.0, 24.0, 28.0, 35.0, 29.0, 33.0, 34.0, 40.0, 45.0, 50.0, 45.0, 50.0, 37.0, 43.0, 46.0, 38.0, 31.0, 36.0, 36.0, 22.0, 20.0, 22.0, 24.0, 15.0, 8.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.59765625, -6.400146484375, -6.20263671875, -6.005126953125, -5.8076171875, -5.610107421875, -5.41259765625, -5.215087890625, -5.017578125, -4.820068359375, -4.62255859375, -4.425048828125, -4.2275390625, -4.030029296875, -3.83251953125, -3.635009765625, -3.4375, -3.239990234375, -3.04248046875, -2.844970703125, -2.6474609375, -2.449951171875, -2.25244140625, -2.054931640625, -1.857421875, -1.659912109375, -1.46240234375, -1.264892578125, -1.0673828125, -0.869873046875, -0.67236328125, -0.474853515625, -0.27734375, -0.079833984375, 0.11767578125, 0.315185546875, 0.5126953125, 0.710205078125, 0.90771484375, 1.105224609375, 1.302734375, 1.500244140625, 1.69775390625, 1.895263671875, 2.0927734375, 2.290283203125, 2.48779296875, 2.685302734375, 2.8828125, 3.080322265625, 3.27783203125, 3.475341796875, 3.6728515625, 3.870361328125, 4.06787109375, 4.265380859375, 4.462890625, 4.660400390625, 4.85791015625, 5.055419921875, 5.2529296875, 5.450439453125, 5.64794921875, 5.845458984375, 6.04296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 8.0, 18.0, 32.0, 32.0, 51.0, 70.0, 120.0, 132.0, 213.0, 335.0, 539.0, 752.0, 1185.0, 1851.0, 3014.0, 4721.0, 7716.0, 12466.0, 20804.0, 35708.0, 62572.0, 111614.0, 176604.0, 206782.0, 164834.0, 99424.0, 55959.0, 32040.0, 18758.0, 11333.0, 6772.0, 4347.0, 2789.0, 1727.0, 1056.0, 699.0, 473.0, 298.0, 229.0, 134.0, 101.0, 62.0, 63.0, 34.0, 15.0, 12.0, 13.0, 5.0, 7.0, 1.0, 8.0, 1.0, 2.0, 4.0, 3.0, 2.0], "bins": [-7.9921875, -7.7376708984375, -7.483154296875, -7.2286376953125, -6.97412109375, -6.7196044921875, -6.465087890625, -6.2105712890625, -5.9560546875, -5.7015380859375, -5.447021484375, -5.1925048828125, -4.93798828125, -4.6834716796875, -4.428955078125, -4.1744384765625, -3.919921875, -3.6654052734375, -3.410888671875, -3.1563720703125, -2.90185546875, -2.6473388671875, -2.392822265625, -2.1383056640625, -1.8837890625, -1.6292724609375, -1.374755859375, -1.1202392578125, -0.86572265625, -0.6112060546875, -0.356689453125, -0.1021728515625, 0.15234375, 0.4068603515625, 0.661376953125, 0.9158935546875, 1.17041015625, 1.4249267578125, 1.679443359375, 1.9339599609375, 2.1884765625, 2.4429931640625, 2.697509765625, 2.9520263671875, 3.20654296875, 3.4610595703125, 3.715576171875, 3.9700927734375, 4.224609375, 4.4791259765625, 4.733642578125, 4.9881591796875, 5.24267578125, 5.4971923828125, 5.751708984375, 6.0062255859375, 6.2607421875, 6.5152587890625, 6.769775390625, 7.0242919921875, 7.27880859375, 7.5333251953125, 7.787841796875, 8.0423583984375, 8.296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 12.0, 8.0, 18.0, 18.0, 21.0, 31.0, 34.0, 28.0, 27.0, 27.0, 33.0, 33.0, 34.0, 40.0, 47.0, 43.0, 31.0, 40.0, 47.0, 46.0, 29.0, 35.0, 32.0, 28.0, 30.0, 33.0, 38.0, 31.0, 19.0, 15.0, 14.0, 9.0, 15.0, 6.0, 9.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1796875, -4.05987548828125, -3.9400634765625, -3.82025146484375, -3.700439453125, -3.58062744140625, -3.4608154296875, -3.34100341796875, -3.22119140625, -3.10137939453125, -2.9815673828125, -2.86175537109375, -2.741943359375, -2.62213134765625, -2.5023193359375, -2.38250732421875, -2.2626953125, -2.14288330078125, -2.0230712890625, -1.90325927734375, -1.783447265625, -1.66363525390625, -1.5438232421875, -1.42401123046875, -1.30419921875, -1.18438720703125, -1.0645751953125, -0.94476318359375, -0.824951171875, -0.70513916015625, -0.5853271484375, -0.46551513671875, -0.345703125, -0.22589111328125, -0.1060791015625, 0.01373291015625, 0.133544921875, 0.25335693359375, 0.3731689453125, 0.49298095703125, 0.61279296875, 0.73260498046875, 0.8524169921875, 0.97222900390625, 1.092041015625, 1.21185302734375, 1.3316650390625, 1.45147705078125, 1.5712890625, 1.69110107421875, 1.8109130859375, 1.93072509765625, 2.050537109375, 2.17034912109375, 2.2901611328125, 2.40997314453125, 2.52978515625, 2.64959716796875, 2.7694091796875, 2.88922119140625, 3.009033203125, 3.12884521484375, 3.2486572265625, 3.36846923828125, 3.48828125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 16.0, 42.0, 42.0, 93.0, 86.0, 176.0, 254.0, 354.0, 596.0, 946.0, 1402.0, 2262.0, 3653.0, 5933.0, 9872.0, 16166.0, 26282.0, 41607.0, 63102.0, 89169.0, 114388.0, 132332.0, 133759.0, 119219.0, 95489.0, 68855.0, 46245.0, 29492.0, 18039.0, 10982.0, 6656.0, 4097.0, 2533.0, 1492.0, 1055.0, 594.0, 403.0, 286.0, 166.0, 140.0, 77.0, 64.0, 46.0, 22.0, 15.0, 7.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.4638671875, -1.4196624755859375, -1.375457763671875, -1.3312530517578125, -1.28704833984375, -1.2428436279296875, -1.198638916015625, -1.1544342041015625, -1.1102294921875, -1.0660247802734375, -1.021820068359375, -0.9776153564453125, -0.93341064453125, -0.8892059326171875, -0.845001220703125, -0.8007965087890625, -0.756591796875, -0.7123870849609375, -0.668182373046875, -0.6239776611328125, -0.57977294921875, -0.5355682373046875, -0.491363525390625, -0.4471588134765625, -0.4029541015625, -0.3587493896484375, -0.314544677734375, -0.2703399658203125, -0.22613525390625, -0.1819305419921875, -0.137725830078125, -0.0935211181640625, -0.04931640625, -0.0051116943359375, 0.039093017578125, 0.0832977294921875, 0.12750244140625, 0.1717071533203125, 0.215911865234375, 0.2601165771484375, 0.3043212890625, 0.3485260009765625, 0.392730712890625, 0.4369354248046875, 0.48114013671875, 0.5253448486328125, 0.569549560546875, 0.6137542724609375, 0.657958984375, 0.7021636962890625, 0.746368408203125, 0.7905731201171875, 0.83477783203125, 0.8789825439453125, 0.923187255859375, 0.9673919677734375, 1.0115966796875, 1.0558013916015625, 1.100006103515625, 1.1442108154296875, 1.18841552734375, 1.2326202392578125, 1.276824951171875, 1.3210296630859375, 1.365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 12.0, 20.0, 21.0, 21.0, 34.0, 47.0, 36.0, 42.0, 55.0, 45.0, 62.0, 65.0, 57.0, 47.0, 59.0, 66.0, 50.0, 47.0, 38.0, 26.0, 25.0, 17.0, 26.0, 14.0, 10.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019788742065429688, -0.0001915767788887024, -0.0001852661371231079, -0.00017895549535751343, -0.00017264485359191895, -0.00016633421182632446, -0.00016002357006072998, -0.0001537129282951355, -0.00014740228652954102, -0.00014109164476394653, -0.00013478100299835205, -0.00012847036123275757, -0.00012215971946716309, -0.0001158490777015686, -0.00010953843593597412, -0.00010322779417037964, -9.691715240478516e-05, -9.060651063919067e-05, -8.429586887359619e-05, -7.798522710800171e-05, -7.167458534240723e-05, -6.536394357681274e-05, -5.905330181121826e-05, -5.274266004562378e-05, -4.64320182800293e-05, -4.0121376514434814e-05, -3.381073474884033e-05, -2.750009298324585e-05, -2.1189451217651367e-05, -1.4878809452056885e-05, -8.568167686462402e-06, -2.25752592086792e-06, 4.0531158447265625e-06, 1.0363757610321045e-05, 1.6674399375915527e-05, 2.298504114151001e-05, 2.9295682907104492e-05, 3.5606324672698975e-05, 4.191696643829346e-05, 4.822760820388794e-05, 5.453824996948242e-05, 6.0848891735076904e-05, 6.715953350067139e-05, 7.347017526626587e-05, 7.978081703186035e-05, 8.609145879745483e-05, 9.240210056304932e-05, 9.87127423286438e-05, 0.00010502338409423828, 0.00011133402585983276, 0.00011764466762542725, 0.00012395530939102173, 0.0001302659511566162, 0.0001365765929222107, 0.00014288723468780518, 0.00014919787645339966, 0.00015550851821899414, 0.00016181915998458862, 0.0001681298017501831, 0.0001744404435157776, 0.00018075108528137207, 0.00018706172704696655, 0.00019337236881256104, 0.00019968301057815552, 0.00020599365234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 9.0, 7.0, 18.0, 23.0, 48.0, 58.0, 90.0, 139.0, 252.0, 383.0, 573.0, 999.0, 1628.0, 2790.0, 4603.0, 8160.0, 13796.0, 23291.0, 38158.0, 59980.0, 87228.0, 115249.0, 135668.0, 139778.0, 125858.0, 99780.0, 71202.0, 47053.0, 29118.0, 17613.0, 10173.0, 6042.0, 3546.0, 2042.0, 1280.0, 736.0, 458.0, 286.0, 181.0, 99.0, 53.0, 54.0, 26.0, 13.0, 9.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3470306396484375, -1.302459716796875, -1.2578887939453125, -1.21331787109375, -1.1687469482421875, -1.124176025390625, -1.0796051025390625, -1.0350341796875, -0.9904632568359375, -0.945892333984375, -0.9013214111328125, -0.85675048828125, -0.8121795654296875, -0.767608642578125, -0.7230377197265625, -0.678466796875, -0.6338958740234375, -0.589324951171875, -0.5447540283203125, -0.50018310546875, -0.4556121826171875, -0.411041259765625, -0.3664703369140625, -0.3218994140625, -0.2773284912109375, -0.232757568359375, -0.1881866455078125, -0.14361572265625, -0.0990447998046875, -0.054473876953125, -0.0099029541015625, 0.03466796875, 0.0792388916015625, 0.123809814453125, 0.1683807373046875, 0.21295166015625, 0.2575225830078125, 0.302093505859375, 0.3466644287109375, 0.3912353515625, 0.4358062744140625, 0.480377197265625, 0.5249481201171875, 0.56951904296875, 0.6140899658203125, 0.658660888671875, 0.7032318115234375, 0.747802734375, 0.7923736572265625, 0.836944580078125, 0.8815155029296875, 0.92608642578125, 0.9706573486328125, 1.015228271484375, 1.0597991943359375, 1.1043701171875, 1.1489410400390625, 1.193511962890625, 1.2380828857421875, 1.28265380859375, 1.3272247314453125, 1.371795654296875, 1.4163665771484375, 1.4609375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 7.0, 10.0, 8.0, 7.0, 14.0, 18.0, 17.0, 31.0, 28.0, 25.0, 31.0, 40.0, 30.0, 48.0, 46.0, 37.0, 50.0, 44.0, 48.0, 43.0, 43.0, 43.0, 42.0, 32.0, 37.0, 27.0, 24.0, 24.0, 22.0, 14.0, 25.0, 12.0, 9.0, 9.0, 4.0, 8.0, 3.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4423828125, -0.42792510986328125, -0.4134674072265625, -0.39900970458984375, -0.384552001953125, -0.37009429931640625, -0.3556365966796875, -0.34117889404296875, -0.32672119140625, -0.31226348876953125, -0.2978057861328125, -0.28334808349609375, -0.268890380859375, -0.25443267822265625, -0.2399749755859375, -0.22551727294921875, -0.2110595703125, -0.19660186767578125, -0.1821441650390625, -0.16768646240234375, -0.153228759765625, -0.13877105712890625, -0.1243133544921875, -0.10985565185546875, -0.09539794921875, -0.08094024658203125, -0.0664825439453125, -0.05202484130859375, -0.037567138671875, -0.02310943603515625, -0.0086517333984375, 0.00580596923828125, 0.020263671875, 0.03472137451171875, 0.0491790771484375, 0.06363677978515625, 0.078094482421875, 0.09255218505859375, 0.1070098876953125, 0.12146759033203125, 0.13592529296875, 0.15038299560546875, 0.1648406982421875, 0.17929840087890625, 0.193756103515625, 0.20821380615234375, 0.2226715087890625, 0.23712921142578125, 0.2515869140625, 0.26604461669921875, 0.2805023193359375, 0.29496002197265625, 0.309417724609375, 0.32387542724609375, 0.3383331298828125, 0.35279083251953125, 0.36724853515625, 0.38170623779296875, 0.3961639404296875, 0.41062164306640625, 0.425079345703125, 0.43953704833984375, 0.4539947509765625, 0.46845245361328125, 0.48291015625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 16.0, 16.0, 30.0, 32.0, 34.0, 37.0, 40.0, 51.0, 38.0, 63.0, 57.0, 72.0, 60.0, 55.0, 54.0, 47.0, 42.0, 29.0, 29.0, 29.0, 23.0, 15.0, 24.0, 16.0, 14.0, 11.0, 2.0, 3.0, 9.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.497963905334473, -9.224068641662598, -8.950172424316406, -8.676277160644531, -8.40238094329834, -8.128485679626465, -7.854589939117432, -7.580694198608398, -7.306798934936523, -7.03290319442749, -6.759007453918457, -6.485112190246582, -6.211216449737549, -5.937320709228516, -5.663424968719482, -5.389529228210449, -5.115633487701416, -4.841737747192383, -4.56784200668335, -4.293946266174316, -4.020051002502441, -3.746155261993408, -3.472259521484375, -3.198363780975342, -2.9244682788848877, -2.6505725383758545, -2.3766770362854004, -2.102781295776367, -1.8288856744766235, -1.5549900531768799, -1.2810943126678467, -1.007198691368103, -0.7333030700683594, -0.45940741896629333, -0.1855117678642273, 0.08838391304016113, 0.3622795343399048, 0.6361751556396484, 0.9100708961486816, 1.1839665174484253, 1.457862138748169, 1.7317577600479126, 2.0056533813476562, 2.2795491218566895, 2.5534448623657227, 2.8273403644561768, 3.10123610496521, 3.375131607055664, 3.6490273475646973, 3.9229230880737305, 4.196818828582764, 4.470714569091797, 4.744609832763672, 5.018505573272705, 5.292401313781738, 5.5662970542907715, 5.840192794799805, 6.114088535308838, 6.387984275817871, 6.661879539489746, 6.935775279998779, 7.2096710205078125, 7.483566761016846, 7.757462501525879, 8.031357765197754]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 14.0, 10.0, 17.0, 20.0, 30.0, 18.0, 24.0, 29.0, 38.0, 30.0, 47.0, 41.0, 43.0, 63.0, 58.0, 38.0, 44.0, 44.0, 51.0, 38.0, 26.0, 35.0, 36.0, 37.0, 25.0, 28.0, 15.0, 19.0, 14.0, 11.0, 7.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.619253158569336, -8.35822868347168, -8.097204208374023, -7.836179733276367, -7.575155258178711, -7.314130783081055, -7.053106307983398, -6.792081832885742, -6.531057357788086, -6.27003288269043, -6.009008407592773, -5.747983932495117, -5.486959457397461, -5.225934982299805, -4.964910507202148, -4.703886032104492, -4.442862033843994, -4.181837558746338, -3.9208130836486816, -3.6597886085510254, -3.398764133453369, -3.137739658355713, -2.8767154216766357, -2.6156909465789795, -2.3546664714813232, -2.093641996383667, -1.8326175212860107, -1.571593165397644, -1.3105686902999878, -1.0495442152023315, -0.7885198593139648, -0.5274953842163086, -0.26647090911865234, -0.0054464638233184814, 0.2555779814720154, 0.5166023969650269, 0.7776268720626831, 1.0386513471603394, 1.299675703048706, 1.5607001781463623, 1.8217246532440186, 2.082749128341675, 2.343773603439331, 2.604797840118408, 2.8658223152160645, 3.1268467903137207, 3.387871265411377, 3.648895740509033, 3.9099202156066895, 4.170944690704346, 4.431969165802002, 4.692993640899658, 4.9540181159973145, 5.215042591094971, 5.476066589355469, 5.737091064453125, 5.998115539550781, 6.2591400146484375, 6.520164489746094, 6.78118896484375, 7.042213439941406, 7.3032379150390625, 7.564262390136719, 7.825286865234375, 8.086311340332031]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 5.0, 16.0, 18.0, 21.0, 31.0, 42.0, 48.0, 65.0, 81.0, 119.0, 137.0, 225.0, 301.0, 390.0, 566.0, 793.0, 1131.0, 1655.0, 2295.0, 3183.0, 4330.0, 488572.0, 5585.0, 4059.0, 3035.0, 2148.0, 1544.0, 1086.0, 749.0, 554.0, 396.0, 265.0, 222.0, 142.0, 96.0, 83.0, 60.0, 46.0, 33.0, 28.0, 26.0, 14.0, 22.0, 7.0, 5.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-71.41798400878906, -69.10797119140625, -66.79795837402344, -64.48794555664062, -62.17793273925781, -59.867919921875, -57.55790328979492, -55.24789047241211, -52.9378776550293, -50.627864837646484, -48.31785202026367, -46.00783920288086, -43.69782257080078, -41.38780975341797, -39.077796936035156, -36.767784118652344, -34.45777130126953, -32.14775848388672, -29.837745666503906, -27.52773094177246, -25.21771812438965, -22.907705307006836, -20.59769058227539, -18.287677764892578, -15.977664947509766, -13.667652130126953, -11.357638359069824, -9.047624588012695, -6.737611770629883, -4.42759895324707, -2.1175851821899414, 0.1924285888671875, 2.50244140625, 4.812454700469971, 7.122467994689941, 9.43248176574707, 11.742494583129883, 14.052507400512695, 16.36252212524414, 18.672534942626953, 20.982547760009766, 23.292560577392578, 25.60257339477539, 27.912588119506836, 30.22260093688965, 32.532615661621094, 34.842628479003906, 37.15264129638672, 39.46265411376953, 41.772666931152344, 44.082679748535156, 46.39269256591797, 48.70270538330078, 51.012718200683594, 53.32273483276367, 55.632747650146484, 57.9427604675293, 60.25277328491211, 62.56278610229492, 64.872802734375, 67.18281555175781, 69.49282836914062, 71.80284118652344, 74.11285400390625, 76.42286682128906]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 12.0, 11.0, 12.0, 15.0, 22.0, 30.0, 16.0, 24.0, 29.0, 41.0, 28.0, 45.0, 43.0, 46.0, 64.0, 1080.0, 43.0, 42.0, 46.0, 50.0, 34.0, 28.0, 40.0, 36.0, 33.0, 27.0, 27.0, 12.0, 18.0, 14.0, 12.0, 6.0, 4.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-265.3472595214844, -257.3047790527344, -249.26229858398438, -241.21981811523438, -233.17733764648438, -225.13485717773438, -217.09237670898438, -209.04989624023438, -201.00741577148438, -192.96493530273438, -184.92245483398438, -176.87997436523438, -168.83749389648438, -160.79501342773438, -152.75253295898438, -144.71005249023438, -136.66758728027344, -128.62510681152344, -120.58262634277344, -112.54014587402344, -104.49766540527344, -96.45518493652344, -88.41271209716797, -80.37023162841797, -72.32775115966797, -64.28527069091797, -56.24279022216797, -48.200313568115234, -40.157833099365234, -32.115352630615234, -24.0728759765625, -16.0303955078125, -7.9879150390625, 0.054564476013183594, 8.097043991088867, 16.139522552490234, 24.182003021240234, 32.224483489990234, 40.26696014404297, 48.30944061279297, 56.35192108154297, 64.39440155029297, 72.43688201904297, 80.47935485839844, 88.52183532714844, 96.56431579589844, 104.60679626464844, 112.64927673339844, 120.69175720214844, 128.73423767089844, 136.77671813964844, 144.81919860839844, 152.86167907714844, 160.90415954589844, 168.94662475585938, 176.98910522460938, 185.03158569335938, 193.07406616210938, 201.11654663085938, 209.15902709960938, 217.20150756835938, 225.24398803710938, 233.28646850585938, 241.32894897460938, 249.37142944335938]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 13.0, 6.0, 13.0, 21.0, 21.0, 26.0, 39.0, 51.0, 80.0, 67.0, 123.0, 156.0, 178.0, 264.0, 373.0, 523.0, 687.0, 1038.0, 1566.0, 2346.0, 3328.0, 4723.0, 6289.0, 8418.0, 10499.0, 13807.0, 20183.0, 390907.0, 30684016.0, 34277.0, 31096.0, 16687.0, 8575.0, 5095.0, 3060.0, 1958.0, 1258.0, 808.0, 584.0, 378.0, 297.0, 229.0, 168.0, 119.0, 75.0, 36.0, 22.0, 12.0, 9.0, 5.0, 5.0, 2.0], "bins": [-91.87071228027344, -89.57714080810547, -87.2835693359375, -84.989990234375, -82.69641876220703, -80.40284729003906, -78.1092758178711, -75.81570434570312, -73.52213287353516, -71.22856140136719, -68.93498992919922, -66.64141845703125, -64.34783935546875, -62.05426788330078, -59.76069641113281, -57.467124938964844, -55.17354965209961, -52.87997817993164, -50.586402893066406, -48.29283142089844, -45.99925994873047, -43.7056884765625, -41.412113189697266, -39.1185417175293, -36.82496643066406, -34.531394958496094, -32.23781967163086, -29.94424819946289, -27.650676727294922, -25.35710334777832, -23.06352996826172, -20.76995849609375, -18.47638702392578, -16.18281364440918, -13.889242172241211, -11.59566879272461, -9.302096366882324, -7.008523941040039, -4.7149505615234375, -2.4213790893554688, -0.1278057098388672, 2.165766954421997, 4.459339618682861, 6.752912521362305, 9.04648494720459, 11.340057373046875, 13.633630752563477, 15.927202224731445, 18.220775604248047, 20.51434898376465, 22.807920455932617, 25.10149383544922, 27.395065307617188, 29.68863868713379, 31.98221206665039, 34.27578353881836, 36.569358825683594, 38.86293029785156, 41.1565055847168, 43.450077056884766, 45.743648529052734, 48.03722381591797, 50.33079528808594, 52.624366760253906, 54.917938232421875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 7.0, 15.0, 35.0, 47.0, 60.0, 73.0, 116.0, 167.0, 315.0, 509.0, 803.0, 1318.0, 2134.0, 3665.0, 6640.0, 12180.0, 24035.0, 51122.0, 117466.0, 302918.0, 946099.0, 3192008.0, 1063741.0, 330040.0, 126212.0, 54654.0, 25465.0, 12773.0, 6922.0, 3912.0, 2294.0, 1376.0, 862.0, 532.0, 323.0, 204.0, 118.0, 89.0, 55.0, 45.0, 26.0, 19.0, 13.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.6171875, -5.44970703125, -5.2822265625, -5.11474609375, -4.947265625, -4.77978515625, -4.6123046875, -4.44482421875, -4.27734375, -4.10986328125, -3.9423828125, -3.77490234375, -3.607421875, -3.43994140625, -3.2724609375, -3.10498046875, -2.9375, -2.77001953125, -2.6025390625, -2.43505859375, -2.267578125, -2.10009765625, -1.9326171875, -1.76513671875, -1.59765625, -1.43017578125, -1.2626953125, -1.09521484375, -0.927734375, -0.76025390625, -0.5927734375, -0.42529296875, -0.2578125, -0.09033203125, 0.0771484375, 0.24462890625, 0.412109375, 0.57958984375, 0.7470703125, 0.91455078125, 1.08203125, 1.24951171875, 1.4169921875, 1.58447265625, 1.751953125, 1.91943359375, 2.0869140625, 2.25439453125, 2.421875, 2.58935546875, 2.7568359375, 2.92431640625, 3.091796875, 3.25927734375, 3.4267578125, 3.59423828125, 3.76171875, 3.92919921875, 4.0966796875, 4.26416015625, 4.431640625, 4.59912109375, 4.7666015625, 4.93408203125, 5.1015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 3.0, 9.0, 6.0, 7.0, 9.0, 14.0, 14.0, 20.0, 21.0, 20.0, 27.0, 28.0, 34.0, 36.0, 38.0, 41.0, 44.0, 77.0, 149.0, 205.0, 258.0, 241.0, 146.0, 112.0, 74.0, 56.0, 44.0, 36.0, 35.0, 32.0, 27.0, 21.0, 24.0, 21.0, 14.0, 8.0, 17.0, 8.0, 9.0, 5.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.91796875, -3.79302978515625, -3.6680908203125, -3.54315185546875, -3.418212890625, -3.29327392578125, -3.1683349609375, -3.04339599609375, -2.91845703125, -2.79351806640625, -2.6685791015625, -2.54364013671875, -2.418701171875, -2.29376220703125, -2.1688232421875, -2.04388427734375, -1.9189453125, -1.79400634765625, -1.6690673828125, -1.54412841796875, -1.419189453125, -1.29425048828125, -1.1693115234375, -1.04437255859375, -0.91943359375, -0.79449462890625, -0.6695556640625, -0.54461669921875, -0.419677734375, -0.29473876953125, -0.1697998046875, -0.04486083984375, 0.080078125, 0.20501708984375, 0.3299560546875, 0.45489501953125, 0.579833984375, 0.70477294921875, 0.8297119140625, 0.95465087890625, 1.07958984375, 1.20452880859375, 1.3294677734375, 1.45440673828125, 1.579345703125, 1.70428466796875, 1.8292236328125, 1.95416259765625, 2.0791015625, 2.20404052734375, 2.3289794921875, 2.45391845703125, 2.578857421875, 2.70379638671875, 2.8287353515625, 2.95367431640625, 3.07861328125, 3.20355224609375, 3.3284912109375, 3.45343017578125, 3.578369140625, 3.70330810546875, 3.8282470703125, 3.95318603515625, 4.078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 5.0, 4.0, 14.0, 15.0, 16.0, 32.0, 56.0, 73.0, 81.0, 111.0, 158.0, 181.0, 267.0, 364.0, 510.0, 795.0, 1273.0, 1989.0, 3325.0, 5704.0, 9669.0, 17815.0, 33305.0, 64494.0, 130528.0, 279611.0, 702793.0, 3070359.0, 1223262.0, 388281.0, 175235.0, 85214.0, 43114.0, 22472.0, 12227.0, 6925.0, 3987.0, 2479.0, 1454.0, 1012.0, 668.0, 478.0, 318.0, 241.0, 164.0, 89.0, 60.0, 43.0, 42.0, 20.0, 20.0, 13.0, 18.0, 11.0, 10.0, 6.0, 8.0, 7.0, 7.0, 4.0, 3.0], "bins": [-3.26171875, -3.15545654296875, -3.0491943359375, -2.94293212890625, -2.836669921875, -2.73040771484375, -2.6241455078125, -2.51788330078125, -2.41162109375, -2.30535888671875, -2.1990966796875, -2.09283447265625, -1.986572265625, -1.88031005859375, -1.7740478515625, -1.66778564453125, -1.5615234375, -1.45526123046875, -1.3489990234375, -1.24273681640625, -1.136474609375, -1.03021240234375, -0.9239501953125, -0.81768798828125, -0.71142578125, -0.60516357421875, -0.4989013671875, -0.39263916015625, -0.286376953125, -0.18011474609375, -0.0738525390625, 0.03240966796875, 0.138671875, 0.24493408203125, 0.3511962890625, 0.45745849609375, 0.563720703125, 0.66998291015625, 0.7762451171875, 0.88250732421875, 0.98876953125, 1.09503173828125, 1.2012939453125, 1.30755615234375, 1.413818359375, 1.52008056640625, 1.6263427734375, 1.73260498046875, 1.8388671875, 1.94512939453125, 2.0513916015625, 2.15765380859375, 2.263916015625, 2.37017822265625, 2.4764404296875, 2.58270263671875, 2.68896484375, 2.79522705078125, 2.9014892578125, 3.00775146484375, 3.114013671875, 3.22027587890625, 3.3265380859375, 3.43280029296875, 3.5390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 16.0, 12.0, 16.0, 23.0, 26.0, 58.0, 45.0, 69.0, 88.0, 201.0, 454.0, 409.0, 172.0, 108.0, 76.0, 51.0, 40.0, 38.0, 28.0, 27.0, 11.0, 4.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.078125, -7.8463134765625, -7.614501953125, -7.3826904296875, -7.15087890625, -6.9190673828125, -6.687255859375, -6.4554443359375, -6.2236328125, -5.9918212890625, -5.760009765625, -5.5281982421875, -5.29638671875, -5.0645751953125, -4.832763671875, -4.6009521484375, -4.369140625, -4.1373291015625, -3.905517578125, -3.6737060546875, -3.44189453125, -3.2100830078125, -2.978271484375, -2.7464599609375, -2.5146484375, -2.2828369140625, -2.051025390625, -1.8192138671875, -1.58740234375, -1.3555908203125, -1.123779296875, -0.8919677734375, -0.66015625, -0.4283447265625, -0.196533203125, 0.0352783203125, 0.26708984375, 0.4989013671875, 0.730712890625, 0.9625244140625, 1.1943359375, 1.4261474609375, 1.657958984375, 1.8897705078125, 2.12158203125, 2.3533935546875, 2.585205078125, 2.8170166015625, 3.048828125, 3.2806396484375, 3.512451171875, 3.7442626953125, 3.97607421875, 4.2078857421875, 4.439697265625, 4.6715087890625, 4.9033203125, 5.1351318359375, 5.366943359375, 5.5987548828125, 5.83056640625, 6.0623779296875, 6.294189453125, 6.5260009765625, 6.7578125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 6.0, 0.0, 6.0, 7.0, 13.0, 10.0, 21.0, 16.0, 24.0, 37.0, 41.0, 27.0, 38.0, 54.0, 96.0, 120.0, 154.0, 214.0, 303.0, 524.0, 736.0, 1145.0, 1915.0, 3715.0, 8078.0, 21912.0, 94092.0, 5988706.0, 124753.0, 25506.0, 9146.0, 4035.0, 2220.0, 1231.0, 813.0, 519.0, 313.0, 269.0, 139.0, 135.0, 91.0, 57.0, 46.0, 29.0, 32.0, 25.0, 21.0, 17.0, 15.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-25.90625, -25.085693359375, -24.26513671875, -23.444580078125, -22.6240234375, -21.803466796875, -20.98291015625, -20.162353515625, -19.341796875, -18.521240234375, -17.70068359375, -16.880126953125, -16.0595703125, -15.239013671875, -14.41845703125, -13.597900390625, -12.77734375, -11.956787109375, -11.13623046875, -10.315673828125, -9.4951171875, -8.674560546875, -7.85400390625, -7.033447265625, -6.212890625, -5.392333984375, -4.57177734375, -3.751220703125, -2.9306640625, -2.110107421875, -1.28955078125, -0.468994140625, 0.3515625, 1.172119140625, 1.99267578125, 2.813232421875, 3.6337890625, 4.454345703125, 5.27490234375, 6.095458984375, 6.916015625, 7.736572265625, 8.55712890625, 9.377685546875, 10.1982421875, 11.018798828125, 11.83935546875, 12.659912109375, 13.48046875, 14.301025390625, 15.12158203125, 15.942138671875, 16.7626953125, 17.583251953125, 18.40380859375, 19.224365234375, 20.044921875, 20.865478515625, 21.68603515625, 22.506591796875, 23.3271484375, 24.147705078125, 24.96826171875, 25.788818359375, 26.609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 15.0, 11.0, 14.0, 17.0, 18.0, 32.0, 37.0, 47.0, 49.0, 72.0, 102.0, 328.0, 542.0, 242.0, 136.0, 70.0, 52.0, 38.0, 32.0, 26.0, 22.0, 17.0, 13.0, 16.0, 8.0, 10.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6796875, -8.3609619140625, -8.042236328125, -7.7235107421875, -7.40478515625, -7.0860595703125, -6.767333984375, -6.4486083984375, -6.1298828125, -5.8111572265625, -5.492431640625, -5.1737060546875, -4.85498046875, -4.5362548828125, -4.217529296875, -3.8988037109375, -3.580078125, -3.2613525390625, -2.942626953125, -2.6239013671875, -2.30517578125, -1.9864501953125, -1.667724609375, -1.3489990234375, -1.0302734375, -0.7115478515625, -0.392822265625, -0.0740966796875, 0.24462890625, 0.5633544921875, 0.882080078125, 1.2008056640625, 1.51953125, 1.8382568359375, 2.156982421875, 2.4757080078125, 2.79443359375, 3.1131591796875, 3.431884765625, 3.7506103515625, 4.0693359375, 4.3880615234375, 4.706787109375, 5.0255126953125, 5.34423828125, 5.6629638671875, 5.981689453125, 6.3004150390625, 6.619140625, 6.9378662109375, 7.256591796875, 7.5753173828125, 7.89404296875, 8.2127685546875, 8.531494140625, 8.8502197265625, 9.1689453125, 9.4876708984375, 9.806396484375, 10.1251220703125, 10.44384765625, 10.7625732421875, 11.081298828125, 11.4000244140625, 11.71875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 19.0, 94.0, 839.0, 33.0, 12.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-727.3897705078125, -708.3659057617188, -689.342041015625, -670.3181762695312, -651.2943115234375, -632.2704467773438, -613.24658203125, -594.2227172851562, -575.1988525390625, -556.1749877929688, -537.151123046875, -518.1272583007812, -499.1033935546875, -480.07952880859375, -461.0556640625, -442.03179931640625, -423.0079650878906, -403.9841003417969, -384.9602355957031, -365.9363708496094, -346.9125061035156, -327.8886413574219, -308.86480712890625, -289.8409423828125, -270.81707763671875, -251.793212890625, -232.76934814453125, -213.7454833984375, -194.72161865234375, -175.69775390625, -156.6739044189453, -137.65003967285156, -118.62615966796875, -99.602294921875, -80.57843017578125, -61.55457305908203, -42.53070831298828, -23.50684356689453, -4.4829864501953125, 14.540878295898438, 33.56474304199219, 52.58860778808594, 71.61247253417969, 90.6363296508789, 109.66019439697266, 128.68405151367188, 147.70791625976562, 166.73178100585938, 185.75564575195312, 204.77951049804688, 223.80337524414062, 242.82723999023438, 261.8511047363281, 280.8749694824219, 299.8988037109375, 318.92266845703125, 337.946533203125, 356.97039794921875, 375.9942626953125, 395.01812744140625, 414.0419921875, 433.06585693359375, 452.0897216796875, 471.11358642578125, 490.137451171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 17.0, 45.0, 533.0, 282.0, 38.0, 15.0, 19.0, 3.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-514.69970703125, -501.1358337402344, -487.57196044921875, -474.00811767578125, -460.4442443847656, -446.88037109375, -433.3164978027344, -419.75262451171875, -406.1887512207031, -392.6248779296875, -379.0610046386719, -365.49713134765625, -351.93328857421875, -338.3694152832031, -324.8055419921875, -311.2416687011719, -297.67779541015625, -284.1139221191406, -270.550048828125, -256.9862060546875, -243.4223175048828, -229.85845947265625, -216.29458618164062, -202.730712890625, -189.1668701171875, -175.60299682617188, -162.0391387939453, -148.4752655029297, -134.91139221191406, -121.34752655029297, -107.78366088867188, -94.21978759765625, -80.65591430664062, -67.09204864501953, -53.528175354003906, -39.96430969238281, -26.400440216064453, -12.836570739746094, 0.727294921875, 14.291168212890625, 27.85503387451172, 41.41890335083008, 54.98277282714844, 68.54663848876953, 82.11050415039062, 95.67437744140625, 109.23824310302734, 122.80211639404297, 136.36598205566406, 149.9298553466797, 163.49371337890625, 177.05758666992188, 190.6214599609375, 204.18533325195312, 217.7491912841797, 231.3130645751953, 244.87692260742188, 258.4407958984375, 272.0046691894531, 285.56854248046875, 299.13238525390625, 312.6962585449219, 326.2601318359375, 339.8240051269531, 353.38787841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 15.0, 18.0, 27.0, 30.0, 49.0, 80.0, 122.0, 171.0, 248.0, 430.0, 646.0, 976.0, 1678.0, 2917.0, 5915.0, 13237.0, 33525.0, 111659.0, 3505025.0, 419214.0, 56362.0, 22007.0, 9832.0, 4626.0, 2323.0, 1223.0, 714.0, 410.0, 249.0, 157.0, 91.0, 86.0, 53.0, 29.0, 28.0, 25.0, 22.0, 8.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3037109375, -1.2613372802734375, -1.218963623046875, -1.1765899658203125, -1.13421630859375, -1.0918426513671875, -1.049468994140625, -1.0070953369140625, -0.9647216796875, -0.9223480224609375, -0.879974365234375, -0.8376007080078125, -0.79522705078125, -0.7528533935546875, -0.710479736328125, -0.6681060791015625, -0.625732421875, -0.5833587646484375, -0.540985107421875, -0.4986114501953125, -0.45623779296875, -0.4138641357421875, -0.371490478515625, -0.3291168212890625, -0.2867431640625, -0.2443695068359375, -0.201995849609375, -0.1596221923828125, -0.11724853515625, -0.0748748779296875, -0.032501220703125, 0.0098724365234375, 0.05224609375, 0.0946197509765625, 0.136993408203125, 0.1793670654296875, 0.22174072265625, 0.2641143798828125, 0.306488037109375, 0.3488616943359375, 0.3912353515625, 0.4336090087890625, 0.475982666015625, 0.5183563232421875, 0.56072998046875, 0.6031036376953125, 0.645477294921875, 0.6878509521484375, 0.730224609375, 0.7725982666015625, 0.814971923828125, 0.8573455810546875, 0.89971923828125, 0.9420928955078125, 0.984466552734375, 1.0268402099609375, 1.0692138671875, 1.1115875244140625, 1.153961181640625, 1.1963348388671875, 1.23870849609375, 1.2810821533203125, 1.323455810546875, 1.3658294677734375, 1.408203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 13.0, 13.0, 12.0, 26.0, 113.0, 277.0, 306.0, 133.0, 33.0, 16.0, 11.0, 11.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12723207473754883, -0.12433719635009766, -0.12144231796264648, -0.11854743957519531, -0.11565256118774414, -0.11275768280029297, -0.1098628044128418, -0.10696792602539062, -0.10407304763793945, -0.10117816925048828, -0.09828329086303711, -0.09538841247558594, -0.09249353408813477, -0.0895986557006836, -0.08670377731323242, -0.08380889892578125, -0.08091402053833008, -0.0780191421508789, -0.07512426376342773, -0.07222938537597656, -0.06933450698852539, -0.06643962860107422, -0.06354475021362305, -0.060649871826171875, -0.0577549934387207, -0.05486011505126953, -0.05196523666381836, -0.04907035827636719, -0.046175479888916016, -0.043280601501464844, -0.04038572311401367, -0.0374908447265625, -0.03459596633911133, -0.031701087951660156, -0.028806209564208984, -0.025911331176757812, -0.02301645278930664, -0.02012157440185547, -0.017226696014404297, -0.014331817626953125, -0.011436939239501953, -0.008542060852050781, -0.005647182464599609, -0.0027523040771484375, 0.00014257431030273438, 0.0030374526977539062, 0.005932331085205078, 0.00882720947265625, 0.011722087860107422, 0.014616966247558594, 0.017511844635009766, 0.020406723022460938, 0.02330160140991211, 0.02619647979736328, 0.029091358184814453, 0.031986236572265625, 0.0348811149597168, 0.03777599334716797, 0.04067087173461914, 0.04356575012207031, 0.046460628509521484, 0.049355506896972656, 0.05225038528442383, 0.055145263671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 8.0, 8.0, 10.0, 21.0, 24.0, 34.0, 38.0, 57.0, 90.0, 110.0, 179.0, 334.0, 629.0, 1480.0, 3641.0, 10836.0, 44320.0, 290256.0, 2905048.0, 810971.0, 96440.0, 19518.0, 5926.0, 2181.0, 955.0, 463.0, 233.0, 134.0, 86.0, 59.0, 54.0, 27.0, 26.0, 9.0, 14.0, 8.0, 11.0, 9.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3857421875, -1.3433837890625, -1.301025390625, -1.2586669921875, -1.21630859375, -1.1739501953125, -1.131591796875, -1.0892333984375, -1.046875, -1.0045166015625, -0.962158203125, -0.9197998046875, -0.87744140625, -0.8350830078125, -0.792724609375, -0.7503662109375, -0.7080078125, -0.6656494140625, -0.623291015625, -0.5809326171875, -0.53857421875, -0.4962158203125, -0.453857421875, -0.4114990234375, -0.369140625, -0.3267822265625, -0.284423828125, -0.2420654296875, -0.19970703125, -0.1573486328125, -0.114990234375, -0.0726318359375, -0.0302734375, 0.0120849609375, 0.054443359375, 0.0968017578125, 0.13916015625, 0.1815185546875, 0.223876953125, 0.2662353515625, 0.30859375, 0.3509521484375, 0.393310546875, 0.4356689453125, 0.47802734375, 0.5203857421875, 0.562744140625, 0.6051025390625, 0.6474609375, 0.6898193359375, 0.732177734375, 0.7745361328125, 0.81689453125, 0.8592529296875, 0.901611328125, 0.9439697265625, 0.986328125, 1.0286865234375, 1.071044921875, 1.1134033203125, 1.15576171875, 1.1981201171875, 1.240478515625, 1.2828369140625, 1.3251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 10.0, 10.0, 12.0, 19.0, 21.0, 29.0, 37.0, 55.0, 66.0, 95.0, 107.0, 149.0, 193.0, 258.0, 266.0, 341.0, 451.0, 400.0, 297.0, 261.0, 196.0, 167.0, 131.0, 99.0, 100.0, 69.0, 51.0, 35.0, 33.0, 27.0, 23.0, 19.0, 11.0, 12.0, 8.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17529296875, -0.16959571838378906, -0.16389846801757812, -0.1582012176513672, -0.15250396728515625, -0.1468067169189453, -0.14110946655273438, -0.13541221618652344, -0.1297149658203125, -0.12401771545410156, -0.11832046508789062, -0.11262321472167969, -0.10692596435546875, -0.10122871398925781, -0.09553146362304688, -0.08983421325683594, -0.084136962890625, -0.07843971252441406, -0.07274246215820312, -0.06704521179199219, -0.06134796142578125, -0.05565071105957031, -0.049953460693359375, -0.04425621032714844, -0.0385589599609375, -0.03286170959472656, -0.027164459228515625, -0.021467208862304688, -0.01576995849609375, -0.010072708129882812, -0.004375457763671875, 0.0013217926025390625, 0.00701904296875, 0.012716293334960938, 0.018413543701171875, 0.024110794067382812, 0.02980804443359375, 0.03550529479980469, 0.041202545166015625, 0.04689979553222656, 0.0525970458984375, 0.05829429626464844, 0.06399154663085938, 0.06968879699707031, 0.07538604736328125, 0.08108329772949219, 0.08678054809570312, 0.09247779846191406, 0.098175048828125, 0.10387229919433594, 0.10956954956054688, 0.11526679992675781, 0.12096405029296875, 0.1266613006591797, 0.13235855102539062, 0.13805580139160156, 0.1437530517578125, 0.14945030212402344, 0.15514755249023438, 0.1608448028564453, 0.16654205322265625, 0.1722393035888672, 0.17793655395507812, 0.18363380432128906, 0.1893310546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 15.0, 59.0, 160.0, 326.0, 254.0, 104.0, 50.0, 24.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.431906223297119, -4.1932783126831055, -3.954650640487671, -3.7160229682922363, -3.4773950576782227, -3.238767385482788, -3.0001397132873535, -2.76151180267334, -2.5228841304779053, -2.2842564582824707, -2.045628547668457, -1.8070008754730225, -1.5683730840682983, -1.3297452926635742, -1.0911176204681396, -0.8524898290634155, -0.6138620376586914, -0.3752342760562897, -0.13660651445388794, 0.1020212173461914, 0.3406490087509155, 0.5792768001556396, 0.8179044723510742, 1.0565322637557983, 1.2951600551605225, 1.5337878465652466, 1.7724156379699707, 2.0110433101654053, 2.24967098236084, 2.4882988929748535, 2.726926565170288, 2.9655542373657227, 3.204181671142578, 3.4428093433380127, 3.6814372539520264, 3.920064926147461, 4.158692836761475, 4.397320747375488, 4.635948181152344, 4.874576091766357, 5.113204002380371, 5.351831912994385, 5.59045934677124, 5.829087257385254, 6.067715167999268, 6.306343078613281, 6.544970512390137, 6.78359842300415, 7.022225856781006, 7.2608537673950195, 7.499481201171875, 7.738109111785889, 7.976737022399902, 8.215364456176758, 8.45399284362793, 8.692620277404785, 8.93124771118164, 9.169875144958496, 9.408503532409668, 9.647130966186523, 9.885758399963379, 10.12438678741455, 10.363014221191406, 10.601641654968262, 10.840270042419434]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 16.0, 9.0, 11.0, 12.0, 24.0, 31.0, 43.0, 57.0, 46.0, 54.0, 67.0, 67.0, 55.0, 60.0, 48.0, 55.0, 47.0, 42.0, 57.0, 37.0, 26.0, 26.0, 17.0, 19.0, 14.0, 11.0, 11.0, 7.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5127581357955933, -1.460258960723877, -1.4077597856521606, -1.3552606105804443, -1.302761435508728, -1.2502622604370117, -1.197763204574585, -1.145263910293579, -1.0927648544311523, -1.040265679359436, -0.9877665042877197, -0.9352673292160034, -0.8827681541442871, -0.8302689790725708, -0.7777698636054993, -0.725270688533783, -0.6727714538574219, -0.6202722787857056, -0.5677731037139893, -0.515273928642273, -0.46277478337287903, -0.4102756083011627, -0.3577764630317688, -0.3052772879600525, -0.2527781128883362, -0.20027893781661987, -0.14777977764606476, -0.09528061747550964, -0.042781442403793335, 0.009717732667922974, 0.062216877937316895, 0.1147160530090332, 0.16721510887145996, 0.21971428394317627, 0.2722134590148926, 0.3247126042842865, 0.3772117793560028, 0.4297109544277191, 0.48221009969711304, 0.5347092747688293, 0.5872084498405457, 0.639707624912262, 0.6922067999839783, 0.7447059154510498, 0.7972050905227661, 0.8497042655944824, 0.9022034406661987, 0.954702615737915, 1.0072017908096313, 1.0597009658813477, 1.112200140953064, 1.1646993160247803, 1.2171984910964966, 1.269697666168213, 1.3221967220306396, 1.3746960163116455, 1.4271950721740723, 1.4796942472457886, 1.5321934223175049, 1.5846925973892212, 1.6371917724609375, 1.6896909475326538, 1.7421901226043701, 1.7946891784667969, 1.8471884727478027]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 6.0, 15.0, 13.0, 22.0, 24.0, 54.0, 70.0, 79.0, 121.0, 193.0, 275.0, 441.0, 710.0, 1224.0, 2177.0, 4329.0, 9928.0, 29971.0, 170070.0, 680147.0, 108899.0, 23101.0, 8164.0, 3674.0, 1913.0, 1071.0, 648.0, 357.0, 241.0, 197.0, 112.0, 82.0, 55.0, 31.0, 28.0, 28.0, 23.0, 13.0, 11.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.802734375, -0.7806777954101562, -0.7586212158203125, -0.7365646362304688, -0.714508056640625, -0.6924514770507812, -0.6703948974609375, -0.6483383178710938, -0.62628173828125, -0.6042251586914062, -0.5821685791015625, -0.5601119995117188, -0.538055419921875, -0.5159988403320312, -0.4939422607421875, -0.47188568115234375, -0.4498291015625, -0.42777252197265625, -0.4057159423828125, -0.38365936279296875, -0.361602783203125, -0.33954620361328125, -0.3174896240234375, -0.29543304443359375, -0.27337646484375, -0.25131988525390625, -0.2292633056640625, -0.20720672607421875, -0.185150146484375, -0.16309356689453125, -0.1410369873046875, -0.11898040771484375, -0.096923828125, -0.07486724853515625, -0.0528106689453125, -0.03075408935546875, -0.008697509765625, 0.01335906982421875, 0.0354156494140625, 0.05747222900390625, 0.07952880859375, 0.10158538818359375, 0.1236419677734375, 0.14569854736328125, 0.167755126953125, 0.18981170654296875, 0.2118682861328125, 0.23392486572265625, 0.2559814453125, 0.27803802490234375, 0.3000946044921875, 0.32215118408203125, 0.344207763671875, 0.36626434326171875, 0.3883209228515625, 0.41037750244140625, 0.43243408203125, 0.45449066162109375, 0.4765472412109375, 0.49860382080078125, 0.520660400390625, 0.5427169799804688, 0.5647735595703125, 0.5868301391601562, 0.60888671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 20.0, 20.0, 21.0, 44.0, 50.0, 66.0, 79.0, 86.0, 95.0, 107.0, 88.0, 78.0, 68.0, 44.0, 26.0, 19.0, 21.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06875371932983398, -0.06682872772216797, -0.06490373611450195, -0.06297874450683594, -0.06105375289916992, -0.059128761291503906, -0.05720376968383789, -0.055278778076171875, -0.05335378646850586, -0.051428794860839844, -0.04950380325317383, -0.04757881164550781, -0.0456538200378418, -0.04372882843017578, -0.041803836822509766, -0.03987884521484375, -0.037953853607177734, -0.03602886199951172, -0.0341038703918457, -0.03217887878417969, -0.030253887176513672, -0.028328895568847656, -0.02640390396118164, -0.024478912353515625, -0.02255392074584961, -0.020628929138183594, -0.018703937530517578, -0.016778945922851562, -0.014853954315185547, -0.012928962707519531, -0.011003971099853516, -0.0090789794921875, -0.007153987884521484, -0.005228996276855469, -0.003304004669189453, -0.0013790130615234375, 0.0005459785461425781, 0.0024709701538085938, 0.004395961761474609, 0.006320953369140625, 0.00824594497680664, 0.010170936584472656, 0.012095928192138672, 0.014020919799804688, 0.015945911407470703, 0.01787090301513672, 0.019795894622802734, 0.02172088623046875, 0.023645877838134766, 0.02557086944580078, 0.027495861053466797, 0.029420852661132812, 0.03134584426879883, 0.033270835876464844, 0.03519582748413086, 0.037120819091796875, 0.03904581069946289, 0.040970802307128906, 0.04289579391479492, 0.04482078552246094, 0.04674577713012695, 0.04867076873779297, 0.050595760345458984, 0.052520751953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 0.0, 8.0, 10.0, 6.0, 10.0, 15.0, 21.0, 34.0, 48.0, 47.0, 85.0, 117.0, 185.0, 338.0, 537.0, 971.0, 2105.0, 5476.0, 20586.0, 167761.0, 739844.0, 88627.0, 13708.0, 4220.0, 1683.0, 875.0, 455.0, 264.0, 175.0, 81.0, 83.0, 51.0, 33.0, 28.0, 20.0, 12.0, 12.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0087890625, -0.9744415283203125, -0.940093994140625, -0.9057464599609375, -0.87139892578125, -0.8370513916015625, -0.802703857421875, -0.7683563232421875, -0.7340087890625, -0.6996612548828125, -0.665313720703125, -0.6309661865234375, -0.59661865234375, -0.5622711181640625, -0.527923583984375, -0.4935760498046875, -0.459228515625, -0.4248809814453125, -0.390533447265625, -0.3561859130859375, -0.32183837890625, -0.2874908447265625, -0.253143310546875, -0.2187957763671875, -0.1844482421875, -0.1501007080078125, -0.115753173828125, -0.0814056396484375, -0.04705810546875, -0.0127105712890625, 0.021636962890625, 0.0559844970703125, 0.09033203125, 0.1246795654296875, 0.159027099609375, 0.1933746337890625, 0.22772216796875, 0.2620697021484375, 0.296417236328125, 0.3307647705078125, 0.3651123046875, 0.3994598388671875, 0.433807373046875, 0.4681549072265625, 0.50250244140625, 0.5368499755859375, 0.571197509765625, 0.6055450439453125, 0.639892578125, 0.6742401123046875, 0.708587646484375, 0.7429351806640625, 0.77728271484375, 0.8116302490234375, 0.845977783203125, 0.8803253173828125, 0.9146728515625, 0.9490203857421875, 0.983367919921875, 1.0177154541015625, 1.05206298828125, 1.0864105224609375, 1.120758056640625, 1.1551055908203125, 1.189453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 9.0, 5.0, 15.0, 8.0, 11.0, 13.0, 21.0, 21.0, 23.0, 35.0, 25.0, 30.0, 19.0, 34.0, 42.0, 28.0, 43.0, 49.0, 42.0, 40.0, 41.0, 41.0, 33.0, 37.0, 26.0, 35.0, 32.0, 25.0, 31.0, 14.0, 22.0, 18.0, 13.0, 18.0, 15.0, 9.0, 10.0, 6.0, 11.0, 10.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.2391357421875, -0.23168373107910156, -0.22423171997070312, -0.2167797088623047, -0.20932769775390625, -0.2018756866455078, -0.19442367553710938, -0.18697166442871094, -0.1795196533203125, -0.17206764221191406, -0.16461563110351562, -0.1571636199951172, -0.14971160888671875, -0.1422595977783203, -0.13480758666992188, -0.12735557556152344, -0.119903564453125, -0.11245155334472656, -0.10499954223632812, -0.09754753112792969, -0.09009552001953125, -0.08264350891113281, -0.07519149780273438, -0.06773948669433594, -0.0602874755859375, -0.05283546447753906, -0.045383453369140625, -0.03793144226074219, -0.03047943115234375, -0.023027420043945312, -0.015575408935546875, -0.008123397827148438, -0.00067138671875, 0.0067806243896484375, 0.014232635498046875, 0.021684646606445312, 0.02913665771484375, 0.03658866882324219, 0.044040679931640625, 0.05149269104003906, 0.0589447021484375, 0.06639671325683594, 0.07384872436523438, 0.08130073547363281, 0.08875274658203125, 0.09620475769042969, 0.10365676879882812, 0.11110877990722656, 0.118560791015625, 0.12601280212402344, 0.13346481323242188, 0.1409168243408203, 0.14836883544921875, 0.1558208465576172, 0.16327285766601562, 0.17072486877441406, 0.1781768798828125, 0.18562889099121094, 0.19308090209960938, 0.2005329132080078, 0.20798492431640625, 0.2154369354248047, 0.22288894653320312, 0.23034095764160156, 0.23779296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 23.0, 14.0, 27.0, 56.0, 81.0, 180.0, 394.0, 952.0, 3808.0, 63288.0, 968521.0, 8546.0, 1610.0, 527.0, 234.0, 115.0, 61.0, 29.0, 28.0, 15.0, 10.0, 8.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.2777099609375, -6.082763671875, -5.8878173828125, -5.69287109375, -5.4979248046875, -5.302978515625, -5.1080322265625, -4.9130859375, -4.7181396484375, -4.523193359375, -4.3282470703125, -4.13330078125, -3.9383544921875, -3.743408203125, -3.5484619140625, -3.353515625, -3.1585693359375, -2.963623046875, -2.7686767578125, -2.57373046875, -2.3787841796875, -2.183837890625, -1.9888916015625, -1.7939453125, -1.5989990234375, -1.404052734375, -1.2091064453125, -1.01416015625, -0.8192138671875, -0.624267578125, -0.4293212890625, -0.234375, -0.0394287109375, 0.155517578125, 0.3504638671875, 0.54541015625, 0.7403564453125, 0.935302734375, 1.1302490234375, 1.3251953125, 1.5201416015625, 1.715087890625, 1.9100341796875, 2.10498046875, 2.2999267578125, 2.494873046875, 2.6898193359375, 2.884765625, 3.0797119140625, 3.274658203125, 3.4696044921875, 3.66455078125, 3.8594970703125, 4.054443359375, 4.2493896484375, 4.4443359375, 4.6392822265625, 4.834228515625, 5.0291748046875, 5.22412109375, 5.4190673828125, 5.614013671875, 5.8089599609375, 6.00390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 2.0, 12.0, 6.0, 4.0, 16.0, 12.0, 15.0, 17.0, 24.0, 42.0, 48.0, 73.0, 139.0, 190.0, 115.0, 58.0, 41.0, 30.0, 30.0, 27.0, 16.0, 15.0, 11.0, 8.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.000701904296875, -0.0006814450025558472, -0.0006609857082366943, -0.0006405264139175415, -0.0006200671195983887, -0.0005996078252792358, -0.000579148530960083, -0.0005586892366409302, -0.0005382299423217773, -0.0005177706480026245, -0.0004973113536834717, -0.00047685205936431885, -0.000456392765045166, -0.0004359334707260132, -0.00041547417640686035, -0.0003950148820877075, -0.0003745555877685547, -0.00035409629344940186, -0.000333636999130249, -0.0003131777048110962, -0.00029271841049194336, -0.00027225911617279053, -0.0002517998218536377, -0.00023134052753448486, -0.00021088123321533203, -0.0001904219388961792, -0.00016996264457702637, -0.00014950335025787354, -0.0001290440559387207, -0.00010858476161956787, -8.812546730041504e-05, -6.766617298126221e-05, -4.7206878662109375e-05, -2.6747584342956543e-05, -6.288290023803711e-06, 1.4171004295349121e-05, 3.463029861450195e-05, 5.5089592933654785e-05, 7.554888725280762e-05, 9.600818157196045e-05, 0.00011646747589111328, 0.0001369267702102661, 0.00015738606452941895, 0.00017784535884857178, 0.0001983046531677246, 0.00021876394748687744, 0.00023922324180603027, 0.0002596825361251831, 0.00028014183044433594, 0.00030060112476348877, 0.0003210604190826416, 0.00034151971340179443, 0.00036197900772094727, 0.0003824383020401001, 0.00040289759635925293, 0.00042335689067840576, 0.0004438161849975586, 0.0004642754793167114, 0.00048473477363586426, 0.0005051940679550171, 0.0005256533622741699, 0.0005461126565933228, 0.0005665719509124756, 0.0005870312452316284, 0.0006074905395507812]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 11.0, 15.0, 13.0, 17.0, 32.0, 31.0, 49.0, 53.0, 78.0, 125.0, 182.0, 282.0, 445.0, 804.0, 1377.0, 3028.0, 8091.0, 34165.0, 791428.0, 178050.0, 19378.0, 5666.0, 2339.0, 1143.0, 582.0, 356.0, 233.0, 165.0, 113.0, 80.0, 62.0, 32.0, 25.0, 22.0, 12.0, 14.0, 10.0, 16.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.048828125, -2.953033447265625, -2.85723876953125, -2.761444091796875, -2.6656494140625, -2.569854736328125, -2.47406005859375, -2.378265380859375, -2.282470703125, -2.186676025390625, -2.09088134765625, -1.995086669921875, -1.8992919921875, -1.803497314453125, -1.70770263671875, -1.611907958984375, -1.51611328125, -1.420318603515625, -1.32452392578125, -1.228729248046875, -1.1329345703125, -1.037139892578125, -0.94134521484375, -0.845550537109375, -0.749755859375, -0.653961181640625, -0.55816650390625, -0.462371826171875, -0.3665771484375, -0.270782470703125, -0.17498779296875, -0.079193115234375, 0.0166015625, 0.112396240234375, 0.20819091796875, 0.303985595703125, 0.3997802734375, 0.495574951171875, 0.59136962890625, 0.687164306640625, 0.782958984375, 0.878753662109375, 0.97454833984375, 1.070343017578125, 1.1661376953125, 1.261932373046875, 1.35772705078125, 1.453521728515625, 1.54931640625, 1.645111083984375, 1.74090576171875, 1.836700439453125, 1.9324951171875, 2.028289794921875, 2.12408447265625, 2.219879150390625, 2.315673828125, 2.411468505859375, 2.50726318359375, 2.603057861328125, 2.6988525390625, 2.794647216796875, 2.89044189453125, 2.986236572265625, 3.08203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 2.0, 14.0, 7.0, 15.0, 13.0, 25.0, 24.0, 42.0, 54.0, 85.0, 189.0, 177.0, 97.0, 67.0, 35.0, 24.0, 29.0, 18.0, 10.0, 12.0, 11.0, 3.0, 9.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0160903930664062, -0.9862823486328125, -0.9564743041992188, -0.926666259765625, -0.8968582153320312, -0.8670501708984375, -0.8372421264648438, -0.80743408203125, -0.7776260375976562, -0.7478179931640625, -0.7180099487304688, -0.688201904296875, -0.6583938598632812, -0.6285858154296875, -0.5987777709960938, -0.5689697265625, -0.5391616821289062, -0.5093536376953125, -0.47954559326171875, -0.449737548828125, -0.41992950439453125, -0.3901214599609375, -0.36031341552734375, -0.33050537109375, -0.30069732666015625, -0.2708892822265625, -0.24108123779296875, -0.211273193359375, -0.18146514892578125, -0.1516571044921875, -0.12184906005859375, -0.092041015625, -0.06223297119140625, -0.0324249267578125, -0.00261688232421875, 0.027191162109375, 0.05699920654296875, 0.0868072509765625, 0.11661529541015625, 0.14642333984375, 0.17623138427734375, 0.2060394287109375, 0.23584747314453125, 0.265655517578125, 0.29546356201171875, 0.3252716064453125, 0.35507965087890625, 0.3848876953125, 0.41469573974609375, 0.4445037841796875, 0.47431182861328125, 0.504119873046875, 0.5339279174804688, 0.5637359619140625, 0.5935440063476562, 0.62335205078125, 0.6531600952148438, 0.6829681396484375, 0.7127761840820312, 0.742584228515625, 0.7723922729492188, 0.8022003173828125, 0.8320083618164062, 0.86181640625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 14.0, 21.0, 49.0, 116.0, 256.0, 320.0, 127.0, 61.0, 25.0, 10.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.086206436157227, -9.68289852142334, -9.27959156036377, -8.876283645629883, -8.472975730895996, -8.069668769836426, -7.666360855102539, -7.2630534172058105, -6.859745979309082, -6.4564385414123535, -6.053130626678467, -5.649823188781738, -5.24651575088501, -4.843208312988281, -4.4399003982543945, -4.036592960357666, -3.6332850456237793, -3.2299773693084717, -2.826669931411743, -2.4233622550964355, -2.020054817199707, -1.6167471408843994, -1.2134394645690918, -0.8101320266723633, -0.40682435035705566, -0.00351676344871521, 0.39979082345962524, 0.8030984401702881, 1.2064059972763062, 1.6097135543823242, 2.013021230697632, 2.4163286685943604, 2.819636344909668, 3.2229440212249756, 3.626251459121704, 4.029559135437012, 4.43286657333374, 4.836174011230469, 5.2394819259643555, 5.642789363861084, 6.0460968017578125, 6.449404239654541, 6.852712154388428, 7.256019592285156, 7.659327030181885, 8.062634468078613, 8.4659423828125, 8.86924934387207, 9.272558212280273, 9.67586612701416, 10.07917308807373, 10.482481002807617, 10.885788917541504, 11.289095878601074, 11.692403793334961, 12.095710754394531, 12.499018669128418, 12.902326583862305, 13.305633544921875, 13.708941459655762, 14.112249374389648, 14.515556335449219, 14.918864250183105, 15.322172164916992, 15.725479125976562]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 9.0, 28.0, 36.0, 49.0, 89.0, 93.0, 118.0, 123.0, 97.0, 106.0, 71.0, 43.0, 22.0, 29.0, 15.0, 10.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.885300636291504, -4.714145660400391, -4.5429911613464355, -4.371836185455322, -4.200681209564209, -4.029526233673096, -3.8583717346191406, -3.6872167587280273, -3.516061782836914, -3.34490704536438, -3.1737520694732666, -3.0025973320007324, -2.831442356109619, -2.660287618637085, -2.489132881164551, -2.3179779052734375, -2.1468231678009033, -1.9756683111190796, -1.8045134544372559, -1.6333587169647217, -1.4622037410736084, -1.2910490036010742, -1.1198941469192505, -0.9487392902374268, -0.777584433555603, -0.6064295768737793, -0.43527474999427795, -0.2641199231147766, -0.09296506643295288, 0.07818979024887085, 0.2493445873260498, 0.42049944400787354, 0.5916543006896973, 0.762809157371521, 0.9339640140533447, 1.105118751525879, 1.2762737274169922, 1.4474284648895264, 1.61858332157135, 1.7897381782531738, 1.9608930349349976, 2.1320478916168213, 2.3032026290893555, 2.4743576049804688, 2.645512342453003, 2.816667318344116, 2.9878220558166504, 3.1589770317077637, 3.330131769180298, 3.501286506652832, 3.6724414825439453, 3.8435962200164795, 4.014750957489014, 4.185905933380127, 4.35706090927124, 4.528215408325195, 4.699370384216309, 4.870525360107422, 5.041679859161377, 5.21283483505249, 5.3839898109436035, 5.555144786834717, 5.726299285888672, 5.897454261779785, 6.068609237670898]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 18.0, 27.0, 36.0, 122.0, 493.0, 8569.0, 4177163.0, 7429.0, 281.0, 57.0, 26.0, 13.0, 14.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.734375, -23.234619140625, -22.73486328125, -22.235107421875, -21.7353515625, -21.235595703125, -20.73583984375, -20.236083984375, -19.736328125, -19.236572265625, -18.73681640625, -18.237060546875, -17.7373046875, -17.237548828125, -16.73779296875, -16.238037109375, -15.73828125, -15.238525390625, -14.73876953125, -14.239013671875, -13.7392578125, -13.239501953125, -12.73974609375, -12.239990234375, -11.740234375, -11.240478515625, -10.74072265625, -10.240966796875, -9.7412109375, -9.241455078125, -8.74169921875, -8.241943359375, -7.7421875, -7.242431640625, -6.74267578125, -6.242919921875, -5.7431640625, -5.243408203125, -4.74365234375, -4.243896484375, -3.744140625, -3.244384765625, -2.74462890625, -2.244873046875, -1.7451171875, -1.245361328125, -0.74560546875, -0.245849609375, 0.25390625, 0.753662109375, 1.25341796875, 1.753173828125, 2.2529296875, 2.752685546875, 3.25244140625, 3.752197265625, 4.251953125, 4.751708984375, 5.25146484375, 5.751220703125, 6.2509765625, 6.750732421875, 7.25048828125, 7.750244140625, 8.25]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 8.0, 6.0, 20.0, 26.0, 31.0, 39.0, 59.0, 59.0, 75.0, 84.0, 94.0, 90.0, 92.0, 69.0, 59.0, 51.0, 32.0, 27.0, 15.0, 17.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06982421875, -0.06776952743530273, -0.06571483612060547, -0.0636601448059082, -0.06160545349121094, -0.05955076217651367, -0.057496070861816406, -0.05544137954711914, -0.053386688232421875, -0.05133199691772461, -0.049277305603027344, -0.04722261428833008, -0.04516792297363281, -0.04311323165893555, -0.04105854034423828, -0.039003849029541016, -0.03694915771484375, -0.034894466400146484, -0.03283977508544922, -0.030785083770751953, -0.028730392456054688, -0.026675701141357422, -0.024621009826660156, -0.02256631851196289, -0.020511627197265625, -0.01845693588256836, -0.016402244567871094, -0.014347553253173828, -0.012292861938476562, -0.010238170623779297, -0.008183479309082031, -0.006128787994384766, -0.0040740966796875, -0.0020194053649902344, 3.528594970703125e-05, 0.002089977264404297, 0.0041446685791015625, 0.006199359893798828, 0.008254051208496094, 0.01030874252319336, 0.012363433837890625, 0.01441812515258789, 0.016472816467285156, 0.018527507781982422, 0.020582199096679688, 0.022636890411376953, 0.02469158172607422, 0.026746273040771484, 0.02880096435546875, 0.030855655670166016, 0.03291034698486328, 0.03496503829956055, 0.03701972961425781, 0.03907442092895508, 0.041129112243652344, 0.04318380355834961, 0.045238494873046875, 0.04729318618774414, 0.049347877502441406, 0.05140256881713867, 0.05345726013183594, 0.0555119514465332, 0.05756664276123047, 0.059621334075927734, 0.061676025390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 14.0, 16.0, 24.0, 37.0, 92.0, 139.0, 327.0, 739.0, 2096.0, 7842.0, 40602.0, 474716.0, 3550703.0, 96640.0, 14585.0, 3471.0, 1137.0, 488.0, 230.0, 137.0, 97.0, 42.0, 32.0, 16.0, 15.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.142578125, -3.05072021484375, -2.9588623046875, -2.86700439453125, -2.775146484375, -2.68328857421875, -2.5914306640625, -2.49957275390625, -2.40771484375, -2.31585693359375, -2.2239990234375, -2.13214111328125, -2.040283203125, -1.94842529296875, -1.8565673828125, -1.76470947265625, -1.6728515625, -1.58099365234375, -1.4891357421875, -1.39727783203125, -1.305419921875, -1.21356201171875, -1.1217041015625, -1.02984619140625, -0.93798828125, -0.84613037109375, -0.7542724609375, -0.66241455078125, -0.570556640625, -0.47869873046875, -0.3868408203125, -0.29498291015625, -0.203125, -0.11126708984375, -0.0194091796875, 0.07244873046875, 0.164306640625, 0.25616455078125, 0.3480224609375, 0.43988037109375, 0.53173828125, 0.62359619140625, 0.7154541015625, 0.80731201171875, 0.899169921875, 0.99102783203125, 1.0828857421875, 1.17474365234375, 1.2666015625, 1.35845947265625, 1.4503173828125, 1.54217529296875, 1.634033203125, 1.72589111328125, 1.8177490234375, 1.90960693359375, 2.00146484375, 2.09332275390625, 2.1851806640625, 2.27703857421875, 2.368896484375, 2.46075439453125, 2.5526123046875, 2.64447021484375, 2.736328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 6.0, 1.0, 8.0, 8.0, 8.0, 14.0, 12.0, 10.0, 14.0, 22.0, 35.0, 37.0, 57.0, 80.0, 121.0, 161.0, 428.0, 1493.0, 716.0, 272.0, 171.0, 110.0, 72.0, 66.0, 28.0, 39.0, 17.0, 13.0, 17.0, 14.0, 6.0, 8.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2154541015625, -0.20940017700195312, -0.20334625244140625, -0.19729232788085938, -0.1912384033203125, -0.18518447875976562, -0.17913055419921875, -0.17307662963867188, -0.167022705078125, -0.16096878051757812, -0.15491485595703125, -0.14886093139648438, -0.1428070068359375, -0.13675308227539062, -0.13069915771484375, -0.12464523315429688, -0.11859130859375, -0.11253738403320312, -0.10648345947265625, -0.10042953491210938, -0.0943756103515625, -0.08832168579101562, -0.08226776123046875, -0.07621383666992188, -0.070159912109375, -0.06410598754882812, -0.05805206298828125, -0.051998138427734375, -0.0459442138671875, -0.039890289306640625, -0.03383636474609375, -0.027782440185546875, -0.021728515625, -0.015674591064453125, -0.00962066650390625, -0.003566741943359375, 0.0024871826171875, 0.008541107177734375, 0.01459503173828125, 0.020648956298828125, 0.026702880859375, 0.032756805419921875, 0.03881072998046875, 0.044864654541015625, 0.0509185791015625, 0.056972503662109375, 0.06302642822265625, 0.06908035278320312, 0.07513427734375, 0.08118820190429688, 0.08724212646484375, 0.09329605102539062, 0.0993499755859375, 0.10540390014648438, 0.11145782470703125, 0.11751174926757812, 0.123565673828125, 0.12961959838867188, 0.13567352294921875, 0.14172744750976562, 0.1477813720703125, 0.15383529663085938, 0.15988922119140625, 0.16594314575195312, 0.1719970703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 11.0, 42.0, 276.0, 547.0, 111.0, 15.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.924245834350586, -6.611834526062012, -6.2994232177734375, -5.9870123863220215, -5.674601078033447, -5.362189769744873, -5.049778938293457, -4.737367630004883, -4.424956321716309, -4.112545013427734, -3.8001339435577393, -3.487722873687744, -3.17531156539917, -2.8629002571105957, -2.5504891872406006, -2.2380781173706055, -1.9256668090820312, -1.6132556200027466, -1.300844430923462, -0.9884332418441772, -0.6760220527648926, -0.3636108636856079, -0.05119967460632324, 0.2612113952636719, 0.5736227035522461, 0.8860338926315308, 1.1984450817108154, 1.5108562707901, 1.8232674598693848, 2.135678768157959, 2.448089838027954, 2.760500907897949, 3.0729122161865234, 3.3853235244750977, 3.6977345943450928, 4.010145664215088, 4.322556972503662, 4.634968280792236, 4.947379112243652, 5.259790420532227, 5.572201728820801, 5.884613037109375, 6.197024345397949, 6.509435176849365, 6.8218464851379395, 7.134257793426514, 7.44666862487793, 7.759079933166504, 8.071491241455078, 8.383902549743652, 8.696313858032227, 9.0087251663208, 9.321136474609375, 9.633546829223633, 9.945958137512207, 10.258369445800781, 10.570780754089355, 10.88319206237793, 11.195603370666504, 11.508014678955078, 11.820425033569336, 12.13283634185791, 12.445247650146484, 12.757658958435059, 13.070070266723633]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 29.0, 45.0, 69.0, 87.0, 97.0, 95.0, 116.0, 104.0, 90.0, 66.0, 62.0, 30.0, 29.0, 11.0, 15.0, 3.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.533045768737793, -1.4771573543548584, -1.4212690591812134, -1.3653806447982788, -1.3094923496246338, -1.2536039352416992, -1.1977155208587646, -1.14182710647583, -1.085938811302185, -1.0300503969192505, -0.9741621017456055, -0.9182736873626709, -0.8623853325843811, -0.8064969778060913, -0.7506085634231567, -0.6947202086448669, -0.6388318538665771, -0.5829434990882874, -0.5270551443099976, -0.471166729927063, -0.4152783751487732, -0.3593900203704834, -0.3035016357898712, -0.24761325120925903, -0.19172489643096924, -0.13583652675151825, -0.07994815707206726, -0.024059787392616272, 0.03182858228683472, 0.08771693706512451, 0.1436053216457367, 0.19949370622634888, 0.25538206100463867, 0.31127041578292847, 0.36715880036354065, 0.42304718494415283, 0.4789355397224426, 0.5348238945007324, 0.590712308883667, 0.6466006636619568, 0.7024890184402466, 0.7583773732185364, 0.8142657279968262, 0.8701541423797607, 0.9260424971580505, 0.9819308519363403, 1.037819266319275, 1.09370756149292, 1.1495959758758545, 1.205484390258789, 1.261372685432434, 1.3172610998153687, 1.3731493949890137, 1.4290378093719482, 1.4849262237548828, 1.5408146381378174, 1.5967029333114624, 1.652591347694397, 1.708479642868042, 1.7643680572509766, 1.8202564716339111, 1.8761447668075562, 1.9320331811904907, 1.9879214763641357, 2.0438098907470703]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 4.0, 5.0, 5.0, 11.0, 10.0, 25.0, 25.0, 52.0, 69.0, 150.0, 299.0, 907.0, 3223.0, 17463.0, 344660.0, 650381.0, 25542.0, 3887.0, 1085.0, 367.0, 158.0, 82.0, 36.0, 33.0, 16.0, 11.0, 14.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.35546875, -3.25701904296875, -3.1585693359375, -3.06011962890625, -2.961669921875, -2.86322021484375, -2.7647705078125, -2.66632080078125, -2.56787109375, -2.46942138671875, -2.3709716796875, -2.27252197265625, -2.174072265625, -2.07562255859375, -1.9771728515625, -1.87872314453125, -1.7802734375, -1.68182373046875, -1.5833740234375, -1.48492431640625, -1.386474609375, -1.28802490234375, -1.1895751953125, -1.09112548828125, -0.99267578125, -0.89422607421875, -0.7957763671875, -0.69732666015625, -0.598876953125, -0.50042724609375, -0.4019775390625, -0.30352783203125, -0.205078125, -0.10662841796875, -0.0081787109375, 0.09027099609375, 0.188720703125, 0.28717041015625, 0.3856201171875, 0.48406982421875, 0.58251953125, 0.68096923828125, 0.7794189453125, 0.87786865234375, 0.976318359375, 1.07476806640625, 1.1732177734375, 1.27166748046875, 1.3701171875, 1.46856689453125, 1.5670166015625, 1.66546630859375, 1.763916015625, 1.86236572265625, 1.9608154296875, 2.05926513671875, 2.15771484375, 2.25616455078125, 2.3546142578125, 2.45306396484375, 2.551513671875, 2.64996337890625, 2.7484130859375, 2.84686279296875, 2.9453125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 6.0, 14.0, 35.0, 67.0, 103.0, 153.0, 171.0, 157.0, 135.0, 68.0, 36.0, 27.0, 12.0, 5.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06515979766845703, -0.06043434143066406, -0.055708885192871094, -0.050983428955078125, -0.046257972717285156, -0.04153251647949219, -0.03680706024169922, -0.03208160400390625, -0.02735614776611328, -0.022630691528320312, -0.017905235290527344, -0.013179779052734375, -0.008454322814941406, -0.0037288665771484375, 0.0009965896606445312, 0.0057220458984375, 0.010447502136230469, 0.015172958374023438, 0.019898414611816406, 0.024623870849609375, 0.029349327087402344, 0.03407478332519531, 0.03880023956298828, 0.04352569580078125, 0.04825115203857422, 0.05297660827636719, 0.057702064514160156, 0.062427520751953125, 0.0671529769897461, 0.07187843322753906, 0.07660388946533203, 0.081329345703125, 0.08605480194091797, 0.09078025817871094, 0.0955057144165039, 0.10023117065429688, 0.10495662689208984, 0.10968208312988281, 0.11440753936767578, 0.11913299560546875, 0.12385845184326172, 0.1285839080810547, 0.13330936431884766, 0.13803482055664062, 0.1427602767944336, 0.14748573303222656, 0.15221118927001953, 0.1569366455078125, 0.16166210174560547, 0.16638755798339844, 0.1711130142211914, 0.17583847045898438, 0.18056392669677734, 0.1852893829345703, 0.19001483917236328, 0.19474029541015625, 0.19946575164794922, 0.2041912078857422, 0.20891666412353516, 0.21364212036132812, 0.2183675765991211, 0.22309303283691406, 0.22781848907470703, 0.2325439453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 2.0, 4.0, 7.0, 2.0, 4.0, 8.0, 12.0, 8.0, 11.0, 17.0, 24.0, 18.0, 25.0, 39.0, 109.0, 505.0, 5170.0, 628767.0, 408917.0, 4182.0, 456.0, 66.0, 38.0, 29.0, 20.0, 15.0, 9.0, 13.0, 12.0, 11.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-4.66015625, -4.53057861328125, -4.4010009765625, -4.27142333984375, -4.141845703125, -4.01226806640625, -3.8826904296875, -3.75311279296875, -3.62353515625, -3.49395751953125, -3.3643798828125, -3.23480224609375, -3.105224609375, -2.97564697265625, -2.8460693359375, -2.71649169921875, -2.5869140625, -2.45733642578125, -2.3277587890625, -2.19818115234375, -2.068603515625, -1.93902587890625, -1.8094482421875, -1.67987060546875, -1.55029296875, -1.42071533203125, -1.2911376953125, -1.16156005859375, -1.031982421875, -0.90240478515625, -0.7728271484375, -0.64324951171875, -0.513671875, -0.38409423828125, -0.2545166015625, -0.12493896484375, 0.004638671875, 0.13421630859375, 0.2637939453125, 0.39337158203125, 0.52294921875, 0.65252685546875, 0.7821044921875, 0.91168212890625, 1.041259765625, 1.17083740234375, 1.3004150390625, 1.42999267578125, 1.5595703125, 1.68914794921875, 1.8187255859375, 1.94830322265625, 2.077880859375, 2.20745849609375, 2.3370361328125, 2.46661376953125, 2.59619140625, 2.72576904296875, 2.8553466796875, 2.98492431640625, 3.114501953125, 3.24407958984375, 3.3736572265625, 3.50323486328125, 3.6328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 12.0, 17.0, 7.0, 14.0, 22.0, 22.0, 28.0, 38.0, 36.0, 39.0, 51.0, 66.0, 43.0, 54.0, 51.0, 52.0, 50.0, 60.0, 44.0, 45.0, 38.0, 31.0, 35.0, 26.0, 11.0, 22.0, 19.0, 9.0, 12.0, 5.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.3027229309082031, -0.29172515869140625, -0.2807273864746094, -0.2697296142578125, -0.2587318420410156, -0.24773406982421875, -0.23673629760742188, -0.225738525390625, -0.21474075317382812, -0.20374298095703125, -0.19274520874023438, -0.1817474365234375, -0.17074966430664062, -0.15975189208984375, -0.14875411987304688, -0.13775634765625, -0.12675857543945312, -0.11576080322265625, -0.10476303100585938, -0.0937652587890625, -0.08276748657226562, -0.07176971435546875, -0.060771942138671875, -0.049774169921875, -0.038776397705078125, -0.02777862548828125, -0.016780853271484375, -0.0057830810546875, 0.005214691162109375, 0.01621246337890625, 0.027210235595703125, 0.0382080078125, 0.049205780029296875, 0.06020355224609375, 0.07120132446289062, 0.0821990966796875, 0.09319686889648438, 0.10419464111328125, 0.11519241333007812, 0.126190185546875, 0.13718795776367188, 0.14818572998046875, 0.15918350219726562, 0.1701812744140625, 0.18117904663085938, 0.19217681884765625, 0.20317459106445312, 0.21417236328125, 0.22517013549804688, 0.23616790771484375, 0.24716567993164062, 0.2581634521484375, 0.2691612243652344, 0.28015899658203125, 0.2911567687988281, 0.302154541015625, 0.3131523132324219, 0.32415008544921875, 0.3351478576660156, 0.3461456298828125, 0.3571434020996094, 0.36814117431640625, 0.3791389465332031, 0.39013671875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 7.0, 7.0, 11.0, 11.0, 18.0, 31.0, 79.0, 346.0, 3258.0, 1012672.0, 30883.0, 907.0, 139.0, 40.0, 26.0, 12.0, 18.0, 11.0, 7.0, 6.0, 11.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.09375, -12.6044921875, -12.115234375, -11.6259765625, -11.13671875, -10.6474609375, -10.158203125, -9.6689453125, -9.1796875, -8.6904296875, -8.201171875, -7.7119140625, -7.22265625, -6.7333984375, -6.244140625, -5.7548828125, -5.265625, -4.7763671875, -4.287109375, -3.7978515625, -3.30859375, -2.8193359375, -2.330078125, -1.8408203125, -1.3515625, -0.8623046875, -0.373046875, 0.1162109375, 0.60546875, 1.0947265625, 1.583984375, 2.0732421875, 2.5625, 3.0517578125, 3.541015625, 4.0302734375, 4.51953125, 5.0087890625, 5.498046875, 5.9873046875, 6.4765625, 6.9658203125, 7.455078125, 7.9443359375, 8.43359375, 8.9228515625, 9.412109375, 9.9013671875, 10.390625, 10.8798828125, 11.369140625, 11.8583984375, 12.34765625, 12.8369140625, 13.326171875, 13.8154296875, 14.3046875, 14.7939453125, 15.283203125, 15.7724609375, 16.26171875, 16.7509765625, 17.240234375, 17.7294921875, 18.21875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 3.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 9.0, 13.0, 46.0, 275.0, 439.0, 82.0, 22.0, 9.0, 4.0, 3.0, 11.0, 7.0, 9.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022125244140625, -0.0021167993545532227, -0.0020210742950439453, -0.001925349235534668, -0.0018296241760253906, -0.0017338991165161133, -0.001638174057006836, -0.0015424489974975586, -0.0014467239379882812, -0.001350998878479004, -0.0012552738189697266, -0.0011595487594604492, -0.0010638236999511719, -0.0009680986404418945, -0.0008723735809326172, -0.0007766485214233398, -0.0006809234619140625, -0.0005851984024047852, -0.0004894733428955078, -0.00039374828338623047, -0.0002980232238769531, -0.00020229816436767578, -0.00010657310485839844, -1.0848045349121094e-05, 8.487701416015625e-05, 0.0001806020736694336, 0.00027632713317871094, 0.0003720521926879883, 0.0004677772521972656, 0.000563502311706543, 0.0006592273712158203, 0.0007549524307250977, 0.000850677490234375, 0.0009464025497436523, 0.0010421276092529297, 0.001137852668762207, 0.0012335777282714844, 0.0013293027877807617, 0.001425027847290039, 0.0015207529067993164, 0.0016164779663085938, 0.001712203025817871, 0.0018079280853271484, 0.0019036531448364258, 0.001999378204345703, 0.0020951032638549805, 0.002190828323364258, 0.002286553382873535, 0.0023822784423828125, 0.00247800350189209, 0.002573728561401367, 0.0026694536209106445, 0.002765178680419922, 0.0028609037399291992, 0.0029566287994384766, 0.003052353858947754, 0.0031480789184570312, 0.0032438039779663086, 0.003339529037475586, 0.0034352540969848633, 0.0035309791564941406, 0.003626704216003418, 0.0037224292755126953, 0.0038181543350219727, 0.00391387939453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 2.0, 9.0, 9.0, 5.0, 13.0, 22.0, 21.0, 54.0, 52.0, 75.0, 126.0, 201.0, 266.0, 410.0, 733.0, 1268.0, 2222.0, 4205.0, 8595.0, 21763.0, 95944.0, 795824.0, 78667.0, 20337.0, 8253.0, 3928.0, 2159.0, 1159.0, 722.0, 480.0, 301.0, 219.0, 154.0, 105.0, 63.0, 48.0, 37.0, 25.0, 26.0, 14.0, 6.0, 11.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.499481201171875, -3.37200927734375, -3.244537353515625, -3.1170654296875, -2.989593505859375, -2.86212158203125, -2.734649658203125, -2.607177734375, -2.479705810546875, -2.35223388671875, -2.224761962890625, -2.0972900390625, -1.969818115234375, -1.84234619140625, -1.714874267578125, -1.58740234375, -1.459930419921875, -1.33245849609375, -1.204986572265625, -1.0775146484375, -0.950042724609375, -0.82257080078125, -0.695098876953125, -0.567626953125, -0.440155029296875, -0.31268310546875, -0.185211181640625, -0.0577392578125, 0.069732666015625, 0.19720458984375, 0.324676513671875, 0.4521484375, 0.579620361328125, 0.70709228515625, 0.834564208984375, 0.9620361328125, 1.089508056640625, 1.21697998046875, 1.344451904296875, 1.471923828125, 1.599395751953125, 1.72686767578125, 1.854339599609375, 1.9818115234375, 2.109283447265625, 2.23675537109375, 2.364227294921875, 2.49169921875, 2.619171142578125, 2.74664306640625, 2.874114990234375, 3.0015869140625, 3.129058837890625, 3.25653076171875, 3.384002685546875, 3.511474609375, 3.638946533203125, 3.76641845703125, 3.893890380859375, 4.0213623046875, 4.148834228515625, 4.27630615234375, 4.403778076171875, 4.53125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 4.0, 10.0, 16.0, 28.0, 30.0, 103.0, 190.0, 263.0, 158.0, 44.0, 32.0, 20.0, 18.0, 13.0, 9.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.640625, -1.57037353515625, -1.5001220703125, -1.42987060546875, -1.359619140625, -1.28936767578125, -1.2191162109375, -1.14886474609375, -1.07861328125, -1.00836181640625, -0.9381103515625, -0.86785888671875, -0.797607421875, -0.72735595703125, -0.6571044921875, -0.58685302734375, -0.5166015625, -0.44635009765625, -0.3760986328125, -0.30584716796875, -0.235595703125, -0.16534423828125, -0.0950927734375, -0.02484130859375, 0.04541015625, 0.11566162109375, 0.1859130859375, 0.25616455078125, 0.326416015625, 0.39666748046875, 0.4669189453125, 0.53717041015625, 0.607421875, 0.67767333984375, 0.7479248046875, 0.81817626953125, 0.888427734375, 0.95867919921875, 1.0289306640625, 1.09918212890625, 1.16943359375, 1.23968505859375, 1.3099365234375, 1.38018798828125, 1.450439453125, 1.52069091796875, 1.5909423828125, 1.66119384765625, 1.7314453125, 1.80169677734375, 1.8719482421875, 1.94219970703125, 2.012451171875, 2.08270263671875, 2.1529541015625, 2.22320556640625, 2.29345703125, 2.36370849609375, 2.4339599609375, 2.50421142578125, 2.574462890625, 2.64471435546875, 2.7149658203125, 2.78521728515625, 2.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 18.0, 30.0, 61.0, 109.0, 160.0, 235.0, 160.0, 104.0, 54.0, 22.0, 12.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40109634399414, -13.04529094696045, -12.689485549926758, -12.333680152893066, -11.977874755859375, -11.6220703125, -11.266263961791992, -10.910459518432617, -10.554654121398926, -10.198848724365234, -9.843043327331543, -9.487237930297852, -9.13143253326416, -8.775627136230469, -8.419822692871094, -8.064017295837402, -7.708211421966553, -7.352406024932861, -6.99660062789917, -6.640795707702637, -6.284990310668945, -5.929184913635254, -5.5733795166015625, -5.217574119567871, -4.86176872253418, -4.505963325500488, -4.150157928466797, -3.7943527698516846, -3.4385476112365723, -3.082742214202881, -2.7269368171691895, -2.371131658554077, -2.015326499938965, -1.659521222114563, -1.3037159442901611, -0.9479105472564697, -0.5921052694320679, -0.23629999160766602, 0.11950540542602539, 0.4753105640411377, 0.8311159610748291, 1.186921238899231, 1.5427265167236328, 1.8985319137573242, 2.2543373107910156, 2.610142469406128, 2.9659478664398193, 3.3217530250549316, 3.677558422088623, 4.0333638191223145, 4.389169216156006, 4.744974136352539, 5.1007795333862305, 5.456584930419922, 5.812390327453613, 6.168195724487305, 6.524001121520996, 6.8798065185546875, 7.235611915588379, 7.59141731262207, 7.9472222328186035, 8.303028106689453, 8.658832550048828, 9.01463794708252, 9.370443344116211]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 9.0, 13.0, 12.0, 16.0, 17.0, 19.0, 23.0, 30.0, 39.0, 26.0, 46.0, 46.0, 44.0, 47.0, 40.0, 50.0, 48.0, 44.0, 45.0, 48.0, 39.0, 35.0, 34.0, 27.0, 29.0, 34.0, 19.0, 16.0, 17.0, 8.0, 21.0, 11.0, 4.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.948370933532715, -2.8556225299835205, -2.7628743648529053, -2.670125961303711, -2.5773775577545166, -2.4846293926239014, -2.391880989074707, -2.299132823944092, -2.2063844203948975, -2.113636016845703, -2.020887851715088, -1.9281394481658936, -1.8353911638259888, -1.742642879486084, -1.6498944759368896, -1.5571461915969849, -1.4643977880477905, -1.3716495037078857, -1.2789011001586914, -1.1861528158187866, -1.0934045314788818, -1.0006561279296875, -0.9079078435897827, -0.8151595592498779, -0.7224112153053284, -0.6296628713607788, -0.536914587020874, -0.44416624307632446, -0.3514179289340973, -0.2586696147918701, -0.16592127084732056, -0.07317298650741577, 0.01957535743713379, 0.11232367902994156, 0.20507200062274933, 0.2978203296661377, 0.39056864380836487, 0.48331695795059204, 0.5760653018951416, 0.6688135862350464, 0.761561930179596, 0.8543102741241455, 0.9470585584640503, 1.039806842803955, 1.1325552463531494, 1.2253035306930542, 1.318051815032959, 1.4108002185821533, 1.503548502922058, 1.596296787261963, 1.6890451908111572, 1.781793475151062, 1.8745417594909668, 1.9672901630401611, 2.0600385665893555, 2.1527867317199707, 2.245535135269165, 2.3382835388183594, 2.4310317039489746, 2.523780107498169, 2.6165285110473633, 2.7092766761779785, 2.802025079727173, 2.894773483276367, 2.9875216484069824]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 7.0, 7.0, 8.0, 17.0, 33.0, 35.0, 37.0, 69.0, 129.0, 295.0, 982.0, 5318.0, 68001.0, 4050005.0, 62216.0, 5372.0, 1001.0, 294.0, 149.0, 71.0, 59.0, 37.0, 33.0, 29.0, 15.0, 16.0, 13.0, 8.0, 8.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.19451904296875, -4.9984130859375, -4.80230712890625, -4.606201171875, -4.41009521484375, -4.2139892578125, -4.01788330078125, -3.82177734375, -3.62567138671875, -3.4295654296875, -3.23345947265625, -3.037353515625, -2.84124755859375, -2.6451416015625, -2.44903564453125, -2.2529296875, -2.05682373046875, -1.8607177734375, -1.66461181640625, -1.468505859375, -1.27239990234375, -1.0762939453125, -0.88018798828125, -0.68408203125, -0.48797607421875, -0.2918701171875, -0.09576416015625, 0.100341796875, 0.29644775390625, 0.4925537109375, 0.68865966796875, 0.884765625, 1.08087158203125, 1.2769775390625, 1.47308349609375, 1.669189453125, 1.86529541015625, 2.0614013671875, 2.25750732421875, 2.45361328125, 2.64971923828125, 2.8458251953125, 3.04193115234375, 3.238037109375, 3.43414306640625, 3.6302490234375, 3.82635498046875, 4.0224609375, 4.21856689453125, 4.4146728515625, 4.61077880859375, 4.806884765625, 5.00299072265625, 5.1990966796875, 5.39520263671875, 5.59130859375, 5.78741455078125, 5.9835205078125, 6.17962646484375, 6.375732421875, 6.57183837890625, 6.7679443359375, 6.96405029296875, 7.16015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 20.0, 15.0, 19.0, 36.0, 42.0, 58.0, 57.0, 53.0, 55.0, 55.0, 70.0, 57.0, 58.0, 55.0, 42.0, 53.0, 41.0, 36.0, 32.0, 23.0, 27.0, 21.0, 8.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.06856441497802734, -0.06626701354980469, -0.06396961212158203, -0.061672210693359375, -0.05937480926513672, -0.05707740783691406, -0.054780006408691406, -0.05248260498046875, -0.050185203552246094, -0.04788780212402344, -0.04559040069580078, -0.043292999267578125, -0.04099559783935547, -0.03869819641113281, -0.036400794982910156, -0.0341033935546875, -0.031805992126464844, -0.029508590698242188, -0.02721118927001953, -0.024913787841796875, -0.02261638641357422, -0.020318984985351562, -0.018021583557128906, -0.01572418212890625, -0.013426780700683594, -0.011129379272460938, -0.008831977844238281, -0.006534576416015625, -0.004237174987792969, -0.0019397735595703125, 0.00035762786865234375, 0.002655029296875, 0.004952430725097656, 0.0072498321533203125, 0.009547233581542969, 0.011844635009765625, 0.014142036437988281, 0.016439437866210938, 0.018736839294433594, 0.02103424072265625, 0.023331642150878906, 0.025629043579101562, 0.02792644500732422, 0.030223846435546875, 0.03252124786376953, 0.03481864929199219, 0.037116050720214844, 0.0394134521484375, 0.041710853576660156, 0.04400825500488281, 0.04630565643310547, 0.048603057861328125, 0.05090045928955078, 0.05319786071777344, 0.055495262145996094, 0.05779266357421875, 0.060090065002441406, 0.06238746643066406, 0.06468486785888672, 0.06698226928710938, 0.06927967071533203, 0.07157707214355469, 0.07387447357177734, 0.076171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 12.0, 25.0, 27.0, 46.0, 100.0, 256.0, 1112.0, 41931.0, 4140417.0, 9423.0, 553.0, 161.0, 81.0, 44.0, 29.0, 10.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.433349609375, -8.99169921875, -8.550048828125, -8.1083984375, -7.666748046875, -7.22509765625, -6.783447265625, -6.341796875, -5.900146484375, -5.45849609375, -5.016845703125, -4.5751953125, -4.133544921875, -3.69189453125, -3.250244140625, -2.80859375, -2.366943359375, -1.92529296875, -1.483642578125, -1.0419921875, -0.600341796875, -0.15869140625, 0.282958984375, 0.724609375, 1.166259765625, 1.60791015625, 2.049560546875, 2.4912109375, 2.932861328125, 3.37451171875, 3.816162109375, 4.2578125, 4.699462890625, 5.14111328125, 5.582763671875, 6.0244140625, 6.466064453125, 6.90771484375, 7.349365234375, 7.791015625, 8.232666015625, 8.67431640625, 9.115966796875, 9.5576171875, 9.999267578125, 10.44091796875, 10.882568359375, 11.32421875, 11.765869140625, 12.20751953125, 12.649169921875, 13.0908203125, 13.532470703125, 13.97412109375, 14.415771484375, 14.857421875, 15.299072265625, 15.74072265625, 16.182373046875, 16.6240234375, 17.065673828125, 17.50732421875, 17.948974609375, 18.390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 9.0, 8.0, 19.0, 33.0, 35.0, 59.0, 71.0, 118.0, 195.0, 400.0, 1504.0, 775.0, 299.0, 201.0, 115.0, 59.0, 46.0, 41.0, 15.0, 21.0, 13.0, 8.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35433197021484375, -0.3441619873046875, -0.33399200439453125, -0.323822021484375, -0.31365203857421875, -0.3034820556640625, -0.29331207275390625, -0.28314208984375, -0.27297210693359375, -0.2628021240234375, -0.25263214111328125, -0.242462158203125, -0.23229217529296875, -0.2221221923828125, -0.21195220947265625, -0.2017822265625, -0.19161224365234375, -0.1814422607421875, -0.17127227783203125, -0.161102294921875, -0.15093231201171875, -0.1407623291015625, -0.13059234619140625, -0.12042236328125, -0.11025238037109375, -0.1000823974609375, -0.08991241455078125, -0.079742431640625, -0.06957244873046875, -0.0594024658203125, -0.04923248291015625, -0.0390625, -0.02889251708984375, -0.0187225341796875, -0.00855255126953125, 0.001617431640625, 0.01178741455078125, 0.0219573974609375, 0.03212738037109375, 0.04229736328125, 0.05246734619140625, 0.0626373291015625, 0.07280731201171875, 0.082977294921875, 0.09314727783203125, 0.1033172607421875, 0.11348724365234375, 0.1236572265625, 0.13382720947265625, 0.1439971923828125, 0.15416717529296875, 0.164337158203125, 0.17450714111328125, 0.1846771240234375, 0.19484710693359375, 0.20501708984375, 0.21518707275390625, 0.2253570556640625, 0.23552703857421875, 0.245697021484375, 0.25586700439453125, 0.2660369873046875, 0.27620697021484375, 0.286376953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 27.0, 189.0, 477.0, 269.0, 36.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.40032196044922, -20.019495010375977, -19.638669967651367, -19.257843017578125, -18.877017974853516, -18.496191024780273, -18.115365982055664, -17.734539031982422, -17.353713989257812, -16.97288703918457, -16.59206199645996, -16.21123504638672, -15.83041000366211, -15.449584007263184, -15.068758010864258, -14.687931060791016, -14.30710506439209, -13.926279067993164, -13.545453071594238, -13.164627075195312, -12.783801078796387, -12.402975082397461, -12.022148132324219, -11.64132308959961, -11.260496139526367, -10.879670143127441, -10.498844146728516, -10.11801815032959, -9.737192153930664, -9.356366157531738, -8.975540161132812, -8.59471321105957, -8.213887214660645, -7.833061218261719, -7.452235221862793, -7.071409225463867, -6.690583229064941, -6.309757232666016, -5.928930759429932, -5.548104763031006, -5.167279243469238, -4.7864532470703125, -4.405627250671387, -4.024801254272461, -3.643975019454956, -3.2631490230560303, -2.8823227882385254, -2.5014967918395996, -2.1206705570220947, -1.739844560623169, -1.3590184450149536, -0.9781923294067383, -0.5973663330078125, -0.21654033660888672, 0.16428589820861816, 0.545111894607544, 0.9259378910064697, 1.3067638874053955, 1.6875900030136108, 2.068416118621826, 2.449242115020752, 2.8300681114196777, 3.2108943462371826, 3.5917203426361084, 3.972546339035034]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 7.0, 14.0, 4.0, 9.0, 9.0, 14.0, 14.0, 22.0, 18.0, 28.0, 38.0, 27.0, 30.0, 31.0, 31.0, 32.0, 55.0, 51.0, 42.0, 57.0, 48.0, 44.0, 48.0, 43.0, 33.0, 28.0, 23.0, 30.0, 31.0, 23.0, 24.0, 11.0, 16.0, 11.0, 6.0, 11.0, 4.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.947307825088501, -0.9157190918922424, -0.8841303586959839, -0.8525416254997253, -0.8209528923034668, -0.7893641591072083, -0.7577754259109497, -0.7261867523193359, -0.6945979595184326, -0.6630092263221741, -0.6314204931259155, -0.599831759929657, -0.5682430267333984, -0.5366542935371399, -0.5050655603408813, -0.4734768569469452, -0.44188815355300903, -0.4102994203567505, -0.37871068716049194, -0.3471219539642334, -0.31553322076797485, -0.2839444875717163, -0.25235578417778015, -0.2207670509815216, -0.18917831778526306, -0.15758958458900452, -0.12600085139274597, -0.09441213309764862, -0.06282339990139008, -0.03123466670513153, 0.0003540515899658203, 0.031942784786224365, 0.06353151798248291, 0.09512025117874146, 0.126708984375, 0.15829770267009735, 0.1898864358663559, 0.22147516906261444, 0.2530638873577118, 0.28465262055397034, 0.3162413537502289, 0.3478300869464874, 0.37941882014274597, 0.41100752353668213, 0.4425962567329407, 0.4741849899291992, 0.5057737231254578, 0.5373624563217163, 0.5689511895179749, 0.6005399227142334, 0.6321286559104919, 0.6637173891067505, 0.695306122303009, 0.7268948554992676, 0.7584835290908813, 0.7900723218917847, 0.8216609954833984, 0.853249728679657, 0.8848384618759155, 0.9164271950721741, 0.9480159282684326, 0.9796046614646912, 1.0111933946609497, 1.0427820682525635, 1.0743708610534668]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 10.0, 15.0, 12.0, 20.0, 21.0, 27.0, 38.0, 38.0, 59.0, 108.0, 1651.0, 195599.0, 839217.0, 11018.0, 349.0, 81.0, 62.0, 50.0, 39.0, 25.0, 20.0, 24.0, 15.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.48046875, -5.304931640625, -5.12939453125, -4.953857421875, -4.7783203125, -4.602783203125, -4.42724609375, -4.251708984375, -4.076171875, -3.900634765625, -3.72509765625, -3.549560546875, -3.3740234375, -3.198486328125, -3.02294921875, -2.847412109375, -2.671875, -2.496337890625, -2.32080078125, -2.145263671875, -1.9697265625, -1.794189453125, -1.61865234375, -1.443115234375, -1.267578125, -1.092041015625, -0.91650390625, -0.740966796875, -0.5654296875, -0.389892578125, -0.21435546875, -0.038818359375, 0.13671875, 0.312255859375, 0.48779296875, 0.663330078125, 0.8388671875, 1.014404296875, 1.18994140625, 1.365478515625, 1.541015625, 1.716552734375, 1.89208984375, 2.067626953125, 2.2431640625, 2.418701171875, 2.59423828125, 2.769775390625, 2.9453125, 3.120849609375, 3.29638671875, 3.471923828125, 3.6474609375, 3.822998046875, 3.99853515625, 4.174072265625, 4.349609375, 4.525146484375, 4.70068359375, 4.876220703125, 5.0517578125, 5.227294921875, 5.40283203125, 5.578369140625, 5.75390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 21.0, 16.0, 18.0, 24.0, 26.0, 27.0, 46.0, 24.0, 37.0, 49.0, 53.0, 52.0, 46.0, 43.0, 62.0, 41.0, 44.0, 55.0, 44.0, 37.0, 43.0, 27.0, 28.0, 21.0, 21.0, 14.0, 16.0, 1.0, 14.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0753173828125, -0.07300186157226562, -0.07068634033203125, -0.06837081909179688, -0.0660552978515625, -0.06373977661132812, -0.06142425537109375, -0.059108734130859375, -0.056793212890625, -0.054477691650390625, -0.05216217041015625, -0.049846649169921875, -0.0475311279296875, -0.045215606689453125, -0.04290008544921875, -0.040584564208984375, -0.03826904296875, -0.035953521728515625, -0.03363800048828125, -0.031322479248046875, -0.0290069580078125, -0.026691436767578125, -0.02437591552734375, -0.022060394287109375, -0.019744873046875, -0.017429351806640625, -0.01511383056640625, -0.012798309326171875, -0.0104827880859375, -0.008167266845703125, -0.00585174560546875, -0.003536224365234375, -0.001220703125, 0.001094818115234375, 0.00341033935546875, 0.005725860595703125, 0.0080413818359375, 0.010356903076171875, 0.01267242431640625, 0.014987945556640625, 0.017303466796875, 0.019618988037109375, 0.02193450927734375, 0.024250030517578125, 0.0265655517578125, 0.028881072998046875, 0.03119659423828125, 0.033512115478515625, 0.03582763671875, 0.038143157958984375, 0.04045867919921875, 0.042774200439453125, 0.0450897216796875, 0.047405242919921875, 0.04972076416015625, 0.052036285400390625, 0.054351806640625, 0.056667327880859375, 0.05898284912109375, 0.061298370361328125, 0.0636138916015625, 0.06592941284179688, 0.06824493408203125, 0.07056045532226562, 0.0728759765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 13.0, 15.0, 15.0, 21.0, 42.0, 59.0, 84.0, 96.0, 159.0, 231.0, 289.0, 499.0, 764.0, 1314.0, 2464.0, 5284.0, 13613.0, 40183.0, 121345.0, 295639.0, 331863.0, 152119.0, 51497.0, 17388.0, 6508.0, 3009.0, 1473.0, 862.0, 572.0, 342.0, 208.0, 154.0, 103.0, 80.0, 60.0, 36.0, 37.0, 22.0, 22.0, 17.0, 10.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.3984375, -1.354888916015625, -1.31134033203125, -1.267791748046875, -1.2242431640625, -1.180694580078125, -1.13714599609375, -1.093597412109375, -1.050048828125, -1.006500244140625, -0.96295166015625, -0.919403076171875, -0.8758544921875, -0.832305908203125, -0.78875732421875, -0.745208740234375, -0.70166015625, -0.658111572265625, -0.61456298828125, -0.571014404296875, -0.5274658203125, -0.483917236328125, -0.44036865234375, -0.396820068359375, -0.353271484375, -0.309722900390625, -0.26617431640625, -0.222625732421875, -0.1790771484375, -0.135528564453125, -0.09197998046875, -0.048431396484375, -0.0048828125, 0.038665771484375, 0.08221435546875, 0.125762939453125, 0.1693115234375, 0.212860107421875, 0.25640869140625, 0.299957275390625, 0.343505859375, 0.387054443359375, 0.43060302734375, 0.474151611328125, 0.5177001953125, 0.561248779296875, 0.60479736328125, 0.648345947265625, 0.69189453125, 0.735443115234375, 0.77899169921875, 0.822540283203125, 0.8660888671875, 0.909637451171875, 0.95318603515625, 0.996734619140625, 1.040283203125, 1.083831787109375, 1.12738037109375, 1.170928955078125, 1.2144775390625, 1.258026123046875, 1.30157470703125, 1.345123291015625, 1.388671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 9.0, 15.0, 11.0, 17.0, 18.0, 22.0, 33.0, 44.0, 41.0, 49.0, 62.0, 57.0, 55.0, 70.0, 72.0, 48.0, 50.0, 53.0, 37.0, 36.0, 36.0, 30.0, 23.0, 21.0, 21.0, 11.0, 13.0, 15.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.640625, -0.621734619140625, -0.60284423828125, -0.583953857421875, -0.5650634765625, -0.546173095703125, -0.52728271484375, -0.508392333984375, -0.489501953125, -0.470611572265625, -0.45172119140625, -0.432830810546875, -0.4139404296875, -0.395050048828125, -0.37615966796875, -0.357269287109375, -0.33837890625, -0.319488525390625, -0.30059814453125, -0.281707763671875, -0.2628173828125, -0.243927001953125, -0.22503662109375, -0.206146240234375, -0.187255859375, -0.168365478515625, -0.14947509765625, -0.130584716796875, -0.1116943359375, -0.092803955078125, -0.07391357421875, -0.055023193359375, -0.0361328125, -0.017242431640625, 0.00164794921875, 0.020538330078125, 0.0394287109375, 0.058319091796875, 0.07720947265625, 0.096099853515625, 0.114990234375, 0.133880615234375, 0.15277099609375, 0.171661376953125, 0.1905517578125, 0.209442138671875, 0.22833251953125, 0.247222900390625, 0.26611328125, 0.285003662109375, 0.30389404296875, 0.322784423828125, 0.3416748046875, 0.360565185546875, 0.37945556640625, 0.398345947265625, 0.417236328125, 0.436126708984375, 0.45501708984375, 0.473907470703125, 0.4927978515625, 0.511688232421875, 0.53057861328125, 0.549468994140625, 0.568359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 14.0, 24.0, 22.0, 45.0, 56.0, 78.0, 116.0, 184.0, 322.0, 597.0, 1214.0, 2652.0, 7086.0, 21608.0, 83277.0, 322944.0, 424135.0, 134427.0, 33028.0, 9830.0, 3593.0, 1574.0, 710.0, 347.0, 205.0, 150.0, 96.0, 59.0, 36.0, 26.0, 29.0, 16.0, 14.0, 10.0, 8.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.666259765625, -1.61279296875, -1.559326171875, -1.505859375, -1.452392578125, -1.39892578125, -1.345458984375, -1.2919921875, -1.238525390625, -1.18505859375, -1.131591796875, -1.078125, -1.024658203125, -0.97119140625, -0.917724609375, -0.8642578125, -0.810791015625, -0.75732421875, -0.703857421875, -0.650390625, -0.596923828125, -0.54345703125, -0.489990234375, -0.4365234375, -0.383056640625, -0.32958984375, -0.276123046875, -0.22265625, -0.169189453125, -0.11572265625, -0.062255859375, -0.0087890625, 0.044677734375, 0.09814453125, 0.151611328125, 0.205078125, 0.258544921875, 0.31201171875, 0.365478515625, 0.4189453125, 0.472412109375, 0.52587890625, 0.579345703125, 0.6328125, 0.686279296875, 0.73974609375, 0.793212890625, 0.8466796875, 0.900146484375, 0.95361328125, 1.007080078125, 1.060546875, 1.114013671875, 1.16748046875, 1.220947265625, 1.2744140625, 1.327880859375, 1.38134765625, 1.434814453125, 1.48828125, 1.541748046875, 1.59521484375, 1.648681640625, 1.7021484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 1.0, 6.0, 6.0, 9.0, 16.0, 15.0, 19.0, 20.0, 28.0, 28.0, 42.0, 47.0, 67.0, 79.0, 85.0, 91.0, 88.0, 72.0, 72.0, 37.0, 36.0, 22.0, 22.0, 16.0, 15.0, 7.0, 8.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00026607513427734375, -0.0002579018473625183, -0.00024972856044769287, -0.00024155527353286743, -0.000233381986618042, -0.00022520869970321655, -0.0002170354127883911, -0.00020886212587356567, -0.00020068883895874023, -0.0001925155520439148, -0.00018434226512908936, -0.00017616897821426392, -0.00016799569129943848, -0.00015982240438461304, -0.0001516491174697876, -0.00014347583055496216, -0.00013530254364013672, -0.00012712925672531128, -0.00011895596981048584, -0.0001107826828956604, -0.00010260939598083496, -9.443610906600952e-05, -8.626282215118408e-05, -7.808953523635864e-05, -6.99162483215332e-05, -6.174296140670776e-05, -5.3569674491882324e-05, -4.5396387577056885e-05, -3.7223100662231445e-05, -2.9049813747406006e-05, -2.0876526832580566e-05, -1.2703239917755127e-05, -4.5299530029296875e-06, 3.643333911895752e-06, 1.1816620826721191e-05, 1.998990774154663e-05, 2.816319465637207e-05, 3.633648157119751e-05, 4.450976848602295e-05, 5.268305540084839e-05, 6.085634231567383e-05, 6.902962923049927e-05, 7.720291614532471e-05, 8.537620306015015e-05, 9.354948997497559e-05, 0.00010172277688980103, 0.00010989606380462646, 0.0001180693507194519, 0.00012624263763427734, 0.00013441592454910278, 0.00014258921146392822, 0.00015076249837875366, 0.0001589357852935791, 0.00016710907220840454, 0.00017528235912322998, 0.00018345564603805542, 0.00019162893295288086, 0.0001998022198677063, 0.00020797550678253174, 0.00021614879369735718, 0.00022432208061218262, 0.00023249536752700806, 0.0002406686544418335, 0.00024884194135665894, 0.0002570152282714844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 12.0, 15.0, 35.0, 39.0, 69.0, 117.0, 223.0, 454.0, 954.0, 2575.0, 8851.0, 50048.0, 398278.0, 500715.0, 69774.0, 11145.0, 3046.0, 1148.0, 472.0, 263.0, 125.0, 73.0, 25.0, 28.0, 19.0, 9.0, 7.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.80078125, -2.725250244140625, -2.64971923828125, -2.574188232421875, -2.4986572265625, -2.423126220703125, -2.34759521484375, -2.272064208984375, -2.196533203125, -2.121002197265625, -2.04547119140625, -1.969940185546875, -1.8944091796875, -1.818878173828125, -1.74334716796875, -1.667816162109375, -1.59228515625, -1.516754150390625, -1.44122314453125, -1.365692138671875, -1.2901611328125, -1.214630126953125, -1.13909912109375, -1.063568115234375, -0.988037109375, -0.912506103515625, -0.83697509765625, -0.761444091796875, -0.6859130859375, -0.610382080078125, -0.53485107421875, -0.459320068359375, -0.3837890625, -0.308258056640625, -0.23272705078125, -0.157196044921875, -0.0816650390625, -0.006134033203125, 0.06939697265625, 0.144927978515625, 0.220458984375, 0.295989990234375, 0.37152099609375, 0.447052001953125, 0.5225830078125, 0.598114013671875, 0.67364501953125, 0.749176025390625, 0.82470703125, 0.900238037109375, 0.97576904296875, 1.051300048828125, 1.1268310546875, 1.202362060546875, 1.27789306640625, 1.353424072265625, 1.428955078125, 1.504486083984375, 1.58001708984375, 1.655548095703125, 1.7310791015625, 1.806610107421875, 1.88214111328125, 1.957672119140625, 2.033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 8.0, 18.0, 16.0, 14.0, 22.0, 31.0, 29.0, 40.0, 38.0, 50.0, 66.0, 65.0, 49.0, 45.0, 44.0, 62.0, 55.0, 51.0, 47.0, 46.0, 35.0, 27.0, 28.0, 20.0, 13.0, 10.0, 9.0, 7.0, 9.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59765625, -0.5804367065429688, -0.5632171630859375, -0.5459976196289062, -0.528778076171875, -0.5115585327148438, -0.4943389892578125, -0.47711944580078125, -0.45989990234375, -0.44268035888671875, -0.4254608154296875, -0.40824127197265625, -0.391021728515625, -0.37380218505859375, -0.3565826416015625, -0.33936309814453125, -0.3221435546875, -0.30492401123046875, -0.2877044677734375, -0.27048492431640625, -0.253265380859375, -0.23604583740234375, -0.2188262939453125, -0.20160675048828125, -0.18438720703125, -0.16716766357421875, -0.1499481201171875, -0.13272857666015625, -0.115509033203125, -0.09828948974609375, -0.0810699462890625, -0.06385040283203125, -0.046630859375, -0.02941131591796875, -0.0121917724609375, 0.00502777099609375, 0.022247314453125, 0.03946685791015625, 0.0566864013671875, 0.07390594482421875, 0.09112548828125, 0.10834503173828125, 0.1255645751953125, 0.14278411865234375, 0.160003662109375, 0.17722320556640625, 0.1944427490234375, 0.21166229248046875, 0.2288818359375, 0.24610137939453125, 0.2633209228515625, 0.28054046630859375, 0.297760009765625, 0.31497955322265625, 0.3321990966796875, 0.34941864013671875, 0.36663818359375, 0.38385772705078125, 0.4010772705078125, 0.41829681396484375, 0.435516357421875, 0.45273590087890625, 0.4699554443359375, 0.48717498779296875, 0.50439453125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 19.0, 86.0, 249.0, 376.0, 191.0, 56.0, 23.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.846235752105713, -4.9172163009643555, -3.9881973266601562, -3.059178113937378, -2.1301589012145996, -1.2011399269104004, -0.27212047576904297, 0.6568989753723145, 1.5859179496765137, 2.514937162399292, 3.4439563751220703, 4.3729753494262695, 5.301994800567627, 6.231013774871826, 7.160033226013184, 8.089052200317383, 9.018072128295898, 9.947091102600098, 10.876110076904297, 11.805130004882812, 12.734148979187012, 13.663167953491211, 14.592187881469727, 15.521206855773926, 16.450225830078125, 17.37924575805664, 18.308263778686523, 19.23728370666504, 20.166301727294922, 21.095321655273438, 22.024341583251953, 22.95336151123047, 23.88237762451172, 24.811397552490234, 25.740415573120117, 26.669435501098633, 27.598453521728516, 28.52747344970703, 29.456493377685547, 30.385513305664062, 31.314531326293945, 32.24354934692383, 33.172569274902344, 34.10158920288086, 35.030609130859375, 35.959625244140625, 36.88864517211914, 37.817665100097656, 38.74668502807617, 39.67570495605469, 40.6047248840332, 41.53374099731445, 42.46276092529297, 43.391780853271484, 44.32080078125, 45.249820709228516, 46.17884063720703, 47.10786056518555, 48.03688049316406, 48.96589660644531, 49.89491653442383, 50.823936462402344, 51.75295639038086, 52.681976318359375, 53.610992431640625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 4.0, 15.0, 20.0, 14.0, 28.0, 36.0, 39.0, 38.0, 44.0, 46.0, 53.0, 53.0, 58.0, 48.0, 55.0, 67.0, 46.0, 46.0, 45.0, 42.0, 31.0, 29.0, 33.0, 20.0, 19.0, 11.0, 9.0, 12.0, 7.0, 4.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.695977210998535, -4.55609130859375, -4.416205883026123, -4.276319980621338, -4.136434078216553, -3.9965484142303467, -3.8566627502441406, -3.7167768478393555, -3.5768909454345703, -3.4370052814483643, -3.297119379043579, -3.157233715057373, -3.017347812652588, -2.877462148666382, -2.737576484680176, -2.5976905822753906, -2.4578049182891846, -2.3179192543029785, -2.1780333518981934, -2.0381476879119873, -1.8982617855072021, -1.758376121520996, -1.6184903383255005, -1.4786045551300049, -1.3387187719345093, -1.1988329887390137, -1.058947205543518, -0.9190614819526672, -0.7791756987571716, -0.639289915561676, -0.4994041919708252, -0.3595184087753296, -0.21963262557983398, -0.07974685728549957, 0.06013891100883484, 0.20002466440200806, 0.33991044759750366, 0.47979623079299927, 0.6196819543838501, 0.7595677375793457, 0.8994535207748413, 1.039339303970337, 1.1792250871658325, 1.3191108703613281, 1.4589965343475342, 1.5988824367523193, 1.7387681007385254, 1.878653883934021, 2.0185396671295166, 2.1584253311157227, 2.298311233520508, 2.438196897506714, 2.578082799911499, 2.717968463897705, 2.8578543663024902, 2.9977400302886963, 3.1376256942749023, 3.2775113582611084, 3.4173972606658936, 3.5572829246520996, 3.6971688270568848, 3.837054491043091, 3.976940155029297, 4.116826057434082, 4.256711959838867]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 13.0, 13.0, 17.0, 35.0, 33.0, 65.0, 88.0, 146.0, 355.0, 1182.0, 8371.0, 210532.0, 3937903.0, 31464.0, 2849.0, 615.0, 222.0, 102.0, 76.0, 40.0, 24.0, 25.0, 15.0, 17.0, 10.0, 11.0, 8.0, 6.0, 3.0, 3.0, 10.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.2734375, -8.0386962890625, -7.803955078125, -7.5692138671875, -7.33447265625, -7.0997314453125, -6.864990234375, -6.6302490234375, -6.3955078125, -6.1607666015625, -5.926025390625, -5.6912841796875, -5.45654296875, -5.2218017578125, -4.987060546875, -4.7523193359375, -4.517578125, -4.2828369140625, -4.048095703125, -3.8133544921875, -3.57861328125, -3.3438720703125, -3.109130859375, -2.8743896484375, -2.6396484375, -2.4049072265625, -2.170166015625, -1.9354248046875, -1.70068359375, -1.4659423828125, -1.231201171875, -0.9964599609375, -0.76171875, -0.5269775390625, -0.292236328125, -0.0574951171875, 0.17724609375, 0.4119873046875, 0.646728515625, 0.8814697265625, 1.1162109375, 1.3509521484375, 1.585693359375, 1.8204345703125, 2.05517578125, 2.2899169921875, 2.524658203125, 2.7593994140625, 2.994140625, 3.2288818359375, 3.463623046875, 3.6983642578125, 3.93310546875, 4.1678466796875, 4.402587890625, 4.6373291015625, 4.8720703125, 5.1068115234375, 5.341552734375, 5.5762939453125, 5.81103515625, 6.0457763671875, 6.280517578125, 6.5152587890625, 6.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 9.0, 19.0, 22.0, 33.0, 33.0, 50.0, 54.0, 73.0, 63.0, 84.0, 88.0, 80.0, 80.0, 74.0, 53.0, 34.0, 31.0, 26.0, 24.0, 20.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1724853515625, -0.1677417755126953, -0.16299819946289062, -0.15825462341308594, -0.15351104736328125, -0.14876747131347656, -0.14402389526367188, -0.1392803192138672, -0.1345367431640625, -0.1297931671142578, -0.12504959106445312, -0.12030601501464844, -0.11556243896484375, -0.11081886291503906, -0.10607528686523438, -0.10133171081542969, -0.096588134765625, -0.09184455871582031, -0.08710098266601562, -0.08235740661621094, -0.07761383056640625, -0.07287025451660156, -0.06812667846679688, -0.06338310241699219, -0.0586395263671875, -0.05389595031738281, -0.049152374267578125, -0.04440879821777344, -0.03966522216796875, -0.03492164611816406, -0.030178070068359375, -0.025434494018554688, -0.02069091796875, -0.015947341918945312, -0.011203765869140625, -0.0064601898193359375, -0.00171661376953125, 0.0030269622802734375, 0.007770538330078125, 0.012514114379882812, 0.0172576904296875, 0.022001266479492188, 0.026744842529296875, 0.03148841857910156, 0.03623199462890625, 0.04097557067871094, 0.045719146728515625, 0.05046272277832031, 0.055206298828125, 0.05994987487792969, 0.06469345092773438, 0.06943702697753906, 0.07418060302734375, 0.07892417907714844, 0.08366775512695312, 0.08841133117675781, 0.0931549072265625, 0.09789848327636719, 0.10264205932617188, 0.10738563537597656, 0.11212921142578125, 0.11687278747558594, 0.12161636352539062, 0.1263599395751953, 0.131103515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 23.0, 28.0, 60.0, 116.0, 144.0, 256.0, 388.0, 1713.0, 4179879.0, 10853.0, 363.0, 202.0, 113.0, 80.0, 35.0, 17.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.90625, -30.06298828125, -29.2197265625, -28.37646484375, -27.533203125, -26.68994140625, -25.8466796875, -25.00341796875, -24.16015625, -23.31689453125, -22.4736328125, -21.63037109375, -20.787109375, -19.94384765625, -19.1005859375, -18.25732421875, -17.4140625, -16.57080078125, -15.7275390625, -14.88427734375, -14.041015625, -13.19775390625, -12.3544921875, -11.51123046875, -10.66796875, -9.82470703125, -8.9814453125, -8.13818359375, -7.294921875, -6.45166015625, -5.6083984375, -4.76513671875, -3.921875, -3.07861328125, -2.2353515625, -1.39208984375, -0.548828125, 0.29443359375, 1.1376953125, 1.98095703125, 2.82421875, 3.66748046875, 4.5107421875, 5.35400390625, 6.197265625, 7.04052734375, 7.8837890625, 8.72705078125, 9.5703125, 10.41357421875, 11.2568359375, 12.10009765625, 12.943359375, 13.78662109375, 14.6298828125, 15.47314453125, 16.31640625, 17.15966796875, 18.0029296875, 18.84619140625, 19.689453125, 20.53271484375, 21.3759765625, 22.21923828125, 23.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 21.0, 95.0, 790.0, 2891.0, 246.0, 32.0, 10.0], "bins": [-4.74609375, -4.667285919189453, -4.588478088378906, -4.509670257568359, -4.4308624267578125, -4.352054595947266, -4.273246765136719, -4.194438934326172, -4.115631103515625, -4.036823272705078, -3.9580154418945312, -3.8792076110839844, -3.8003997802734375, -3.7215919494628906, -3.6427841186523438, -3.563976287841797, -3.48516845703125, -3.406360626220703, -3.3275527954101562, -3.2487449645996094, -3.1699371337890625, -3.0911293029785156, -3.0123214721679688, -2.933513641357422, -2.854705810546875, -2.775897979736328, -2.6970901489257812, -2.6182823181152344, -2.5394744873046875, -2.4606666564941406, -2.3818588256835938, -2.303050994873047, -2.2242431640625, -2.145435333251953, -2.0666275024414062, -1.9878196716308594, -1.9090118408203125, -1.8302040100097656, -1.7513961791992188, -1.6725883483886719, -1.593780517578125, -1.5149726867675781, -1.4361648559570312, -1.3573570251464844, -1.2785491943359375, -1.1997413635253906, -1.1209335327148438, -1.0421257019042969, -0.96331787109375, -0.8845100402832031, -0.8057022094726562, -0.7268943786621094, -0.6480865478515625, -0.5692787170410156, -0.49047088623046875, -0.4116630554199219, -0.332855224609375, -0.2540473937988281, -0.17523956298828125, -0.09643173217773438, -0.0176239013671875, 0.061183929443359375, 0.13999176025390625, 0.21879959106445312, 0.297607421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 33.0, 143.0, 544.0, 230.0, 36.0, 12.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.44783020019531, -42.63691711425781, -41.82600402832031, -41.01509094238281, -40.20417785644531, -39.39326858520508, -38.58235549926758, -37.77144241333008, -36.96052932739258, -36.14961624145508, -35.33870315551758, -34.52779006958008, -33.716880798339844, -32.905967712402344, -32.095054626464844, -31.284141540527344, -30.473228454589844, -29.662315368652344, -28.851402282714844, -28.040491104125977, -27.229578018188477, -26.418664932250977, -25.60775375366211, -24.79684066772461, -23.98592758178711, -23.17501449584961, -22.36410140991211, -21.553190231323242, -20.742277145385742, -19.931364059448242, -19.120452880859375, -18.309539794921875, -17.498624801635742, -16.687711715698242, -15.876799583435059, -15.065887451171875, -14.254974365234375, -13.444061279296875, -12.633149147033691, -11.822237014770508, -11.011323928833008, -10.200410842895508, -9.389498710632324, -8.57858657836914, -7.767673492431641, -6.956760883331299, -6.145848274230957, -5.334935665130615, -4.524023056030273, -3.7131104469299316, -2.90219783782959, -2.091285228729248, -1.2803726196289062, -0.46946001052856445, 0.34145259857177734, 1.1523652076721191, 1.963277816772461, 2.7741904258728027, 3.5851030349731445, 4.396015644073486, 5.206928253173828, 6.01784086227417, 6.828753471374512, 7.6396660804748535, 8.450578689575195]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 18.0, 37.0, 44.0, 76.0, 109.0, 135.0, 160.0, 130.0, 87.0, 82.0, 63.0, 35.0, 10.0, 10.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.518835067749023, -12.085025787353516, -11.651217460632324, -11.217408180236816, -10.783599853515625, -10.349790573120117, -9.91598129272461, -9.482172012329102, -9.04836368560791, -8.614554405212402, -8.180746078491211, -7.746936798095703, -7.3131279945373535, -6.879319190979004, -6.445509910583496, -6.0117011070251465, -5.577892303466797, -5.144083499908447, -4.710274696350098, -4.27646541595459, -3.8426566123962402, -3.4088478088378906, -2.975038766860962, -2.541229724884033, -2.1074209213256836, -1.6736119985580444, -1.2398030757904053, -0.8059941530227661, -0.37218523025512695, 0.061623573303222656, 0.49543261528015137, 0.9292416572570801, 1.363051414489746, 1.7968603372573853, 2.2306692600250244, 2.664478302001953, 3.0982871055603027, 3.5320959091186523, 3.965904951095581, 4.39971399307251, 4.833522796630859, 5.267331600189209, 5.701140403747559, 6.134949684143066, 6.568758487701416, 7.002567291259766, 7.436376571655273, 7.870185375213623, 8.303994178771973, 8.73780345916748, 9.171611785888672, 9.60542106628418, 10.039230346679688, 10.473038673400879, 10.906847953796387, 11.340656280517578, 11.774465560913086, 12.208274841308594, 12.642083168029785, 13.075892448425293, 13.509700775146484, 13.943510055541992, 14.3773193359375, 14.811128616333008, 15.2449369430542]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 6.0, 9.0, 5.0, 2.0, 9.0, 15.0, 16.0, 17.0, 27.0, 40.0, 53.0, 62.0, 120.0, 233.0, 555.0, 1343.0, 5495.0, 52407.0, 611332.0, 347556.0, 23936.0, 3339.0, 1019.0, 448.0, 178.0, 103.0, 57.0, 46.0, 29.0, 17.0, 20.0, 9.0, 8.0, 7.0, 8.0, 8.0, 3.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.53424072265625, -4.3653564453125, -4.19647216796875, -4.027587890625, -3.85870361328125, -3.6898193359375, -3.52093505859375, -3.35205078125, -3.18316650390625, -3.0142822265625, -2.84539794921875, -2.676513671875, -2.50762939453125, -2.3387451171875, -2.16986083984375, -2.0009765625, -1.83209228515625, -1.6632080078125, -1.49432373046875, -1.325439453125, -1.15655517578125, -0.9876708984375, -0.81878662109375, -0.64990234375, -0.48101806640625, -0.3121337890625, -0.14324951171875, 0.025634765625, 0.19451904296875, 0.3634033203125, 0.53228759765625, 0.701171875, 0.87005615234375, 1.0389404296875, 1.20782470703125, 1.376708984375, 1.54559326171875, 1.7144775390625, 1.88336181640625, 2.05224609375, 2.22113037109375, 2.3900146484375, 2.55889892578125, 2.727783203125, 2.89666748046875, 3.0655517578125, 3.23443603515625, 3.4033203125, 3.57220458984375, 3.7410888671875, 3.90997314453125, 4.078857421875, 4.24774169921875, 4.4166259765625, 4.58551025390625, 4.75439453125, 4.92327880859375, 5.0921630859375, 5.26104736328125, 5.429931640625, 5.59881591796875, 5.7677001953125, 5.93658447265625, 6.10546875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 16.0, 24.0, 30.0, 33.0, 45.0, 45.0, 68.0, 71.0, 81.0, 86.0, 81.0, 79.0, 61.0, 51.0, 48.0, 48.0, 33.0, 25.0, 14.0, 16.0, 11.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41552734375, -0.404205322265625, -0.39288330078125, -0.381561279296875, -0.3702392578125, -0.358917236328125, -0.34759521484375, -0.336273193359375, -0.324951171875, -0.313629150390625, -0.30230712890625, -0.290985107421875, -0.2796630859375, -0.268341064453125, -0.25701904296875, -0.245697021484375, -0.234375, -0.223052978515625, -0.21173095703125, -0.200408935546875, -0.1890869140625, -0.177764892578125, -0.16644287109375, -0.155120849609375, -0.143798828125, -0.132476806640625, -0.12115478515625, -0.109832763671875, -0.0985107421875, -0.087188720703125, -0.07586669921875, -0.064544677734375, -0.05322265625, -0.041900634765625, -0.03057861328125, -0.019256591796875, -0.0079345703125, 0.003387451171875, 0.01470947265625, 0.026031494140625, 0.037353515625, 0.048675537109375, 0.05999755859375, 0.071319580078125, 0.0826416015625, 0.093963623046875, 0.10528564453125, 0.116607666015625, 0.1279296875, 0.139251708984375, 0.15057373046875, 0.161895751953125, 0.1732177734375, 0.184539794921875, 0.19586181640625, 0.207183837890625, 0.218505859375, 0.229827880859375, 0.24114990234375, 0.252471923828125, 0.2637939453125, 0.275115966796875, 0.28643798828125, 0.297760009765625, 0.30908203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 15.0, 18.0, 25.0, 35.0, 46.0, 73.0, 82.0, 166.0, 201.0, 313.0, 523.0, 822.0, 1582.0, 3747.0, 11602.0, 47103.0, 195655.0, 440874.0, 256103.0, 64525.0, 15642.0, 4794.0, 1868.0, 1015.0, 600.0, 366.0, 227.0, 174.0, 97.0, 84.0, 42.0, 28.0, 25.0, 18.0, 12.0, 10.0, 6.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7978515625, -1.7303009033203125, -1.662750244140625, -1.5951995849609375, -1.52764892578125, -1.4600982666015625, -1.392547607421875, -1.3249969482421875, -1.2574462890625, -1.1898956298828125, -1.122344970703125, -1.0547943115234375, -0.98724365234375, -0.9196929931640625, -0.852142333984375, -0.7845916748046875, -0.717041015625, -0.6494903564453125, -0.581939697265625, -0.5143890380859375, -0.44683837890625, -0.3792877197265625, -0.311737060546875, -0.2441864013671875, -0.1766357421875, -0.1090850830078125, -0.041534423828125, 0.0260162353515625, 0.09356689453125, 0.1611175537109375, 0.228668212890625, 0.2962188720703125, 0.36376953125, 0.4313201904296875, 0.498870849609375, 0.5664215087890625, 0.63397216796875, 0.7015228271484375, 0.769073486328125, 0.8366241455078125, 0.9041748046875, 0.9717254638671875, 1.039276123046875, 1.1068267822265625, 1.17437744140625, 1.2419281005859375, 1.309478759765625, 1.3770294189453125, 1.444580078125, 1.5121307373046875, 1.579681396484375, 1.6472320556640625, 1.71478271484375, 1.7823333740234375, 1.849884033203125, 1.9174346923828125, 1.9849853515625, 2.0525360107421875, 2.120086669921875, 2.1876373291015625, 2.25518798828125, 2.3227386474609375, 2.390289306640625, 2.4578399658203125, 2.525390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 7.0, 7.0, 10.0, 12.0, 17.0, 18.0, 24.0, 30.0, 31.0, 27.0, 33.0, 34.0, 39.0, 39.0, 44.0, 45.0, 50.0, 45.0, 35.0, 44.0, 52.0, 41.0, 40.0, 33.0, 46.0, 30.0, 23.0, 24.0, 23.0, 12.0, 11.0, 12.0, 10.0, 4.0, 5.0, 4.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0032958984375, -0.970458984375, -0.9376220703125, -0.90478515625, -0.8719482421875, -0.839111328125, -0.8062744140625, -0.7734375, -0.7406005859375, -0.707763671875, -0.6749267578125, -0.64208984375, -0.6092529296875, -0.576416015625, -0.5435791015625, -0.5107421875, -0.4779052734375, -0.445068359375, -0.4122314453125, -0.37939453125, -0.3465576171875, -0.313720703125, -0.2808837890625, -0.248046875, -0.2152099609375, -0.182373046875, -0.1495361328125, -0.11669921875, -0.0838623046875, -0.051025390625, -0.0181884765625, 0.0146484375, 0.0474853515625, 0.080322265625, 0.1131591796875, 0.14599609375, 0.1788330078125, 0.211669921875, 0.2445068359375, 0.27734375, 0.3101806640625, 0.343017578125, 0.3758544921875, 0.40869140625, 0.4415283203125, 0.474365234375, 0.5072021484375, 0.5400390625, 0.5728759765625, 0.605712890625, 0.6385498046875, 0.67138671875, 0.7042236328125, 0.737060546875, 0.7698974609375, 0.802734375, 0.8355712890625, 0.868408203125, 0.9012451171875, 0.93408203125, 0.9669189453125, 0.999755859375, 1.0325927734375, 1.0654296875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 15.0, 21.0, 29.0, 52.0, 82.0, 107.0, 160.0, 309.0, 576.0, 1321.0, 3083.0, 9398.0, 36609.0, 220565.0, 582758.0, 153678.0, 27491.0, 7217.0, 2544.0, 1142.0, 528.0, 311.0, 164.0, 109.0, 85.0, 54.0, 36.0, 27.0, 16.0, 11.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7534027099609375, -1.689422607421875, -1.6254425048828125, -1.56146240234375, -1.4974822998046875, -1.433502197265625, -1.3695220947265625, -1.3055419921875, -1.2415618896484375, -1.177581787109375, -1.1136016845703125, -1.04962158203125, -0.9856414794921875, -0.921661376953125, -0.8576812744140625, -0.793701171875, -0.7297210693359375, -0.665740966796875, -0.6017608642578125, -0.53778076171875, -0.4738006591796875, -0.409820556640625, -0.3458404541015625, -0.2818603515625, -0.2178802490234375, -0.153900146484375, -0.0899200439453125, -0.02593994140625, 0.0380401611328125, 0.102020263671875, 0.1660003662109375, 0.22998046875, 0.2939605712890625, 0.357940673828125, 0.4219207763671875, 0.48590087890625, 0.5498809814453125, 0.613861083984375, 0.6778411865234375, 0.7418212890625, 0.8058013916015625, 0.869781494140625, 0.9337615966796875, 0.99774169921875, 1.0617218017578125, 1.125701904296875, 1.1896820068359375, 1.253662109375, 1.3176422119140625, 1.381622314453125, 1.4456024169921875, 1.50958251953125, 1.5735626220703125, 1.637542724609375, 1.7015228271484375, 1.7655029296875, 1.8294830322265625, 1.893463134765625, 1.9574432373046875, 2.02142333984375, 2.0854034423828125, 2.149383544921875, 2.2133636474609375, 2.27734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 11.0, 9.0, 10.0, 18.0, 17.0, 19.0, 27.0, 32.0, 35.0, 48.0, 55.0, 76.0, 61.0, 69.0, 68.0, 74.0, 53.0, 56.0, 50.0, 44.0, 33.0, 27.0, 27.0, 14.0, 17.0, 17.0, 5.0, 9.0, 4.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019943714141845703, -0.00019270740449428558, -0.00018597766757011414, -0.0001792479306459427, -0.00017251819372177124, -0.0001657884567975998, -0.00015905871987342834, -0.0001523289829492569, -0.00014559924602508545, -0.000138869509100914, -0.00013213977217674255, -0.0001254100352525711, -0.00011868029832839966, -0.00011195056140422821, -0.00010522082448005676, -9.849108755588531e-05, -9.176135063171387e-05, -8.503161370754242e-05, -7.830187678337097e-05, -7.157213985919952e-05, -6.484240293502808e-05, -5.811266601085663e-05, -5.138292908668518e-05, -4.465319216251373e-05, -3.7923455238342285e-05, -3.119371831417084e-05, -2.446398138999939e-05, -1.7734244465827942e-05, -1.1004507541656494e-05, -4.274770617485046e-06, 2.4549663066864014e-06, 9.184703230857849e-06, 1.5914440155029297e-05, 2.2644177079200745e-05, 2.9373914003372192e-05, 3.610365092754364e-05, 4.283338785171509e-05, 4.9563124775886536e-05, 5.6292861700057983e-05, 6.302259862422943e-05, 6.975233554840088e-05, 7.648207247257233e-05, 8.321180939674377e-05, 8.994154632091522e-05, 9.667128324508667e-05, 0.00010340102016925812, 0.00011013075709342957, 0.00011686049401760101, 0.00012359023094177246, 0.0001303199678659439, 0.00013704970479011536, 0.0001437794417142868, 0.00015050917863845825, 0.0001572389155626297, 0.00016396865248680115, 0.0001706983894109726, 0.00017742812633514404, 0.0001841578632593155, 0.00019088760018348694, 0.00019761733710765839, 0.00020434707403182983, 0.00021107681095600128, 0.00021780654788017273, 0.00022453628480434418, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 16.0, 24.0, 38.0, 73.0, 135.0, 218.0, 478.0, 1184.0, 3787.0, 20397.0, 240860.0, 688856.0, 78732.0, 9704.0, 2340.0, 850.0, 397.0, 192.0, 109.0, 44.0, 37.0, 21.0, 16.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.806793212890625, -2.71710205078125, -2.627410888671875, -2.5377197265625, -2.448028564453125, -2.35833740234375, -2.268646240234375, -2.178955078125, -2.089263916015625, -1.99957275390625, -1.909881591796875, -1.8201904296875, -1.730499267578125, -1.64080810546875, -1.551116943359375, -1.46142578125, -1.371734619140625, -1.28204345703125, -1.192352294921875, -1.1026611328125, -1.012969970703125, -0.92327880859375, -0.833587646484375, -0.743896484375, -0.654205322265625, -0.56451416015625, -0.474822998046875, -0.3851318359375, -0.295440673828125, -0.20574951171875, -0.116058349609375, -0.0263671875, 0.063323974609375, 0.15301513671875, 0.242706298828125, 0.3323974609375, 0.422088623046875, 0.51177978515625, 0.601470947265625, 0.691162109375, 0.780853271484375, 0.87054443359375, 0.960235595703125, 1.0499267578125, 1.139617919921875, 1.22930908203125, 1.319000244140625, 1.40869140625, 1.498382568359375, 1.58807373046875, 1.677764892578125, 1.7674560546875, 1.857147216796875, 1.94683837890625, 2.036529541015625, 2.126220703125, 2.215911865234375, 2.30560302734375, 2.395294189453125, 2.4849853515625, 2.574676513671875, 2.66436767578125, 2.754058837890625, 2.84375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 11.0, 15.0, 22.0, 18.0, 33.0, 45.0, 58.0, 71.0, 77.0, 78.0, 87.0, 87.0, 80.0, 70.0, 61.0, 43.0, 39.0, 14.0, 21.0, 20.0, 9.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.7998809814453125, -0.768707275390625, -0.7375335693359375, -0.70635986328125, -0.6751861572265625, -0.644012451171875, -0.6128387451171875, -0.5816650390625, -0.5504913330078125, -0.519317626953125, -0.4881439208984375, -0.45697021484375, -0.4257965087890625, -0.394622802734375, -0.3634490966796875, -0.332275390625, -0.3011016845703125, -0.269927978515625, -0.2387542724609375, -0.20758056640625, -0.1764068603515625, -0.145233154296875, -0.1140594482421875, -0.0828857421875, -0.0517120361328125, -0.020538330078125, 0.0106353759765625, 0.04180908203125, 0.0729827880859375, 0.104156494140625, 0.1353302001953125, 0.16650390625, 0.1976776123046875, 0.228851318359375, 0.2600250244140625, 0.29119873046875, 0.3223724365234375, 0.353546142578125, 0.3847198486328125, 0.4158935546875, 0.4470672607421875, 0.478240966796875, 0.5094146728515625, 0.54058837890625, 0.5717620849609375, 0.602935791015625, 0.6341094970703125, 0.665283203125, 0.6964569091796875, 0.727630615234375, 0.7588043212890625, 0.78997802734375, 0.8211517333984375, 0.852325439453125, 0.8834991455078125, 0.9146728515625, 0.9458465576171875, 0.977020263671875, 1.0081939697265625, 1.03936767578125, 1.0705413818359375, 1.101715087890625, 1.1328887939453125, 1.1640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 10.0, 24.0, 107.0, 218.0, 318.0, 208.0, 79.0, 26.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.307259559631348, -11.382889747619629, -10.458520889282227, -9.534151077270508, -8.609781265258789, -7.68541145324707, -6.76104211807251, -5.836672782897949, -4.9123029708862305, -3.987933397293091, -3.063563823699951, -2.1391942501068115, -1.2148246765136719, -0.2904548645019531, 0.6339144706726074, 1.558283805847168, 2.4826536178588867, 3.4070231914520264, 4.331392765045166, 5.255762100219727, 6.180131912231445, 7.104501724243164, 8.028871536254883, 8.953240394592285, 9.877610206604004, 10.801980018615723, 11.726348876953125, 12.650718688964844, 13.575088500976562, 14.499458312988281, 15.423828125, 16.34819793701172, 17.272567749023438, 18.196937561035156, 19.121307373046875, 20.045677185058594, 20.970046997070312, 21.89441680908203, 22.818784713745117, 23.743154525756836, 24.667524337768555, 25.591894149780273, 26.516263961791992, 27.44063377380371, 28.365001678466797, 29.289371490478516, 30.213741302490234, 31.138111114501953, 32.06248092651367, 32.98685073852539, 33.91122055053711, 34.83559036254883, 35.75996017456055, 36.684329986572266, 37.608699798583984, 38.53306579589844, 39.457435607910156, 40.381805419921875, 41.306175231933594, 42.23054504394531, 43.15491485595703, 44.07928466796875, 45.00365447998047, 45.92802429199219, 46.852394104003906]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 6.0, 11.0, 16.0, 19.0, 19.0, 19.0, 37.0, 34.0, 42.0, 38.0, 38.0, 44.0, 46.0, 52.0, 48.0, 38.0, 54.0, 41.0, 42.0, 35.0, 46.0, 36.0, 31.0, 22.0, 29.0, 30.0, 26.0, 10.0, 8.0, 9.0, 8.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.671116352081299, -7.450446128845215, -7.229775905609131, -7.009105682373047, -6.788434982299805, -6.567764759063721, -6.347094535827637, -6.126424312591553, -5.905754089355469, -5.685083866119385, -5.464413642883301, -5.243742942810059, -5.023072719573975, -4.802402496337891, -4.581732273101807, -4.361062049865723, -4.1403913497924805, -3.9197211265563965, -3.6990506649017334, -3.4783804416656494, -3.2577099800109863, -3.0370397567749023, -2.8163695335388184, -2.5956993103027344, -2.3750288486480713, -2.1543586254119873, -1.9336881637573242, -1.7130179405212402, -1.4923475980758667, -1.2716772556304932, -1.0510070323944092, -0.8303366899490356, -0.6096658706665039, -0.38899555802345276, -0.1683252453804016, 0.05234503746032715, 0.2730153799057007, 0.4936857223510742, 0.7143559455871582, 0.9350262880325317, 1.1556966304779053, 1.3763669729232788, 1.5970373153686523, 1.8177075386047363, 2.0383777618408203, 2.2590482234954834, 2.4797184467315674, 2.7003889083862305, 2.9210591316223145, 3.1417293548583984, 3.3623998165130615, 3.5830700397491455, 3.8037405014038086, 4.024410724639893, 4.245080947875977, 4.4657511711120605, 4.6864213943481445, 4.9070916175842285, 5.1277618408203125, 5.348432540893555, 5.569102764129639, 5.789772987365723, 6.010443210601807, 6.231113433837891, 6.451784133911133]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 7.0, 10.0, 3.0, 8.0, 15.0, 15.0, 13.0, 25.0, 28.0, 39.0, 49.0, 94.0, 127.0, 242.0, 510.0, 1122.0, 3793.0, 19237.0, 296440.0, 3790170.0, 70435.0, 8806.0, 1928.0, 637.0, 253.0, 101.0, 52.0, 34.0, 16.0, 12.0, 7.0, 13.0, 6.0, 6.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.06597900390625, -5.8780517578125, -5.69012451171875, -5.502197265625, -5.31427001953125, -5.1263427734375, -4.93841552734375, -4.75048828125, -4.56256103515625, -4.3746337890625, -4.18670654296875, -3.998779296875, -3.81085205078125, -3.6229248046875, -3.43499755859375, -3.2470703125, -3.05914306640625, -2.8712158203125, -2.68328857421875, -2.495361328125, -2.30743408203125, -2.1195068359375, -1.93157958984375, -1.74365234375, -1.55572509765625, -1.3677978515625, -1.17987060546875, -0.991943359375, -0.80401611328125, -0.6160888671875, -0.42816162109375, -0.240234375, -0.05230712890625, 0.1356201171875, 0.32354736328125, 0.511474609375, 0.69940185546875, 0.8873291015625, 1.07525634765625, 1.26318359375, 1.45111083984375, 1.6390380859375, 1.82696533203125, 2.014892578125, 2.20281982421875, 2.3907470703125, 2.57867431640625, 2.7666015625, 2.95452880859375, 3.1424560546875, 3.33038330078125, 3.518310546875, 3.70623779296875, 3.8941650390625, 4.08209228515625, 4.27001953125, 4.45794677734375, 4.6458740234375, 4.83380126953125, 5.021728515625, 5.20965576171875, 5.3975830078125, 5.58551025390625, 5.7734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 19.0, 16.0, 18.0, 47.0, 23.0, 41.0, 49.0, 81.0, 79.0, 75.0, 98.0, 76.0, 83.0, 51.0, 51.0, 34.0, 29.0, 25.0, 28.0, 19.0, 13.0, 11.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4599609375, -0.44878387451171875, -0.4376068115234375, -0.42642974853515625, -0.415252685546875, -0.40407562255859375, -0.3928985595703125, -0.38172149658203125, -0.37054443359375, -0.35936737060546875, -0.3481903076171875, -0.33701324462890625, -0.325836181640625, -0.31465911865234375, -0.3034820556640625, -0.29230499267578125, -0.2811279296875, -0.26995086669921875, -0.2587738037109375, -0.24759674072265625, -0.236419677734375, -0.22524261474609375, -0.2140655517578125, -0.20288848876953125, -0.19171142578125, -0.18053436279296875, -0.1693572998046875, -0.15818023681640625, -0.147003173828125, -0.13582611083984375, -0.1246490478515625, -0.11347198486328125, -0.102294921875, -0.09111785888671875, -0.0799407958984375, -0.06876373291015625, -0.057586669921875, -0.04640960693359375, -0.0352325439453125, -0.02405548095703125, -0.01287841796875, -0.00170135498046875, 0.0094757080078125, 0.02065277099609375, 0.031829833984375, 0.04300689697265625, 0.0541839599609375, 0.06536102294921875, 0.0765380859375, 0.08771514892578125, 0.0988922119140625, 0.11006927490234375, 0.121246337890625, 0.13242340087890625, 0.1436004638671875, 0.15477752685546875, 0.16595458984375, 0.17713165283203125, 0.1883087158203125, 0.19948577880859375, 0.210662841796875, 0.22183990478515625, 0.2330169677734375, 0.24419403076171875, 0.25537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 12.0, 14.0, 31.0, 53.0, 112.0, 229.0, 876.0, 28119.0, 4160066.0, 4183.0, 365.0, 102.0, 59.0, 35.0, 12.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.2078857421875, -27.525146484375, -26.8424072265625, -26.15966796875, -25.4769287109375, -24.794189453125, -24.1114501953125, -23.4287109375, -22.7459716796875, -22.063232421875, -21.3804931640625, -20.69775390625, -20.0150146484375, -19.332275390625, -18.6495361328125, -17.966796875, -17.2840576171875, -16.601318359375, -15.9185791015625, -15.23583984375, -14.5531005859375, -13.870361328125, -13.1876220703125, -12.5048828125, -11.8221435546875, -11.139404296875, -10.4566650390625, -9.77392578125, -9.0911865234375, -8.408447265625, -7.7257080078125, -7.04296875, -6.3602294921875, -5.677490234375, -4.9947509765625, -4.31201171875, -3.6292724609375, -2.946533203125, -2.2637939453125, -1.5810546875, -0.8983154296875, -0.215576171875, 0.4671630859375, 1.14990234375, 1.8326416015625, 2.515380859375, 3.1981201171875, 3.880859375, 4.5635986328125, 5.246337890625, 5.9290771484375, 6.61181640625, 7.2945556640625, 7.977294921875, 8.6600341796875, 9.3427734375, 10.0255126953125, 10.708251953125, 11.3909912109375, 12.07373046875, 12.7564697265625, 13.439208984375, 14.1219482421875, 14.8046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 24.0, 63.0, 183.0, 856.0, 2329.0, 412.0, 116.0, 39.0, 20.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.0078125, -2.9491729736328125, -2.890533447265625, -2.8318939208984375, -2.77325439453125, -2.7146148681640625, -2.655975341796875, -2.5973358154296875, -2.5386962890625, -2.4800567626953125, -2.421417236328125, -2.3627777099609375, -2.30413818359375, -2.2454986572265625, -2.186859130859375, -2.1282196044921875, -2.069580078125, -2.0109405517578125, -1.952301025390625, -1.8936614990234375, -1.83502197265625, -1.7763824462890625, -1.717742919921875, -1.6591033935546875, -1.6004638671875, -1.5418243408203125, -1.483184814453125, -1.4245452880859375, -1.36590576171875, -1.3072662353515625, -1.248626708984375, -1.1899871826171875, -1.13134765625, -1.0727081298828125, -1.014068603515625, -0.9554290771484375, -0.89678955078125, -0.8381500244140625, -0.779510498046875, -0.7208709716796875, -0.6622314453125, -0.6035919189453125, -0.544952392578125, -0.4863128662109375, -0.42767333984375, -0.3690338134765625, -0.310394287109375, -0.2517547607421875, -0.193115234375, -0.1344757080078125, -0.075836181640625, -0.0171966552734375, 0.04144287109375, 0.1000823974609375, 0.158721923828125, 0.2173614501953125, 0.2760009765625, 0.3346405029296875, 0.393280029296875, 0.4519195556640625, 0.51055908203125, 0.5691986083984375, 0.627838134765625, 0.6864776611328125, 0.7451171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 23.0, 64.0, 568.0, 318.0, 32.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.848087310791016, -42.86951446533203, -41.89094543457031, -40.91237258911133, -39.93380355834961, -38.955230712890625, -37.976661682128906, -36.99808883666992, -36.01951599121094, -35.04094314575195, -34.062374114990234, -33.08380126953125, -32.10523223876953, -31.126659393310547, -30.148088455200195, -29.169517517089844, -28.190948486328125, -27.212377548217773, -26.233806610107422, -25.255233764648438, -24.276662826538086, -23.298091888427734, -22.319520950317383, -21.34095001220703, -20.362377166748047, -19.383806228637695, -18.405235290527344, -17.42666244506836, -16.448091506958008, -15.469520568847656, -14.490949630737305, -13.512378692626953, -12.533807754516602, -11.55523681640625, -10.576664924621582, -9.59809398651123, -8.619523048400879, -7.640951633453369, -6.662380218505859, -5.683809280395508, -4.705237865447998, -3.7266666889190674, -2.7480955123901367, -1.769524097442627, -0.7909529209136963, 0.18761825561523438, 1.1661896705627441, 2.1447606086730957, 3.1233320236206055, 4.101903438568115, 5.080474376678467, 6.059045791625977, 7.037616729736328, 8.01618766784668, 8.994759559631348, 9.9733304977417, 10.951902389526367, 11.930473327636719, 12.909045219421387, 13.887616157531738, 14.86618709564209, 15.844758987426758, 16.82332992553711, 17.80190086364746, 18.780471801757812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 10.0, 5.0, 8.0, 18.0, 17.0, 34.0, 34.0, 62.0, 77.0, 63.0, 74.0, 86.0, 81.0, 73.0, 81.0, 68.0, 56.0, 57.0, 47.0, 21.0, 10.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.372196197509766, -6.1926469802856445, -6.013097286224365, -5.833547592163086, -5.653998374938965, -5.474449157714844, -5.2948994636535645, -5.115349769592285, -4.935800552368164, -4.756251335144043, -4.576701641082764, -4.397151947021484, -4.217602729797363, -4.038053512573242, -3.858503818511963, -3.6789543628692627, -3.4994049072265625, -3.3198554515838623, -3.140305995941162, -2.960756540298462, -2.7812070846557617, -2.6016576290130615, -2.4221081733703613, -2.242558717727661, -2.063009262084961, -1.8834598064422607, -1.7039103507995605, -1.5243608951568604, -1.3448114395141602, -1.16526198387146, -0.9857125282287598, -0.8061630725860596, -0.6266131401062012, -0.447063684463501, -0.2675142288208008, -0.08796477317810059, 0.09158468246459961, 0.2711341381072998, 0.45068359375, 0.6302330493927002, 0.8097825050354004, 0.9893319606781006, 1.1688814163208008, 1.348430871963501, 1.5279803276062012, 1.7075297832489014, 1.8870792388916016, 2.0666286945343018, 2.246178150177002, 2.425727605819702, 2.6052770614624023, 2.7848265171051025, 2.9643759727478027, 3.143925428390503, 3.323474884033203, 3.5030243396759033, 3.6825737953186035, 3.8621232509613037, 4.041672706604004, 4.221221923828125, 4.400771617889404, 4.580321311950684, 4.759870529174805, 4.939419746398926, 5.118969440460205]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 3.0, 6.0, 9.0, 18.0, 18.0, 25.0, 33.0, 41.0, 59.0, 115.0, 182.0, 364.0, 856.0, 2969.0, 17148.0, 203980.0, 708904.0, 100276.0, 10002.0, 2069.0, 706.0, 299.0, 164.0, 103.0, 62.0, 39.0, 19.0, 19.0, 11.0, 10.0, 5.0, 8.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.63671875, -5.4935302734375, -5.350341796875, -5.2071533203125, -5.06396484375, -4.9207763671875, -4.777587890625, -4.6343994140625, -4.4912109375, -4.3480224609375, -4.204833984375, -4.0616455078125, -3.91845703125, -3.7752685546875, -3.632080078125, -3.4888916015625, -3.345703125, -3.2025146484375, -3.059326171875, -2.9161376953125, -2.77294921875, -2.6297607421875, -2.486572265625, -2.3433837890625, -2.2001953125, -2.0570068359375, -1.913818359375, -1.7706298828125, -1.62744140625, -1.4842529296875, -1.341064453125, -1.1978759765625, -1.0546875, -0.9114990234375, -0.768310546875, -0.6251220703125, -0.48193359375, -0.3387451171875, -0.195556640625, -0.0523681640625, 0.0908203125, 0.2340087890625, 0.377197265625, 0.5203857421875, 0.66357421875, 0.8067626953125, 0.949951171875, 1.0931396484375, 1.236328125, 1.3795166015625, 1.522705078125, 1.6658935546875, 1.80908203125, 1.9522705078125, 2.095458984375, 2.2386474609375, 2.3818359375, 2.5250244140625, 2.668212890625, 2.8114013671875, 2.95458984375, 3.0977783203125, 3.240966796875, 3.3841552734375, 3.52734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 10.0, 9.0, 13.0, 19.0, 23.0, 36.0, 34.0, 60.0, 63.0, 90.0, 69.0, 85.0, 89.0, 68.0, 77.0, 64.0, 37.0, 40.0, 38.0, 31.0, 10.0, 7.0, 10.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.53955078125, -0.5252456665039062, -0.5109405517578125, -0.49663543701171875, -0.482330322265625, -0.46802520751953125, -0.4537200927734375, -0.43941497802734375, -0.42510986328125, -0.41080474853515625, -0.3964996337890625, -0.38219451904296875, -0.367889404296875, -0.35358428955078125, -0.3392791748046875, -0.32497406005859375, -0.3106689453125, -0.29636383056640625, -0.2820587158203125, -0.26775360107421875, -0.253448486328125, -0.23914337158203125, -0.2248382568359375, -0.21053314208984375, -0.19622802734375, -0.18192291259765625, -0.1676177978515625, -0.15331268310546875, -0.139007568359375, -0.12470245361328125, -0.1103973388671875, -0.09609222412109375, -0.081787109375, -0.06748199462890625, -0.0531768798828125, -0.03887176513671875, -0.024566650390625, -0.01026153564453125, 0.0040435791015625, 0.01834869384765625, 0.03265380859375, 0.04695892333984375, 0.0612640380859375, 0.07556915283203125, 0.089874267578125, 0.10417938232421875, 0.1184844970703125, 0.13278961181640625, 0.1470947265625, 0.16139984130859375, 0.1757049560546875, 0.19001007080078125, 0.204315185546875, 0.21862030029296875, 0.2329254150390625, 0.24723052978515625, 0.26153564453125, 0.27584075927734375, 0.2901458740234375, 0.30445098876953125, 0.318756103515625, 0.33306121826171875, 0.3473663330078125, 0.36167144775390625, 0.3759765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 10.0, 21.0, 20.0, 28.0, 37.0, 56.0, 74.0, 113.0, 145.0, 179.0, 305.0, 434.0, 730.0, 1274.0, 2426.0, 5536.0, 15307.0, 52112.0, 186801.0, 403862.0, 262675.0, 79392.0, 22339.0, 7479.0, 3124.0, 1549.0, 857.0, 491.0, 347.0, 236.0, 139.0, 132.0, 72.0, 64.0, 47.0, 30.0, 22.0, 17.0, 15.0, 10.0, 15.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.88671875, -1.828948974609375, -1.77117919921875, -1.713409423828125, -1.6556396484375, -1.597869873046875, -1.54010009765625, -1.482330322265625, -1.424560546875, -1.366790771484375, -1.30902099609375, -1.251251220703125, -1.1934814453125, -1.135711669921875, -1.07794189453125, -1.020172119140625, -0.96240234375, -0.904632568359375, -0.84686279296875, -0.789093017578125, -0.7313232421875, -0.673553466796875, -0.61578369140625, -0.558013916015625, -0.500244140625, -0.442474365234375, -0.38470458984375, -0.326934814453125, -0.2691650390625, -0.211395263671875, -0.15362548828125, -0.095855712890625, -0.0380859375, 0.019683837890625, 0.07745361328125, 0.135223388671875, 0.1929931640625, 0.250762939453125, 0.30853271484375, 0.366302490234375, 0.424072265625, 0.481842041015625, 0.53961181640625, 0.597381591796875, 0.6551513671875, 0.712921142578125, 0.77069091796875, 0.828460693359375, 0.88623046875, 0.944000244140625, 1.00177001953125, 1.059539794921875, 1.1173095703125, 1.175079345703125, 1.23284912109375, 1.290618896484375, 1.348388671875, 1.406158447265625, 1.46392822265625, 1.521697998046875, 1.5794677734375, 1.637237548828125, 1.69500732421875, 1.752777099609375, 1.810546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 1.0, 7.0, 10.0, 16.0, 9.0, 10.0, 13.0, 12.0, 18.0, 18.0, 24.0, 13.0, 25.0, 37.0, 33.0, 31.0, 42.0, 39.0, 39.0, 44.0, 30.0, 50.0, 36.0, 39.0, 33.0, 40.0, 44.0, 30.0, 34.0, 31.0, 23.0, 21.0, 26.0, 19.0, 14.0, 13.0, 13.0, 11.0, 8.0, 5.0, 8.0, 10.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.984375, -0.949249267578125, -0.91412353515625, -0.878997802734375, -0.8438720703125, -0.808746337890625, -0.77362060546875, -0.738494873046875, -0.703369140625, -0.668243408203125, -0.63311767578125, -0.597991943359375, -0.5628662109375, -0.527740478515625, -0.49261474609375, -0.457489013671875, -0.42236328125, -0.387237548828125, -0.35211181640625, -0.316986083984375, -0.2818603515625, -0.246734619140625, -0.21160888671875, -0.176483154296875, -0.141357421875, -0.106231689453125, -0.07110595703125, -0.035980224609375, -0.0008544921875, 0.034271240234375, 0.06939697265625, 0.104522705078125, 0.1396484375, 0.174774169921875, 0.20989990234375, 0.245025634765625, 0.2801513671875, 0.315277099609375, 0.35040283203125, 0.385528564453125, 0.420654296875, 0.455780029296875, 0.49090576171875, 0.526031494140625, 0.5611572265625, 0.596282958984375, 0.63140869140625, 0.666534423828125, 0.70166015625, 0.736785888671875, 0.77191162109375, 0.807037353515625, 0.8421630859375, 0.877288818359375, 0.91241455078125, 0.947540283203125, 0.982666015625, 1.017791748046875, 1.05291748046875, 1.088043212890625, 1.1231689453125, 1.158294677734375, 1.19342041015625, 1.228546142578125, 1.263671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 12.0, 16.0, 23.0, 43.0, 61.0, 99.0, 168.0, 319.0, 644.0, 1464.0, 3880.0, 13165.0, 64097.0, 358201.0, 477047.0, 101658.0, 19122.0, 5088.0, 1745.0, 778.0, 381.0, 219.0, 103.0, 88.0, 42.0, 23.0, 21.0, 15.0, 13.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2764892578125, -1.232666015625, -1.1888427734375, -1.14501953125, -1.1011962890625, -1.057373046875, -1.0135498046875, -0.9697265625, -0.9259033203125, -0.882080078125, -0.8382568359375, -0.79443359375, -0.7506103515625, -0.706787109375, -0.6629638671875, -0.619140625, -0.5753173828125, -0.531494140625, -0.4876708984375, -0.44384765625, -0.4000244140625, -0.356201171875, -0.3123779296875, -0.2685546875, -0.2247314453125, -0.180908203125, -0.1370849609375, -0.09326171875, -0.0494384765625, -0.005615234375, 0.0382080078125, 0.08203125, 0.1258544921875, 0.169677734375, 0.2135009765625, 0.25732421875, 0.3011474609375, 0.344970703125, 0.3887939453125, 0.4326171875, 0.4764404296875, 0.520263671875, 0.5640869140625, 0.60791015625, 0.6517333984375, 0.695556640625, 0.7393798828125, 0.783203125, 0.8270263671875, 0.870849609375, 0.9146728515625, 0.95849609375, 1.0023193359375, 1.046142578125, 1.0899658203125, 1.1337890625, 1.1776123046875, 1.221435546875, 1.2652587890625, 1.30908203125, 1.3529052734375, 1.396728515625, 1.4405517578125, 1.484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 11.0, 13.0, 7.0, 23.0, 20.0, 21.0, 27.0, 37.0, 37.0, 56.0, 53.0, 60.0, 66.0, 83.0, 69.0, 54.0, 52.0, 47.0, 46.0, 37.0, 27.0, 18.0, 18.0, 18.0, 18.0, 11.0, 12.0, 4.0, 10.0, 6.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013363361358642578, -0.0001293141394853592, -0.0001249946653842926, -0.00012067519128322601, -0.00011635571718215942, -0.00011203624308109283, -0.00010771676898002625, -0.00010339729487895966, -9.907782077789307e-05, -9.475834667682648e-05, -9.043887257575989e-05, -8.61193984746933e-05, -8.179992437362671e-05, -7.748045027256012e-05, -7.316097617149353e-05, -6.884150207042694e-05, -6.452202796936035e-05, -6.020255386829376e-05, -5.588307976722717e-05, -5.1563605666160583e-05, -4.7244131565093994e-05, -4.2924657464027405e-05, -3.8605183362960815e-05, -3.4285709261894226e-05, -2.9966235160827637e-05, -2.5646761059761047e-05, -2.1327286958694458e-05, -1.700781285762787e-05, -1.268833875656128e-05, -8.36886465549469e-06, -4.049390554428101e-06, 2.7008354663848877e-07, 4.589557647705078e-06, 8.909031748771667e-06, 1.3228505849838257e-05, 1.7547979950904846e-05, 2.1867454051971436e-05, 2.6186928153038025e-05, 3.0506402254104614e-05, 3.4825876355171204e-05, 3.914535045623779e-05, 4.346482455730438e-05, 4.778429865837097e-05, 5.210377275943756e-05, 5.642324686050415e-05, 6.074272096157074e-05, 6.506219506263733e-05, 6.938166916370392e-05, 7.370114326477051e-05, 7.80206173658371e-05, 8.234009146690369e-05, 8.665956556797028e-05, 9.097903966903687e-05, 9.529851377010345e-05, 9.961798787117004e-05, 0.00010393746197223663, 0.00010825693607330322, 0.00011257641017436981, 0.0001168958842754364, 0.00012121535837650299, 0.00012553483247756958, 0.00012985430657863617, 0.00013417378067970276, 0.00013849325478076935, 0.00014281272888183594]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 10.0, 4.0, 16.0, 23.0, 21.0, 30.0, 41.0, 56.0, 88.0, 130.0, 198.0, 317.0, 571.0, 1016.0, 1921.0, 3949.0, 9542.0, 27774.0, 103135.0, 346768.0, 380272.0, 120629.0, 31951.0, 10848.0, 4475.0, 2038.0, 1099.0, 617.0, 315.0, 184.0, 167.0, 77.0, 82.0, 39.0, 29.0, 35.0, 17.0, 12.0, 13.0, 5.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0274658203125, -0.994384765625, -0.9613037109375, -0.92822265625, -0.8951416015625, -0.862060546875, -0.8289794921875, -0.7958984375, -0.7628173828125, -0.729736328125, -0.6966552734375, -0.66357421875, -0.6304931640625, -0.597412109375, -0.5643310546875, -0.53125, -0.4981689453125, -0.465087890625, -0.4320068359375, -0.39892578125, -0.3658447265625, -0.332763671875, -0.2996826171875, -0.2666015625, -0.2335205078125, -0.200439453125, -0.1673583984375, -0.13427734375, -0.1011962890625, -0.068115234375, -0.0350341796875, -0.001953125, 0.0311279296875, 0.064208984375, 0.0972900390625, 0.13037109375, 0.1634521484375, 0.196533203125, 0.2296142578125, 0.2626953125, 0.2957763671875, 0.328857421875, 0.3619384765625, 0.39501953125, 0.4281005859375, 0.461181640625, 0.4942626953125, 0.52734375, 0.5604248046875, 0.593505859375, 0.6265869140625, 0.65966796875, 0.6927490234375, 0.725830078125, 0.7589111328125, 0.7919921875, 0.8250732421875, 0.858154296875, 0.8912353515625, 0.92431640625, 0.9573974609375, 0.990478515625, 1.0235595703125, 1.056640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 10.0, 21.0, 20.0, 20.0, 32.0, 24.0, 57.0, 51.0, 54.0, 53.0, 75.0, 76.0, 81.0, 70.0, 71.0, 63.0, 32.0, 36.0, 31.0, 29.0, 17.0, 12.0, 11.0, 5.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69287109375, -0.667724609375, -0.642578125, -0.617431640625, -0.59228515625, -0.567138671875, -0.5419921875, -0.516845703125, -0.49169921875, -0.466552734375, -0.44140625, -0.416259765625, -0.39111328125, -0.365966796875, -0.3408203125, -0.315673828125, -0.29052734375, -0.265380859375, -0.240234375, -0.215087890625, -0.18994140625, -0.164794921875, -0.1396484375, -0.114501953125, -0.08935546875, -0.064208984375, -0.0390625, -0.013916015625, 0.01123046875, 0.036376953125, 0.0615234375, 0.086669921875, 0.11181640625, 0.136962890625, 0.162109375, 0.187255859375, 0.21240234375, 0.237548828125, 0.2626953125, 0.287841796875, 0.31298828125, 0.338134765625, 0.36328125, 0.388427734375, 0.41357421875, 0.438720703125, 0.4638671875, 0.489013671875, 0.51416015625, 0.539306640625, 0.564453125, 0.589599609375, 0.61474609375, 0.639892578125, 0.6650390625, 0.690185546875, 0.71533203125, 0.740478515625, 0.765625, 0.790771484375, 0.81591796875, 0.841064453125, 0.8662109375, 0.891357421875, 0.91650390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 21.0, 67.0, 157.0, 245.0, 231.0, 144.0, 70.0, 32.0, 14.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53908348083496, -22.84380531311035, -22.148527145385742, -21.453248977661133, -20.75796890258789, -20.06269073486328, -19.367412567138672, -18.672134399414062, -17.976856231689453, -17.281578063964844, -16.586299896240234, -15.891020774841309, -15.1957426071167, -14.50046443939209, -13.805185317993164, -13.109907150268555, -12.414628982543945, -11.719350814819336, -11.024072647094727, -10.3287935256958, -9.633515357971191, -8.938237190246582, -8.242958068847656, -7.547679901123047, -6.8524017333984375, -6.157123565673828, -5.4618449211120605, -4.766566276550293, -4.071288108825684, -3.376009702682495, -2.6807312965393066, -1.985452651977539, -1.2901725769042969, -0.5948941707611084, 0.10038423538208008, 0.7956626415252686, 1.490941047668457, 2.1862194538116455, 2.881497859954834, 3.5767765045166016, 4.272054672241211, 4.96733283996582, 5.662611484527588, 6.3578901290893555, 7.053168296813965, 7.748446464538574, 8.4437255859375, 9.13900375366211, 9.834281921386719, 10.529560089111328, 11.224838256835938, 11.920117378234863, 12.615395545959473, 13.310673713684082, 14.005952835083008, 14.701231002807617, 15.396509170532227, 16.091787338256836, 16.787065505981445, 17.482343673706055, 18.177623748779297, 18.872901916503906, 19.568180084228516, 20.263458251953125, 20.958736419677734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 12.0, 12.0, 12.0, 11.0, 17.0, 11.0, 25.0, 27.0, 23.0, 32.0, 34.0, 36.0, 58.0, 38.0, 45.0, 59.0, 63.0, 49.0, 51.0, 40.0, 34.0, 40.0, 31.0, 34.0, 41.0, 26.0, 26.0, 12.0, 11.0, 21.0, 12.0, 10.0, 9.0, 6.0, 2.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.7847723960876465, -6.530965805053711, -6.277159214019775, -6.02335262298584, -5.7695465087890625, -5.515739440917969, -5.261933326721191, -5.008126735687256, -4.75432014465332, -4.500513553619385, -4.246706962585449, -3.9929006099700928, -3.7390940189361572, -3.4852874279022217, -3.2314810752868652, -2.9776744842529297, -2.723867893218994, -2.4700613021850586, -2.216254711151123, -1.9624483585357666, -1.708641767501831, -1.4548351764678955, -1.2010287046432495, -0.9472222328186035, -0.693415641784668, -0.4396091103553772, -0.18580257892608643, 0.06800395250320435, 0.3218104839324951, 0.5756170749664307, 0.8294235467910767, 1.0832300186157227, 1.3370361328125, 1.5908427238464355, 1.8446491956710815, 2.0984556674957275, 2.352262258529663, 2.6060688495635986, 2.859875202178955, 3.1136817932128906, 3.367488384246826, 3.6212949752807617, 3.8751015663146973, 4.128908157348633, 4.38271427154541, 4.636521339416504, 4.890327453613281, 5.144134044647217, 5.397940635681152, 5.651747226715088, 5.905553817749023, 6.159360408782959, 6.4131669998168945, 6.666973114013672, 6.920779705047607, 7.174586296081543, 7.4283928871154785, 7.682199478149414, 7.93600606918335, 8.189812660217285, 8.443618774414062, 8.697425842285156, 8.951231956481934, 9.205038070678711, 9.458845138549805]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 14.0, 5.0, 10.0, 10.0, 21.0, 25.0, 30.0, 43.0, 65.0, 78.0, 109.0, 155.0, 248.0, 484.0, 1247.0, 3750.0, 16202.0, 177915.0, 3886101.0, 91308.0, 11649.0, 2917.0, 993.0, 415.0, 181.0, 111.0, 66.0, 27.0, 26.0, 18.0, 6.0, 5.0, 14.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.90234375, -4.75555419921875, -4.6087646484375, -4.46197509765625, -4.315185546875, -4.16839599609375, -4.0216064453125, -3.87481689453125, -3.72802734375, -3.58123779296875, -3.4344482421875, -3.28765869140625, -3.140869140625, -2.99407958984375, -2.8472900390625, -2.70050048828125, -2.5537109375, -2.40692138671875, -2.2601318359375, -2.11334228515625, -1.966552734375, -1.81976318359375, -1.6729736328125, -1.52618408203125, -1.37939453125, -1.23260498046875, -1.0858154296875, -0.93902587890625, -0.792236328125, -0.64544677734375, -0.4986572265625, -0.35186767578125, -0.205078125, -0.05828857421875, 0.0885009765625, 0.23529052734375, 0.382080078125, 0.52886962890625, 0.6756591796875, 0.82244873046875, 0.96923828125, 1.11602783203125, 1.2628173828125, 1.40960693359375, 1.556396484375, 1.70318603515625, 1.8499755859375, 1.99676513671875, 2.1435546875, 2.29034423828125, 2.4371337890625, 2.58392333984375, 2.730712890625, 2.87750244140625, 3.0242919921875, 3.17108154296875, 3.31787109375, 3.46466064453125, 3.6114501953125, 3.75823974609375, 3.905029296875, 4.05181884765625, 4.1986083984375, 4.34539794921875, 4.4921875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 3.0, 8.0, 19.0, 18.0, 25.0, 44.0, 51.0, 59.0, 58.0, 69.0, 81.0, 79.0, 82.0, 59.0, 70.0, 53.0, 49.0, 39.0, 32.0, 27.0, 15.0, 14.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.54248046875, -0.5287551879882812, -0.5150299072265625, -0.5013046264648438, -0.487579345703125, -0.47385406494140625, -0.4601287841796875, -0.44640350341796875, -0.43267822265625, -0.41895294189453125, -0.4052276611328125, -0.39150238037109375, -0.377777099609375, -0.36405181884765625, -0.3503265380859375, -0.33660125732421875, -0.3228759765625, -0.30915069580078125, -0.2954254150390625, -0.28170013427734375, -0.267974853515625, -0.25424957275390625, -0.2405242919921875, -0.22679901123046875, -0.21307373046875, -0.19934844970703125, -0.1856231689453125, -0.17189788818359375, -0.158172607421875, -0.14444732666015625, -0.1307220458984375, -0.11699676513671875, -0.103271484375, -0.08954620361328125, -0.0758209228515625, -0.06209564208984375, -0.048370361328125, -0.03464508056640625, -0.0209197998046875, -0.00719451904296875, 0.00653076171875, 0.02025604248046875, 0.0339813232421875, 0.04770660400390625, 0.061431884765625, 0.07515716552734375, 0.0888824462890625, 0.10260772705078125, 0.1163330078125, 0.13005828857421875, 0.1437835693359375, 0.15750885009765625, 0.171234130859375, 0.18495941162109375, 0.1986846923828125, 0.21240997314453125, 0.22613525390625, 0.23986053466796875, 0.2535858154296875, 0.26731109619140625, 0.281036376953125, 0.29476165771484375, 0.3084869384765625, 0.32221221923828125, 0.3359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 10.0, 15.0, 19.0, 23.0, 48.0, 65.0, 93.0, 125.0, 175.0, 507.0, 5117.0, 3762717.0, 421604.0, 2862.0, 345.0, 153.0, 108.0, 70.0, 60.0, 33.0, 37.0, 37.0, 22.0, 12.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.25, -7.8896484375, -7.529296875, -7.1689453125, -6.80859375, -6.4482421875, -6.087890625, -5.7275390625, -5.3671875, -5.0068359375, -4.646484375, -4.2861328125, -3.92578125, -3.5654296875, -3.205078125, -2.8447265625, -2.484375, -2.1240234375, -1.763671875, -1.4033203125, -1.04296875, -0.6826171875, -0.322265625, 0.0380859375, 0.3984375, 0.7587890625, 1.119140625, 1.4794921875, 1.83984375, 2.2001953125, 2.560546875, 2.9208984375, 3.28125, 3.6416015625, 4.001953125, 4.3623046875, 4.72265625, 5.0830078125, 5.443359375, 5.8037109375, 6.1640625, 6.5244140625, 6.884765625, 7.2451171875, 7.60546875, 7.9658203125, 8.326171875, 8.6865234375, 9.046875, 9.4072265625, 9.767578125, 10.1279296875, 10.48828125, 10.8486328125, 11.208984375, 11.5693359375, 11.9296875, 12.2900390625, 12.650390625, 13.0107421875, 13.37109375, 13.7314453125, 14.091796875, 14.4521484375, 14.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 16.0, 41.0, 315.0, 3052.0, 544.0, 84.0, 19.0, 12.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.483154296875, -2.38623046875, -2.289306640625, -2.1923828125, -2.095458984375, -1.99853515625, -1.901611328125, -1.8046875, -1.707763671875, -1.61083984375, -1.513916015625, -1.4169921875, -1.320068359375, -1.22314453125, -1.126220703125, -1.029296875, -0.932373046875, -0.83544921875, -0.738525390625, -0.6416015625, -0.544677734375, -0.44775390625, -0.350830078125, -0.25390625, -0.156982421875, -0.06005859375, 0.036865234375, 0.1337890625, 0.230712890625, 0.32763671875, 0.424560546875, 0.521484375, 0.618408203125, 0.71533203125, 0.812255859375, 0.9091796875, 1.006103515625, 1.10302734375, 1.199951171875, 1.296875, 1.393798828125, 1.49072265625, 1.587646484375, 1.6845703125, 1.781494140625, 1.87841796875, 1.975341796875, 2.072265625, 2.169189453125, 2.26611328125, 2.363037109375, 2.4599609375, 2.556884765625, 2.65380859375, 2.750732421875, 2.84765625, 2.944580078125, 3.04150390625, 3.138427734375, 3.2353515625, 3.332275390625, 3.42919921875, 3.526123046875, 3.623046875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 13.0, 148.0, 590.0, 212.0, 33.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.634317874908447, -5.9419779777526855, -5.249637603759766, -4.557297706604004, -3.864957809448242, -3.1726179122924805, -2.4802775382995605, -1.7879376411437988, -1.095597743988037, -0.40325772762298584, 0.28908228874206543, 0.9814224243164062, 1.673762321472168, 2.3661022186279297, 3.0584425926208496, 3.7507824897766113, 4.443122386932373, 5.135462284088135, 5.827802658081055, 6.520142555236816, 7.212482452392578, 7.90482234954834, 8.597162246704102, 9.28950309753418, 9.981842041015625, 10.674181938171387, 11.366521835327148, 12.058862686157227, 12.751201629638672, 13.44354248046875, 14.135882377624512, 14.828222274780273, 15.520561218261719, 16.212902069091797, 16.905241012573242, 17.59758186340332, 18.289920806884766, 18.982261657714844, 19.674602508544922, 20.366941452026367, 21.059280395507812, 21.75162124633789, 22.443960189819336, 23.136301040649414, 23.82863998413086, 24.520980834960938, 25.213321685791016, 25.90566062927246, 26.59800148010254, 27.290342330932617, 27.982681274414062, 28.67502212524414, 29.367361068725586, 30.059701919555664, 30.75204086303711, 31.444381713867188, 32.136722564697266, 32.829063415527344, 33.52140426635742, 34.213741302490234, 34.90608215332031, 35.59842300415039, 36.29076385498047, 36.98310089111328, 37.67544174194336]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 10.0, 17.0, 23.0, 45.0, 68.0, 98.0, 112.0, 124.0, 118.0, 96.0, 110.0, 66.0, 46.0, 34.0, 14.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.434198379516602, -8.22624397277832, -8.018289566040039, -7.810335159301758, -7.602380752563477, -7.394426345825195, -7.186471939086914, -6.978517532348633, -6.770563125610352, -6.56260871887207, -6.354654312133789, -6.146699905395508, -5.938745498657227, -5.730791091918945, -5.522836685180664, -5.314882278442383, -5.106927871704102, -4.89897346496582, -4.691019058227539, -4.483064651489258, -4.275110244750977, -4.067155838012695, -3.859201431274414, -3.651247024536133, -3.4432926177978516, -3.2353382110595703, -3.027383804321289, -2.819429397583008, -2.6114749908447266, -2.4035205841064453, -2.195566177368164, -1.9876117706298828, -1.7796573638916016, -1.5717029571533203, -1.363748550415039, -1.1557941436767578, -0.9478397369384766, -0.7398853302001953, -0.5319309234619141, -0.3239765167236328, -0.11602210998535156, 0.09193229675292969, 0.29988670349121094, 0.5078411102294922, 0.7157955169677734, 0.9237499237060547, 1.131704330444336, 1.3396587371826172, 1.5476131439208984, 1.7555675506591797, 1.963521957397461, 2.171476364135742, 2.3794307708740234, 2.5873851776123047, 2.795339584350586, 3.003293991088867, 3.2112483978271484, 3.4192028045654297, 3.627157211303711, 3.835111618041992, 4.043066024780273, 4.251020431518555, 4.458974838256836, 4.666929244995117, 4.874883651733398]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 18.0, 26.0, 49.0, 91.0, 171.0, 412.0, 1472.0, 9789.0, 267981.0, 734818.0, 29902.0, 2654.0, 669.0, 243.0, 103.0, 52.0, 30.0, 25.0, 13.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.5302734375, -4.326171875, -4.1220703125, -3.91796875, -3.7138671875, -3.509765625, -3.3056640625, -3.1015625, -2.8974609375, -2.693359375, -2.4892578125, -2.28515625, -2.0810546875, -1.876953125, -1.6728515625, -1.46875, -1.2646484375, -1.060546875, -0.8564453125, -0.65234375, -0.4482421875, -0.244140625, -0.0400390625, 0.1640625, 0.3681640625, 0.572265625, 0.7763671875, 0.98046875, 1.1845703125, 1.388671875, 1.5927734375, 1.796875, 2.0009765625, 2.205078125, 2.4091796875, 2.61328125, 2.8173828125, 3.021484375, 3.2255859375, 3.4296875, 3.6337890625, 3.837890625, 4.0419921875, 4.24609375, 4.4501953125, 4.654296875, 4.8583984375, 5.0625, 5.2666015625, 5.470703125, 5.6748046875, 5.87890625, 6.0830078125, 6.287109375, 6.4912109375, 6.6953125, 6.8994140625, 7.103515625, 7.3076171875, 7.51171875, 7.7158203125, 7.919921875, 8.1240234375, 8.328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 17.0, 10.0, 16.0, 31.0, 30.0, 39.0, 31.0, 53.0, 64.0, 50.0, 60.0, 70.0, 68.0, 52.0, 56.0, 53.0, 57.0, 39.0, 39.0, 30.0, 19.0, 17.0, 18.0, 12.0, 12.0, 0.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.372314453125, -0.36093902587890625, -0.3495635986328125, -0.33818817138671875, -0.326812744140625, -0.31543731689453125, -0.3040618896484375, -0.29268646240234375, -0.28131103515625, -0.26993560791015625, -0.2585601806640625, -0.24718475341796875, -0.235809326171875, -0.22443389892578125, -0.2130584716796875, -0.20168304443359375, -0.1903076171875, -0.17893218994140625, -0.1675567626953125, -0.15618133544921875, -0.144805908203125, -0.13343048095703125, -0.1220550537109375, -0.11067962646484375, -0.09930419921875, -0.08792877197265625, -0.0765533447265625, -0.06517791748046875, -0.053802490234375, -0.04242706298828125, -0.0310516357421875, -0.01967620849609375, -0.00830078125, 0.00307464599609375, 0.0144500732421875, 0.02582550048828125, 0.037200927734375, 0.04857635498046875, 0.0599517822265625, 0.07132720947265625, 0.08270263671875, 0.09407806396484375, 0.1054534912109375, 0.11682891845703125, 0.128204345703125, 0.13957977294921875, 0.1509552001953125, 0.16233062744140625, 0.1737060546875, 0.18508148193359375, 0.1964569091796875, 0.20783233642578125, 0.219207763671875, 0.23058319091796875, 0.2419586181640625, 0.25333404541015625, 0.26470947265625, 0.27608489990234375, 0.2874603271484375, 0.29883575439453125, 0.310211181640625, 0.32158660888671875, 0.3329620361328125, 0.34433746337890625, 0.355712890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 18.0, 27.0, 25.0, 33.0, 50.0, 76.0, 109.0, 126.0, 212.0, 295.0, 451.0, 724.0, 1302.0, 2612.0, 5857.0, 16768.0, 62589.0, 240845.0, 440559.0, 200452.0, 50634.0, 14204.0, 4969.0, 2334.0, 1216.0, 672.0, 421.0, 266.0, 217.0, 110.0, 85.0, 74.0, 48.0, 52.0, 31.0, 20.0, 16.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.087890625, -2.02349853515625, -1.9591064453125, -1.89471435546875, -1.830322265625, -1.76593017578125, -1.7015380859375, -1.63714599609375, -1.57275390625, -1.50836181640625, -1.4439697265625, -1.37957763671875, -1.315185546875, -1.25079345703125, -1.1864013671875, -1.12200927734375, -1.0576171875, -0.99322509765625, -0.9288330078125, -0.86444091796875, -0.800048828125, -0.73565673828125, -0.6712646484375, -0.60687255859375, -0.54248046875, -0.47808837890625, -0.4136962890625, -0.34930419921875, -0.284912109375, -0.22052001953125, -0.1561279296875, -0.09173583984375, -0.02734375, 0.03704833984375, 0.1014404296875, 0.16583251953125, 0.230224609375, 0.29461669921875, 0.3590087890625, 0.42340087890625, 0.48779296875, 0.55218505859375, 0.6165771484375, 0.68096923828125, 0.745361328125, 0.80975341796875, 0.8741455078125, 0.93853759765625, 1.0029296875, 1.06732177734375, 1.1317138671875, 1.19610595703125, 1.260498046875, 1.32489013671875, 1.3892822265625, 1.45367431640625, 1.51806640625, 1.58245849609375, 1.6468505859375, 1.71124267578125, 1.775634765625, 1.84002685546875, 1.9044189453125, 1.96881103515625, 2.033203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 13.0, 5.0, 8.0, 14.0, 7.0, 19.0, 21.0, 30.0, 21.0, 22.0, 35.0, 35.0, 40.0, 48.0, 45.0, 64.0, 55.0, 54.0, 60.0, 53.0, 40.0, 44.0, 54.0, 35.0, 22.0, 30.0, 22.0, 19.0, 15.0, 22.0, 8.0, 11.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.9658203125, -1.914215087890625, -1.86260986328125, -1.811004638671875, -1.7593994140625, -1.707794189453125, -1.65618896484375, -1.604583740234375, -1.552978515625, -1.501373291015625, -1.44976806640625, -1.398162841796875, -1.3465576171875, -1.294952392578125, -1.24334716796875, -1.191741943359375, -1.14013671875, -1.088531494140625, -1.03692626953125, -0.985321044921875, -0.9337158203125, -0.882110595703125, -0.83050537109375, -0.778900146484375, -0.727294921875, -0.675689697265625, -0.62408447265625, -0.572479248046875, -0.5208740234375, -0.469268798828125, -0.41766357421875, -0.366058349609375, -0.314453125, -0.262847900390625, -0.21124267578125, -0.159637451171875, -0.1080322265625, -0.056427001953125, -0.00482177734375, 0.046783447265625, 0.098388671875, 0.149993896484375, 0.20159912109375, 0.253204345703125, 0.3048095703125, 0.356414794921875, 0.40802001953125, 0.459625244140625, 0.51123046875, 0.562835693359375, 0.61444091796875, 0.666046142578125, 0.7176513671875, 0.769256591796875, 0.82086181640625, 0.872467041015625, 0.924072265625, 0.975677490234375, 1.02728271484375, 1.078887939453125, 1.1304931640625, 1.182098388671875, 1.23370361328125, 1.285308837890625, 1.3369140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 7.0, 23.0, 36.0, 42.0, 63.0, 84.0, 169.0, 279.0, 459.0, 1057.0, 2330.0, 6425.0, 23757.0, 109620.0, 451595.0, 351656.0, 74982.0, 17107.0, 5041.0, 1870.0, 856.0, 452.0, 238.0, 132.0, 88.0, 55.0, 37.0, 30.0, 8.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.2896270751953125, -1.249176025390625, -1.2087249755859375, -1.16827392578125, -1.1278228759765625, -1.087371826171875, -1.0469207763671875, -1.0064697265625, -0.9660186767578125, -0.925567626953125, -0.8851165771484375, -0.84466552734375, -0.8042144775390625, -0.763763427734375, -0.7233123779296875, -0.682861328125, -0.6424102783203125, -0.601959228515625, -0.5615081787109375, -0.52105712890625, -0.4806060791015625, -0.440155029296875, -0.3997039794921875, -0.3592529296875, -0.3188018798828125, -0.278350830078125, -0.2378997802734375, -0.19744873046875, -0.1569976806640625, -0.116546630859375, -0.0760955810546875, -0.03564453125, 0.0048065185546875, 0.045257568359375, 0.0857086181640625, 0.12615966796875, 0.1666107177734375, 0.207061767578125, 0.2475128173828125, 0.2879638671875, 0.3284149169921875, 0.368865966796875, 0.4093170166015625, 0.44976806640625, 0.4902191162109375, 0.530670166015625, 0.5711212158203125, 0.611572265625, 0.6520233154296875, 0.692474365234375, 0.7329254150390625, 0.77337646484375, 0.8138275146484375, 0.854278564453125, 0.8947296142578125, 0.9351806640625, 0.9756317138671875, 1.016082763671875, 1.0565338134765625, 1.09698486328125, 1.1374359130859375, 1.177886962890625, 1.2183380126953125, 1.2587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 15.0, 9.0, 12.0, 16.0, 21.0, 34.0, 33.0, 46.0, 54.0, 75.0, 87.0, 106.0, 88.0, 74.0, 67.0, 47.0, 40.0, 45.0, 40.0, 21.0, 14.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00025582313537597656, -0.0002496875822544098, -0.00024355202913284302, -0.00023741647601127625, -0.00023128092288970947, -0.0002251453697681427, -0.00021900981664657593, -0.00021287426352500916, -0.00020673871040344238, -0.0002006031572818756, -0.00019446760416030884, -0.00018833205103874207, -0.0001821964979171753, -0.00017606094479560852, -0.00016992539167404175, -0.00016378983855247498, -0.0001576542854309082, -0.00015151873230934143, -0.00014538317918777466, -0.00013924762606620789, -0.0001331120729446411, -0.00012697651982307434, -0.00012084096670150757, -0.0001147054135799408, -0.00010856986045837402, -0.00010243430733680725, -9.629875421524048e-05, -9.01632010936737e-05, -8.402764797210693e-05, -7.789209485054016e-05, -7.175654172897339e-05, -6.562098860740662e-05, -5.9485435485839844e-05, -5.334988236427307e-05, -4.72143292427063e-05, -4.1078776121139526e-05, -3.4943222999572754e-05, -2.880766987800598e-05, -2.267211675643921e-05, -1.6536563634872437e-05, -1.0401010513305664e-05, -4.265457391738892e-06, 1.8700957298278809e-06, 8.005648851394653e-06, 1.4141201972961426e-05, 2.0276755094528198e-05, 2.641230821609497e-05, 3.254786133766174e-05, 3.8683414459228516e-05, 4.481896758079529e-05, 5.095452070236206e-05, 5.709007382392883e-05, 6.32256269454956e-05, 6.936118006706238e-05, 7.549673318862915e-05, 8.163228631019592e-05, 8.77678394317627e-05, 9.390339255332947e-05, 0.00010003894567489624, 0.00010617449879646301, 0.00011231005191802979, 0.00011844560503959656, 0.00012458115816116333, 0.0001307167112827301, 0.00013685226440429688]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 21.0, 23.0, 29.0, 51.0, 94.0, 140.0, 222.0, 347.0, 625.0, 1236.0, 2533.0, 6153.0, 18152.0, 68614.0, 294202.0, 466605.0, 138793.0, 33151.0, 10028.0, 3792.0, 1668.0, 852.0, 423.0, 293.0, 169.0, 92.0, 68.0, 49.0, 33.0, 13.0, 12.0, 13.0, 12.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.12109375, -1.085205078125, -1.04931640625, -1.013427734375, -0.9775390625, -0.941650390625, -0.90576171875, -0.869873046875, -0.833984375, -0.798095703125, -0.76220703125, -0.726318359375, -0.6904296875, -0.654541015625, -0.61865234375, -0.582763671875, -0.546875, -0.510986328125, -0.47509765625, -0.439208984375, -0.4033203125, -0.367431640625, -0.33154296875, -0.295654296875, -0.259765625, -0.223876953125, -0.18798828125, -0.152099609375, -0.1162109375, -0.080322265625, -0.04443359375, -0.008544921875, 0.02734375, 0.063232421875, 0.09912109375, 0.135009765625, 0.1708984375, 0.206787109375, 0.24267578125, 0.278564453125, 0.314453125, 0.350341796875, 0.38623046875, 0.422119140625, 0.4580078125, 0.493896484375, 0.52978515625, 0.565673828125, 0.6015625, 0.637451171875, 0.67333984375, 0.709228515625, 0.7451171875, 0.781005859375, 0.81689453125, 0.852783203125, 0.888671875, 0.924560546875, 0.96044921875, 0.996337890625, 1.0322265625, 1.068115234375, 1.10400390625, 1.139892578125, 1.17578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 6.0, 16.0, 14.0, 35.0, 35.0, 48.0, 47.0, 52.0, 74.0, 93.0, 97.0, 92.0, 83.0, 70.0, 50.0, 42.0, 25.0, 25.0, 24.0, 17.0, 11.0, 6.0, 5.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.9664154052734375, -0.934783935546875, -0.9031524658203125, -0.87152099609375, -0.8398895263671875, -0.808258056640625, -0.7766265869140625, -0.7449951171875, -0.7133636474609375, -0.681732177734375, -0.6501007080078125, -0.61846923828125, -0.5868377685546875, -0.555206298828125, -0.5235748291015625, -0.491943359375, -0.4603118896484375, -0.428680419921875, -0.3970489501953125, -0.36541748046875, -0.3337860107421875, -0.302154541015625, -0.2705230712890625, -0.2388916015625, -0.2072601318359375, -0.175628662109375, -0.1439971923828125, -0.11236572265625, -0.0807342529296875, -0.049102783203125, -0.0174713134765625, 0.01416015625, 0.0457916259765625, 0.077423095703125, 0.1090545654296875, 0.14068603515625, 0.1723175048828125, 0.203948974609375, 0.2355804443359375, 0.2672119140625, 0.2988433837890625, 0.330474853515625, 0.3621063232421875, 0.39373779296875, 0.4253692626953125, 0.457000732421875, 0.4886322021484375, 0.520263671875, 0.5518951416015625, 0.583526611328125, 0.6151580810546875, 0.64678955078125, 0.6784210205078125, 0.710052490234375, 0.7416839599609375, 0.7733154296875, 0.8049468994140625, 0.836578369140625, 0.8682098388671875, 0.89984130859375, 0.9314727783203125, 0.963104248046875, 0.9947357177734375, 1.0263671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 25.0, 27.0, 60.0, 108.0, 137.0, 176.0, 148.0, 102.0, 93.0, 45.0, 27.0, 21.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.19582748413086, -17.657377243041992, -17.118927001953125, -16.580474853515625, -16.042024612426758, -15.50357437133789, -14.965124130249023, -14.426673889160156, -13.888222694396973, -13.349772453308105, -12.811321258544922, -12.272871017456055, -11.734420776367188, -11.195969581604004, -10.657519340515137, -10.119068145751953, -9.580617904663086, -9.042167663574219, -8.503716468811035, -7.965266227722168, -7.426815509796143, -6.888364791870117, -6.34991455078125, -5.811463832855225, -5.273013114929199, -4.734562397003174, -4.196111679077148, -3.6576614379882812, -3.119210720062256, -2.5807600021362305, -2.042309522628784, -1.503859043121338, -0.9654083251953125, -0.42695772647857666, 0.11149287223815918, 0.649943470954895, 1.1883940696716309, 1.7268447875976562, 2.2652952671051025, 2.803745746612549, 3.342196464538574, 3.8806471824645996, 4.419097900390625, 4.957548141479492, 5.495998859405518, 6.034449577331543, 6.57289981842041, 7.1113505363464355, 7.649801254272461, 8.188251495361328, 8.726702690124512, 9.265152931213379, 9.803604125976562, 10.34205436706543, 10.880504608154297, 11.418954849243164, 11.957406044006348, 12.495856285095215, 13.034307479858398, 13.572757720947266, 14.111207962036133, 14.649659156799316, 15.188109397888184, 15.726560592651367, 16.265010833740234]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 1.0, 7.0, 6.0, 9.0, 20.0, 20.0, 27.0, 21.0, 28.0, 29.0, 18.0, 38.0, 34.0, 40.0, 45.0, 38.0, 45.0, 53.0, 50.0, 46.0, 53.0, 49.0, 43.0, 43.0, 33.0, 35.0, 26.0, 15.0, 23.0, 15.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.792655944824219, -8.506147384643555, -8.219637870788574, -7.93312931060791, -7.646620750427246, -7.360111713409424, -7.073602676391602, -6.7870941162109375, -6.500585556030273, -6.214076519012451, -5.927567958831787, -5.641058921813965, -5.354550361633301, -5.0680413246154785, -4.781532287597656, -4.495023727416992, -4.20851469039917, -3.9220058917999268, -3.6354970932006836, -3.3489880561828613, -3.0624794960021973, -2.775970458984375, -2.489461660385132, -2.2029528617858887, -1.9164440631866455, -1.6299352645874023, -1.3434264659881592, -1.0569175481796265, -0.7704087495803833, -0.48389995098114014, -0.19739103317260742, 0.08911776542663574, 0.3756265640258789, 0.6621353626251221, 0.94864422082901, 1.235153079032898, 1.5216618776321411, 1.8081706762313843, 2.094679594039917, 2.38118839263916, 2.6676971912384033, 2.9542059898376465, 3.2407147884368896, 3.527223587036133, 3.813732624053955, 4.100241184234619, 4.386750221252441, 4.6732587814331055, 4.959767818450928, 5.24627685546875, 5.532785415649414, 5.819294452667236, 6.1058030128479, 6.392312049865723, 6.678820610046387, 6.965329647064209, 7.251838684082031, 7.5383477210998535, 7.824856281280518, 8.11136531829834, 8.397873878479004, 8.684382438659668, 8.970891952514648, 9.257400512695312, 9.543909072875977]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 5.0, 8.0, 12.0, 10.0, 24.0, 29.0, 48.0, 53.0, 77.0, 119.0, 169.0, 274.0, 521.0, 1055.0, 2608.0, 7992.0, 35873.0, 350709.0, 3607440.0, 154926.0, 22482.0, 6071.0, 2073.0, 849.0, 400.0, 189.0, 96.0, 54.0, 29.0, 18.0, 18.0, 7.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.261688232421875, -4.14447021484375, -4.027252197265625, -3.9100341796875, -3.792816162109375, -3.67559814453125, -3.558380126953125, -3.441162109375, -3.323944091796875, -3.20672607421875, -3.089508056640625, -2.9722900390625, -2.855072021484375, -2.73785400390625, -2.620635986328125, -2.50341796875, -2.386199951171875, -2.26898193359375, -2.151763916015625, -2.0345458984375, -1.917327880859375, -1.80010986328125, -1.682891845703125, -1.565673828125, -1.448455810546875, -1.33123779296875, -1.214019775390625, -1.0968017578125, -0.979583740234375, -0.86236572265625, -0.745147705078125, -0.6279296875, -0.510711669921875, -0.39349365234375, -0.276275634765625, -0.1590576171875, -0.041839599609375, 0.07537841796875, 0.192596435546875, 0.309814453125, 0.427032470703125, 0.54425048828125, 0.661468505859375, 0.7786865234375, 0.895904541015625, 1.01312255859375, 1.130340576171875, 1.24755859375, 1.364776611328125, 1.48199462890625, 1.599212646484375, 1.7164306640625, 1.833648681640625, 1.95086669921875, 2.068084716796875, 2.185302734375, 2.302520751953125, 2.41973876953125, 2.536956787109375, 2.6541748046875, 2.771392822265625, 2.88861083984375, 3.005828857421875, 3.123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 9.0, 11.0, 8.0, 10.0, 15.0, 21.0, 22.0, 38.0, 37.0, 40.0, 44.0, 55.0, 59.0, 52.0, 63.0, 59.0, 63.0, 59.0, 62.0, 42.0, 35.0, 41.0, 26.0, 38.0, 27.0, 20.0, 12.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396728515625, -0.3847236633300781, -0.37271881103515625, -0.3607139587402344, -0.3487091064453125, -0.3367042541503906, -0.32469940185546875, -0.3126945495605469, -0.300689697265625, -0.2886848449707031, -0.27667999267578125, -0.2646751403808594, -0.2526702880859375, -0.24066543579101562, -0.22866058349609375, -0.21665573120117188, -0.20465087890625, -0.19264602661132812, -0.18064117431640625, -0.16863632202148438, -0.1566314697265625, -0.14462661743164062, -0.13262176513671875, -0.12061691284179688, -0.108612060546875, -0.09660720825195312, -0.08460235595703125, -0.07259750366210938, -0.0605926513671875, -0.048587799072265625, -0.03658294677734375, -0.024578094482421875, -0.0125732421875, -0.000568389892578125, 0.01143646240234375, 0.023441314697265625, 0.0354461669921875, 0.047451019287109375, 0.05945587158203125, 0.07146072387695312, 0.083465576171875, 0.09547042846679688, 0.10747528076171875, 0.11948013305664062, 0.1314849853515625, 0.14348983764648438, 0.15549468994140625, 0.16749954223632812, 0.17950439453125, 0.19150924682617188, 0.20351409912109375, 0.21551895141601562, 0.2275238037109375, 0.23952865600585938, 0.25153350830078125, 0.2635383605957031, 0.275543212890625, 0.2875480651855469, 0.29955291748046875, 0.3115577697753906, 0.3235626220703125, 0.3355674743652344, 0.34757232666015625, 0.3595771789550781, 0.37158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 11.0, 9.0, 16.0, 25.0, 30.0, 50.0, 55.0, 76.0, 132.0, 204.0, 331.0, 672.0, 1892.0, 8303.0, 325949.0, 3835483.0, 16371.0, 2611.0, 849.0, 406.0, 239.0, 142.0, 132.0, 84.0, 50.0, 55.0, 29.0, 20.0, 10.0, 16.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.899658203125, -10.58056640625, -10.261474609375, -9.9423828125, -9.623291015625, -9.30419921875, -8.985107421875, -8.666015625, -8.346923828125, -8.02783203125, -7.708740234375, -7.3896484375, -7.070556640625, -6.75146484375, -6.432373046875, -6.11328125, -5.794189453125, -5.47509765625, -5.156005859375, -4.8369140625, -4.517822265625, -4.19873046875, -3.879638671875, -3.560546875, -3.241455078125, -2.92236328125, -2.603271484375, -2.2841796875, -1.965087890625, -1.64599609375, -1.326904296875, -1.0078125, -0.688720703125, -0.36962890625, -0.050537109375, 0.2685546875, 0.587646484375, 0.90673828125, 1.225830078125, 1.544921875, 1.864013671875, 2.18310546875, 2.502197265625, 2.8212890625, 3.140380859375, 3.45947265625, 3.778564453125, 4.09765625, 4.416748046875, 4.73583984375, 5.054931640625, 5.3740234375, 5.693115234375, 6.01220703125, 6.331298828125, 6.650390625, 6.969482421875, 7.28857421875, 7.607666015625, 7.9267578125, 8.245849609375, 8.56494140625, 8.884033203125, 9.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 24.0, 32.0, 108.0, 486.0, 2227.0, 881.0, 194.0, 49.0, 20.0, 13.0, 12.0, 7.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6005859375, -1.5149383544921875, -1.429290771484375, -1.3436431884765625, -1.25799560546875, -1.1723480224609375, -1.086700439453125, -1.0010528564453125, -0.9154052734375, -0.8297576904296875, -0.744110107421875, -0.6584625244140625, -0.57281494140625, -0.4871673583984375, -0.401519775390625, -0.3158721923828125, -0.230224609375, -0.1445770263671875, -0.058929443359375, 0.0267181396484375, 0.11236572265625, 0.1980133056640625, 0.283660888671875, 0.3693084716796875, 0.4549560546875, 0.5406036376953125, 0.626251220703125, 0.7118988037109375, 0.79754638671875, 0.8831939697265625, 0.968841552734375, 1.0544891357421875, 1.14013671875, 1.2257843017578125, 1.311431884765625, 1.3970794677734375, 1.48272705078125, 1.5683746337890625, 1.654022216796875, 1.7396697998046875, 1.8253173828125, 1.9109649658203125, 1.996612548828125, 2.0822601318359375, 2.16790771484375, 2.2535552978515625, 2.339202880859375, 2.4248504638671875, 2.510498046875, 2.5961456298828125, 2.681793212890625, 2.7674407958984375, 2.85308837890625, 2.9387359619140625, 3.024383544921875, 3.1100311279296875, 3.1956787109375, 3.2813262939453125, 3.366973876953125, 3.4526214599609375, 3.53826904296875, 3.6239166259765625, 3.709564208984375, 3.7952117919921875, 3.880859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 11.0, 32.0, 101.0, 272.0, 309.0, 171.0, 62.0, 21.0, 9.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.170495986938477, -28.445274353027344, -27.72005271911621, -26.994831085205078, -26.269609451293945, -25.544387817382812, -24.81916618347168, -24.093944549560547, -23.368722915649414, -22.64350128173828, -21.91827964782715, -21.193058013916016, -20.467836380004883, -19.74261474609375, -19.017393112182617, -18.292171478271484, -17.56694984436035, -16.84172821044922, -16.116506576538086, -15.391284942626953, -14.66606330871582, -13.940841674804688, -13.215620040893555, -12.490398406982422, -11.765176773071289, -11.039955139160156, -10.314733505249023, -9.58951187133789, -8.864290237426758, -8.139068603515625, -7.413846969604492, -6.688625335693359, -5.963405609130859, -5.238183975219727, -4.512962341308594, -3.787740707397461, -3.062519073486328, -2.3372974395751953, -1.6120758056640625, -0.8868541717529297, -0.16163253784179688, 0.5635890960693359, 1.2888107299804688, 2.0140323638916016, 2.7392539978027344, 3.464475631713867, 4.189697265625, 4.914918899536133, 5.640140533447266, 6.365362167358398, 7.090583801269531, 7.815805435180664, 8.541027069091797, 9.26624870300293, 9.991470336914062, 10.716691970825195, 11.441913604736328, 12.167135238647461, 12.892356872558594, 13.617578506469727, 14.34280014038086, 15.068021774291992, 15.793243408203125, 16.518465042114258, 17.24368667602539]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 4.0, 11.0, 14.0, 10.0, 18.0, 38.0, 31.0, 26.0, 38.0, 70.0, 58.0, 67.0, 77.0, 65.0, 61.0, 60.0, 49.0, 44.0, 49.0, 34.0, 37.0, 19.0, 29.0, 20.0, 11.0, 19.0, 5.0, 6.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.304987907409668, -6.130555152893066, -5.956122398376465, -5.781689643859863, -5.607256889343262, -5.43282413482666, -5.258391380310059, -5.083958625793457, -4.9095258712768555, -4.735093116760254, -4.560660362243652, -4.386227607727051, -4.211794853210449, -4.037362098693848, -3.862929105758667, -3.6884963512420654, -3.5140633583068848, -3.339630603790283, -3.1651978492736816, -2.99076509475708, -2.8163323402404785, -2.641899585723877, -2.4674665927886963, -2.2930338382720947, -2.118601083755493, -1.9441683292388916, -1.76973557472229, -1.595302700996399, -1.4208699464797974, -1.2464371919631958, -1.0720043182373047, -0.8975715637207031, -0.7231383323669434, -0.5487055778503418, -0.37427276372909546, -0.19983994960784912, -0.02540719509124756, 0.149025559425354, 0.3234584331512451, 0.4978911876678467, 0.6723239421844482, 0.8467566967010498, 1.0211894512176514, 1.1956223249435425, 1.370055079460144, 1.5444878339767456, 1.7189207077026367, 1.8933534622192383, 2.06778621673584, 2.2422189712524414, 2.416651725769043, 2.5910844802856445, 2.765517234802246, 2.9399499893188477, 3.1143829822540283, 3.28881573677063, 3.4632484912872314, 3.637681245803833, 3.8121140003204346, 3.9865469932556152, 4.160979747772217, 4.335412502288818, 4.50984525680542, 4.6842780113220215, 4.858710765838623]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 10.0, 4.0, 17.0, 19.0, 27.0, 34.0, 60.0, 67.0, 89.0, 170.0, 306.0, 488.0, 885.0, 1800.0, 4098.0, 11437.0, 41076.0, 169566.0, 478468.0, 252309.0, 61066.0, 16148.0, 5419.0, 2297.0, 1100.0, 582.0, 341.0, 219.0, 143.0, 84.0, 72.0, 40.0, 33.0, 16.0, 19.0, 11.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.553436279296875, -2.46429443359375, -2.375152587890625, -2.2860107421875, -2.196868896484375, -2.10772705078125, -2.018585205078125, -1.929443359375, -1.840301513671875, -1.75115966796875, -1.662017822265625, -1.5728759765625, -1.483734130859375, -1.39459228515625, -1.305450439453125, -1.21630859375, -1.127166748046875, -1.03802490234375, -0.948883056640625, -0.8597412109375, -0.770599365234375, -0.68145751953125, -0.592315673828125, -0.503173828125, -0.414031982421875, -0.32489013671875, -0.235748291015625, -0.1466064453125, -0.057464599609375, 0.03167724609375, 0.120819091796875, 0.2099609375, 0.299102783203125, 0.38824462890625, 0.477386474609375, 0.5665283203125, 0.655670166015625, 0.74481201171875, 0.833953857421875, 0.923095703125, 1.012237548828125, 1.10137939453125, 1.190521240234375, 1.2796630859375, 1.368804931640625, 1.45794677734375, 1.547088623046875, 1.63623046875, 1.725372314453125, 1.81451416015625, 1.903656005859375, 1.9927978515625, 2.081939697265625, 2.17108154296875, 2.260223388671875, 2.349365234375, 2.438507080078125, 2.52764892578125, 2.616790771484375, 2.7059326171875, 2.795074462890625, 2.88421630859375, 2.973358154296875, 3.0625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 15.0, 24.0, 24.0, 40.0, 39.0, 54.0, 56.0, 62.0, 70.0, 75.0, 70.0, 67.0, 68.0, 60.0, 58.0, 50.0, 42.0, 32.0, 16.0, 19.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49755859375, -0.4821281433105469, -0.46669769287109375, -0.4512672424316406, -0.4358367919921875, -0.4204063415527344, -0.40497589111328125, -0.3895454406738281, -0.374114990234375, -0.3586845397949219, -0.34325408935546875, -0.3278236389160156, -0.3123931884765625, -0.2969627380371094, -0.28153228759765625, -0.2661018371582031, -0.25067138671875, -0.23524093627929688, -0.21981048583984375, -0.20438003540039062, -0.1889495849609375, -0.17351913452148438, -0.15808868408203125, -0.14265823364257812, -0.127227783203125, -0.11179733276367188, -0.09636688232421875, -0.08093643188476562, -0.0655059814453125, -0.050075531005859375, -0.03464508056640625, -0.019214630126953125, -0.0037841796875, 0.011646270751953125, 0.02707672119140625, 0.042507171630859375, 0.0579376220703125, 0.07336807250976562, 0.08879852294921875, 0.10422897338867188, 0.119659423828125, 0.13508987426757812, 0.15052032470703125, 0.16595077514648438, 0.1813812255859375, 0.19681167602539062, 0.21224212646484375, 0.22767257690429688, 0.24310302734375, 0.2585334777832031, 0.27396392822265625, 0.2893943786621094, 0.3048248291015625, 0.3202552795410156, 0.33568572998046875, 0.3511161804199219, 0.366546630859375, 0.3819770812988281, 0.39740753173828125, 0.4128379821777344, 0.4282684326171875, 0.4436988830566406, 0.45912933349609375, 0.4745597839355469, 0.489990234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 22.0, 14.0, 32.0, 45.0, 55.0, 95.0, 127.0, 210.0, 345.0, 481.0, 922.0, 1856.0, 4280.0, 11506.0, 38635.0, 135895.0, 369441.0, 326233.0, 109876.0, 31288.0, 9632.0, 3754.0, 1607.0, 871.0, 419.0, 289.0, 201.0, 134.0, 89.0, 49.0, 52.0, 19.0, 23.0, 16.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.549835205078125, -1.49224853515625, -1.434661865234375, -1.3770751953125, -1.319488525390625, -1.26190185546875, -1.204315185546875, -1.146728515625, -1.089141845703125, -1.03155517578125, -0.973968505859375, -0.9163818359375, -0.858795166015625, -0.80120849609375, -0.743621826171875, -0.68603515625, -0.628448486328125, -0.57086181640625, -0.513275146484375, -0.4556884765625, -0.398101806640625, -0.34051513671875, -0.282928466796875, -0.225341796875, -0.167755126953125, -0.11016845703125, -0.052581787109375, 0.0050048828125, 0.062591552734375, 0.12017822265625, 0.177764892578125, 0.2353515625, 0.292938232421875, 0.35052490234375, 0.408111572265625, 0.4656982421875, 0.523284912109375, 0.58087158203125, 0.638458251953125, 0.696044921875, 0.753631591796875, 0.81121826171875, 0.868804931640625, 0.9263916015625, 0.983978271484375, 1.04156494140625, 1.099151611328125, 1.15673828125, 1.214324951171875, 1.27191162109375, 1.329498291015625, 1.3870849609375, 1.444671630859375, 1.50225830078125, 1.559844970703125, 1.617431640625, 1.675018310546875, 1.73260498046875, 1.790191650390625, 1.8477783203125, 1.905364990234375, 1.96295166015625, 2.020538330078125, 2.078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 2.0, 6.0, 11.0, 14.0, 9.0, 17.0, 28.0, 23.0, 24.0, 36.0, 38.0, 40.0, 32.0, 41.0, 42.0, 56.0, 48.0, 42.0, 61.0, 52.0, 42.0, 42.0, 41.0, 36.0, 29.0, 37.0, 30.0, 19.0, 20.0, 16.0, 17.0, 14.0, 10.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.88671875, -1.8379058837890625, -1.789093017578125, -1.7402801513671875, -1.69146728515625, -1.6426544189453125, -1.593841552734375, -1.5450286865234375, -1.4962158203125, -1.4474029541015625, -1.398590087890625, -1.3497772216796875, -1.30096435546875, -1.2521514892578125, -1.203338623046875, -1.1545257568359375, -1.105712890625, -1.0569000244140625, -1.008087158203125, -0.9592742919921875, -0.91046142578125, -0.8616485595703125, -0.812835693359375, -0.7640228271484375, -0.7152099609375, -0.6663970947265625, -0.617584228515625, -0.5687713623046875, -0.51995849609375, -0.4711456298828125, -0.422332763671875, -0.3735198974609375, -0.32470703125, -0.2758941650390625, -0.227081298828125, -0.1782684326171875, -0.12945556640625, -0.0806427001953125, -0.031829833984375, 0.0169830322265625, 0.0657958984375, 0.1146087646484375, 0.163421630859375, 0.2122344970703125, 0.26104736328125, 0.3098602294921875, 0.358673095703125, 0.4074859619140625, 0.456298828125, 0.5051116943359375, 0.553924560546875, 0.6027374267578125, 0.65155029296875, 0.7003631591796875, 0.749176025390625, 0.7979888916015625, 0.8468017578125, 0.8956146240234375, 0.944427490234375, 0.9932403564453125, 1.04205322265625, 1.0908660888671875, 1.139678955078125, 1.1884918212890625, 1.2373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 2.0, 8.0, 10.0, 11.0, 15.0, 32.0, 49.0, 73.0, 135.0, 201.0, 449.0, 920.0, 2404.0, 7916.0, 45350.0, 729111.0, 236670.0, 17795.0, 4504.0, 1520.0, 643.0, 312.0, 149.0, 89.0, 56.0, 29.0, 18.0, 20.0, 15.0, 5.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.857421875, -2.761444091796875, -2.66546630859375, -2.569488525390625, -2.4735107421875, -2.377532958984375, -2.28155517578125, -2.185577392578125, -2.089599609375, -1.993621826171875, -1.89764404296875, -1.801666259765625, -1.7056884765625, -1.609710693359375, -1.51373291015625, -1.417755126953125, -1.32177734375, -1.225799560546875, -1.12982177734375, -1.033843994140625, -0.9378662109375, -0.841888427734375, -0.74591064453125, -0.649932861328125, -0.553955078125, -0.457977294921875, -0.36199951171875, -0.266021728515625, -0.1700439453125, -0.074066162109375, 0.02191162109375, 0.117889404296875, 0.2138671875, 0.309844970703125, 0.40582275390625, 0.501800537109375, 0.5977783203125, 0.693756103515625, 0.78973388671875, 0.885711669921875, 0.981689453125, 1.077667236328125, 1.17364501953125, 1.269622802734375, 1.3656005859375, 1.461578369140625, 1.55755615234375, 1.653533935546875, 1.74951171875, 1.845489501953125, 1.94146728515625, 2.037445068359375, 2.1334228515625, 2.229400634765625, 2.32537841796875, 2.421356201171875, 2.517333984375, 2.613311767578125, 2.70928955078125, 2.805267333984375, 2.9012451171875, 2.997222900390625, 3.09320068359375, 3.189178466796875, 3.28515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 18.0, 20.0, 26.0, 34.0, 41.0, 56.0, 62.0, 80.0, 83.0, 106.0, 87.0, 61.0, 63.0, 34.0, 29.0, 29.0, 34.0, 20.0, 15.0, 15.0, 8.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015825405716896057, -0.00015319138765335083, -0.0001481287181377411, -0.00014306604862213135, -0.0001380033791065216, -0.00013294070959091187, -0.00012787804007530212, -0.00012281537055969238, -0.00011775270104408264, -0.0001126900315284729, -0.00010762736201286316, -0.00010256469249725342, -9.750202298164368e-05, -9.243935346603394e-05, -8.73766839504242e-05, -8.231401443481445e-05, -7.725134491920471e-05, -7.218867540359497e-05, -6.712600588798523e-05, -6.206333637237549e-05, -5.700066685676575e-05, -5.1937997341156006e-05, -4.6875327825546265e-05, -4.1812658309936523e-05, -3.674998879432678e-05, -3.168731927871704e-05, -2.66246497631073e-05, -2.156198024749756e-05, -1.6499310731887817e-05, -1.1436641216278076e-05, -6.373971700668335e-06, -1.3113021850585938e-06, 3.7513673305511475e-06, 8.814036846160889e-06, 1.387670636177063e-05, 1.893937587738037e-05, 2.4002045392990112e-05, 2.9064714908599854e-05, 3.4127384424209595e-05, 3.9190053939819336e-05, 4.425272345542908e-05, 4.931539297103882e-05, 5.437806248664856e-05, 5.94407320022583e-05, 6.450340151786804e-05, 6.956607103347778e-05, 7.462874054908752e-05, 7.969141006469727e-05, 8.475407958030701e-05, 8.981674909591675e-05, 9.487941861152649e-05, 9.994208812713623e-05, 0.00010500475764274597, 0.00011006742715835571, 0.00011513009667396545, 0.0001201927661895752, 0.00012525543570518494, 0.00013031810522079468, 0.00013538077473640442, 0.00014044344425201416, 0.0001455061137676239, 0.00015056878328323364, 0.00015563145279884338, 0.00016069412231445312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 10.0, 20.0, 21.0, 37.0, 58.0, 89.0, 131.0, 226.0, 350.0, 670.0, 1182.0, 2261.0, 4989.0, 16840.0, 255302.0, 713861.0, 38289.0, 7497.0, 3127.0, 1513.0, 760.0, 494.0, 280.0, 186.0, 101.0, 64.0, 54.0, 34.0, 22.0, 12.0, 9.0, 8.0, 5.0, 1.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.500274658203125, -2.40484619140625, -2.309417724609375, -2.2139892578125, -2.118560791015625, -2.02313232421875, -1.927703857421875, -1.832275390625, -1.736846923828125, -1.64141845703125, -1.545989990234375, -1.4505615234375, -1.355133056640625, -1.25970458984375, -1.164276123046875, -1.06884765625, -0.973419189453125, -0.87799072265625, -0.782562255859375, -0.6871337890625, -0.591705322265625, -0.49627685546875, -0.400848388671875, -0.305419921875, -0.209991455078125, -0.11456298828125, -0.019134521484375, 0.0762939453125, 0.171722412109375, 0.26715087890625, 0.362579345703125, 0.4580078125, 0.553436279296875, 0.64886474609375, 0.744293212890625, 0.8397216796875, 0.935150146484375, 1.03057861328125, 1.126007080078125, 1.221435546875, 1.316864013671875, 1.41229248046875, 1.507720947265625, 1.6031494140625, 1.698577880859375, 1.79400634765625, 1.889434814453125, 1.98486328125, 2.080291748046875, 2.17572021484375, 2.271148681640625, 2.3665771484375, 2.462005615234375, 2.55743408203125, 2.652862548828125, 2.748291015625, 2.843719482421875, 2.93914794921875, 3.034576416015625, 3.1300048828125, 3.225433349609375, 3.32086181640625, 3.416290283203125, 3.51171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 9.0, 15.0, 51.0, 137.0, 267.0, 247.0, 134.0, 61.0, 24.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.341094970703125, -3.24273681640625, -3.144378662109375, -3.0460205078125, -2.947662353515625, -2.84930419921875, -2.750946044921875, -2.652587890625, -2.554229736328125, -2.45587158203125, -2.357513427734375, -2.2591552734375, -2.160797119140625, -2.06243896484375, -1.964080810546875, -1.86572265625, -1.767364501953125, -1.66900634765625, -1.570648193359375, -1.4722900390625, -1.373931884765625, -1.27557373046875, -1.177215576171875, -1.078857421875, -0.980499267578125, -0.88214111328125, -0.783782958984375, -0.6854248046875, -0.587066650390625, -0.48870849609375, -0.390350341796875, -0.2919921875, -0.193634033203125, -0.09527587890625, 0.003082275390625, 0.1014404296875, 0.199798583984375, 0.29815673828125, 0.396514892578125, 0.494873046875, 0.593231201171875, 0.69158935546875, 0.789947509765625, 0.8883056640625, 0.986663818359375, 1.08502197265625, 1.183380126953125, 1.28173828125, 1.380096435546875, 1.47845458984375, 1.576812744140625, 1.6751708984375, 1.773529052734375, 1.87188720703125, 1.970245361328125, 2.068603515625, 2.166961669921875, 2.26531982421875, 2.363677978515625, 2.4620361328125, 2.560394287109375, 2.65875244140625, 2.757110595703125, 2.85546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 12.0, 15.0, 17.0, 23.0, 49.0, 78.0, 127.0, 157.0, 167.0, 135.0, 93.0, 57.0, 28.0, 15.0, 9.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.375171661376953, -18.81422233581543, -18.253273010253906, -17.692323684692383, -17.13137435913086, -16.570425033569336, -16.009475708007812, -15.448526382446289, -14.887577056884766, -14.326627731323242, -13.765678405761719, -13.204729080200195, -12.643779754638672, -12.082830429077148, -11.521881103515625, -10.960931777954102, -10.399982452392578, -9.839033126831055, -9.278083801269531, -8.717134475708008, -8.156185150146484, -7.595235824584961, -7.0342864990234375, -6.473337173461914, -5.912387847900391, -5.351438522338867, -4.790489196777344, -4.22953987121582, -3.668590545654297, -3.1076412200927734, -2.54669189453125, -1.9857425689697266, -1.4247913360595703, -0.8638420104980469, -0.30289268493652344, 0.258056640625, 0.8190059661865234, 1.3799552917480469, 1.9409046173095703, 2.5018539428710938, 3.062803268432617, 3.6237525939941406, 4.184701919555664, 4.7456512451171875, 5.306600570678711, 5.867549896240234, 6.428499221801758, 6.989448547363281, 7.550397872924805, 8.111347198486328, 8.672296524047852, 9.233245849609375, 9.794195175170898, 10.355144500732422, 10.916093826293945, 11.477043151855469, 12.037992477416992, 12.598941802978516, 13.159891128540039, 13.720840454101562, 14.281789779663086, 14.84273910522461, 15.403688430786133, 15.964637756347656, 16.52558708190918]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 9.0, 17.0, 30.0, 21.0, 27.0, 26.0, 42.0, 47.0, 68.0, 45.0, 52.0, 54.0, 59.0, 56.0, 53.0, 57.0, 39.0, 55.0, 34.0, 43.0, 32.0, 19.0, 19.0, 14.0, 12.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.465709686279297, -9.090006828308105, -8.714303970336914, -8.338601112365723, -7.962898254394531, -7.58719539642334, -7.211493015289307, -6.835790157318115, -6.460087299346924, -6.084384441375732, -5.708681583404541, -5.332979202270508, -4.957276344299316, -4.581573486328125, -4.205870628356934, -3.830167770385742, -3.454464912414551, -3.0787620544433594, -2.703059196472168, -2.3273565769195557, -1.9516537189483643, -1.5759508609771729, -1.2002482414245605, -0.8245453834533691, -0.44884252548217773, -0.0731397271156311, 0.3025630712509155, 0.6782658100128174, 1.0539686679840088, 1.4296715259552002, 1.8053741455078125, 2.181077003479004, 2.556778907775879, 2.9324817657470703, 3.3081846237182617, 3.683887243270874, 4.0595903396606445, 4.435293197631836, 4.810995578765869, 5.1866984367370605, 5.562401294708252, 5.938104152679443, 6.313807010650635, 6.689509391784668, 7.065212249755859, 7.440915107727051, 7.816617965698242, 8.192320823669434, 8.568023681640625, 8.943726539611816, 9.319429397583008, 9.6951322555542, 10.07083511352539, 10.446537971496582, 10.822240829467773, 11.197942733764648, 11.573646545410156, 11.949349403381348, 12.325052261352539, 12.70075511932373, 13.076457977294922, 13.452160835266113, 13.827863693237305, 14.20356559753418, 14.579268455505371]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 16.0, 35.0, 65.0, 88.0, 183.0, 338.0, 772.0, 2481.0, 14309.0, 988862.0, 3164369.0, 17926.0, 3165.0, 911.0, 356.0, 179.0, 85.0, 41.0, 32.0, 12.0, 15.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6796875, -7.46051025390625, -7.2413330078125, -7.02215576171875, -6.802978515625, -6.58380126953125, -6.3646240234375, -6.14544677734375, -5.92626953125, -5.70709228515625, -5.4879150390625, -5.26873779296875, -5.049560546875, -4.83038330078125, -4.6112060546875, -4.39202880859375, -4.1728515625, -3.95367431640625, -3.7344970703125, -3.51531982421875, -3.296142578125, -3.07696533203125, -2.8577880859375, -2.63861083984375, -2.41943359375, -2.20025634765625, -1.9810791015625, -1.76190185546875, -1.542724609375, -1.32354736328125, -1.1043701171875, -0.88519287109375, -0.666015625, -0.44683837890625, -0.2276611328125, -0.00848388671875, 0.210693359375, 0.42987060546875, 0.6490478515625, 0.86822509765625, 1.08740234375, 1.30657958984375, 1.5257568359375, 1.74493408203125, 1.964111328125, 2.18328857421875, 2.4024658203125, 2.62164306640625, 2.8408203125, 3.05999755859375, 3.2791748046875, 3.49835205078125, 3.717529296875, 3.93670654296875, 4.1558837890625, 4.37506103515625, 4.59423828125, 4.81341552734375, 5.0325927734375, 5.25177001953125, 5.470947265625, 5.69012451171875, 5.9093017578125, 6.12847900390625, 6.34765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 4.0, 8.0, 8.0, 13.0, 15.0, 9.0, 26.0, 30.0, 30.0, 44.0, 63.0, 51.0, 53.0, 53.0, 61.0, 71.0, 73.0, 54.0, 60.0, 37.0, 41.0, 44.0, 41.0, 22.0, 27.0, 8.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.484619140625, -0.47092437744140625, -0.4572296142578125, -0.44353485107421875, -0.429840087890625, -0.41614532470703125, -0.4024505615234375, -0.38875579833984375, -0.37506103515625, -0.36136627197265625, -0.3476715087890625, -0.33397674560546875, -0.320281982421875, -0.30658721923828125, -0.2928924560546875, -0.27919769287109375, -0.2655029296875, -0.25180816650390625, -0.2381134033203125, -0.22441864013671875, -0.210723876953125, -0.19702911376953125, -0.1833343505859375, -0.16963958740234375, -0.15594482421875, -0.14225006103515625, -0.1285552978515625, -0.11486053466796875, -0.101165771484375, -0.08747100830078125, -0.0737762451171875, -0.06008148193359375, -0.04638671875, -0.03269195556640625, -0.0189971923828125, -0.00530242919921875, 0.008392333984375, 0.02208709716796875, 0.0357818603515625, 0.04947662353515625, 0.06317138671875, 0.07686614990234375, 0.0905609130859375, 0.10425567626953125, 0.117950439453125, 0.13164520263671875, 0.1453399658203125, 0.15903472900390625, 0.1727294921875, 0.18642425537109375, 0.2001190185546875, 0.21381378173828125, 0.227508544921875, 0.24120330810546875, 0.2548980712890625, 0.26859283447265625, 0.28228759765625, 0.29598236083984375, 0.3096771240234375, 0.32337188720703125, 0.337066650390625, 0.35076141357421875, 0.3644561767578125, 0.37815093994140625, 0.391845703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 7.0, 5.0, 6.0, 14.0, 20.0, 8.0, 36.0, 29.0, 31.0, 57.0, 87.0, 143.0, 261.0, 560.0, 1596.0, 6263.0, 44340.0, 3544291.0, 568293.0, 22310.0, 3836.0, 1019.0, 427.0, 216.0, 118.0, 49.0, 61.0, 43.0, 36.0, 25.0, 23.0, 8.0, 18.0, 4.0, 7.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2685546875, -4.115234375, -3.9619140625, -3.80859375, -3.6552734375, -3.501953125, -3.3486328125, -3.1953125, -3.0419921875, -2.888671875, -2.7353515625, -2.58203125, -2.4287109375, -2.275390625, -2.1220703125, -1.96875, -1.8154296875, -1.662109375, -1.5087890625, -1.35546875, -1.2021484375, -1.048828125, -0.8955078125, -0.7421875, -0.5888671875, -0.435546875, -0.2822265625, -0.12890625, 0.0244140625, 0.177734375, 0.3310546875, 0.484375, 0.6376953125, 0.791015625, 0.9443359375, 1.09765625, 1.2509765625, 1.404296875, 1.5576171875, 1.7109375, 1.8642578125, 2.017578125, 2.1708984375, 2.32421875, 2.4775390625, 2.630859375, 2.7841796875, 2.9375, 3.0908203125, 3.244140625, 3.3974609375, 3.55078125, 3.7041015625, 3.857421875, 4.0107421875, 4.1640625, 4.3173828125, 4.470703125, 4.6240234375, 4.77734375, 4.9306640625, 5.083984375, 5.2373046875, 5.390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 10.0, 14.0, 8.0, 37.0, 42.0, 106.0, 241.0, 668.0, 1865.0, 611.0, 201.0, 98.0, 52.0, 37.0, 26.0, 18.0, 8.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1163482666015625, -1.078399658203125, -1.0404510498046875, -1.00250244140625, -0.9645538330078125, -0.926605224609375, -0.8886566162109375, -0.8507080078125, -0.8127593994140625, -0.774810791015625, -0.7368621826171875, -0.69891357421875, -0.6609649658203125, -0.623016357421875, -0.5850677490234375, -0.547119140625, -0.5091705322265625, -0.471221923828125, -0.4332733154296875, -0.39532470703125, -0.3573760986328125, -0.319427490234375, -0.2814788818359375, -0.2435302734375, -0.2055816650390625, -0.167633056640625, -0.1296844482421875, -0.09173583984375, -0.0537872314453125, -0.015838623046875, 0.0221099853515625, 0.06005859375, 0.0980072021484375, 0.135955810546875, 0.1739044189453125, 0.21185302734375, 0.2498016357421875, 0.287750244140625, 0.3256988525390625, 0.3636474609375, 0.4015960693359375, 0.439544677734375, 0.4774932861328125, 0.51544189453125, 0.5533905029296875, 0.591339111328125, 0.6292877197265625, 0.667236328125, 0.7051849365234375, 0.743133544921875, 0.7810821533203125, 0.81903076171875, 0.8569793701171875, 0.894927978515625, 0.9328765869140625, 0.9708251953125, 1.0087738037109375, 1.046722412109375, 1.0846710205078125, 1.12261962890625, 1.1605682373046875, 1.198516845703125, 1.2364654541015625, 1.2744140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 19.0, 57.0, 167.0, 270.0, 258.0, 135.0, 59.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.97625160217285, -17.565088272094727, -17.1539249420166, -16.742759704589844, -16.33159637451172, -15.920433044433594, -15.509268760681152, -15.098105430603027, -14.686941146850586, -14.275777816772461, -13.86461353302002, -13.453450202941895, -13.042285919189453, -12.631122589111328, -12.219958305358887, -11.808794975280762, -11.39763069152832, -10.986467361450195, -10.575303077697754, -10.164139747619629, -9.752975463867188, -9.341812133789062, -8.930647850036621, -8.519484519958496, -8.108321189880371, -7.697157382965088, -7.285993576049805, -6.8748297691345215, -6.463665962219238, -6.052502632141113, -5.641338348388672, -5.230175018310547, -4.8190107345581055, -4.407846927642822, -3.996683120727539, -3.585519313812256, -3.1743555068969727, -2.7631919384002686, -2.3520281314849854, -1.9408643245697021, -1.529700517654419, -1.1185367107391357, -0.7073729634284973, -0.2962092161178589, 0.11495459079742432, 0.526118278503418, 0.9372820854187012, 1.3484458923339844, 1.7596096992492676, 2.170773506164551, 2.581937313079834, 2.993101119995117, 3.4042649269104004, 3.8154284954071045, 4.226592063903809, 4.63775634765625, 5.048919677734375, 5.460083484649658, 5.871247291564941, 6.282411098480225, 6.693574905395508, 7.104738235473633, 7.515902519226074, 7.927065849304199, 8.33823013305664]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 6.0, 10.0, 22.0, 18.0, 23.0, 31.0, 41.0, 52.0, 41.0, 65.0, 63.0, 56.0, 72.0, 73.0, 57.0, 51.0, 58.0, 48.0, 44.0, 47.0, 33.0, 28.0, 13.0, 19.0, 8.0, 8.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.697535037994385, -4.567294597625732, -4.43705415725708, -4.306813716888428, -4.176573753356934, -4.046333312988281, -3.916092872619629, -3.7858524322509766, -3.655611991882324, -3.525371551513672, -3.3951311111450195, -3.2648909091949463, -3.134650468826294, -3.0044100284576416, -2.8741698265075684, -2.743929386138916, -2.6136889457702637, -2.4834485054016113, -2.353208065032959, -2.2229678630828857, -2.0927274227142334, -1.962486982345581, -1.8322466611862183, -1.7020063400268555, -1.5717658996582031, -1.4415254592895508, -1.311285138130188, -1.1810448169708252, -1.0508043766021729, -0.9205639958381653, -0.7903236150741577, -0.6600832343101501, -0.5298428535461426, -0.399602472782135, -0.26936209201812744, -0.13912171125411987, -0.008881330490112305, 0.12135905027389526, 0.25159943103790283, 0.3818398118019104, 0.512080192565918, 0.6423205733299255, 0.7725609540939331, 0.9028013348579407, 1.0330417156219482, 1.1632821559906006, 1.2935224771499634, 1.4237627983093262, 1.5540032386779785, 1.6842436790466309, 1.8144840002059937, 1.9447243213653564, 2.074964761734009, 2.205205202102661, 2.3354454040527344, 2.4656858444213867, 2.595926284790039, 2.7261667251586914, 2.8564071655273438, 2.986647367477417, 3.1168878078460693, 3.2471282482147217, 3.377368450164795, 3.5076088905334473, 3.6378493309020996]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 7.0, 26.0, 18.0, 32.0, 29.0, 42.0, 59.0, 89.0, 128.0, 184.0, 281.0, 525.0, 817.0, 1504.0, 2934.0, 6530.0, 16793.0, 52565.0, 188764.0, 438792.0, 237120.0, 65571.0, 20448.0, 7675.0, 3486.0, 1691.0, 920.0, 490.0, 305.0, 232.0, 153.0, 95.0, 67.0, 41.0, 31.0, 22.0, 16.0, 4.0, 11.0, 11.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.44921875, -2.363555908203125, -2.27789306640625, -2.192230224609375, -2.1065673828125, -2.020904541015625, -1.93524169921875, -1.849578857421875, -1.763916015625, -1.678253173828125, -1.59259033203125, -1.506927490234375, -1.4212646484375, -1.335601806640625, -1.24993896484375, -1.164276123046875, -1.07861328125, -0.992950439453125, -0.90728759765625, -0.821624755859375, -0.7359619140625, -0.650299072265625, -0.56463623046875, -0.478973388671875, -0.393310546875, -0.307647705078125, -0.22198486328125, -0.136322021484375, -0.0506591796875, 0.035003662109375, 0.12066650390625, 0.206329345703125, 0.2919921875, 0.377655029296875, 0.46331787109375, 0.548980712890625, 0.6346435546875, 0.720306396484375, 0.80596923828125, 0.891632080078125, 0.977294921875, 1.062957763671875, 1.14862060546875, 1.234283447265625, 1.3199462890625, 1.405609130859375, 1.49127197265625, 1.576934814453125, 1.66259765625, 1.748260498046875, 1.83392333984375, 1.919586181640625, 2.0052490234375, 2.090911865234375, 2.17657470703125, 2.262237548828125, 2.347900390625, 2.433563232421875, 2.51922607421875, 2.604888916015625, 2.6905517578125, 2.776214599609375, 2.86187744140625, 2.947540283203125, 3.033203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 11.0, 17.0, 19.0, 21.0, 25.0, 32.0, 51.0, 37.0, 46.0, 44.0, 73.0, 62.0, 70.0, 64.0, 53.0, 57.0, 48.0, 39.0, 42.0, 39.0, 19.0, 24.0, 22.0, 18.0, 13.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4853515625, -0.471771240234375, -0.45819091796875, -0.444610595703125, -0.4310302734375, -0.417449951171875, -0.40386962890625, -0.390289306640625, -0.376708984375, -0.363128662109375, -0.34954833984375, -0.335968017578125, -0.3223876953125, -0.308807373046875, -0.29522705078125, -0.281646728515625, -0.26806640625, -0.254486083984375, -0.24090576171875, -0.227325439453125, -0.2137451171875, -0.200164794921875, -0.18658447265625, -0.173004150390625, -0.159423828125, -0.145843505859375, -0.13226318359375, -0.118682861328125, -0.1051025390625, -0.091522216796875, -0.07794189453125, -0.064361572265625, -0.05078125, -0.037200927734375, -0.02362060546875, -0.010040283203125, 0.0035400390625, 0.017120361328125, 0.03070068359375, 0.044281005859375, 0.057861328125, 0.071441650390625, 0.08502197265625, 0.098602294921875, 0.1121826171875, 0.125762939453125, 0.13934326171875, 0.152923583984375, 0.16650390625, 0.180084228515625, 0.19366455078125, 0.207244873046875, 0.2208251953125, 0.234405517578125, 0.24798583984375, 0.261566162109375, 0.275146484375, 0.288726806640625, 0.30230712890625, 0.315887451171875, 0.3294677734375, 0.343048095703125, 0.35662841796875, 0.370208740234375, 0.3837890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 0.0, 10.0, 13.0, 13.0, 16.0, 18.0, 35.0, 41.0, 85.0, 108.0, 137.0, 208.0, 314.0, 478.0, 810.0, 1683.0, 4631.0, 17033.0, 76282.0, 304845.0, 444864.0, 149870.0, 33519.0, 8167.0, 2556.0, 1111.0, 624.0, 327.0, 241.0, 155.0, 88.0, 70.0, 51.0, 39.0, 44.0, 17.0, 13.0, 11.0, 9.0, 8.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.115234375, -2.045257568359375, -1.97528076171875, -1.905303955078125, -1.8353271484375, -1.765350341796875, -1.69537353515625, -1.625396728515625, -1.555419921875, -1.485443115234375, -1.41546630859375, -1.345489501953125, -1.2755126953125, -1.205535888671875, -1.13555908203125, -1.065582275390625, -0.99560546875, -0.925628662109375, -0.85565185546875, -0.785675048828125, -0.7156982421875, -0.645721435546875, -0.57574462890625, -0.505767822265625, -0.435791015625, -0.365814208984375, -0.29583740234375, -0.225860595703125, -0.1558837890625, -0.085906982421875, -0.01593017578125, 0.054046630859375, 0.1240234375, 0.194000244140625, 0.26397705078125, 0.333953857421875, 0.4039306640625, 0.473907470703125, 0.54388427734375, 0.613861083984375, 0.683837890625, 0.753814697265625, 0.82379150390625, 0.893768310546875, 0.9637451171875, 1.033721923828125, 1.10369873046875, 1.173675537109375, 1.24365234375, 1.313629150390625, 1.38360595703125, 1.453582763671875, 1.5235595703125, 1.593536376953125, 1.66351318359375, 1.733489990234375, 1.803466796875, 1.873443603515625, 1.94342041015625, 2.013397216796875, 2.0833740234375, 2.153350830078125, 2.22332763671875, 2.293304443359375, 2.36328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 18.0, 13.0, 17.0, 11.0, 21.0, 35.0, 19.0, 25.0, 31.0, 36.0, 31.0, 34.0, 45.0, 40.0, 37.0, 43.0, 41.0, 38.0, 37.0, 47.0, 42.0, 36.0, 35.0, 32.0, 25.0, 26.0, 23.0, 28.0, 25.0, 23.0, 18.0, 13.0, 10.0, 8.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3828125, -1.3404998779296875, -1.298187255859375, -1.2558746337890625, -1.21356201171875, -1.1712493896484375, -1.128936767578125, -1.0866241455078125, -1.0443115234375, -1.0019989013671875, -0.959686279296875, -0.9173736572265625, -0.87506103515625, -0.8327484130859375, -0.790435791015625, -0.7481231689453125, -0.705810546875, -0.6634979248046875, -0.621185302734375, -0.5788726806640625, -0.53656005859375, -0.4942474365234375, -0.451934814453125, -0.4096221923828125, -0.3673095703125, -0.3249969482421875, -0.282684326171875, -0.2403717041015625, -0.19805908203125, -0.1557464599609375, -0.113433837890625, -0.0711212158203125, -0.02880859375, 0.0135040283203125, 0.055816650390625, 0.0981292724609375, 0.14044189453125, 0.1827545166015625, 0.225067138671875, 0.2673797607421875, 0.3096923828125, 0.3520050048828125, 0.394317626953125, 0.4366302490234375, 0.47894287109375, 0.5212554931640625, 0.563568115234375, 0.6058807373046875, 0.648193359375, 0.6905059814453125, 0.732818603515625, 0.7751312255859375, 0.81744384765625, 0.8597564697265625, 0.902069091796875, 0.9443817138671875, 0.9866943359375, 1.0290069580078125, 1.071319580078125, 1.1136322021484375, 1.15594482421875, 1.1982574462890625, 1.240570068359375, 1.2828826904296875, 1.3251953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 14.0, 30.0, 46.0, 75.0, 131.0, 205.0, 379.0, 853.0, 1882.0, 5329.0, 20163.0, 145867.0, 720438.0, 126114.0, 18413.0, 5112.0, 1811.0, 811.0, 403.0, 181.0, 107.0, 63.0, 39.0, 25.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37890625, -2.307830810546875, -2.23675537109375, -2.165679931640625, -2.0946044921875, -2.023529052734375, -1.95245361328125, -1.881378173828125, -1.810302734375, -1.739227294921875, -1.66815185546875, -1.597076416015625, -1.5260009765625, -1.454925537109375, -1.38385009765625, -1.312774658203125, -1.24169921875, -1.170623779296875, -1.09954833984375, -1.028472900390625, -0.9573974609375, -0.886322021484375, -0.81524658203125, -0.744171142578125, -0.673095703125, -0.602020263671875, -0.53094482421875, -0.459869384765625, -0.3887939453125, -0.317718505859375, -0.24664306640625, -0.175567626953125, -0.1044921875, -0.033416748046875, 0.03765869140625, 0.108734130859375, 0.1798095703125, 0.250885009765625, 0.32196044921875, 0.393035888671875, 0.464111328125, 0.535186767578125, 0.60626220703125, 0.677337646484375, 0.7484130859375, 0.819488525390625, 0.89056396484375, 0.961639404296875, 1.03271484375, 1.103790283203125, 1.17486572265625, 1.245941162109375, 1.3170166015625, 1.388092041015625, 1.45916748046875, 1.530242919921875, 1.601318359375, 1.672393798828125, 1.74346923828125, 1.814544677734375, 1.8856201171875, 1.956695556640625, 2.02777099609375, 2.098846435546875, 2.169921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 16.0, 18.0, 22.0, 37.0, 32.0, 55.0, 93.0, 115.0, 126.0, 97.0, 66.0, 61.0, 57.0, 41.0, 20.0, 22.0, 11.0, 8.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002562999725341797, -0.00024925172328948975, -0.0002422034740447998, -0.00023515522480010986, -0.00022810697555541992, -0.00022105872631072998, -0.00021401047706604004, -0.0002069622278213501, -0.00019991397857666016, -0.00019286572933197021, -0.00018581748008728027, -0.00017876923084259033, -0.0001717209815979004, -0.00016467273235321045, -0.0001576244831085205, -0.00015057623386383057, -0.00014352798461914062, -0.00013647973537445068, -0.00012943148612976074, -0.0001223832368850708, -0.00011533498764038086, -0.00010828673839569092, -0.00010123848915100098, -9.419023990631104e-05, -8.71419906616211e-05, -8.009374141693115e-05, -7.304549217224121e-05, -6.599724292755127e-05, -5.894899368286133e-05, -5.190074443817139e-05, -4.4852495193481445e-05, -3.7804245948791504e-05, -3.075599670410156e-05, -2.370774745941162e-05, -1.665949821472168e-05, -9.611248970031738e-06, -2.562999725341797e-06, 4.4852495193481445e-06, 1.1533498764038086e-05, 1.8581748008728027e-05, 2.562999725341797e-05, 3.267824649810791e-05, 3.972649574279785e-05, 4.677474498748779e-05, 5.3822994232177734e-05, 6.0871243476867676e-05, 6.791949272155762e-05, 7.496774196624756e-05, 8.20159912109375e-05, 8.906424045562744e-05, 9.611248970031738e-05, 0.00010316073894500732, 0.00011020898818969727, 0.00011725723743438721, 0.00012430548667907715, 0.0001313537359237671, 0.00013840198516845703, 0.00014545023441314697, 0.00015249848365783691, 0.00015954673290252686, 0.0001665949821472168, 0.00017364323139190674, 0.00018069148063659668, 0.00018773972988128662, 0.00019478797912597656]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 16.0, 29.0, 37.0, 53.0, 109.0, 212.0, 383.0, 890.0, 2919.0, 14384.0, 223354.0, 766518.0, 32189.0, 5015.0, 1365.0, 504.0, 235.0, 128.0, 73.0, 46.0, 29.0, 12.0, 14.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.53515625, -3.418060302734375, -3.30096435546875, -3.183868408203125, -3.0667724609375, -2.949676513671875, -2.83258056640625, -2.715484619140625, -2.598388671875, -2.481292724609375, -2.36419677734375, -2.247100830078125, -2.1300048828125, -2.012908935546875, -1.89581298828125, -1.778717041015625, -1.66162109375, -1.544525146484375, -1.42742919921875, -1.310333251953125, -1.1932373046875, -1.076141357421875, -0.95904541015625, -0.841949462890625, -0.724853515625, -0.607757568359375, -0.49066162109375, -0.373565673828125, -0.2564697265625, -0.139373779296875, -0.02227783203125, 0.094818115234375, 0.2119140625, 0.329010009765625, 0.44610595703125, 0.563201904296875, 0.6802978515625, 0.797393798828125, 0.91448974609375, 1.031585693359375, 1.148681640625, 1.265777587890625, 1.38287353515625, 1.499969482421875, 1.6170654296875, 1.734161376953125, 1.85125732421875, 1.968353271484375, 2.08544921875, 2.202545166015625, 2.31964111328125, 2.436737060546875, 2.5538330078125, 2.670928955078125, 2.78802490234375, 2.905120849609375, 3.022216796875, 3.139312744140625, 3.25640869140625, 3.373504638671875, 3.4906005859375, 3.607696533203125, 3.72479248046875, 3.841888427734375, 3.958984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 10.0, 12.0, 14.0, 29.0, 48.0, 60.0, 108.0, 163.0, 186.0, 128.0, 80.0, 51.0, 26.0, 15.0, 17.0, 13.0, 7.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8647308349609375, -1.808563232421875, -1.7523956298828125, -1.69622802734375, -1.6400604248046875, -1.583892822265625, -1.5277252197265625, -1.4715576171875, -1.4153900146484375, -1.359222412109375, -1.3030548095703125, -1.24688720703125, -1.1907196044921875, -1.134552001953125, -1.0783843994140625, -1.022216796875, -0.9660491943359375, -0.909881591796875, -0.8537139892578125, -0.79754638671875, -0.7413787841796875, -0.685211181640625, -0.6290435791015625, -0.5728759765625, -0.5167083740234375, -0.460540771484375, -0.4043731689453125, -0.34820556640625, -0.2920379638671875, -0.235870361328125, -0.1797027587890625, -0.12353515625, -0.0673675537109375, -0.011199951171875, 0.0449676513671875, 0.10113525390625, 0.1573028564453125, 0.213470458984375, 0.2696380615234375, 0.3258056640625, 0.3819732666015625, 0.438140869140625, 0.4943084716796875, 0.55047607421875, 0.6066436767578125, 0.662811279296875, 0.7189788818359375, 0.775146484375, 0.8313140869140625, 0.887481689453125, 0.9436492919921875, 0.99981689453125, 1.0559844970703125, 1.112152099609375, 1.1683197021484375, 1.2244873046875, 1.2806549072265625, 1.336822509765625, 1.3929901123046875, 1.44915771484375, 1.5053253173828125, 1.561492919921875, 1.6176605224609375, 1.673828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 11.0, 63.0, 151.0, 295.0, 276.0, 148.0, 33.0, 19.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.460739135742188, -25.25513458251953, -24.049531936645508, -22.84392738342285, -21.638324737548828, -20.432720184326172, -19.227115631103516, -18.021512985229492, -16.81591033935547, -15.610306739807129, -14.404703140258789, -13.199098587036133, -11.99349594116211, -10.787891387939453, -9.582287788391113, -8.376684188842773, -7.171079635620117, -5.965476036071777, -4.7598724365234375, -3.5542683601379395, -2.3486647605895996, -1.1430611610412598, 0.06254291534423828, 1.2681465148925781, 2.473750114440918, 3.679353713989258, 4.884957313537598, 6.090561389923096, 7.2961649894714355, 8.501768112182617, 9.707372665405273, 10.912976264953613, 12.118579864501953, 13.324183464050293, 14.529787063598633, 15.735391616821289, 16.940994262695312, 18.14659881591797, 19.352203369140625, 20.55780601501465, 21.763408660888672, 22.969013214111328, 24.17461585998535, 25.380220413208008, 26.58582305908203, 27.791427612304688, 28.997032165527344, 30.202634811401367, 31.408239364624023, 32.61384201049805, 33.8194465637207, 35.02505111694336, 36.230655670166016, 37.436256408691406, 38.64186096191406, 39.84746551513672, 41.053070068359375, 42.25867462158203, 43.46427917480469, 44.66987991333008, 45.875484466552734, 47.08108901977539, 48.28669357299805, 49.49229431152344, 50.697898864746094]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 11.0, 11.0, 24.0, 15.0, 24.0, 25.0, 18.0, 33.0, 38.0, 25.0, 37.0, 35.0, 42.0, 39.0, 40.0, 38.0, 52.0, 34.0, 41.0, 27.0, 31.0, 40.0, 50.0, 34.0, 27.0, 44.0, 21.0, 16.0, 13.0, 16.0, 12.0, 15.0, 9.0, 8.0, 6.0, 6.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0], "bins": [-9.608081817626953, -9.353487014770508, -9.098893165588379, -8.844298362731934, -8.589704513549805, -8.33510971069336, -8.08051586151123, -7.825921058654785, -7.571327209472656, -7.316732883453369, -7.062138557434082, -6.807544231414795, -6.552949905395508, -6.298355579376221, -6.043761253356934, -5.789166450500488, -5.534572124481201, -5.279977798461914, -5.025383472442627, -4.77078914642334, -4.516194820404053, -4.261600494384766, -4.00700569152832, -3.7524116039276123, -3.497817277908325, -3.243222951889038, -2.988628625869751, -2.7340340614318848, -2.4794397354125977, -2.2248454093933105, -1.9702510833740234, -1.7156567573547363, -1.4610624313354492, -1.206468105316162, -0.9518737196922302, -0.6972793340682983, -0.44268500804901123, -0.18809068202972412, 0.06650376319885254, 0.32109808921813965, 0.5756924152374268, 0.8302867412567139, 1.084881067276001, 1.3394755125045776, 1.5940698385238647, 1.8486641645431519, 2.1032586097717285, 2.3578529357910156, 2.6124472618103027, 2.86704158782959, 3.121635913848877, 3.376230239868164, 3.630824565887451, 3.8854188919067383, 4.140013694763184, 4.3946075439453125, 4.649202346801758, 4.903796672821045, 5.158390998840332, 5.412985324859619, 5.667579650878906, 5.922173976898193, 6.1767683029174805, 6.431363105773926, 6.685956954956055]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 12.0, 17.0, 20.0, 22.0, 42.0, 49.0, 68.0, 85.0, 124.0, 177.0, 273.0, 443.0, 720.0, 1403.0, 3060.0, 6505.0, 18102.0, 76773.0, 2534349.0, 1454108.0, 67883.0, 17055.0, 6383.0, 2983.0, 1478.0, 868.0, 469.0, 271.0, 173.0, 122.0, 59.0, 47.0, 28.0, 31.0, 12.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71875, -3.612396240234375, -3.50604248046875, -3.399688720703125, -3.2933349609375, -3.186981201171875, -3.08062744140625, -2.974273681640625, -2.867919921875, -2.761566162109375, -2.65521240234375, -2.548858642578125, -2.4425048828125, -2.336151123046875, -2.22979736328125, -2.123443603515625, -2.01708984375, -1.910736083984375, -1.80438232421875, -1.698028564453125, -1.5916748046875, -1.485321044921875, -1.37896728515625, -1.272613525390625, -1.166259765625, -1.059906005859375, -0.95355224609375, -0.847198486328125, -0.7408447265625, -0.634490966796875, -0.52813720703125, -0.421783447265625, -0.3154296875, -0.209075927734375, -0.10272216796875, 0.003631591796875, 0.1099853515625, 0.216339111328125, 0.32269287109375, 0.429046630859375, 0.535400390625, 0.641754150390625, 0.74810791015625, 0.854461669921875, 0.9608154296875, 1.067169189453125, 1.17352294921875, 1.279876708984375, 1.38623046875, 1.492584228515625, 1.59893798828125, 1.705291748046875, 1.8116455078125, 1.917999267578125, 2.02435302734375, 2.130706787109375, 2.237060546875, 2.343414306640625, 2.44976806640625, 2.556121826171875, 2.6624755859375, 2.768829345703125, 2.87518310546875, 2.981536865234375, 3.087890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 6.0, 10.0, 18.0, 21.0, 28.0, 31.0, 35.0, 47.0, 37.0, 57.0, 50.0, 58.0, 73.0, 56.0, 63.0, 51.0, 64.0, 53.0, 36.0, 36.0, 24.0, 35.0, 21.0, 10.0, 13.0, 6.0, 15.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.509765625, -0.4956817626953125, -0.481597900390625, -0.4675140380859375, -0.45343017578125, -0.4393463134765625, -0.425262451171875, -0.4111785888671875, -0.3970947265625, -0.3830108642578125, -0.368927001953125, -0.3548431396484375, -0.34075927734375, -0.3266754150390625, -0.312591552734375, -0.2985076904296875, -0.284423828125, -0.2703399658203125, -0.256256103515625, -0.2421722412109375, -0.22808837890625, -0.2140045166015625, -0.199920654296875, -0.1858367919921875, -0.1717529296875, -0.1576690673828125, -0.143585205078125, -0.1295013427734375, -0.11541748046875, -0.1013336181640625, -0.087249755859375, -0.0731658935546875, -0.05908203125, -0.0449981689453125, -0.030914306640625, -0.0168304443359375, -0.00274658203125, 0.0113372802734375, 0.025421142578125, 0.0395050048828125, 0.0535888671875, 0.0676727294921875, 0.081756591796875, 0.0958404541015625, 0.10992431640625, 0.1240081787109375, 0.138092041015625, 0.1521759033203125, 0.166259765625, 0.1803436279296875, 0.194427490234375, 0.2085113525390625, 0.22259521484375, 0.2366790771484375, 0.250762939453125, 0.2648468017578125, 0.2789306640625, 0.2930145263671875, 0.307098388671875, 0.3211822509765625, 0.33526611328125, 0.3493499755859375, 0.363433837890625, 0.3775177001953125, 0.3916015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 9.0, 15.0, 15.0, 29.0, 24.0, 33.0, 62.0, 103.0, 162.0, 265.0, 621.0, 1471.0, 4492.0, 24172.0, 493295.0, 3589376.0, 67082.0, 8791.0, 2367.0, 921.0, 365.0, 222.0, 96.0, 60.0, 52.0, 27.0, 26.0, 26.0, 19.0, 8.0, 11.0, 13.0, 8.0, 2.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.76666259765625, -4.6231689453125, -4.47967529296875, -4.336181640625, -4.19268798828125, -4.0491943359375, -3.90570068359375, -3.76220703125, -3.61871337890625, -3.4752197265625, -3.33172607421875, -3.188232421875, -3.04473876953125, -2.9012451171875, -2.75775146484375, -2.6142578125, -2.47076416015625, -2.3272705078125, -2.18377685546875, -2.040283203125, -1.89678955078125, -1.7532958984375, -1.60980224609375, -1.46630859375, -1.32281494140625, -1.1793212890625, -1.03582763671875, -0.892333984375, -0.74884033203125, -0.6053466796875, -0.46185302734375, -0.318359375, -0.17486572265625, -0.0313720703125, 0.11212158203125, 0.255615234375, 0.39910888671875, 0.5426025390625, 0.68609619140625, 0.82958984375, 0.97308349609375, 1.1165771484375, 1.26007080078125, 1.403564453125, 1.54705810546875, 1.6905517578125, 1.83404541015625, 1.9775390625, 2.12103271484375, 2.2645263671875, 2.40802001953125, 2.551513671875, 2.69500732421875, 2.8385009765625, 2.98199462890625, 3.12548828125, 3.26898193359375, 3.4124755859375, 3.55596923828125, 3.699462890625, 3.84295654296875, 3.9864501953125, 4.12994384765625, 4.2734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 4.0, 8.0, 11.0, 23.0, 35.0, 60.0, 125.0, 298.0, 784.0, 1721.0, 580.0, 217.0, 101.0, 41.0, 15.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5857696533203125, -1.536773681640625, -1.4877777099609375, -1.43878173828125, -1.3897857666015625, -1.340789794921875, -1.2917938232421875, -1.2427978515625, -1.1938018798828125, -1.144805908203125, -1.0958099365234375, -1.04681396484375, -0.9978179931640625, -0.948822021484375, -0.8998260498046875, -0.850830078125, -0.8018341064453125, -0.752838134765625, -0.7038421630859375, -0.65484619140625, -0.6058502197265625, -0.556854248046875, -0.5078582763671875, -0.4588623046875, -0.4098663330078125, -0.360870361328125, -0.3118743896484375, -0.26287841796875, -0.2138824462890625, -0.164886474609375, -0.1158905029296875, -0.06689453125, -0.0178985595703125, 0.031097412109375, 0.0800933837890625, 0.12908935546875, 0.1780853271484375, 0.227081298828125, 0.2760772705078125, 0.3250732421875, 0.3740692138671875, 0.423065185546875, 0.4720611572265625, 0.52105712890625, 0.5700531005859375, 0.619049072265625, 0.6680450439453125, 0.717041015625, 0.7660369873046875, 0.815032958984375, 0.8640289306640625, 0.91302490234375, 0.9620208740234375, 1.011016845703125, 1.0600128173828125, 1.1090087890625, 1.1580047607421875, 1.207000732421875, 1.2559967041015625, 1.30499267578125, 1.3539886474609375, 1.402984619140625, 1.4519805908203125, 1.5009765625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 6.0, 16.0, 18.0, 27.0, 55.0, 79.0, 93.0, 147.0, 116.0, 143.0, 113.0, 55.0, 47.0, 34.0, 18.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21065616607666, -5.977004051208496, -5.743351936340332, -5.509699821472168, -5.276047706604004, -5.04239559173584, -4.808743476867676, -4.575091361999512, -4.341439247131348, -4.107787132263184, -3.8741350173950195, -3.6404829025268555, -3.4068307876586914, -3.1731786727905273, -2.9395267963409424, -2.7058746814727783, -2.4722228050231934, -2.2385706901550293, -2.0049185752868652, -1.7712665796279907, -1.5376144647598267, -1.3039623498916626, -1.070310354232788, -0.836658239364624, -0.60300612449646, -0.3693540394306183, -0.1357019543647766, 0.09795010089874268, 0.33160221576690674, 0.5652543306350708, 0.7989063262939453, 1.0325584411621094, 1.2662105560302734, 1.4998626708984375, 1.7335147857666016, 1.967166781425476, 2.2008190155029297, 2.4344711303710938, 2.6681230068206787, 2.9017751216888428, 3.135427236557007, 3.369079351425171, 3.602731466293335, 3.83638334274292, 4.070035457611084, 4.303687572479248, 4.537339687347412, 4.770991802215576, 5.00464391708374, 5.238296031951904, 5.471948146820068, 5.705600261688232, 5.9392523765563965, 6.1729044914245605, 6.406556129455566, 6.6402082443237305, 6.8738603591918945, 7.107512474060059, 7.341164588928223, 7.574816703796387, 7.808468818664551, 8.042120933532715, 8.275773048400879, 8.509425163269043, 8.743077278137207]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 13.0, 11.0, 12.0, 17.0, 21.0, 22.0, 27.0, 35.0, 47.0, 47.0, 46.0, 50.0, 45.0, 79.0, 53.0, 52.0, 52.0, 62.0, 52.0, 45.0, 38.0, 39.0, 24.0, 24.0, 24.0, 15.0, 12.0, 5.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4587721824645996, -3.318309783935547, -3.177847385406494, -3.0373847484588623, -2.8969223499298096, -2.756459951400757, -2.615997314453125, -2.4755349159240723, -2.3350725173950195, -2.194610118865967, -2.054147720336914, -1.9136850833892822, -1.7732226848602295, -1.6327602863311768, -1.4922977685928345, -1.3518352508544922, -1.2113728523254395, -1.0709104537963867, -0.9304479360580444, -0.7899854779243469, -0.6495230197906494, -0.5090605616569519, -0.3685981035232544, -0.22813564538955688, -0.08767318725585938, 0.052789270877838135, 0.19325172901153564, 0.33371418714523315, 0.47417664527893066, 0.6146391034126282, 0.7551015615463257, 0.8955640196800232, 1.0360264778137207, 1.1764888763427734, 1.3169513940811157, 1.457413911819458, 1.5978763103485107, 1.7383387088775635, 1.8788012266159058, 2.019263744354248, 2.159726142883301, 2.3001885414123535, 2.4406509399414062, 2.581113576889038, 2.721575975418091, 2.8620383739471436, 3.0025010108947754, 3.142963409423828, 3.283425807952881, 3.4238882064819336, 3.5643506050109863, 3.704813241958618, 3.845275640487671, 3.9857380390167236, 4.1262006759643555, 4.266663074493408, 4.407125473022461, 4.547587871551514, 4.688050270080566, 4.828512668609619, 4.968975067138672, 5.109437942504883, 5.2499003410339355, 5.390362739562988, 5.530825138092041]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 7.0, 5.0, 18.0, 30.0, 47.0, 69.0, 151.0, 278.0, 631.0, 1575.0, 4364.0, 18520.0, 119148.0, 705327.0, 165860.0, 23880.0, 5434.0, 1788.0, 748.0, 319.0, 159.0, 85.0, 38.0, 28.0, 17.0, 18.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.0987548828125, -3.955322265625, -3.8118896484375, -3.66845703125, -3.5250244140625, -3.381591796875, -3.2381591796875, -3.0947265625, -2.9512939453125, -2.807861328125, -2.6644287109375, -2.52099609375, -2.3775634765625, -2.234130859375, -2.0906982421875, -1.947265625, -1.8038330078125, -1.660400390625, -1.5169677734375, -1.37353515625, -1.2301025390625, -1.086669921875, -0.9432373046875, -0.7998046875, -0.6563720703125, -0.512939453125, -0.3695068359375, -0.22607421875, -0.0826416015625, 0.060791015625, 0.2042236328125, 0.34765625, 0.4910888671875, 0.634521484375, 0.7779541015625, 0.92138671875, 1.0648193359375, 1.208251953125, 1.3516845703125, 1.4951171875, 1.6385498046875, 1.781982421875, 1.9254150390625, 2.06884765625, 2.2122802734375, 2.355712890625, 2.4991455078125, 2.642578125, 2.7860107421875, 2.929443359375, 3.0728759765625, 3.21630859375, 3.3597412109375, 3.503173828125, 3.6466064453125, 3.7900390625, 3.9334716796875, 4.076904296875, 4.2203369140625, 4.36376953125, 4.5072021484375, 4.650634765625, 4.7940673828125, 4.9375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 10.0, 10.0, 19.0, 10.0, 33.0, 33.0, 24.0, 37.0, 58.0, 57.0, 54.0, 62.0, 59.0, 65.0, 65.0, 57.0, 58.0, 49.0, 48.0, 37.0, 34.0, 27.0, 11.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5498046875, -0.5346870422363281, -0.5195693969726562, -0.5044517517089844, -0.4893341064453125, -0.4742164611816406, -0.45909881591796875, -0.4439811706542969, -0.428863525390625, -0.4137458801269531, -0.39862823486328125, -0.3835105895996094, -0.3683929443359375, -0.3532752990722656, -0.33815765380859375, -0.3230400085449219, -0.30792236328125, -0.2928047180175781, -0.27768707275390625, -0.2625694274902344, -0.2474517822265625, -0.23233413696289062, -0.21721649169921875, -0.20209884643554688, -0.186981201171875, -0.17186355590820312, -0.15674591064453125, -0.14162826538085938, -0.1265106201171875, -0.11139297485351562, -0.09627532958984375, -0.08115768432617188, -0.0660400390625, -0.050922393798828125, -0.03580474853515625, -0.020687103271484375, -0.0055694580078125, 0.009548187255859375, 0.02466583251953125, 0.039783477783203125, 0.054901123046875, 0.07001876831054688, 0.08513641357421875, 0.10025405883789062, 0.1153717041015625, 0.13048934936523438, 0.14560699462890625, 0.16072463989257812, 0.17584228515625, 0.19095993041992188, 0.20607757568359375, 0.22119522094726562, 0.2363128662109375, 0.2514305114746094, 0.26654815673828125, 0.2816658020019531, 0.296783447265625, 0.3119010925292969, 0.32701873779296875, 0.3421363830566406, 0.3572540283203125, 0.3723716735839844, 0.38748931884765625, 0.4026069641113281, 0.417724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 6.0, 8.0, 13.0, 8.0, 25.0, 37.0, 32.0, 52.0, 82.0, 109.0, 136.0, 222.0, 340.0, 628.0, 1072.0, 2268.0, 6080.0, 19562.0, 74596.0, 340462.0, 458312.0, 103999.0, 26340.0, 8087.0, 2872.0, 1313.0, 654.0, 360.0, 256.0, 163.0, 117.0, 87.0, 61.0, 44.0, 28.0, 21.0, 22.0, 23.0, 11.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.408203125, -2.333221435546875, -2.25823974609375, -2.183258056640625, -2.1082763671875, -2.033294677734375, -1.95831298828125, -1.883331298828125, -1.808349609375, -1.733367919921875, -1.65838623046875, -1.583404541015625, -1.5084228515625, -1.433441162109375, -1.35845947265625, -1.283477783203125, -1.20849609375, -1.133514404296875, -1.05853271484375, -0.983551025390625, -0.9085693359375, -0.833587646484375, -0.75860595703125, -0.683624267578125, -0.608642578125, -0.533660888671875, -0.45867919921875, -0.383697509765625, -0.3087158203125, -0.233734130859375, -0.15875244140625, -0.083770751953125, -0.0087890625, 0.066192626953125, 0.14117431640625, 0.216156005859375, 0.2911376953125, 0.366119384765625, 0.44110107421875, 0.516082763671875, 0.591064453125, 0.666046142578125, 0.74102783203125, 0.816009521484375, 0.8909912109375, 0.965972900390625, 1.04095458984375, 1.115936279296875, 1.19091796875, 1.265899658203125, 1.34088134765625, 1.415863037109375, 1.4908447265625, 1.565826416015625, 1.64080810546875, 1.715789794921875, 1.790771484375, 1.865753173828125, 1.94073486328125, 2.015716552734375, 2.0906982421875, 2.165679931640625, 2.24066162109375, 2.315643310546875, 2.390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 4.0, 12.0, 14.0, 25.0, 16.0, 28.0, 23.0, 53.0, 52.0, 50.0, 51.0, 39.0, 55.0, 52.0, 72.0, 55.0, 47.0, 55.0, 54.0, 37.0, 42.0, 32.0, 20.0, 28.0, 19.0, 13.0, 11.0, 7.0, 6.0, 8.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.02734375, -1.96722412109375, -1.9071044921875, -1.84698486328125, -1.786865234375, -1.72674560546875, -1.6666259765625, -1.60650634765625, -1.54638671875, -1.48626708984375, -1.4261474609375, -1.36602783203125, -1.305908203125, -1.24578857421875, -1.1856689453125, -1.12554931640625, -1.0654296875, -1.00531005859375, -0.9451904296875, -0.88507080078125, -0.824951171875, -0.76483154296875, -0.7047119140625, -0.64459228515625, -0.58447265625, -0.52435302734375, -0.4642333984375, -0.40411376953125, -0.343994140625, -0.28387451171875, -0.2237548828125, -0.16363525390625, -0.103515625, -0.04339599609375, 0.0167236328125, 0.07684326171875, 0.136962890625, 0.19708251953125, 0.2572021484375, 0.31732177734375, 0.37744140625, 0.43756103515625, 0.4976806640625, 0.55780029296875, 0.617919921875, 0.67803955078125, 0.7381591796875, 0.79827880859375, 0.8583984375, 0.91851806640625, 0.9786376953125, 1.03875732421875, 1.098876953125, 1.15899658203125, 1.2191162109375, 1.27923583984375, 1.33935546875, 1.39947509765625, 1.4595947265625, 1.51971435546875, 1.579833984375, 1.63995361328125, 1.7000732421875, 1.76019287109375, 1.8203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 11.0, 9.0, 20.0, 40.0, 48.0, 100.0, 149.0, 286.0, 645.0, 1539.0, 4888.0, 20452.0, 143080.0, 761612.0, 93661.0, 15606.0, 3972.0, 1281.0, 521.0, 263.0, 140.0, 83.0, 55.0, 36.0, 19.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.175079345703125, -2.10797119140625, -2.040863037109375, -1.9737548828125, -1.906646728515625, -1.83953857421875, -1.772430419921875, -1.705322265625, -1.638214111328125, -1.57110595703125, -1.503997802734375, -1.4368896484375, -1.369781494140625, -1.30267333984375, -1.235565185546875, -1.16845703125, -1.101348876953125, -1.03424072265625, -0.967132568359375, -0.9000244140625, -0.832916259765625, -0.76580810546875, -0.698699951171875, -0.631591796875, -0.564483642578125, -0.49737548828125, -0.430267333984375, -0.3631591796875, -0.296051025390625, -0.22894287109375, -0.161834716796875, -0.0947265625, -0.027618408203125, 0.03948974609375, 0.106597900390625, 0.1737060546875, 0.240814208984375, 0.30792236328125, 0.375030517578125, 0.442138671875, 0.509246826171875, 0.57635498046875, 0.643463134765625, 0.7105712890625, 0.777679443359375, 0.84478759765625, 0.911895751953125, 0.97900390625, 1.046112060546875, 1.11322021484375, 1.180328369140625, 1.2474365234375, 1.314544677734375, 1.38165283203125, 1.448760986328125, 1.515869140625, 1.582977294921875, 1.65008544921875, 1.717193603515625, 1.7843017578125, 1.851409912109375, 1.91851806640625, 1.985626220703125, 2.052734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 17.0, 14.0, 32.0, 37.0, 71.0, 237.0, 346.0, 102.0, 53.0, 23.0, 23.0, 12.0, 8.0, 7.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006055831909179688, -0.0005901232361793518, -0.0005746632814407349, -0.0005592033267021179, -0.000543743371963501, -0.000528283417224884, -0.0005128234624862671, -0.0004973635077476501, -0.0004819035530090332, -0.00046644359827041626, -0.0004509836435317993, -0.0004355236887931824, -0.00042006373405456543, -0.0004046037793159485, -0.00038914382457733154, -0.0003736838698387146, -0.00035822391510009766, -0.0003427639603614807, -0.00032730400562286377, -0.0003118440508842468, -0.0002963840961456299, -0.00028092414140701294, -0.000265464186668396, -0.00025000423192977905, -0.0002345442771911621, -0.00021908432245254517, -0.00020362436771392822, -0.00018816441297531128, -0.00017270445823669434, -0.0001572445034980774, -0.00014178454875946045, -0.0001263245940208435, -0.00011086463928222656, -9.540468454360962e-05, -7.994472980499268e-05, -6.448477506637573e-05, -4.902482032775879e-05, -3.3564865589141846e-05, -1.8104910850524902e-05, -2.644956111907959e-06, 1.2814998626708984e-05, 2.8274953365325928e-05, 4.373490810394287e-05, 5.9194862842559814e-05, 7.465481758117676e-05, 9.01147723197937e-05, 0.00010557472705841064, 0.00012103468179702759, 0.00013649463653564453, 0.00015195459127426147, 0.00016741454601287842, 0.00018287450075149536, 0.0001983344554901123, 0.00021379441022872925, 0.0002292543649673462, 0.00024471431970596313, 0.0002601742744445801, 0.000275634229183197, 0.00029109418392181396, 0.0003065541386604309, 0.00032201409339904785, 0.0003374740481376648, 0.00035293400287628174, 0.0003683939576148987, 0.0003838539123535156]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 12.0, 13.0, 16.0, 15.0, 22.0, 35.0, 26.0, 42.0, 76.0, 100.0, 131.0, 271.0, 495.0, 996.0, 2381.0, 6156.0, 18936.0, 73313.0, 687874.0, 205020.0, 35272.0, 10403.0, 3780.0, 1463.0, 696.0, 412.0, 185.0, 121.0, 78.0, 57.0, 44.0, 30.0, 24.0, 19.0, 16.0, 7.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.674041748046875, -1.61370849609375, -1.553375244140625, -1.4930419921875, -1.432708740234375, -1.37237548828125, -1.312042236328125, -1.251708984375, -1.191375732421875, -1.13104248046875, -1.070709228515625, -1.0103759765625, -0.950042724609375, -0.88970947265625, -0.829376220703125, -0.76904296875, -0.708709716796875, -0.64837646484375, -0.588043212890625, -0.5277099609375, -0.467376708984375, -0.40704345703125, -0.346710205078125, -0.286376953125, -0.226043701171875, -0.16571044921875, -0.105377197265625, -0.0450439453125, 0.015289306640625, 0.07562255859375, 0.135955810546875, 0.1962890625, 0.256622314453125, 0.31695556640625, 0.377288818359375, 0.4376220703125, 0.497955322265625, 0.55828857421875, 0.618621826171875, 0.678955078125, 0.739288330078125, 0.79962158203125, 0.859954833984375, 0.9202880859375, 0.980621337890625, 1.04095458984375, 1.101287841796875, 1.16162109375, 1.221954345703125, 1.28228759765625, 1.342620849609375, 1.4029541015625, 1.463287353515625, 1.52362060546875, 1.583953857421875, 1.644287109375, 1.704620361328125, 1.76495361328125, 1.825286865234375, 1.8856201171875, 1.945953369140625, 2.00628662109375, 2.066619873046875, 2.126953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 9.0, 4.0, 12.0, 12.0, 12.0, 21.0, 21.0, 25.0, 45.0, 68.0, 100.0, 151.0, 160.0, 110.0, 69.0, 34.0, 28.0, 20.0, 18.0, 15.0, 19.0, 18.0, 8.0, 2.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9423751831054688, -0.9018402099609375, -0.8613052368164062, -0.820770263671875, -0.7802352905273438, -0.7397003173828125, -0.6991653442382812, -0.65863037109375, -0.6180953979492188, -0.5775604248046875, -0.5370254516601562, -0.496490478515625, -0.45595550537109375, -0.4154205322265625, -0.37488555908203125, -0.3343505859375, -0.29381561279296875, -0.2532806396484375, -0.21274566650390625, -0.172210693359375, -0.13167572021484375, -0.0911407470703125, -0.05060577392578125, -0.01007080078125, 0.03046417236328125, 0.0709991455078125, 0.11153411865234375, 0.152069091796875, 0.19260406494140625, 0.2331390380859375, 0.27367401123046875, 0.314208984375, 0.35474395751953125, 0.3952789306640625, 0.43581390380859375, 0.476348876953125, 0.5168838500976562, 0.5574188232421875, 0.5979537963867188, 0.63848876953125, 0.6790237426757812, 0.7195587158203125, 0.7600936889648438, 0.800628662109375, 0.8411636352539062, 0.8816986083984375, 0.9222335815429688, 0.9627685546875, 1.0033035278320312, 1.0438385009765625, 1.0843734741210938, 1.124908447265625, 1.1654434204101562, 1.2059783935546875, 1.2465133666992188, 1.28704833984375, 1.3275833129882812, 1.3681182861328125, 1.4086532592773438, 1.449188232421875, 1.4897232055664062, 1.5302581787109375, 1.5707931518554688, 1.611328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 12.0, 14.0, 31.0, 68.0, 127.0, 176.0, 186.0, 165.0, 115.0, 52.0, 31.0, 14.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.84744644165039, -24.052867889404297, -23.25828742980957, -22.463708877563477, -21.66912841796875, -20.874549865722656, -20.079971313476562, -19.285390853881836, -18.49081039428711, -17.696231842041016, -16.90165138244629, -16.107072830200195, -15.312492370605469, -14.517913818359375, -13.723334312438965, -12.928754806518555, -12.134176254272461, -11.33959674835205, -10.54501724243164, -9.750438690185547, -8.95585823059082, -8.161279678344727, -7.366700172424316, -6.572120666503906, -5.777541160583496, -4.982961654663086, -4.188382148742676, -3.393803119659424, -2.5992236137390137, -1.8046441078186035, -1.0100650787353516, -0.2154855728149414, 0.5790958404541016, 1.3736752271652222, 2.1682546138763428, 2.962833881378174, 3.757413387298584, 4.551992893218994, 5.346571922302246, 6.141151428222656, 6.935730934143066, 7.730310440063477, 8.524889945983887, 9.319469451904297, 10.11404800415039, 10.908628463745117, 11.703207015991211, 12.497786521911621, 13.292366027832031, 14.086945533752441, 14.881525039672852, 15.676103591918945, 16.470684051513672, 17.265262603759766, 18.05984115600586, 18.854421615600586, 19.649002075195312, 20.443580627441406, 21.238161087036133, 22.032739639282227, 22.827320098876953, 23.621898651123047, 24.41647720336914, 25.211057662963867, 26.00563621520996]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 4.0, 8.0, 9.0, 4.0, 12.0, 14.0, 9.0, 15.0, 12.0, 23.0, 23.0, 26.0, 21.0, 23.0, 35.0, 33.0, 28.0, 39.0, 36.0, 37.0, 31.0, 39.0, 34.0, 38.0, 41.0, 44.0, 40.0, 35.0, 27.0, 32.0, 29.0, 17.0, 23.0, 23.0, 27.0, 8.0, 14.0, 13.0, 12.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.466588497161865, -7.238072395324707, -7.009555816650391, -6.781039714813232, -6.552523136138916, -6.324007034301758, -6.095490455627441, -5.866974353790283, -5.638458251953125, -5.409942150115967, -5.18142557144165, -4.952909469604492, -4.724392890930176, -4.495876789093018, -4.267360687255859, -4.038844108581543, -3.8103275299072266, -3.5818111896514893, -3.353294849395752, -3.1247787475585938, -2.8962621688842773, -2.667746067047119, -2.439229726791382, -2.2107133865356445, -1.9821970462799072, -1.75368070602417, -1.5251643657684326, -1.2966481447219849, -1.0681318044662476, -0.8396154642105103, -0.6110992431640625, -0.3825829029083252, -0.1540665626525879, 0.07444974780082703, 0.30296605825424194, 0.5314823389053345, 0.7599986791610718, 0.9885150194168091, 1.2170312404632568, 1.4455475807189941, 1.6740639209747314, 1.9025802612304688, 2.131096601486206, 2.3596129417419434, 2.5881290435791016, 2.816645622253418, 3.045161724090576, 3.2736780643463135, 3.502194404602051, 3.730710744857788, 3.9592270851135254, 4.187743186950684, 4.416259765625, 4.644775867462158, 4.873291969299316, 5.101808547973633, 5.330325126647949, 5.558841228485107, 5.787357807159424, 6.015873908996582, 6.244390487670898, 6.472906589508057, 6.701422691345215, 6.929939270019531, 7.1584553718566895]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 16.0, 22.0, 27.0, 25.0, 44.0, 48.0, 71.0, 92.0, 138.0, 205.0, 284.0, 489.0, 928.0, 1726.0, 3564.0, 8578.0, 25818.0, 124598.0, 3425362.0, 521178.0, 54047.0, 14892.0, 5939.0, 2662.0, 1412.0, 810.0, 461.0, 269.0, 187.0, 107.0, 75.0, 60.0, 32.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 2.0], "bins": [-4.1796875, -4.071868896484375, -3.96405029296875, -3.856231689453125, -3.7484130859375, -3.640594482421875, -3.53277587890625, -3.424957275390625, -3.317138671875, -3.209320068359375, -3.10150146484375, -2.993682861328125, -2.8858642578125, -2.778045654296875, -2.67022705078125, -2.562408447265625, -2.45458984375, -2.346771240234375, -2.23895263671875, -2.131134033203125, -2.0233154296875, -1.915496826171875, -1.80767822265625, -1.699859619140625, -1.592041015625, -1.484222412109375, -1.37640380859375, -1.268585205078125, -1.1607666015625, -1.052947998046875, -0.94512939453125, -0.837310791015625, -0.7294921875, -0.621673583984375, -0.51385498046875, -0.406036376953125, -0.2982177734375, -0.190399169921875, -0.08258056640625, 0.025238037109375, 0.133056640625, 0.240875244140625, 0.34869384765625, 0.456512451171875, 0.5643310546875, 0.672149658203125, 0.77996826171875, 0.887786865234375, 0.99560546875, 1.103424072265625, 1.21124267578125, 1.319061279296875, 1.4268798828125, 1.534698486328125, 1.64251708984375, 1.750335693359375, 1.858154296875, 1.965972900390625, 2.07379150390625, 2.181610107421875, 2.2894287109375, 2.397247314453125, 2.50506591796875, 2.612884521484375, 2.720703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 3.0, 9.0, 8.0, 17.0, 24.0, 24.0, 32.0, 35.0, 33.0, 43.0, 43.0, 56.0, 51.0, 64.0, 72.0, 57.0, 57.0, 50.0, 54.0, 39.0, 40.0, 34.0, 36.0, 28.0, 20.0, 14.0, 14.0, 9.0, 5.0, 10.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.51220703125, -0.4975318908691406, -0.48285675048828125, -0.4681816101074219, -0.4535064697265625, -0.4388313293457031, -0.42415618896484375, -0.4094810485839844, -0.394805908203125, -0.3801307678222656, -0.36545562744140625, -0.3507804870605469, -0.3361053466796875, -0.3214302062988281, -0.30675506591796875, -0.2920799255371094, -0.27740478515625, -0.2627296447753906, -0.24805450439453125, -0.23337936401367188, -0.2187042236328125, -0.20402908325195312, -0.18935394287109375, -0.17467880249023438, -0.160003662109375, -0.14532852172851562, -0.13065338134765625, -0.11597824096679688, -0.1013031005859375, -0.08662796020507812, -0.07195281982421875, -0.057277679443359375, -0.0426025390625, -0.027927398681640625, -0.01325225830078125, 0.001422882080078125, 0.0160980224609375, 0.030773162841796875, 0.04544830322265625, 0.060123443603515625, 0.074798583984375, 0.08947372436523438, 0.10414886474609375, 0.11882400512695312, 0.1334991455078125, 0.14817428588867188, 0.16284942626953125, 0.17752456665039062, 0.19219970703125, 0.20687484741210938, 0.22154998779296875, 0.23622512817382812, 0.2509002685546875, 0.2655754089355469, 0.28025054931640625, 0.2949256896972656, 0.309600830078125, 0.3242759704589844, 0.33895111083984375, 0.3536262512207031, 0.3683013916015625, 0.3829765319824219, 0.39765167236328125, 0.4123268127441406, 0.427001953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 7.0, 15.0, 17.0, 15.0, 29.0, 19.0, 39.0, 50.0, 71.0, 102.0, 130.0, 222.0, 307.0, 708.0, 2132.0, 12830.0, 424871.0, 3719186.0, 27894.0, 3510.0, 935.0, 406.0, 221.0, 155.0, 81.0, 72.0, 65.0, 39.0, 38.0, 34.0, 17.0, 13.0, 10.0, 12.0, 8.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.5859375, -8.3609619140625, -8.135986328125, -7.9110107421875, -7.68603515625, -7.4610595703125, -7.236083984375, -7.0111083984375, -6.7861328125, -6.5611572265625, -6.336181640625, -6.1112060546875, -5.88623046875, -5.6612548828125, -5.436279296875, -5.2113037109375, -4.986328125, -4.7613525390625, -4.536376953125, -4.3114013671875, -4.08642578125, -3.8614501953125, -3.636474609375, -3.4114990234375, -3.1865234375, -2.9615478515625, -2.736572265625, -2.5115966796875, -2.28662109375, -2.0616455078125, -1.836669921875, -1.6116943359375, -1.38671875, -1.1617431640625, -0.936767578125, -0.7117919921875, -0.48681640625, -0.2618408203125, -0.036865234375, 0.1881103515625, 0.4130859375, 0.6380615234375, 0.863037109375, 1.0880126953125, 1.31298828125, 1.5379638671875, 1.762939453125, 1.9879150390625, 2.212890625, 2.4378662109375, 2.662841796875, 2.8878173828125, 3.11279296875, 3.3377685546875, 3.562744140625, 3.7877197265625, 4.0126953125, 4.2376708984375, 4.462646484375, 4.6876220703125, 4.91259765625, 5.1375732421875, 5.362548828125, 5.5875244140625, 5.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 10.0, 26.0, 48.0, 116.0, 610.0, 2649.0, 459.0, 94.0, 38.0, 14.0, 10.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.9769287109375, -3.887451171875, -3.7979736328125, -3.70849609375, -3.6190185546875, -3.529541015625, -3.4400634765625, -3.3505859375, -3.2611083984375, -3.171630859375, -3.0821533203125, -2.99267578125, -2.9031982421875, -2.813720703125, -2.7242431640625, -2.634765625, -2.5452880859375, -2.455810546875, -2.3663330078125, -2.27685546875, -2.1873779296875, -2.097900390625, -2.0084228515625, -1.9189453125, -1.8294677734375, -1.739990234375, -1.6505126953125, -1.56103515625, -1.4715576171875, -1.382080078125, -1.2926025390625, -1.203125, -1.1136474609375, -1.024169921875, -0.9346923828125, -0.84521484375, -0.7557373046875, -0.666259765625, -0.5767822265625, -0.4873046875, -0.3978271484375, -0.308349609375, -0.2188720703125, -0.12939453125, -0.0399169921875, 0.049560546875, 0.1390380859375, 0.228515625, 0.3179931640625, 0.407470703125, 0.4969482421875, 0.58642578125, 0.6759033203125, 0.765380859375, 0.8548583984375, 0.9443359375, 1.0338134765625, 1.123291015625, 1.2127685546875, 1.30224609375, 1.3917236328125, 1.481201171875, 1.5706787109375, 1.66015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 42.0, 58.0, 90.0, 129.0, 169.0, 170.0, 123.0, 62.0, 50.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-10.343038558959961, -10.069808959960938, -9.796579360961914, -9.52334976196289, -9.25011920928955, -8.976889610290527, -8.703660011291504, -8.43043041229248, -8.157200813293457, -7.883971214294434, -7.610741138458252, -7.3375115394592285, -7.064281940460205, -6.791051864624023, -6.517822265625, -6.244592666625977, -5.971362590789795, -5.6981329917907715, -5.42490291595459, -5.151673316955566, -4.878443717956543, -4.6052141189575195, -4.331984043121338, -4.0587544441223145, -3.785524606704712, -3.5122947692871094, -3.239065170288086, -2.9658353328704834, -2.692605495452881, -2.4193758964538574, -2.146146059036255, -1.872916340827942, -1.5996861457824707, -1.3264564275741577, -1.0532267093658447, -0.7799968719482422, -0.5067671537399292, -0.2335374355316162, 0.03969240188598633, 0.3129221200942993, 0.5861518383026123, 0.8593815565109253, 1.1326112747192383, 1.4058411121368408, 1.6790708303451538, 1.9523005485534668, 2.2255303859710693, 2.498760223388672, 2.7719898223876953, 3.045219659805298, 3.3184492588043213, 3.591679096221924, 3.8649086952209473, 4.138138771057129, 4.411368370056152, 4.684597969055176, 4.957827568054199, 5.231057167053223, 5.504287242889404, 5.777516841888428, 6.050746440887451, 6.323976516723633, 6.597206115722656, 6.87043571472168, 7.143665790557861]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 11.0, 12.0, 22.0, 26.0, 58.0, 74.0, 65.0, 95.0, 96.0, 92.0, 76.0, 80.0, 72.0, 62.0, 44.0, 31.0, 17.0, 20.0, 14.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.705615043640137, -8.498294830322266, -8.290974617004395, -8.083654403686523, -7.876333713531494, -7.669013500213623, -7.461693286895752, -7.254373073577881, -7.047052383422852, -6.8397321701049805, -6.632411956787109, -6.425091743469238, -6.217771053314209, -6.010450839996338, -5.803130626678467, -5.595810413360596, -5.388490200042725, -5.1811699867248535, -4.973849773406982, -4.766529083251953, -4.559208869934082, -4.351888656616211, -4.14456844329834, -3.9372482299804688, -3.7299277782440186, -3.5226075649261475, -3.3152871131896973, -3.107966899871826, -2.900646686553955, -2.693326234817505, -2.486006021499634, -2.2786855697631836, -2.0713658332824707, -1.86404550075531, -1.6567251682281494, -1.4494049549102783, -1.2420846223831177, -1.034764289855957, -0.8274440765380859, -0.6201237440109253, -0.41280341148376465, -0.2054831087589264, 0.0018371939659118652, 0.20915746688842773, 0.4164777994155884, 0.623798131942749, 0.8311183452606201, 1.0384386777877808, 1.2457590103149414, 1.453079342842102, 1.6603996753692627, 1.8677198886871338, 2.075040340423584, 2.282360553741455, 2.489680767059326, 2.6970009803771973, 2.9043214321136475, 3.1116416454315186, 3.3189620971679688, 3.52628231048584, 3.733602523803711, 3.940922975540161, 4.148242950439453, 4.355563640594482, 4.5628838539123535]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 6.0, 8.0, 15.0, 38.0, 55.0, 78.0, 108.0, 156.0, 277.0, 415.0, 878.0, 1891.0, 4824.0, 16099.0, 67042.0, 416978.0, 442629.0, 71200.0, 16810.0, 4984.0, 1952.0, 887.0, 443.0, 247.0, 196.0, 103.0, 69.0, 50.0, 38.0, 23.0, 15.0, 14.0, 10.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.400146484375, -3.29052734375, -3.180908203125, -3.0712890625, -2.961669921875, -2.85205078125, -2.742431640625, -2.6328125, -2.523193359375, -2.41357421875, -2.303955078125, -2.1943359375, -2.084716796875, -1.97509765625, -1.865478515625, -1.755859375, -1.646240234375, -1.53662109375, -1.427001953125, -1.3173828125, -1.207763671875, -1.09814453125, -0.988525390625, -0.87890625, -0.769287109375, -0.65966796875, -0.550048828125, -0.4404296875, -0.330810546875, -0.22119140625, -0.111572265625, -0.001953125, 0.107666015625, 0.21728515625, 0.326904296875, 0.4365234375, 0.546142578125, 0.65576171875, 0.765380859375, 0.875, 0.984619140625, 1.09423828125, 1.203857421875, 1.3134765625, 1.423095703125, 1.53271484375, 1.642333984375, 1.751953125, 1.861572265625, 1.97119140625, 2.080810546875, 2.1904296875, 2.300048828125, 2.40966796875, 2.519287109375, 2.62890625, 2.738525390625, 2.84814453125, 2.957763671875, 3.0673828125, 3.177001953125, 3.28662109375, 3.396240234375, 3.505859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 14.0, 13.0, 30.0, 33.0, 38.0, 37.0, 68.0, 66.0, 65.0, 72.0, 87.0, 72.0, 72.0, 68.0, 54.0, 45.0, 42.0, 34.0, 17.0, 16.0, 14.0, 16.0, 6.0, 3.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7314453125, -0.712005615234375, -0.69256591796875, -0.673126220703125, -0.6536865234375, -0.634246826171875, -0.61480712890625, -0.595367431640625, -0.575927734375, -0.556488037109375, -0.53704833984375, -0.517608642578125, -0.4981689453125, -0.478729248046875, -0.45928955078125, -0.439849853515625, -0.42041015625, -0.400970458984375, -0.38153076171875, -0.362091064453125, -0.3426513671875, -0.323211669921875, -0.30377197265625, -0.284332275390625, -0.264892578125, -0.245452880859375, -0.22601318359375, -0.206573486328125, -0.1871337890625, -0.167694091796875, -0.14825439453125, -0.128814697265625, -0.109375, -0.089935302734375, -0.07049560546875, -0.051055908203125, -0.0316162109375, -0.012176513671875, 0.00726318359375, 0.026702880859375, 0.046142578125, 0.065582275390625, 0.08502197265625, 0.104461669921875, 0.1239013671875, 0.143341064453125, 0.16278076171875, 0.182220458984375, 0.20166015625, 0.221099853515625, 0.24053955078125, 0.259979248046875, 0.2794189453125, 0.298858642578125, 0.31829833984375, 0.337738037109375, 0.357177734375, 0.376617431640625, 0.39605712890625, 0.415496826171875, 0.4349365234375, 0.454376220703125, 0.47381591796875, 0.493255615234375, 0.5126953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 10.0, 22.0, 25.0, 39.0, 51.0, 76.0, 87.0, 150.0, 220.0, 343.0, 600.0, 1108.0, 2296.0, 4958.0, 10947.0, 26471.0, 68342.0, 208686.0, 425368.0, 190796.0, 63717.0, 24539.0, 10376.0, 4540.0, 2085.0, 1027.0, 587.0, 315.0, 236.0, 144.0, 106.0, 71.0, 61.0, 29.0, 22.0, 21.0, 12.0, 10.0, 8.0, 4.0, 4.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.48919677734375, -1.4403076171875, -1.39141845703125, -1.342529296875, -1.29364013671875, -1.2447509765625, -1.19586181640625, -1.14697265625, -1.09808349609375, -1.0491943359375, -1.00030517578125, -0.951416015625, -0.90252685546875, -0.8536376953125, -0.80474853515625, -0.755859375, -0.70697021484375, -0.6580810546875, -0.60919189453125, -0.560302734375, -0.51141357421875, -0.4625244140625, -0.41363525390625, -0.36474609375, -0.31585693359375, -0.2669677734375, -0.21807861328125, -0.169189453125, -0.12030029296875, -0.0714111328125, -0.02252197265625, 0.0263671875, 0.07525634765625, 0.1241455078125, 0.17303466796875, 0.221923828125, 0.27081298828125, 0.3197021484375, 0.36859130859375, 0.41748046875, 0.46636962890625, 0.5152587890625, 0.56414794921875, 0.613037109375, 0.66192626953125, 0.7108154296875, 0.75970458984375, 0.80859375, 0.85748291015625, 0.9063720703125, 0.95526123046875, 1.004150390625, 1.05303955078125, 1.1019287109375, 1.15081787109375, 1.19970703125, 1.24859619140625, 1.2974853515625, 1.34637451171875, 1.395263671875, 1.44415283203125, 1.4930419921875, 1.54193115234375, 1.5908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 15.0, 11.0, 13.0, 17.0, 16.0, 14.0, 24.0, 13.0, 29.0, 26.0, 31.0, 36.0, 28.0, 39.0, 47.0, 27.0, 34.0, 51.0, 32.0, 55.0, 36.0, 39.0, 43.0, 44.0, 28.0, 28.0, 16.0, 20.0, 34.0, 23.0, 21.0, 10.0, 14.0, 18.0, 8.0, 5.0, 6.0, 11.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.4296875, -1.388214111328125, -1.34674072265625, -1.305267333984375, -1.2637939453125, -1.222320556640625, -1.18084716796875, -1.139373779296875, -1.097900390625, -1.056427001953125, -1.01495361328125, -0.973480224609375, -0.9320068359375, -0.890533447265625, -0.84906005859375, -0.807586669921875, -0.76611328125, -0.724639892578125, -0.68316650390625, -0.641693115234375, -0.6002197265625, -0.558746337890625, -0.51727294921875, -0.475799560546875, -0.434326171875, -0.392852783203125, -0.35137939453125, -0.309906005859375, -0.2684326171875, -0.226959228515625, -0.18548583984375, -0.144012451171875, -0.1025390625, -0.061065673828125, -0.01959228515625, 0.021881103515625, 0.0633544921875, 0.104827880859375, 0.14630126953125, 0.187774658203125, 0.229248046875, 0.270721435546875, 0.31219482421875, 0.353668212890625, 0.3951416015625, 0.436614990234375, 0.47808837890625, 0.519561767578125, 0.56103515625, 0.602508544921875, 0.64398193359375, 0.685455322265625, 0.7269287109375, 0.768402099609375, 0.80987548828125, 0.851348876953125, 0.892822265625, 0.934295654296875, 0.97576904296875, 1.017242431640625, 1.0587158203125, 1.100189208984375, 1.14166259765625, 1.183135986328125, 1.224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 27.0, 39.0, 52.0, 83.0, 118.0, 170.0, 294.0, 506.0, 1049.0, 2315.0, 5887.0, 20013.0, 98126.0, 737430.0, 144588.0, 25357.0, 7203.0, 2544.0, 1225.0, 635.0, 298.0, 193.0, 108.0, 74.0, 51.0, 37.0, 29.0, 12.0, 15.0, 10.0, 5.0, 4.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.1905670166015625, -1.145782470703125, -1.1009979248046875, -1.05621337890625, -1.0114288330078125, -0.966644287109375, -0.9218597412109375, -0.8770751953125, -0.8322906494140625, -0.787506103515625, -0.7427215576171875, -0.69793701171875, -0.6531524658203125, -0.608367919921875, -0.5635833740234375, -0.518798828125, -0.4740142822265625, -0.429229736328125, -0.3844451904296875, -0.33966064453125, -0.2948760986328125, -0.250091552734375, -0.2053070068359375, -0.1605224609375, -0.1157379150390625, -0.070953369140625, -0.0261688232421875, 0.01861572265625, 0.0634002685546875, 0.108184814453125, 0.1529693603515625, 0.19775390625, 0.2425384521484375, 0.287322998046875, 0.3321075439453125, 0.37689208984375, 0.4216766357421875, 0.466461181640625, 0.5112457275390625, 0.5560302734375, 0.6008148193359375, 0.645599365234375, 0.6903839111328125, 0.73516845703125, 0.7799530029296875, 0.824737548828125, 0.8695220947265625, 0.914306640625, 0.9590911865234375, 1.003875732421875, 1.0486602783203125, 1.09344482421875, 1.1382293701171875, 1.183013916015625, 1.2277984619140625, 1.2725830078125, 1.3173675537109375, 1.362152099609375, 1.4069366455078125, 1.45172119140625, 1.4965057373046875, 1.541290283203125, 1.5860748291015625, 1.630859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 7.0, 10.0, 18.0, 10.0, 11.0, 26.0, 19.0, 49.0, 139.0, 353.0, 186.0, 70.0, 41.0, 16.0, 16.0, 9.0, 7.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025177001953125, -0.00024109333753585815, -0.0002304166555404663, -0.00021973997354507446, -0.00020906329154968262, -0.00019838660955429077, -0.00018770992755889893, -0.00017703324556350708, -0.00016635656356811523, -0.0001556798815727234, -0.00014500319957733154, -0.0001343265175819397, -0.00012364983558654785, -0.000112973153591156, -0.00010229647159576416, -9.161978960037231e-05, -8.094310760498047e-05, -7.026642560958862e-05, -5.958974361419678e-05, -4.891306161880493e-05, -3.8236379623413086e-05, -2.755969762802124e-05, -1.6883015632629395e-05, -6.206333637237549e-06, 4.470348358154297e-06, 1.5147030353546143e-05, 2.5823712348937988e-05, 3.6500394344329834e-05, 4.717707633972168e-05, 5.7853758335113525e-05, 6.853044033050537e-05, 7.920712232589722e-05, 8.988380432128906e-05, 0.00010056048631668091, 0.00011123716831207275, 0.0001219138503074646, 0.00013259053230285645, 0.0001432672142982483, 0.00015394389629364014, 0.00016462057828903198, 0.00017529726028442383, 0.00018597394227981567, 0.00019665062427520752, 0.00020732730627059937, 0.0002180039882659912, 0.00022868067026138306, 0.0002393573522567749, 0.00025003403425216675, 0.0002607107162475586, 0.00027138739824295044, 0.0002820640802383423, 0.00029274076223373413, 0.000303417444229126, 0.0003140941262245178, 0.00032477080821990967, 0.0003354474902153015, 0.00034612417221069336, 0.0003568008542060852, 0.00036747753620147705, 0.0003781542181968689, 0.00038883090019226074, 0.0003995075821876526, 0.00041018426418304443, 0.0004208609461784363, 0.0004315376281738281]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 8.0, 17.0, 21.0, 21.0, 44.0, 53.0, 123.0, 172.0, 304.0, 604.0, 1279.0, 3312.0, 9837.0, 38258.0, 388444.0, 542189.0, 45728.0, 11570.0, 3696.0, 1382.0, 661.0, 324.0, 216.0, 108.0, 67.0, 43.0, 24.0, 18.0, 12.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.729949951171875, -1.68060302734375, -1.631256103515625, -1.5819091796875, -1.532562255859375, -1.48321533203125, -1.433868408203125, -1.384521484375, -1.335174560546875, -1.28582763671875, -1.236480712890625, -1.1871337890625, -1.137786865234375, -1.08843994140625, -1.039093017578125, -0.98974609375, -0.940399169921875, -0.89105224609375, -0.841705322265625, -0.7923583984375, -0.743011474609375, -0.69366455078125, -0.644317626953125, -0.594970703125, -0.545623779296875, -0.49627685546875, -0.446929931640625, -0.3975830078125, -0.348236083984375, -0.29888916015625, -0.249542236328125, -0.2001953125, -0.150848388671875, -0.10150146484375, -0.052154541015625, -0.0028076171875, 0.046539306640625, 0.09588623046875, 0.145233154296875, 0.194580078125, 0.243927001953125, 0.29327392578125, 0.342620849609375, 0.3919677734375, 0.441314697265625, 0.49066162109375, 0.540008544921875, 0.58935546875, 0.638702392578125, 0.68804931640625, 0.737396240234375, 0.7867431640625, 0.836090087890625, 0.88543701171875, 0.934783935546875, 0.984130859375, 1.033477783203125, 1.08282470703125, 1.132171630859375, 1.1815185546875, 1.230865478515625, 1.28021240234375, 1.329559326171875, 1.37890625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 11.0, 11.0, 15.0, 32.0, 35.0, 57.0, 101.0, 161.0, 164.0, 140.0, 93.0, 37.0, 17.0, 17.0, 18.0, 10.0, 11.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.4873046875, -1.4513168334960938, -1.4153289794921875, -1.3793411254882812, -1.343353271484375, -1.3073654174804688, -1.2713775634765625, -1.2353897094726562, -1.19940185546875, -1.1634140014648438, -1.1274261474609375, -1.0914382934570312, -1.055450439453125, -1.0194625854492188, -0.9834747314453125, -0.9474868774414062, -0.9114990234375, -0.8755111694335938, -0.8395233154296875, -0.8035354614257812, -0.767547607421875, -0.7315597534179688, -0.6955718994140625, -0.6595840454101562, -0.62359619140625, -0.5876083374023438, -0.5516204833984375, -0.5156326293945312, -0.479644775390625, -0.44365692138671875, -0.4076690673828125, -0.37168121337890625, -0.335693359375, -0.29970550537109375, -0.2637176513671875, -0.22772979736328125, -0.191741943359375, -0.15575408935546875, -0.1197662353515625, -0.08377838134765625, -0.04779052734375, -0.01180267333984375, 0.0241851806640625, 0.06017303466796875, 0.096160888671875, 0.13214874267578125, 0.1681365966796875, 0.20412445068359375, 0.2401123046875, 0.27610015869140625, 0.3120880126953125, 0.34807586669921875, 0.384063720703125, 0.42005157470703125, 0.4560394287109375, 0.49202728271484375, 0.52801513671875, 0.5640029907226562, 0.5999908447265625, 0.6359786987304688, 0.671966552734375, 0.7079544067382812, 0.7439422607421875, 0.7799301147460938, 0.81591796875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 12.0, 24.0, 47.0, 86.0, 121.0, 149.0, 160.0, 142.0, 106.0, 72.0, 40.0, 25.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.285001754760742, -25.67831039428711, -25.07162094116211, -24.46493148803711, -23.858240127563477, -23.251548767089844, -22.644859313964844, -22.038169860839844, -21.43147850036621, -20.824787139892578, -20.218097686767578, -19.611408233642578, -19.004716873168945, -18.398025512695312, -17.791336059570312, -17.184646606445312, -16.57795524597168, -15.971264839172363, -15.364574432373047, -14.75788402557373, -14.151193618774414, -13.544503211975098, -12.937812805175781, -12.331122398376465, -11.724431991577148, -11.117741584777832, -10.511051177978516, -9.9043607711792, -9.297670364379883, -8.690979957580566, -8.08428955078125, -7.477599143981934, -6.87091064453125, -6.264220237731934, -5.657529830932617, -5.050839424133301, -4.444149017333984, -3.837458610534668, -3.2307682037353516, -2.624077796936035, -2.0173873901367188, -1.4106969833374023, -0.8040065765380859, -0.19731616973876953, 0.4093742370605469, 1.0160646438598633, 1.6227550506591797, 2.229445457458496, 2.8361358642578125, 3.442826271057129, 4.049516677856445, 4.656207084655762, 5.262897491455078, 5.8695878982543945, 6.476278305053711, 7.082968711853027, 7.689659118652344, 8.29634952545166, 8.903039932250977, 9.509730339050293, 10.11642074584961, 10.723111152648926, 11.329801559448242, 11.936491966247559, 12.543182373046875]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 7.0, 4.0, 8.0, 14.0, 20.0, 18.0, 19.0, 34.0, 27.0, 27.0, 23.0, 40.0, 19.0, 44.0, 38.0, 41.0, 45.0, 45.0, 36.0, 36.0, 35.0, 37.0, 36.0, 42.0, 23.0, 34.0, 28.0, 29.0, 25.0, 24.0, 11.0, 15.0, 17.0, 9.0, 15.0, 9.0, 8.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.608931064605713, -6.402459621429443, -6.195988178253174, -5.989516735076904, -5.783045291900635, -5.576573848724365, -5.370102405548096, -5.163630962371826, -4.957159519195557, -4.750688076019287, -4.544216632843018, -4.337745189666748, -4.1312737464904785, -3.924802303314209, -3.7183308601379395, -3.51185941696167, -3.3053879737854004, -3.098916530609131, -2.8924450874328613, -2.685973644256592, -2.4795022010803223, -2.2730307579040527, -2.066559314727783, -1.8600878715515137, -1.6536164283752441, -1.4471449851989746, -1.240673542022705, -1.0342020988464355, -0.827730655670166, -0.6212592124938965, -0.41478776931762695, -0.20831632614135742, -0.0018453598022460938, 0.20462608337402344, 0.41109752655029297, 0.6175689697265625, 0.824040412902832, 1.0305118560791016, 1.236983299255371, 1.4434547424316406, 1.6499261856079102, 1.8563976287841797, 2.062869071960449, 2.2693405151367188, 2.4758119583129883, 2.682283401489258, 2.8887548446655273, 3.095226287841797, 3.3016977310180664, 3.508169174194336, 3.7146406173706055, 3.921112060546875, 4.1275835037231445, 4.334054946899414, 4.540526390075684, 4.746997833251953, 4.953469276428223, 5.159940719604492, 5.366412162780762, 5.572883605957031, 5.779355049133301, 5.98582649230957, 6.19229793548584, 6.398769378662109, 6.605240821838379]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 11.0, 13.0, 17.0, 18.0, 21.0, 39.0, 64.0, 73.0, 121.0, 164.0, 270.0, 423.0, 697.0, 1373.0, 2965.0, 7949.0, 28749.0, 277955.0, 3763264.0, 84298.0, 15932.0, 5110.0, 2139.0, 1099.0, 580.0, 336.0, 193.0, 115.0, 98.0, 56.0, 38.0, 16.0, 18.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3125, -6.1385498046875, -5.964599609375, -5.7906494140625, -5.61669921875, -5.4427490234375, -5.268798828125, -5.0948486328125, -4.9208984375, -4.7469482421875, -4.572998046875, -4.3990478515625, -4.22509765625, -4.0511474609375, -3.877197265625, -3.7032470703125, -3.529296875, -3.3553466796875, -3.181396484375, -3.0074462890625, -2.83349609375, -2.6595458984375, -2.485595703125, -2.3116455078125, -2.1376953125, -1.9637451171875, -1.789794921875, -1.6158447265625, -1.44189453125, -1.2679443359375, -1.093994140625, -0.9200439453125, -0.74609375, -0.5721435546875, -0.398193359375, -0.2242431640625, -0.05029296875, 0.1236572265625, 0.297607421875, 0.4715576171875, 0.6455078125, 0.8194580078125, 0.993408203125, 1.1673583984375, 1.34130859375, 1.5152587890625, 1.689208984375, 1.8631591796875, 2.037109375, 2.2110595703125, 2.385009765625, 2.5589599609375, 2.73291015625, 2.9068603515625, 3.080810546875, 3.2547607421875, 3.4287109375, 3.6026611328125, 3.776611328125, 3.9505615234375, 4.12451171875, 4.2984619140625, 4.472412109375, 4.6463623046875, 4.8203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 18.0, 32.0, 31.0, 32.0, 42.0, 57.0, 61.0, 68.0, 80.0, 83.0, 76.0, 70.0, 58.0, 64.0, 50.0, 41.0, 31.0, 27.0, 21.0, 15.0, 5.0, 13.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.79345703125, -0.7735137939453125, -0.753570556640625, -0.7336273193359375, -0.71368408203125, -0.6937408447265625, -0.673797607421875, -0.6538543701171875, -0.6339111328125, -0.6139678955078125, -0.594024658203125, -0.5740814208984375, -0.55413818359375, -0.5341949462890625, -0.514251708984375, -0.4943084716796875, -0.474365234375, -0.4544219970703125, -0.434478759765625, -0.4145355224609375, -0.39459228515625, -0.3746490478515625, -0.354705810546875, -0.3347625732421875, -0.3148193359375, -0.2948760986328125, -0.274932861328125, -0.2549896240234375, -0.23504638671875, -0.2151031494140625, -0.195159912109375, -0.1752166748046875, -0.1552734375, -0.1353302001953125, -0.115386962890625, -0.0954437255859375, -0.07550048828125, -0.0555572509765625, -0.035614013671875, -0.0156707763671875, 0.0042724609375, 0.0242156982421875, 0.044158935546875, 0.0641021728515625, 0.08404541015625, 0.1039886474609375, 0.123931884765625, 0.1438751220703125, 0.163818359375, 0.1837615966796875, 0.203704833984375, 0.2236480712890625, 0.24359130859375, 0.2635345458984375, 0.283477783203125, 0.3034210205078125, 0.3233642578125, 0.3433074951171875, 0.363250732421875, 0.3831939697265625, 0.40313720703125, 0.4230804443359375, 0.443023681640625, 0.4629669189453125, 0.48291015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 10.0, 6.0, 13.0, 13.0, 12.0, 26.0, 27.0, 55.0, 61.0, 71.0, 115.0, 186.0, 236.0, 489.0, 957.0, 2785.0, 10662.0, 73824.0, 3807163.0, 268394.0, 21614.0, 4557.0, 1399.0, 612.0, 344.0, 198.0, 111.0, 92.0, 68.0, 39.0, 33.0, 35.0, 14.0, 17.0, 9.0, 6.0, 12.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.11004638671875, -5.9232177734375, -5.73638916015625, -5.549560546875, -5.36273193359375, -5.1759033203125, -4.98907470703125, -4.80224609375, -4.61541748046875, -4.4285888671875, -4.24176025390625, -4.054931640625, -3.86810302734375, -3.6812744140625, -3.49444580078125, -3.3076171875, -3.12078857421875, -2.9339599609375, -2.74713134765625, -2.560302734375, -2.37347412109375, -2.1866455078125, -1.99981689453125, -1.81298828125, -1.62615966796875, -1.4393310546875, -1.25250244140625, -1.065673828125, -0.87884521484375, -0.6920166015625, -0.50518798828125, -0.318359375, -0.13153076171875, 0.0552978515625, 0.24212646484375, 0.428955078125, 0.61578369140625, 0.8026123046875, 0.98944091796875, 1.17626953125, 1.36309814453125, 1.5499267578125, 1.73675537109375, 1.923583984375, 2.11041259765625, 2.2972412109375, 2.48406982421875, 2.6708984375, 2.85772705078125, 3.0445556640625, 3.23138427734375, 3.418212890625, 3.60504150390625, 3.7918701171875, 3.97869873046875, 4.16552734375, 4.35235595703125, 4.5391845703125, 4.72601318359375, 4.912841796875, 5.09967041015625, 5.2864990234375, 5.47332763671875, 5.66015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 7.0, 5.0, 11.0, 17.0, 24.0, 32.0, 49.0, 135.0, 271.0, 903.0, 1891.0, 350.0, 158.0, 74.0, 41.0, 26.0, 27.0, 18.0, 11.0, 10.0, 6.0, 5.0, 1.0, 4.0, 2.0], "bins": [-2.365234375, -2.3171463012695312, -2.2690582275390625, -2.2209701538085938, -2.172882080078125, -2.1247940063476562, -2.0767059326171875, -2.0286178588867188, -1.98052978515625, -1.9324417114257812, -1.8843536376953125, -1.8362655639648438, -1.788177490234375, -1.7400894165039062, -1.6920013427734375, -1.6439132690429688, -1.5958251953125, -1.5477371215820312, -1.4996490478515625, -1.4515609741210938, -1.403472900390625, -1.3553848266601562, -1.3072967529296875, -1.2592086791992188, -1.21112060546875, -1.1630325317382812, -1.1149444580078125, -1.0668563842773438, -1.018768310546875, -0.9706802368164062, -0.9225921630859375, -0.8745040893554688, -0.826416015625, -0.7783279418945312, -0.7302398681640625, -0.6821517944335938, -0.634063720703125, -0.5859756469726562, -0.5378875732421875, -0.48979949951171875, -0.44171142578125, -0.39362335205078125, -0.3455352783203125, -0.29744720458984375, -0.249359130859375, -0.20127105712890625, -0.1531829833984375, -0.10509490966796875, -0.0570068359375, -0.00891876220703125, 0.0391693115234375, 0.08725738525390625, 0.135345458984375, 0.18343353271484375, 0.2315216064453125, 0.27960968017578125, 0.32769775390625, 0.37578582763671875, 0.4238739013671875, 0.47196197509765625, 0.520050048828125, 0.5681381225585938, 0.6162261962890625, 0.6643142700195312, 0.71240234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 16.0, 23.0, 69.0, 83.0, 164.0, 194.0, 168.0, 119.0, 63.0, 30.0, 25.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.199235916137695, -9.905003547668457, -9.610770225524902, -9.316537857055664, -9.022305488586426, -8.728072166442871, -8.433839797973633, -8.139606475830078, -7.84537410736084, -7.551141262054443, -7.256908893585205, -6.962676048278809, -6.668443202972412, -6.374210357666016, -6.079977989196777, -5.785745143890381, -5.491512775421143, -5.197279930114746, -4.903047561645508, -4.608814716339111, -4.314581871032715, -4.020349502563477, -3.72611665725708, -3.4318838119506836, -3.137651205062866, -2.843418598175049, -2.5491857528686523, -2.254953145980835, -1.960720419883728, -1.666487693786621, -1.3722550868988037, -1.0780222415924072, -0.7837896347045898, -0.4895569384098053, -0.19532424211502075, 0.0989084243774414, 0.39314115047454834, 0.6873738765716553, 0.9816064834594727, 1.2758393287658691, 1.5700719356536865, 1.8643046617507935, 2.1585373878479004, 2.4527699947357178, 2.747002601623535, 3.0412354469299316, 3.335468053817749, 3.6297008991241455, 3.923933506011963, 4.218166351318359, 4.512398719787598, 4.806631565093994, 5.100864410400391, 5.395096778869629, 5.689329624176025, 5.983562469482422, 6.27779483795166, 6.572027683258057, 6.866260051727295, 7.160492897033691, 7.454725742340088, 7.748958587646484, 8.043190956115723, 8.337423324584961, 8.631656646728516]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 21.0, 22.0, 32.0, 32.0, 43.0, 53.0, 54.0, 57.0, 58.0, 65.0, 73.0, 67.0, 65.0, 82.0, 73.0, 38.0, 34.0, 25.0, 24.0, 24.0, 16.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.457943916320801, -5.303596019744873, -5.149248123168945, -4.994900226593018, -4.84055233001709, -4.68620491027832, -4.531857013702393, -4.377509117126465, -4.223161220550537, -4.068813323974609, -3.9144654273986816, -3.760117769241333, -3.6057698726654053, -3.4514219760894775, -3.297074317932129, -3.142726421356201, -2.9883785247802734, -2.8340306282043457, -2.679682731628418, -2.5253350734710693, -2.3709871768951416, -2.216639280319214, -2.0622916221618652, -1.9079437255859375, -1.7535958290100098, -1.599247932434082, -1.4449001550674438, -1.2905523777008057, -1.136204481124878, -0.981856644153595, -0.827508807182312, -0.6731610298156738, -0.5188136100769043, -0.36446577310562134, -0.21011793613433838, -0.05577009916305542, 0.09857773780822754, 0.2529255747795105, 0.40727341175079346, 0.5616211891174316, 0.7159690856933594, 0.8703169226646423, 1.0246647596359253, 1.1790125370025635, 1.3333604335784912, 1.487708330154419, 1.6420561075210571, 1.7964038848876953, 1.950751781463623, 2.105099678039551, 2.2594475746154785, 2.413795232772827, 2.568143129348755, 2.7224910259246826, 2.8768386840820312, 3.031186580657959, 3.1855344772338867, 3.3398823738098145, 3.494230270385742, 3.648577928543091, 3.8029258251190186, 3.9572737216949463, 4.111621379852295, 4.265969276428223, 4.42031717300415]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 20.0, 30.0, 52.0, 65.0, 84.0, 112.0, 177.0, 290.0, 420.0, 764.0, 1410.0, 2683.0, 5984.0, 16258.0, 50038.0, 174750.0, 453084.0, 237980.0, 68496.0, 20990.0, 7628.0, 3247.0, 1637.0, 872.0, 462.0, 305.0, 206.0, 122.0, 86.0, 63.0, 62.0, 30.0, 25.0, 19.0, 13.0, 11.0, 10.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.490447998046875, -2.39691162109375, -2.303375244140625, -2.2098388671875, -2.116302490234375, -2.02276611328125, -1.929229736328125, -1.835693359375, -1.742156982421875, -1.64862060546875, -1.555084228515625, -1.4615478515625, -1.368011474609375, -1.27447509765625, -1.180938720703125, -1.08740234375, -0.993865966796875, -0.90032958984375, -0.806793212890625, -0.7132568359375, -0.619720458984375, -0.52618408203125, -0.432647705078125, -0.339111328125, -0.245574951171875, -0.15203857421875, -0.058502197265625, 0.0350341796875, 0.128570556640625, 0.22210693359375, 0.315643310546875, 0.4091796875, 0.502716064453125, 0.59625244140625, 0.689788818359375, 0.7833251953125, 0.876861572265625, 0.97039794921875, 1.063934326171875, 1.157470703125, 1.251007080078125, 1.34454345703125, 1.438079833984375, 1.5316162109375, 1.625152587890625, 1.71868896484375, 1.812225341796875, 1.90576171875, 1.999298095703125, 2.09283447265625, 2.186370849609375, 2.2799072265625, 2.373443603515625, 2.46697998046875, 2.560516357421875, 2.654052734375, 2.747589111328125, 2.84112548828125, 2.934661865234375, 3.0281982421875, 3.121734619140625, 3.21527099609375, 3.308807373046875, 3.40234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 13.0, 23.0, 15.0, 43.0, 38.0, 59.0, 74.0, 73.0, 72.0, 63.0, 74.0, 72.0, 67.0, 55.0, 58.0, 35.0, 47.0, 24.0, 27.0, 14.0, 10.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7669601440429688, -0.7463226318359375, -0.7256851196289062, -0.705047607421875, -0.6844100952148438, -0.6637725830078125, -0.6431350708007812, -0.62249755859375, -0.6018600463867188, -0.5812225341796875, -0.5605850219726562, -0.539947509765625, -0.5193099975585938, -0.4986724853515625, -0.47803497314453125, -0.4573974609375, -0.43675994873046875, -0.4161224365234375, -0.39548492431640625, -0.374847412109375, -0.35420989990234375, -0.3335723876953125, -0.31293487548828125, -0.29229736328125, -0.27165985107421875, -0.2510223388671875, -0.23038482666015625, -0.209747314453125, -0.18910980224609375, -0.1684722900390625, -0.14783477783203125, -0.127197265625, -0.10655975341796875, -0.0859222412109375, -0.06528472900390625, -0.044647216796875, -0.02400970458984375, -0.0033721923828125, 0.01726531982421875, 0.03790283203125, 0.05854034423828125, 0.0791778564453125, 0.09981536865234375, 0.120452880859375, 0.14109039306640625, 0.1617279052734375, 0.18236541748046875, 0.2030029296875, 0.22364044189453125, 0.2442779541015625, 0.26491546630859375, 0.285552978515625, 0.30619049072265625, 0.3268280029296875, 0.34746551513671875, 0.36810302734375, 0.38874053955078125, 0.4093780517578125, 0.43001556396484375, 0.450653076171875, 0.47129058837890625, 0.4919281005859375, 0.5125656127929688, 0.533203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 5.0, 14.0, 13.0, 14.0, 22.0, 21.0, 40.0, 64.0, 62.0, 98.0, 150.0, 217.0, 359.0, 665.0, 1403.0, 4481.0, 19836.0, 118342.0, 555544.0, 285341.0, 48058.0, 9083.0, 2390.0, 968.0, 472.0, 240.0, 201.0, 110.0, 84.0, 66.0, 41.0, 36.0, 25.0, 16.0, 13.0, 9.0, 7.0, 11.0, 5.0, 7.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.20703125, -3.109100341796875, -3.01116943359375, -2.913238525390625, -2.8153076171875, -2.717376708984375, -2.61944580078125, -2.521514892578125, -2.423583984375, -2.325653076171875, -2.22772216796875, -2.129791259765625, -2.0318603515625, -1.933929443359375, -1.83599853515625, -1.738067626953125, -1.64013671875, -1.542205810546875, -1.44427490234375, -1.346343994140625, -1.2484130859375, -1.150482177734375, -1.05255126953125, -0.954620361328125, -0.856689453125, -0.758758544921875, -0.66082763671875, -0.562896728515625, -0.4649658203125, -0.367034912109375, -0.26910400390625, -0.171173095703125, -0.0732421875, 0.024688720703125, 0.12261962890625, 0.220550537109375, 0.3184814453125, 0.416412353515625, 0.51434326171875, 0.612274169921875, 0.710205078125, 0.808135986328125, 0.90606689453125, 1.003997802734375, 1.1019287109375, 1.199859619140625, 1.29779052734375, 1.395721435546875, 1.49365234375, 1.591583251953125, 1.68951416015625, 1.787445068359375, 1.8853759765625, 1.983306884765625, 2.08123779296875, 2.179168701171875, 2.277099609375, 2.375030517578125, 2.47296142578125, 2.570892333984375, 2.6688232421875, 2.766754150390625, 2.86468505859375, 2.962615966796875, 3.060546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 7.0, 11.0, 21.0, 26.0, 26.0, 40.0, 38.0, 42.0, 28.0, 55.0, 42.0, 50.0, 43.0, 46.0, 39.0, 39.0, 55.0, 50.0, 43.0, 53.0, 36.0, 27.0, 36.0, 21.0, 29.0, 12.0, 10.0, 8.0, 9.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8447265625, -1.7843475341796875, -1.723968505859375, -1.6635894775390625, -1.60321044921875, -1.5428314208984375, -1.482452392578125, -1.4220733642578125, -1.3616943359375, -1.3013153076171875, -1.240936279296875, -1.1805572509765625, -1.12017822265625, -1.0597991943359375, -0.999420166015625, -0.9390411376953125, -0.878662109375, -0.8182830810546875, -0.757904052734375, -0.6975250244140625, -0.63714599609375, -0.5767669677734375, -0.516387939453125, -0.4560089111328125, -0.3956298828125, -0.3352508544921875, -0.274871826171875, -0.2144927978515625, -0.15411376953125, -0.0937347412109375, -0.033355712890625, 0.0270233154296875, 0.08740234375, 0.1477813720703125, 0.208160400390625, 0.2685394287109375, 0.32891845703125, 0.3892974853515625, 0.449676513671875, 0.5100555419921875, 0.5704345703125, 0.6308135986328125, 0.691192626953125, 0.7515716552734375, 0.81195068359375, 0.8723297119140625, 0.932708740234375, 0.9930877685546875, 1.053466796875, 1.1138458251953125, 1.174224853515625, 1.2346038818359375, 1.29498291015625, 1.3553619384765625, 1.415740966796875, 1.4761199951171875, 1.5364990234375, 1.5968780517578125, 1.657257080078125, 1.7176361083984375, 1.77801513671875, 1.8383941650390625, 1.898773193359375, 1.9591522216796875, 2.01953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 10.0, 9.0, 18.0, 16.0, 22.0, 42.0, 55.0, 85.0, 159.0, 223.0, 392.0, 749.0, 1358.0, 2904.0, 6411.0, 16392.0, 49720.0, 189400.0, 582903.0, 136117.0, 37934.0, 13161.0, 5344.0, 2342.0, 1248.0, 623.0, 349.0, 202.0, 129.0, 70.0, 48.0, 35.0, 23.0, 12.0, 14.0, 9.0, 7.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.599609375, -1.5556488037109375, -1.511688232421875, -1.4677276611328125, -1.42376708984375, -1.3798065185546875, -1.335845947265625, -1.2918853759765625, -1.2479248046875, -1.2039642333984375, -1.160003662109375, -1.1160430908203125, -1.07208251953125, -1.0281219482421875, -0.984161376953125, -0.9402008056640625, -0.896240234375, -0.8522796630859375, -0.808319091796875, -0.7643585205078125, -0.72039794921875, -0.6764373779296875, -0.632476806640625, -0.5885162353515625, -0.5445556640625, -0.5005950927734375, -0.456634521484375, -0.4126739501953125, -0.36871337890625, -0.3247528076171875, -0.280792236328125, -0.2368316650390625, -0.19287109375, -0.1489105224609375, -0.104949951171875, -0.0609893798828125, -0.01702880859375, 0.0269317626953125, 0.070892333984375, 0.1148529052734375, 0.1588134765625, 0.2027740478515625, 0.246734619140625, 0.2906951904296875, 0.33465576171875, 0.3786163330078125, 0.422576904296875, 0.4665374755859375, 0.510498046875, 0.5544586181640625, 0.598419189453125, 0.6423797607421875, 0.68634033203125, 0.7303009033203125, 0.774261474609375, 0.8182220458984375, 0.8621826171875, 0.9061431884765625, 0.950103759765625, 0.9940643310546875, 1.03802490234375, 1.0819854736328125, 1.125946044921875, 1.1699066162109375, 1.2138671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 1.0, 4.0, 7.0, 7.0, 8.0, 6.0, 21.0, 10.0, 32.0, 21.0, 27.0, 31.0, 43.0, 45.0, 85.0, 119.0, 141.0, 74.0, 80.0, 40.0, 34.0, 38.0, 24.0, 26.0, 20.0, 14.0, 13.0, 4.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021791458129882812, -0.00021151266992092133, -0.00020511075854301453, -0.00019870884716510773, -0.00019230693578720093, -0.00018590502440929413, -0.00017950311303138733, -0.00017310120165348053, -0.00016669929027557373, -0.00016029737889766693, -0.00015389546751976013, -0.00014749355614185333, -0.00014109164476394653, -0.00013468973338603973, -0.00012828782200813293, -0.00012188591063022614, -0.00011548399925231934, -0.00010908208787441254, -0.00010268017649650574, -9.627826511859894e-05, -8.987635374069214e-05, -8.347444236278534e-05, -7.707253098487854e-05, -7.067061960697174e-05, -6.426870822906494e-05, -5.786679685115814e-05, -5.146488547325134e-05, -4.5062974095344543e-05, -3.8661062717437744e-05, -3.2259151339530945e-05, -2.5857239961624146e-05, -1.9455328583717346e-05, -1.3053417205810547e-05, -6.6515058279037476e-06, -2.4959444999694824e-07, 6.152316927909851e-06, 1.255422830581665e-05, 1.895613968372345e-05, 2.535805106163025e-05, 3.175996243953705e-05, 3.816187381744385e-05, 4.456378519535065e-05, 5.0965696573257446e-05, 5.7367607951164246e-05, 6.376951932907104e-05, 7.017143070697784e-05, 7.657334208488464e-05, 8.297525346279144e-05, 8.937716484069824e-05, 9.577907621860504e-05, 0.00010218098759651184, 0.00010858289897441864, 0.00011498481035232544, 0.00012138672173023224, 0.00012778863310813904, 0.00013419054448604584, 0.00014059245586395264, 0.00014699436724185944, 0.00015339627861976624, 0.00015979818999767303, 0.00016620010137557983, 0.00017260201275348663, 0.00017900392413139343, 0.00018540583550930023, 0.00019180774688720703]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 5.0, 6.0, 7.0, 13.0, 15.0, 22.0, 51.0, 70.0, 124.0, 236.0, 376.0, 913.0, 2495.0, 10201.0, 82717.0, 820827.0, 113016.0, 12574.0, 2951.0, 935.0, 447.0, 225.0, 106.0, 67.0, 51.0, 36.0, 9.0, 16.0, 10.0, 8.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.182952880859375, -3.07879638671875, -2.974639892578125, -2.8704833984375, -2.766326904296875, -2.66217041015625, -2.558013916015625, -2.453857421875, -2.349700927734375, -2.24554443359375, -2.141387939453125, -2.0372314453125, -1.933074951171875, -1.82891845703125, -1.724761962890625, -1.62060546875, -1.516448974609375, -1.41229248046875, -1.308135986328125, -1.2039794921875, -1.099822998046875, -0.99566650390625, -0.891510009765625, -0.787353515625, -0.683197021484375, -0.57904052734375, -0.474884033203125, -0.3707275390625, -0.266571044921875, -0.16241455078125, -0.058258056640625, 0.0458984375, 0.150054931640625, 0.25421142578125, 0.358367919921875, 0.4625244140625, 0.566680908203125, 0.67083740234375, 0.774993896484375, 0.879150390625, 0.983306884765625, 1.08746337890625, 1.191619873046875, 1.2957763671875, 1.399932861328125, 1.50408935546875, 1.608245849609375, 1.71240234375, 1.816558837890625, 1.92071533203125, 2.024871826171875, 2.1290283203125, 2.233184814453125, 2.33734130859375, 2.441497802734375, 2.545654296875, 2.649810791015625, 2.75396728515625, 2.858123779296875, 2.9622802734375, 3.066436767578125, 3.17059326171875, 3.274749755859375, 3.37890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 9.0, 9.0, 12.0, 17.0, 17.0, 11.0, 39.0, 33.0, 57.0, 90.0, 168.0, 169.0, 107.0, 68.0, 51.0, 37.0, 18.0, 21.0, 15.0, 11.0, 9.0, 8.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.5775299072265625, -2.516387939453125, -2.4552459716796875, -2.39410400390625, -2.3329620361328125, -2.271820068359375, -2.2106781005859375, -2.1495361328125, -2.0883941650390625, -2.027252197265625, -1.9661102294921875, -1.90496826171875, -1.8438262939453125, -1.782684326171875, -1.7215423583984375, -1.660400390625, -1.5992584228515625, -1.538116455078125, -1.4769744873046875, -1.41583251953125, -1.3546905517578125, -1.293548583984375, -1.2324066162109375, -1.1712646484375, -1.1101226806640625, -1.048980712890625, -0.9878387451171875, -0.92669677734375, -0.8655548095703125, -0.804412841796875, -0.7432708740234375, -0.68212890625, -0.6209869384765625, -0.559844970703125, -0.4987030029296875, -0.43756103515625, -0.3764190673828125, -0.315277099609375, -0.2541351318359375, -0.1929931640625, -0.1318511962890625, -0.070709228515625, -0.0095672607421875, 0.05157470703125, 0.1127166748046875, 0.173858642578125, 0.2350006103515625, 0.296142578125, 0.3572845458984375, 0.418426513671875, 0.4795684814453125, 0.54071044921875, 0.6018524169921875, 0.662994384765625, 0.7241363525390625, 0.7852783203125, 0.8464202880859375, 0.907562255859375, 0.9687042236328125, 1.02984619140625, 1.0909881591796875, 1.152130126953125, 1.2132720947265625, 1.2744140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 11.0, 25.0, 43.0, 94.0, 203.0, 232.0, 180.0, 123.0, 59.0, 20.0, 8.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.7812557220459, -15.626142501831055, -14.471028327941895, -13.315914154052734, -12.16080093383789, -11.005687713623047, -9.850573539733887, -8.695459365844727, -7.540346145629883, -6.385232448577881, -5.230118751525879, -4.075005054473877, -2.919891357421875, -1.764777660369873, -0.6096639633178711, 0.5454502105712891, 1.7005634307861328, 2.8556771278381348, 4.010790824890137, 5.165904521942139, 6.321018218994141, 7.476131916046143, 8.631245613098145, 9.786359786987305, 10.941473007202148, 12.096586227416992, 13.251700401306152, 14.406814575195312, 15.561927795410156, 16.717041015625, 17.872154235839844, 19.02726936340332, 20.182384490966797, 21.33749771118164, 22.492610931396484, 23.64772605895996, 24.802839279174805, 25.95795249938965, 27.113067626953125, 28.26818084716797, 29.423294067382812, 30.578407287597656, 31.7335205078125, 32.888633728027344, 34.04374694824219, 35.1988639831543, 36.35397720336914, 37.509090423583984, 38.66420364379883, 39.81931686401367, 40.974430084228516, 42.12954330444336, 43.28466033935547, 44.43977355957031, 45.594886779785156, 46.75, 47.905113220214844, 49.06022644042969, 50.21533966064453, 51.370452880859375, 52.52556610107422, 53.68068313598633, 54.83579635620117, 55.990909576416016, 57.14602279663086]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 6.0, 12.0, 13.0, 15.0, 16.0, 19.0, 20.0, 20.0, 31.0, 30.0, 27.0, 31.0, 41.0, 34.0, 34.0, 47.0, 47.0, 46.0, 40.0, 38.0, 40.0, 49.0, 32.0, 28.0, 41.0, 36.0, 28.0, 30.0, 20.0, 18.0, 12.0, 19.0, 16.0, 12.0, 13.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.910199165344238, -7.616495609283447, -7.322792053222656, -7.029088973999023, -6.735385417938232, -6.441681861877441, -6.147978782653809, -5.854275226593018, -5.560571670532227, -5.2668681144714355, -4.9731645584106445, -4.679461479187012, -4.385757923126221, -4.09205436706543, -3.7983510494232178, -3.504647731781006, -3.210944175720215, -2.917240619659424, -2.623537302017212, -2.329833984375, -2.036130428314209, -1.7424269914627075, -1.448723554611206, -1.1550202369689941, -0.8613166809082031, -0.5676132440567017, -0.2739098072052002, 0.01979362964630127, 0.31349706649780273, 0.6072005033493042, 0.9009039402008057, 1.1946072578430176, 1.488311767578125, 1.7820152044296265, 2.075718641281128, 2.36942195892334, 2.663125514984131, 2.956829071044922, 3.250532388687134, 3.5442357063293457, 3.8379392623901367, 4.131642818450928, 4.425346374511719, 4.719049453735352, 5.012753009796143, 5.306456565856934, 5.600159645080566, 5.893863201141357, 6.187566757202148, 6.4812703132629395, 6.7749738693237305, 7.068676948547363, 7.362380504608154, 7.656084060668945, 7.949787139892578, 8.243490219116211, 8.53719425201416, 8.830897331237793, 9.124601364135742, 9.418304443359375, 9.712007522583008, 10.005711555480957, 10.29941463470459, 10.593118667602539, 10.886821746826172]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 9.0, 4.0, 13.0, 7.0, 25.0, 15.0, 25.0, 50.0, 64.0, 86.0, 127.0, 199.0, 310.0, 558.0, 1049.0, 2350.0, 6409.0, 24992.0, 271522.0, 3765249.0, 97414.0, 15068.0, 4665.0, 1879.0, 880.0, 480.0, 287.0, 168.0, 127.0, 66.0, 40.0, 36.0, 21.0, 18.0, 18.0, 8.0, 7.0, 6.0, 0.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2147216796875, -6.038818359375, -5.8629150390625, -5.68701171875, -5.5111083984375, -5.335205078125, -5.1593017578125, -4.9833984375, -4.8074951171875, -4.631591796875, -4.4556884765625, -4.27978515625, -4.1038818359375, -3.927978515625, -3.7520751953125, -3.576171875, -3.4002685546875, -3.224365234375, -3.0484619140625, -2.87255859375, -2.6966552734375, -2.520751953125, -2.3448486328125, -2.1689453125, -1.9930419921875, -1.817138671875, -1.6412353515625, -1.46533203125, -1.2894287109375, -1.113525390625, -0.9376220703125, -0.76171875, -0.5858154296875, -0.409912109375, -0.2340087890625, -0.05810546875, 0.1177978515625, 0.293701171875, 0.4696044921875, 0.6455078125, 0.8214111328125, 0.997314453125, 1.1732177734375, 1.34912109375, 1.5250244140625, 1.700927734375, 1.8768310546875, 2.052734375, 2.2286376953125, 2.404541015625, 2.5804443359375, 2.75634765625, 2.9322509765625, 3.108154296875, 3.2840576171875, 3.4599609375, 3.6358642578125, 3.811767578125, 3.9876708984375, 4.16357421875, 4.3394775390625, 4.515380859375, 4.6912841796875, 4.8671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 17.0, 14.0, 20.0, 20.0, 39.0, 36.0, 53.0, 58.0, 62.0, 63.0, 69.0, 82.0, 64.0, 69.0, 65.0, 56.0, 51.0, 29.0, 31.0, 21.0, 26.0, 14.0, 10.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.798828125, -0.7780838012695312, -0.7573394775390625, -0.7365951538085938, -0.715850830078125, -0.6951065063476562, -0.6743621826171875, -0.6536178588867188, -0.63287353515625, -0.6121292114257812, -0.5913848876953125, -0.5706405639648438, -0.549896240234375, -0.5291519165039062, -0.5084075927734375, -0.48766326904296875, -0.4669189453125, -0.44617462158203125, -0.4254302978515625, -0.40468597412109375, -0.383941650390625, -0.36319732666015625, -0.3424530029296875, -0.32170867919921875, -0.30096435546875, -0.28022003173828125, -0.2594757080078125, -0.23873138427734375, -0.217987060546875, -0.19724273681640625, -0.1764984130859375, -0.15575408935546875, -0.135009765625, -0.11426544189453125, -0.0935211181640625, -0.07277679443359375, -0.052032470703125, -0.03128814697265625, -0.0105438232421875, 0.01020050048828125, 0.03094482421875, 0.05168914794921875, 0.0724334716796875, 0.09317779541015625, 0.113922119140625, 0.13466644287109375, 0.1554107666015625, 0.17615509033203125, 0.1968994140625, 0.21764373779296875, 0.2383880615234375, 0.25913238525390625, 0.279876708984375, 0.30062103271484375, 0.3213653564453125, 0.34210968017578125, 0.36285400390625, 0.38359832763671875, 0.4043426513671875, 0.42508697509765625, 0.445831298828125, 0.46657562255859375, 0.4873199462890625, 0.5080642700195312, 0.52880859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 15.0, 20.0, 26.0, 26.0, 53.0, 70.0, 99.0, 171.0, 285.0, 413.0, 813.0, 1656.0, 3428.0, 7868.0, 20878.0, 75520.0, 702115.0, 3166686.0, 159211.0, 33724.0, 11509.0, 4817.0, 2280.0, 1086.0, 597.0, 334.0, 213.0, 119.0, 91.0, 38.0, 37.0, 25.0, 11.0, 9.0, 10.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.142578125, -3.045013427734375, -2.94744873046875, -2.849884033203125, -2.7523193359375, -2.654754638671875, -2.55718994140625, -2.459625244140625, -2.362060546875, -2.264495849609375, -2.16693115234375, -2.069366455078125, -1.9718017578125, -1.874237060546875, -1.77667236328125, -1.679107666015625, -1.58154296875, -1.483978271484375, -1.38641357421875, -1.288848876953125, -1.1912841796875, -1.093719482421875, -0.99615478515625, -0.898590087890625, -0.801025390625, -0.703460693359375, -0.60589599609375, -0.508331298828125, -0.4107666015625, -0.313201904296875, -0.21563720703125, -0.118072509765625, -0.0205078125, 0.077056884765625, 0.17462158203125, 0.272186279296875, 0.3697509765625, 0.467315673828125, 0.56488037109375, 0.662445068359375, 0.760009765625, 0.857574462890625, 0.95513916015625, 1.052703857421875, 1.1502685546875, 1.247833251953125, 1.34539794921875, 1.442962646484375, 1.54052734375, 1.638092041015625, 1.73565673828125, 1.833221435546875, 1.9307861328125, 2.028350830078125, 2.12591552734375, 2.223480224609375, 2.321044921875, 2.418609619140625, 2.51617431640625, 2.613739013671875, 2.7113037109375, 2.808868408203125, 2.90643310546875, 3.003997802734375, 3.1015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 13.0, 9.0, 18.0, 19.0, 44.0, 43.0, 107.0, 175.0, 414.0, 1100.0, 1316.0, 350.0, 177.0, 83.0, 59.0, 38.0, 27.0, 16.0, 14.0, 5.0, 10.0, 4.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.2677459716796875, -1.217132568359375, -1.1665191650390625, -1.11590576171875, -1.0652923583984375, -1.014678955078125, -0.9640655517578125, -0.9134521484375, -0.8628387451171875, -0.812225341796875, -0.7616119384765625, -0.71099853515625, -0.6603851318359375, -0.609771728515625, -0.5591583251953125, -0.508544921875, -0.4579315185546875, -0.407318115234375, -0.3567047119140625, -0.30609130859375, -0.2554779052734375, -0.204864501953125, -0.1542510986328125, -0.1036376953125, -0.0530242919921875, -0.002410888671875, 0.0482025146484375, 0.09881591796875, 0.1494293212890625, 0.200042724609375, 0.2506561279296875, 0.30126953125, 0.3518829345703125, 0.402496337890625, 0.4531097412109375, 0.50372314453125, 0.5543365478515625, 0.604949951171875, 0.6555633544921875, 0.7061767578125, 0.7567901611328125, 0.807403564453125, 0.8580169677734375, 0.90863037109375, 0.9592437744140625, 1.009857177734375, 1.0604705810546875, 1.111083984375, 1.1616973876953125, 1.212310791015625, 1.2629241943359375, 1.31353759765625, 1.3641510009765625, 1.414764404296875, 1.4653778076171875, 1.5159912109375, 1.5666046142578125, 1.617218017578125, 1.6678314208984375, 1.71844482421875, 1.7690582275390625, 1.819671630859375, 1.8702850341796875, 1.9208984375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 8.0, 18.0, 34.0, 50.0, 85.0, 147.0, 192.0, 179.0, 129.0, 75.0, 31.0, 21.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.364502906799316, -13.94583797454834, -13.527173042297363, -13.10850715637207, -12.689842224121094, -12.271177291870117, -11.85251235961914, -11.433847427368164, -11.015182495117188, -10.596517562866211, -10.177852630615234, -9.759187698364258, -9.340521812438965, -8.921856880187988, -8.503191947937012, -8.084527015686035, -7.6658616065979, -7.247196674346924, -6.828531265258789, -6.4098663330078125, -5.991201400756836, -5.572536468505859, -5.153871059417725, -4.735206127166748, -4.316540718078613, -3.8978755474090576, -3.479210615158081, -3.0605454444885254, -2.641880512237549, -2.223215341567993, -1.8045501708984375, -1.385885238647461, -0.9672203063964844, -0.5485552549362183, -0.12989014387130737, 0.2887749671936035, 0.7074400186538696, 1.1261050701141357, 1.5447702407836914, 1.963435173034668, 2.3821003437042236, 2.8007655143737793, 3.219430446624756, 3.6380956172943115, 4.056760787963867, 4.475425720214844, 4.89409065246582, 5.312755584716797, 5.731420993804932, 6.150085926055908, 6.568751335144043, 6.9874162673950195, 7.406081199645996, 7.824746131896973, 8.243412017822266, 8.662076950073242, 9.080741882324219, 9.499406814575195, 9.918071746826172, 10.336736679077148, 10.755402565002441, 11.174067497253418, 11.592732429504395, 12.011397361755371, 12.430062294006348]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 16.0, 13.0, 11.0, 20.0, 19.0, 35.0, 26.0, 26.0, 46.0, 43.0, 45.0, 40.0, 44.0, 57.0, 43.0, 48.0, 55.0, 47.0, 50.0, 35.0, 40.0, 27.0, 28.0, 34.0, 23.0, 20.0, 14.0, 18.0, 11.0, 10.0, 6.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.550609588623047, -4.380953311920166, -4.211296558380127, -4.041640281677246, -3.8719840049743652, -3.7023274898529053, -3.5326709747314453, -3.3630146980285645, -3.1933581829071045, -3.0237016677856445, -2.8540453910827637, -2.6843888759613037, -2.5147323608398438, -2.345076084136963, -2.175419569015503, -2.005763053894043, -1.836106777191162, -1.6664503812789917, -1.4967939853668213, -1.3271374702453613, -1.157481074333191, -0.9878246784210205, -0.8181681632995605, -0.6485117673873901, -0.4788553714752197, -0.30919894576072693, -0.13954252004623413, 0.030113935470581055, 0.19977033138275146, 0.3694267272949219, 0.5390832424163818, 0.7087396383285522, 0.8783965110778809, 1.0480529069900513, 1.2177093029022217, 1.3873658180236816, 1.557022213935852, 1.7266786098480225, 1.8963351249694824, 2.0659914016723633, 2.2356479167938232, 2.405304431915283, 2.574960708618164, 2.744617223739624, 2.914273738861084, 3.083930015563965, 3.253586530685425, 3.4232430458068848, 3.5928993225097656, 3.7625558376312256, 3.9322121143341064, 4.101868629455566, 4.271524906158447, 4.441181182861328, 4.610837936401367, 4.780494213104248, 4.950150489807129, 5.11980676651001, 5.289463520050049, 5.45911979675293, 5.6287760734558105, 5.798432350158691, 5.9680891036987305, 6.137745380401611, 6.30740213394165]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 13.0, 19.0, 25.0, 36.0, 61.0, 113.0, 145.0, 257.0, 427.0, 633.0, 1318.0, 2589.0, 6035.0, 15409.0, 44064.0, 134306.0, 314559.0, 318191.0, 137023.0, 45836.0, 15618.0, 6142.0, 2633.0, 1283.0, 716.0, 392.0, 236.0, 147.0, 86.0, 61.0, 46.0, 40.0, 22.0, 16.0, 11.0, 5.0, 6.0, 4.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.666015625, -2.582733154296875, -2.49945068359375, -2.416168212890625, -2.3328857421875, -2.249603271484375, -2.16632080078125, -2.083038330078125, -1.999755859375, -1.916473388671875, -1.83319091796875, -1.749908447265625, -1.6666259765625, -1.583343505859375, -1.50006103515625, -1.416778564453125, -1.33349609375, -1.250213623046875, -1.16693115234375, -1.083648681640625, -1.0003662109375, -0.917083740234375, -0.83380126953125, -0.750518798828125, -0.667236328125, -0.583953857421875, -0.50067138671875, -0.417388916015625, -0.3341064453125, -0.250823974609375, -0.16754150390625, -0.084259033203125, -0.0009765625, 0.082305908203125, 0.16558837890625, 0.248870849609375, 0.3321533203125, 0.415435791015625, 0.49871826171875, 0.582000732421875, 0.665283203125, 0.748565673828125, 0.83184814453125, 0.915130615234375, 0.9984130859375, 1.081695556640625, 1.16497802734375, 1.248260498046875, 1.33154296875, 1.414825439453125, 1.49810791015625, 1.581390380859375, 1.6646728515625, 1.747955322265625, 1.83123779296875, 1.914520263671875, 1.997802734375, 2.081085205078125, 2.16436767578125, 2.247650146484375, 2.3309326171875, 2.414215087890625, 2.49749755859375, 2.580780029296875, 2.6640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 17.0, 14.0, 15.0, 33.0, 42.0, 35.0, 43.0, 62.0, 66.0, 68.0, 76.0, 60.0, 67.0, 67.0, 56.0, 50.0, 48.0, 36.0, 34.0, 20.0, 16.0, 17.0, 13.0, 8.0, 9.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.900390625, -0.8780746459960938, -0.8557586669921875, -0.8334426879882812, -0.811126708984375, -0.7888107299804688, -0.7664947509765625, -0.7441787719726562, -0.72186279296875, -0.6995468139648438, -0.6772308349609375, -0.6549148559570312, -0.632598876953125, -0.6102828979492188, -0.5879669189453125, -0.5656509399414062, -0.5433349609375, -0.5210189819335938, -0.4987030029296875, -0.47638702392578125, -0.454071044921875, -0.43175506591796875, -0.4094390869140625, -0.38712310791015625, -0.36480712890625, -0.34249114990234375, -0.3201751708984375, -0.29785919189453125, -0.275543212890625, -0.25322723388671875, -0.2309112548828125, -0.20859527587890625, -0.186279296875, -0.16396331787109375, -0.1416473388671875, -0.11933135986328125, -0.097015380859375, -0.07469940185546875, -0.0523834228515625, -0.03006744384765625, -0.00775146484375, 0.01456451416015625, 0.0368804931640625, 0.05919647216796875, 0.081512451171875, 0.10382843017578125, 0.1261444091796875, 0.14846038818359375, 0.1707763671875, 0.19309234619140625, 0.2154083251953125, 0.23772430419921875, 0.260040283203125, 0.28235626220703125, 0.3046722412109375, 0.32698822021484375, 0.34930419921875, 0.37162017822265625, 0.3939361572265625, 0.41625213623046875, 0.438568115234375, 0.46088409423828125, 0.4832000732421875, 0.5055160522460938, 0.52783203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 10.0, 9.0, 7.0, 14.0, 10.0, 23.0, 34.0, 46.0, 79.0, 86.0, 111.0, 226.0, 318.0, 592.0, 1313.0, 4609.0, 29396.0, 286185.0, 621855.0, 88723.0, 10428.0, 2292.0, 865.0, 437.0, 277.0, 185.0, 122.0, 76.0, 59.0, 38.0, 27.0, 21.0, 19.0, 12.0, 11.0, 2.0, 6.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.4437255859375, -4.301513671875, -4.1593017578125, -4.01708984375, -3.8748779296875, -3.732666015625, -3.5904541015625, -3.4482421875, -3.3060302734375, -3.163818359375, -3.0216064453125, -2.87939453125, -2.7371826171875, -2.594970703125, -2.4527587890625, -2.310546875, -2.1683349609375, -2.026123046875, -1.8839111328125, -1.74169921875, -1.5994873046875, -1.457275390625, -1.3150634765625, -1.1728515625, -1.0306396484375, -0.888427734375, -0.7462158203125, -0.60400390625, -0.4617919921875, -0.319580078125, -0.1773681640625, -0.03515625, 0.1070556640625, 0.249267578125, 0.3914794921875, 0.53369140625, 0.6759033203125, 0.818115234375, 0.9603271484375, 1.1025390625, 1.2447509765625, 1.386962890625, 1.5291748046875, 1.67138671875, 1.8135986328125, 1.955810546875, 2.0980224609375, 2.240234375, 2.3824462890625, 2.524658203125, 2.6668701171875, 2.80908203125, 2.9512939453125, 3.093505859375, 3.2357177734375, 3.3779296875, 3.5201416015625, 3.662353515625, 3.8045654296875, 3.94677734375, 4.0889892578125, 4.231201171875, 4.3734130859375, 4.515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 13.0, 22.0, 14.0, 18.0, 20.0, 31.0, 26.0, 26.0, 38.0, 37.0, 33.0, 32.0, 42.0, 37.0, 46.0, 49.0, 39.0, 46.0, 39.0, 36.0, 39.0, 35.0, 28.0, 29.0, 26.0, 21.0, 14.0, 20.0, 17.0, 19.0, 10.0, 15.0, 10.0, 14.0, 3.0, 5.0, 10.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.96875, -1.906036376953125, -1.84332275390625, -1.780609130859375, -1.7178955078125, -1.655181884765625, -1.59246826171875, -1.529754638671875, -1.467041015625, -1.404327392578125, -1.34161376953125, -1.278900146484375, -1.2161865234375, -1.153472900390625, -1.09075927734375, -1.028045654296875, -0.96533203125, -0.902618408203125, -0.83990478515625, -0.777191162109375, -0.7144775390625, -0.651763916015625, -0.58905029296875, -0.526336669921875, -0.463623046875, -0.400909423828125, -0.33819580078125, -0.275482177734375, -0.2127685546875, -0.150054931640625, -0.08734130859375, -0.024627685546875, 0.0380859375, 0.100799560546875, 0.16351318359375, 0.226226806640625, 0.2889404296875, 0.351654052734375, 0.41436767578125, 0.477081298828125, 0.539794921875, 0.602508544921875, 0.66522216796875, 0.727935791015625, 0.7906494140625, 0.853363037109375, 0.91607666015625, 0.978790283203125, 1.04150390625, 1.104217529296875, 1.16693115234375, 1.229644775390625, 1.2923583984375, 1.355072021484375, 1.41778564453125, 1.480499267578125, 1.543212890625, 1.605926513671875, 1.66864013671875, 1.731353759765625, 1.7940673828125, 1.856781005859375, 1.91949462890625, 1.982208251953125, 2.044921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 6.0, 8.0, 12.0, 15.0, 12.0, 29.0, 26.0, 38.0, 59.0, 92.0, 138.0, 268.0, 475.0, 963.0, 2276.0, 6050.0, 18977.0, 81406.0, 404469.0, 418415.0, 84276.0, 19876.0, 6083.0, 2396.0, 975.0, 524.0, 272.0, 141.0, 86.0, 61.0, 40.0, 33.0, 17.0, 15.0, 12.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.3143157958984375, -1.254608154296875, -1.1949005126953125, -1.13519287109375, -1.0754852294921875, -1.015777587890625, -0.9560699462890625, -0.8963623046875, -0.8366546630859375, -0.776947021484375, -0.7172393798828125, -0.65753173828125, -0.5978240966796875, -0.538116455078125, -0.4784088134765625, -0.418701171875, -0.3589935302734375, -0.299285888671875, -0.2395782470703125, -0.17987060546875, -0.1201629638671875, -0.060455322265625, -0.0007476806640625, 0.0589599609375, 0.1186676025390625, 0.178375244140625, 0.2380828857421875, 0.29779052734375, 0.3574981689453125, 0.417205810546875, 0.4769134521484375, 0.53662109375, 0.5963287353515625, 0.656036376953125, 0.7157440185546875, 0.77545166015625, 0.8351593017578125, 0.894866943359375, 0.9545745849609375, 1.0142822265625, 1.0739898681640625, 1.133697509765625, 1.1934051513671875, 1.25311279296875, 1.3128204345703125, 1.372528076171875, 1.4322357177734375, 1.491943359375, 1.5516510009765625, 1.611358642578125, 1.6710662841796875, 1.73077392578125, 1.7904815673828125, 1.850189208984375, 1.9098968505859375, 1.9696044921875, 2.0293121337890625, 2.089019775390625, 2.1487274169921875, 2.20843505859375, 2.2681427001953125, 2.327850341796875, 2.3875579833984375, 2.447265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 14.0, 15.0, 17.0, 23.0, 26.0, 20.0, 38.0, 36.0, 58.0, 58.0, 64.0, 68.0, 66.0, 70.0, 77.0, 66.0, 63.0, 50.0, 37.0, 17.0, 29.0, 23.0, 13.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.0001826845109462738, -0.00017630308866500854, -0.00016992166638374329, -0.00016354024410247803, -0.00015715882182121277, -0.0001507773995399475, -0.00014439597725868225, -0.000138014554977417, -0.00013163313269615173, -0.00012525171041488647, -0.00011887028813362122, -0.00011248886585235596, -0.0001061074435710907, -9.972602128982544e-05, -9.334459900856018e-05, -8.696317672729492e-05, -8.058175444602966e-05, -7.42003321647644e-05, -6.781890988349915e-05, -6.143748760223389e-05, -5.505606532096863e-05, -4.867464303970337e-05, -4.229322075843811e-05, -3.591179847717285e-05, -2.9530376195907593e-05, -2.3148953914642334e-05, -1.6767531633377075e-05, -1.0386109352111816e-05, -4.004687070846558e-06, 2.376735210418701e-06, 8.75815749168396e-06, 1.5139579772949219e-05, 2.1521002054214478e-05, 2.7902424335479736e-05, 3.4283846616744995e-05, 4.0665268898010254e-05, 4.704669117927551e-05, 5.342811346054077e-05, 5.980953574180603e-05, 6.619095802307129e-05, 7.257238030433655e-05, 7.89538025856018e-05, 8.533522486686707e-05, 9.171664714813232e-05, 9.809806942939758e-05, 0.00010447949171066284, 0.0001108609139919281, 0.00011724233627319336, 0.00012362375855445862, 0.00013000518083572388, 0.00013638660311698914, 0.0001427680253982544, 0.00014914944767951965, 0.0001555308699607849, 0.00016191229224205017, 0.00016829371452331543, 0.0001746751368045807, 0.00018105655908584595, 0.0001874379813671112, 0.00019381940364837646, 0.00020020082592964172, 0.00020658224821090698, 0.00021296367049217224, 0.0002193450927734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 16.0, 23.0, 58.0, 78.0, 111.0, 223.0, 434.0, 1060.0, 3227.0, 16296.0, 185588.0, 749278.0, 79085.0, 9173.0, 2298.0, 767.0, 377.0, 180.0, 108.0, 73.0, 27.0, 15.0, 14.0, 12.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.960113525390625, -2.85186767578125, -2.743621826171875, -2.6353759765625, -2.527130126953125, -2.41888427734375, -2.310638427734375, -2.202392578125, -2.094146728515625, -1.98590087890625, -1.877655029296875, -1.7694091796875, -1.661163330078125, -1.55291748046875, -1.444671630859375, -1.33642578125, -1.228179931640625, -1.11993408203125, -1.011688232421875, -0.9034423828125, -0.795196533203125, -0.68695068359375, -0.578704833984375, -0.470458984375, -0.362213134765625, -0.25396728515625, -0.145721435546875, -0.0374755859375, 0.070770263671875, 0.17901611328125, 0.287261962890625, 0.3955078125, 0.503753662109375, 0.61199951171875, 0.720245361328125, 0.8284912109375, 0.936737060546875, 1.04498291015625, 1.153228759765625, 1.261474609375, 1.369720458984375, 1.47796630859375, 1.586212158203125, 1.6944580078125, 1.802703857421875, 1.91094970703125, 2.019195556640625, 2.12744140625, 2.235687255859375, 2.34393310546875, 2.452178955078125, 2.5604248046875, 2.668670654296875, 2.77691650390625, 2.885162353515625, 2.993408203125, 3.101654052734375, 3.20989990234375, 3.318145751953125, 3.4263916015625, 3.534637451171875, 3.64288330078125, 3.751129150390625, 3.859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 18.0, 19.0, 26.0, 25.0, 38.0, 46.0, 49.0, 79.0, 68.0, 90.0, 89.0, 84.0, 77.0, 50.0, 45.0, 28.0, 28.0, 18.0, 12.0, 18.0, 11.0, 12.0, 4.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8544921875, -1.801513671875, -1.74853515625, -1.695556640625, -1.642578125, -1.589599609375, -1.53662109375, -1.483642578125, -1.4306640625, -1.377685546875, -1.32470703125, -1.271728515625, -1.21875, -1.165771484375, -1.11279296875, -1.059814453125, -1.0068359375, -0.953857421875, -0.90087890625, -0.847900390625, -0.794921875, -0.741943359375, -0.68896484375, -0.635986328125, -0.5830078125, -0.530029296875, -0.47705078125, -0.424072265625, -0.37109375, -0.318115234375, -0.26513671875, -0.212158203125, -0.1591796875, -0.106201171875, -0.05322265625, -0.000244140625, 0.052734375, 0.105712890625, 0.15869140625, 0.211669921875, 0.2646484375, 0.317626953125, 0.37060546875, 0.423583984375, 0.4765625, 0.529541015625, 0.58251953125, 0.635498046875, 0.6884765625, 0.741455078125, 0.79443359375, 0.847412109375, 0.900390625, 0.953369140625, 1.00634765625, 1.059326171875, 1.1123046875, 1.165283203125, 1.21826171875, 1.271240234375, 1.32421875, 1.377197265625, 1.43017578125, 1.483154296875, 1.5361328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 12.0, 24.0, 50.0, 104.0, 155.0, 184.0, 172.0, 131.0, 82.0, 36.0, 25.0, 9.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.456741333007812, -21.41472053527832, -20.372697830200195, -19.330677032470703, -18.288654327392578, -17.246633529663086, -16.204612731933594, -15.162590980529785, -14.120569229125977, -13.078547477722168, -12.03652572631836, -10.994504928588867, -9.952483177185059, -8.91046142578125, -7.8684401512146, -6.826418876647949, -5.784397125244141, -4.742375373840332, -3.7003540992736816, -2.658332586288452, -1.6163110733032227, -0.5742893218994141, 0.46773195266723633, 1.5097532272338867, 2.5517749786376953, 3.593796491622925, 4.635818004608154, 5.677839279174805, 6.719861030578613, 7.761882781982422, 8.803903579711914, 9.845925331115723, 10.887947082519531, 11.92996883392334, 12.971990585327148, 14.01401138305664, 15.05603313446045, 16.098054885864258, 17.14007568359375, 18.182098388671875, 19.224119186401367, 20.26613998413086, 21.308162689208984, 22.350183486938477, 23.39220428466797, 24.434226989746094, 25.476247787475586, 26.518268585205078, 27.560291290283203, 28.602312088012695, 29.64433479309082, 30.686355590820312, 31.728378295898438, 32.77040100097656, 33.81241989135742, 34.85444259643555, 35.896461486816406, 36.93848419189453, 37.98050308227539, 39.022525787353516, 40.06454849243164, 41.1065673828125, 42.148590087890625, 43.19061279296875, 44.232635498046875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 6.0, 8.0, 9.0, 13.0, 10.0, 15.0, 20.0, 33.0, 22.0, 25.0, 39.0, 47.0, 49.0, 43.0, 56.0, 44.0, 43.0, 39.0, 54.0, 30.0, 31.0, 43.0, 44.0, 39.0, 34.0, 29.0, 27.0, 31.0, 20.0, 24.0, 9.0, 15.0, 10.0, 5.0, 8.0, 6.0, 3.0, 9.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.737166404724121, -11.365572929382324, -10.993978500366211, -10.622385025024414, -10.250791549682617, -9.87919807434082, -9.507604598999023, -9.13601016998291, -8.764416694641113, -8.392823219299316, -8.021228790283203, -7.649635314941406, -7.278041839599609, -6.9064483642578125, -6.534854412078857, -6.163260459899902, -5.7916669845581055, -5.420073509216309, -5.0484795570373535, -4.676885604858398, -4.305292129516602, -3.9336984157562256, -3.5621047019958496, -3.1905109882354736, -2.8189172744750977, -2.4473235607147217, -2.0757298469543457, -1.7041361331939697, -1.3325424194335938, -0.9609487056732178, -0.5893549919128418, -0.21776127815246582, 0.15383148193359375, 0.5254251956939697, 0.8970189094543457, 1.2686126232147217, 1.6402063369750977, 2.0118000507354736, 2.3833937644958496, 2.7549874782562256, 3.1265811920166016, 3.4981749057769775, 3.8697686195373535, 4.241362571716309, 4.6129560470581055, 4.984549522399902, 5.356143474578857, 5.7277374267578125, 6.099330902099609, 6.470924377441406, 6.842518329620361, 7.214112281799316, 7.585705757141113, 7.95729923248291, 8.328893661499023, 8.70048713684082, 9.072080612182617, 9.443674087524414, 9.815267562866211, 10.186861991882324, 10.558455467224121, 10.930048942565918, 11.301643371582031, 11.673236846923828, 12.044830322265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 17.0, 29.0, 36.0, 65.0, 128.0, 199.0, 391.0, 776.0, 4127.0, 3936858.0, 246800.0, 3271.0, 713.0, 327.0, 174.0, 113.0, 75.0, 41.0, 27.0, 23.0, 7.0, 7.0, 15.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-19.3125, -18.8289794921875, -18.345458984375, -17.8619384765625, -17.37841796875, -16.8948974609375, -16.411376953125, -15.9278564453125, -15.4443359375, -14.9608154296875, -14.477294921875, -13.9937744140625, -13.51025390625, -13.0267333984375, -12.543212890625, -12.0596923828125, -11.576171875, -11.0926513671875, -10.609130859375, -10.1256103515625, -9.64208984375, -9.1585693359375, -8.675048828125, -8.1915283203125, -7.7080078125, -7.2244873046875, -6.740966796875, -6.2574462890625, -5.77392578125, -5.2904052734375, -4.806884765625, -4.3233642578125, -3.83984375, -3.3563232421875, -2.872802734375, -2.3892822265625, -1.90576171875, -1.4222412109375, -0.938720703125, -0.4552001953125, 0.0283203125, 0.5118408203125, 0.995361328125, 1.4788818359375, 1.96240234375, 2.4459228515625, 2.929443359375, 3.4129638671875, 3.896484375, 4.3800048828125, 4.863525390625, 5.3470458984375, 5.83056640625, 6.3140869140625, 6.797607421875, 7.2811279296875, 7.7646484375, 8.2481689453125, 8.731689453125, 9.2152099609375, 9.69873046875, 10.1822509765625, 10.665771484375, 11.1492919921875, 11.6328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 5.0, 9.0, 13.0, 17.0, 22.0, 24.0, 34.0, 38.0, 46.0, 53.0, 53.0, 55.0, 52.0, 58.0, 57.0, 51.0, 56.0, 62.0, 61.0, 42.0, 44.0, 23.0, 40.0, 33.0, 12.0, 9.0, 6.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.9130859375, -0.8897933959960938, -0.8665008544921875, -0.8432083129882812, -0.819915771484375, -0.7966232299804688, -0.7733306884765625, -0.7500381469726562, -0.72674560546875, -0.7034530639648438, -0.6801605224609375, -0.6568679809570312, -0.633575439453125, -0.6102828979492188, -0.5869903564453125, -0.5636978149414062, -0.5404052734375, -0.5171127319335938, -0.4938201904296875, -0.47052764892578125, -0.447235107421875, -0.42394256591796875, -0.4006500244140625, -0.37735748291015625, -0.35406494140625, -0.33077239990234375, -0.3074798583984375, -0.28418731689453125, -0.260894775390625, -0.23760223388671875, -0.2143096923828125, -0.19101715087890625, -0.167724609375, -0.14443206787109375, -0.1211395263671875, -0.09784698486328125, -0.074554443359375, -0.05126190185546875, -0.0279693603515625, -0.00467681884765625, 0.01861572265625, 0.04190826416015625, 0.0652008056640625, 0.08849334716796875, 0.111785888671875, 0.13507843017578125, 0.1583709716796875, 0.18166351318359375, 0.2049560546875, 0.22824859619140625, 0.2515411376953125, 0.27483367919921875, 0.298126220703125, 0.32141876220703125, 0.3447113037109375, 0.36800384521484375, 0.39129638671875, 0.41458892822265625, 0.4378814697265625, 0.46117401123046875, 0.484466552734375, 0.5077590942382812, 0.5310516357421875, 0.5543441772460938, 0.57763671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 6.0, 12.0, 22.0, 20.0, 28.0, 38.0, 54.0, 56.0, 66.0, 96.0, 148.0, 176.0, 240.0, 324.0, 419.0, 602.0, 861.0, 1324.0, 2372.0, 4621.0, 11764.0, 48329.0, 1033662.0, 3014736.0, 50125.0, 12243.0, 4787.0, 2375.0, 1413.0, 902.0, 621.0, 463.0, 354.0, 230.0, 204.0, 123.0, 120.0, 61.0, 57.0, 55.0, 39.0, 24.0, 26.0, 15.0, 12.0, 10.0, 5.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.8359375, -2.747344970703125, -2.65875244140625, -2.570159912109375, -2.4815673828125, -2.392974853515625, -2.30438232421875, -2.215789794921875, -2.127197265625, -2.038604736328125, -1.95001220703125, -1.861419677734375, -1.7728271484375, -1.684234619140625, -1.59564208984375, -1.507049560546875, -1.41845703125, -1.329864501953125, -1.24127197265625, -1.152679443359375, -1.0640869140625, -0.975494384765625, -0.88690185546875, -0.798309326171875, -0.709716796875, -0.621124267578125, -0.53253173828125, -0.443939208984375, -0.3553466796875, -0.266754150390625, -0.17816162109375, -0.089569091796875, -0.0009765625, 0.087615966796875, 0.17620849609375, 0.264801025390625, 0.3533935546875, 0.441986083984375, 0.53057861328125, 0.619171142578125, 0.707763671875, 0.796356201171875, 0.88494873046875, 0.973541259765625, 1.0621337890625, 1.150726318359375, 1.23931884765625, 1.327911376953125, 1.41650390625, 1.505096435546875, 1.59368896484375, 1.682281494140625, 1.7708740234375, 1.859466552734375, 1.94805908203125, 2.036651611328125, 2.125244140625, 2.213836669921875, 2.30242919921875, 2.391021728515625, 2.4796142578125, 2.568206787109375, 2.65679931640625, 2.745391845703125, 2.833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 5.0, 5.0, 23.0, 26.0, 65.0, 130.0, 466.0, 2941.0, 202.0, 93.0, 44.0, 21.0, 11.0, 12.0, 7.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8349609375, -0.811920166015625, -0.78887939453125, -0.765838623046875, -0.7427978515625, -0.719757080078125, -0.69671630859375, -0.673675537109375, -0.650634765625, -0.627593994140625, -0.60455322265625, -0.581512451171875, -0.5584716796875, -0.535430908203125, -0.51239013671875, -0.489349365234375, -0.46630859375, -0.443267822265625, -0.42022705078125, -0.397186279296875, -0.3741455078125, -0.351104736328125, -0.32806396484375, -0.305023193359375, -0.281982421875, -0.258941650390625, -0.23590087890625, -0.212860107421875, -0.1898193359375, -0.166778564453125, -0.14373779296875, -0.120697021484375, -0.09765625, -0.074615478515625, -0.05157470703125, -0.028533935546875, -0.0054931640625, 0.017547607421875, 0.04058837890625, 0.063629150390625, 0.086669921875, 0.109710693359375, 0.13275146484375, 0.155792236328125, 0.1788330078125, 0.201873779296875, 0.22491455078125, 0.247955322265625, 0.27099609375, 0.294036865234375, 0.31707763671875, 0.340118408203125, 0.3631591796875, 0.386199951171875, 0.40924072265625, 0.432281494140625, 0.455322265625, 0.478363037109375, 0.50140380859375, 0.524444580078125, 0.5474853515625, 0.570526123046875, 0.59356689453125, 0.616607666015625, 0.6396484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 17.0, 27.0, 54.0, 66.0, 95.0, 119.0, 123.0, 115.0, 110.0, 81.0, 55.0, 38.0, 31.0, 17.0, 7.0, 10.0, 11.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1890366077423096, -2.0963294506073, -2.00362229347229, -1.9109150171279907, -1.8182077407836914, -1.7255005836486816, -1.6327934265136719, -1.540086269378662, -1.4473789930343628, -1.354671835899353, -1.2619645595550537, -1.169257402420044, -1.0765502452850342, -0.9838429689407349, -0.8911358118057251, -0.7984285950660706, -0.705721378326416, -0.6130141615867615, -0.5203069448471069, -0.42759978771209717, -0.3348925709724426, -0.24218535423278809, -0.14947819709777832, -0.05677098035812378, 0.03593623638153076, 0.1286434382200241, 0.22135064005851746, 0.3140578269958496, 0.40676504373550415, 0.4994722604751587, 0.5921794176101685, 0.684886634349823, 0.7775936126708984, 0.870300829410553, 0.9630080461502075, 1.0557152032852173, 1.1484224796295166, 1.2411296367645264, 1.3338367938995361, 1.426543951034546, 1.5192512273788452, 1.611958384513855, 1.7046656608581543, 1.797372817993164, 1.8900799751281738, 1.9827872514724731, 2.0754942893981934, 2.1682016849517822, 2.260908842086792, 2.3536159992218018, 2.4463231563568115, 2.5390305519104004, 2.63173770904541, 2.72444486618042, 2.8171520233154297, 2.9098591804504395, 3.002566337585449, 3.095273494720459, 3.1879806518554688, 3.2806878089904785, 3.3733952045440674, 3.466102361679077, 3.558809518814087, 3.6515166759490967, 3.7442240715026855]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 14.0, 6.0, 11.0, 8.0, 19.0, 18.0, 25.0, 24.0, 28.0, 26.0, 38.0, 42.0, 31.0, 38.0, 38.0, 41.0, 40.0, 35.0, 34.0, 45.0, 33.0, 35.0, 49.0, 40.0, 36.0, 36.0, 25.0, 27.0, 13.0, 25.0, 18.0, 18.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3123985528945923, -1.2752782106399536, -1.2381579875946045, -1.2010376453399658, -1.1639174222946167, -1.126797080039978, -1.089676856994629, -1.0525565147399902, -1.0154361724853516, -0.9783158898353577, -0.9411956071853638, -0.9040753245353699, -0.866955041885376, -0.8298346996307373, -0.7927144169807434, -0.7555941343307495, -0.7184739112854004, -0.6813536286354065, -0.6442333459854126, -0.6071130633354187, -0.5699927806854248, -0.5328724384307861, -0.49575215578079224, -0.45863187313079834, -0.42151159048080444, -0.38439130783081055, -0.34727102518081665, -0.31015071272850037, -0.27303043007850647, -0.23591014742851257, -0.19878984987735748, -0.1616695523262024, -0.12454915046691895, -0.08742886036634445, -0.05030857026576996, -0.013188280165195465, 0.02393200993537903, 0.061052292585372925, 0.09817259013652802, 0.1352928876876831, 0.172413170337677, 0.2095334529876709, 0.246653750538826, 0.2837740480899811, 0.320894330739975, 0.35801461338996887, 0.39513492584228516, 0.43225520849227905, 0.46937549114227295, 0.5064957737922668, 0.5436160564422607, 0.5807363390922546, 0.6178566217422485, 0.6549769639968872, 0.6920972466468811, 0.729217529296875, 0.7663378119468689, 0.8034580945968628, 0.8405783772468567, 0.8776986598968506, 0.9148190021514893, 0.9519392251968384, 0.989059567451477, 1.0261797904968262, 1.0633001327514648]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 16.0, 17.0, 28.0, 35.0, 47.0, 63.0, 97.0, 173.0, 254.0, 404.0, 588.0, 1136.0, 2059.0, 4168.0, 8587.0, 19632.0, 45649.0, 104759.0, 208480.0, 275655.0, 199791.0, 98548.0, 43161.0, 18219.0, 8192.0, 3919.0, 2003.0, 1069.0, 616.0, 410.0, 247.0, 157.0, 116.0, 73.0, 60.0, 37.0, 20.0, 24.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8012237548828125, -1.742095947265625, -1.6829681396484375, -1.62384033203125, -1.5647125244140625, -1.505584716796875, -1.4464569091796875, -1.3873291015625, -1.3282012939453125, -1.269073486328125, -1.2099456787109375, -1.15081787109375, -1.0916900634765625, -1.032562255859375, -0.9734344482421875, -0.914306640625, -0.8551788330078125, -0.796051025390625, -0.7369232177734375, -0.67779541015625, -0.6186676025390625, -0.559539794921875, -0.5004119873046875, -0.4412841796875, -0.3821563720703125, -0.323028564453125, -0.2639007568359375, -0.20477294921875, -0.1456451416015625, -0.086517333984375, -0.0273895263671875, 0.03173828125, 0.0908660888671875, 0.149993896484375, 0.2091217041015625, 0.26824951171875, 0.3273773193359375, 0.386505126953125, 0.4456329345703125, 0.5047607421875, 0.5638885498046875, 0.623016357421875, 0.6821441650390625, 0.74127197265625, 0.8003997802734375, 0.859527587890625, 0.9186553955078125, 0.977783203125, 1.0369110107421875, 1.096038818359375, 1.1551666259765625, 1.21429443359375, 1.2734222412109375, 1.332550048828125, 1.3916778564453125, 1.4508056640625, 1.5099334716796875, 1.569061279296875, 1.6281890869140625, 1.68731689453125, 1.7464447021484375, 1.805572509765625, 1.8647003173828125, 1.923828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 7.0, 4.0, 3.0, 4.0, 9.0, 7.0, 13.0, 15.0, 20.0, 21.0, 33.0, 43.0, 38.0, 48.0, 58.0, 51.0, 64.0, 55.0, 54.0, 63.0, 60.0, 49.0, 42.0, 42.0, 40.0, 39.0, 31.0, 25.0, 22.0, 14.0, 9.0, 10.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.9228515625, -0.8993453979492188, -0.8758392333984375, -0.8523330688476562, -0.828826904296875, -0.8053207397460938, -0.7818145751953125, -0.7583084106445312, -0.73480224609375, -0.7112960815429688, -0.6877899169921875, -0.6642837524414062, -0.640777587890625, -0.6172714233398438, -0.5937652587890625, -0.5702590942382812, -0.5467529296875, -0.5232467651367188, -0.4997406005859375, -0.47623443603515625, -0.452728271484375, -0.42922210693359375, -0.4057159423828125, -0.38220977783203125, -0.35870361328125, -0.33519744873046875, -0.3116912841796875, -0.28818511962890625, -0.264678955078125, -0.24117279052734375, -0.2176666259765625, -0.19416046142578125, -0.170654296875, -0.14714813232421875, -0.1236419677734375, -0.10013580322265625, -0.076629638671875, -0.05312347412109375, -0.0296173095703125, -0.00611114501953125, 0.01739501953125, 0.04090118408203125, 0.0644073486328125, 0.08791351318359375, 0.111419677734375, 0.13492584228515625, 0.1584320068359375, 0.18193817138671875, 0.2054443359375, 0.22895050048828125, 0.2524566650390625, 0.27596282958984375, 0.299468994140625, 0.32297515869140625, 0.3464813232421875, 0.36998748779296875, 0.39349365234375, 0.41699981689453125, 0.4405059814453125, 0.46401214599609375, 0.487518310546875, 0.5110244750976562, 0.5345306396484375, 0.5580368041992188, 0.58154296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 12.0, 19.0, 25.0, 28.0, 29.0, 41.0, 61.0, 87.0, 107.0, 139.0, 223.0, 302.0, 471.0, 741.0, 1411.0, 4831.0, 39239.0, 533320.0, 428839.0, 30913.0, 4161.0, 1326.0, 692.0, 418.0, 296.0, 186.0, 177.0, 107.0, 84.0, 62.0, 38.0, 41.0, 26.0, 17.0, 14.0, 12.0, 12.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.50390625, -5.341796875, -5.1796875, -5.017578125, -4.85546875, -4.693359375, -4.53125, -4.369140625, -4.20703125, -4.044921875, -3.8828125, -3.720703125, -3.55859375, -3.396484375, -3.234375, -3.072265625, -2.91015625, -2.748046875, -2.5859375, -2.423828125, -2.26171875, -2.099609375, -1.9375, -1.775390625, -1.61328125, -1.451171875, -1.2890625, -1.126953125, -0.96484375, -0.802734375, -0.640625, -0.478515625, -0.31640625, -0.154296875, 0.0078125, 0.169921875, 0.33203125, 0.494140625, 0.65625, 0.818359375, 0.98046875, 1.142578125, 1.3046875, 1.466796875, 1.62890625, 1.791015625, 1.953125, 2.115234375, 2.27734375, 2.439453125, 2.6015625, 2.763671875, 2.92578125, 3.087890625, 3.25, 3.412109375, 3.57421875, 3.736328125, 3.8984375, 4.060546875, 4.22265625, 4.384765625, 4.546875, 4.708984375, 4.87109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 2.0, 8.0, 9.0, 5.0, 6.0, 8.0, 17.0, 19.0, 15.0, 19.0, 23.0, 26.0, 30.0, 33.0, 39.0, 40.0, 30.0, 44.0, 43.0, 48.0, 50.0, 40.0, 36.0, 34.0, 41.0, 31.0, 32.0, 29.0, 32.0, 29.0, 28.0, 29.0, 30.0, 21.0, 14.0, 10.0, 8.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.595703125, -2.51544189453125, -2.4351806640625, -2.35491943359375, -2.274658203125, -2.19439697265625, -2.1141357421875, -2.03387451171875, -1.95361328125, -1.87335205078125, -1.7930908203125, -1.71282958984375, -1.632568359375, -1.55230712890625, -1.4720458984375, -1.39178466796875, -1.3115234375, -1.23126220703125, -1.1510009765625, -1.07073974609375, -0.990478515625, -0.91021728515625, -0.8299560546875, -0.74969482421875, -0.66943359375, -0.58917236328125, -0.5089111328125, -0.42864990234375, -0.348388671875, -0.26812744140625, -0.1878662109375, -0.10760498046875, -0.02734375, 0.05291748046875, 0.1331787109375, 0.21343994140625, 0.293701171875, 0.37396240234375, 0.4542236328125, 0.53448486328125, 0.61474609375, 0.69500732421875, 0.7752685546875, 0.85552978515625, 0.935791015625, 1.01605224609375, 1.0963134765625, 1.17657470703125, 1.2568359375, 1.33709716796875, 1.4173583984375, 1.49761962890625, 1.577880859375, 1.65814208984375, 1.7384033203125, 1.81866455078125, 1.89892578125, 1.97918701171875, 2.0594482421875, 2.13970947265625, 2.219970703125, 2.30023193359375, 2.3804931640625, 2.46075439453125, 2.541015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 4.0, 9.0, 8.0, 9.0, 15.0, 11.0, 18.0, 34.0, 48.0, 75.0, 142.0, 292.0, 694.0, 2113.0, 9651.0, 68241.0, 593680.0, 330633.0, 34692.0, 5623.0, 1476.0, 513.0, 249.0, 118.0, 76.0, 38.0, 26.0, 19.0, 14.0, 4.0, 9.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.029998779296875, -1.96624755859375, -1.902496337890625, -1.8387451171875, -1.774993896484375, -1.71124267578125, -1.647491455078125, -1.583740234375, -1.519989013671875, -1.45623779296875, -1.392486572265625, -1.3287353515625, -1.264984130859375, -1.20123291015625, -1.137481689453125, -1.07373046875, -1.009979248046875, -0.94622802734375, -0.882476806640625, -0.8187255859375, -0.754974365234375, -0.69122314453125, -0.627471923828125, -0.563720703125, -0.499969482421875, -0.43621826171875, -0.372467041015625, -0.3087158203125, -0.244964599609375, -0.18121337890625, -0.117462158203125, -0.0537109375, 0.010040283203125, 0.07379150390625, 0.137542724609375, 0.2012939453125, 0.265045166015625, 0.32879638671875, 0.392547607421875, 0.456298828125, 0.520050048828125, 0.58380126953125, 0.647552490234375, 0.7113037109375, 0.775054931640625, 0.83880615234375, 0.902557373046875, 0.96630859375, 1.030059814453125, 1.09381103515625, 1.157562255859375, 1.2213134765625, 1.285064697265625, 1.34881591796875, 1.412567138671875, 1.476318359375, 1.540069580078125, 1.60382080078125, 1.667572021484375, 1.7313232421875, 1.795074462890625, 1.85882568359375, 1.922576904296875, 1.986328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 5.0, 13.0, 10.0, 18.0, 21.0, 21.0, 33.0, 35.0, 48.0, 70.0, 64.0, 104.0, 87.0, 82.0, 85.0, 72.0, 62.0, 39.0, 26.0, 15.0, 21.0, 17.0, 9.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003135204315185547, -0.0003064200282096863, -0.00029931962490081787, -0.00029221922159194946, -0.00028511881828308105, -0.00027801841497421265, -0.00027091801166534424, -0.00026381760835647583, -0.0002567172050476074, -0.000249616801738739, -0.0002425163984298706, -0.0002354159951210022, -0.0002283155918121338, -0.00022121518850326538, -0.00021411478519439697, -0.00020701438188552856, -0.00019991397857666016, -0.00019281357526779175, -0.00018571317195892334, -0.00017861276865005493, -0.00017151236534118652, -0.00016441196203231812, -0.0001573115587234497, -0.0001502111554145813, -0.0001431107521057129, -0.00013601034879684448, -0.00012890994548797607, -0.00012180954217910767, -0.00011470913887023926, -0.00010760873556137085, -0.00010050833225250244, -9.340792894363403e-05, -8.630752563476562e-05, -7.920712232589722e-05, -7.210671901702881e-05, -6.50063157081604e-05, -5.790591239929199e-05, -5.0805509090423584e-05, -4.3705105781555176e-05, -3.660470247268677e-05, -2.950429916381836e-05, -2.240389585494995e-05, -1.5303492546081543e-05, -8.203089237213135e-06, -1.1026859283447266e-06, 5.997717380523682e-06, 1.309812068939209e-05, 2.0198523998260498e-05, 2.7298927307128906e-05, 3.4399330615997314e-05, 4.149973392486572e-05, 4.860013723373413e-05, 5.570054054260254e-05, 6.280094385147095e-05, 6.990134716033936e-05, 7.700175046920776e-05, 8.410215377807617e-05, 9.120255708694458e-05, 9.830296039581299e-05, 0.0001054033637046814, 0.0001125037670135498, 0.00011960417032241821, 0.00012670457363128662, 0.00013380497694015503, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 4.0, 12.0, 9.0, 19.0, 25.0, 42.0, 59.0, 76.0, 122.0, 209.0, 413.0, 744.0, 1646.0, 4505.0, 19403.0, 160432.0, 709395.0, 127736.0, 16459.0, 4159.0, 1473.0, 662.0, 357.0, 195.0, 131.0, 83.0, 54.0, 37.0, 24.0, 21.0, 11.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4882965087890625, -1.424835205078125, -1.3613739013671875, -1.29791259765625, -1.2344512939453125, -1.170989990234375, -1.1075286865234375, -1.0440673828125, -0.9806060791015625, -0.917144775390625, -0.8536834716796875, -0.79022216796875, -0.7267608642578125, -0.663299560546875, -0.5998382568359375, -0.536376953125, -0.4729156494140625, -0.409454345703125, -0.3459930419921875, -0.28253173828125, -0.2190704345703125, -0.155609130859375, -0.0921478271484375, -0.0286865234375, 0.0347747802734375, 0.098236083984375, 0.1616973876953125, 0.22515869140625, 0.2886199951171875, 0.352081298828125, 0.4155426025390625, 0.47900390625, 0.5424652099609375, 0.605926513671875, 0.6693878173828125, 0.73284912109375, 0.7963104248046875, 0.859771728515625, 0.9232330322265625, 0.9866943359375, 1.0501556396484375, 1.113616943359375, 1.1770782470703125, 1.24053955078125, 1.3040008544921875, 1.367462158203125, 1.4309234619140625, 1.494384765625, 1.5578460693359375, 1.621307373046875, 1.6847686767578125, 1.74822998046875, 1.8116912841796875, 1.875152587890625, 1.9386138916015625, 2.0020751953125, 2.0655364990234375, 2.128997802734375, 2.1924591064453125, 2.25592041015625, 2.3193817138671875, 2.382843017578125, 2.4463043212890625, 2.509765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 15.0, 19.0, 40.0, 45.0, 50.0, 60.0, 90.0, 108.0, 90.0, 103.0, 68.0, 65.0, 44.0, 37.0, 25.0, 21.0, 22.0, 17.0, 14.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6654205322265625, -1.611114501953125, -1.5568084716796875, -1.50250244140625, -1.4481964111328125, -1.393890380859375, -1.3395843505859375, -1.2852783203125, -1.2309722900390625, -1.176666259765625, -1.1223602294921875, -1.06805419921875, -1.0137481689453125, -0.959442138671875, -0.9051361083984375, -0.850830078125, -0.7965240478515625, -0.742218017578125, -0.6879119873046875, -0.63360595703125, -0.5792999267578125, -0.524993896484375, -0.4706878662109375, -0.4163818359375, -0.3620758056640625, -0.307769775390625, -0.2534637451171875, -0.19915771484375, -0.1448516845703125, -0.090545654296875, -0.0362396240234375, 0.01806640625, 0.0723724365234375, 0.126678466796875, 0.1809844970703125, 0.23529052734375, 0.2895965576171875, 0.343902587890625, 0.3982086181640625, 0.4525146484375, 0.5068206787109375, 0.561126708984375, 0.6154327392578125, 0.66973876953125, 0.7240447998046875, 0.778350830078125, 0.8326568603515625, 0.886962890625, 0.9412689208984375, 0.995574951171875, 1.0498809814453125, 1.10418701171875, 1.1584930419921875, 1.212799072265625, 1.2671051025390625, 1.3214111328125, 1.3757171630859375, 1.430023193359375, 1.4843292236328125, 1.53863525390625, 1.5929412841796875, 1.647247314453125, 1.7015533447265625, 1.755859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 23.0, 109.0, 185.0, 262.0, 243.0, 108.0, 40.0, 4.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03076934814453, -34.6136589050293, -33.19654846191406, -31.77943992614746, -30.36233139038086, -28.945220947265625, -27.52811050415039, -26.111000061035156, -24.693891525268555, -23.27678108215332, -21.85967254638672, -20.442562103271484, -19.02545166015625, -17.60834312438965, -16.191232681274414, -14.774123191833496, -13.357013702392578, -11.93990421295166, -10.522794723510742, -9.105684280395508, -7.68857479095459, -6.271465301513672, -4.8543548583984375, -3.4372453689575195, -2.0201358795166016, -0.6030261516571045, 0.8140835762023926, 2.2311935424804688, 3.6483030319213867, 5.065412521362305, 6.482522964477539, 7.899632453918457, 9.31673812866211, 10.733847618103027, 12.150957107543945, 13.56806755065918, 14.985177040100098, 16.402286529541016, 17.81939697265625, 19.236507415771484, 20.653615951538086, 22.07072639465332, 23.487834930419922, 24.904945373535156, 26.32205581665039, 27.739164352416992, 29.156274795532227, 30.573383331298828, 31.990493774414062, 33.4076042175293, 34.82471466064453, 36.2418212890625, 37.658931732177734, 39.07604217529297, 40.4931526184082, 41.91026306152344, 43.327369689941406, 44.74448013305664, 46.161590576171875, 47.578697204589844, 48.99580764770508, 50.41291809082031, 51.83002853393555, 53.24713897705078, 54.664249420166016]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 9.0, 4.0, 3.0, 9.0, 9.0, 8.0, 19.0, 17.0, 19.0, 17.0, 27.0, 34.0, 23.0, 38.0, 25.0, 48.0, 36.0, 53.0, 56.0, 49.0, 56.0, 47.0, 42.0, 38.0, 43.0, 44.0, 28.0, 26.0, 25.0, 24.0, 27.0, 28.0, 13.0, 8.0, 10.0, 5.0, 5.0, 11.0, 5.0, 1.0, 2.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.027986526489258, -12.592302322387695, -12.156618118286133, -11.720934867858887, -11.285250663757324, -10.849566459655762, -10.413883209228516, -9.978199005126953, -9.54251480102539, -9.106830596923828, -8.671146392822266, -8.23546314239502, -7.799778938293457, -7.3640947341918945, -6.92841100692749, -6.492727279663086, -6.057043075561523, -5.621358871459961, -5.185675144195557, -4.749991416931152, -4.31430721282959, -3.8786232471466064, -3.442939281463623, -3.0072553157806396, -2.5715713500976562, -2.135887384414673, -1.7002034187316895, -1.264519453048706, -0.8288354873657227, -0.39315152168273926, 0.04253244400024414, 0.47821640968322754, 0.9139003753662109, 1.3495843410491943, 1.7852683067321777, 2.220952272415161, 2.6566362380981445, 3.092320203781128, 3.5280041694641113, 3.9636881351470947, 4.399372100830078, 4.835056304931641, 5.270740032196045, 5.706423759460449, 6.142107963562012, 6.577792167663574, 7.0134758949279785, 7.449159622192383, 7.884843826293945, 8.320528030395508, 8.75621223449707, 9.191895484924316, 9.627579689025879, 10.063263893127441, 10.498947143554688, 10.93463134765625, 11.370315551757812, 11.805999755859375, 12.241683959960938, 12.677367210388184, 13.113051414489746, 13.548735618591309, 13.984418869018555, 14.420103073120117, 14.85578727722168]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 8.0, 11.0, 29.0, 38.0, 64.0, 90.0, 169.0, 367.0, 943.0, 8059.0, 4164181.0, 18082.0, 1288.0, 432.0, 204.0, 101.0, 57.0, 45.0, 24.0, 26.0, 7.0, 9.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.90625, -16.4793701171875, -16.052490234375, -15.6256103515625, -15.19873046875, -14.7718505859375, -14.344970703125, -13.9180908203125, -13.4912109375, -13.0643310546875, -12.637451171875, -12.2105712890625, -11.78369140625, -11.3568115234375, -10.929931640625, -10.5030517578125, -10.076171875, -9.6492919921875, -9.222412109375, -8.7955322265625, -8.36865234375, -7.9417724609375, -7.514892578125, -7.0880126953125, -6.6611328125, -6.2342529296875, -5.807373046875, -5.3804931640625, -4.95361328125, -4.5267333984375, -4.099853515625, -3.6729736328125, -3.24609375, -2.8192138671875, -2.392333984375, -1.9654541015625, -1.53857421875, -1.1116943359375, -0.684814453125, -0.2579345703125, 0.1689453125, 0.5958251953125, 1.022705078125, 1.4495849609375, 1.87646484375, 2.3033447265625, 2.730224609375, 3.1571044921875, 3.583984375, 4.0108642578125, 4.437744140625, 4.8646240234375, 5.29150390625, 5.7183837890625, 6.145263671875, 6.5721435546875, 6.9990234375, 7.4259033203125, 7.852783203125, 8.2796630859375, 8.70654296875, 9.1334228515625, 9.560302734375, 9.9871826171875, 10.4140625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 12.0, 18.0, 10.0, 18.0, 24.0, 22.0, 45.0, 32.0, 56.0, 66.0, 53.0, 56.0, 75.0, 65.0, 42.0, 48.0, 50.0, 40.0, 49.0, 45.0, 37.0, 25.0, 29.0, 12.0, 12.0, 13.0, 2.0, 13.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8427810668945312, -0.8193511962890625, -0.7959213256835938, -0.772491455078125, -0.7490615844726562, -0.7256317138671875, -0.7022018432617188, -0.67877197265625, -0.6553421020507812, -0.6319122314453125, -0.6084823608398438, -0.585052490234375, -0.5616226196289062, -0.5381927490234375, -0.5147628784179688, -0.4913330078125, -0.46790313720703125, -0.4444732666015625, -0.42104339599609375, -0.397613525390625, -0.37418365478515625, -0.3507537841796875, -0.32732391357421875, -0.30389404296875, -0.28046417236328125, -0.2570343017578125, -0.23360443115234375, -0.210174560546875, -0.18674468994140625, -0.1633148193359375, -0.13988494873046875, -0.116455078125, -0.09302520751953125, -0.0695953369140625, -0.04616546630859375, -0.022735595703125, 0.00069427490234375, 0.0241241455078125, 0.04755401611328125, 0.07098388671875, 0.09441375732421875, 0.1178436279296875, 0.14127349853515625, 0.164703369140625, 0.18813323974609375, 0.2115631103515625, 0.23499298095703125, 0.2584228515625, 0.28185272216796875, 0.3052825927734375, 0.32871246337890625, 0.352142333984375, 0.37557220458984375, 0.3990020751953125, 0.42243194580078125, 0.44586181640625, 0.46929168701171875, 0.4927215576171875, 0.5161514282226562, 0.539581298828125, 0.5630111694335938, 0.5864410400390625, 0.6098709106445312, 0.63330078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 9.0, 21.0, 11.0, 17.0, 42.0, 47.0, 60.0, 83.0, 104.0, 190.0, 243.0, 411.0, 574.0, 933.0, 1520.0, 2750.0, 5444.0, 12905.0, 42955.0, 367419.0, 3645889.0, 77727.0, 18850.0, 7278.0, 3588.0, 1938.0, 1134.0, 680.0, 453.0, 282.0, 191.0, 155.0, 98.0, 71.0, 56.0, 44.0, 30.0, 17.0, 16.0, 2.0, 10.0, 4.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.091796875, -2.022491455078125, -1.95318603515625, -1.883880615234375, -1.8145751953125, -1.745269775390625, -1.67596435546875, -1.606658935546875, -1.537353515625, -1.468048095703125, -1.39874267578125, -1.329437255859375, -1.2601318359375, -1.190826416015625, -1.12152099609375, -1.052215576171875, -0.98291015625, -0.913604736328125, -0.84429931640625, -0.774993896484375, -0.7056884765625, -0.636383056640625, -0.56707763671875, -0.497772216796875, -0.428466796875, -0.359161376953125, -0.28985595703125, -0.220550537109375, -0.1512451171875, -0.081939697265625, -0.01263427734375, 0.056671142578125, 0.1259765625, 0.195281982421875, 0.26458740234375, 0.333892822265625, 0.4031982421875, 0.472503662109375, 0.54180908203125, 0.611114501953125, 0.680419921875, 0.749725341796875, 0.81903076171875, 0.888336181640625, 0.9576416015625, 1.026947021484375, 1.09625244140625, 1.165557861328125, 1.23486328125, 1.304168701171875, 1.37347412109375, 1.442779541015625, 1.5120849609375, 1.581390380859375, 1.65069580078125, 1.720001220703125, 1.789306640625, 1.858612060546875, 1.92791748046875, 1.997222900390625, 2.0665283203125, 2.135833740234375, 2.20513916015625, 2.274444580078125, 2.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 8.0, 9.0, 15.0, 15.0, 30.0, 73.0, 114.0, 399.0, 2989.0, 211.0, 93.0, 32.0, 24.0, 12.0, 10.0, 9.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.781951904296875, -0.75775146484375, -0.733551025390625, -0.7093505859375, -0.685150146484375, -0.66094970703125, -0.636749267578125, -0.612548828125, -0.588348388671875, -0.56414794921875, -0.539947509765625, -0.5157470703125, -0.491546630859375, -0.46734619140625, -0.443145751953125, -0.4189453125, -0.394744873046875, -0.37054443359375, -0.346343994140625, -0.3221435546875, -0.297943115234375, -0.27374267578125, -0.249542236328125, -0.225341796875, -0.201141357421875, -0.17694091796875, -0.152740478515625, -0.1285400390625, -0.104339599609375, -0.08013916015625, -0.055938720703125, -0.03173828125, -0.007537841796875, 0.01666259765625, 0.040863037109375, 0.0650634765625, 0.089263916015625, 0.11346435546875, 0.137664794921875, 0.161865234375, 0.186065673828125, 0.21026611328125, 0.234466552734375, 0.2586669921875, 0.282867431640625, 0.30706787109375, 0.331268310546875, 0.35546875, 0.379669189453125, 0.40386962890625, 0.428070068359375, 0.4522705078125, 0.476470947265625, 0.50067138671875, 0.524871826171875, 0.549072265625, 0.573272705078125, 0.59747314453125, 0.621673583984375, 0.6458740234375, 0.670074462890625, 0.69427490234375, 0.718475341796875, 0.74267578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 11.0, 16.0, 40.0, 71.0, 124.0, 184.0, 219.0, 166.0, 100.0, 41.0, 20.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.143086910247803, -5.97553014755249, -5.8079729080200195, -5.640416145324707, -5.4728593826293945, -5.305302619934082, -5.137745380401611, -4.970188617706299, -4.802631378173828, -4.635074615478516, -4.467517375946045, -4.299960613250732, -4.13240385055542, -3.9648468494415283, -3.7972898483276367, -3.629733085632324, -3.4621763229370117, -3.29461932182312, -3.1270625591278076, -2.959505558013916, -2.7919487953186035, -2.624391794204712, -2.4568347930908203, -2.289278030395508, -2.121721029281616, -1.9541641473770142, -1.786607265472412, -1.6190502643585205, -1.4514933824539185, -1.2839365005493164, -1.1163794994354248, -0.9488226175308228, -0.7812662124633789, -0.6137093305587769, -0.44615238904953003, -0.2785954475402832, -0.11103856563568115, 0.0565183162689209, 0.2240753173828125, 0.39163219928741455, 0.5591890811920166, 0.7267459630966187, 0.8943029046058655, 1.0618598461151123, 1.2294167280197144, 1.3969736099243164, 1.564530611038208, 1.73208749294281, 1.899644374847412, 2.0672013759613037, 2.234758138656616, 2.402315139770508, 2.5698719024658203, 2.737428903579712, 2.9049859046936035, 3.072542667388916, 3.2400996685028076, 3.407656669616699, 3.5752134323120117, 3.7427704334259033, 3.910327434539795, 4.077884197235107, 4.245441436767578, 4.412998199462891, 4.580554962158203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 6.0, 8.0, 13.0, 17.0, 19.0, 25.0, 20.0, 35.0, 16.0, 29.0, 22.0, 43.0, 42.0, 36.0, 44.0, 34.0, 47.0, 35.0, 38.0, 40.0, 44.0, 40.0, 37.0, 34.0, 36.0, 35.0, 25.0, 22.0, 25.0, 26.0, 17.0, 15.0, 6.0, 6.0, 15.0, 7.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7347486019134521, -1.6803596019744873, -1.625970482826233, -1.571581482887268, -1.5171924829483032, -1.4628033638000488, -1.408414363861084, -1.3540253639221191, -1.2996362447738647, -1.2452472448349, -1.1908581256866455, -1.1364691257476807, -1.0820801258087158, -1.0276910066604614, -0.9733020067214966, -0.918912947177887, -0.8645239472389221, -0.8101348876953125, -0.7557458877563477, -0.701356828212738, -0.6469677686691284, -0.5925787687301636, -0.538189709186554, -0.48380064964294434, -0.4294116199016571, -0.3750225901603699, -0.32063353061676025, -0.266244500875473, -0.2118554562330246, -0.15746641159057617, -0.10307738184928894, -0.04868832230567932, 0.00570070743560791, 0.06008974835276604, 0.11447878926992416, 0.168867826461792, 0.22325687110424042, 0.27764591574668884, 0.3320349454879761, 0.3864240050315857, 0.4408130347728729, 0.49520206451416016, 0.5495911240577698, 0.6039801836013794, 0.6583691835403442, 0.7127582430839539, 0.7671473026275635, 0.8215363025665283, 0.8759253621101379, 0.9303144216537476, 0.9847034215927124, 1.0390925407409668, 1.0934815406799316, 1.1478705406188965, 1.2022595405578613, 1.2566486597061157, 1.3110376596450806, 1.3654266595840454, 1.4198157787322998, 1.4742047786712646, 1.5285937786102295, 1.5829828977584839, 1.6373718976974487, 1.6917610168457031, 1.746150016784668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 11.0, 9.0, 9.0, 13.0, 15.0, 27.0, 24.0, 40.0, 54.0, 66.0, 97.0, 173.0, 251.0, 406.0, 632.0, 1002.0, 1812.0, 3397.0, 6663.0, 13731.0, 31133.0, 73371.0, 165301.0, 273988.0, 244627.0, 129512.0, 55642.0, 23677.0, 10920.0, 5296.0, 2744.0, 1458.0, 859.0, 528.0, 338.0, 225.0, 141.0, 95.0, 68.0, 58.0, 50.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6167144775390625, -1.562530517578125, -1.5083465576171875, -1.45416259765625, -1.3999786376953125, -1.345794677734375, -1.2916107177734375, -1.2374267578125, -1.1832427978515625, -1.129058837890625, -1.0748748779296875, -1.02069091796875, -0.9665069580078125, -0.912322998046875, -0.8581390380859375, -0.803955078125, -0.7497711181640625, -0.695587158203125, -0.6414031982421875, -0.58721923828125, -0.5330352783203125, -0.478851318359375, -0.4246673583984375, -0.3704833984375, -0.3162994384765625, -0.262115478515625, -0.2079315185546875, -0.15374755859375, -0.0995635986328125, -0.045379638671875, 0.0088043212890625, 0.06298828125, 0.1171722412109375, 0.171356201171875, 0.2255401611328125, 0.27972412109375, 0.3339080810546875, 0.388092041015625, 0.4422760009765625, 0.4964599609375, 0.5506439208984375, 0.604827880859375, 0.6590118408203125, 0.71319580078125, 0.7673797607421875, 0.821563720703125, 0.8757476806640625, 0.929931640625, 0.9841156005859375, 1.038299560546875, 1.0924835205078125, 1.14666748046875, 1.2008514404296875, 1.255035400390625, 1.3092193603515625, 1.3634033203125, 1.4175872802734375, 1.471771240234375, 1.5259552001953125, 1.58013916015625, 1.6343231201171875, 1.688507080078125, 1.7426910400390625, 1.796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 5.0, 7.0, 10.0, 12.0, 22.0, 10.0, 24.0, 30.0, 30.0, 32.0, 43.0, 31.0, 50.0, 50.0, 60.0, 50.0, 55.0, 60.0, 42.0, 43.0, 45.0, 45.0, 45.0, 36.0, 35.0, 32.0, 19.0, 14.0, 12.0, 13.0, 11.0, 8.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.8251953125, -0.8025283813476562, -0.7798614501953125, -0.7571945190429688, -0.734527587890625, -0.7118606567382812, -0.6891937255859375, -0.6665267944335938, -0.64385986328125, -0.6211929321289062, -0.5985260009765625, -0.5758590698242188, -0.553192138671875, -0.5305252075195312, -0.5078582763671875, -0.48519134521484375, -0.4625244140625, -0.43985748291015625, -0.4171905517578125, -0.39452362060546875, -0.371856689453125, -0.34918975830078125, -0.3265228271484375, -0.30385589599609375, -0.28118896484375, -0.25852203369140625, -0.2358551025390625, -0.21318817138671875, -0.190521240234375, -0.16785430908203125, -0.1451873779296875, -0.12252044677734375, -0.099853515625, -0.07718658447265625, -0.0545196533203125, -0.03185272216796875, -0.009185791015625, 0.01348114013671875, 0.0361480712890625, 0.05881500244140625, 0.08148193359375, 0.10414886474609375, 0.1268157958984375, 0.14948272705078125, 0.172149658203125, 0.19481658935546875, 0.2174835205078125, 0.24015045166015625, 0.2628173828125, 0.28548431396484375, 0.3081512451171875, 0.33081817626953125, 0.353485107421875, 0.37615203857421875, 0.3988189697265625, 0.42148590087890625, 0.44415283203125, 0.46681976318359375, 0.4894866943359375, 0.5121536254882812, 0.534820556640625, 0.5574874877929688, 0.5801544189453125, 0.6028213500976562, 0.62548828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 19.0, 23.0, 22.0, 38.0, 66.0, 100.0, 115.0, 172.0, 266.0, 365.0, 602.0, 1085.0, 3060.0, 22592.0, 625591.0, 375131.0, 14197.0, 2469.0, 1024.0, 523.0, 322.0, 207.0, 146.0, 112.0, 75.0, 54.0, 43.0, 31.0, 31.0, 16.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.46484375, -6.2796630859375, -6.094482421875, -5.9093017578125, -5.72412109375, -5.5389404296875, -5.353759765625, -5.1685791015625, -4.9833984375, -4.7982177734375, -4.613037109375, -4.4278564453125, -4.24267578125, -4.0574951171875, -3.872314453125, -3.6871337890625, -3.501953125, -3.3167724609375, -3.131591796875, -2.9464111328125, -2.76123046875, -2.5760498046875, -2.390869140625, -2.2056884765625, -2.0205078125, -1.8353271484375, -1.650146484375, -1.4649658203125, -1.27978515625, -1.0946044921875, -0.909423828125, -0.7242431640625, -0.5390625, -0.3538818359375, -0.168701171875, 0.0164794921875, 0.20166015625, 0.3868408203125, 0.572021484375, 0.7572021484375, 0.9423828125, 1.1275634765625, 1.312744140625, 1.4979248046875, 1.68310546875, 1.8682861328125, 2.053466796875, 2.2386474609375, 2.423828125, 2.6090087890625, 2.794189453125, 2.9793701171875, 3.16455078125, 3.3497314453125, 3.534912109375, 3.7200927734375, 3.9052734375, 4.0904541015625, 4.275634765625, 4.4608154296875, 4.64599609375, 4.8311767578125, 5.016357421875, 5.2015380859375, 5.38671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 15.0, 16.0, 24.0, 19.0, 20.0, 25.0, 31.0, 41.0, 37.0, 35.0, 44.0, 39.0, 30.0, 34.0, 50.0, 54.0, 44.0, 47.0, 41.0, 33.0, 41.0, 46.0, 31.0, 35.0, 20.0, 17.0, 15.0, 16.0, 14.0, 9.0, 6.0, 8.0, 6.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.30755615234375, -2.2225341796875, -2.13751220703125, -2.052490234375, -1.96746826171875, -1.8824462890625, -1.79742431640625, -1.71240234375, -1.62738037109375, -1.5423583984375, -1.45733642578125, -1.372314453125, -1.28729248046875, -1.2022705078125, -1.11724853515625, -1.0322265625, -0.94720458984375, -0.8621826171875, -0.77716064453125, -0.692138671875, -0.60711669921875, -0.5220947265625, -0.43707275390625, -0.35205078125, -0.26702880859375, -0.1820068359375, -0.09698486328125, -0.011962890625, 0.07305908203125, 0.1580810546875, 0.24310302734375, 0.328125, 0.41314697265625, 0.4981689453125, 0.58319091796875, 0.668212890625, 0.75323486328125, 0.8382568359375, 0.92327880859375, 1.00830078125, 1.09332275390625, 1.1783447265625, 1.26336669921875, 1.348388671875, 1.43341064453125, 1.5184326171875, 1.60345458984375, 1.6884765625, 1.77349853515625, 1.8585205078125, 1.94354248046875, 2.028564453125, 2.11358642578125, 2.1986083984375, 2.28363037109375, 2.36865234375, 2.45367431640625, 2.5386962890625, 2.62371826171875, 2.708740234375, 2.79376220703125, 2.8787841796875, 2.96380615234375, 3.048828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 25.0, 19.0, 36.0, 44.0, 74.0, 81.0, 122.0, 204.0, 365.0, 733.0, 1829.0, 6037.0, 34443.0, 402963.0, 544851.0, 45298.0, 7429.0, 2063.0, 787.0, 415.0, 204.0, 152.0, 81.0, 76.0, 53.0, 33.0, 19.0, 20.0, 10.0, 9.0, 5.0, 8.0, 9.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.9306640625, -1.8685150146484375, -1.806365966796875, -1.7442169189453125, -1.68206787109375, -1.6199188232421875, -1.557769775390625, -1.4956207275390625, -1.4334716796875, -1.3713226318359375, -1.309173583984375, -1.2470245361328125, -1.18487548828125, -1.1227264404296875, -1.060577392578125, -0.9984283447265625, -0.936279296875, -0.8741302490234375, -0.811981201171875, -0.7498321533203125, -0.68768310546875, -0.6255340576171875, -0.563385009765625, -0.5012359619140625, -0.4390869140625, -0.3769378662109375, -0.314788818359375, -0.2526397705078125, -0.19049072265625, -0.1283416748046875, -0.066192626953125, -0.0040435791015625, 0.05810546875, 0.1202545166015625, 0.182403564453125, 0.2445526123046875, 0.30670166015625, 0.3688507080078125, 0.430999755859375, 0.4931488037109375, 0.5552978515625, 0.6174468994140625, 0.679595947265625, 0.7417449951171875, 0.80389404296875, 0.8660430908203125, 0.928192138671875, 0.9903411865234375, 1.052490234375, 1.1146392822265625, 1.176788330078125, 1.2389373779296875, 1.30108642578125, 1.3632354736328125, 1.425384521484375, 1.4875335693359375, 1.5496826171875, 1.6118316650390625, 1.673980712890625, 1.7361297607421875, 1.79827880859375, 1.8604278564453125, 1.922576904296875, 1.9847259521484375, 2.046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 11.0, 16.0, 33.0, 38.0, 47.0, 72.0, 94.0, 98.0, 120.0, 105.0, 86.0, 74.0, 64.0, 35.0, 22.0, 11.0, 13.0, 12.0, 6.0, 9.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000186920166015625, -0.00017854943871498108, -0.00017017871141433716, -0.00016180798411369324, -0.00015343725681304932, -0.0001450665295124054, -0.00013669580221176147, -0.00012832507491111755, -0.00011995434761047363, -0.00011158362030982971, -0.00010321289300918579, -9.484216570854187e-05, -8.647143840789795e-05, -7.810071110725403e-05, -6.972998380661011e-05, -6.135925650596619e-05, -5.2988529205322266e-05, -4.4617801904678345e-05, -3.6247074604034424e-05, -2.7876347303390503e-05, -1.9505620002746582e-05, -1.1134892702102661e-05, -2.7641654014587402e-06, 5.606561899185181e-06, 1.3977289199829102e-05, 2.2348016500473022e-05, 3.071874380111694e-05, 3.9089471101760864e-05, 4.7460198402404785e-05, 5.5830925703048706e-05, 6.420165300369263e-05, 7.257238030433655e-05, 8.094310760498047e-05, 8.931383490562439e-05, 9.768456220626831e-05, 0.00010605528950691223, 0.00011442601680755615, 0.00012279674410820007, 0.000131167471408844, 0.00013953819870948792, 0.00014790892601013184, 0.00015627965331077576, 0.00016465038061141968, 0.0001730211079120636, 0.00018139183521270752, 0.00018976256251335144, 0.00019813328981399536, 0.00020650401711463928, 0.0002148747444152832, 0.00022324547171592712, 0.00023161619901657104, 0.00023998692631721497, 0.0002483576536178589, 0.0002567283809185028, 0.00026509910821914673, 0.00027346983551979065, 0.00028184056282043457, 0.0002902112901210785, 0.0002985820174217224, 0.00030695274472236633, 0.00031532347202301025, 0.0003236941993236542, 0.0003320649266242981, 0.000340435653924942, 0.00034880638122558594]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 4.0, 8.0, 7.0, 16.0, 15.0, 14.0, 32.0, 47.0, 56.0, 97.0, 141.0, 240.0, 465.0, 849.0, 2152.0, 6704.0, 34801.0, 457532.0, 497345.0, 36684.0, 7046.0, 2205.0, 872.0, 485.0, 235.0, 157.0, 102.0, 60.0, 50.0, 33.0, 24.0, 18.0, 8.0, 7.0, 4.0, 7.0, 1.0, 4.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.16796875, -2.100250244140625, -2.03253173828125, -1.964813232421875, -1.8970947265625, -1.829376220703125, -1.76165771484375, -1.693939208984375, -1.626220703125, -1.558502197265625, -1.49078369140625, -1.423065185546875, -1.3553466796875, -1.287628173828125, -1.21990966796875, -1.152191162109375, -1.08447265625, -1.016754150390625, -0.94903564453125, -0.881317138671875, -0.8135986328125, -0.745880126953125, -0.67816162109375, -0.610443115234375, -0.542724609375, -0.475006103515625, -0.40728759765625, -0.339569091796875, -0.2718505859375, -0.204132080078125, -0.13641357421875, -0.068695068359375, -0.0009765625, 0.066741943359375, 0.13446044921875, 0.202178955078125, 0.2698974609375, 0.337615966796875, 0.40533447265625, 0.473052978515625, 0.540771484375, 0.608489990234375, 0.67620849609375, 0.743927001953125, 0.8116455078125, 0.879364013671875, 0.94708251953125, 1.014801025390625, 1.08251953125, 1.150238037109375, 1.21795654296875, 1.285675048828125, 1.3533935546875, 1.421112060546875, 1.48883056640625, 1.556549072265625, 1.624267578125, 1.691986083984375, 1.75970458984375, 1.827423095703125, 1.8951416015625, 1.962860107421875, 2.03057861328125, 2.098297119140625, 2.166015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 1.0, 10.0, 16.0, 24.0, 45.0, 59.0, 105.0, 102.0, 125.0, 110.0, 103.0, 74.0, 51.0, 39.0, 34.0, 20.0, 13.0, 4.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.10009765625, -2.0361328125, -1.97216796875, -1.908203125, -1.84423828125, -1.7802734375, -1.71630859375, -1.65234375, -1.58837890625, -1.5244140625, -1.46044921875, -1.396484375, -1.33251953125, -1.2685546875, -1.20458984375, -1.140625, -1.07666015625, -1.0126953125, -0.94873046875, -0.884765625, -0.82080078125, -0.7568359375, -0.69287109375, -0.62890625, -0.56494140625, -0.5009765625, -0.43701171875, -0.373046875, -0.30908203125, -0.2451171875, -0.18115234375, -0.1171875, -0.05322265625, 0.0107421875, 0.07470703125, 0.138671875, 0.20263671875, 0.2666015625, 0.33056640625, 0.39453125, 0.45849609375, 0.5224609375, 0.58642578125, 0.650390625, 0.71435546875, 0.7783203125, 0.84228515625, 0.90625, 0.97021484375, 1.0341796875, 1.09814453125, 1.162109375, 1.22607421875, 1.2900390625, 1.35400390625, 1.41796875, 1.48193359375, 1.5458984375, 1.60986328125, 1.673828125, 1.73779296875, 1.8017578125, 1.86572265625, 1.9296875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 14.0, 15.0, 22.0, 30.0, 38.0, 55.0, 73.0, 93.0, 117.0, 116.0, 103.0, 104.0, 58.0, 44.0, 32.0, 19.0, 18.0, 10.0, 4.0, 9.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.40669059753418, -15.849669456481934, -15.292649269104004, -14.735628128051758, -14.178607940673828, -13.621586799621582, -13.064565658569336, -12.507545471191406, -11.950525283813477, -11.39350414276123, -10.8364839553833, -10.279462814331055, -9.722442626953125, -9.165421485900879, -8.608400344848633, -8.051380157470703, -7.494359016418457, -6.937338352203369, -6.380317687988281, -5.823296546936035, -5.2662763595581055, -4.709255218505859, -4.1522345542907715, -3.5952138900756836, -3.0381932258605957, -2.481172561645508, -1.9241517782211304, -1.367130994796753, -0.810110330581665, -0.25308966636657715, 0.30393123626708984, 0.8609519004821777, 1.4179725646972656, 1.9749932289123535, 2.5320138931274414, 3.0890347957611084, 3.6460554599761963, 4.203076362609863, 4.760097026824951, 5.317117691040039, 5.874138355255127, 6.431159019470215, 6.988179683685303, 7.545200347900391, 8.102221488952637, 8.659241676330566, 9.216262817382812, 9.773283004760742, 10.330304145812988, 10.887325286865234, 11.444345474243164, 12.00136661529541, 12.55838680267334, 13.115407943725586, 13.672428131103516, 14.229449272155762, 14.786470413208008, 15.343491554260254, 15.900511741638184, 16.45753288269043, 17.01455307006836, 17.57157325744629, 18.12859535217285, 18.68561553955078, 19.24263572692871]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 11.0, 11.0, 15.0, 19.0, 19.0, 15.0, 31.0, 29.0, 40.0, 42.0, 39.0, 44.0, 45.0, 50.0, 45.0, 46.0, 47.0, 49.0, 44.0, 45.0, 36.0, 40.0, 47.0, 27.0, 18.0, 23.0, 27.0, 11.0, 16.0, 13.0, 13.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.54494857788086, -14.098066329956055, -13.65118408203125, -13.204301834106445, -12.75741958618164, -12.310537338256836, -11.863655090332031, -11.416772842407227, -10.969890594482422, -10.523008346557617, -10.076126098632812, -9.629243850708008, -9.182361602783203, -8.735479354858398, -8.288597106933594, -7.841714382171631, -7.394831657409668, -6.947949409484863, -6.501067161560059, -6.054184913635254, -5.607302665710449, -5.1604204177856445, -4.713537693023682, -4.266655445098877, -3.8197731971740723, -3.3728909492492676, -2.926008701324463, -2.479126214981079, -2.0322439670562744, -1.5853617191314697, -1.138479232788086, -0.6915969848632812, -0.24471378326416016, 0.2021685242652893, 0.6490508317947388, 1.095933198928833, 1.5428154468536377, 1.9896976947784424, 2.436580181121826, 2.883462429046631, 3.3303446769714355, 3.7772269248962402, 4.224109172821045, 4.670991897583008, 5.1178741455078125, 5.564756393432617, 6.011638641357422, 6.458520889282227, 6.905403137207031, 7.352285385131836, 7.799167633056641, 8.246049880981445, 8.69293212890625, 9.139814376831055, 9.58669662475586, 10.033578872680664, 10.480461120605469, 10.927343368530273, 11.374225616455078, 11.821107864379883, 12.267990112304688, 12.714872360229492, 13.161754608154297, 13.608636856079102, 14.055520057678223]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 17.0, 22.0, 43.0, 55.0, 88.0, 134.0, 247.0, 551.0, 2223.0, 41773.0, 4139690.0, 7361.0, 1144.0, 384.0, 229.0, 99.0, 54.0, 40.0, 30.0, 13.0, 11.0, 9.0, 12.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.390625, -13.0496826171875, -12.708740234375, -12.3677978515625, -12.02685546875, -11.6859130859375, -11.344970703125, -11.0040283203125, -10.6630859375, -10.3221435546875, -9.981201171875, -9.6402587890625, -9.29931640625, -8.9583740234375, -8.617431640625, -8.2764892578125, -7.935546875, -7.5946044921875, -7.253662109375, -6.9127197265625, -6.57177734375, -6.2308349609375, -5.889892578125, -5.5489501953125, -5.2080078125, -4.8670654296875, -4.526123046875, -4.1851806640625, -3.84423828125, -3.5032958984375, -3.162353515625, -2.8214111328125, -2.48046875, -2.1395263671875, -1.798583984375, -1.4576416015625, -1.11669921875, -0.7757568359375, -0.434814453125, -0.0938720703125, 0.2470703125, 0.5880126953125, 0.928955078125, 1.2698974609375, 1.61083984375, 1.9517822265625, 2.292724609375, 2.6336669921875, 2.974609375, 3.3155517578125, 3.656494140625, 3.9974365234375, 4.33837890625, 4.6793212890625, 5.020263671875, 5.3612060546875, 5.7021484375, 6.0430908203125, 6.384033203125, 6.7249755859375, 7.06591796875, 7.4068603515625, 7.747802734375, 8.0887451171875, 8.4296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 8.0, 10.0, 15.0, 15.0, 30.0, 26.0, 23.0, 55.0, 42.0, 57.0, 46.0, 70.0, 62.0, 64.0, 63.0, 60.0, 50.0, 40.0, 41.0, 42.0, 34.0, 30.0, 26.0, 19.0, 14.0, 16.0, 7.0, 7.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8100433349609375, -0.782684326171875, -0.7553253173828125, -0.72796630859375, -0.7006072998046875, -0.673248291015625, -0.6458892822265625, -0.6185302734375, -0.5911712646484375, -0.563812255859375, -0.5364532470703125, -0.50909423828125, -0.4817352294921875, -0.454376220703125, -0.4270172119140625, -0.399658203125, -0.3722991943359375, -0.344940185546875, -0.3175811767578125, -0.29022216796875, -0.2628631591796875, -0.235504150390625, -0.2081451416015625, -0.1807861328125, -0.1534271240234375, -0.126068115234375, -0.0987091064453125, -0.07135009765625, -0.0439910888671875, -0.016632080078125, 0.0107269287109375, 0.0380859375, 0.0654449462890625, 0.092803955078125, 0.1201629638671875, 0.14752197265625, 0.1748809814453125, 0.202239990234375, 0.2295989990234375, 0.2569580078125, 0.2843170166015625, 0.311676025390625, 0.3390350341796875, 0.36639404296875, 0.3937530517578125, 0.421112060546875, 0.4484710693359375, 0.475830078125, 0.5031890869140625, 0.530548095703125, 0.5579071044921875, 0.58526611328125, 0.6126251220703125, 0.639984130859375, 0.6673431396484375, 0.6947021484375, 0.7220611572265625, 0.749420166015625, 0.7767791748046875, 0.80413818359375, 0.8314971923828125, 0.858856201171875, 0.8862152099609375, 0.91357421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 5.0, 3.0, 14.0, 18.0, 22.0, 31.0, 53.0, 66.0, 91.0, 115.0, 181.0, 346.0, 620.0, 1110.0, 2436.0, 6118.0, 21587.0, 257002.0, 3853134.0, 36748.0, 8336.0, 3110.0, 1360.0, 702.0, 372.0, 223.0, 161.0, 78.0, 60.0, 50.0, 40.0, 20.0, 20.0, 8.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.4915771484375, -2.403076171875, -2.3145751953125, -2.22607421875, -2.1375732421875, -2.049072265625, -1.9605712890625, -1.8720703125, -1.7835693359375, -1.695068359375, -1.6065673828125, -1.51806640625, -1.4295654296875, -1.341064453125, -1.2525634765625, -1.1640625, -1.0755615234375, -0.987060546875, -0.8985595703125, -0.81005859375, -0.7215576171875, -0.633056640625, -0.5445556640625, -0.4560546875, -0.3675537109375, -0.279052734375, -0.1905517578125, -0.10205078125, -0.0135498046875, 0.074951171875, 0.1634521484375, 0.251953125, 0.3404541015625, 0.428955078125, 0.5174560546875, 0.60595703125, 0.6944580078125, 0.782958984375, 0.8714599609375, 0.9599609375, 1.0484619140625, 1.136962890625, 1.2254638671875, 1.31396484375, 1.4024658203125, 1.490966796875, 1.5794677734375, 1.66796875, 1.7564697265625, 1.844970703125, 1.9334716796875, 2.02197265625, 2.1104736328125, 2.198974609375, 2.2874755859375, 2.3759765625, 2.4644775390625, 2.552978515625, 2.6414794921875, 2.72998046875, 2.8184814453125, 2.906982421875, 2.9954833984375, 3.083984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 25.0, 55.0, 146.0, 3173.0, 455.0, 102.0, 36.0, 14.0, 6.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0783615112304688, -1.0532073974609375, -1.0280532836914062, -1.002899169921875, -0.9777450561523438, -0.9525909423828125, -0.9274368286132812, -0.90228271484375, -0.8771286010742188, -0.8519744873046875, -0.8268203735351562, -0.801666259765625, -0.7765121459960938, -0.7513580322265625, -0.7262039184570312, -0.7010498046875, -0.6758956909179688, -0.6507415771484375, -0.6255874633789062, -0.600433349609375, -0.5752792358398438, -0.5501251220703125, -0.5249710083007812, -0.49981689453125, -0.47466278076171875, -0.4495086669921875, -0.42435455322265625, -0.399200439453125, -0.37404632568359375, -0.3488922119140625, -0.32373809814453125, -0.298583984375, -0.27342987060546875, -0.2482757568359375, -0.22312164306640625, -0.197967529296875, -0.17281341552734375, -0.1476593017578125, -0.12250518798828125, -0.09735107421875, -0.07219696044921875, -0.0470428466796875, -0.02188873291015625, 0.003265380859375, 0.02841949462890625, 0.0535736083984375, 0.07872772216796875, 0.1038818359375, 0.12903594970703125, 0.1541900634765625, 0.17934417724609375, 0.204498291015625, 0.22965240478515625, 0.2548065185546875, 0.27996063232421875, 0.30511474609375, 0.33026885986328125, 0.3554229736328125, 0.38057708740234375, 0.405731201171875, 0.43088531494140625, 0.4560394287109375, 0.48119354248046875, 0.50634765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 10.0, 20.0, 26.0, 49.0, 84.0, 118.0, 163.0, 151.0, 137.0, 111.0, 45.0, 31.0, 18.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039318323135376, -2.9488184452056885, -2.85831880569458, -2.7678189277648926, -2.677319049835205, -2.5868191719055176, -2.496319532394409, -2.4058196544647217, -2.315319776535034, -2.2248198986053467, -2.1343202590942383, -2.043820381164551, -1.9533205032348633, -1.8628207445144653, -1.7723209857940674, -1.6818211078643799, -1.591321349143982, -1.500821590423584, -1.4103217124938965, -1.3198219537734985, -1.229322075843811, -1.138822317123413, -1.0483224391937256, -0.9578226804733276, -0.8673228621482849, -0.7768230438232422, -0.6863232254981995, -0.5958234071731567, -0.5053236484527588, -0.4148238003253937, -0.32432401180267334, -0.23382419347763062, -0.1433243751525879, -0.05282456427812576, 0.037675246596336365, 0.1281750500202179, 0.21867486834526062, 0.30917468667030334, 0.3996744751930237, 0.4901742935180664, 0.5806741118431091, 0.6711739301681519, 0.7616737484931946, 0.8521735668182373, 0.9426733255386353, 1.0331732034683228, 1.1236729621887207, 1.2141728401184082, 1.3046725988388062, 1.395172357559204, 1.4856722354888916, 1.5761719942092896, 1.666671872138977, 1.757171630859375, 1.8476715087890625, 1.9381712675094604, 2.0286710262298584, 2.119170904159546, 2.2096705436706543, 2.300170421600342, 2.3906702995300293, 2.481170177459717, 2.571669816970825, 2.6621696949005127, 2.7526695728302]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 11.0, 9.0, 14.0, 7.0, 24.0, 22.0, 32.0, 29.0, 32.0, 33.0, 40.0, 52.0, 51.0, 44.0, 64.0, 47.0, 44.0, 63.0, 46.0, 42.0, 31.0, 33.0, 28.0, 37.0, 36.0, 23.0, 32.0, 18.0, 12.0, 6.0, 4.0, 2.0, 5.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.798314094543457, -1.747164011001587, -1.6960139274597168, -1.6448638439178467, -1.5937137603759766, -1.5425636768341064, -1.4914137125015259, -1.4402636289596558, -1.3891135454177856, -1.3379634618759155, -1.2868133783340454, -1.2356632947921753, -1.1845133304595947, -1.1333632469177246, -1.0822131633758545, -1.0310630798339844, -0.9799129962921143, -0.9287629127502441, -0.877612829208374, -0.8264628052711487, -0.7753127217292786, -0.7241626381874084, -0.6730126142501831, -0.621862530708313, -0.5707124471664429, -0.5195623636245728, -0.468412309885025, -0.4172622561454773, -0.3661121726036072, -0.31496208906173706, -0.26381203532218933, -0.2126619815826416, -0.16151189804077148, -0.11036182940006256, -0.05921176075935364, -0.008061692118644714, 0.04308837652206421, 0.09423846006393433, 0.14538851380348206, 0.19653856754302979, 0.2476886510848999, 0.29883873462677, 0.34998878836631775, 0.4011388421058655, 0.4522889256477356, 0.5034390091896057, 0.554589033126831, 0.6057391166687012, 0.6568892002105713, 0.7080392837524414, 0.7591893672943115, 0.8103393912315369, 0.861489474773407, 0.9126395583152771, 0.9637895822525024, 1.0149396657943726, 1.0660897493362427, 1.1172398328781128, 1.168389916419983, 1.219539999961853, 1.2706899642944336, 1.3218400478363037, 1.3729901313781738, 1.424140214920044, 1.475290298461914]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 5.0, 13.0, 19.0, 31.0, 55.0, 69.0, 139.0, 266.0, 561.0, 1141.0, 2871.0, 9184.0, 37109.0, 178648.0, 513278.0, 238060.0, 49100.0, 11849.0, 3618.0, 1334.0, 553.0, 269.0, 132.0, 91.0, 49.0, 30.0, 22.0, 10.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.498046875, -3.404998779296875, -3.31195068359375, -3.218902587890625, -3.1258544921875, -3.032806396484375, -2.93975830078125, -2.846710205078125, -2.753662109375, -2.660614013671875, -2.56756591796875, -2.474517822265625, -2.3814697265625, -2.288421630859375, -2.19537353515625, -2.102325439453125, -2.00927734375, -1.916229248046875, -1.82318115234375, -1.730133056640625, -1.6370849609375, -1.544036865234375, -1.45098876953125, -1.357940673828125, -1.264892578125, -1.171844482421875, -1.07879638671875, -0.985748291015625, -0.8927001953125, -0.799652099609375, -0.70660400390625, -0.613555908203125, -0.5205078125, -0.427459716796875, -0.33441162109375, -0.241363525390625, -0.1483154296875, -0.055267333984375, 0.03778076171875, 0.130828857421875, 0.223876953125, 0.316925048828125, 0.40997314453125, 0.503021240234375, 0.5960693359375, 0.689117431640625, 0.78216552734375, 0.875213623046875, 0.96826171875, 1.061309814453125, 1.15435791015625, 1.247406005859375, 1.3404541015625, 1.433502197265625, 1.52655029296875, 1.619598388671875, 1.712646484375, 1.805694580078125, 1.89874267578125, 1.991790771484375, 2.0848388671875, 2.177886962890625, 2.27093505859375, 2.363983154296875, 2.45703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 11.0, 12.0, 19.0, 19.0, 32.0, 36.0, 32.0, 56.0, 63.0, 56.0, 58.0, 65.0, 67.0, 73.0, 57.0, 51.0, 48.0, 43.0, 37.0, 37.0, 23.0, 21.0, 14.0, 16.0, 10.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.7950592041015625, -0.763946533203125, -0.7328338623046875, -0.70172119140625, -0.6706085205078125, -0.639495849609375, -0.6083831787109375, -0.5772705078125, -0.5461578369140625, -0.515045166015625, -0.4839324951171875, -0.45281982421875, -0.4217071533203125, -0.390594482421875, -0.3594818115234375, -0.328369140625, -0.2972564697265625, -0.266143798828125, -0.2350311279296875, -0.20391845703125, -0.1728057861328125, -0.141693115234375, -0.1105804443359375, -0.0794677734375, -0.0483551025390625, -0.017242431640625, 0.0138702392578125, 0.04498291015625, 0.0760955810546875, 0.107208251953125, 0.1383209228515625, 0.16943359375, 0.2005462646484375, 0.231658935546875, 0.2627716064453125, 0.29388427734375, 0.3249969482421875, 0.356109619140625, 0.3872222900390625, 0.4183349609375, 0.4494476318359375, 0.480560302734375, 0.5116729736328125, 0.54278564453125, 0.5738983154296875, 0.605010986328125, 0.6361236572265625, 0.667236328125, 0.6983489990234375, 0.729461669921875, 0.7605743408203125, 0.79168701171875, 0.8227996826171875, 0.853912353515625, 0.8850250244140625, 0.9161376953125, 0.9472503662109375, 0.978363037109375, 1.0094757080078125, 1.04058837890625, 1.0717010498046875, 1.102813720703125, 1.1339263916015625, 1.1650390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 11.0, 8.0, 9.0, 10.0, 30.0, 46.0, 81.0, 84.0, 114.0, 210.0, 328.0, 601.0, 1155.0, 2887.0, 25646.0, 858131.0, 149706.0, 6021.0, 1577.0, 766.0, 429.0, 257.0, 164.0, 93.0, 70.0, 49.0, 20.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.9705810546875, -6.757568359375, -6.5445556640625, -6.33154296875, -6.1185302734375, -5.905517578125, -5.6925048828125, -5.4794921875, -5.2664794921875, -5.053466796875, -4.8404541015625, -4.62744140625, -4.4144287109375, -4.201416015625, -3.9884033203125, -3.775390625, -3.5623779296875, -3.349365234375, -3.1363525390625, -2.92333984375, -2.7103271484375, -2.497314453125, -2.2843017578125, -2.0712890625, -1.8582763671875, -1.645263671875, -1.4322509765625, -1.21923828125, -1.0062255859375, -0.793212890625, -0.5802001953125, -0.3671875, -0.1541748046875, 0.058837890625, 0.2718505859375, 0.48486328125, 0.6978759765625, 0.910888671875, 1.1239013671875, 1.3369140625, 1.5499267578125, 1.762939453125, 1.9759521484375, 2.18896484375, 2.4019775390625, 2.614990234375, 2.8280029296875, 3.041015625, 3.2540283203125, 3.467041015625, 3.6800537109375, 3.89306640625, 4.1060791015625, 4.319091796875, 4.5321044921875, 4.7451171875, 4.9581298828125, 5.171142578125, 5.3841552734375, 5.59716796875, 5.8101806640625, 6.023193359375, 6.2362060546875, 6.44921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 0.0, 7.0, 7.0, 9.0, 10.0, 18.0, 25.0, 28.0, 23.0, 38.0, 46.0, 58.0, 53.0, 48.0, 89.0, 66.0, 58.0, 72.0, 60.0, 47.0, 46.0, 47.0, 38.0, 26.0, 21.0, 19.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.11285400390625, -3.9522705078125, -3.79168701171875, -3.631103515625, -3.47052001953125, -3.3099365234375, -3.14935302734375, -2.98876953125, -2.82818603515625, -2.6676025390625, -2.50701904296875, -2.346435546875, -2.18585205078125, -2.0252685546875, -1.86468505859375, -1.7041015625, -1.54351806640625, -1.3829345703125, -1.22235107421875, -1.061767578125, -0.90118408203125, -0.7406005859375, -0.58001708984375, -0.41943359375, -0.25885009765625, -0.0982666015625, 0.06231689453125, 0.222900390625, 0.38348388671875, 0.5440673828125, 0.70465087890625, 0.865234375, 1.02581787109375, 1.1864013671875, 1.34698486328125, 1.507568359375, 1.66815185546875, 1.8287353515625, 1.98931884765625, 2.14990234375, 2.31048583984375, 2.4710693359375, 2.63165283203125, 2.792236328125, 2.95281982421875, 3.1134033203125, 3.27398681640625, 3.4345703125, 3.59515380859375, 3.7557373046875, 3.91632080078125, 4.076904296875, 4.23748779296875, 4.3980712890625, 4.55865478515625, 4.71923828125, 4.87982177734375, 5.0404052734375, 5.20098876953125, 5.361572265625, 5.52215576171875, 5.6827392578125, 5.84332275390625, 6.00390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 7.0, 19.0, 15.0, 35.0, 50.0, 57.0, 127.0, 182.0, 374.0, 1031.0, 10553.0, 974315.0, 58658.0, 1952.0, 545.0, 228.0, 130.0, 82.0, 59.0, 34.0, 22.0, 11.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.64227294921875, -5.4642333984375, -5.28619384765625, -5.108154296875, -4.93011474609375, -4.7520751953125, -4.57403564453125, -4.39599609375, -4.21795654296875, -4.0399169921875, -3.86187744140625, -3.683837890625, -3.50579833984375, -3.3277587890625, -3.14971923828125, -2.9716796875, -2.79364013671875, -2.6156005859375, -2.43756103515625, -2.259521484375, -2.08148193359375, -1.9034423828125, -1.72540283203125, -1.54736328125, -1.36932373046875, -1.1912841796875, -1.01324462890625, -0.835205078125, -0.65716552734375, -0.4791259765625, -0.30108642578125, -0.123046875, 0.05499267578125, 0.2330322265625, 0.41107177734375, 0.589111328125, 0.76715087890625, 0.9451904296875, 1.12322998046875, 1.30126953125, 1.47930908203125, 1.6573486328125, 1.83538818359375, 2.013427734375, 2.19146728515625, 2.3695068359375, 2.54754638671875, 2.7255859375, 2.90362548828125, 3.0816650390625, 3.25970458984375, 3.437744140625, 3.61578369140625, 3.7938232421875, 3.97186279296875, 4.14990234375, 4.32794189453125, 4.5059814453125, 4.68402099609375, 4.862060546875, 5.04010009765625, 5.2181396484375, 5.39617919921875, 5.57421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 6.0, 3.0, 11.0, 5.0, 11.0, 16.0, 20.0, 23.0, 36.0, 31.0, 58.0, 73.0, 98.0, 103.0, 115.0, 84.0, 59.0, 55.0, 39.0, 37.0, 25.0, 20.0, 10.0, 9.0, 11.0, 8.0, 4.0, 4.0, 3.0, 4.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022470951080322266, -0.0002178587019443512, -0.00021100789308547974, -0.00020415708422660828, -0.00019730627536773682, -0.00019045546650886536, -0.0001836046576499939, -0.00017675384879112244, -0.00016990303993225098, -0.00016305223107337952, -0.00015620142221450806, -0.0001493506133556366, -0.00014249980449676514, -0.00013564899563789368, -0.00012879818677902222, -0.00012194737792015076, -0.0001150965690612793, -0.00010824576020240784, -0.00010139495134353638, -9.454414248466492e-05, -8.769333362579346e-05, -8.0842524766922e-05, -7.399171590805054e-05, -6.714090704917908e-05, -6.029009819030762e-05, -5.343928933143616e-05, -4.65884804725647e-05, -3.973767161369324e-05, -3.288686275482178e-05, -2.6036053895950317e-05, -1.9185245037078857e-05, -1.2334436178207397e-05, -5.4836273193359375e-06, 1.3671815395355225e-06, 8.217990398406982e-06, 1.5068799257278442e-05, 2.1919608116149902e-05, 2.8770416975021362e-05, 3.562122583389282e-05, 4.247203469276428e-05, 4.932284355163574e-05, 5.61736524105072e-05, 6.302446126937866e-05, 6.987527012825012e-05, 7.672607898712158e-05, 8.357688784599304e-05, 9.04276967048645e-05, 9.727850556373596e-05, 0.00010412931442260742, 0.00011098012328147888, 0.00011783093214035034, 0.0001246817409992218, 0.00013153254985809326, 0.00013838335871696472, 0.00014523416757583618, 0.00015208497643470764, 0.0001589357852935791, 0.00016578659415245056, 0.00017263740301132202, 0.00017948821187019348, 0.00018633902072906494, 0.0001931898295879364, 0.00020004063844680786, 0.00020689144730567932, 0.00021374225616455078]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 12.0, 4.0, 11.0, 7.0, 20.0, 25.0, 40.0, 41.0, 72.0, 118.0, 180.0, 322.0, 794.0, 2212.0, 10675.0, 251798.0, 757432.0, 19608.0, 3113.0, 987.0, 449.0, 237.0, 140.0, 78.0, 48.0, 41.0, 25.0, 17.0, 10.0, 10.0, 9.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.442413330078125, -3.32818603515625, -3.213958740234375, -3.0997314453125, -2.985504150390625, -2.87127685546875, -2.757049560546875, -2.642822265625, -2.528594970703125, -2.41436767578125, -2.300140380859375, -2.1859130859375, -2.071685791015625, -1.95745849609375, -1.843231201171875, -1.72900390625, -1.614776611328125, -1.50054931640625, -1.386322021484375, -1.2720947265625, -1.157867431640625, -1.04364013671875, -0.929412841796875, -0.815185546875, -0.700958251953125, -0.58673095703125, -0.472503662109375, -0.3582763671875, -0.244049072265625, -0.12982177734375, -0.015594482421875, 0.0986328125, 0.212860107421875, 0.32708740234375, 0.441314697265625, 0.5555419921875, 0.669769287109375, 0.78399658203125, 0.898223876953125, 1.012451171875, 1.126678466796875, 1.24090576171875, 1.355133056640625, 1.4693603515625, 1.583587646484375, 1.69781494140625, 1.812042236328125, 1.92626953125, 2.040496826171875, 2.15472412109375, 2.268951416015625, 2.3831787109375, 2.497406005859375, 2.61163330078125, 2.725860595703125, 2.840087890625, 2.954315185546875, 3.06854248046875, 3.182769775390625, 3.2969970703125, 3.411224365234375, 3.52545166015625, 3.639678955078125, 3.75390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 8.0, 10.0, 28.0, 39.0, 51.0, 53.0, 94.0, 132.0, 134.0, 129.0, 71.0, 72.0, 59.0, 28.0, 20.0, 11.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.59381103515625, -2.5079345703125, -2.42205810546875, -2.336181640625, -2.25030517578125, -2.1644287109375, -2.07855224609375, -1.99267578125, -1.90679931640625, -1.8209228515625, -1.73504638671875, -1.649169921875, -1.56329345703125, -1.4774169921875, -1.39154052734375, -1.3056640625, -1.21978759765625, -1.1339111328125, -1.04803466796875, -0.962158203125, -0.87628173828125, -0.7904052734375, -0.70452880859375, -0.61865234375, -0.53277587890625, -0.4468994140625, -0.36102294921875, -0.275146484375, -0.18927001953125, -0.1033935546875, -0.01751708984375, 0.068359375, 0.15423583984375, 0.2401123046875, 0.32598876953125, 0.411865234375, 0.49774169921875, 0.5836181640625, 0.66949462890625, 0.75537109375, 0.84124755859375, 0.9271240234375, 1.01300048828125, 1.098876953125, 1.18475341796875, 1.2706298828125, 1.35650634765625, 1.4423828125, 1.52825927734375, 1.6141357421875, 1.70001220703125, 1.785888671875, 1.87176513671875, 1.9576416015625, 2.04351806640625, 2.12939453125, 2.21527099609375, 2.3011474609375, 2.38702392578125, 2.472900390625, 2.55877685546875, 2.6446533203125, 2.73052978515625, 2.81640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 28.0, 142.0, 433.0, 325.0, 60.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.46310424804688, -102.12818908691406, -99.79326629638672, -97.45834350585938, -95.12342834472656, -92.78851318359375, -90.4535903930664, -88.11866760253906, -85.78375244140625, -83.44883728027344, -81.1139144897461, -78.77899169921875, -76.44407653808594, -74.10916137695312, -71.77423858642578, -69.43931579589844, -67.10440063476562, -64.76948547363281, -62.43456268310547, -60.09964370727539, -57.76472473144531, -55.429805755615234, -53.094886779785156, -50.75996780395508, -48.425048828125, -46.09012985229492, -43.755210876464844, -41.420291900634766, -39.08537292480469, -36.75045394897461, -34.41553497314453, -32.08061599731445, -29.745704650878906, -27.410785675048828, -25.07586669921875, -22.740947723388672, -20.406028747558594, -18.071109771728516, -15.736190795898438, -13.40127182006836, -11.066352844238281, -8.731433868408203, -6.396514892578125, -4.061595916748047, -1.7266769409179688, 0.6082420349121094, 2.9431610107421875, 5.278079986572266, 7.612998962402344, 9.947917938232422, 12.2828369140625, 14.617755889892578, 16.952674865722656, 19.287593841552734, 21.622512817382812, 23.95743179321289, 26.29235076904297, 28.627269744873047, 30.962188720703125, 33.2971076965332, 35.63202667236328, 37.96694564819336, 40.30186462402344, 42.636783599853516, 44.971702575683594]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 6.0, 4.0, 12.0, 7.0, 9.0, 11.0, 18.0, 17.0, 17.0, 21.0, 25.0, 30.0, 32.0, 35.0, 34.0, 34.0, 38.0, 43.0, 53.0, 34.0, 47.0, 45.0, 50.0, 41.0, 40.0, 38.0, 27.0, 28.0, 21.0, 25.0, 32.0, 24.0, 19.0, 9.0, 7.0, 5.0, 13.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.858171463012695, -15.4027681350708, -14.947365760803223, -14.491962432861328, -14.03656005859375, -13.581156730651855, -13.125754356384277, -12.670351028442383, -12.214948654174805, -11.75954532623291, -11.304142951965332, -10.848739624023438, -10.39333724975586, -9.937933921813965, -9.482531547546387, -9.027128219604492, -8.571725845336914, -8.11632251739502, -7.660920143127441, -7.205517292022705, -6.750114440917969, -6.294711112976074, -5.839308738708496, -5.383905410766602, -4.928502082824707, -4.473099231719971, -4.017696380615234, -3.562293529510498, -3.1068906784057617, -2.6514875888824463, -2.19608473777771, -1.7406818866729736, -1.2852792739868164, -0.8298764228820801, -0.374473512172699, 0.08092939853668213, 0.5363322496414185, 0.9917352199554443, 1.4471380710601807, 1.902540922164917, 2.3579437732696533, 2.8133466243743896, 3.268749475479126, 3.7241525650024414, 4.179555416107178, 4.634958267211914, 5.09036111831665, 5.545763969421387, 6.001166820526123, 6.456569671630859, 6.911972522735596, 7.367375373840332, 7.822778224945068, 8.278181076049805, 8.7335844039917, 9.188986778259277, 9.644390106201172, 10.099793434143066, 10.555195808410645, 11.010599136352539, 11.466001510620117, 11.921404838562012, 12.37680721282959, 12.832210540771484, 13.287612915039062]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 12.0, 16.0, 24.0, 42.0, 66.0, 113.0, 169.0, 261.0, 529.0, 1086.0, 3374.0, 24605.0, 4050376.0, 103531.0, 6759.0, 1683.0, 723.0, 373.0, 191.0, 123.0, 64.0, 43.0, 27.0, 15.0, 12.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0], "bins": [-6.80859375, -6.63714599609375, -6.4656982421875, -6.29425048828125, -6.122802734375, -5.95135498046875, -5.7799072265625, -5.60845947265625, -5.43701171875, -5.26556396484375, -5.0941162109375, -4.92266845703125, -4.751220703125, -4.57977294921875, -4.4083251953125, -4.23687744140625, -4.0654296875, -3.89398193359375, -3.7225341796875, -3.55108642578125, -3.379638671875, -3.20819091796875, -3.0367431640625, -2.86529541015625, -2.69384765625, -2.52239990234375, -2.3509521484375, -2.17950439453125, -2.008056640625, -1.83660888671875, -1.6651611328125, -1.49371337890625, -1.322265625, -1.15081787109375, -0.9793701171875, -0.80792236328125, -0.636474609375, -0.46502685546875, -0.2935791015625, -0.12213134765625, 0.04931640625, 0.22076416015625, 0.3922119140625, 0.56365966796875, 0.735107421875, 0.90655517578125, 1.0780029296875, 1.24945068359375, 1.4208984375, 1.59234619140625, 1.7637939453125, 1.93524169921875, 2.106689453125, 2.27813720703125, 2.4495849609375, 2.62103271484375, 2.79248046875, 2.96392822265625, 3.1353759765625, 3.30682373046875, 3.478271484375, 3.64971923828125, 3.8211669921875, 3.99261474609375, 4.1640625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 6.0, 2.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 12.0, 26.0, 37.0, 36.0, 41.0, 46.0, 51.0, 62.0, 61.0, 52.0, 41.0, 51.0, 45.0, 47.0, 61.0, 35.0, 31.0, 34.0, 36.0, 21.0, 15.0, 14.0, 16.0, 13.0, 7.0, 6.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.9150390625, -0.889007568359375, -0.86297607421875, -0.836944580078125, -0.8109130859375, -0.784881591796875, -0.75885009765625, -0.732818603515625, -0.706787109375, -0.680755615234375, -0.65472412109375, -0.628692626953125, -0.6026611328125, -0.576629638671875, -0.55059814453125, -0.524566650390625, -0.49853515625, -0.472503662109375, -0.44647216796875, -0.420440673828125, -0.3944091796875, -0.368377685546875, -0.34234619140625, -0.316314697265625, -0.290283203125, -0.264251708984375, -0.23822021484375, -0.212188720703125, -0.1861572265625, -0.160125732421875, -0.13409423828125, -0.108062744140625, -0.08203125, -0.055999755859375, -0.02996826171875, -0.003936767578125, 0.0220947265625, 0.048126220703125, 0.07415771484375, 0.100189208984375, 0.126220703125, 0.152252197265625, 0.17828369140625, 0.204315185546875, 0.2303466796875, 0.256378173828125, 0.28240966796875, 0.308441162109375, 0.33447265625, 0.360504150390625, 0.38653564453125, 0.412567138671875, 0.4385986328125, 0.464630126953125, 0.49066162109375, 0.516693115234375, 0.542724609375, 0.568756103515625, 0.59478759765625, 0.620819091796875, 0.6468505859375, 0.672882080078125, 0.69891357421875, 0.724945068359375, 0.7509765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 10.0, 7.0, 19.0, 11.0, 22.0, 28.0, 36.0, 41.0, 50.0, 79.0, 105.0, 172.0, 268.0, 416.0, 663.0, 1235.0, 2625.0, 6999.0, 27291.0, 336434.0, 3752924.0, 47351.0, 10187.0, 3471.0, 1607.0, 814.0, 456.0, 285.0, 209.0, 130.0, 88.0, 60.0, 60.0, 26.0, 18.0, 22.0, 16.0, 13.0, 7.0, 6.0, 8.0, 3.0, 6.0, 1.0, 6.0, 0.0, 1.0, 3.0], "bins": [-3.119140625, -3.032867431640625, -2.94659423828125, -2.860321044921875, -2.7740478515625, -2.687774658203125, -2.60150146484375, -2.515228271484375, -2.428955078125, -2.342681884765625, -2.25640869140625, -2.170135498046875, -2.0838623046875, -1.997589111328125, -1.91131591796875, -1.825042724609375, -1.73876953125, -1.652496337890625, -1.56622314453125, -1.479949951171875, -1.3936767578125, -1.307403564453125, -1.22113037109375, -1.134857177734375, -1.048583984375, -0.962310791015625, -0.87603759765625, -0.789764404296875, -0.7034912109375, -0.617218017578125, -0.53094482421875, -0.444671630859375, -0.3583984375, -0.272125244140625, -0.18585205078125, -0.099578857421875, -0.0133056640625, 0.072967529296875, 0.15924072265625, 0.245513916015625, 0.331787109375, 0.418060302734375, 0.50433349609375, 0.590606689453125, 0.6768798828125, 0.763153076171875, 0.84942626953125, 0.935699462890625, 1.02197265625, 1.108245849609375, 1.19451904296875, 1.280792236328125, 1.3670654296875, 1.453338623046875, 1.53961181640625, 1.625885009765625, 1.712158203125, 1.798431396484375, 1.88470458984375, 1.970977783203125, 2.0572509765625, 2.143524169921875, 2.22979736328125, 2.316070556640625, 2.40234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 19.0, 49.0, 83.0, 417.0, 3124.0, 209.0, 58.0, 31.0, 22.0, 15.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.26971435546875, -1.2152099609375, -1.16070556640625, -1.106201171875, -1.05169677734375, -0.9971923828125, -0.94268798828125, -0.88818359375, -0.83367919921875, -0.7791748046875, -0.72467041015625, -0.670166015625, -0.61566162109375, -0.5611572265625, -0.50665283203125, -0.4521484375, -0.39764404296875, -0.3431396484375, -0.28863525390625, -0.234130859375, -0.17962646484375, -0.1251220703125, -0.07061767578125, -0.01611328125, 0.03839111328125, 0.0928955078125, 0.14739990234375, 0.201904296875, 0.25640869140625, 0.3109130859375, 0.36541748046875, 0.419921875, 0.47442626953125, 0.5289306640625, 0.58343505859375, 0.637939453125, 0.69244384765625, 0.7469482421875, 0.80145263671875, 0.85595703125, 0.91046142578125, 0.9649658203125, 1.01947021484375, 1.073974609375, 1.12847900390625, 1.1829833984375, 1.23748779296875, 1.2919921875, 1.34649658203125, 1.4010009765625, 1.45550537109375, 1.510009765625, 1.56451416015625, 1.6190185546875, 1.67352294921875, 1.72802734375, 1.78253173828125, 1.8370361328125, 1.89154052734375, 1.946044921875, 2.00054931640625, 2.0550537109375, 2.10955810546875, 2.1640625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 14.0, 32.0, 64.0, 136.0, 208.0, 234.0, 148.0, 81.0, 39.0, 17.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1591782569885254, -2.898341178894043, -2.6375041007995605, -2.376666784286499, -2.1158297061920166, -1.8549926280975342, -1.5941554307937622, -1.3333182334899902, -1.0724811553955078, -0.8116440176963806, -0.5508068799972534, -0.2899697422981262, -0.029132604598999023, 0.2317044734954834, 0.49254167079925537, 0.7533788681030273, 1.0142159461975098, 1.2750530242919922, 1.5358902215957642, 1.7967274188995361, 2.0575644969940186, 2.318401575088501, 2.5792388916015625, 2.840075969696045, 3.1009130477905273, 3.3617501258850098, 3.622587203979492, 3.8834245204925537, 4.144261360168457, 4.405098915100098, 4.66593599319458, 4.9267730712890625, 5.187610626220703, 5.4484477043151855, 5.709284782409668, 5.97012186050415, 6.230958938598633, 6.491796493530273, 6.752633571624756, 7.013470649719238, 7.274307727813721, 7.535144805908203, 7.7959818840026855, 8.056818962097168, 8.317656517028809, 8.578493118286133, 8.839330673217773, 9.100168228149414, 9.361004829406738, 9.621842384338379, 9.882678985595703, 10.143516540527344, 10.404353141784668, 10.665190696716309, 10.926027297973633, 11.186864852905273, 11.447702407836914, 11.708539962768555, 11.969376564025879, 12.23021411895752, 12.491050720214844, 12.751888275146484, 13.012724876403809, 13.27356243133545, 13.534399032592773]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 14.0, 18.0, 20.0, 35.0, 36.0, 28.0, 41.0, 45.0, 53.0, 64.0, 59.0, 55.0, 67.0, 52.0, 58.0, 57.0, 46.0, 38.0, 35.0, 21.0, 28.0, 21.0, 18.0, 10.0, 10.0, 8.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.197094440460205, -4.079265117645264, -3.961435317993164, -3.8436059951782227, -3.725776433944702, -3.6079468727111816, -3.490117311477661, -3.3722877502441406, -3.254458427429199, -3.1366288661956787, -3.018799304962158, -2.900969982147217, -2.7831404209136963, -2.665310859680176, -2.5474812984466553, -2.4296517372131348, -2.3118221759796143, -2.1939926147460938, -2.0761630535125732, -1.9583336114883423, -1.8405041694641113, -1.7226746082305908, -1.6048450469970703, -1.4870154857635498, -1.3691860437393188, -1.2513564825057983, -1.1335270404815674, -1.0156974792480469, -0.8978679776191711, -0.7800384759902954, -0.6622089147567749, -0.5443794131278992, -0.42654991149902344, -0.3087204098701477, -0.19089087843894958, -0.07306134700775146, 0.04476815462112427, 0.16259765625, 0.2804272174835205, 0.39825671911239624, 0.516086220741272, 0.6339157223701477, 0.7517452239990234, 0.869574785232544, 0.9874042868614197, 1.1052337884902954, 1.223063349723816, 1.3408927917480469, 1.4587223529815674, 1.576551914215088, 1.6943813562393188, 1.8122109174728394, 1.9300403594970703, 2.047869920730591, 2.1656994819641113, 2.283529043197632, 2.4013586044311523, 2.519188165664673, 2.6370177268981934, 2.7548470497131348, 2.8726766109466553, 2.990506172180176, 3.1083357334136963, 3.226165294647217, 3.343994617462158]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 18.0, 36.0, 46.0, 62.0, 118.0, 201.0, 419.0, 857.0, 1965.0, 5700.0, 21539.0, 117615.0, 546344.0, 289656.0, 47702.0, 10467.0, 3337.0, 1241.0, 561.0, 265.0, 158.0, 72.0, 45.0, 39.0, 21.0, 16.0, 10.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.046875, -2.940887451171875, -2.83489990234375, -2.728912353515625, -2.6229248046875, -2.516937255859375, -2.41094970703125, -2.304962158203125, -2.198974609375, -2.092987060546875, -1.98699951171875, -1.881011962890625, -1.7750244140625, -1.669036865234375, -1.56304931640625, -1.457061767578125, -1.35107421875, -1.245086669921875, -1.13909912109375, -1.033111572265625, -0.9271240234375, -0.821136474609375, -0.71514892578125, -0.609161376953125, -0.503173828125, -0.397186279296875, -0.29119873046875, -0.185211181640625, -0.0792236328125, 0.026763916015625, 0.13275146484375, 0.238739013671875, 0.3447265625, 0.450714111328125, 0.55670166015625, 0.662689208984375, 0.7686767578125, 0.874664306640625, 0.98065185546875, 1.086639404296875, 1.192626953125, 1.298614501953125, 1.40460205078125, 1.510589599609375, 1.6165771484375, 1.722564697265625, 1.82855224609375, 1.934539794921875, 2.04052734375, 2.146514892578125, 2.25250244140625, 2.358489990234375, 2.4644775390625, 2.570465087890625, 2.67645263671875, 2.782440185546875, 2.888427734375, 2.994415283203125, 3.10040283203125, 3.206390380859375, 3.3123779296875, 3.418365478515625, 3.52435302734375, 3.630340576171875, 3.736328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 5.0, 7.0, 3.0, 12.0, 13.0, 24.0, 30.0, 37.0, 28.0, 41.0, 44.0, 42.0, 48.0, 51.0, 51.0, 48.0, 74.0, 54.0, 56.0, 39.0, 33.0, 43.0, 30.0, 35.0, 28.0, 20.0, 9.0, 12.0, 15.0, 10.0, 8.0, 7.0, 11.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8998947143554688, -0.8725433349609375, -0.8451919555664062, -0.817840576171875, -0.7904891967773438, -0.7631378173828125, -0.7357864379882812, -0.70843505859375, -0.6810836791992188, -0.6537322998046875, -0.6263809204101562, -0.599029541015625, -0.5716781616210938, -0.5443267822265625, -0.5169754028320312, -0.4896240234375, -0.46227264404296875, -0.4349212646484375, -0.40756988525390625, -0.380218505859375, -0.35286712646484375, -0.3255157470703125, -0.29816436767578125, -0.27081298828125, -0.24346160888671875, -0.2161102294921875, -0.18875885009765625, -0.161407470703125, -0.13405609130859375, -0.1067047119140625, -0.07935333251953125, -0.052001953125, -0.02465057373046875, 0.0027008056640625, 0.03005218505859375, 0.057403564453125, 0.08475494384765625, 0.1121063232421875, 0.13945770263671875, 0.16680908203125, 0.19416046142578125, 0.2215118408203125, 0.24886322021484375, 0.276214599609375, 0.30356597900390625, 0.3309173583984375, 0.35826873779296875, 0.3856201171875, 0.41297149658203125, 0.4403228759765625, 0.46767425537109375, 0.495025634765625, 0.5223770141601562, 0.5497283935546875, 0.5770797729492188, 0.60443115234375, 0.6317825317382812, 0.6591339111328125, 0.6864852905273438, 0.713836669921875, 0.7411880493164062, 0.7685394287109375, 0.7958908081054688, 0.8232421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 7.0, 10.0, 23.0, 27.0, 30.0, 45.0, 74.0, 91.0, 118.0, 193.0, 305.0, 489.0, 947.0, 2328.0, 8413.0, 90980.0, 856468.0, 75862.0, 7517.0, 2204.0, 987.0, 521.0, 318.0, 167.0, 125.0, 81.0, 52.0, 41.0, 37.0, 23.0, 16.0, 12.0, 7.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.59185791015625, -5.4141845703125, -5.23651123046875, -5.058837890625, -4.88116455078125, -4.7034912109375, -4.52581787109375, -4.34814453125, -4.17047119140625, -3.9927978515625, -3.81512451171875, -3.637451171875, -3.45977783203125, -3.2821044921875, -3.10443115234375, -2.9267578125, -2.74908447265625, -2.5714111328125, -2.39373779296875, -2.216064453125, -2.03839111328125, -1.8607177734375, -1.68304443359375, -1.50537109375, -1.32769775390625, -1.1500244140625, -0.97235107421875, -0.794677734375, -0.61700439453125, -0.4393310546875, -0.26165771484375, -0.083984375, 0.09368896484375, 0.2713623046875, 0.44903564453125, 0.626708984375, 0.80438232421875, 0.9820556640625, 1.15972900390625, 1.33740234375, 1.51507568359375, 1.6927490234375, 1.87042236328125, 2.048095703125, 2.22576904296875, 2.4034423828125, 2.58111572265625, 2.7587890625, 2.93646240234375, 3.1141357421875, 3.29180908203125, 3.469482421875, 3.64715576171875, 3.8248291015625, 4.00250244140625, 4.18017578125, 4.35784912109375, 4.5355224609375, 4.71319580078125, 4.890869140625, 5.06854248046875, 5.2462158203125, 5.42388916015625, 5.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 12.0, 8.0, 17.0, 28.0, 29.0, 41.0, 44.0, 60.0, 59.0, 61.0, 73.0, 84.0, 76.0, 77.0, 74.0, 46.0, 42.0, 31.0, 32.0, 29.0, 16.0, 15.0, 9.0, 9.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.109375, -5.93841552734375, -5.7674560546875, -5.59649658203125, -5.425537109375, -5.25457763671875, -5.0836181640625, -4.91265869140625, -4.74169921875, -4.57073974609375, -4.3997802734375, -4.22882080078125, -4.057861328125, -3.88690185546875, -3.7159423828125, -3.54498291015625, -3.3740234375, -3.20306396484375, -3.0321044921875, -2.86114501953125, -2.690185546875, -2.51922607421875, -2.3482666015625, -2.17730712890625, -2.00634765625, -1.83538818359375, -1.6644287109375, -1.49346923828125, -1.322509765625, -1.15155029296875, -0.9805908203125, -0.80963134765625, -0.638671875, -0.46771240234375, -0.2967529296875, -0.12579345703125, 0.045166015625, 0.21612548828125, 0.3870849609375, 0.55804443359375, 0.72900390625, 0.89996337890625, 1.0709228515625, 1.24188232421875, 1.412841796875, 1.58380126953125, 1.7547607421875, 1.92572021484375, 2.0966796875, 2.26763916015625, 2.4385986328125, 2.60955810546875, 2.780517578125, 2.95147705078125, 3.1224365234375, 3.29339599609375, 3.46435546875, 3.63531494140625, 3.8062744140625, 3.97723388671875, 4.148193359375, 4.31915283203125, 4.4901123046875, 4.66107177734375, 4.83203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 12.0, 8.0, 8.0, 18.0, 36.0, 30.0, 42.0, 71.0, 96.0, 120.0, 197.0, 317.0, 611.0, 1416.0, 4467.0, 21928.0, 183337.0, 717859.0, 98693.0, 13602.0, 3213.0, 1140.0, 522.0, 267.0, 170.0, 119.0, 66.0, 61.0, 47.0, 24.0, 30.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9580078125, -0.9202423095703125, -0.882476806640625, -0.8447113037109375, -0.80694580078125, -0.7691802978515625, -0.731414794921875, -0.6936492919921875, -0.6558837890625, -0.6181182861328125, -0.580352783203125, -0.5425872802734375, -0.50482177734375, -0.4670562744140625, -0.429290771484375, -0.3915252685546875, -0.353759765625, -0.3159942626953125, -0.278228759765625, -0.2404632568359375, -0.20269775390625, -0.1649322509765625, -0.127166748046875, -0.0894012451171875, -0.0516357421875, -0.0138702392578125, 0.023895263671875, 0.0616607666015625, 0.09942626953125, 0.1371917724609375, 0.174957275390625, 0.2127227783203125, 0.25048828125, 0.2882537841796875, 0.326019287109375, 0.3637847900390625, 0.40155029296875, 0.4393157958984375, 0.477081298828125, 0.5148468017578125, 0.5526123046875, 0.5903778076171875, 0.628143310546875, 0.6659088134765625, 0.70367431640625, 0.7414398193359375, 0.779205322265625, 0.8169708251953125, 0.854736328125, 0.8925018310546875, 0.930267333984375, 0.9680328369140625, 1.00579833984375, 1.0435638427734375, 1.081329345703125, 1.1190948486328125, 1.1568603515625, 1.1946258544921875, 1.232391357421875, 1.2701568603515625, 1.30792236328125, 1.3456878662109375, 1.383453369140625, 1.4212188720703125, 1.458984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 12.0, 28.0, 33.0, 37.0, 38.0, 75.0, 115.0, 150.0, 161.0, 104.0, 76.0, 44.0, 34.0, 21.0, 21.0, 13.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003228187561035156, -0.00031472742557525635, -0.00030663609504699707, -0.0002985447645187378, -0.0002904534339904785, -0.00028236210346221924, -0.00027427077293395996, -0.0002661794424057007, -0.0002580881118774414, -0.00024999678134918213, -0.00024190545082092285, -0.00023381412029266357, -0.0002257227897644043, -0.00021763145923614502, -0.00020954012870788574, -0.00020144879817962646, -0.0001933574676513672, -0.0001852661371231079, -0.00017717480659484863, -0.00016908347606658936, -0.00016099214553833008, -0.0001529008150100708, -0.00014480948448181152, -0.00013671815395355225, -0.00012862682342529297, -0.00012053549289703369, -0.00011244416236877441, -0.00010435283184051514, -9.626150131225586e-05, -8.817017078399658e-05, -8.00788402557373e-05, -7.198750972747803e-05, -6.389617919921875e-05, -5.580484867095947e-05, -4.7713518142700195e-05, -3.962218761444092e-05, -3.153085708618164e-05, -2.3439526557922363e-05, -1.5348196029663086e-05, -7.256865501403809e-06, 8.344650268554688e-07, 8.925795555114746e-06, 1.7017126083374023e-05, 2.51084566116333e-05, 3.319978713989258e-05, 4.1291117668151855e-05, 4.938244819641113e-05, 5.747377872467041e-05, 6.556510925292969e-05, 7.365643978118896e-05, 8.174777030944824e-05, 8.983910083770752e-05, 9.79304313659668e-05, 0.00010602176189422607, 0.00011411309242248535, 0.00012220442295074463, 0.0001302957534790039, 0.00013838708400726318, 0.00014647841453552246, 0.00015456974506378174, 0.00016266107559204102, 0.0001707524061203003, 0.00017884373664855957, 0.00018693506717681885, 0.00019502639770507812]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 15.0, 19.0, 22.0, 41.0, 65.0, 75.0, 106.0, 198.0, 324.0, 533.0, 1019.0, 2423.0, 8085.0, 44455.0, 525835.0, 416608.0, 37077.0, 7196.0, 2229.0, 948.0, 495.0, 278.0, 157.0, 111.0, 70.0, 57.0, 23.0, 18.0, 18.0, 13.0, 12.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0693359375, -1.0296630859375, -0.989990234375, -0.9503173828125, -0.91064453125, -0.8709716796875, -0.831298828125, -0.7916259765625, -0.751953125, -0.7122802734375, -0.672607421875, -0.6329345703125, -0.59326171875, -0.5535888671875, -0.513916015625, -0.4742431640625, -0.4345703125, -0.3948974609375, -0.355224609375, -0.3155517578125, -0.27587890625, -0.2362060546875, -0.196533203125, -0.1568603515625, -0.1171875, -0.0775146484375, -0.037841796875, 0.0018310546875, 0.04150390625, 0.0811767578125, 0.120849609375, 0.1605224609375, 0.2001953125, 0.2398681640625, 0.279541015625, 0.3192138671875, 0.35888671875, 0.3985595703125, 0.438232421875, 0.4779052734375, 0.517578125, 0.5572509765625, 0.596923828125, 0.6365966796875, 0.67626953125, 0.7159423828125, 0.755615234375, 0.7952880859375, 0.8349609375, 0.8746337890625, 0.914306640625, 0.9539794921875, 0.99365234375, 1.0333251953125, 1.072998046875, 1.1126708984375, 1.15234375, 1.1920166015625, 1.231689453125, 1.2713623046875, 1.31103515625, 1.3507080078125, 1.390380859375, 1.4300537109375, 1.4697265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 6.0, 15.0, 15.0, 27.0, 32.0, 46.0, 58.0, 59.0, 89.0, 113.0, 101.0, 106.0, 69.0, 67.0, 56.0, 28.0, 20.0, 17.0, 13.0, 7.0, 7.0, 3.0, 7.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1303253173828125, -1.091705322265625, -1.0530853271484375, -1.01446533203125, -0.9758453369140625, -0.937225341796875, -0.8986053466796875, -0.8599853515625, -0.8213653564453125, -0.782745361328125, -0.7441253662109375, -0.70550537109375, -0.6668853759765625, -0.628265380859375, -0.5896453857421875, -0.551025390625, -0.5124053955078125, -0.473785400390625, -0.4351654052734375, -0.39654541015625, -0.3579254150390625, -0.319305419921875, -0.2806854248046875, -0.2420654296875, -0.2034454345703125, -0.164825439453125, -0.1262054443359375, -0.08758544921875, -0.0489654541015625, -0.010345458984375, 0.0282745361328125, 0.06689453125, 0.1055145263671875, 0.144134521484375, 0.1827545166015625, 0.22137451171875, 0.2599945068359375, 0.298614501953125, 0.3372344970703125, 0.3758544921875, 0.4144744873046875, 0.453094482421875, 0.4917144775390625, 0.53033447265625, 0.5689544677734375, 0.607574462890625, 0.6461944580078125, 0.684814453125, 0.7234344482421875, 0.762054443359375, 0.8006744384765625, 0.83929443359375, 0.8779144287109375, 0.916534423828125, 0.9551544189453125, 0.9937744140625, 1.0323944091796875, 1.071014404296875, 1.1096343994140625, 1.14825439453125, 1.1868743896484375, 1.225494384765625, 1.2641143798828125, 1.302734375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 16.0, 24.0, 47.0, 86.0, 136.0, 174.0, 176.0, 154.0, 84.0, 46.0, 17.0, 13.0, 4.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.5147705078125, -33.63487243652344, -32.754974365234375, -31.875076293945312, -30.99517822265625, -30.115280151367188, -29.235383987426758, -28.355485916137695, -27.475587844848633, -26.59568977355957, -25.715791702270508, -24.835893630981445, -23.955997467041016, -23.076099395751953, -22.19620132446289, -21.316303253173828, -20.436405181884766, -19.556507110595703, -18.67660903930664, -17.796710968017578, -16.916812896728516, -16.036914825439453, -15.157018661499023, -14.277120590209961, -13.397222518920898, -12.517324447631836, -11.637426376342773, -10.757529258728027, -9.877631187438965, -8.997733116149902, -8.117835998535156, -7.237937927246094, -6.358037948608398, -5.478139877319336, -4.598242282867432, -3.7183444499969482, -2.838446617126465, -1.9585485458374023, -1.078650951385498, -0.19875335693359375, 0.6811447143554688, 1.5610425472259521, 2.4409403800964355, 3.320838212966919, 4.200736045837402, 5.080634117126465, 5.960531711578369, 6.840429306030273, 7.720327377319336, 8.600225448608398, 9.480123519897461, 10.360020637512207, 11.23991870880127, 12.119816780090332, 12.999713897705078, 13.87961196899414, 14.759510040283203, 15.639408111572266, 16.519306182861328, 17.39920425415039, 18.279102325439453, 19.159000396728516, 20.038896560668945, 20.918794631958008, 21.79869270324707]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 16.0, 11.0, 19.0, 9.0, 32.0, 28.0, 32.0, 44.0, 25.0, 54.0, 37.0, 51.0, 46.0, 43.0, 57.0, 56.0, 39.0, 43.0, 34.0, 42.0, 25.0, 38.0, 28.0, 30.0, 22.0, 16.0, 19.0, 15.0, 10.0, 8.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-17.00653839111328, -16.527070999145508, -16.047605514526367, -15.568138122558594, -15.088671684265137, -14.60920524597168, -14.129738807678223, -13.650272369384766, -13.170804977416992, -12.691338539123535, -12.211872100830078, -11.732404708862305, -11.252938270568848, -10.77347183227539, -10.294005393981934, -9.814538955688477, -9.33507251739502, -8.855606079101562, -8.376139640808105, -7.89667272567749, -7.417205810546875, -6.937739372253418, -6.458272933959961, -5.978806495666504, -5.499339580535889, -5.019873142242432, -4.540406227111816, -4.060939788818359, -3.5814731121063232, -3.102006435394287, -2.62253999710083, -2.143073320388794, -1.6636066436767578, -1.1841399669647217, -0.7046734094619751, -0.22520685195922852, 0.2542598247528076, 0.7337265014648438, 1.2131929397583008, 1.692659616470337, 2.172126293182373, 2.651592969894409, 3.1310596466064453, 3.6105260848999023, 4.089992523193359, 4.569459438323975, 5.048925876617432, 5.528392791748047, 6.007859230041504, 6.487325668334961, 6.966792583465576, 7.446259021759033, 7.925725936889648, 8.405192375183105, 8.884658813476562, 9.36412525177002, 9.843591690063477, 10.323058128356934, 10.80252456665039, 11.281991958618164, 11.761458396911621, 12.240924835205078, 12.720391273498535, 13.199857711791992, 13.679325103759766]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 3.0, 6.0, 9.0, 11.0, 16.0, 16.0, 30.0, 32.0, 54.0, 86.0, 104.0, 153.0, 244.0, 331.0, 596.0, 1001.0, 1813.0, 3490.0, 7249.0, 16282.0, 45543.0, 235943.0, 3310723.0, 468714.0, 62339.0, 20470.0, 8891.0, 4293.0, 2345.0, 1376.0, 784.0, 456.0, 291.0, 199.0, 124.0, 75.0, 55.0, 43.0, 45.0, 17.0, 5.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.415130615234375, -1.36737060546875, -1.319610595703125, -1.2718505859375, -1.224090576171875, -1.17633056640625, -1.128570556640625, -1.080810546875, -1.033050537109375, -0.98529052734375, -0.937530517578125, -0.8897705078125, -0.842010498046875, -0.79425048828125, -0.746490478515625, -0.69873046875, -0.650970458984375, -0.60321044921875, -0.555450439453125, -0.5076904296875, -0.459930419921875, -0.41217041015625, -0.364410400390625, -0.316650390625, -0.268890380859375, -0.22113037109375, -0.173370361328125, -0.1256103515625, -0.077850341796875, -0.03009033203125, 0.017669677734375, 0.0654296875, 0.113189697265625, 0.16094970703125, 0.208709716796875, 0.2564697265625, 0.304229736328125, 0.35198974609375, 0.399749755859375, 0.447509765625, 0.495269775390625, 0.54302978515625, 0.590789794921875, 0.6385498046875, 0.686309814453125, 0.73406982421875, 0.781829833984375, 0.82958984375, 0.877349853515625, 0.92510986328125, 0.972869873046875, 1.0206298828125, 1.068389892578125, 1.11614990234375, 1.163909912109375, 1.211669921875, 1.259429931640625, 1.30718994140625, 1.354949951171875, 1.4027099609375, 1.450469970703125, 1.49822998046875, 1.545989990234375, 1.59375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 3.0, 10.0, 12.0, 18.0, 25.0, 22.0, 33.0, 42.0, 53.0, 52.0, 72.0, 83.0, 76.0, 81.0, 76.0, 59.0, 38.0, 44.0, 31.0, 36.0, 33.0, 18.0, 19.0, 20.0, 11.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.1289825439453125, -1.094879150390625, -1.0607757568359375, -1.02667236328125, -0.9925689697265625, -0.958465576171875, -0.9243621826171875, -0.8902587890625, -0.8561553955078125, -0.822052001953125, -0.7879486083984375, -0.75384521484375, -0.7197418212890625, -0.685638427734375, -0.6515350341796875, -0.617431640625, -0.5833282470703125, -0.549224853515625, -0.5151214599609375, -0.48101806640625, -0.4469146728515625, -0.412811279296875, -0.3787078857421875, -0.3446044921875, -0.3105010986328125, -0.276397705078125, -0.2422943115234375, -0.20819091796875, -0.1740875244140625, -0.139984130859375, -0.1058807373046875, -0.07177734375, -0.0376739501953125, -0.003570556640625, 0.0305328369140625, 0.06463623046875, 0.0987396240234375, 0.132843017578125, 0.1669464111328125, 0.2010498046875, 0.2351531982421875, 0.269256591796875, 0.3033599853515625, 0.33746337890625, 0.3715667724609375, 0.405670166015625, 0.4397735595703125, 0.473876953125, 0.5079803466796875, 0.542083740234375, 0.5761871337890625, 0.61029052734375, 0.6443939208984375, 0.678497314453125, 0.7126007080078125, 0.7467041015625, 0.7808074951171875, 0.814910888671875, 0.8490142822265625, 0.88311767578125, 0.9172210693359375, 0.951324462890625, 0.9854278564453125, 1.01953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 12.0, 16.0, 31.0, 30.0, 63.0, 88.0, 165.0, 444.0, 1306.0, 5923.0, 43659.0, 3505316.0, 606915.0, 24805.0, 3875.0, 911.0, 350.0, 157.0, 75.0, 43.0, 25.0, 18.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.03326416015625, -3.9141845703125, -3.79510498046875, -3.676025390625, -3.55694580078125, -3.4378662109375, -3.31878662109375, -3.19970703125, -3.08062744140625, -2.9615478515625, -2.84246826171875, -2.723388671875, -2.60430908203125, -2.4852294921875, -2.36614990234375, -2.2470703125, -2.12799072265625, -2.0089111328125, -1.88983154296875, -1.770751953125, -1.65167236328125, -1.5325927734375, -1.41351318359375, -1.29443359375, -1.17535400390625, -1.0562744140625, -0.93719482421875, -0.818115234375, -0.69903564453125, -0.5799560546875, -0.46087646484375, -0.341796875, -0.22271728515625, -0.1036376953125, 0.01544189453125, 0.134521484375, 0.25360107421875, 0.3726806640625, 0.49176025390625, 0.61083984375, 0.72991943359375, 0.8489990234375, 0.96807861328125, 1.087158203125, 1.20623779296875, 1.3253173828125, 1.44439697265625, 1.5634765625, 1.68255615234375, 1.8016357421875, 1.92071533203125, 2.039794921875, 2.15887451171875, 2.2779541015625, 2.39703369140625, 2.51611328125, 2.63519287109375, 2.7542724609375, 2.87335205078125, 2.992431640625, 3.11151123046875, 3.2305908203125, 3.34967041015625, 3.46875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 15.0, 16.0, 21.0, 30.0, 58.0, 112.0, 299.0, 1048.0, 1620.0, 470.0, 145.0, 86.0, 42.0, 31.0, 18.0, 11.0, 11.0, 15.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.296875, -4.2018585205078125, -4.106842041015625, -4.0118255615234375, -3.91680908203125, -3.8217926025390625, -3.726776123046875, -3.6317596435546875, -3.5367431640625, -3.4417266845703125, -3.346710205078125, -3.2516937255859375, -3.15667724609375, -3.0616607666015625, -2.966644287109375, -2.8716278076171875, -2.776611328125, -2.6815948486328125, -2.586578369140625, -2.4915618896484375, -2.39654541015625, -2.3015289306640625, -2.206512451171875, -2.1114959716796875, -2.0164794921875, -1.9214630126953125, -1.826446533203125, -1.7314300537109375, -1.63641357421875, -1.5413970947265625, -1.446380615234375, -1.3513641357421875, -1.25634765625, -1.1613311767578125, -1.066314697265625, -0.9712982177734375, -0.87628173828125, -0.7812652587890625, -0.686248779296875, -0.5912322998046875, -0.4962158203125, -0.4011993408203125, -0.306182861328125, -0.2111663818359375, -0.11614990234375, -0.0211334228515625, 0.073883056640625, 0.1688995361328125, 0.263916015625, 0.3589324951171875, 0.453948974609375, 0.5489654541015625, 0.64398193359375, 0.7389984130859375, 0.834014892578125, 0.9290313720703125, 1.0240478515625, 1.1190643310546875, 1.214080810546875, 1.3090972900390625, 1.40411376953125, 1.4991302490234375, 1.594146728515625, 1.6891632080078125, 1.7841796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 20.0, 22.0, 86.0, 161.0, 165.0, 178.0, 142.0, 86.0, 52.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.77971076965332, -13.158794403076172, -12.537877082824707, -11.916959762573242, -11.296043395996094, -10.675127029418945, -10.05420970916748, -9.433292388916016, -8.812376022338867, -8.191459655761719, -7.570542335510254, -6.949625492095947, -6.328708648681641, -5.707791805267334, -5.086874961853027, -4.465958118438721, -3.845041275024414, -3.2241244316101074, -2.603207588195801, -1.9822907447814941, -1.3613739013671875, -0.7404570579528809, -0.11954021453857422, 0.5013766288757324, 1.122293472290039, 1.7432103157043457, 2.3641271591186523, 2.985044002532959, 3.6059608459472656, 4.226877689361572, 4.847794532775879, 5.4687113761901855, 6.089630126953125, 6.710546970367432, 7.331463813781738, 7.952380657196045, 8.573297500610352, 9.1942138671875, 9.815131187438965, 10.43604850769043, 11.056964874267578, 11.677881240844727, 12.298798561096191, 12.919715881347656, 13.540632247924805, 14.161548614501953, 14.782465934753418, 15.403383255004883, 16.02429962158203, 16.64521598815918, 17.266132354736328, 17.88705062866211, 18.507966995239258, 19.128883361816406, 19.749801635742188, 20.370718002319336, 20.991634368896484, 21.612550735473633, 22.23346710205078, 22.854385375976562, 23.47530174255371, 24.09621810913086, 24.71713638305664, 25.33805274963379, 25.958969116210938]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 14.0, 6.0, 8.0, 16.0, 15.0, 23.0, 23.0, 26.0, 32.0, 36.0, 34.0, 32.0, 34.0, 47.0, 43.0, 38.0, 38.0, 41.0, 44.0, 55.0, 48.0, 34.0, 39.0, 29.0, 30.0, 35.0, 37.0, 24.0, 23.0, 21.0, 18.0, 11.0, 6.0, 11.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.446706295013428, -7.216037750244141, -6.985368728637695, -6.754700183868408, -6.524031639099121, -6.293362617492676, -6.062694072723389, -5.832025527954102, -5.601356506347656, -5.370687961578369, -5.140018939971924, -4.909350395202637, -4.678681373596191, -4.448012828826904, -4.217344284057617, -3.986675500869751, -3.7560067176818848, -3.5253379344940186, -3.2946691513061523, -3.0640006065368652, -2.833331823348999, -2.602663040161133, -2.3719944953918457, -2.1413257122039795, -1.9106569290161133, -1.679988145828247, -1.4493194818496704, -1.2186508178710938, -0.9879820346832275, -0.7573132514953613, -0.5266445875167847, -0.295975923538208, -0.0653076171875, 0.16536110639572144, 0.39602982997894287, 0.6266985535621643, 0.8573672771453857, 1.088036060333252, 1.3187047243118286, 1.5493733882904053, 1.7800421714782715, 2.0107109546661377, 2.241379737854004, 2.472048282623291, 2.7027170658111572, 2.9333858489990234, 3.1640543937683105, 3.3947231769561768, 3.625391960144043, 3.856060743331909, 4.086729526519775, 4.3173980712890625, 4.548067092895508, 4.778735637664795, 5.009404182434082, 5.240073204040527, 5.4707417488098145, 5.701410293579102, 5.932079315185547, 6.162747859954834, 6.393416404724121, 6.624085426330566, 6.8547539710998535, 7.085422515869141, 7.316091537475586]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 10.0, 7.0, 20.0, 33.0, 25.0, 38.0, 73.0, 129.0, 206.0, 397.0, 738.0, 1296.0, 2970.0, 7433.0, 20242.0, 61442.0, 215915.0, 482460.0, 175197.0, 51256.0, 17022.0, 6286.0, 2611.0, 1301.0, 620.0, 317.0, 190.0, 94.0, 74.0, 46.0, 33.0, 23.0, 11.0, 9.0, 6.0, 4.0, 6.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.2578125, -2.18817138671875, -2.1185302734375, -2.04888916015625, -1.979248046875, -1.90960693359375, -1.8399658203125, -1.77032470703125, -1.70068359375, -1.63104248046875, -1.5614013671875, -1.49176025390625, -1.422119140625, -1.35247802734375, -1.2828369140625, -1.21319580078125, -1.1435546875, -1.07391357421875, -1.0042724609375, -0.93463134765625, -0.864990234375, -0.79534912109375, -0.7257080078125, -0.65606689453125, -0.58642578125, -0.51678466796875, -0.4471435546875, -0.37750244140625, -0.307861328125, -0.23822021484375, -0.1685791015625, -0.09893798828125, -0.029296875, 0.04034423828125, 0.1099853515625, 0.17962646484375, 0.249267578125, 0.31890869140625, 0.3885498046875, 0.45819091796875, 0.52783203125, 0.59747314453125, 0.6671142578125, 0.73675537109375, 0.806396484375, 0.87603759765625, 0.9456787109375, 1.01531982421875, 1.0849609375, 1.15460205078125, 1.2242431640625, 1.29388427734375, 1.363525390625, 1.43316650390625, 1.5028076171875, 1.57244873046875, 1.64208984375, 1.71173095703125, 1.7813720703125, 1.85101318359375, 1.920654296875, 1.99029541015625, 2.0599365234375, 2.12957763671875, 2.19921875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 5.0, 5.0, 21.0, 15.0, 20.0, 36.0, 56.0, 46.0, 61.0, 66.0, 75.0, 69.0, 78.0, 69.0, 63.0, 44.0, 58.0, 27.0, 34.0, 21.0, 28.0, 19.0, 14.0, 13.0, 3.0, 13.0, 9.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1727523803710938, -1.1404266357421875, -1.1081008911132812, -1.075775146484375, -1.0434494018554688, -1.0111236572265625, -0.9787979125976562, -0.94647216796875, -0.9141464233398438, -0.8818206787109375, -0.8494949340820312, -0.817169189453125, -0.7848434448242188, -0.7525177001953125, -0.7201919555664062, -0.6878662109375, -0.6555404663085938, -0.6232147216796875, -0.5908889770507812, -0.558563232421875, -0.5262374877929688, -0.4939117431640625, -0.46158599853515625, -0.42926025390625, -0.39693450927734375, -0.3646087646484375, -0.33228302001953125, -0.299957275390625, -0.26763153076171875, -0.2353057861328125, -0.20298004150390625, -0.170654296875, -0.13832855224609375, -0.1060028076171875, -0.07367706298828125, -0.041351318359375, -0.00902557373046875, 0.0233001708984375, 0.05562591552734375, 0.08795166015625, 0.12027740478515625, 0.1526031494140625, 0.18492889404296875, 0.217254638671875, 0.24958038330078125, 0.2819061279296875, 0.31423187255859375, 0.3465576171875, 0.37888336181640625, 0.4112091064453125, 0.44353485107421875, 0.475860595703125, 0.5081863403320312, 0.5405120849609375, 0.5728378295898438, 0.60516357421875, 0.6374893188476562, 0.6698150634765625, 0.7021408081054688, 0.734466552734375, 0.7667922973632812, 0.7991180419921875, 0.8314437866210938, 0.86376953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 12.0, 20.0, 26.0, 30.0, 38.0, 56.0, 76.0, 90.0, 124.0, 192.0, 350.0, 566.0, 1187.0, 3115.0, 11280.0, 116772.0, 845896.0, 56048.0, 7760.0, 2451.0, 1008.0, 528.0, 295.0, 169.0, 146.0, 71.0, 54.0, 44.0, 35.0, 15.0, 20.0, 15.0, 6.0, 10.0, 4.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.876953125, -4.7109375, -4.544921875, -4.37890625, -4.212890625, -4.046875, -3.880859375, -3.71484375, -3.548828125, -3.3828125, -3.216796875, -3.05078125, -2.884765625, -2.71875, -2.552734375, -2.38671875, -2.220703125, -2.0546875, -1.888671875, -1.72265625, -1.556640625, -1.390625, -1.224609375, -1.05859375, -0.892578125, -0.7265625, -0.560546875, -0.39453125, -0.228515625, -0.0625, 0.103515625, 0.26953125, 0.435546875, 0.6015625, 0.767578125, 0.93359375, 1.099609375, 1.265625, 1.431640625, 1.59765625, 1.763671875, 1.9296875, 2.095703125, 2.26171875, 2.427734375, 2.59375, 2.759765625, 2.92578125, 3.091796875, 3.2578125, 3.423828125, 3.58984375, 3.755859375, 3.921875, 4.087890625, 4.25390625, 4.419921875, 4.5859375, 4.751953125, 4.91796875, 5.083984375, 5.25, 5.416015625, 5.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 11.0, 15.0, 17.0, 22.0, 33.0, 43.0, 40.0, 52.0, 55.0, 72.0, 72.0, 75.0, 80.0, 79.0, 50.0, 60.0, 48.0, 29.0, 31.0, 18.0, 17.0, 13.0, 9.0, 3.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.78717041015625, -4.6251220703125, -4.46307373046875, -4.301025390625, -4.13897705078125, -3.9769287109375, -3.81488037109375, -3.65283203125, -3.49078369140625, -3.3287353515625, -3.16668701171875, -3.004638671875, -2.84259033203125, -2.6805419921875, -2.51849365234375, -2.3564453125, -2.19439697265625, -2.0323486328125, -1.87030029296875, -1.708251953125, -1.54620361328125, -1.3841552734375, -1.22210693359375, -1.06005859375, -0.89801025390625, -0.7359619140625, -0.57391357421875, -0.411865234375, -0.24981689453125, -0.0877685546875, 0.07427978515625, 0.236328125, 0.39837646484375, 0.5604248046875, 0.72247314453125, 0.884521484375, 1.04656982421875, 1.2086181640625, 1.37066650390625, 1.53271484375, 1.69476318359375, 1.8568115234375, 2.01885986328125, 2.180908203125, 2.34295654296875, 2.5050048828125, 2.66705322265625, 2.8291015625, 2.99114990234375, 3.1531982421875, 3.31524658203125, 3.477294921875, 3.63934326171875, 3.8013916015625, 3.96343994140625, 4.12548828125, 4.28753662109375, 4.4495849609375, 4.61163330078125, 4.773681640625, 4.93572998046875, 5.0977783203125, 5.25982666015625, 5.421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 12.0, 26.0, 20.0, 28.0, 35.0, 61.0, 84.0, 159.0, 290.0, 749.0, 2303.0, 12662.0, 347521.0, 663224.0, 16948.0, 2700.0, 848.0, 350.0, 171.0, 92.0, 76.0, 48.0, 29.0, 27.0, 21.0, 9.0, 8.0, 10.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.64453125, -2.571197509765625, -2.49786376953125, -2.424530029296875, -2.3511962890625, -2.277862548828125, -2.20452880859375, -2.131195068359375, -2.057861328125, -1.984527587890625, -1.91119384765625, -1.837860107421875, -1.7645263671875, -1.691192626953125, -1.61785888671875, -1.544525146484375, -1.47119140625, -1.397857666015625, -1.32452392578125, -1.251190185546875, -1.1778564453125, -1.104522705078125, -1.03118896484375, -0.957855224609375, -0.884521484375, -0.811187744140625, -0.73785400390625, -0.664520263671875, -0.5911865234375, -0.517852783203125, -0.44451904296875, -0.371185302734375, -0.2978515625, -0.224517822265625, -0.15118408203125, -0.077850341796875, -0.0045166015625, 0.068817138671875, 0.14215087890625, 0.215484619140625, 0.288818359375, 0.362152099609375, 0.43548583984375, 0.508819580078125, 0.5821533203125, 0.655487060546875, 0.72882080078125, 0.802154541015625, 0.87548828125, 0.948822021484375, 1.02215576171875, 1.095489501953125, 1.1688232421875, 1.242156982421875, 1.31549072265625, 1.388824462890625, 1.462158203125, 1.535491943359375, 1.60882568359375, 1.682159423828125, 1.7554931640625, 1.828826904296875, 1.90216064453125, 1.975494384765625, 2.048828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 11.0, 17.0, 27.0, 32.0, 51.0, 75.0, 114.0, 170.0, 180.0, 95.0, 62.0, 36.0, 35.0, 22.0, 15.0, 18.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003750324249267578, -0.0003658607602119446, -0.00035668909549713135, -0.0003475174307823181, -0.0003383457660675049, -0.00032917410135269165, -0.0003200024366378784, -0.0003108307719230652, -0.00030165910720825195, -0.0002924874424934387, -0.0002833157777786255, -0.00027414411306381226, -0.000264972448348999, -0.0002558007836341858, -0.00024662911891937256, -0.00023745745420455933, -0.0002282857894897461, -0.00021911412477493286, -0.00020994246006011963, -0.0002007707953453064, -0.00019159913063049316, -0.00018242746591567993, -0.0001732558012008667, -0.00016408413648605347, -0.00015491247177124023, -0.000145740807056427, -0.00013656914234161377, -0.00012739747762680054, -0.0001182258129119873, -0.00010905414819717407, -9.988248348236084e-05, -9.071081876754761e-05, -8.153915405273438e-05, -7.236748933792114e-05, -6.319582462310791e-05, -5.402415990829468e-05, -4.4852495193481445e-05, -3.568083047866821e-05, -2.650916576385498e-05, -1.7337501049041748e-05, -8.165836334228516e-06, 1.0058283805847168e-06, 1.017749309539795e-05, 1.934915781021118e-05, 2.8520822525024414e-05, 3.7692487239837646e-05, 4.686415195465088e-05, 5.603581666946411e-05, 6.520748138427734e-05, 7.437914609909058e-05, 8.355081081390381e-05, 9.272247552871704e-05, 0.00010189414024353027, 0.0001110658049583435, 0.00012023746967315674, 0.00012940913438796997, 0.0001385807991027832, 0.00014775246381759644, 0.00015692412853240967, 0.0001660957932472229, 0.00017526745796203613, 0.00018443912267684937, 0.0001936107873916626, 0.00020278245210647583, 0.00021195411682128906]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 10.0, 21.0, 26.0, 33.0, 29.0, 42.0, 91.0, 138.0, 196.0, 347.0, 679.0, 1461.0, 4322.0, 20215.0, 296792.0, 679992.0, 34251.0, 6027.0, 1996.0, 849.0, 385.0, 239.0, 127.0, 76.0, 69.0, 34.0, 22.0, 21.0, 14.0, 9.0, 4.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.7691497802734375, -1.714080810546875, -1.6590118408203125, -1.60394287109375, -1.5488739013671875, -1.493804931640625, -1.4387359619140625, -1.3836669921875, -1.3285980224609375, -1.273529052734375, -1.2184600830078125, -1.16339111328125, -1.1083221435546875, -1.053253173828125, -0.9981842041015625, -0.943115234375, -0.8880462646484375, -0.832977294921875, -0.7779083251953125, -0.72283935546875, -0.6677703857421875, -0.612701416015625, -0.5576324462890625, -0.5025634765625, -0.4474945068359375, -0.392425537109375, -0.3373565673828125, -0.28228759765625, -0.2272186279296875, -0.172149658203125, -0.1170806884765625, -0.06201171875, -0.0069427490234375, 0.048126220703125, 0.1031951904296875, 0.15826416015625, 0.2133331298828125, 0.268402099609375, 0.3234710693359375, 0.3785400390625, 0.4336090087890625, 0.488677978515625, 0.5437469482421875, 0.59881591796875, 0.6538848876953125, 0.708953857421875, 0.7640228271484375, 0.819091796875, 0.8741607666015625, 0.929229736328125, 0.9842987060546875, 1.03936767578125, 1.0944366455078125, 1.149505615234375, 1.2045745849609375, 1.2596435546875, 1.3147125244140625, 1.369781494140625, 1.4248504638671875, 1.47991943359375, 1.5349884033203125, 1.590057373046875, 1.6451263427734375, 1.7001953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 26.0, 16.0, 28.0, 28.0, 33.0, 55.0, 74.0, 82.0, 80.0, 101.0, 108.0, 74.0, 52.0, 41.0, 44.0, 27.0, 16.0, 25.0, 13.0, 7.0, 8.0, 8.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.2902984619140625, -1.252471923828125, -1.2146453857421875, -1.17681884765625, -1.1389923095703125, -1.101165771484375, -1.0633392333984375, -1.0255126953125, -0.9876861572265625, -0.949859619140625, -0.9120330810546875, -0.87420654296875, -0.8363800048828125, -0.798553466796875, -0.7607269287109375, -0.722900390625, -0.6850738525390625, -0.647247314453125, -0.6094207763671875, -0.57159423828125, -0.5337677001953125, -0.495941162109375, -0.4581146240234375, -0.4202880859375, -0.3824615478515625, -0.344635009765625, -0.3068084716796875, -0.26898193359375, -0.2311553955078125, -0.193328857421875, -0.1555023193359375, -0.11767578125, -0.0798492431640625, -0.042022705078125, -0.0041961669921875, 0.03363037109375, 0.0714569091796875, 0.109283447265625, 0.1471099853515625, 0.1849365234375, 0.2227630615234375, 0.260589599609375, 0.2984161376953125, 0.33624267578125, 0.3740692138671875, 0.411895751953125, 0.4497222900390625, 0.487548828125, 0.5253753662109375, 0.563201904296875, 0.6010284423828125, 0.63885498046875, 0.6766815185546875, 0.714508056640625, 0.7523345947265625, 0.7901611328125, 0.8279876708984375, 0.865814208984375, 0.9036407470703125, 0.94146728515625, 0.9792938232421875, 1.017120361328125, 1.0549468994140625, 1.0927734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 23.0, 41.0, 118.0, 207.0, 258.0, 213.0, 65.0, 28.0, 16.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.58578872680664, -46.51209259033203, -45.43840026855469, -44.36470413208008, -43.29100799560547, -42.217315673828125, -41.143619537353516, -40.069923400878906, -38.99623107910156, -37.92253494262695, -36.84884262084961, -35.775146484375, -34.70145034790039, -33.62775421142578, -32.55406188964844, -31.480365753173828, -30.40666961669922, -29.332975387573242, -28.259279251098633, -27.185585021972656, -26.111888885498047, -25.03819465637207, -23.964500427246094, -22.890804290771484, -21.817110061645508, -20.74341583251953, -19.669719696044922, -18.596025466918945, -17.52233123779297, -16.44863510131836, -15.374940872192383, -14.30124568939209, -13.227546691894531, -12.153851509094238, -11.080156326293945, -10.006462097167969, -8.932766914367676, -7.859071731567383, -6.785377025604248, -5.711682319641113, -4.63798713684082, -3.5642921924591064, -2.4905972480773926, -1.4169023036956787, -0.34320735931396484, 0.7304878234863281, 1.804182529449463, 2.8778772354125977, 3.9515724182128906, 5.025267601013184, 6.098962306976318, 7.172657012939453, 8.246352195739746, 9.320047378540039, 10.393741607666016, 11.467436790466309, 12.541131973266602, 13.614827156066895, 14.688522338867188, 15.762216567993164, 16.83591079711914, 17.90960693359375, 18.983301162719727, 20.056995391845703, 21.130691528320312]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 8.0, 7.0, 5.0, 11.0, 8.0, 9.0, 13.0, 12.0, 21.0, 19.0, 19.0, 19.0, 24.0, 36.0, 43.0, 41.0, 46.0, 56.0, 55.0, 58.0, 55.0, 44.0, 53.0, 43.0, 43.0, 26.0, 26.0, 25.0, 34.0, 26.0, 26.0, 23.0, 6.0, 9.0, 4.0, 6.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-12.86214828491211, -12.477662086486816, -12.093174934387207, -11.708688735961914, -11.324201583862305, -10.939715385437012, -10.555229187011719, -10.17074203491211, -9.7862548828125, -9.401768684387207, -9.017281532287598, -8.632795333862305, -8.248308181762695, -7.863821983337402, -7.479335308074951, -7.0948486328125, -6.710362434387207, -6.325875759124756, -5.941389083862305, -5.556902885437012, -5.172415733337402, -4.787929534912109, -4.403442859649658, -4.018956184387207, -3.634469509124756, -3.2499828338623047, -2.8654961585998535, -2.4810097217559814, -2.0965230464935303, -1.712036371231079, -1.327549934387207, -0.9430632591247559, -0.5585775375366211, -0.1740909218788147, 0.2103956937789917, 0.5948822498321533, 0.9793689250946045, 1.3638556003570557, 1.7483420372009277, 2.132828712463379, 2.51731538772583, 2.9018020629882812, 3.2862887382507324, 3.6707751750946045, 4.055261611938477, 4.439748764038086, 4.824234962463379, 5.20872163772583, 5.593208312988281, 5.977694988250732, 6.362181663513184, 6.746667861938477, 7.131155014038086, 7.515641212463379, 7.90012788772583, 8.284614562988281, 8.66910171508789, 9.053587913513184, 9.438075065612793, 9.822561264038086, 10.207048416137695, 10.591534614562988, 10.976020812988281, 11.36050796508789, 11.744994163513184]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 7.0, 7.0, 14.0, 16.0, 28.0, 36.0, 46.0, 55.0, 87.0, 163.0, 220.0, 381.0, 782.0, 1599.0, 3453.0, 8557.0, 27591.0, 179509.0, 3462499.0, 445291.0, 42894.0, 11866.0, 4681.0, 2134.0, 1068.0, 550.0, 289.0, 177.0, 101.0, 62.0, 35.0, 21.0, 18.0, 12.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.076171875, -2.0162506103515625, -1.956329345703125, -1.8964080810546875, -1.83648681640625, -1.7765655517578125, -1.716644287109375, -1.6567230224609375, -1.5968017578125, -1.5368804931640625, -1.476959228515625, -1.4170379638671875, -1.35711669921875, -1.2971954345703125, -1.237274169921875, -1.1773529052734375, -1.117431640625, -1.0575103759765625, -0.997589111328125, -0.9376678466796875, -0.87774658203125, -0.8178253173828125, -0.757904052734375, -0.6979827880859375, -0.6380615234375, -0.5781402587890625, -0.518218994140625, -0.4582977294921875, -0.39837646484375, -0.3384552001953125, -0.278533935546875, -0.2186126708984375, -0.15869140625, -0.0987701416015625, -0.038848876953125, 0.0210723876953125, 0.08099365234375, 0.1409149169921875, 0.200836181640625, 0.2607574462890625, 0.3206787109375, 0.3805999755859375, 0.440521240234375, 0.5004425048828125, 0.56036376953125, 0.6202850341796875, 0.680206298828125, 0.7401275634765625, 0.800048828125, 0.8599700927734375, 0.919891357421875, 0.9798126220703125, 1.03973388671875, 1.0996551513671875, 1.159576416015625, 1.2194976806640625, 1.2794189453125, 1.3393402099609375, 1.399261474609375, 1.4591827392578125, 1.51910400390625, 1.5790252685546875, 1.638946533203125, 1.6988677978515625, 1.7587890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 15.0, 15.0, 25.0, 21.0, 35.0, 33.0, 50.0, 58.0, 62.0, 52.0, 49.0, 65.0, 62.0, 45.0, 61.0, 51.0, 41.0, 51.0, 32.0, 28.0, 18.0, 21.0, 16.0, 18.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.107421875, -1.0788955688476562, -1.0503692626953125, -1.0218429565429688, -0.993316650390625, -0.9647903442382812, -0.9362640380859375, -0.9077377319335938, -0.87921142578125, -0.8506851196289062, -0.8221588134765625, -0.7936325073242188, -0.765106201171875, -0.7365798950195312, -0.7080535888671875, -0.6795272827148438, -0.6510009765625, -0.6224746704101562, -0.5939483642578125, -0.5654220581054688, -0.536895751953125, -0.5083694458007812, -0.4798431396484375, -0.45131683349609375, -0.42279052734375, -0.39426422119140625, -0.3657379150390625, -0.33721160888671875, -0.308685302734375, -0.28015899658203125, -0.2516326904296875, -0.22310638427734375, -0.194580078125, -0.16605377197265625, -0.1375274658203125, -0.10900115966796875, -0.080474853515625, -0.05194854736328125, -0.0234222412109375, 0.00510406494140625, 0.03363037109375, 0.06215667724609375, 0.0906829833984375, 0.11920928955078125, 0.147735595703125, 0.17626190185546875, 0.2047882080078125, 0.23331451416015625, 0.2618408203125, 0.29036712646484375, 0.3188934326171875, 0.34741973876953125, 0.375946044921875, 0.40447235107421875, 0.4329986572265625, 0.46152496337890625, 0.49005126953125, 0.5185775756835938, 0.5471038818359375, 0.5756301879882812, 0.604156494140625, 0.6326828002929688, 0.6612091064453125, 0.6897354125976562, 0.71826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 22.0, 50.0, 69.0, 172.0, 254.0, 489.0, 1170.0, 3757.0, 16002.0, 142813.0, 3830704.0, 176338.0, 16954.0, 3523.0, 1105.0, 451.0, 204.0, 100.0, 40.0, 25.0, 12.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.132232666015625, -3.03594970703125, -2.939666748046875, -2.8433837890625, -2.747100830078125, -2.65081787109375, -2.554534912109375, -2.458251953125, -2.361968994140625, -2.26568603515625, -2.169403076171875, -2.0731201171875, -1.976837158203125, -1.88055419921875, -1.784271240234375, -1.68798828125, -1.591705322265625, -1.49542236328125, -1.399139404296875, -1.3028564453125, -1.206573486328125, -1.11029052734375, -1.014007568359375, -0.917724609375, -0.821441650390625, -0.72515869140625, -0.628875732421875, -0.5325927734375, -0.436309814453125, -0.34002685546875, -0.243743896484375, -0.1474609375, -0.051177978515625, 0.04510498046875, 0.141387939453125, 0.2376708984375, 0.333953857421875, 0.43023681640625, 0.526519775390625, 0.622802734375, 0.719085693359375, 0.81536865234375, 0.911651611328125, 1.0079345703125, 1.104217529296875, 1.20050048828125, 1.296783447265625, 1.39306640625, 1.489349365234375, 1.58563232421875, 1.681915283203125, 1.7781982421875, 1.874481201171875, 1.97076416015625, 2.067047119140625, 2.163330078125, 2.259613037109375, 2.35589599609375, 2.452178955078125, 2.5484619140625, 2.644744873046875, 2.74102783203125, 2.837310791015625, 2.93359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 30.0, 54.0, 81.0, 172.0, 468.0, 1135.0, 1205.0, 480.0, 209.0, 75.0, 57.0, 19.0, 16.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.090606689453125, -3.00933837890625, -2.928070068359375, -2.8468017578125, -2.765533447265625, -2.68426513671875, -2.602996826171875, -2.521728515625, -2.440460205078125, -2.35919189453125, -2.277923583984375, -2.1966552734375, -2.115386962890625, -2.03411865234375, -1.952850341796875, -1.87158203125, -1.790313720703125, -1.70904541015625, -1.627777099609375, -1.5465087890625, -1.465240478515625, -1.38397216796875, -1.302703857421875, -1.221435546875, -1.140167236328125, -1.05889892578125, -0.977630615234375, -0.8963623046875, -0.815093994140625, -0.73382568359375, -0.652557373046875, -0.5712890625, -0.490020751953125, -0.40875244140625, -0.327484130859375, -0.2462158203125, -0.164947509765625, -0.08367919921875, -0.002410888671875, 0.078857421875, 0.160125732421875, 0.24139404296875, 0.322662353515625, 0.4039306640625, 0.485198974609375, 0.56646728515625, 0.647735595703125, 0.72900390625, 0.810272216796875, 0.89154052734375, 0.972808837890625, 1.0540771484375, 1.135345458984375, 1.21661376953125, 1.297882080078125, 1.379150390625, 1.460418701171875, 1.54168701171875, 1.622955322265625, 1.7042236328125, 1.785491943359375, 1.86676025390625, 1.948028564453125, 2.029296875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 15.0, 58.0, 253.0, 387.0, 203.0, 47.0, 16.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.369407653808594, -18.183977127075195, -16.99854850769043, -15.813117980957031, -14.627687454223633, -13.44225788116455, -12.256828308105469, -11.07139778137207, -9.885968208312988, -8.700538635253906, -7.515108108520508, -6.329678535461426, -5.1442484855651855, -3.9588184356689453, -2.7733888626098633, -1.5879583358764648, -0.4025287628173828, 0.7829011678695679, 1.9683310985565186, 3.1537609100341797, 4.33919095993042, 5.52462100982666, 6.710050582885742, 7.895481109619141, 9.080910682678223, 10.266340255737305, 11.451770782470703, 12.637200355529785, 13.822629928588867, 15.008060455322266, 16.19348907470703, 17.378921508789062, 18.564350128173828, 19.749780654907227, 20.935209274291992, 22.12063980102539, 23.30607032775879, 24.491500854492188, 25.676929473876953, 26.86236000061035, 28.04779052734375, 29.23322105407715, 30.418649673461914, 31.604080200195312, 32.78950881958008, 33.97494125366211, 35.160369873046875, 36.345802307128906, 37.531227111816406, 38.71665573120117, 39.9020881652832, 41.08751678466797, 42.272945404052734, 43.458377838134766, 44.64380645751953, 45.82923889160156, 47.01466751098633, 48.200096130371094, 49.385528564453125, 50.57095718383789, 51.756385803222656, 52.94181823730469, 54.12724685668945, 55.31267547607422, 56.49810791015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 12.0, 11.0, 10.0, 23.0, 23.0, 32.0, 34.0, 39.0, 53.0, 48.0, 45.0, 49.0, 49.0, 59.0, 42.0, 50.0, 61.0, 54.0, 43.0, 37.0, 53.0, 32.0, 22.0, 22.0, 24.0, 15.0, 13.0, 7.0, 4.0, 7.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.749755382537842, -7.472809791564941, -7.195863723754883, -6.918918132781982, -6.641972064971924, -6.365026473999023, -6.088080406188965, -5.8111348152160645, -5.534189224243164, -5.257243633270264, -4.980297565460205, -4.703351974487305, -4.426405906677246, -4.149460315704346, -3.872514486312866, -3.5955686569213867, -3.318622589111328, -3.0416767597198486, -2.764730930328369, -2.4877853393554688, -2.21083927154541, -1.9338935613632202, -1.6569478511810303, -1.3800020217895508, -1.1030561923980713, -0.8261103630065918, -0.5491645932197571, -0.27221882343292236, 0.004727005958557129, 0.2816728353500366, 0.5586185455322266, 0.835564374923706, 1.1125097274780273, 1.3894555568695068, 1.6664013862609863, 1.9433470964431763, 2.2202930450439453, 2.4972386360168457, 2.774184465408325, 3.0511302947998047, 3.328076124191284, 3.6050219535827637, 3.881967782974243, 4.158913612365723, 4.435859203338623, 4.712805271148682, 4.989750862121582, 5.266696929931641, 5.543642520904541, 5.820588111877441, 6.0975341796875, 6.3744797706604, 6.651425838470459, 6.928371429443359, 7.205317497253418, 7.482263088226318, 7.759208679199219, 8.036154747009277, 8.31309986114502, 8.590045928955078, 8.866991996765137, 9.143938064575195, 9.420883178710938, 9.697829246520996, 9.974775314331055]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 12.0, 24.0, 27.0, 34.0, 62.0, 106.0, 145.0, 248.0, 504.0, 833.0, 1511.0, 3229.0, 7003.0, 16738.0, 45458.0, 136654.0, 401281.0, 290985.0, 89678.0, 31264.0, 12339.0, 5235.0, 2393.0, 1205.0, 636.0, 343.0, 213.0, 132.0, 73.0, 49.0, 38.0, 26.0, 9.0, 10.0, 11.0, 10.0, 10.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9460601806640625, -1.890167236328125, -1.8342742919921875, -1.77838134765625, -1.7224884033203125, -1.666595458984375, -1.6107025146484375, -1.5548095703125, -1.4989166259765625, -1.443023681640625, -1.3871307373046875, -1.33123779296875, -1.2753448486328125, -1.219451904296875, -1.1635589599609375, -1.107666015625, -1.0517730712890625, -0.995880126953125, -0.9399871826171875, -0.88409423828125, -0.8282012939453125, -0.772308349609375, -0.7164154052734375, -0.6605224609375, -0.6046295166015625, -0.548736572265625, -0.4928436279296875, -0.43695068359375, -0.3810577392578125, -0.325164794921875, -0.2692718505859375, -0.21337890625, -0.1574859619140625, -0.101593017578125, -0.0457000732421875, 0.01019287109375, 0.0660858154296875, 0.121978759765625, 0.1778717041015625, 0.2337646484375, 0.2896575927734375, 0.345550537109375, 0.4014434814453125, 0.45733642578125, 0.5132293701171875, 0.569122314453125, 0.6250152587890625, 0.680908203125, 0.7368011474609375, 0.792694091796875, 0.8485870361328125, 0.90447998046875, 0.9603729248046875, 1.016265869140625, 1.0721588134765625, 1.1280517578125, 1.1839447021484375, 1.239837646484375, 1.2957305908203125, 1.35162353515625, 1.4075164794921875, 1.463409423828125, 1.5193023681640625, 1.5751953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 8.0, 15.0, 8.0, 21.0, 19.0, 19.0, 29.0, 44.0, 39.0, 39.0, 59.0, 46.0, 51.0, 50.0, 58.0, 54.0, 54.0, 34.0, 39.0, 59.0, 32.0, 42.0, 29.0, 33.0, 20.0, 11.0, 15.0, 9.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.98291015625, -0.9573593139648438, -0.9318084716796875, -0.9062576293945312, -0.880706787109375, -0.8551559448242188, -0.8296051025390625, -0.8040542602539062, -0.77850341796875, -0.7529525756835938, -0.7274017333984375, -0.7018508911132812, -0.676300048828125, -0.6507492065429688, -0.6251983642578125, -0.5996475219726562, -0.5740966796875, -0.5485458374023438, -0.5229949951171875, -0.49744415283203125, -0.471893310546875, -0.44634246826171875, -0.4207916259765625, -0.39524078369140625, -0.36968994140625, -0.34413909912109375, -0.3185882568359375, -0.29303741455078125, -0.267486572265625, -0.24193572998046875, -0.2163848876953125, -0.19083404541015625, -0.165283203125, -0.13973236083984375, -0.1141815185546875, -0.08863067626953125, -0.063079833984375, -0.03752899169921875, -0.0119781494140625, 0.01357269287109375, 0.03912353515625, 0.06467437744140625, 0.0902252197265625, 0.11577606201171875, 0.141326904296875, 0.16687774658203125, 0.1924285888671875, 0.21797943115234375, 0.2435302734375, 0.26908111572265625, 0.2946319580078125, 0.32018280029296875, 0.345733642578125, 0.37128448486328125, 0.3968353271484375, 0.42238616943359375, 0.44793701171875, 0.47348785400390625, 0.4990386962890625, 0.5245895385742188, 0.550140380859375, 0.5756912231445312, 0.6012420654296875, 0.6267929077148438, 0.65234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 9.0, 10.0, 10.0, 10.0, 8.0, 36.0, 43.0, 49.0, 83.0, 128.0, 242.0, 391.0, 736.0, 1552.0, 4132.0, 18365.0, 135598.0, 740389.0, 122342.0, 17160.0, 4166.0, 1465.0, 678.0, 332.0, 201.0, 134.0, 90.0, 54.0, 48.0, 26.0, 15.0, 13.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.631103515625, -2.52783203125, -2.424560546875, -2.3212890625, -2.218017578125, -2.11474609375, -2.011474609375, -1.908203125, -1.804931640625, -1.70166015625, -1.598388671875, -1.4951171875, -1.391845703125, -1.28857421875, -1.185302734375, -1.08203125, -0.978759765625, -0.87548828125, -0.772216796875, -0.6689453125, -0.565673828125, -0.46240234375, -0.359130859375, -0.255859375, -0.152587890625, -0.04931640625, 0.053955078125, 0.1572265625, 0.260498046875, 0.36376953125, 0.467041015625, 0.5703125, 0.673583984375, 0.77685546875, 0.880126953125, 0.9833984375, 1.086669921875, 1.18994140625, 1.293212890625, 1.396484375, 1.499755859375, 1.60302734375, 1.706298828125, 1.8095703125, 1.912841796875, 2.01611328125, 2.119384765625, 2.22265625, 2.325927734375, 2.42919921875, 2.532470703125, 2.6357421875, 2.739013671875, 2.84228515625, 2.945556640625, 3.048828125, 3.152099609375, 3.25537109375, 3.358642578125, 3.4619140625, 3.565185546875, 3.66845703125, 3.771728515625, 3.875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 8.0, 12.0, 11.0, 14.0, 18.0, 19.0, 22.0, 23.0, 30.0, 36.0, 36.0, 37.0, 39.0, 45.0, 45.0, 49.0, 39.0, 46.0, 58.0, 53.0, 37.0, 37.0, 49.0, 32.0, 25.0, 30.0, 16.0, 15.0, 14.0, 13.0, 13.0, 8.0, 10.0, 12.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.78515625, -2.70001220703125, -2.6148681640625, -2.52972412109375, -2.444580078125, -2.35943603515625, -2.2742919921875, -2.18914794921875, -2.10400390625, -2.01885986328125, -1.9337158203125, -1.84857177734375, -1.763427734375, -1.67828369140625, -1.5931396484375, -1.50799560546875, -1.4228515625, -1.33770751953125, -1.2525634765625, -1.16741943359375, -1.082275390625, -0.99713134765625, -0.9119873046875, -0.82684326171875, -0.74169921875, -0.65655517578125, -0.5714111328125, -0.48626708984375, -0.401123046875, -0.31597900390625, -0.2308349609375, -0.14569091796875, -0.060546875, 0.02459716796875, 0.1097412109375, 0.19488525390625, 0.280029296875, 0.36517333984375, 0.4503173828125, 0.53546142578125, 0.62060546875, 0.70574951171875, 0.7908935546875, 0.87603759765625, 0.961181640625, 1.04632568359375, 1.1314697265625, 1.21661376953125, 1.3017578125, 1.38690185546875, 1.4720458984375, 1.55718994140625, 1.642333984375, 1.72747802734375, 1.8126220703125, 1.89776611328125, 1.98291015625, 2.06805419921875, 2.1531982421875, 2.23834228515625, 2.323486328125, 2.40863037109375, 2.4937744140625, 2.57891845703125, 2.6640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 7.0, 12.0, 29.0, 47.0, 108.0, 345.0, 2171.0, 256132.0, 786085.0, 2970.0, 422.0, 122.0, 52.0, 15.0, 14.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.790130615234375, -3.64471435546875, -3.499298095703125, -3.3538818359375, -3.208465576171875, -3.06304931640625, -2.917633056640625, -2.772216796875, -2.626800537109375, -2.48138427734375, -2.335968017578125, -2.1905517578125, -2.045135498046875, -1.89971923828125, -1.754302978515625, -1.60888671875, -1.463470458984375, -1.31805419921875, -1.172637939453125, -1.0272216796875, -0.881805419921875, -0.73638916015625, -0.590972900390625, -0.445556640625, -0.300140380859375, -0.15472412109375, -0.009307861328125, 0.1361083984375, 0.281524658203125, 0.42694091796875, 0.572357177734375, 0.7177734375, 0.863189697265625, 1.00860595703125, 1.154022216796875, 1.2994384765625, 1.444854736328125, 1.59027099609375, 1.735687255859375, 1.881103515625, 2.026519775390625, 2.17193603515625, 2.317352294921875, 2.4627685546875, 2.608184814453125, 2.75360107421875, 2.899017333984375, 3.04443359375, 3.189849853515625, 3.33526611328125, 3.480682373046875, 3.6260986328125, 3.771514892578125, 3.91693115234375, 4.062347412109375, 4.207763671875, 4.353179931640625, 4.49859619140625, 4.644012451171875, 4.7894287109375, 4.934844970703125, 5.08026123046875, 5.225677490234375, 5.37109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 10.0, 8.0, 5.0, 8.0, 11.0, 20.0, 16.0, 34.0, 40.0, 63.0, 74.0, 108.0, 143.0, 130.0, 85.0, 66.0, 43.0, 34.0, 16.0, 24.0, 6.0, 13.0, 16.0, 4.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016164779663085938, -0.00015586242079734802, -0.00015007704496383667, -0.00014429166913032532, -0.00013850629329681396, -0.0001327209174633026, -0.00012693554162979126, -0.00012115016579627991, -0.00011536478996276855, -0.0001095794141292572, -0.00010379403829574585, -9.80086624622345e-05, -9.222328662872314e-05, -8.643791079521179e-05, -8.065253496170044e-05, -7.486715912818909e-05, -6.908178329467773e-05, -6.329640746116638e-05, -5.751103162765503e-05, -5.172565579414368e-05, -4.5940279960632324e-05, -4.015490412712097e-05, -3.436952829360962e-05, -2.8584152460098267e-05, -2.2798776626586914e-05, -1.701340079307556e-05, -1.1228024959564209e-05, -5.4426491260528564e-06, 3.427267074584961e-07, 6.128102540969849e-06, 1.1913478374481201e-05, 1.7698854207992554e-05, 2.3484230041503906e-05, 2.926960587501526e-05, 3.505498170852661e-05, 4.0840357542037964e-05, 4.6625733375549316e-05, 5.241110920906067e-05, 5.819648504257202e-05, 6.398186087608337e-05, 6.976723670959473e-05, 7.555261254310608e-05, 8.133798837661743e-05, 8.712336421012878e-05, 9.290874004364014e-05, 9.869411587715149e-05, 0.00010447949171066284, 0.0001102648675441742, 0.00011605024337768555, 0.0001218356192111969, 0.00012762099504470825, 0.0001334063708782196, 0.00013919174671173096, 0.0001449771225452423, 0.00015076249837875366, 0.00015654787421226501, 0.00016233325004577637, 0.00016811862587928772, 0.00017390400171279907, 0.00017968937754631042, 0.00018547475337982178, 0.00019126012921333313, 0.00019704550504684448, 0.00020283088088035583, 0.0002086162567138672]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 11.0, 15.0, 26.0, 40.0, 66.0, 114.0, 222.0, 477.0, 1117.0, 3599.0, 18200.0, 275592.0, 704149.0, 36440.0, 5583.0, 1672.0, 584.0, 264.0, 141.0, 74.0, 55.0, 29.0, 27.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.975067138671875, -0.92669677734375, -0.878326416015625, -0.8299560546875, -0.781585693359375, -0.73321533203125, -0.684844970703125, -0.636474609375, -0.588104248046875, -0.53973388671875, -0.491363525390625, -0.4429931640625, -0.394622802734375, -0.34625244140625, -0.297882080078125, -0.24951171875, -0.201141357421875, -0.15277099609375, -0.104400634765625, -0.0560302734375, -0.007659912109375, 0.04071044921875, 0.089080810546875, 0.137451171875, 0.185821533203125, 0.23419189453125, 0.282562255859375, 0.3309326171875, 0.379302978515625, 0.42767333984375, 0.476043701171875, 0.5244140625, 0.572784423828125, 0.62115478515625, 0.669525146484375, 0.7178955078125, 0.766265869140625, 0.81463623046875, 0.863006591796875, 0.911376953125, 0.959747314453125, 1.00811767578125, 1.056488037109375, 1.1048583984375, 1.153228759765625, 1.20159912109375, 1.249969482421875, 1.29833984375, 1.346710205078125, 1.39508056640625, 1.443450927734375, 1.4918212890625, 1.540191650390625, 1.58856201171875, 1.636932373046875, 1.685302734375, 1.733673095703125, 1.78204345703125, 1.830413818359375, 1.8787841796875, 1.927154541015625, 1.97552490234375, 2.023895263671875, 2.072265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 5.0, 12.0, 10.0, 22.0, 36.0, 43.0, 65.0, 87.0, 107.0, 128.0, 121.0, 93.0, 73.0, 50.0, 49.0, 36.0, 17.0, 13.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.980621337890625, -0.94268798828125, -0.904754638671875, -0.8668212890625, -0.828887939453125, -0.79095458984375, -0.753021240234375, -0.715087890625, -0.677154541015625, -0.63922119140625, -0.601287841796875, -0.5633544921875, -0.525421142578125, -0.48748779296875, -0.449554443359375, -0.41162109375, -0.373687744140625, -0.33575439453125, -0.297821044921875, -0.2598876953125, -0.221954345703125, -0.18402099609375, -0.146087646484375, -0.108154296875, -0.070220947265625, -0.03228759765625, 0.005645751953125, 0.0435791015625, 0.081512451171875, 0.11944580078125, 0.157379150390625, 0.1953125, 0.233245849609375, 0.27117919921875, 0.309112548828125, 0.3470458984375, 0.384979248046875, 0.42291259765625, 0.460845947265625, 0.498779296875, 0.536712646484375, 0.57464599609375, 0.612579345703125, 0.6505126953125, 0.688446044921875, 0.72637939453125, 0.764312744140625, 0.80224609375, 0.840179443359375, 0.87811279296875, 0.916046142578125, 0.9539794921875, 0.991912841796875, 1.02984619140625, 1.067779541015625, 1.105712890625, 1.143646240234375, 1.18157958984375, 1.219512939453125, 1.2574462890625, 1.295379638671875, 1.33331298828125, 1.371246337890625, 1.4091796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 69.0, 183.0, 351.0, 229.0, 71.0, 31.0, 10.0, 10.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.86699676513672, -38.75015640258789, -37.63331604003906, -36.516475677490234, -35.399635314941406, -34.28279495239258, -33.16595458984375, -32.04911804199219, -30.932275772094727, -29.8154354095459, -28.69859504699707, -27.581754684448242, -26.464916229248047, -25.34807586669922, -24.23123550415039, -23.114395141601562, -21.997554779052734, -20.880714416503906, -19.763874053955078, -18.64703369140625, -17.530193328857422, -16.413352966308594, -15.296514511108398, -14.17967414855957, -13.062833786010742, -11.945993423461914, -10.829153060913086, -9.712313652038574, -8.595473289489746, -7.478632926940918, -6.361793041229248, -5.244953155517578, -4.12811279296875, -3.011272668838501, -1.894432544708252, -0.7775924205780029, 0.3392477035522461, 1.4560880661010742, 2.572927951812744, 3.689767837524414, 4.806608200073242, 5.92344856262207, 7.04028844833374, 8.15712833404541, 9.273968696594238, 10.390809059143066, 11.507648468017578, 12.624488830566406, 13.741329193115234, 14.858169555664062, 15.97500991821289, 17.09185028076172, 18.208690643310547, 19.325531005859375, 20.44236946105957, 21.5592098236084, 22.676050186157227, 23.792890548706055, 24.909730911254883, 26.02657127380371, 27.143409729003906, 28.260250091552734, 29.377090454101562, 30.49393081665039, 31.61077117919922]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 9.0, 10.0, 15.0, 11.0, 23.0, 19.0, 29.0, 29.0, 34.0, 40.0, 37.0, 45.0, 55.0, 45.0, 55.0, 51.0, 52.0, 52.0, 49.0, 43.0, 31.0, 34.0, 25.0, 19.0, 25.0, 24.0, 21.0, 19.0, 16.0, 13.0, 7.0, 13.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.482670783996582, -9.140835762023926, -8.79900074005127, -8.457165718078613, -8.115331649780273, -7.773496150970459, -7.431661605834961, -7.089826583862305, -6.747991561889648, -6.406156539916992, -6.064321517944336, -5.722486972808838, -5.380651950836182, -5.038816928863525, -4.696982383728027, -4.355147361755371, -4.013312339782715, -3.6714773178100586, -3.3296425342559814, -2.9878077507019043, -2.645972728729248, -2.304137706756592, -1.9623029232025146, -1.6204681396484375, -1.2786331176757812, -0.9367982149124146, -0.5949633121490479, -0.25312840938568115, 0.08870649337768555, 0.43054139614105225, 0.772376298904419, 1.114211082458496, 1.456045150756836, 1.7978800535202026, 2.1397149562835693, 2.4815497398376465, 2.8233847618103027, 3.165219783782959, 3.507054567337036, 3.8488893508911133, 4.1907243728637695, 4.532559394836426, 4.874394416809082, 5.21622896194458, 5.558063983917236, 5.899899005889893, 6.241733551025391, 6.583568572998047, 6.925403594970703, 7.267238616943359, 7.609073638916016, 7.950908184051514, 8.292743682861328, 8.634577751159668, 8.976412773132324, 9.31824779510498, 9.660082817077637, 10.001917839050293, 10.34375286102295, 10.685587882995605, 11.027421951293945, 11.369256973266602, 11.711091995239258, 12.052927017211914, 12.39476203918457]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 14.0, 4.0, 9.0, 23.0, 26.0, 34.0, 38.0, 59.0, 86.0, 121.0, 178.0, 294.0, 444.0, 804.0, 1394.0, 2636.0, 5661.0, 13338.0, 37410.0, 147057.0, 1218279.0, 2385928.0, 287098.0, 58793.0, 19009.0, 7535.0, 3557.0, 1805.0, 973.0, 558.0, 370.0, 233.0, 156.0, 98.0, 61.0, 57.0, 38.0, 26.0, 20.0, 12.0, 11.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.306640625, -1.2684173583984375, -1.230194091796875, -1.1919708251953125, -1.15374755859375, -1.1155242919921875, -1.077301025390625, -1.0390777587890625, -1.0008544921875, -0.9626312255859375, -0.924407958984375, -0.8861846923828125, -0.84796142578125, -0.8097381591796875, -0.771514892578125, -0.7332916259765625, -0.695068359375, -0.6568450927734375, -0.618621826171875, -0.5803985595703125, -0.54217529296875, -0.5039520263671875, -0.465728759765625, -0.4275054931640625, -0.3892822265625, -0.3510589599609375, -0.312835693359375, -0.2746124267578125, -0.23638916015625, -0.1981658935546875, -0.159942626953125, -0.1217193603515625, -0.08349609375, -0.0452728271484375, -0.007049560546875, 0.0311737060546875, 0.06939697265625, 0.1076202392578125, 0.145843505859375, 0.1840667724609375, 0.2222900390625, 0.2605133056640625, 0.298736572265625, 0.3369598388671875, 0.37518310546875, 0.4134063720703125, 0.451629638671875, 0.4898529052734375, 0.528076171875, 0.5662994384765625, 0.604522705078125, 0.6427459716796875, 0.68096923828125, 0.7191925048828125, 0.757415771484375, 0.7956390380859375, 0.8338623046875, 0.8720855712890625, 0.910308837890625, 0.9485321044921875, 0.98675537109375, 1.0249786376953125, 1.063201904296875, 1.1014251708984375, 1.1396484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 20.0, 21.0, 30.0, 43.0, 49.0, 60.0, 67.0, 81.0, 81.0, 81.0, 69.0, 72.0, 68.0, 51.0, 57.0, 42.0, 26.0, 14.0, 19.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1061859130859375, -1.070770263671875, -1.0353546142578125, -0.99993896484375, -0.9645233154296875, -0.929107666015625, -0.8936920166015625, -0.8582763671875, -0.8228607177734375, -0.787445068359375, -0.7520294189453125, -0.71661376953125, -0.6811981201171875, -0.645782470703125, -0.6103668212890625, -0.574951171875, -0.5395355224609375, -0.504119873046875, -0.4687042236328125, -0.43328857421875, -0.3978729248046875, -0.362457275390625, -0.3270416259765625, -0.2916259765625, -0.2562103271484375, -0.220794677734375, -0.1853790283203125, -0.14996337890625, -0.1145477294921875, -0.079132080078125, -0.0437164306640625, -0.00830078125, 0.0271148681640625, 0.062530517578125, 0.0979461669921875, 0.13336181640625, 0.1687774658203125, 0.204193115234375, 0.2396087646484375, 0.2750244140625, 0.3104400634765625, 0.345855712890625, 0.3812713623046875, 0.41668701171875, 0.4521026611328125, 0.487518310546875, 0.5229339599609375, 0.558349609375, 0.5937652587890625, 0.629180908203125, 0.6645965576171875, 0.70001220703125, 0.7354278564453125, 0.770843505859375, 0.8062591552734375, 0.8416748046875, 0.8770904541015625, 0.912506103515625, 0.9479217529296875, 0.98333740234375, 1.0187530517578125, 1.054168701171875, 1.0895843505859375, 1.125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 12.0, 27.0, 23.0, 35.0, 51.0, 74.0, 137.0, 212.0, 415.0, 847.0, 2156.0, 6016.0, 20020.0, 86916.0, 983631.0, 2865149.0, 180300.0, 33731.0, 9169.0, 2966.0, 1187.0, 523.0, 276.0, 145.0, 79.0, 48.0, 36.0, 23.0, 22.0, 11.0, 10.0, 3.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.707122802734375, -1.65057373046875, -1.594024658203125, -1.5374755859375, -1.480926513671875, -1.42437744140625, -1.367828369140625, -1.311279296875, -1.254730224609375, -1.19818115234375, -1.141632080078125, -1.0850830078125, -1.028533935546875, -0.97198486328125, -0.915435791015625, -0.85888671875, -0.802337646484375, -0.74578857421875, -0.689239501953125, -0.6326904296875, -0.576141357421875, -0.51959228515625, -0.463043212890625, -0.406494140625, -0.349945068359375, -0.29339599609375, -0.236846923828125, -0.1802978515625, -0.123748779296875, -0.06719970703125, -0.010650634765625, 0.0458984375, 0.102447509765625, 0.15899658203125, 0.215545654296875, 0.2720947265625, 0.328643798828125, 0.38519287109375, 0.441741943359375, 0.498291015625, 0.554840087890625, 0.61138916015625, 0.667938232421875, 0.7244873046875, 0.781036376953125, 0.83758544921875, 0.894134521484375, 0.95068359375, 1.007232666015625, 1.06378173828125, 1.120330810546875, 1.1768798828125, 1.233428955078125, 1.28997802734375, 1.346527099609375, 1.403076171875, 1.459625244140625, 1.51617431640625, 1.572723388671875, 1.6292724609375, 1.685821533203125, 1.74237060546875, 1.798919677734375, 1.85546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 10.0, 11.0, 21.0, 16.0, 27.0, 28.0, 43.0, 40.0, 63.0, 111.0, 138.0, 210.0, 330.0, 494.0, 553.0, 584.0, 395.0, 275.0, 186.0, 120.0, 89.0, 62.0, 53.0, 39.0, 29.0, 18.0, 17.0, 12.0, 17.0, 14.0, 7.0, 3.0, 6.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.494140625, -1.4512481689453125, -1.408355712890625, -1.3654632568359375, -1.32257080078125, -1.2796783447265625, -1.236785888671875, -1.1938934326171875, -1.1510009765625, -1.1081085205078125, -1.065216064453125, -1.0223236083984375, -0.97943115234375, -0.9365386962890625, -0.893646240234375, -0.8507537841796875, -0.807861328125, -0.7649688720703125, -0.722076416015625, -0.6791839599609375, -0.63629150390625, -0.5933990478515625, -0.550506591796875, -0.5076141357421875, -0.4647216796875, -0.4218292236328125, -0.378936767578125, -0.3360443115234375, -0.29315185546875, -0.2502593994140625, -0.207366943359375, -0.1644744873046875, -0.12158203125, -0.0786895751953125, -0.035797119140625, 0.0070953369140625, 0.04998779296875, 0.0928802490234375, 0.135772705078125, 0.1786651611328125, 0.2215576171875, 0.2644500732421875, 0.307342529296875, 0.3502349853515625, 0.39312744140625, 0.4360198974609375, 0.478912353515625, 0.5218048095703125, 0.564697265625, 0.6075897216796875, 0.650482177734375, 0.6933746337890625, 0.73626708984375, 0.7791595458984375, 0.822052001953125, 0.8649444580078125, 0.9078369140625, 0.9507293701171875, 0.993621826171875, 1.0365142822265625, 1.07940673828125, 1.1222991943359375, 1.165191650390625, 1.2080841064453125, 1.2509765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 9.0, 13.0, 26.0, 64.0, 107.0, 164.0, 192.0, 161.0, 116.0, 62.0, 38.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.264766693115234, -22.661638259887695, -22.058509826660156, -21.45538330078125, -20.85225486755371, -20.249126434326172, -19.645998001098633, -19.042869567871094, -18.439743041992188, -17.83661460876465, -17.23348617553711, -16.630359649658203, -16.027231216430664, -15.424102783203125, -14.820974349975586, -14.217846870422363, -13.614718437194824, -13.011590003967285, -12.408462524414062, -11.805334091186523, -11.2022066116333, -10.599078178405762, -9.995950698852539, -9.392822265625, -8.789693832397461, -8.186565399169922, -7.583437919616699, -6.98030948638916, -6.3771820068359375, -5.774053573608398, -5.170925617218018, -4.567797660827637, -3.9646692276000977, -3.361541271209717, -2.758413314819336, -2.155285120010376, -1.5521571636199951, -0.9490292072296143, -0.3459010124206543, 0.25722694396972656, 0.8603549003601074, 1.4634828567504883, 2.066610813140869, 2.669739007949829, 3.27286696434021, 3.875994920730591, 4.479123115539551, 5.082251071929932, 5.6853790283203125, 6.288506984710693, 6.891634941101074, 7.494763374328613, 8.097890853881836, 8.701019287109375, 9.304147720336914, 9.907275199890137, 10.51040267944336, 11.113531112670898, 11.716658592224121, 12.31978702545166, 12.922914505004883, 13.526042938232422, 14.129171371459961, 14.732298851013184, 15.335427284240723]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 12.0, 15.0, 15.0, 17.0, 24.0, 14.0, 34.0, 36.0, 45.0, 55.0, 42.0, 72.0, 56.0, 63.0, 66.0, 65.0, 33.0, 49.0, 42.0, 42.0, 32.0, 20.0, 22.0, 33.0, 20.0, 25.0, 13.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.27517318725586, -9.972159385681152, -9.669144630432129, -9.366130828857422, -9.063117027282715, -8.760102272033691, -8.457088470458984, -8.154073715209961, -7.851059913635254, -7.548045635223389, -7.245031833648682, -6.942017555236816, -6.639003276824951, -6.335988998413086, -6.032975196838379, -5.729960918426514, -5.426947116851807, -5.123932838439941, -4.820919036865234, -4.517904758453369, -4.214890480041504, -3.9118764400482178, -3.6088624000549316, -3.3058481216430664, -3.0028340816497803, -2.699820041656494, -2.396805763244629, -2.0937917232513428, -1.790777564048767, -1.4877634048461914, -1.1847493648529053, -0.88173508644104, -0.5787210464477539, -0.2757069170475006, 0.027307212352752686, 0.3303213119506836, 0.6333354711532593, 0.936349630355835, 1.239363670349121, 1.5423779487609863, 1.8453919887542725, 2.1484060287475586, 2.451420307159424, 2.75443434715271, 3.057448387145996, 3.3604626655578613, 3.6634767055511475, 3.9664909839630127, 4.269505023956299, 4.572519302368164, 4.875533103942871, 5.178547382354736, 5.481561660766602, 5.784575462341309, 6.087589740753174, 6.390604019165039, 6.693617820739746, 6.996632099151611, 7.299645900726318, 7.602660179138184, 7.905674457550049, 8.208688735961914, 8.511702537536621, 8.814716339111328, 9.117731094360352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 5.0, 8.0, 21.0, 20.0, 25.0, 28.0, 52.0, 73.0, 115.0, 147.0, 241.0, 341.0, 552.0, 1085.0, 1862.0, 3515.0, 7308.0, 16444.0, 38229.0, 93208.0, 225661.0, 352007.0, 177667.0, 73458.0, 30568.0, 13069.0, 5974.0, 2937.0, 1592.0, 847.0, 477.0, 308.0, 216.0, 148.0, 81.0, 68.0, 61.0, 27.0, 31.0, 17.0, 10.0, 7.0, 11.0, 9.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.546875, -1.501861572265625, -1.45684814453125, -1.411834716796875, -1.3668212890625, -1.321807861328125, -1.27679443359375, -1.231781005859375, -1.186767578125, -1.141754150390625, -1.09674072265625, -1.051727294921875, -1.0067138671875, -0.961700439453125, -0.91668701171875, -0.871673583984375, -0.82666015625, -0.781646728515625, -0.73663330078125, -0.691619873046875, -0.6466064453125, -0.601593017578125, -0.55657958984375, -0.511566162109375, -0.466552734375, -0.421539306640625, -0.37652587890625, -0.331512451171875, -0.2864990234375, -0.241485595703125, -0.19647216796875, -0.151458740234375, -0.1064453125, -0.061431884765625, -0.01641845703125, 0.028594970703125, 0.0736083984375, 0.118621826171875, 0.16363525390625, 0.208648681640625, 0.253662109375, 0.298675537109375, 0.34368896484375, 0.388702392578125, 0.4337158203125, 0.478729248046875, 0.52374267578125, 0.568756103515625, 0.61376953125, 0.658782958984375, 0.70379638671875, 0.748809814453125, 0.7938232421875, 0.838836669921875, 0.88385009765625, 0.928863525390625, 0.973876953125, 1.018890380859375, 1.06390380859375, 1.108917236328125, 1.1539306640625, 1.198944091796875, 1.24395751953125, 1.288970947265625, 1.333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 17.0, 26.0, 32.0, 50.0, 54.0, 53.0, 59.0, 72.0, 91.0, 81.0, 80.0, 81.0, 66.0, 60.0, 47.0, 27.0, 26.0, 20.0, 10.0, 12.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.11456298828125, -1.0787353515625, -1.04290771484375, -1.007080078125, -0.97125244140625, -0.9354248046875, -0.89959716796875, -0.86376953125, -0.82794189453125, -0.7921142578125, -0.75628662109375, -0.720458984375, -0.68463134765625, -0.6488037109375, -0.61297607421875, -0.5771484375, -0.54132080078125, -0.5054931640625, -0.46966552734375, -0.433837890625, -0.39801025390625, -0.3621826171875, -0.32635498046875, -0.29052734375, -0.25469970703125, -0.2188720703125, -0.18304443359375, -0.147216796875, -0.11138916015625, -0.0755615234375, -0.03973388671875, -0.00390625, 0.03192138671875, 0.0677490234375, 0.10357666015625, 0.139404296875, 0.17523193359375, 0.2110595703125, 0.24688720703125, 0.28271484375, 0.31854248046875, 0.3543701171875, 0.39019775390625, 0.426025390625, 0.46185302734375, 0.4976806640625, 0.53350830078125, 0.5693359375, 0.60516357421875, 0.6409912109375, 0.67681884765625, 0.712646484375, 0.74847412109375, 0.7843017578125, 0.82012939453125, 0.85595703125, 0.89178466796875, 0.9276123046875, 0.96343994140625, 0.999267578125, 1.03509521484375, 1.0709228515625, 1.10675048828125, 1.142578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 15.0, 22.0, 30.0, 47.0, 64.0, 125.0, 187.0, 346.0, 573.0, 1054.0, 2592.0, 9851.0, 116116.0, 847104.0, 59169.0, 6880.0, 2130.0, 939.0, 508.0, 289.0, 173.0, 117.0, 61.0, 50.0, 29.0, 22.0, 13.0, 8.0, 12.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.56463623046875, -4.4144287109375, -4.26422119140625, -4.114013671875, -3.96380615234375, -3.8135986328125, -3.66339111328125, -3.51318359375, -3.36297607421875, -3.2127685546875, -3.06256103515625, -2.912353515625, -2.76214599609375, -2.6119384765625, -2.46173095703125, -2.3115234375, -2.16131591796875, -2.0111083984375, -1.86090087890625, -1.710693359375, -1.56048583984375, -1.4102783203125, -1.26007080078125, -1.10986328125, -0.95965576171875, -0.8094482421875, -0.65924072265625, -0.509033203125, -0.35882568359375, -0.2086181640625, -0.05841064453125, 0.091796875, 0.24200439453125, 0.3922119140625, 0.54241943359375, 0.692626953125, 0.84283447265625, 0.9930419921875, 1.14324951171875, 1.29345703125, 1.44366455078125, 1.5938720703125, 1.74407958984375, 1.894287109375, 2.04449462890625, 2.1947021484375, 2.34490966796875, 2.4951171875, 2.64532470703125, 2.7955322265625, 2.94573974609375, 3.095947265625, 3.24615478515625, 3.3963623046875, 3.54656982421875, 3.69677734375, 3.84698486328125, 3.9971923828125, 4.14739990234375, 4.297607421875, 4.44781494140625, 4.5980224609375, 4.74822998046875, 4.8984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 2.0, 10.0, 10.0, 12.0, 14.0, 22.0, 17.0, 24.0, 24.0, 37.0, 44.0, 43.0, 43.0, 56.0, 58.0, 59.0, 50.0, 79.0, 63.0, 43.0, 42.0, 39.0, 42.0, 28.0, 20.0, 22.0, 20.0, 7.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.6328125, -3.51812744140625, -3.4034423828125, -3.28875732421875, -3.174072265625, -3.05938720703125, -2.9447021484375, -2.83001708984375, -2.71533203125, -2.60064697265625, -2.4859619140625, -2.37127685546875, -2.256591796875, -2.14190673828125, -2.0272216796875, -1.91253662109375, -1.7978515625, -1.68316650390625, -1.5684814453125, -1.45379638671875, -1.339111328125, -1.22442626953125, -1.1097412109375, -0.99505615234375, -0.88037109375, -0.76568603515625, -0.6510009765625, -0.53631591796875, -0.421630859375, -0.30694580078125, -0.1922607421875, -0.07757568359375, 0.037109375, 0.15179443359375, 0.2664794921875, 0.38116455078125, 0.495849609375, 0.61053466796875, 0.7252197265625, 0.83990478515625, 0.95458984375, 1.06927490234375, 1.1839599609375, 1.29864501953125, 1.413330078125, 1.52801513671875, 1.6427001953125, 1.75738525390625, 1.8720703125, 1.98675537109375, 2.1014404296875, 2.21612548828125, 2.330810546875, 2.44549560546875, 2.5601806640625, 2.67486572265625, 2.78955078125, 2.90423583984375, 3.0189208984375, 3.13360595703125, 3.248291015625, 3.36297607421875, 3.4776611328125, 3.59234619140625, 3.70703125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 5.0, 7.0, 13.0, 14.0, 17.0, 13.0, 21.0, 36.0, 42.0, 69.0, 114.0, 155.0, 219.0, 419.0, 985.0, 2986.0, 14526.0, 168576.0, 792568.0, 57215.0, 7121.0, 1733.0, 697.0, 351.0, 186.0, 145.0, 70.0, 60.0, 41.0, 23.0, 29.0, 18.0, 13.0, 12.0, 9.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2494049072265625, -1.210723876953125, -1.1720428466796875, -1.13336181640625, -1.0946807861328125, -1.055999755859375, -1.0173187255859375, -0.9786376953125, -0.9399566650390625, -0.901275634765625, -0.8625946044921875, -0.82391357421875, -0.7852325439453125, -0.746551513671875, -0.7078704833984375, -0.669189453125, -0.6305084228515625, -0.591827392578125, -0.5531463623046875, -0.51446533203125, -0.4757843017578125, -0.437103271484375, -0.3984222412109375, -0.3597412109375, -0.3210601806640625, -0.282379150390625, -0.2436981201171875, -0.20501708984375, -0.1663360595703125, -0.127655029296875, -0.0889739990234375, -0.05029296875, -0.0116119384765625, 0.027069091796875, 0.0657501220703125, 0.10443115234375, 0.1431121826171875, 0.181793212890625, 0.2204742431640625, 0.2591552734375, 0.2978363037109375, 0.336517333984375, 0.3751983642578125, 0.41387939453125, 0.4525604248046875, 0.491241455078125, 0.5299224853515625, 0.568603515625, 0.6072845458984375, 0.645965576171875, 0.6846466064453125, 0.72332763671875, 0.7620086669921875, 0.800689697265625, 0.8393707275390625, 0.8780517578125, 0.9167327880859375, 0.955413818359375, 0.9940948486328125, 1.03277587890625, 1.0714569091796875, 1.110137939453125, 1.1488189697265625, 1.1875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 3.0, 5.0, 6.0, 16.0, 11.0, 11.0, 16.0, 12.0, 18.0, 25.0, 34.0, 45.0, 55.0, 69.0, 90.0, 106.0, 79.0, 71.0, 65.0, 45.0, 28.0, 28.0, 24.0, 27.0, 13.0, 14.0, 21.0, 7.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013649463653564453, -0.00013159587979316711, -0.0001266971230506897, -0.00012179836630821228, -0.00011689960956573486, -0.00011200085282325745, -0.00010710209608078003, -0.00010220333933830261, -9.73045825958252e-05, -9.240582585334778e-05, -8.750706911087036e-05, -8.260831236839294e-05, -7.770955562591553e-05, -7.281079888343811e-05, -6.79120421409607e-05, -6.301328539848328e-05, -5.811452865600586e-05, -5.321577191352844e-05, -4.8317015171051025e-05, -4.341825842857361e-05, -3.851950168609619e-05, -3.3620744943618774e-05, -2.8721988201141357e-05, -2.382323145866394e-05, -1.8924474716186523e-05, -1.4025717973709106e-05, -9.12696123123169e-06, -4.2282044887542725e-06, 6.705522537231445e-07, 5.5693089962005615e-06, 1.0468065738677979e-05, 1.5366822481155396e-05, 2.0265579223632812e-05, 2.516433596611023e-05, 3.0063092708587646e-05, 3.4961849451065063e-05, 3.986060619354248e-05, 4.47593629360199e-05, 4.9658119678497314e-05, 5.455687642097473e-05, 5.945563316345215e-05, 6.435438990592957e-05, 6.925314664840698e-05, 7.41519033908844e-05, 7.905066013336182e-05, 8.394941687583923e-05, 8.884817361831665e-05, 9.374693036079407e-05, 9.864568710327148e-05, 0.0001035444438457489, 0.00010844320058822632, 0.00011334195733070374, 0.00011824071407318115, 0.00012313947081565857, 0.00012803822755813599, 0.0001329369843006134, 0.00013783574104309082, 0.00014273449778556824, 0.00014763325452804565, 0.00015253201127052307, 0.0001574307680130005, 0.0001623295247554779, 0.00016722828149795532, 0.00017212703824043274, 0.00017702579498291016]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 17.0, 14.0, 16.0, 17.0, 33.0, 46.0, 63.0, 84.0, 126.0, 195.0, 317.0, 629.0, 1329.0, 3839.0, 13773.0, 112238.0, 826733.0, 72269.0, 10952.0, 3202.0, 1243.0, 558.0, 300.0, 156.0, 112.0, 56.0, 55.0, 46.0, 32.0, 24.0, 14.0, 15.0, 10.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2555999755859375, -1.214324951171875, -1.1730499267578125, -1.13177490234375, -1.0904998779296875, -1.049224853515625, -1.0079498291015625, -0.9666748046875, -0.9253997802734375, -0.884124755859375, -0.8428497314453125, -0.80157470703125, -0.7602996826171875, -0.719024658203125, -0.6777496337890625, -0.636474609375, -0.5951995849609375, -0.553924560546875, -0.5126495361328125, -0.47137451171875, -0.4300994873046875, -0.388824462890625, -0.3475494384765625, -0.3062744140625, -0.2649993896484375, -0.223724365234375, -0.1824493408203125, -0.14117431640625, -0.0998992919921875, -0.058624267578125, -0.0173492431640625, 0.02392578125, 0.0652008056640625, 0.106475830078125, 0.1477508544921875, 0.18902587890625, 0.2303009033203125, 0.271575927734375, 0.3128509521484375, 0.3541259765625, 0.3954010009765625, 0.436676025390625, 0.4779510498046875, 0.51922607421875, 0.5605010986328125, 0.601776123046875, 0.6430511474609375, 0.684326171875, 0.7256011962890625, 0.766876220703125, 0.8081512451171875, 0.84942626953125, 0.8907012939453125, 0.931976318359375, 0.9732513427734375, 1.0145263671875, 1.0558013916015625, 1.097076416015625, 1.1383514404296875, 1.17962646484375, 1.2209014892578125, 1.262176513671875, 1.3034515380859375, 1.3447265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 6.0, 8.0, 10.0, 17.0, 23.0, 40.0, 37.0, 45.0, 63.0, 81.0, 93.0, 109.0, 112.0, 84.0, 76.0, 46.0, 33.0, 19.0, 18.0, 14.0, 8.0, 10.0, 4.0, 4.0, 7.0, 0.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.92626953125, -0.8948593139648438, -0.8634490966796875, -0.8320388793945312, -0.800628662109375, -0.7692184448242188, -0.7378082275390625, -0.7063980102539062, -0.67498779296875, -0.6435775756835938, -0.6121673583984375, -0.5807571411132812, -0.549346923828125, -0.5179367065429688, -0.4865264892578125, -0.45511627197265625, -0.4237060546875, -0.39229583740234375, -0.3608856201171875, -0.32947540283203125, -0.298065185546875, -0.26665496826171875, -0.2352447509765625, -0.20383453369140625, -0.17242431640625, -0.14101409912109375, -0.1096038818359375, -0.07819366455078125, -0.046783447265625, -0.01537322998046875, 0.0160369873046875, 0.04744720458984375, 0.078857421875, 0.11026763916015625, 0.1416778564453125, 0.17308807373046875, 0.204498291015625, 0.23590850830078125, 0.2673187255859375, 0.29872894287109375, 0.33013916015625, 0.36154937744140625, 0.3929595947265625, 0.42436981201171875, 0.455780029296875, 0.48719024658203125, 0.5186004638671875, 0.5500106811523438, 0.5814208984375, 0.6128311157226562, 0.6442413330078125, 0.6756515502929688, 0.707061767578125, 0.7384719848632812, 0.7698822021484375, 0.8012924194335938, 0.83270263671875, 0.8641128540039062, 0.8955230712890625, 0.9269332885742188, 0.958343505859375, 0.9897537231445312, 1.0211639404296875, 1.0525741577148438, 1.083984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 5.0, 16.0, 21.0, 48.0, 47.0, 102.0, 112.0, 178.0, 166.0, 105.0, 68.0, 51.0, 23.0, 11.0, 7.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.943916320800781, -15.443807601928711, -14.94369888305664, -14.44359016418457, -13.943480491638184, -13.443371772766113, -12.943263053894043, -12.443154335021973, -11.943044662475586, -11.442935943603516, -10.942827224731445, -10.442718505859375, -9.942608833312988, -9.442500114440918, -8.942391395568848, -8.442282676696777, -7.942173957824707, -7.442065238952637, -6.941956043243408, -6.441847324371338, -5.941738128662109, -5.441629409790039, -4.941520690917969, -4.441411972045898, -3.94130277633667, -3.4411938190460205, -2.941084861755371, -2.440976142883301, -1.9408671855926514, -1.440758228302002, -0.9406495094299316, -0.4405405521392822, 0.05956840515136719, 0.5596773028373718, 1.0597862005233765, 1.5598950386047363, 2.0600039958953857, 2.560112953186035, 3.0602216720581055, 3.560330629348755, 4.060439586639404, 4.560548305511475, 5.060657501220703, 5.560766220092773, 6.060874938964844, 6.560984134674072, 7.061092853546143, 7.561202049255371, 8.061310768127441, 8.561419486999512, 9.061528205871582, 9.561637878417969, 10.061746597290039, 10.56185531616211, 11.06196403503418, 11.56207275390625, 12.06218147277832, 12.56229019165039, 13.062398910522461, 13.562507629394531, 14.062617301940918, 14.562726020812988, 15.062834739685059, 15.562943458557129, 16.063053131103516]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 9.0, 19.0, 15.0, 22.0, 20.0, 34.0, 21.0, 35.0, 40.0, 38.0, 30.0, 70.0, 86.0, 80.0, 72.0, 53.0, 49.0, 45.0, 37.0, 16.0, 28.0, 24.0, 25.0, 26.0, 11.0, 25.0, 18.0, 14.0, 3.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.230524063110352, -14.78946304321289, -14.348401069641113, -13.907340049743652, -13.466278076171875, -13.025217056274414, -12.584156036376953, -12.143094062805176, -11.702033042907715, -11.260972023010254, -10.819910049438477, -10.378849029541016, -9.937787055969238, -9.496726036071777, -9.0556640625, -8.614603042602539, -8.173542022705078, -7.732480525970459, -7.29141902923584, -6.850358009338379, -6.40929651260376, -5.968235015869141, -5.5271735191345215, -5.086112022399902, -4.645050048828125, -4.203988552093506, -3.762927293777466, -3.3218657970428467, -2.8808045387268066, -2.4397430419921875, -1.9986815452575684, -1.5576202869415283, -1.1165590286254883, -0.6754976511001587, -0.23443621397018433, 0.20662522315979004, 0.6476866006851196, 1.0887479782104492, 1.5298094749450684, 1.9708707332611084, 2.4119322299957275, 2.8529937267303467, 3.2940549850463867, 3.735116481781006, 4.176177978515625, 4.617238998413086, 5.058300971984863, 5.499361991882324, 5.940423488616943, 6.3814849853515625, 6.822546482086182, 7.263607978820801, 7.704668998718262, 8.145730972290039, 8.5867919921875, 9.027853012084961, 9.468914985656738, 9.9099760055542, 10.351037979125977, 10.792098999023438, 11.233160972595215, 11.674221992492676, 12.115283966064453, 12.556344985961914, 12.997406005859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 15.0, 20.0, 28.0, 38.0, 58.0, 100.0, 173.0, 324.0, 687.0, 1637.0, 4340.0, 15467.0, 83652.0, 1501718.0, 2434640.0, 122639.0, 19689.0, 5362.0, 1985.0, 803.0, 384.0, 241.0, 122.0, 51.0, 45.0, 23.0, 17.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.05059814453125, -1.9937744140625, -1.93695068359375, -1.880126953125, -1.82330322265625, -1.7664794921875, -1.70965576171875, -1.65283203125, -1.59600830078125, -1.5391845703125, -1.48236083984375, -1.425537109375, -1.36871337890625, -1.3118896484375, -1.25506591796875, -1.1982421875, -1.14141845703125, -1.0845947265625, -1.02777099609375, -0.970947265625, -0.91412353515625, -0.8572998046875, -0.80047607421875, -0.74365234375, -0.68682861328125, -0.6300048828125, -0.57318115234375, -0.516357421875, -0.45953369140625, -0.4027099609375, -0.34588623046875, -0.2890625, -0.23223876953125, -0.1754150390625, -0.11859130859375, -0.061767578125, -0.00494384765625, 0.0518798828125, 0.10870361328125, 0.16552734375, 0.22235107421875, 0.2791748046875, 0.33599853515625, 0.392822265625, 0.44964599609375, 0.5064697265625, 0.56329345703125, 0.6201171875, 0.67694091796875, 0.7337646484375, 0.79058837890625, 0.847412109375, 0.90423583984375, 0.9610595703125, 1.01788330078125, 1.07470703125, 1.13153076171875, 1.1883544921875, 1.24517822265625, 1.302001953125, 1.35882568359375, 1.4156494140625, 1.47247314453125, 1.529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 6.0, 9.0, 11.0, 7.0, 11.0, 16.0, 16.0, 24.0, 25.0, 25.0, 37.0, 26.0, 49.0, 50.0, 59.0, 56.0, 57.0, 54.0, 63.0, 50.0, 50.0, 52.0, 45.0, 48.0, 27.0, 26.0, 25.0, 13.0, 13.0, 15.0, 5.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.613189697265625, -0.58868408203125, -0.564178466796875, -0.5396728515625, -0.515167236328125, -0.49066162109375, -0.466156005859375, -0.441650390625, -0.417144775390625, -0.39263916015625, -0.368133544921875, -0.3436279296875, -0.319122314453125, -0.29461669921875, -0.270111083984375, -0.24560546875, -0.221099853515625, -0.19659423828125, -0.172088623046875, -0.1475830078125, -0.123077392578125, -0.09857177734375, -0.074066162109375, -0.049560546875, -0.025054931640625, -0.00054931640625, 0.023956298828125, 0.0484619140625, 0.072967529296875, 0.09747314453125, 0.121978759765625, 0.146484375, 0.170989990234375, 0.19549560546875, 0.220001220703125, 0.2445068359375, 0.269012451171875, 0.29351806640625, 0.318023681640625, 0.342529296875, 0.367034912109375, 0.39154052734375, 0.416046142578125, 0.4405517578125, 0.465057373046875, 0.48956298828125, 0.514068603515625, 0.53857421875, 0.563079833984375, 0.58758544921875, 0.612091064453125, 0.6365966796875, 0.661102294921875, 0.68560791015625, 0.710113525390625, 0.734619140625, 0.759124755859375, 0.78363037109375, 0.808135986328125, 0.8326416015625, 0.857147216796875, 0.88165283203125, 0.906158447265625, 0.9306640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 10.0, 8.0, 11.0, 23.0, 25.0, 49.0, 77.0, 109.0, 159.0, 272.0, 485.0, 915.0, 2233.0, 7710.0, 38747.0, 514684.0, 3425594.0, 170953.0, 23130.0, 5449.0, 1862.0, 752.0, 430.0, 249.0, 142.0, 79.0, 62.0, 23.0, 16.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.552734375, -2.4843292236328125, -2.415924072265625, -2.3475189208984375, -2.27911376953125, -2.2107086181640625, -2.142303466796875, -2.0738983154296875, -2.0054931640625, -1.9370880126953125, -1.868682861328125, -1.8002777099609375, -1.73187255859375, -1.6634674072265625, -1.595062255859375, -1.5266571044921875, -1.458251953125, -1.3898468017578125, -1.321441650390625, -1.2530364990234375, -1.18463134765625, -1.1162261962890625, -1.047821044921875, -0.9794158935546875, -0.9110107421875, -0.8426055908203125, -0.774200439453125, -0.7057952880859375, -0.63739013671875, -0.5689849853515625, -0.500579833984375, -0.4321746826171875, -0.36376953125, -0.2953643798828125, -0.226959228515625, -0.1585540771484375, -0.09014892578125, -0.0217437744140625, 0.046661376953125, 0.1150665283203125, 0.1834716796875, 0.2518768310546875, 0.320281982421875, 0.3886871337890625, 0.45709228515625, 0.5254974365234375, 0.593902587890625, 0.6623077392578125, 0.730712890625, 0.7991180419921875, 0.867523193359375, 0.9359283447265625, 1.00433349609375, 1.0727386474609375, 1.141143798828125, 1.2095489501953125, 1.2779541015625, 1.3463592529296875, 1.414764404296875, 1.4831695556640625, 1.55157470703125, 1.6199798583984375, 1.688385009765625, 1.7567901611328125, 1.8251953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 9.0, 31.0, 75.0, 165.0, 483.0, 1339.0, 1154.0, 429.0, 182.0, 77.0, 40.0, 30.0, 18.0, 11.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1341552734375, -4.022216796875, -3.9102783203125, -3.79833984375, -3.6864013671875, -3.574462890625, -3.4625244140625, -3.3505859375, -3.2386474609375, -3.126708984375, -3.0147705078125, -2.90283203125, -2.7908935546875, -2.678955078125, -2.5670166015625, -2.455078125, -2.3431396484375, -2.231201171875, -2.1192626953125, -2.00732421875, -1.8953857421875, -1.783447265625, -1.6715087890625, -1.5595703125, -1.4476318359375, -1.335693359375, -1.2237548828125, -1.11181640625, -0.9998779296875, -0.887939453125, -0.7760009765625, -0.6640625, -0.5521240234375, -0.440185546875, -0.3282470703125, -0.21630859375, -0.1043701171875, 0.007568359375, 0.1195068359375, 0.2314453125, 0.3433837890625, 0.455322265625, 0.5672607421875, 0.67919921875, 0.7911376953125, 0.903076171875, 1.0150146484375, 1.126953125, 1.2388916015625, 1.350830078125, 1.4627685546875, 1.57470703125, 1.6866455078125, 1.798583984375, 1.9105224609375, 2.0224609375, 2.1343994140625, 2.246337890625, 2.3582763671875, 2.47021484375, 2.5821533203125, 2.694091796875, 2.8060302734375, 2.91796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 13.0, 34.0, 104.0, 207.0, 309.0, 192.0, 67.0, 25.0, 14.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.147830963134766, -20.235191345214844, -19.322551727294922, -18.409912109375, -17.497272491455078, -16.584632873535156, -15.671993255615234, -14.759353637695312, -13.84671401977539, -12.934074401855469, -12.021434783935547, -11.108795166015625, -10.196155548095703, -9.283515930175781, -8.37087631225586, -7.458237171173096, -6.545598030090332, -5.63295841217041, -4.720318794250488, -3.8076794147491455, -2.8950397968292236, -1.9824004173278809, -1.069760799407959, -0.1571211814880371, 0.7555184364318848, 1.6681580543518066, 2.5807976722717285, 3.4934370517730713, 4.406076431274414, 5.318716049194336, 6.231355667114258, 7.14399528503418, 8.056634902954102, 8.969274520874023, 9.881914138793945, 10.794553756713867, 11.707193374633789, 12.619832992553711, 13.532472610473633, 14.445112228393555, 15.357751846313477, 16.2703914642334, 17.18303108215332, 18.095670700073242, 19.008310317993164, 19.920949935913086, 20.833589553833008, 21.74622917175293, 22.65886688232422, 23.57150650024414, 24.484146118164062, 25.396785736083984, 26.309425354003906, 27.222064971923828, 28.13470458984375, 29.047344207763672, 29.959983825683594, 30.872623443603516, 31.785263061523438, 32.69790267944336, 33.61054229736328, 34.5231819152832, 35.435821533203125, 36.34846115112305, 37.26110076904297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 27.0, 37.0, 62.0, 81.0, 88.0, 105.0, 114.0, 94.0, 106.0, 75.0, 55.0, 53.0, 42.0, 22.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.85193634033203, -26.208160400390625, -25.564382553100586, -24.920604705810547, -24.27682876586914, -23.633052825927734, -22.989274978637695, -22.345497131347656, -21.70172119140625, -21.057945251464844, -20.414167404174805, -19.770389556884766, -19.12661361694336, -18.482837677001953, -17.839059829711914, -17.195281982421875, -16.55150604248047, -15.907729148864746, -15.263952255249023, -14.6201753616333, -13.976398468017578, -13.332621574401855, -12.688844680786133, -12.04506778717041, -11.401290893554688, -10.757513999938965, -10.113737106323242, -9.46996021270752, -8.826183319091797, -8.182406425476074, -7.538629531860352, -6.894852638244629, -6.251073837280273, -5.607296943664551, -4.963520050048828, -4.3197431564331055, -3.675966262817383, -3.03218936920166, -2.3884124755859375, -1.7446355819702148, -1.1008586883544922, -0.45708179473876953, 0.18669509887695312, 0.8304719924926758, 1.4742488861083984, 2.118025779724121, 2.7618026733398438, 3.4055795669555664, 4.049356460571289, 4.693133354187012, 5.336910247802734, 5.980687141418457, 6.62446403503418, 7.268240928649902, 7.912017822265625, 8.555794715881348, 9.19957160949707, 9.843348503112793, 10.487125396728516, 11.130902290344238, 11.774679183959961, 12.418456077575684, 13.062232971191406, 13.706009864807129, 14.349786758422852]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 11.0, 13.0, 11.0, 29.0, 24.0, 44.0, 46.0, 68.0, 101.0, 162.0, 277.0, 394.0, 772.0, 1319.0, 2748.0, 5870.0, 14332.0, 39033.0, 116296.0, 370094.0, 335377.0, 102836.0, 34694.0, 12976.0, 5452.0, 2527.0, 1322.0, 699.0, 328.0, 203.0, 143.0, 94.0, 59.0, 56.0, 31.0, 20.0, 17.0, 15.0, 13.0, 11.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7041015625, -1.6507568359375, -1.597412109375, -1.5440673828125, -1.49072265625, -1.4373779296875, -1.384033203125, -1.3306884765625, -1.27734375, -1.2239990234375, -1.170654296875, -1.1173095703125, -1.06396484375, -1.0106201171875, -0.957275390625, -0.9039306640625, -0.8505859375, -0.7972412109375, -0.743896484375, -0.6905517578125, -0.63720703125, -0.5838623046875, -0.530517578125, -0.4771728515625, -0.423828125, -0.3704833984375, -0.317138671875, -0.2637939453125, -0.21044921875, -0.1571044921875, -0.103759765625, -0.0504150390625, 0.0029296875, 0.0562744140625, 0.109619140625, 0.1629638671875, 0.21630859375, 0.2696533203125, 0.322998046875, 0.3763427734375, 0.4296875, 0.4830322265625, 0.536376953125, 0.5897216796875, 0.64306640625, 0.6964111328125, 0.749755859375, 0.8031005859375, 0.8564453125, 0.9097900390625, 0.963134765625, 1.0164794921875, 1.06982421875, 1.1231689453125, 1.176513671875, 1.2298583984375, 1.283203125, 1.3365478515625, 1.389892578125, 1.4432373046875, 1.49658203125, 1.5499267578125, 1.603271484375, 1.6566162109375, 1.7099609375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 4.0, 12.0, 7.0, 5.0, 16.0, 13.0, 22.0, 24.0, 25.0, 34.0, 21.0, 32.0, 38.0, 49.0, 44.0, 45.0, 45.0, 47.0, 38.0, 43.0, 45.0, 53.0, 42.0, 27.0, 43.0, 27.0, 34.0, 30.0, 24.0, 21.0, 15.0, 16.0, 10.0, 13.0, 5.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6650390625, -0.6449203491210938, -0.6248016357421875, -0.6046829223632812, -0.584564208984375, -0.5644454956054688, -0.5443267822265625, -0.5242080688476562, -0.50408935546875, -0.48397064208984375, -0.4638519287109375, -0.44373321533203125, -0.423614501953125, -0.40349578857421875, -0.3833770751953125, -0.36325836181640625, -0.3431396484375, -0.32302093505859375, -0.3029022216796875, -0.28278350830078125, -0.262664794921875, -0.24254608154296875, -0.2224273681640625, -0.20230865478515625, -0.18218994140625, -0.16207122802734375, -0.1419525146484375, -0.12183380126953125, -0.101715087890625, -0.08159637451171875, -0.0614776611328125, -0.04135894775390625, -0.021240234375, -0.00112152099609375, 0.0189971923828125, 0.03911590576171875, 0.059234619140625, 0.07935333251953125, 0.0994720458984375, 0.11959075927734375, 0.13970947265625, 0.15982818603515625, 0.1799468994140625, 0.20006561279296875, 0.220184326171875, 0.24030303955078125, 0.2604217529296875, 0.28054046630859375, 0.3006591796875, 0.32077789306640625, 0.3408966064453125, 0.36101531982421875, 0.381134033203125, 0.40125274658203125, 0.4213714599609375, 0.44149017333984375, 0.46160888671875, 0.48172760009765625, 0.5018463134765625, 0.5219650268554688, 0.542083740234375, 0.5622024536132812, 0.5823211669921875, 0.6024398803710938, 0.62255859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 12.0, 23.0, 21.0, 63.0, 109.0, 248.0, 523.0, 1531.0, 6490.0, 171642.0, 847223.0, 16910.0, 2284.0, 759.0, 352.0, 151.0, 72.0, 44.0, 34.0, 14.0, 15.0, 6.0, 7.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.8812255859375, -5.672607421875, -5.4639892578125, -5.25537109375, -5.0467529296875, -4.838134765625, -4.6295166015625, -4.4208984375, -4.2122802734375, -4.003662109375, -3.7950439453125, -3.58642578125, -3.3778076171875, -3.169189453125, -2.9605712890625, -2.751953125, -2.5433349609375, -2.334716796875, -2.1260986328125, -1.91748046875, -1.7088623046875, -1.500244140625, -1.2916259765625, -1.0830078125, -0.8743896484375, -0.665771484375, -0.4571533203125, -0.24853515625, -0.0399169921875, 0.168701171875, 0.3773193359375, 0.5859375, 0.7945556640625, 1.003173828125, 1.2117919921875, 1.42041015625, 1.6290283203125, 1.837646484375, 2.0462646484375, 2.2548828125, 2.4635009765625, 2.672119140625, 2.8807373046875, 3.08935546875, 3.2979736328125, 3.506591796875, 3.7152099609375, 3.923828125, 4.1324462890625, 4.341064453125, 4.5496826171875, 4.75830078125, 4.9669189453125, 5.175537109375, 5.3841552734375, 5.5927734375, 5.8013916015625, 6.010009765625, 6.2186279296875, 6.42724609375, 6.6358642578125, 6.844482421875, 7.0531005859375, 7.26171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 9.0, 9.0, 13.0, 11.0, 15.0, 16.0, 21.0, 20.0, 31.0, 30.0, 31.0, 44.0, 49.0, 59.0, 41.0, 48.0, 53.0, 43.0, 50.0, 42.0, 53.0, 37.0, 39.0, 40.0, 24.0, 31.0, 22.0, 20.0, 9.0, 11.0, 7.0, 16.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.52288818359375, -2.4442138671875, -2.36553955078125, -2.286865234375, -2.20819091796875, -2.1295166015625, -2.05084228515625, -1.97216796875, -1.89349365234375, -1.8148193359375, -1.73614501953125, -1.657470703125, -1.57879638671875, -1.5001220703125, -1.42144775390625, -1.3427734375, -1.26409912109375, -1.1854248046875, -1.10675048828125, -1.028076171875, -0.94940185546875, -0.8707275390625, -0.79205322265625, -0.71337890625, -0.63470458984375, -0.5560302734375, -0.47735595703125, -0.398681640625, -0.32000732421875, -0.2413330078125, -0.16265869140625, -0.083984375, -0.00531005859375, 0.0733642578125, 0.15203857421875, 0.230712890625, 0.30938720703125, 0.3880615234375, 0.46673583984375, 0.54541015625, 0.62408447265625, 0.7027587890625, 0.78143310546875, 0.860107421875, 0.93878173828125, 1.0174560546875, 1.09613037109375, 1.1748046875, 1.25347900390625, 1.3321533203125, 1.41082763671875, 1.489501953125, 1.56817626953125, 1.6468505859375, 1.72552490234375, 1.80419921875, 1.88287353515625, 1.9615478515625, 2.04022216796875, 2.118896484375, 2.19757080078125, 2.2762451171875, 2.35491943359375, 2.43359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 6.0, 11.0, 11.0, 9.0, 22.0, 25.0, 37.0, 57.0, 88.0, 158.0, 455.0, 1713.0, 17066.0, 877163.0, 144508.0, 5616.0, 874.0, 281.0, 143.0, 74.0, 50.0, 35.0, 28.0, 22.0, 10.0, 18.0, 9.0, 8.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.34375, -2.274383544921875, -2.20501708984375, -2.135650634765625, -2.0662841796875, -1.996917724609375, -1.92755126953125, -1.858184814453125, -1.788818359375, -1.719451904296875, -1.65008544921875, -1.580718994140625, -1.5113525390625, -1.441986083984375, -1.37261962890625, -1.303253173828125, -1.23388671875, -1.164520263671875, -1.09515380859375, -1.025787353515625, -0.9564208984375, -0.887054443359375, -0.81768798828125, -0.748321533203125, -0.678955078125, -0.609588623046875, -0.54022216796875, -0.470855712890625, -0.4014892578125, -0.332122802734375, -0.26275634765625, -0.193389892578125, -0.1240234375, -0.054656982421875, 0.01470947265625, 0.084075927734375, 0.1534423828125, 0.222808837890625, 0.29217529296875, 0.361541748046875, 0.430908203125, 0.500274658203125, 0.56964111328125, 0.639007568359375, 0.7083740234375, 0.777740478515625, 0.84710693359375, 0.916473388671875, 0.98583984375, 1.055206298828125, 1.12457275390625, 1.193939208984375, 1.2633056640625, 1.332672119140625, 1.40203857421875, 1.471405029296875, 1.540771484375, 1.610137939453125, 1.67950439453125, 1.748870849609375, 1.8182373046875, 1.887603759765625, 1.95697021484375, 2.026336669921875, 2.095703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 2.0, 9.0, 5.0, 2.0, 9.0, 7.0, 10.0, 9.0, 19.0, 30.0, 29.0, 34.0, 51.0, 66.0, 89.0, 109.0, 117.0, 109.0, 72.0, 40.0, 29.0, 30.0, 14.0, 20.0, 14.0, 17.0, 15.0, 11.0, 9.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016951560974121094, -0.00016369298100471497, -0.000157870352268219, -0.00015204772353172302, -0.00014622509479522705, -0.00014040246605873108, -0.0001345798373222351, -0.00012875720858573914, -0.00012293457984924316, -0.00011711195111274719, -0.00011128932237625122, -0.00010546669363975525, -9.964406490325928e-05, -9.38214361667633e-05, -8.799880743026733e-05, -8.217617869377136e-05, -7.635354995727539e-05, -7.053092122077942e-05, -6.470829248428345e-05, -5.8885663747787476e-05, -5.3063035011291504e-05, -4.724040627479553e-05, -4.141777753829956e-05, -3.559514880180359e-05, -2.9772520065307617e-05, -2.3949891328811646e-05, -1.8127262592315674e-05, -1.2304633855819702e-05, -6.4820051193237305e-06, -6.593763828277588e-07, 5.163252353668213e-06, 1.0985881090164185e-05, 1.6808509826660156e-05, 2.2631138563156128e-05, 2.84537672996521e-05, 3.427639603614807e-05, 4.009902477264404e-05, 4.5921653509140015e-05, 5.1744282245635986e-05, 5.756691098213196e-05, 6.338953971862793e-05, 6.92121684551239e-05, 7.503479719161987e-05, 8.085742592811584e-05, 8.668005466461182e-05, 9.250268340110779e-05, 9.832531213760376e-05, 0.00010414794087409973, 0.0001099705696105957, 0.00011579319834709167, 0.00012161582708358765, 0.00012743845582008362, 0.0001332610845565796, 0.00013908371329307556, 0.00014490634202957153, 0.0001507289707660675, 0.00015655159950256348, 0.00016237422823905945, 0.00016819685697555542, 0.0001740194857120514, 0.00017984211444854736, 0.00018566474318504333, 0.0001914873719215393, 0.00019731000065803528, 0.00020313262939453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 11.0, 9.0, 12.0, 15.0, 34.0, 41.0, 52.0, 101.0, 146.0, 217.0, 401.0, 732.0, 1939.0, 6212.0, 33971.0, 589893.0, 376174.0, 29410.0, 5667.0, 1790.0, 741.0, 384.0, 215.0, 99.0, 88.0, 61.0, 45.0, 22.0, 13.0, 20.0, 13.0, 8.0, 2.0, 4.0, 4.0, 2.0, 5.0], "bins": [-1.546875, -1.5108718872070312, -1.4748687744140625, -1.4388656616210938, -1.402862548828125, -1.3668594360351562, -1.3308563232421875, -1.2948532104492188, -1.25885009765625, -1.2228469848632812, -1.1868438720703125, -1.1508407592773438, -1.114837646484375, -1.0788345336914062, -1.0428314208984375, -1.0068283081054688, -0.9708251953125, -0.9348220825195312, -0.8988189697265625, -0.8628158569335938, -0.826812744140625, -0.7908096313476562, -0.7548065185546875, -0.7188034057617188, -0.68280029296875, -0.6467971801757812, -0.6107940673828125, -0.5747909545898438, -0.538787841796875, -0.5027847290039062, -0.4667816162109375, -0.43077850341796875, -0.394775390625, -0.35877227783203125, -0.3227691650390625, -0.28676605224609375, -0.250762939453125, -0.21475982666015625, -0.1787567138671875, -0.14275360107421875, -0.10675048828125, -0.07074737548828125, -0.0347442626953125, 0.00125885009765625, 0.037261962890625, 0.07326507568359375, 0.1092681884765625, 0.14527130126953125, 0.1812744140625, 0.21727752685546875, 0.2532806396484375, 0.28928375244140625, 0.325286865234375, 0.36128997802734375, 0.3972930908203125, 0.43329620361328125, 0.46929931640625, 0.5053024291992188, 0.5413055419921875, 0.5773086547851562, 0.613311767578125, 0.6493148803710938, 0.6853179931640625, 0.7213211059570312, 0.75732421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 13.0, 19.0, 28.0, 30.0, 32.0, 65.0, 108.0, 125.0, 127.0, 127.0, 70.0, 59.0, 43.0, 24.0, 21.0, 16.0, 10.0, 6.0, 16.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.865814208984375, -0.83612060546875, -0.806427001953125, -0.7767333984375, -0.747039794921875, -0.71734619140625, -0.687652587890625, -0.657958984375, -0.628265380859375, -0.59857177734375, -0.568878173828125, -0.5391845703125, -0.509490966796875, -0.47979736328125, -0.450103759765625, -0.42041015625, -0.390716552734375, -0.36102294921875, -0.331329345703125, -0.3016357421875, -0.271942138671875, -0.24224853515625, -0.212554931640625, -0.182861328125, -0.153167724609375, -0.12347412109375, -0.093780517578125, -0.0640869140625, -0.034393310546875, -0.00469970703125, 0.024993896484375, 0.0546875, 0.084381103515625, 0.11407470703125, 0.143768310546875, 0.1734619140625, 0.203155517578125, 0.23284912109375, 0.262542724609375, 0.292236328125, 0.321929931640625, 0.35162353515625, 0.381317138671875, 0.4110107421875, 0.440704345703125, 0.47039794921875, 0.500091552734375, 0.52978515625, 0.559478759765625, 0.58917236328125, 0.618865966796875, 0.6485595703125, 0.678253173828125, 0.70794677734375, 0.737640380859375, 0.767333984375, 0.797027587890625, 0.82672119140625, 0.856414794921875, 0.8861083984375, 0.915802001953125, 0.94549560546875, 0.975189208984375, 1.0048828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 24.0, 37.0, 140.0, 422.0, 234.0, 88.0, 28.0, 12.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.05577850341797, -51.840389251708984, -50.624996185302734, -49.40960693359375, -48.194217681884766, -46.97882843017578, -45.76343536376953, -44.54804611206055, -43.33265686035156, -42.11726760864258, -40.90187454223633, -39.686485290527344, -38.47109603881836, -37.255706787109375, -36.040313720703125, -34.82492446899414, -33.60953140258789, -32.394142150878906, -31.17875099182129, -29.963359832763672, -28.747970581054688, -27.53257942199707, -26.317188262939453, -25.10179901123047, -23.88640785217285, -22.671016693115234, -21.45562744140625, -20.240236282348633, -19.024845123291016, -17.80945587158203, -16.594064712524414, -15.378674507141113, -14.163284301757812, -12.947894096374512, -11.732503890991211, -10.517112731933594, -9.301722526550293, -8.086332321166992, -6.870941638946533, -5.655550956726074, -4.440160751342773, -3.2247703075408936, -2.0093798637390137, -0.7939894199371338, 0.4214010238647461, 1.6367912292480469, 2.852181911468506, 4.067572593688965, 5.282962799072266, 6.498353004455566, 7.713743686676025, 8.929134368896484, 10.144524574279785, 11.359914779663086, 12.575305938720703, 13.790696144104004, 15.006086349487305, 16.221477508544922, 17.436866760253906, 18.652257919311523, 19.86764907836914, 21.083038330078125, 22.298429489135742, 23.51382064819336, 24.729209899902344]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 23.0, 13.0, 15.0, 18.0, 28.0, 26.0, 31.0, 35.0, 37.0, 36.0, 44.0, 62.0, 81.0, 80.0, 56.0, 43.0, 49.0, 43.0, 26.0, 46.0, 25.0, 21.0, 14.0, 26.0, 14.0, 19.0, 8.0, 10.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.179211616516113, -9.824738502502441, -9.470264434814453, -9.115791320800781, -8.76131820678711, -8.406845092773438, -8.052371978759766, -7.697897911071777, -7.3434247970581055, -6.988951683044434, -6.6344780921936035, -6.280004501342773, -5.925531387329102, -5.57105827331543, -5.2165846824646, -4.8621110916137695, -4.507637977600098, -4.153164863586426, -3.7986912727355957, -3.4442179203033447, -3.0897445678710938, -2.7352712154388428, -2.380797863006592, -2.026324510574341, -1.6718511581420898, -1.3173778057098389, -0.9629044532775879, -0.6084311008453369, -0.25395774841308594, 0.10051560401916504, 0.454988956451416, 0.809462308883667, 1.1639366149902344, 1.5184099674224854, 1.8728833198547363, 2.2273566722869873, 2.5818300247192383, 2.9363033771514893, 3.2907767295837402, 3.645250082015991, 3.999723434448242, 4.354196548461914, 4.708670139312744, 5.063143730163574, 5.417616844177246, 5.772089958190918, 6.126563549041748, 6.481037139892578, 6.83551025390625, 7.189983367919922, 7.544456958770752, 7.898930549621582, 8.253403663635254, 8.607876777648926, 8.962350845336914, 9.316823959350586, 9.671297073364258, 10.02577018737793, 10.380243301391602, 10.73471736907959, 11.089190483093262, 11.443663597106934, 11.798137664794922, 12.152610778808594, 12.507083892822266]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 9.0, 5.0, 19.0, 27.0, 39.0, 84.0, 145.0, 294.0, 683.0, 1966.0, 7566.0, 53210.0, 2759006.0, 1327172.0, 35197.0, 6028.0, 1722.0, 587.0, 229.0, 117.0, 60.0, 43.0, 24.0, 17.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.056640625, -2.98370361328125, -2.9107666015625, -2.83782958984375, -2.764892578125, -2.69195556640625, -2.6190185546875, -2.54608154296875, -2.47314453125, -2.40020751953125, -2.3272705078125, -2.25433349609375, -2.181396484375, -2.10845947265625, -2.0355224609375, -1.96258544921875, -1.8896484375, -1.81671142578125, -1.7437744140625, -1.67083740234375, -1.597900390625, -1.52496337890625, -1.4520263671875, -1.37908935546875, -1.30615234375, -1.23321533203125, -1.1602783203125, -1.08734130859375, -1.014404296875, -0.94146728515625, -0.8685302734375, -0.79559326171875, -0.72265625, -0.64971923828125, -0.5767822265625, -0.50384521484375, -0.430908203125, -0.35797119140625, -0.2850341796875, -0.21209716796875, -0.13916015625, -0.06622314453125, 0.0067138671875, 0.07965087890625, 0.152587890625, 0.22552490234375, 0.2984619140625, 0.37139892578125, 0.4443359375, 0.51727294921875, 0.5902099609375, 0.66314697265625, 0.736083984375, 0.80902099609375, 0.8819580078125, 0.95489501953125, 1.02783203125, 1.10076904296875, 1.1737060546875, 1.24664306640625, 1.319580078125, 1.39251708984375, 1.4654541015625, 1.53839111328125, 1.611328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 13.0, 18.0, 20.0, 21.0, 26.0, 35.0, 51.0, 52.0, 62.0, 65.0, 65.0, 72.0, 62.0, 76.0, 70.0, 63.0, 50.0, 40.0, 39.0, 30.0, 19.0, 15.0, 17.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9130859375, -0.8834609985351562, -0.8538360595703125, -0.8242111206054688, -0.794586181640625, -0.7649612426757812, -0.7353363037109375, -0.7057113647460938, -0.67608642578125, -0.6464614868164062, -0.6168365478515625, -0.5872116088867188, -0.557586669921875, -0.5279617309570312, -0.4983367919921875, -0.46871185302734375, -0.4390869140625, -0.40946197509765625, -0.3798370361328125, -0.35021209716796875, -0.320587158203125, -0.29096221923828125, -0.2613372802734375, -0.23171234130859375, -0.20208740234375, -0.17246246337890625, -0.1428375244140625, -0.11321258544921875, -0.083587646484375, -0.05396270751953125, -0.0243377685546875, 0.00528717041015625, 0.034912109375, 0.06453704833984375, 0.0941619873046875, 0.12378692626953125, 0.153411865234375, 0.18303680419921875, 0.2126617431640625, 0.24228668212890625, 0.27191162109375, 0.30153656005859375, 0.3311614990234375, 0.36078643798828125, 0.390411376953125, 0.42003631591796875, 0.4496612548828125, 0.47928619384765625, 0.5089111328125, 0.5385360717773438, 0.5681610107421875, 0.5977859497070312, 0.627410888671875, 0.6570358276367188, 0.6866607666015625, 0.7162857055664062, 0.74591064453125, 0.7755355834960938, 0.8051605224609375, 0.8347854614257812, 0.864410400390625, 0.8940353393554688, 0.9236602783203125, 0.9532852172851562, 0.98291015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 31.0, 50.0, 72.0, 123.0, 187.0, 394.0, 944.0, 2475.0, 10631.0, 128377.0, 3910957.0, 125088.0, 10239.0, 2599.0, 1032.0, 498.0, 248.0, 120.0, 76.0, 34.0, 28.0, 15.0, 12.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.09698486328125, -2.9986572265625, -2.90032958984375, -2.802001953125, -2.70367431640625, -2.6053466796875, -2.50701904296875, -2.40869140625, -2.31036376953125, -2.2120361328125, -2.11370849609375, -2.015380859375, -1.91705322265625, -1.8187255859375, -1.72039794921875, -1.6220703125, -1.52374267578125, -1.4254150390625, -1.32708740234375, -1.228759765625, -1.13043212890625, -1.0321044921875, -0.93377685546875, -0.83544921875, -0.73712158203125, -0.6387939453125, -0.54046630859375, -0.442138671875, -0.34381103515625, -0.2454833984375, -0.14715576171875, -0.048828125, 0.04949951171875, 0.1478271484375, 0.24615478515625, 0.344482421875, 0.44281005859375, 0.5411376953125, 0.63946533203125, 0.73779296875, 0.83612060546875, 0.9344482421875, 1.03277587890625, 1.131103515625, 1.22943115234375, 1.3277587890625, 1.42608642578125, 1.5244140625, 1.62274169921875, 1.7210693359375, 1.81939697265625, 1.917724609375, 2.01605224609375, 2.1143798828125, 2.21270751953125, 2.31103515625, 2.40936279296875, 2.5076904296875, 2.60601806640625, 2.704345703125, 2.80267333984375, 2.9010009765625, 2.99932861328125, 3.09765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 3.0, 17.0, 26.0, 40.0, 132.0, 447.0, 1507.0, 1384.0, 315.0, 110.0, 42.0, 27.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.033721923828125, -3.90728759765625, -3.780853271484375, -3.6544189453125, -3.527984619140625, -3.40155029296875, -3.275115966796875, -3.148681640625, -3.022247314453125, -2.89581298828125, -2.769378662109375, -2.6429443359375, -2.516510009765625, -2.39007568359375, -2.263641357421875, -2.13720703125, -2.010772705078125, -1.88433837890625, -1.757904052734375, -1.6314697265625, -1.505035400390625, -1.37860107421875, -1.252166748046875, -1.125732421875, -0.999298095703125, -0.87286376953125, -0.746429443359375, -0.6199951171875, -0.493560791015625, -0.36712646484375, -0.240692138671875, -0.1142578125, 0.012176513671875, 0.13861083984375, 0.265045166015625, 0.3914794921875, 0.517913818359375, 0.64434814453125, 0.770782470703125, 0.897216796875, 1.023651123046875, 1.15008544921875, 1.276519775390625, 1.4029541015625, 1.529388427734375, 1.65582275390625, 1.782257080078125, 1.90869140625, 2.035125732421875, 2.16156005859375, 2.287994384765625, 2.4144287109375, 2.540863037109375, 2.66729736328125, 2.793731689453125, 2.920166015625, 3.046600341796875, 3.17303466796875, 3.299468994140625, 3.4259033203125, 3.552337646484375, 3.67877197265625, 3.805206298828125, 3.931640625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 10.0, 10.0, 20.0, 59.0, 162.0, 261.0, 221.0, 148.0, 54.0, 25.0, 5.0, 7.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.847034454345703, -21.13936996459961, -20.431703567504883, -19.72403907775879, -19.016374588012695, -18.30870819091797, -17.601043701171875, -16.89337921142578, -16.185712814331055, -15.478047370910645, -14.77038288116455, -14.06271743774414, -13.35505199432373, -12.64738655090332, -11.939722061157227, -11.232056617736816, -10.524392127990723, -9.816726684570312, -9.109062194824219, -8.401396751403809, -7.693731307983398, -6.9860663414001465, -6.2784013748168945, -5.570735931396484, -4.863070964813232, -4.1554059982299805, -3.4477405548095703, -2.7400755882263184, -2.0324103832244873, -1.3247451782226562, -0.6170802116394043, 0.09058523178100586, 0.7982501983642578, 1.5059154033660889, 2.21358060836792, 2.921245574951172, 3.628910779953003, 4.336575984954834, 5.044240951538086, 5.751906394958496, 6.459571361541748, 7.167236328125, 7.87490177154541, 8.58256721496582, 9.290231704711914, 9.997897148132324, 10.705562591552734, 11.413227081298828, 12.120892524719238, 12.828557968139648, 13.536222457885742, 14.243887901306152, 14.951553344726562, 15.659217834472656, 16.36688232421875, 17.074548721313477, 17.78221321105957, 18.489877700805664, 19.19754409790039, 19.905208587646484, 20.612873077392578, 21.320539474487305, 22.0282039642334, 22.735870361328125, 23.44353485107422]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 10.0, 25.0, 57.0, 99.0, 156.0, 211.0, 195.0, 121.0, 83.0, 27.0, 11.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.64105796813965, -24.809375762939453, -23.977691650390625, -23.146007537841797, -22.3143253326416, -21.482643127441406, -20.650959014892578, -19.81927490234375, -18.987592697143555, -18.15591049194336, -17.32422637939453, -16.492542266845703, -15.660860061645508, -14.829176902770996, -13.997493743896484, -13.165810585021973, -12.334127426147461, -11.50244426727295, -10.670761108398438, -9.839077949523926, -9.007394790649414, -8.175711631774902, -7.344028472900391, -6.512345314025879, -5.680662155151367, -4.8489789962768555, -4.017295837402344, -3.185612678527832, -2.3539295196533203, -1.5222463607788086, -0.6905632019042969, 0.14111995697021484, 0.9728012084960938, 1.8044843673706055, 2.636167526245117, 3.467850685119629, 4.299533843994141, 5.131217002868652, 5.962900161743164, 6.794583320617676, 7.6262664794921875, 8.4579496383667, 9.289632797241211, 10.121315956115723, 10.952999114990234, 11.784682273864746, 12.616365432739258, 13.44804859161377, 14.279731750488281, 15.111414909362793, 15.943098068237305, 16.7747802734375, 17.606464385986328, 18.438148498535156, 19.26983070373535, 20.101512908935547, 20.933197021484375, 21.764881134033203, 22.5965633392334, 23.428245544433594, 24.259929656982422, 25.09161376953125, 25.923295974731445, 26.75497817993164, 27.58666229248047]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 16.0, 23.0, 57.0, 90.0, 151.0, 249.0, 504.0, 1005.0, 2275.0, 6082.0, 20531.0, 95198.0, 439937.0, 379991.0, 75918.0, 17344.0, 5256.0, 2009.0, 866.0, 424.0, 218.0, 125.0, 84.0, 43.0, 30.0, 20.0, 24.0, 14.0, 12.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7566680908203125, -1.695953369140625, -1.6352386474609375, -1.57452392578125, -1.5138092041015625, -1.453094482421875, -1.3923797607421875, -1.3316650390625, -1.2709503173828125, -1.210235595703125, -1.1495208740234375, -1.08880615234375, -1.0280914306640625, -0.967376708984375, -0.9066619873046875, -0.845947265625, -0.7852325439453125, -0.724517822265625, -0.6638031005859375, -0.60308837890625, -0.5423736572265625, -0.481658935546875, -0.4209442138671875, -0.3602294921875, -0.2995147705078125, -0.238800048828125, -0.1780853271484375, -0.11737060546875, -0.0566558837890625, 0.004058837890625, 0.0647735595703125, 0.12548828125, 0.1862030029296875, 0.246917724609375, 0.3076324462890625, 0.36834716796875, 0.4290618896484375, 0.489776611328125, 0.5504913330078125, 0.6112060546875, 0.6719207763671875, 0.732635498046875, 0.7933502197265625, 0.85406494140625, 0.9147796630859375, 0.975494384765625, 1.0362091064453125, 1.096923828125, 1.1576385498046875, 1.218353271484375, 1.2790679931640625, 1.33978271484375, 1.4004974365234375, 1.461212158203125, 1.5219268798828125, 1.5826416015625, 1.6433563232421875, 1.704071044921875, 1.7647857666015625, 1.82550048828125, 1.8862152099609375, 1.946929931640625, 2.0076446533203125, 2.068359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 9.0, 11.0, 15.0, 19.0, 28.0, 32.0, 52.0, 40.0, 66.0, 83.0, 62.0, 71.0, 66.0, 68.0, 73.0, 61.0, 47.0, 46.0, 35.0, 37.0, 25.0, 14.0, 10.0, 11.0, 7.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8736343383789062, -0.8424835205078125, -0.8113327026367188, -0.780181884765625, -0.7490310668945312, -0.7178802490234375, -0.6867294311523438, -0.65557861328125, -0.6244277954101562, -0.5932769775390625, -0.5621261596679688, -0.530975341796875, -0.49982452392578125, -0.4686737060546875, -0.43752288818359375, -0.4063720703125, -0.37522125244140625, -0.3440704345703125, -0.31291961669921875, -0.281768798828125, -0.25061798095703125, -0.2194671630859375, -0.18831634521484375, -0.15716552734375, -0.12601470947265625, -0.0948638916015625, -0.06371307373046875, -0.032562255859375, -0.00141143798828125, 0.0297393798828125, 0.06089019775390625, 0.092041015625, 0.12319183349609375, 0.1543426513671875, 0.18549346923828125, 0.216644287109375, 0.24779510498046875, 0.2789459228515625, 0.31009674072265625, 0.34124755859375, 0.37239837646484375, 0.4035491943359375, 0.43470001220703125, 0.465850830078125, 0.49700164794921875, 0.5281524658203125, 0.5593032836914062, 0.5904541015625, 0.6216049194335938, 0.6527557373046875, 0.6839065551757812, 0.715057373046875, 0.7462081909179688, 0.7773590087890625, 0.8085098266601562, 0.83966064453125, 0.8708114624023438, 0.9019622802734375, 0.9331130981445312, 0.964263916015625, 0.9954147338867188, 1.0265655517578125, 1.0577163696289062, 1.0888671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 11.0, 21.0, 35.0, 56.0, 77.0, 158.0, 250.0, 525.0, 1400.0, 4369.0, 18172.0, 115158.0, 696503.0, 177232.0, 25714.0, 5752.0, 1759.0, 646.0, 321.0, 158.0, 72.0, 55.0, 30.0, 24.0, 15.0, 11.0, 8.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.3481597900390625, -2.280303955078125, -2.2124481201171875, -2.14459228515625, -2.0767364501953125, -2.008880615234375, -1.9410247802734375, -1.8731689453125, -1.8053131103515625, -1.737457275390625, -1.6696014404296875, -1.60174560546875, -1.5338897705078125, -1.466033935546875, -1.3981781005859375, -1.330322265625, -1.2624664306640625, -1.194610595703125, -1.1267547607421875, -1.05889892578125, -0.9910430908203125, -0.923187255859375, -0.8553314208984375, -0.7874755859375, -0.7196197509765625, -0.651763916015625, -0.5839080810546875, -0.51605224609375, -0.4481964111328125, -0.380340576171875, -0.3124847412109375, -0.24462890625, -0.1767730712890625, -0.108917236328125, -0.0410614013671875, 0.02679443359375, 0.0946502685546875, 0.162506103515625, 0.2303619384765625, 0.2982177734375, 0.3660736083984375, 0.433929443359375, 0.5017852783203125, 0.56964111328125, 0.6374969482421875, 0.705352783203125, 0.7732086181640625, 0.841064453125, 0.9089202880859375, 0.976776123046875, 1.0446319580078125, 1.11248779296875, 1.1803436279296875, 1.248199462890625, 1.3160552978515625, 1.3839111328125, 1.4517669677734375, 1.519622802734375, 1.5874786376953125, 1.65533447265625, 1.7231903076171875, 1.791046142578125, 1.8589019775390625, 1.9267578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 4.0, 4.0, 5.0, 15.0, 11.0, 16.0, 13.0, 24.0, 20.0, 21.0, 38.0, 26.0, 39.0, 38.0, 40.0, 45.0, 54.0, 46.0, 31.0, 59.0, 46.0, 40.0, 31.0, 34.0, 34.0, 41.0, 27.0, 34.0, 25.0, 18.0, 27.0, 18.0, 12.0, 12.0, 10.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.7483673095703125, -1.683258056640625, -1.6181488037109375, -1.55303955078125, -1.4879302978515625, -1.422821044921875, -1.3577117919921875, -1.2926025390625, -1.2274932861328125, -1.162384033203125, -1.0972747802734375, -1.03216552734375, -0.9670562744140625, -0.901947021484375, -0.8368377685546875, -0.771728515625, -0.7066192626953125, -0.641510009765625, -0.5764007568359375, -0.51129150390625, -0.4461822509765625, -0.381072998046875, -0.3159637451171875, -0.2508544921875, -0.1857452392578125, -0.120635986328125, -0.0555267333984375, 0.00958251953125, 0.0746917724609375, 0.139801025390625, 0.2049102783203125, 0.27001953125, 0.3351287841796875, 0.400238037109375, 0.4653472900390625, 0.53045654296875, 0.5955657958984375, 0.660675048828125, 0.7257843017578125, 0.7908935546875, 0.8560028076171875, 0.921112060546875, 0.9862213134765625, 1.05133056640625, 1.1164398193359375, 1.181549072265625, 1.2466583251953125, 1.311767578125, 1.3768768310546875, 1.441986083984375, 1.5070953369140625, 1.57220458984375, 1.6373138427734375, 1.702423095703125, 1.7675323486328125, 1.8326416015625, 1.8977508544921875, 1.962860107421875, 2.0279693603515625, 2.09307861328125, 2.1581878662109375, 2.223297119140625, 2.2884063720703125, 2.353515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 14.0, 26.0, 41.0, 81.0, 172.0, 412.0, 1257.0, 4931.0, 25772.0, 209615.0, 722728.0, 68804.0, 10936.0, 2438.0, 765.0, 289.0, 127.0, 51.0, 32.0, 19.0, 17.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0227737426757812, -0.9967193603515625, -0.9706649780273438, -0.944610595703125, -0.9185562133789062, -0.8925018310546875, -0.8664474487304688, -0.84039306640625, -0.8143386840820312, -0.7882843017578125, -0.7622299194335938, -0.736175537109375, -0.7101211547851562, -0.6840667724609375, -0.6580123901367188, -0.6319580078125, -0.6059036254882812, -0.5798492431640625, -0.5537948608398438, -0.527740478515625, -0.5016860961914062, -0.4756317138671875, -0.44957733154296875, -0.42352294921875, -0.39746856689453125, -0.3714141845703125, -0.34535980224609375, -0.319305419921875, -0.29325103759765625, -0.2671966552734375, -0.24114227294921875, -0.215087890625, -0.18903350830078125, -0.1629791259765625, -0.13692474365234375, -0.110870361328125, -0.08481597900390625, -0.0587615966796875, -0.03270721435546875, -0.00665283203125, 0.01940155029296875, 0.0454559326171875, 0.07151031494140625, 0.097564697265625, 0.12361907958984375, 0.1496734619140625, 0.17572784423828125, 0.2017822265625, 0.22783660888671875, 0.2538909912109375, 0.27994537353515625, 0.305999755859375, 0.33205413818359375, 0.3581085205078125, 0.38416290283203125, 0.41021728515625, 0.43627166748046875, 0.4623260498046875, 0.48838043212890625, 0.514434814453125, 0.5404891967773438, 0.5665435791015625, 0.5925979614257812, 0.61865234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 4.0, 11.0, 14.0, 21.0, 22.0, 28.0, 32.0, 44.0, 53.0, 73.0, 82.0, 101.0, 101.0, 67.0, 70.0, 67.0, 44.0, 33.0, 24.0, 21.0, 11.0, 5.0, 15.0, 3.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011515617370605469, -0.00011120177805423737, -0.00010724738240242004, -0.00010329298675060272, -9.93385910987854e-05, -9.538419544696808e-05, -9.142979979515076e-05, -8.747540414333344e-05, -8.352100849151611e-05, -7.956661283969879e-05, -7.561221718788147e-05, -7.165782153606415e-05, -6.770342588424683e-05, -6.37490302324295e-05, -5.979463458061218e-05, -5.584023892879486e-05, -5.188584327697754e-05, -4.793144762516022e-05, -4.3977051973342896e-05, -4.0022656321525574e-05, -3.606826066970825e-05, -3.211386501789093e-05, -2.815946936607361e-05, -2.4205073714256287e-05, -2.0250678062438965e-05, -1.6296282410621643e-05, -1.2341886758804321e-05, -8.387491106987e-06, -4.433095455169678e-06, -4.78699803352356e-07, 3.475695848464966e-06, 7.430091500282288e-06, 1.138448715209961e-05, 1.533888280391693e-05, 1.9293278455734253e-05, 2.3247674107551575e-05, 2.7202069759368896e-05, 3.115646541118622e-05, 3.511086106300354e-05, 3.906525671482086e-05, 4.3019652366638184e-05, 4.6974048018455505e-05, 5.092844367027283e-05, 5.488283932209015e-05, 5.883723497390747e-05, 6.279163062572479e-05, 6.674602627754211e-05, 7.070042192935944e-05, 7.465481758117676e-05, 7.860921323299408e-05, 8.25636088848114e-05, 8.651800453662872e-05, 9.047240018844604e-05, 9.442679584026337e-05, 9.838119149208069e-05, 0.00010233558714389801, 0.00010628998279571533, 0.00011024437844753265, 0.00011419877409934998, 0.0001181531697511673, 0.00012210756540298462, 0.00012606196105480194, 0.00013001635670661926, 0.00013397075235843658, 0.0001379251480102539]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 16.0, 24.0, 38.0, 61.0, 90.0, 133.0, 239.0, 402.0, 733.0, 1448.0, 3095.0, 7525.0, 21106.0, 71115.0, 273733.0, 525002.0, 98457.0, 28197.0, 9531.0, 3818.0, 1710.0, 838.0, 461.0, 247.0, 185.0, 100.0, 49.0, 40.0, 26.0, 27.0, 19.0, 8.0, 14.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.47021484375, -0.4546051025390625, -0.438995361328125, -0.4233856201171875, -0.40777587890625, -0.3921661376953125, -0.376556396484375, -0.3609466552734375, -0.3453369140625, -0.3297271728515625, -0.314117431640625, -0.2985076904296875, -0.28289794921875, -0.2672882080078125, -0.251678466796875, -0.2360687255859375, -0.220458984375, -0.2048492431640625, -0.189239501953125, -0.1736297607421875, -0.15802001953125, -0.1424102783203125, -0.126800537109375, -0.1111907958984375, -0.0955810546875, -0.0799713134765625, -0.064361572265625, -0.0487518310546875, -0.03314208984375, -0.0175323486328125, -0.001922607421875, 0.0136871337890625, 0.029296875, 0.0449066162109375, 0.060516357421875, 0.0761260986328125, 0.09173583984375, 0.1073455810546875, 0.122955322265625, 0.1385650634765625, 0.1541748046875, 0.1697845458984375, 0.185394287109375, 0.2010040283203125, 0.21661376953125, 0.2322235107421875, 0.247833251953125, 0.2634429931640625, 0.279052734375, 0.2946624755859375, 0.310272216796875, 0.3258819580078125, 0.34149169921875, 0.3571014404296875, 0.372711181640625, 0.3883209228515625, 0.4039306640625, 0.4195404052734375, 0.435150146484375, 0.4507598876953125, 0.46636962890625, 0.4819793701171875, 0.497589111328125, 0.5131988525390625, 0.52880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 8.0, 1.0, 6.0, 9.0, 16.0, 9.0, 20.0, 16.0, 21.0, 26.0, 42.0, 43.0, 45.0, 67.0, 66.0, 80.0, 75.0, 84.0, 57.0, 55.0, 44.0, 48.0, 29.0, 31.0, 27.0, 14.0, 10.0, 13.0, 9.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4137077331542969, -0.39894866943359375, -0.3841896057128906, -0.3694305419921875, -0.3546714782714844, -0.33991241455078125, -0.3251533508300781, -0.310394287109375, -0.2956352233886719, -0.28087615966796875, -0.2661170959472656, -0.2513580322265625, -0.23659896850585938, -0.22183990478515625, -0.20708084106445312, -0.19232177734375, -0.17756271362304688, -0.16280364990234375, -0.14804458618164062, -0.1332855224609375, -0.11852645874023438, -0.10376739501953125, -0.08900833129882812, -0.074249267578125, -0.059490203857421875, -0.04473114013671875, -0.029972076416015625, -0.0152130126953125, -0.000453948974609375, 0.01430511474609375, 0.029064178466796875, 0.0438232421875, 0.058582305908203125, 0.07334136962890625, 0.08810043334960938, 0.1028594970703125, 0.11761856079101562, 0.13237762451171875, 0.14713668823242188, 0.161895751953125, 0.17665481567382812, 0.19141387939453125, 0.20617294311523438, 0.2209320068359375, 0.23569107055664062, 0.25045013427734375, 0.2652091979980469, 0.27996826171875, 0.2947273254394531, 0.30948638916015625, 0.3242454528808594, 0.3390045166015625, 0.3537635803222656, 0.36852264404296875, 0.3832817077636719, 0.398040771484375, 0.4127998352050781, 0.42755889892578125, 0.4423179626464844, 0.4570770263671875, 0.4718360900878906, 0.48659515380859375, 0.5013542175292969, 0.51611328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 15.0, 43.0, 90.0, 159.0, 347.0, 179.0, 89.0, 31.0, 20.0, 5.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.13393783569336, -22.502058029174805, -21.870176315307617, -21.238296508789062, -20.606414794921875, -19.97453498840332, -19.342655181884766, -18.710773468017578, -18.078893661499023, -17.44701385498047, -16.81513214111328, -16.183252334594727, -15.551371574401855, -14.919490814208984, -14.287610054016113, -13.655729293823242, -13.023848533630371, -12.3919677734375, -11.760087013244629, -11.128206253051758, -10.496326446533203, -9.864445686340332, -9.232564926147461, -8.600685119628906, -7.968803882598877, -7.336923122406006, -6.705042839050293, -6.073162078857422, -5.441281318664551, -4.809401035308838, -4.177520275115967, -3.545639991760254, -2.913759231567383, -2.281878709793091, -1.6499980688095093, -1.0181174278259277, -0.38623690605163574, 0.24564361572265625, 0.8775243759155273, 1.5094046592712402, 2.1412854194641113, 2.7731659412384033, 3.4050464630126953, 4.036927223205566, 4.6688079833984375, 5.30068826675415, 5.9325690269470215, 6.564449310302734, 7.1963300704956055, 7.828210830688477, 8.460091590881348, 9.091972351074219, 9.723852157592773, 10.355732917785645, 10.987613677978516, 11.61949348449707, 12.251375198364258, 12.883255958557129, 13.51513671875, 14.147016525268555, 14.778897285461426, 15.410778045654297, 16.042659759521484, 16.67453956604004, 17.306419372558594]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 14.0, 19.0, 16.0, 14.0, 24.0, 26.0, 44.0, 39.0, 42.0, 48.0, 61.0, 95.0, 99.0, 82.0, 42.0, 43.0, 33.0, 40.0, 30.0, 38.0, 22.0, 20.0, 20.0, 6.0, 10.0, 9.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.887272834777832, -7.574706554412842, -7.262140274047852, -6.949573993682861, -6.637007713317871, -6.324440956115723, -6.011874675750732, -5.699308395385742, -5.386742115020752, -5.074175834655762, -4.7616095542907715, -4.449043273925781, -4.136476516723633, -3.8239104747772217, -3.5113439559936523, -3.198777675628662, -2.886211395263672, -2.5736451148986816, -2.2610788345336914, -1.948512315750122, -1.6359460353851318, -1.3233797550201416, -1.0108133554458618, -0.698246955871582, -0.3856806755065918, -0.07311433553695679, 0.23945200443267822, 0.5520183444023132, 0.8645846843719482, 1.1771509647369385, 1.4897173643112183, 1.802283763885498, 2.114849090576172, 2.427415370941162, 2.7399816513061523, 3.0525481700897217, 3.365114450454712, 3.677680730819702, 3.9902472496032715, 4.302813529968262, 4.615379810333252, 4.927946090698242, 5.240512371063232, 5.553078651428223, 5.865645408630371, 6.178211212158203, 6.490777969360352, 6.803344249725342, 7.115910530090332, 7.428476810455322, 7.7410430908203125, 8.053609848022461, 8.366175651550293, 8.678742408752441, 8.991308212280273, 9.303874969482422, 9.61644172668457, 9.929008483886719, 10.24157428741455, 10.5541410446167, 10.866706848144531, 11.17927360534668, 11.491839408874512, 11.80440616607666, 12.116971969604492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 14.0, 13.0, 16.0, 15.0, 29.0, 47.0, 68.0, 93.0, 167.0, 282.0, 524.0, 1003.0, 2080.0, 4828.0, 12791.0, 49607.0, 419744.0, 2971520.0, 640138.0, 65310.0, 15569.0, 5594.0, 2427.0, 1076.0, 537.0, 307.0, 169.0, 77.0, 70.0, 48.0, 39.0, 17.0, 18.0, 12.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.451171875, -1.4145050048828125, -1.377838134765625, -1.3411712646484375, -1.30450439453125, -1.2678375244140625, -1.231170654296875, -1.1945037841796875, -1.1578369140625, -1.1211700439453125, -1.084503173828125, -1.0478363037109375, -1.01116943359375, -0.9745025634765625, -0.937835693359375, -0.9011688232421875, -0.864501953125, -0.8278350830078125, -0.791168212890625, -0.7545013427734375, -0.71783447265625, -0.6811676025390625, -0.644500732421875, -0.6078338623046875, -0.5711669921875, -0.5345001220703125, -0.497833251953125, -0.4611663818359375, -0.42449951171875, -0.3878326416015625, -0.351165771484375, -0.3144989013671875, -0.27783203125, -0.2411651611328125, -0.204498291015625, -0.1678314208984375, -0.13116455078125, -0.0944976806640625, -0.057830810546875, -0.0211639404296875, 0.0155029296875, 0.0521697998046875, 0.088836669921875, 0.1255035400390625, 0.16217041015625, 0.1988372802734375, 0.235504150390625, 0.2721710205078125, 0.308837890625, 0.3455047607421875, 0.382171630859375, 0.4188385009765625, 0.45550537109375, 0.4921722412109375, 0.528839111328125, 0.5655059814453125, 0.6021728515625, 0.6388397216796875, 0.675506591796875, 0.7121734619140625, 0.74884033203125, 0.7855072021484375, 0.822174072265625, 0.8588409423828125, 0.8955078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 12.0, 15.0, 9.0, 26.0, 37.0, 46.0, 38.0, 42.0, 54.0, 56.0, 70.0, 78.0, 84.0, 69.0, 55.0, 61.0, 43.0, 50.0, 37.0, 25.0, 32.0, 15.0, 10.0, 6.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66552734375, -0.6387405395507812, -0.6119537353515625, -0.5851669311523438, -0.558380126953125, -0.5315933227539062, -0.5048065185546875, -0.47801971435546875, -0.45123291015625, -0.42444610595703125, -0.3976593017578125, -0.37087249755859375, -0.344085693359375, -0.31729888916015625, -0.2905120849609375, -0.26372528076171875, -0.2369384765625, -0.21015167236328125, -0.1833648681640625, -0.15657806396484375, -0.129791259765625, -0.10300445556640625, -0.0762176513671875, -0.04943084716796875, -0.02264404296875, 0.00414276123046875, 0.0309295654296875, 0.05771636962890625, 0.084503173828125, 0.11128997802734375, 0.1380767822265625, 0.16486358642578125, 0.191650390625, 0.21843719482421875, 0.2452239990234375, 0.27201080322265625, 0.298797607421875, 0.32558441162109375, 0.3523712158203125, 0.37915802001953125, 0.40594482421875, 0.43273162841796875, 0.4595184326171875, 0.48630523681640625, 0.513092041015625, 0.5398788452148438, 0.5666656494140625, 0.5934524536132812, 0.6202392578125, 0.6470260620117188, 0.6738128662109375, 0.7005996704101562, 0.727386474609375, 0.7541732788085938, 0.7809600830078125, 0.8077468872070312, 0.83453369140625, 0.8613204956054688, 0.8881072998046875, 0.9148941040039062, 0.941680908203125, 0.9684677124023438, 0.9952545166015625, 1.0220413208007812, 1.048828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 5.0, 7.0, 12.0, 12.0, 26.0, 32.0, 58.0, 87.0, 152.0, 276.0, 639.0, 1455.0, 4727.0, 18066.0, 126112.0, 2971672.0, 997993.0, 56643.0, 10937.0, 3187.0, 1156.0, 455.0, 212.0, 134.0, 82.0, 35.0, 34.0, 11.0, 15.0, 11.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.34722900390625, -1.2969970703125, -1.24676513671875, -1.196533203125, -1.14630126953125, -1.0960693359375, -1.04583740234375, -0.99560546875, -0.94537353515625, -0.8951416015625, -0.84490966796875, -0.794677734375, -0.74444580078125, -0.6942138671875, -0.64398193359375, -0.59375, -0.54351806640625, -0.4932861328125, -0.44305419921875, -0.392822265625, -0.34259033203125, -0.2923583984375, -0.24212646484375, -0.19189453125, -0.14166259765625, -0.0914306640625, -0.04119873046875, 0.009033203125, 0.05926513671875, 0.1094970703125, 0.15972900390625, 0.2099609375, 0.26019287109375, 0.3104248046875, 0.36065673828125, 0.410888671875, 0.46112060546875, 0.5113525390625, 0.56158447265625, 0.61181640625, 0.66204833984375, 0.7122802734375, 0.76251220703125, 0.812744140625, 0.86297607421875, 0.9132080078125, 0.96343994140625, 1.013671875, 1.06390380859375, 1.1141357421875, 1.16436767578125, 1.214599609375, 1.26483154296875, 1.3150634765625, 1.36529541015625, 1.41552734375, 1.46575927734375, 1.5159912109375, 1.56622314453125, 1.616455078125, 1.66668701171875, 1.7169189453125, 1.76715087890625, 1.8173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 7.0, 18.0, 18.0, 26.0, 50.0, 72.0, 113.0, 169.0, 305.0, 504.0, 738.0, 671.0, 499.0, 317.0, 173.0, 109.0, 79.0, 40.0, 48.0, 26.0, 20.0, 6.0, 10.0, 6.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4109954833984375, -1.366912841796875, -1.3228302001953125, -1.27874755859375, -1.2346649169921875, -1.190582275390625, -1.1464996337890625, -1.1024169921875, -1.0583343505859375, -1.014251708984375, -0.9701690673828125, -0.92608642578125, -0.8820037841796875, -0.837921142578125, -0.7938385009765625, -0.749755859375, -0.7056732177734375, -0.661590576171875, -0.6175079345703125, -0.57342529296875, -0.5293426513671875, -0.485260009765625, -0.4411773681640625, -0.3970947265625, -0.3530120849609375, -0.308929443359375, -0.2648468017578125, -0.22076416015625, -0.1766815185546875, -0.132598876953125, -0.0885162353515625, -0.04443359375, -0.0003509521484375, 0.043731689453125, 0.0878143310546875, 0.13189697265625, 0.1759796142578125, 0.220062255859375, 0.2641448974609375, 0.3082275390625, 0.3523101806640625, 0.396392822265625, 0.4404754638671875, 0.48455810546875, 0.5286407470703125, 0.572723388671875, 0.6168060302734375, 0.660888671875, 0.7049713134765625, 0.749053955078125, 0.7931365966796875, 0.83721923828125, 0.8813018798828125, 0.925384521484375, 0.9694671630859375, 1.0135498046875, 1.0576324462890625, 1.101715087890625, 1.1457977294921875, 1.18988037109375, 1.2339630126953125, 1.278045654296875, 1.3221282958984375, 1.3662109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 10.0, 8.0, 10.0, 22.0, 25.0, 51.0, 66.0, 106.0, 150.0, 151.0, 141.0, 102.0, 59.0, 43.0, 22.0, 19.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.021146774291992, -4.669943332672119, -4.318739414215088, -3.967535972595215, -3.616332530975342, -3.2651288509368896, -2.9139251708984375, -2.5627217292785645, -2.2115180492401123, -1.8603144884109497, -1.509110927581787, -1.157907247543335, -0.8067036867141724, -0.45550012588500977, -0.10429644584655762, 0.24690699577331543, 0.5981106758117676, 0.9493142366409302, 1.3005177974700928, 1.651721477508545, 2.002924919128418, 2.35412859916687, 2.7053322792053223, 3.0565357208251953, 3.4077394008636475, 3.7589430809020996, 4.110146522521973, 4.461350440979004, 4.812553882598877, 5.16375732421875, 5.514961242675781, 5.866164207458496, 6.217368125915527, 6.5685715675354, 6.919775485992432, 7.270978927612305, 7.622182369232178, 7.973385810852051, 8.324589729309082, 8.675792694091797, 9.026996612548828, 9.37820053100586, 9.729403495788574, 10.080607414245605, 10.431811332702637, 10.783014297485352, 11.134218215942383, 11.485422134399414, 11.836626052856445, 12.187829971313477, 12.539032936096191, 12.890236854553223, 13.241440773010254, 13.592643737792969, 13.94384765625, 14.295051574707031, 14.646254539489746, 14.997458457946777, 15.348661422729492, 15.699865341186523, 16.051069259643555, 16.402273178100586, 16.753475189208984, 17.104679107666016, 17.455883026123047]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 18.0, 13.0, 20.0, 28.0, 20.0, 31.0, 29.0, 37.0, 34.0, 36.0, 52.0, 35.0, 49.0, 45.0, 33.0, 49.0, 47.0, 34.0, 51.0, 38.0, 34.0, 27.0, 28.0, 30.0, 23.0, 17.0, 19.0, 28.0, 11.0, 10.0, 8.0, 11.0, 5.0, 8.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.5354461669921875, -5.352889060974121, -5.170332431793213, -4.9877753257751465, -4.805218696594238, -4.622661590576172, -4.440104961395264, -4.257547855377197, -4.074991226196289, -3.8924343585968018, -3.7098774909973145, -3.527320623397827, -3.34476375579834, -3.1622068881988525, -2.9796500205993652, -2.797092914581299, -2.6145360469818115, -2.431979179382324, -2.249422311782837, -2.0668654441833496, -1.8843085765838623, -1.701751708984375, -1.5191947221755981, -1.3366378545761108, -1.1540809869766235, -0.9715241193771362, -0.7889672517776489, -0.6064103245735168, -0.42385345697402954, -0.24129658937454224, -0.058739662170410156, 0.12381720542907715, 0.30637407302856445, 0.48893094062805176, 0.6714878082275391, 0.8540447354316711, 1.0366015434265137, 1.219158411026001, 1.4017153978347778, 1.5842722654342651, 1.7668291330337524, 1.9493860006332397, 2.1319429874420166, 2.314499855041504, 2.497056722640991, 2.6796135902404785, 2.862170457839966, 3.044727325439453, 3.2272841930389404, 3.4098410606384277, 3.592397928237915, 3.7749547958374023, 3.9575116634368896, 4.140068531036377, 4.322625637054443, 4.505182266235352, 4.687739372253418, 4.870296478271484, 5.052853107452393, 5.235410213470459, 5.417966842651367, 5.600523948669434, 5.783080577850342, 5.965637683868408, 6.148194313049316]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 8.0, 2.0, 7.0, 7.0, 12.0, 19.0, 36.0, 37.0, 76.0, 89.0, 168.0, 238.0, 384.0, 811.0, 1595.0, 3775.0, 9919.0, 29689.0, 104195.0, 374157.0, 372939.0, 103676.0, 29636.0, 9834.0, 3716.0, 1636.0, 770.0, 413.0, 268.0, 162.0, 86.0, 54.0, 56.0, 20.0, 21.0, 15.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.470703125, -1.428680419921875, -1.38665771484375, -1.344635009765625, -1.3026123046875, -1.260589599609375, -1.21856689453125, -1.176544189453125, -1.134521484375, -1.092498779296875, -1.05047607421875, -1.008453369140625, -0.9664306640625, -0.924407958984375, -0.88238525390625, -0.840362548828125, -0.79833984375, -0.756317138671875, -0.71429443359375, -0.672271728515625, -0.6302490234375, -0.588226318359375, -0.54620361328125, -0.504180908203125, -0.462158203125, -0.420135498046875, -0.37811279296875, -0.336090087890625, -0.2940673828125, -0.252044677734375, -0.21002197265625, -0.167999267578125, -0.1259765625, -0.083953857421875, -0.04193115234375, 9.1552734375e-05, 0.0421142578125, 0.084136962890625, 0.12615966796875, 0.168182373046875, 0.210205078125, 0.252227783203125, 0.29425048828125, 0.336273193359375, 0.3782958984375, 0.420318603515625, 0.46234130859375, 0.504364013671875, 0.54638671875, 0.588409423828125, 0.63043212890625, 0.672454833984375, 0.7144775390625, 0.756500244140625, 0.79852294921875, 0.840545654296875, 0.882568359375, 0.924591064453125, 0.96661376953125, 1.008636474609375, 1.0506591796875, 1.092681884765625, 1.13470458984375, 1.176727294921875, 1.21875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 9.0, 13.0, 24.0, 23.0, 31.0, 39.0, 42.0, 43.0, 46.0, 55.0, 52.0, 70.0, 66.0, 76.0, 58.0, 56.0, 46.0, 56.0, 38.0, 39.0, 42.0, 16.0, 16.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.635040283203125, -0.60797119140625, -0.580902099609375, -0.5538330078125, -0.526763916015625, -0.49969482421875, -0.472625732421875, -0.445556640625, -0.418487548828125, -0.39141845703125, -0.364349365234375, -0.3372802734375, -0.310211181640625, -0.28314208984375, -0.256072998046875, -0.22900390625, -0.201934814453125, -0.17486572265625, -0.147796630859375, -0.1207275390625, -0.093658447265625, -0.06658935546875, -0.039520263671875, -0.012451171875, 0.014617919921875, 0.04168701171875, 0.068756103515625, 0.0958251953125, 0.122894287109375, 0.14996337890625, 0.177032470703125, 0.2041015625, 0.231170654296875, 0.25823974609375, 0.285308837890625, 0.3123779296875, 0.339447021484375, 0.36651611328125, 0.393585205078125, 0.420654296875, 0.447723388671875, 0.47479248046875, 0.501861572265625, 0.5289306640625, 0.555999755859375, 0.58306884765625, 0.610137939453125, 0.63720703125, 0.664276123046875, 0.69134521484375, 0.718414306640625, 0.7454833984375, 0.772552490234375, 0.79962158203125, 0.826690673828125, 0.853759765625, 0.880828857421875, 0.90789794921875, 0.934967041015625, 0.9620361328125, 0.989105224609375, 1.01617431640625, 1.043243408203125, 1.0703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 10.0, 11.0, 13.0, 33.0, 45.0, 47.0, 56.0, 85.0, 134.0, 243.0, 339.0, 701.0, 1339.0, 3667.0, 15877.0, 123012.0, 779121.0, 103363.0, 14015.0, 3479.0, 1282.0, 621.0, 352.0, 217.0, 148.0, 102.0, 65.0, 36.0, 31.0, 31.0, 15.0, 9.0, 12.0, 7.0, 7.0, 2.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.490234375, -2.420013427734375, -2.34979248046875, -2.279571533203125, -2.2093505859375, -2.139129638671875, -2.06890869140625, -1.998687744140625, -1.928466796875, -1.858245849609375, -1.78802490234375, -1.717803955078125, -1.6475830078125, -1.577362060546875, -1.50714111328125, -1.436920166015625, -1.36669921875, -1.296478271484375, -1.22625732421875, -1.156036376953125, -1.0858154296875, -1.015594482421875, -0.94537353515625, -0.875152587890625, -0.804931640625, -0.734710693359375, -0.66448974609375, -0.594268798828125, -0.5240478515625, -0.453826904296875, -0.38360595703125, -0.313385009765625, -0.2431640625, -0.172943115234375, -0.10272216796875, -0.032501220703125, 0.0377197265625, 0.107940673828125, 0.17816162109375, 0.248382568359375, 0.318603515625, 0.388824462890625, 0.45904541015625, 0.529266357421875, 0.5994873046875, 0.669708251953125, 0.73992919921875, 0.810150146484375, 0.88037109375, 0.950592041015625, 1.02081298828125, 1.091033935546875, 1.1612548828125, 1.231475830078125, 1.30169677734375, 1.371917724609375, 1.442138671875, 1.512359619140625, 1.58258056640625, 1.652801513671875, 1.7230224609375, 1.793243408203125, 1.86346435546875, 1.933685302734375, 2.00390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 6.0, 17.0, 16.0, 10.0, 22.0, 30.0, 23.0, 44.0, 50.0, 51.0, 58.0, 44.0, 44.0, 65.0, 41.0, 46.0, 54.0, 39.0, 53.0, 39.0, 40.0, 42.0, 35.0, 19.0, 16.0, 12.0, 14.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.073699951171875, -1.99700927734375, -1.920318603515625, -1.8436279296875, -1.766937255859375, -1.69024658203125, -1.613555908203125, -1.536865234375, -1.460174560546875, -1.38348388671875, -1.306793212890625, -1.2301025390625, -1.153411865234375, -1.07672119140625, -1.000030517578125, -0.92333984375, -0.846649169921875, -0.76995849609375, -0.693267822265625, -0.6165771484375, -0.539886474609375, -0.46319580078125, -0.386505126953125, -0.309814453125, -0.233123779296875, -0.15643310546875, -0.079742431640625, -0.0030517578125, 0.073638916015625, 0.15032958984375, 0.227020263671875, 0.3037109375, 0.380401611328125, 0.45709228515625, 0.533782958984375, 0.6104736328125, 0.687164306640625, 0.76385498046875, 0.840545654296875, 0.917236328125, 0.993927001953125, 1.07061767578125, 1.147308349609375, 1.2239990234375, 1.300689697265625, 1.37738037109375, 1.454071044921875, 1.53076171875, 1.607452392578125, 1.68414306640625, 1.760833740234375, 1.8375244140625, 1.914215087890625, 1.99090576171875, 2.067596435546875, 2.144287109375, 2.220977783203125, 2.29766845703125, 2.374359130859375, 2.4510498046875, 2.527740478515625, 2.60443115234375, 2.681121826171875, 2.7578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 5.0, 6.0, 15.0, 19.0, 37.0, 43.0, 70.0, 81.0, 177.0, 287.0, 608.0, 1373.0, 3649.0, 11727.0, 48927.0, 636260.0, 291193.0, 38495.0, 9940.0, 3062.0, 1280.0, 549.0, 293.0, 172.0, 85.0, 62.0, 39.0, 25.0, 19.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5810546875, -0.5616378784179688, -0.5422210693359375, -0.5228042602539062, -0.503387451171875, -0.48397064208984375, -0.4645538330078125, -0.44513702392578125, -0.42572021484375, -0.40630340576171875, -0.3868865966796875, -0.36746978759765625, -0.348052978515625, -0.32863616943359375, -0.3092193603515625, -0.28980255126953125, -0.2703857421875, -0.25096893310546875, -0.2315521240234375, -0.21213531494140625, -0.192718505859375, -0.17330169677734375, -0.1538848876953125, -0.13446807861328125, -0.11505126953125, -0.09563446044921875, -0.0762176513671875, -0.05680084228515625, -0.037384033203125, -0.01796722412109375, 0.0014495849609375, 0.02086639404296875, 0.040283203125, 0.05970001220703125, 0.0791168212890625, 0.09853363037109375, 0.117950439453125, 0.13736724853515625, 0.1567840576171875, 0.17620086669921875, 0.19561767578125, 0.21503448486328125, 0.2344512939453125, 0.25386810302734375, 0.273284912109375, 0.29270172119140625, 0.3121185302734375, 0.33153533935546875, 0.3509521484375, 0.37036895751953125, 0.3897857666015625, 0.40920257568359375, 0.428619384765625, 0.44803619384765625, 0.4674530029296875, 0.48686981201171875, 0.50628662109375, 0.5257034301757812, 0.5451202392578125, 0.5645370483398438, 0.583953857421875, 0.6033706665039062, 0.6227874755859375, 0.6422042846679688, 0.66162109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 7.0, 9.0, 19.0, 18.0, 22.0, 34.0, 48.0, 54.0, 97.0, 98.0, 116.0, 103.0, 64.0, 51.0, 51.0, 27.0, 15.0, 26.0, 17.0, 15.0, 10.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010734796524047852, -0.00010401848703622818, -0.00010068900883197784, -9.735953062772751e-05, -9.403005242347717e-05, -9.070057421922684e-05, -8.73710960149765e-05, -8.404161781072617e-05, -8.071213960647583e-05, -7.73826614022255e-05, -7.405318319797516e-05, -7.072370499372482e-05, -6.739422678947449e-05, -6.406474858522415e-05, -6.0735270380973816e-05, -5.740579217672348e-05, -5.4076313972473145e-05, -5.074683576822281e-05, -4.741735756397247e-05, -4.408787935972214e-05, -4.07584011554718e-05, -3.7428922951221466e-05, -3.409944474697113e-05, -3.0769966542720795e-05, -2.744048833847046e-05, -2.4111010134220123e-05, -2.0781531929969788e-05, -1.7452053725719452e-05, -1.4122575521469116e-05, -1.079309731721878e-05, -7.463619112968445e-06, -4.134140908718109e-06, -8.046627044677734e-07, 2.5248154997825623e-06, 5.854293704032898e-06, 9.183771908283234e-06, 1.251325011253357e-05, 1.5842728316783905e-05, 1.917220652103424e-05, 2.2501684725284576e-05, 2.5831162929534912e-05, 2.9160641133785248e-05, 3.2490119338035583e-05, 3.581959754228592e-05, 3.9149075746536255e-05, 4.247855395078659e-05, 4.5808032155036926e-05, 4.913751035928726e-05, 5.24669885635376e-05, 5.579646676778793e-05, 5.912594497203827e-05, 6.24554231762886e-05, 6.578490138053894e-05, 6.911437958478928e-05, 7.244385778903961e-05, 7.577333599328995e-05, 7.910281419754028e-05, 8.243229240179062e-05, 8.576177060604095e-05, 8.909124881029129e-05, 9.242072701454163e-05, 9.575020521879196e-05, 9.90796834230423e-05, 0.00010240916162729263, 0.00010573863983154297]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 16.0, 14.0, 38.0, 44.0, 55.0, 95.0, 170.0, 302.0, 524.0, 1305.0, 3948.0, 15899.0, 97910.0, 799065.0, 105554.0, 16860.0, 4104.0, 1360.0, 555.0, 297.0, 151.0, 94.0, 56.0, 45.0, 20.0, 19.0, 10.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.544708251953125, -0.52154541015625, -0.498382568359375, -0.4752197265625, -0.452056884765625, -0.42889404296875, -0.405731201171875, -0.382568359375, -0.359405517578125, -0.33624267578125, -0.313079833984375, -0.2899169921875, -0.266754150390625, -0.24359130859375, -0.220428466796875, -0.197265625, -0.174102783203125, -0.15093994140625, -0.127777099609375, -0.1046142578125, -0.081451416015625, -0.05828857421875, -0.035125732421875, -0.011962890625, 0.011199951171875, 0.03436279296875, 0.057525634765625, 0.0806884765625, 0.103851318359375, 0.12701416015625, 0.150177001953125, 0.17333984375, 0.196502685546875, 0.21966552734375, 0.242828369140625, 0.2659912109375, 0.289154052734375, 0.31231689453125, 0.335479736328125, 0.358642578125, 0.381805419921875, 0.40496826171875, 0.428131103515625, 0.4512939453125, 0.474456787109375, 0.49761962890625, 0.520782470703125, 0.5439453125, 0.567108154296875, 0.59027099609375, 0.613433837890625, 0.6365966796875, 0.659759521484375, 0.68292236328125, 0.706085205078125, 0.729248046875, 0.752410888671875, 0.77557373046875, 0.798736572265625, 0.8218994140625, 0.845062255859375, 0.86822509765625, 0.891387939453125, 0.91455078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 13.0, 15.0, 16.0, 28.0, 23.0, 27.0, 39.0, 50.0, 69.0, 95.0, 102.0, 109.0, 87.0, 54.0, 39.0, 40.0, 32.0, 19.0, 21.0, 14.0, 14.0, 7.0, 12.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5390625, -0.5232086181640625, -0.507354736328125, -0.4915008544921875, -0.47564697265625, -0.4597930908203125, -0.443939208984375, -0.4280853271484375, -0.4122314453125, -0.3963775634765625, -0.380523681640625, -0.3646697998046875, -0.34881591796875, -0.3329620361328125, -0.317108154296875, -0.3012542724609375, -0.285400390625, -0.2695465087890625, -0.253692626953125, -0.2378387451171875, -0.22198486328125, -0.2061309814453125, -0.190277099609375, -0.1744232177734375, -0.1585693359375, -0.1427154541015625, -0.126861572265625, -0.1110076904296875, -0.09515380859375, -0.0792999267578125, -0.063446044921875, -0.0475921630859375, -0.03173828125, -0.0158843994140625, -3.0517578125e-05, 0.0158233642578125, 0.03167724609375, 0.0475311279296875, 0.063385009765625, 0.0792388916015625, 0.0950927734375, 0.1109466552734375, 0.126800537109375, 0.1426544189453125, 0.15850830078125, 0.1743621826171875, 0.190216064453125, 0.2060699462890625, 0.221923828125, 0.2377777099609375, 0.253631591796875, 0.2694854736328125, 0.28533935546875, 0.3011932373046875, 0.317047119140625, 0.3329010009765625, 0.3487548828125, 0.3646087646484375, 0.380462646484375, 0.3963165283203125, 0.41217041015625, 0.4280242919921875, 0.443878173828125, 0.4597320556640625, 0.4755859375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 8.0, 18.0, 45.0, 117.0, 365.0, 285.0, 102.0, 26.0, 12.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.106849670410156, -33.36344909667969, -32.62004852294922, -31.876649856567383, -31.133251190185547, -30.389850616455078, -29.646451950073242, -28.903051376342773, -28.159652709960938, -27.41625213623047, -26.672853469848633, -25.929452896118164, -25.186054229736328, -24.44265365600586, -23.699254989624023, -22.955854415893555, -22.21245574951172, -21.46905517578125, -20.725656509399414, -19.982255935668945, -19.23885726928711, -18.49545669555664, -17.752058029174805, -17.008657455444336, -16.265256881713867, -15.521857261657715, -14.778457641601562, -14.03505802154541, -13.291658401489258, -12.548258781433105, -11.804859161376953, -11.061458587646484, -10.318059921264648, -9.574660301208496, -8.831260681152344, -8.087861061096191, -7.344461441040039, -6.601061820983887, -5.857661724090576, -5.114262104034424, -4.3708624839782715, -3.627462863922119, -2.884063243865967, -2.1406633853912354, -1.397263765335083, -0.6538641452789307, 0.08953571319580078, 0.8329353332519531, 1.5763349533081055, 2.319734573364258, 3.06313419342041, 3.8065340518951416, 4.549933433532715, 5.293333053588867, 6.036733150482178, 6.78013277053833, 7.523532390594482, 8.266932487487793, 9.010332107543945, 9.753731727600098, 10.49713134765625, 11.240530967712402, 11.983930587768555, 12.727330207824707, 13.47072982788086]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 10.0, 2.0, 10.0, 16.0, 7.0, 12.0, 19.0, 28.0, 16.0, 33.0, 23.0, 26.0, 42.0, 41.0, 58.0, 75.0, 106.0, 90.0, 55.0, 37.0, 49.0, 20.0, 38.0, 31.0, 30.0, 14.0, 19.0, 14.0, 19.0, 4.0, 6.0, 6.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-10.810636520385742, -10.506580352783203, -10.202524185180664, -9.898468017578125, -9.594411849975586, -9.290355682373047, -8.986299514770508, -8.682243347167969, -8.37818717956543, -8.07413101196289, -7.770074844360352, -7.4660186767578125, -7.161962509155273, -6.857906341552734, -6.553850173950195, -6.249794006347656, -5.945737361907959, -5.64168119430542, -5.337625026702881, -5.033568859100342, -4.729512691497803, -4.425456523895264, -4.121399879455566, -3.8173439502716064, -3.5132877826690674, -3.2092316150665283, -2.9051754474639893, -2.601119041442871, -2.297062873840332, -1.9930068254470825, -1.688950538635254, -1.3848943710327148, -1.0808382034301758, -0.7767820358276367, -0.4727258086204529, -0.16866958141326904, 0.13538658618927002, 0.4394427537918091, 0.7434990406036377, 1.0475552082061768, 1.3516113758087158, 1.6556675434112549, 1.959723711013794, 2.263780117034912, 2.567836284637451, 2.8718924522399902, 3.1759486198425293, 3.4800047874450684, 3.7840609550476074, 4.0881171226501465, 4.3921732902526855, 4.696229457855225, 5.000285625457764, 5.304341793060303, 5.6083984375, 5.912454605102539, 6.216510772705078, 6.520566940307617, 6.824623107910156, 7.128679275512695, 7.432735443115234, 7.736791610717773, 8.040847778320312, 8.344903945922852, 8.64896011352539]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 2.0, 12.0, 13.0, 18.0, 25.0, 47.0, 68.0, 97.0, 168.0, 346.0, 665.0, 1339.0, 3310.0, 9568.0, 40378.0, 309086.0, 2618778.0, 1081913.0, 100136.0, 18555.0, 5539.0, 2137.0, 941.0, 488.0, 236.0, 142.0, 95.0, 59.0, 40.0, 19.0, 16.0, 14.0, 5.0, 2.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2607421875, -1.223388671875, -1.18603515625, -1.148681640625, -1.111328125, -1.073974609375, -1.03662109375, -0.999267578125, -0.9619140625, -0.924560546875, -0.88720703125, -0.849853515625, -0.8125, -0.775146484375, -0.73779296875, -0.700439453125, -0.6630859375, -0.625732421875, -0.58837890625, -0.551025390625, -0.513671875, -0.476318359375, -0.43896484375, -0.401611328125, -0.3642578125, -0.326904296875, -0.28955078125, -0.252197265625, -0.21484375, -0.177490234375, -0.14013671875, -0.102783203125, -0.0654296875, -0.028076171875, 0.00927734375, 0.046630859375, 0.083984375, 0.121337890625, 0.15869140625, 0.196044921875, 0.2333984375, 0.270751953125, 0.30810546875, 0.345458984375, 0.3828125, 0.420166015625, 0.45751953125, 0.494873046875, 0.5322265625, 0.569580078125, 0.60693359375, 0.644287109375, 0.681640625, 0.718994140625, 0.75634765625, 0.793701171875, 0.8310546875, 0.868408203125, 0.90576171875, 0.943115234375, 0.98046875, 1.017822265625, 1.05517578125, 1.092529296875, 1.1298828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 12.0, 14.0, 16.0, 16.0, 24.0, 30.0, 41.0, 50.0, 27.0, 51.0, 48.0, 46.0, 60.0, 54.0, 65.0, 59.0, 41.0, 51.0, 48.0, 44.0, 43.0, 29.0, 34.0, 20.0, 11.0, 17.0, 9.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6767578125, -0.6533203125, -0.6298828125, -0.6064453125, -0.5830078125, -0.5595703125, -0.5361328125, -0.5126953125, -0.4892578125, -0.4658203125, -0.4423828125, -0.4189453125, -0.3955078125, -0.3720703125, -0.3486328125, -0.3251953125, -0.3017578125, -0.2783203125, -0.2548828125, -0.2314453125, -0.2080078125, -0.1845703125, -0.1611328125, -0.1376953125, -0.1142578125, -0.0908203125, -0.0673828125, -0.0439453125, -0.0205078125, 0.0029296875, 0.0263671875, 0.0498046875, 0.0732421875, 0.0966796875, 0.1201171875, 0.1435546875, 0.1669921875, 0.1904296875, 0.2138671875, 0.2373046875, 0.2607421875, 0.2841796875, 0.3076171875, 0.3310546875, 0.3544921875, 0.3779296875, 0.4013671875, 0.4248046875, 0.4482421875, 0.4716796875, 0.4951171875, 0.5185546875, 0.5419921875, 0.5654296875, 0.5888671875, 0.6123046875, 0.6357421875, 0.6591796875, 0.6826171875, 0.7060546875, 0.7294921875, 0.7529296875, 0.7763671875, 0.7998046875, 0.8232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 5.0, 9.0, 13.0, 9.0, 13.0, 24.0, 58.0, 76.0, 115.0, 156.0, 334.0, 803.0, 2116.0, 7418.0, 40789.0, 659587.0, 3289378.0, 167564.0, 18813.0, 4460.0, 1315.0, 559.0, 284.0, 151.0, 74.0, 41.0, 36.0, 24.0, 9.0, 13.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8123626708984375, -1.762420654296875, -1.7124786376953125, -1.66253662109375, -1.6125946044921875, -1.562652587890625, -1.5127105712890625, -1.4627685546875, -1.4128265380859375, -1.362884521484375, -1.3129425048828125, -1.26300048828125, -1.2130584716796875, -1.163116455078125, -1.1131744384765625, -1.063232421875, -1.0132904052734375, -0.963348388671875, -0.9134063720703125, -0.86346435546875, -0.8135223388671875, -0.763580322265625, -0.7136383056640625, -0.6636962890625, -0.6137542724609375, -0.563812255859375, -0.5138702392578125, -0.46392822265625, -0.4139862060546875, -0.364044189453125, -0.3141021728515625, -0.26416015625, -0.2142181396484375, -0.164276123046875, -0.1143341064453125, -0.06439208984375, -0.0144500732421875, 0.035491943359375, 0.0854339599609375, 0.1353759765625, 0.1853179931640625, 0.235260009765625, 0.2852020263671875, 0.33514404296875, 0.3850860595703125, 0.435028076171875, 0.4849700927734375, 0.534912109375, 0.5848541259765625, 0.634796142578125, 0.6847381591796875, 0.73468017578125, 0.7846221923828125, 0.834564208984375, 0.8845062255859375, 0.9344482421875, 0.9843902587890625, 1.034332275390625, 1.0842742919921875, 1.13421630859375, 1.1841583251953125, 1.234100341796875, 1.2840423583984375, 1.333984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 4.0, 5.0, 12.0, 26.0, 41.0, 37.0, 83.0, 93.0, 129.0, 203.0, 296.0, 394.0, 526.0, 556.0, 469.0, 347.0, 251.0, 150.0, 115.0, 69.0, 66.0, 38.0, 46.0, 19.0, 18.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0298614501953125, -0.993316650390625, -0.9567718505859375, -0.92022705078125, -0.8836822509765625, -0.847137451171875, -0.8105926513671875, -0.7740478515625, -0.7375030517578125, -0.700958251953125, -0.6644134521484375, -0.62786865234375, -0.5913238525390625, -0.554779052734375, -0.5182342529296875, -0.481689453125, -0.4451446533203125, -0.408599853515625, -0.3720550537109375, -0.33551025390625, -0.2989654541015625, -0.262420654296875, -0.2258758544921875, -0.1893310546875, -0.1527862548828125, -0.116241455078125, -0.0796966552734375, -0.04315185546875, -0.0066070556640625, 0.029937744140625, 0.0664825439453125, 0.10302734375, 0.1395721435546875, 0.176116943359375, 0.2126617431640625, 0.24920654296875, 0.2857513427734375, 0.322296142578125, 0.3588409423828125, 0.3953857421875, 0.4319305419921875, 0.468475341796875, 0.5050201416015625, 0.54156494140625, 0.5781097412109375, 0.614654541015625, 0.6511993408203125, 0.687744140625, 0.7242889404296875, 0.760833740234375, 0.7973785400390625, 0.83392333984375, 0.8704681396484375, 0.907012939453125, 0.9435577392578125, 0.9801025390625, 1.0166473388671875, 1.053192138671875, 1.0897369384765625, 1.12628173828125, 1.1628265380859375, 1.199371337890625, 1.2359161376953125, 1.2724609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 11.0, 13.0, 29.0, 49.0, 94.0, 145.0, 181.0, 176.0, 125.0, 61.0, 49.0, 24.0, 12.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.183838844299316, -7.769847869873047, -7.355856895446777, -6.941866397857666, -6.5278754234313965, -6.113884449005127, -5.699893951416016, -5.285902976989746, -4.871912002563477, -4.457921028137207, -4.0439300537109375, -3.629939556121826, -3.2159485816955566, -2.801957607269287, -2.3879668712615967, -1.9739761352539062, -1.5599851608276367, -1.1459943056106567, -0.7320034503936768, -0.3180125951766968, 0.0959782600402832, 0.5099692344665527, 0.9239599704742432, 1.3379507064819336, 1.7519416809082031, 2.1659326553344727, 2.579923391342163, 2.9939141273498535, 3.407905101776123, 3.8218960762023926, 4.235886573791504, 4.649877548217773, 5.063869476318359, 5.477860450744629, 5.891851425170898, 6.30584192276001, 6.719832897186279, 7.133823871612549, 7.54781436920166, 7.96180534362793, 8.3757963180542, 8.789787292480469, 9.203778266906738, 9.617769241333008, 10.031759262084961, 10.445751190185547, 10.8597412109375, 11.27373218536377, 11.687723159790039, 12.101714134216309, 12.515705108642578, 12.929696083068848, 13.343687057495117, 13.75767707824707, 14.17166805267334, 14.58565902709961, 14.999650001525879, 15.413640975952148, 15.827631950378418, 16.241622924804688, 16.65561294555664, 17.069604873657227, 17.48359489440918, 17.897586822509766, 18.31157684326172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 8.0, 19.0, 23.0, 23.0, 19.0, 33.0, 37.0, 38.0, 31.0, 51.0, 37.0, 41.0, 52.0, 43.0, 48.0, 44.0, 45.0, 32.0, 30.0, 47.0, 32.0, 39.0, 27.0, 24.0, 22.0, 23.0, 10.0, 12.0, 15.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0], "bins": [-6.707261085510254, -6.5287370681762695, -6.350213050842285, -6.171689033508301, -5.993165493011475, -5.81464147567749, -5.636117458343506, -5.4575934410095215, -5.279069423675537, -5.100545406341553, -4.922021389007568, -4.743497848510742, -4.564973831176758, -4.386449813842773, -4.207925796508789, -4.029401779174805, -3.8508780002593994, -3.672353982925415, -3.4938302040100098, -3.3153061866760254, -3.136782169342041, -2.9582581520080566, -2.7797343730926514, -2.601210355758667, -2.4226865768432617, -2.2441625595092773, -2.065638780593872, -1.8871147632598877, -1.7085907459259033, -1.5300668478012085, -1.3515429496765137, -1.1730189323425293, -0.9944949150085449, -0.8159709572792053, -0.6374469995498657, -0.4589231014251709, -0.2803991436958313, -0.1018751859664917, 0.07664871215820312, 0.2551727294921875, 0.4336966276168823, 0.6122205853462219, 0.7907445430755615, 0.9692684412002563, 1.1477923393249512, 1.3263163566589355, 1.5048402547836304, 1.6833642721176147, 1.8618881702423096, 2.040412187576294, 2.218935966491699, 2.3974599838256836, 2.575984001159668, 2.7545080184936523, 2.9330317974090576, 3.111555814743042, 3.2900795936584473, 3.4686036109924316, 3.647127389907837, 3.8256514072418213, 4.004175186157227, 4.182699203491211, 4.361223220825195, 4.53974723815918, 4.718271255493164]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 10.0, 7.0, 9.0, 11.0, 26.0, 40.0, 51.0, 92.0, 183.0, 334.0, 630.0, 1302.0, 2813.0, 6863.0, 17919.0, 54502.0, 206201.0, 492176.0, 186938.0, 50212.0, 16634.0, 6308.0, 2722.0, 1220.0, 603.0, 296.0, 186.0, 101.0, 70.0, 33.0, 21.0, 16.0, 6.0, 11.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1298828125, -1.087188720703125, -1.04449462890625, -1.001800537109375, -0.9591064453125, -0.916412353515625, -0.87371826171875, -0.831024169921875, -0.788330078125, -0.745635986328125, -0.70294189453125, -0.660247802734375, -0.6175537109375, -0.574859619140625, -0.53216552734375, -0.489471435546875, -0.44677734375, -0.404083251953125, -0.36138916015625, -0.318695068359375, -0.2760009765625, -0.233306884765625, -0.19061279296875, -0.147918701171875, -0.105224609375, -0.062530517578125, -0.01983642578125, 0.022857666015625, 0.0655517578125, 0.108245849609375, 0.15093994140625, 0.193634033203125, 0.236328125, 0.279022216796875, 0.32171630859375, 0.364410400390625, 0.4071044921875, 0.449798583984375, 0.49249267578125, 0.535186767578125, 0.577880859375, 0.620574951171875, 0.66326904296875, 0.705963134765625, 0.7486572265625, 0.791351318359375, 0.83404541015625, 0.876739501953125, 0.91943359375, 0.962127685546875, 1.00482177734375, 1.047515869140625, 1.0902099609375, 1.132904052734375, 1.17559814453125, 1.218292236328125, 1.260986328125, 1.303680419921875, 1.34637451171875, 1.389068603515625, 1.4317626953125, 1.474456787109375, 1.51715087890625, 1.559844970703125, 1.6025390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 11.0, 11.0, 13.0, 11.0, 21.0, 22.0, 27.0, 32.0, 27.0, 48.0, 43.0, 39.0, 44.0, 56.0, 65.0, 55.0, 46.0, 59.0, 44.0, 54.0, 27.0, 53.0, 32.0, 30.0, 34.0, 18.0, 11.0, 12.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65869140625, -0.6354446411132812, -0.6121978759765625, -0.5889511108398438, -0.565704345703125, -0.5424575805664062, -0.5192108154296875, -0.49596405029296875, -0.47271728515625, -0.44947052001953125, -0.4262237548828125, -0.40297698974609375, -0.379730224609375, -0.35648345947265625, -0.3332366943359375, -0.30998992919921875, -0.2867431640625, -0.26349639892578125, -0.2402496337890625, -0.21700286865234375, -0.193756103515625, -0.17050933837890625, -0.1472625732421875, -0.12401580810546875, -0.10076904296875, -0.07752227783203125, -0.0542755126953125, -0.03102874755859375, -0.007781982421875, 0.01546478271484375, 0.0387115478515625, 0.06195831298828125, 0.085205078125, 0.10845184326171875, 0.1316986083984375, 0.15494537353515625, 0.178192138671875, 0.20143890380859375, 0.2246856689453125, 0.24793243408203125, 0.27117919921875, 0.29442596435546875, 0.3176727294921875, 0.34091949462890625, 0.364166259765625, 0.38741302490234375, 0.4106597900390625, 0.43390655517578125, 0.4571533203125, 0.48040008544921875, 0.5036468505859375, 0.5268936157226562, 0.550140380859375, 0.5733871459960938, 0.5966339111328125, 0.6198806762695312, 0.64312744140625, 0.6663742065429688, 0.6896209716796875, 0.7128677368164062, 0.736114501953125, 0.7593612670898438, 0.7826080322265625, 0.8058547973632812, 0.8291015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 21.0, 18.0, 15.0, 31.0, 33.0, 46.0, 74.0, 95.0, 148.0, 218.0, 344.0, 507.0, 892.0, 1696.0, 4239.0, 17860.0, 171297.0, 785405.0, 51473.0, 8394.0, 2592.0, 1156.0, 669.0, 412.0, 266.0, 182.0, 138.0, 92.0, 60.0, 45.0, 42.0, 29.0, 17.0, 15.0, 2.0, 6.0, 8.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.9354248046875, -1.866943359375, -1.7984619140625, -1.72998046875, -1.6614990234375, -1.593017578125, -1.5245361328125, -1.4560546875, -1.3875732421875, -1.319091796875, -1.2506103515625, -1.18212890625, -1.1136474609375, -1.045166015625, -0.9766845703125, -0.908203125, -0.8397216796875, -0.771240234375, -0.7027587890625, -0.63427734375, -0.5657958984375, -0.497314453125, -0.4288330078125, -0.3603515625, -0.2918701171875, -0.223388671875, -0.1549072265625, -0.08642578125, -0.0179443359375, 0.050537109375, 0.1190185546875, 0.1875, 0.2559814453125, 0.324462890625, 0.3929443359375, 0.46142578125, 0.5299072265625, 0.598388671875, 0.6668701171875, 0.7353515625, 0.8038330078125, 0.872314453125, 0.9407958984375, 1.00927734375, 1.0777587890625, 1.146240234375, 1.2147216796875, 1.283203125, 1.3516845703125, 1.420166015625, 1.4886474609375, 1.55712890625, 1.6256103515625, 1.694091796875, 1.7625732421875, 1.8310546875, 1.8995361328125, 1.968017578125, 2.0364990234375, 2.10498046875, 2.1734619140625, 2.241943359375, 2.3104248046875, 2.37890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 4.0, 3.0, 9.0, 9.0, 9.0, 13.0, 16.0, 21.0, 15.0, 31.0, 33.0, 31.0, 41.0, 47.0, 44.0, 61.0, 46.0, 55.0, 71.0, 58.0, 49.0, 61.0, 41.0, 28.0, 37.0, 33.0, 20.0, 16.0, 13.0, 13.0, 14.0, 12.0, 9.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.050048828125, -1.97314453125, -1.896240234375, -1.8193359375, -1.742431640625, -1.66552734375, -1.588623046875, -1.51171875, -1.434814453125, -1.35791015625, -1.281005859375, -1.2041015625, -1.127197265625, -1.05029296875, -0.973388671875, -0.896484375, -0.819580078125, -0.74267578125, -0.665771484375, -0.5888671875, -0.511962890625, -0.43505859375, -0.358154296875, -0.28125, -0.204345703125, -0.12744140625, -0.050537109375, 0.0263671875, 0.103271484375, 0.18017578125, 0.257080078125, 0.333984375, 0.410888671875, 0.48779296875, 0.564697265625, 0.6416015625, 0.718505859375, 0.79541015625, 0.872314453125, 0.94921875, 1.026123046875, 1.10302734375, 1.179931640625, 1.2568359375, 1.333740234375, 1.41064453125, 1.487548828125, 1.564453125, 1.641357421875, 1.71826171875, 1.795166015625, 1.8720703125, 1.948974609375, 2.02587890625, 2.102783203125, 2.1796875, 2.256591796875, 2.33349609375, 2.410400390625, 2.4873046875, 2.564208984375, 2.64111328125, 2.718017578125, 2.794921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 6.0, 6.0, 9.0, 22.0, 35.0, 65.0, 103.0, 163.0, 299.0, 695.0, 1749.0, 6163.0, 41817.0, 875283.0, 107005.0, 10750.0, 2565.0, 929.0, 369.0, 210.0, 112.0, 54.0, 39.0, 30.0, 20.0, 14.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8466796875, -0.821533203125, -0.79638671875, -0.771240234375, -0.74609375, -0.720947265625, -0.69580078125, -0.670654296875, -0.6455078125, -0.620361328125, -0.59521484375, -0.570068359375, -0.544921875, -0.519775390625, -0.49462890625, -0.469482421875, -0.4443359375, -0.419189453125, -0.39404296875, -0.368896484375, -0.34375, -0.318603515625, -0.29345703125, -0.268310546875, -0.2431640625, -0.218017578125, -0.19287109375, -0.167724609375, -0.142578125, -0.117431640625, -0.09228515625, -0.067138671875, -0.0419921875, -0.016845703125, 0.00830078125, 0.033447265625, 0.05859375, 0.083740234375, 0.10888671875, 0.134033203125, 0.1591796875, 0.184326171875, 0.20947265625, 0.234619140625, 0.259765625, 0.284912109375, 0.31005859375, 0.335205078125, 0.3603515625, 0.385498046875, 0.41064453125, 0.435791015625, 0.4609375, 0.486083984375, 0.51123046875, 0.536376953125, 0.5615234375, 0.586669921875, 0.61181640625, 0.636962890625, 0.662109375, 0.687255859375, 0.71240234375, 0.737548828125, 0.7626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 15.0, 5.0, 11.0, 28.0, 30.0, 29.0, 39.0, 68.0, 102.0, 181.0, 153.0, 101.0, 63.0, 46.0, 24.0, 26.0, 15.0, 17.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013506412506103516, -0.00013003312051296234, -0.00012500211596488953, -0.00011997111141681671, -0.0001149401068687439, -0.00010990910232067108, -0.00010487809777259827, -9.984709322452545e-05, -9.481608867645264e-05, -8.978508412837982e-05, -8.475407958030701e-05, -7.972307503223419e-05, -7.469207048416138e-05, -6.966106593608856e-05, -6.463006138801575e-05, -5.959905683994293e-05, -5.456805229187012e-05, -4.95370477437973e-05, -4.450604319572449e-05, -3.947503864765167e-05, -3.444403409957886e-05, -2.9413029551506042e-05, -2.4382025003433228e-05, -1.9351020455360413e-05, -1.4320015907287598e-05, -9.289011359214783e-06, -4.258006811141968e-06, 7.729977369308472e-07, 5.804002285003662e-06, 1.0835006833076477e-05, 1.5866011381149292e-05, 2.0897015929222107e-05, 2.5928020477294922e-05, 3.095902502536774e-05, 3.599002957344055e-05, 4.102103412151337e-05, 4.605203866958618e-05, 5.1083043217658997e-05, 5.611404776573181e-05, 6.114505231380463e-05, 6.617605686187744e-05, 7.120706140995026e-05, 7.623806595802307e-05, 8.126907050609589e-05, 8.63000750541687e-05, 9.133107960224152e-05, 9.636208415031433e-05, 0.00010139308869838715, 0.00010642409324645996, 0.00011145509779453278, 0.00011648610234260559, 0.0001215171068906784, 0.00012654811143875122, 0.00013157911598682404, 0.00013661012053489685, 0.00014164112508296967, 0.00014667212963104248, 0.0001517031341791153, 0.0001567341387271881, 0.00016176514327526093, 0.00016679614782333374, 0.00017182715237140656, 0.00017685815691947937, 0.00018188916146755219, 0.000186920166015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 11.0, 7.0, 18.0, 19.0, 36.0, 48.0, 59.0, 81.0, 126.0, 203.0, 386.0, 732.0, 1499.0, 3406.0, 9508.0, 38936.0, 295212.0, 633376.0, 46993.0, 10678.0, 3712.0, 1560.0, 789.0, 461.0, 237.0, 132.0, 92.0, 63.0, 45.0, 35.0, 25.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.404052734375, -0.3885459899902344, -0.37303924560546875, -0.3575325012207031, -0.3420257568359375, -0.3265190124511719, -0.31101226806640625, -0.2955055236816406, -0.279998779296875, -0.2644920349121094, -0.24898529052734375, -0.23347854614257812, -0.2179718017578125, -0.20246505737304688, -0.18695831298828125, -0.17145156860351562, -0.15594482421875, -0.14043807983398438, -0.12493133544921875, -0.10942459106445312, -0.0939178466796875, -0.07841110229492188, -0.06290435791015625, -0.047397613525390625, -0.031890869140625, -0.016384124755859375, -0.00087738037109375, 0.014629364013671875, 0.0301361083984375, 0.045642852783203125, 0.06114959716796875, 0.07665634155273438, 0.0921630859375, 0.10766983032226562, 0.12317657470703125, 0.13868331909179688, 0.1541900634765625, 0.16969680786132812, 0.18520355224609375, 0.20071029663085938, 0.216217041015625, 0.23172378540039062, 0.24723052978515625, 0.2627372741699219, 0.2782440185546875, 0.2937507629394531, 0.30925750732421875, 0.3247642517089844, 0.34027099609375, 0.3557777404785156, 0.37128448486328125, 0.3867912292480469, 0.4022979736328125, 0.4178047180175781, 0.43331146240234375, 0.4488182067871094, 0.464324951171875, 0.4798316955566406, 0.49533843994140625, 0.5108451843261719, 0.5263519287109375, 0.5418586730957031, 0.5573654174804688, 0.5728721618652344, 0.58837890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 6.0, 2.0, 4.0, 11.0, 9.0, 18.0, 14.0, 14.0, 29.0, 29.0, 35.0, 55.0, 56.0, 67.0, 111.0, 121.0, 98.0, 73.0, 63.0, 36.0, 34.0, 24.0, 20.0, 17.0, 14.0, 7.0, 5.0, 8.0, 3.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.406494140625, -0.3922462463378906, -0.37799835205078125, -0.3637504577636719, -0.3495025634765625, -0.3352546691894531, -0.32100677490234375, -0.3067588806152344, -0.292510986328125, -0.2782630920410156, -0.26401519775390625, -0.24976730346679688, -0.2355194091796875, -0.22127151489257812, -0.20702362060546875, -0.19277572631835938, -0.17852783203125, -0.16427993774414062, -0.15003204345703125, -0.13578414916992188, -0.1215362548828125, -0.10728836059570312, -0.09304046630859375, -0.07879257202148438, -0.064544677734375, -0.050296783447265625, -0.03604888916015625, -0.021800994873046875, -0.0075531005859375, 0.006694793701171875, 0.02094268798828125, 0.035190582275390625, 0.0494384765625, 0.06368637084960938, 0.07793426513671875, 0.09218215942382812, 0.1064300537109375, 0.12067794799804688, 0.13492584228515625, 0.14917373657226562, 0.163421630859375, 0.17766952514648438, 0.19191741943359375, 0.20616531372070312, 0.2204132080078125, 0.23466110229492188, 0.24890899658203125, 0.2631568908691406, 0.27740478515625, 0.2916526794433594, 0.30590057373046875, 0.3201484680175781, 0.3343963623046875, 0.3486442565917969, 0.36289215087890625, 0.3771400451660156, 0.391387939453125, 0.4056358337402344, 0.41988372802734375, 0.4341316223144531, 0.4483795166015625, 0.4626274108886719, 0.47687530517578125, 0.4911231994628906, 0.50537109375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 14.0, 31.0, 114.0, 513.0, 235.0, 63.0, 19.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.60491180419922, -33.66425323486328, -32.72359085083008, -31.78293228149414, -30.84227180480957, -29.901611328125, -28.960952758789062, -28.020292282104492, -27.079631805419922, -26.13897132873535, -25.198312759399414, -24.257652282714844, -23.316991806030273, -22.376331329345703, -21.435672760009766, -20.495012283325195, -19.554351806640625, -18.613691329956055, -17.673032760620117, -16.732372283935547, -15.791711807250977, -14.851052284240723, -13.910392761230469, -12.969732284545898, -12.029073715209961, -11.088414192199707, -10.147753715515137, -9.207094192504883, -8.266433715820312, -7.325774192810059, -6.3851141929626465, -5.444454193115234, -4.503793716430664, -3.563133716583252, -2.62247371673584, -1.6818139553070068, -0.7411539554595947, 0.19950580596923828, 1.1401658058166504, 2.0808258056640625, 3.0214858055114746, 3.9621458053588867, 4.902805805206299, 5.843465805053711, 6.784125328063965, 7.724785327911377, 8.665445327758789, 9.60610580444336, 10.546765327453613, 11.487424850463867, 12.428085327148438, 13.368744850158691, 14.309405326843262, 15.250064849853516, 16.190725326538086, 17.131385803222656, 18.072044372558594, 19.012704849243164, 19.9533634185791, 20.894023895263672, 21.834684371948242, 22.775344848632812, 23.71600341796875, 24.65666389465332, 25.59732437133789]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 10.0, 13.0, 18.0, 15.0, 12.0, 14.0, 14.0, 30.0, 30.0, 34.0, 39.0, 47.0, 90.0, 140.0, 90.0, 58.0, 42.0, 32.0, 39.0, 23.0, 25.0, 11.0, 21.0, 16.0, 17.0, 14.0, 6.0, 9.0, 7.0, 10.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.924737930297852, -8.6578950881958, -8.39105224609375, -8.1242094039917, -7.857367038726807, -7.590524196624756, -7.323681354522705, -7.056838512420654, -6.789996147155762, -6.523153305053711, -6.25631046295166, -5.989467620849609, -5.722625255584717, -5.455782413482666, -5.188939571380615, -4.9220967292785645, -4.655253887176514, -4.388411045074463, -4.121568202972412, -3.8547255992889404, -3.5878829956054688, -3.321040153503418, -3.054197311401367, -2.7873544692993164, -2.5205118656158447, -2.253669023513794, -1.9868264198303223, -1.7199835777282715, -1.4531408548355103, -1.186298131942749, -0.9194552898406982, -0.652612566947937, -0.3857698440551758, -0.11892709136009216, 0.14791566133499146, 0.41475844383239746, 0.6816011667251587, 0.9484438896179199, 1.2152867317199707, 1.482129454612732, 1.7489721775054932, 2.015815019607544, 2.2826576232910156, 2.5495004653930664, 2.816343307495117, 3.083185911178589, 3.3500287532806396, 3.6168713569641113, 3.883714199066162, 4.150557041168213, 4.417399883270264, 4.684242248535156, 4.951085090637207, 5.217927932739258, 5.484770774841309, 5.751613616943359, 6.01845645904541, 6.285299301147461, 6.552142143249512, 6.8189849853515625, 7.085827350616455, 7.352670192718506, 7.619513034820557, 7.886355876922607, 8.1531982421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 6.0, 11.0, 12.0, 12.0, 29.0, 27.0, 30.0, 70.0, 134.0, 234.0, 406.0, 887.0, 2009.0, 5197.0, 17682.0, 97352.0, 955745.0, 2592758.0, 452376.0, 51312.0, 11485.0, 3669.0, 1398.0, 662.0, 331.0, 170.0, 98.0, 60.0, 48.0, 26.0, 11.0, 13.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.650390625, -1.602325439453125, -1.55426025390625, -1.506195068359375, -1.4581298828125, -1.410064697265625, -1.36199951171875, -1.313934326171875, -1.265869140625, -1.217803955078125, -1.16973876953125, -1.121673583984375, -1.0736083984375, -1.025543212890625, -0.97747802734375, -0.929412841796875, -0.88134765625, -0.833282470703125, -0.78521728515625, -0.737152099609375, -0.6890869140625, -0.641021728515625, -0.59295654296875, -0.544891357421875, -0.496826171875, -0.448760986328125, -0.40069580078125, -0.352630615234375, -0.3045654296875, -0.256500244140625, -0.20843505859375, -0.160369873046875, -0.1123046875, -0.064239501953125, -0.01617431640625, 0.031890869140625, 0.0799560546875, 0.128021240234375, 0.17608642578125, 0.224151611328125, 0.272216796875, 0.320281982421875, 0.36834716796875, 0.416412353515625, 0.4644775390625, 0.512542724609375, 0.56060791015625, 0.608673095703125, 0.65673828125, 0.704803466796875, 0.75286865234375, 0.800933837890625, 0.8489990234375, 0.897064208984375, 0.94512939453125, 0.993194580078125, 1.041259765625, 1.089324951171875, 1.13739013671875, 1.185455322265625, 1.2335205078125, 1.281585693359375, 1.32965087890625, 1.377716064453125, 1.42578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 6.0, 6.0, 5.0, 12.0, 14.0, 15.0, 13.0, 40.0, 24.0, 26.0, 32.0, 30.0, 33.0, 43.0, 42.0, 37.0, 47.0, 49.0, 49.0, 52.0, 40.0, 40.0, 44.0, 52.0, 29.0, 35.0, 25.0, 24.0, 27.0, 21.0, 17.0, 11.0, 14.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.490966796875, -0.4728431701660156, -0.45471954345703125, -0.4365959167480469, -0.4184722900390625, -0.4003486633300781, -0.38222503662109375, -0.3641014099121094, -0.345977783203125, -0.3278541564941406, -0.30973052978515625, -0.2916069030761719, -0.2734832763671875, -0.2553596496582031, -0.23723602294921875, -0.21911239624023438, -0.20098876953125, -0.18286514282226562, -0.16474151611328125, -0.14661788940429688, -0.1284942626953125, -0.11037063598632812, -0.09224700927734375, -0.07412338256835938, -0.055999755859375, -0.037876129150390625, -0.01975250244140625, -0.001628875732421875, 0.0164947509765625, 0.034618377685546875, 0.05274200439453125, 0.07086563110351562, 0.0889892578125, 0.10711288452148438, 0.12523651123046875, 0.14336013793945312, 0.1614837646484375, 0.17960739135742188, 0.19773101806640625, 0.21585464477539062, 0.233978271484375, 0.2521018981933594, 0.27022552490234375, 0.2883491516113281, 0.3064727783203125, 0.3245964050292969, 0.34272003173828125, 0.3608436584472656, 0.37896728515625, 0.3970909118652344, 0.41521453857421875, 0.4333381652832031, 0.4514617919921875, 0.4695854187011719, 0.48770904541015625, 0.5058326721191406, 0.523956298828125, 0.5420799255371094, 0.5602035522460938, 0.5783271789550781, 0.5964508056640625, 0.6145744323730469, 0.6326980590820312, 0.6508216857910156, 0.6689453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 10.0, 13.0, 15.0, 14.0, 36.0, 41.0, 44.0, 53.0, 110.0, 159.0, 229.0, 416.0, 749.0, 1570.0, 3829.0, 13870.0, 140130.0, 3774932.0, 231894.0, 17804.0, 4503.0, 1788.0, 835.0, 459.0, 269.0, 157.0, 99.0, 55.0, 49.0, 31.0, 34.0, 10.0, 19.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.626800537109375, -2.53485107421875, -2.442901611328125, -2.3509521484375, -2.259002685546875, -2.16705322265625, -2.075103759765625, -1.983154296875, -1.891204833984375, -1.79925537109375, -1.707305908203125, -1.6153564453125, -1.523406982421875, -1.43145751953125, -1.339508056640625, -1.24755859375, -1.155609130859375, -1.06365966796875, -0.971710205078125, -0.8797607421875, -0.787811279296875, -0.69586181640625, -0.603912353515625, -0.511962890625, -0.420013427734375, -0.32806396484375, -0.236114501953125, -0.1441650390625, -0.052215576171875, 0.03973388671875, 0.131683349609375, 0.2236328125, 0.315582275390625, 0.40753173828125, 0.499481201171875, 0.5914306640625, 0.683380126953125, 0.77532958984375, 0.867279052734375, 0.959228515625, 1.051177978515625, 1.14312744140625, 1.235076904296875, 1.3270263671875, 1.418975830078125, 1.51092529296875, 1.602874755859375, 1.69482421875, 1.786773681640625, 1.87872314453125, 1.970672607421875, 2.0626220703125, 2.154571533203125, 2.24652099609375, 2.338470458984375, 2.430419921875, 2.522369384765625, 2.61431884765625, 2.706268310546875, 2.7982177734375, 2.890167236328125, 2.98211669921875, 3.074066162109375, 3.166015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 10.0, 23.0, 29.0, 32.0, 40.0, 70.0, 100.0, 114.0, 192.0, 248.0, 433.0, 536.0, 587.0, 455.0, 311.0, 259.0, 166.0, 129.0, 85.0, 56.0, 41.0, 29.0, 27.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.112213134765625, -2.04669189453125, -1.981170654296875, -1.9156494140625, -1.850128173828125, -1.78460693359375, -1.719085693359375, -1.653564453125, -1.588043212890625, -1.52252197265625, -1.457000732421875, -1.3914794921875, -1.325958251953125, -1.26043701171875, -1.194915771484375, -1.12939453125, -1.063873291015625, -0.99835205078125, -0.932830810546875, -0.8673095703125, -0.801788330078125, -0.73626708984375, -0.670745849609375, -0.605224609375, -0.539703369140625, -0.47418212890625, -0.408660888671875, -0.3431396484375, -0.277618408203125, -0.21209716796875, -0.146575927734375, -0.0810546875, -0.015533447265625, 0.04998779296875, 0.115509033203125, 0.1810302734375, 0.246551513671875, 0.31207275390625, 0.377593994140625, 0.443115234375, 0.508636474609375, 0.57415771484375, 0.639678955078125, 0.7052001953125, 0.770721435546875, 0.83624267578125, 0.901763916015625, 0.96728515625, 1.032806396484375, 1.09832763671875, 1.163848876953125, 1.2293701171875, 1.294891357421875, 1.36041259765625, 1.425933837890625, 1.491455078125, 1.556976318359375, 1.62249755859375, 1.688018798828125, 1.7535400390625, 1.819061279296875, 1.88458251953125, 1.950103759765625, 2.015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 5.0, 14.0, 11.0, 23.0, 36.0, 114.0, 199.0, 250.0, 173.0, 83.0, 45.0, 17.0, 11.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.30022430419922, -42.137691497802734, -40.97515869140625, -39.8126220703125, -38.650089263916016, -37.48755645751953, -36.32502365112305, -35.16249084472656, -33.99995422363281, -32.83742141723633, -31.67488670349121, -30.512353897094727, -29.34981918334961, -28.187286376953125, -27.02475357055664, -25.862220764160156, -24.699687957763672, -23.537155151367188, -22.37462043762207, -21.212087631225586, -20.04955291748047, -18.887020111083984, -17.7244873046875, -16.561954498291016, -15.399419784545898, -14.236886024475098, -13.074352264404297, -11.911819458007812, -10.749285697937012, -9.586751937866211, -8.424219131469727, -7.261685371398926, -6.099153518676758, -4.936619758605957, -3.7740864753723145, -2.6115529537200928, -1.449019432067871, -0.2864856719970703, 0.8760476112365723, 2.038580894470215, 3.2011146545410156, 4.363648414611816, 5.526181697845459, 6.688714981079102, 7.851248741149902, 9.013782501220703, 10.176315307617188, 11.338849067687988, 12.501382827758789, 13.66391658782959, 14.82645034790039, 15.988983154296875, 17.15151596069336, 18.314050674438477, 19.47658348083496, 20.639118194580078, 21.801651000976562, 22.964183807373047, 24.126718521118164, 25.28925132751465, 26.451786041259766, 27.61431884765625, 28.776851654052734, 29.93938446044922, 31.101919174194336]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 10.0, 11.0, 22.0, 15.0, 17.0, 30.0, 26.0, 29.0, 36.0, 44.0, 38.0, 53.0, 61.0, 57.0, 72.0, 65.0, 47.0, 47.0, 40.0, 42.0, 28.0, 39.0, 35.0, 26.0, 20.0, 15.0, 10.0, 13.0, 5.0, 6.0, 6.0, 11.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.77409839630127, -12.343695640563965, -11.91329288482666, -11.482890129089355, -11.05248737335205, -10.622084617614746, -10.191682815551758, -9.761280059814453, -9.330877304077148, -8.900474548339844, -8.470071792602539, -8.039669036865234, -7.60926628112793, -7.178863525390625, -6.7484612464904785, -6.318058490753174, -5.887655258178711, -5.457252502441406, -5.026849746704102, -4.596446990966797, -4.166044235229492, -3.7356417179107666, -3.305239200592041, -2.8748364448547363, -2.4444336891174316, -2.014030933380127, -1.5836282968521118, -1.1532256603240967, -0.722822904586792, -0.2924201488494873, 0.13798236846923828, 0.568385124206543, 0.9987869262695312, 1.429189682006836, 1.859592318534851, 2.289994955062866, 2.720397710800171, 3.1508004665374756, 3.581202983856201, 4.011605739593506, 4.4420084953308105, 4.872411251068115, 5.30281400680542, 5.733216285705566, 6.163619041442871, 6.594021797180176, 7.0244245529174805, 7.454827308654785, 7.88523006439209, 8.315632820129395, 8.7460355758667, 9.176438331604004, 9.606841087341309, 10.037243843078613, 10.467645645141602, 10.898048400878906, 11.328451156616211, 11.758853912353516, 12.18925666809082, 12.619659423828125, 13.05006217956543, 13.480464935302734, 13.910867691040039, 14.341270446777344, 14.771673202514648]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 16.0, 23.0, 25.0, 30.0, 59.0, 76.0, 100.0, 185.0, 321.0, 569.0, 1166.0, 2374.0, 5474.0, 15660.0, 52034.0, 274125.0, 571678.0, 87291.0, 23000.0, 7988.0, 3136.0, 1485.0, 746.0, 332.0, 217.0, 131.0, 76.0, 76.0, 48.0, 34.0, 13.0, 8.0, 11.0, 6.0, 3.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.240234375, -1.201690673828125, -1.16314697265625, -1.124603271484375, -1.0860595703125, -1.047515869140625, -1.00897216796875, -0.970428466796875, -0.931884765625, -0.893341064453125, -0.85479736328125, -0.816253662109375, -0.7777099609375, -0.739166259765625, -0.70062255859375, -0.662078857421875, -0.62353515625, -0.584991455078125, -0.54644775390625, -0.507904052734375, -0.4693603515625, -0.430816650390625, -0.39227294921875, -0.353729248046875, -0.315185546875, -0.276641845703125, -0.23809814453125, -0.199554443359375, -0.1610107421875, -0.122467041015625, -0.08392333984375, -0.045379638671875, -0.0068359375, 0.031707763671875, 0.07025146484375, 0.108795166015625, 0.1473388671875, 0.185882568359375, 0.22442626953125, 0.262969970703125, 0.301513671875, 0.340057373046875, 0.37860107421875, 0.417144775390625, 0.4556884765625, 0.494232177734375, 0.53277587890625, 0.571319580078125, 0.60986328125, 0.648406982421875, 0.68695068359375, 0.725494384765625, 0.7640380859375, 0.802581787109375, 0.84112548828125, 0.879669189453125, 0.918212890625, 0.956756591796875, 0.99530029296875, 1.033843994140625, 1.0723876953125, 1.110931396484375, 1.14947509765625, 1.188018798828125, 1.2265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 15.0, 15.0, 29.0, 33.0, 47.0, 42.0, 60.0, 44.0, 80.0, 68.0, 78.0, 71.0, 69.0, 74.0, 48.0, 44.0, 35.0, 34.0, 31.0, 22.0, 17.0, 12.0, 11.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7572479248046875, -0.722503662109375, -0.6877593994140625, -0.65301513671875, -0.6182708740234375, -0.583526611328125, -0.5487823486328125, -0.5140380859375, -0.4792938232421875, -0.444549560546875, -0.4098052978515625, -0.37506103515625, -0.3403167724609375, -0.305572509765625, -0.2708282470703125, -0.236083984375, -0.2013397216796875, -0.166595458984375, -0.1318511962890625, -0.09710693359375, -0.0623626708984375, -0.027618408203125, 0.0071258544921875, 0.0418701171875, 0.0766143798828125, 0.111358642578125, 0.1461029052734375, 0.18084716796875, 0.2155914306640625, 0.250335693359375, 0.2850799560546875, 0.31982421875, 0.3545684814453125, 0.389312744140625, 0.4240570068359375, 0.45880126953125, 0.4935455322265625, 0.528289794921875, 0.5630340576171875, 0.5977783203125, 0.6325225830078125, 0.667266845703125, 0.7020111083984375, 0.73675537109375, 0.7714996337890625, 0.806243896484375, 0.8409881591796875, 0.875732421875, 0.9104766845703125, 0.945220947265625, 0.9799652099609375, 1.01470947265625, 1.0494537353515625, 1.084197998046875, 1.1189422607421875, 1.1536865234375, 1.1884307861328125, 1.223175048828125, 1.2579193115234375, 1.29266357421875, 1.3274078369140625, 1.362152099609375, 1.3968963623046875, 1.431640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 8.0, 8.0, 10.0, 14.0, 23.0, 23.0, 36.0, 52.0, 86.0, 122.0, 156.0, 265.0, 373.0, 771.0, 1859.0, 6833.0, 49896.0, 891703.0, 82467.0, 9460.0, 2259.0, 862.0, 450.0, 269.0, 178.0, 106.0, 68.0, 48.0, 36.0, 32.0, 15.0, 15.0, 5.0, 12.0, 5.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5478515625, -1.5017852783203125, -1.455718994140625, -1.4096527099609375, -1.36358642578125, -1.3175201416015625, -1.271453857421875, -1.2253875732421875, -1.1793212890625, -1.1332550048828125, -1.087188720703125, -1.0411224365234375, -0.99505615234375, -0.9489898681640625, -0.902923583984375, -0.8568572998046875, -0.810791015625, -0.7647247314453125, -0.718658447265625, -0.6725921630859375, -0.62652587890625, -0.5804595947265625, -0.534393310546875, -0.4883270263671875, -0.4422607421875, -0.3961944580078125, -0.350128173828125, -0.3040618896484375, -0.25799560546875, -0.2119293212890625, -0.165863037109375, -0.1197967529296875, -0.07373046875, -0.0276641845703125, 0.018402099609375, 0.0644683837890625, 0.11053466796875, 0.1566009521484375, 0.202667236328125, 0.2487335205078125, 0.2947998046875, 0.3408660888671875, 0.386932373046875, 0.4329986572265625, 0.47906494140625, 0.5251312255859375, 0.571197509765625, 0.6172637939453125, 0.663330078125, 0.7093963623046875, 0.755462646484375, 0.8015289306640625, 0.84759521484375, 0.8936614990234375, 0.939727783203125, 0.9857940673828125, 1.0318603515625, 1.0779266357421875, 1.123992919921875, 1.1700592041015625, 1.21612548828125, 1.2621917724609375, 1.308258056640625, 1.3543243408203125, 1.400390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 10.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 15.0, 19.0, 21.0, 29.0, 28.0, 56.0, 54.0, 58.0, 62.0, 80.0, 59.0, 68.0, 64.0, 52.0, 40.0, 33.0, 34.0, 12.0, 21.0, 20.0, 19.0, 20.0, 8.0, 10.0, 9.0, 6.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.49609375, -2.41912841796875, -2.3421630859375, -2.26519775390625, -2.188232421875, -2.11126708984375, -2.0343017578125, -1.95733642578125, -1.88037109375, -1.80340576171875, -1.7264404296875, -1.64947509765625, -1.572509765625, -1.49554443359375, -1.4185791015625, -1.34161376953125, -1.2646484375, -1.18768310546875, -1.1107177734375, -1.03375244140625, -0.956787109375, -0.87982177734375, -0.8028564453125, -0.72589111328125, -0.64892578125, -0.57196044921875, -0.4949951171875, -0.41802978515625, -0.341064453125, -0.26409912109375, -0.1871337890625, -0.11016845703125, -0.033203125, 0.04376220703125, 0.1207275390625, 0.19769287109375, 0.274658203125, 0.35162353515625, 0.4285888671875, 0.50555419921875, 0.58251953125, 0.65948486328125, 0.7364501953125, 0.81341552734375, 0.890380859375, 0.96734619140625, 1.0443115234375, 1.12127685546875, 1.1982421875, 1.27520751953125, 1.3521728515625, 1.42913818359375, 1.506103515625, 1.58306884765625, 1.6600341796875, 1.73699951171875, 1.81396484375, 1.89093017578125, 1.9678955078125, 2.04486083984375, 2.121826171875, 2.19879150390625, 2.2757568359375, 2.35272216796875, 2.4296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 9.0, 11.0, 19.0, 29.0, 38.0, 53.0, 92.0, 157.0, 268.0, 520.0, 1216.0, 3597.0, 14236.0, 183021.0, 817976.0, 19849.0, 4517.0, 1501.0, 653.0, 308.0, 171.0, 89.0, 66.0, 37.0, 31.0, 25.0, 16.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.37534332275390625, -0.3649444580078125, -0.35454559326171875, -0.344146728515625, -0.33374786376953125, -0.3233489990234375, -0.31295013427734375, -0.30255126953125, -0.29215240478515625, -0.2817535400390625, -0.27135467529296875, -0.260955810546875, -0.25055694580078125, -0.2401580810546875, -0.22975921630859375, -0.2193603515625, -0.20896148681640625, -0.1985626220703125, -0.18816375732421875, -0.177764892578125, -0.16736602783203125, -0.1569671630859375, -0.14656829833984375, -0.13616943359375, -0.12577056884765625, -0.1153717041015625, -0.10497283935546875, -0.094573974609375, -0.08417510986328125, -0.0737762451171875, -0.06337738037109375, -0.052978515625, -0.04257965087890625, -0.0321807861328125, -0.02178192138671875, -0.011383056640625, -0.00098419189453125, 0.0094146728515625, 0.01981353759765625, 0.03021240234375, 0.04061126708984375, 0.0510101318359375, 0.06140899658203125, 0.071807861328125, 0.08220672607421875, 0.0926055908203125, 0.10300445556640625, 0.1134033203125, 0.12380218505859375, 0.1342010498046875, 0.14459991455078125, 0.154998779296875, 0.16539764404296875, 0.1757965087890625, 0.18619537353515625, 0.19659423828125, 0.20699310302734375, 0.2173919677734375, 0.22779083251953125, 0.238189697265625, 0.24858856201171875, 0.2589874267578125, 0.26938629150390625, 0.27978515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 7.0, 7.0, 10.0, 13.0, 13.0, 26.0, 36.0, 60.0, 110.0, 146.0, 154.0, 155.0, 67.0, 39.0, 37.0, 24.0, 19.0, 10.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.636713027954102e-05, -8.399225771427155e-05, -8.161738514900208e-05, -7.92425125837326e-05, -7.686764001846313e-05, -7.449276745319366e-05, -7.21178948879242e-05, -6.974302232265472e-05, -6.736814975738525e-05, -6.499327719211578e-05, -6.261840462684631e-05, -6.024353206157684e-05, -5.786865949630737e-05, -5.54937869310379e-05, -5.311891436576843e-05, -5.074404180049896e-05, -4.836916923522949e-05, -4.599429666996002e-05, -4.361942410469055e-05, -4.124455153942108e-05, -3.886967897415161e-05, -3.649480640888214e-05, -3.411993384361267e-05, -3.17450612783432e-05, -2.937018871307373e-05, -2.699531614780426e-05, -2.462044358253479e-05, -2.224557101726532e-05, -1.987069845199585e-05, -1.749582588672638e-05, -1.512095332145691e-05, -1.2746080756187439e-05, -1.0371208190917969e-05, -7.996335625648499e-06, -5.621463060379028e-06, -3.246590495109558e-06, -8.717179298400879e-07, 1.5031546354293823e-06, 3.8780272006988525e-06, 6.252899765968323e-06, 8.627772331237793e-06, 1.1002644896507263e-05, 1.3377517461776733e-05, 1.5752390027046204e-05, 1.8127262592315674e-05, 2.0502135157585144e-05, 2.2877007722854614e-05, 2.5251880288124084e-05, 2.7626752853393555e-05, 3.0001625418663025e-05, 3.2376497983932495e-05, 3.4751370549201965e-05, 3.7126243114471436e-05, 3.9501115679740906e-05, 4.1875988245010376e-05, 4.4250860810279846e-05, 4.6625733375549316e-05, 4.900060594081879e-05, 5.137547850608826e-05, 5.375035107135773e-05, 5.61252236366272e-05, 5.850009620189667e-05, 6.087496876716614e-05, 6.324984133243561e-05, 6.562471389770508e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 21.0, 26.0, 23.0, 47.0, 67.0, 101.0, 157.0, 264.0, 418.0, 764.0, 1378.0, 2775.0, 6157.0, 16501.0, 63245.0, 809634.0, 108661.0, 22977.0, 7930.0, 3522.0, 1631.0, 885.0, 500.0, 282.0, 162.0, 114.0, 77.0, 62.0, 49.0, 32.0, 21.0, 13.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.19930648803710938, -0.19280242919921875, -0.18629837036132812, -0.1797943115234375, -0.17329025268554688, -0.16678619384765625, -0.16028213500976562, -0.153778076171875, -0.14727401733398438, -0.14076995849609375, -0.13426589965820312, -0.1277618408203125, -0.12125778198242188, -0.11475372314453125, -0.10824966430664062, -0.10174560546875, -0.09524154663085938, -0.08873748779296875, -0.08223342895507812, -0.0757293701171875, -0.06922531127929688, -0.06272125244140625, -0.056217193603515625, -0.049713134765625, -0.043209075927734375, -0.03670501708984375, -0.030200958251953125, -0.0236968994140625, -0.017192840576171875, -0.01068878173828125, -0.004184722900390625, 0.0023193359375, 0.008823394775390625, 0.01532745361328125, 0.021831512451171875, 0.0283355712890625, 0.034839630126953125, 0.04134368896484375, 0.047847747802734375, 0.054351806640625, 0.060855865478515625, 0.06735992431640625, 0.07386398315429688, 0.0803680419921875, 0.08687210083007812, 0.09337615966796875, 0.09988021850585938, 0.10638427734375, 0.11288833618164062, 0.11939239501953125, 0.12589645385742188, 0.1324005126953125, 0.13890457153320312, 0.14540863037109375, 0.15191268920898438, 0.158416748046875, 0.16492080688476562, 0.17142486572265625, 0.17792892456054688, 0.1844329833984375, 0.19093704223632812, 0.19744110107421875, 0.20394515991210938, 0.21044921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 2.0, 5.0, 7.0, 6.0, 14.0, 25.0, 11.0, 18.0, 27.0, 50.0, 76.0, 140.0, 156.0, 141.0, 86.0, 57.0, 40.0, 20.0, 20.0, 16.0, 23.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.339599609375, -0.33008575439453125, -0.3205718994140625, -0.31105804443359375, -0.301544189453125, -0.29203033447265625, -0.2825164794921875, -0.27300262451171875, -0.26348876953125, -0.25397491455078125, -0.2444610595703125, -0.23494720458984375, -0.225433349609375, -0.21591949462890625, -0.2064056396484375, -0.19689178466796875, -0.1873779296875, -0.17786407470703125, -0.1683502197265625, -0.15883636474609375, -0.149322509765625, -0.13980865478515625, -0.1302947998046875, -0.12078094482421875, -0.11126708984375, -0.10175323486328125, -0.0922393798828125, -0.08272552490234375, -0.073211669921875, -0.06369781494140625, -0.0541839599609375, -0.04467010498046875, -0.03515625, -0.02564239501953125, -0.0161285400390625, -0.00661468505859375, 0.002899169921875, 0.01241302490234375, 0.0219268798828125, 0.03144073486328125, 0.04095458984375, 0.05046844482421875, 0.0599822998046875, 0.06949615478515625, 0.079010009765625, 0.08852386474609375, 0.0980377197265625, 0.10755157470703125, 0.1170654296875, 0.12657928466796875, 0.1360931396484375, 0.14560699462890625, 0.155120849609375, 0.16463470458984375, 0.1741485595703125, 0.18366241455078125, 0.19317626953125, 0.20269012451171875, 0.2122039794921875, 0.22171783447265625, 0.231231689453125, 0.24074554443359375, 0.2502593994140625, 0.25977325439453125, 0.269287109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 11.0, 20.0, 23.0, 43.0, 64.0, 129.0, 482.0, 103.0, 50.0, 18.0, 14.0, 8.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.590933799743652, -12.262884140014648, -11.934834480285645, -11.606783866882324, -11.27873420715332, -10.950684547424316, -10.622634887695312, -10.294585227966309, -9.966535568237305, -9.6384859085083, -9.310436248779297, -8.982385635375977, -8.654335975646973, -8.326286315917969, -7.998236656188965, -7.670186996459961, -7.342136383056641, -7.014086723327637, -6.686036586761475, -6.357986927032471, -6.029936790466309, -5.701887130737305, -5.373837471008301, -5.045787811279297, -4.717737674713135, -4.389688014984131, -4.061637878417969, -3.733588218688965, -3.405538320541382, -3.077488422393799, -2.749438762664795, -2.421388864517212, -2.0933399200439453, -1.7652900218963623, -1.4372402429580688, -1.1091904640197754, -0.7811405658721924, -0.4530906677246094, -0.12504088878631592, 0.20300889015197754, 0.5310587882995605, 0.8591086268424988, 1.187158465385437, 1.5152082443237305, 1.8432581424713135, 2.1713080406188965, 2.4993577003479004, 2.8274075984954834, 3.1554574966430664, 3.4835073947906494, 3.8115572929382324, 4.139606952667236, 4.467657089233398, 4.795706748962402, 5.123756408691406, 5.45180606842041, 5.779856204986572, 6.107905864715576, 6.435956001281738, 6.764005661010742, 7.092055320739746, 7.420105457305908, 7.748155117034912, 8.076205253601074, 8.404254913330078]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 12.0, 12.0, 13.0, 16.0, 16.0, 21.0, 15.0, 27.0, 24.0, 24.0, 43.0, 185.0, 256.0, 54.0, 34.0, 19.0, 34.0, 25.0, 21.0, 18.0, 12.0, 13.0, 11.0, 8.0, 10.0, 9.0, 2.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.607936859130859, -7.3912434577941895, -7.1745500564575195, -6.95785665512085, -6.74116325378418, -6.52446985244751, -6.30777645111084, -6.091082572937012, -5.8743896484375, -5.65769624710083, -5.44100284576416, -5.22430944442749, -5.00761604309082, -4.79092264175415, -4.5742292404174805, -4.357535362243652, -4.140841960906982, -3.9241485595703125, -3.7074551582336426, -3.4907617568969727, -3.2740683555603027, -3.057374954223633, -2.840681314468384, -2.623987913131714, -2.407294511795044, -2.190601110458374, -1.973907709121704, -1.7572141885757446, -1.5405207872390747, -1.3238273859024048, -1.1071338653564453, -0.8904404640197754, -0.6737470626831055, -0.45705363154411316, -0.24036020040512085, -0.023666739463806152, 0.19302666187286377, 0.4097200632095337, 0.6264135837554932, 0.8431069850921631, 1.059800386428833, 1.276493787765503, 1.4931871891021729, 1.7098807096481323, 1.9265741109848022, 2.1432676315307617, 2.3599610328674316, 2.5766544342041016, 2.7933478355407715, 3.0100412368774414, 3.2267346382141113, 3.4434280395507812, 3.660121440887451, 3.876814842224121, 4.093508720397949, 4.310201644897461, 4.526895523071289, 4.743588924407959, 4.960282325744629, 5.176975727081299, 5.393669128417969, 5.610362529754639, 5.827055931091309, 6.043749809265137, 6.260442733764648]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 10.0, 6.0, 8.0, 17.0, 19.0, 32.0, 38.0, 42.0, 43.0, 55.0, 139.0, 254.0, 67.0, 46.0, 43.0, 28.0, 24.0, 22.0, 25.0, 17.0, 17.0, 9.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.891357421875, -0.86279296875, -0.834228515625, -0.8056640625, -0.777099609375, -0.74853515625, -0.719970703125, -0.69140625, -0.662841796875, -0.63427734375, -0.605712890625, -0.5771484375, -0.548583984375, -0.52001953125, -0.491455078125, -0.462890625, -0.434326171875, -0.40576171875, -0.377197265625, -0.3486328125, -0.320068359375, -0.29150390625, -0.262939453125, -0.234375, -0.205810546875, -0.17724609375, -0.148681640625, -0.1201171875, -0.091552734375, -0.06298828125, -0.034423828125, -0.005859375, 0.022705078125, 0.05126953125, 0.079833984375, 0.1083984375, 0.136962890625, 0.16552734375, 0.194091796875, 0.22265625, 0.251220703125, 0.27978515625, 0.308349609375, 0.3369140625, 0.365478515625, 0.39404296875, 0.422607421875, 0.451171875, 0.479736328125, 0.50830078125, 0.536865234375, 0.5654296875, 0.593994140625, 0.62255859375, 0.651123046875, 0.6796875, 0.708251953125, 0.73681640625, 0.765380859375, 0.7939453125, 0.822509765625, 0.85107421875, 0.879638671875, 0.908203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 10.0, 11.0, 13.0, 17.0, 22.0, 23.0, 48.0, 98.0, 222.0, 628.0, 2842.0, 32289.0, 8343188.0, 7162.0, 1235.0, 369.0, 147.0, 86.0, 42.0, 33.0, 12.0, 11.0, 14.0, 16.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0], "bins": [-10.011630058288574, -9.680545806884766, -9.34946060180664, -9.018376350402832, -8.687292098999023, -8.356207847595215, -8.025123596191406, -7.694038391113281, -7.362954139709473, -7.031869888305664, -6.700785160064697, -6.3697004318237305, -6.038616180419922, -5.707531929016113, -5.3764472007751465, -5.04536247253418, -4.714278221130371, -4.3831939697265625, -4.052109241485596, -3.721024751663208, -3.3899402618408203, -3.0588557720184326, -2.727771282196045, -2.3966867923736572, -2.0656023025512695, -1.7345178127288818, -1.4034333229064941, -1.0723488330841064, -0.7412643432617188, -0.41017985343933105, -0.07909536361694336, 0.25198912620544434, 0.5830726623535156, 0.9141571521759033, 1.245241641998291, 1.5763261318206787, 1.9074106216430664, 2.238495111465454, 2.569579601287842, 2.9006640911102295, 3.231748580932617, 3.562833070755005, 3.8939175605773926, 4.225002288818359, 4.556086540222168, 4.887170791625977, 5.218255519866943, 5.54934024810791, 5.880424499511719, 6.211508750915527, 6.542593479156494, 6.873678207397461, 7.2047624588012695, 7.535846710205078, 7.866931438446045, 8.198016166687012, 8.52910041809082, 8.860184669494629, 9.191268920898438, 9.522354125976562, 9.853438377380371, 10.18452262878418, 10.515607833862305, 10.846692085266113, 11.177776336669922]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 11.0, 5.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.871780395507812, -14.41817569732666, -13.964570999145508, -13.510966300964355, -13.057361602783203, -12.60375690460205, -12.150152206420898, -11.696547508239746, -11.242942810058594, -10.789338111877441, -10.335733413696289, -9.882128715515137, -9.428524017333984, -8.974919319152832, -8.52131462097168, -8.067709922790527, -7.614105224609375, -7.160500526428223, -6.70689582824707, -6.253291130065918, -5.799686431884766, -5.346081733703613, -4.892477035522461, -4.438872337341309, -3.9852676391601562, -3.531662940979004, -3.0780582427978516, -2.624453544616699, -2.170848846435547, -1.7172441482543945, -1.2636394500732422, -0.8100347518920898, -0.3564291000366211, 0.09717559814453125, 0.5507802963256836, 1.004384994506836, 1.4579896926879883, 1.9115943908691406, 2.365199089050293, 2.8188037872314453, 3.2724084854125977, 3.72601318359375, 4.179617881774902, 4.633222579956055, 5.086827278137207, 5.540431976318359, 5.994036674499512, 6.447641372680664, 6.901246070861816, 7.354850769042969, 7.808455467224121, 8.262060165405273, 8.715664863586426, 9.169269561767578, 9.62287425994873, 10.076478958129883, 10.530083656311035, 10.983688354492188, 11.43729305267334, 11.890897750854492, 12.344502449035645, 12.798107147216797, 13.25171184539795, 13.705316543579102, 14.158921241760254]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 18.0, 16.0, 21.0, 34.0, 54.0, 71.0, 75.0, 121.0, 153.0, 232.0, 387.0, 679.0, 1330.0, 3075.0, 8772.0, 26407.0, 85508.0, 208518.0, 127887.0, 40188.0, 12588.0, 4308.0, 1657.0, 759.0, 383.0, 265.0, 188.0, 132.0, 101.0, 65.0, 52.0, 40.0, 35.0, 34.0, 26.0, 19.0, 9.0, 13.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.4296875, -6.2200927734375, -6.010498046875, -5.8009033203125, -5.59130859375, -5.3817138671875, -5.172119140625, -4.9625244140625, -4.7529296875, -4.5433349609375, -4.333740234375, -4.1241455078125, -3.91455078125, -3.7049560546875, -3.495361328125, -3.2857666015625, -3.076171875, -2.8665771484375, -2.656982421875, -2.4473876953125, -2.23779296875, -2.0281982421875, -1.818603515625, -1.6090087890625, -1.3994140625, -1.1898193359375, -0.980224609375, -0.7706298828125, -0.56103515625, -0.3514404296875, -0.141845703125, 0.0677490234375, 0.27734375, 0.4869384765625, 0.696533203125, 0.9061279296875, 1.11572265625, 1.3253173828125, 1.534912109375, 1.7445068359375, 1.9541015625, 2.1636962890625, 2.373291015625, 2.5828857421875, 2.79248046875, 3.0020751953125, 3.211669921875, 3.4212646484375, 3.630859375, 3.8404541015625, 4.050048828125, 4.2596435546875, 4.46923828125, 4.6788330078125, 4.888427734375, 5.0980224609375, 5.3076171875, 5.5172119140625, 5.726806640625, 5.9364013671875, 6.14599609375, 6.3555908203125, 6.565185546875, 6.7747802734375, 6.984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 14.0, 18.0, 20.0, 28.0, 45.0, 43.0, 64.0, 92.0, 98.0, 105.0, 87.0, 93.0, 60.0, 53.0, 74.0, 30.0, 15.0, 25.0, 7.0, 12.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8467559814453125, -0.807769775390625, -0.7687835693359375, -0.72979736328125, -0.6908111572265625, -0.651824951171875, -0.6128387451171875, -0.5738525390625, -0.5348663330078125, -0.495880126953125, -0.4568939208984375, -0.41790771484375, -0.3789215087890625, -0.339935302734375, -0.3009490966796875, -0.261962890625, -0.2229766845703125, -0.183990478515625, -0.1450042724609375, -0.10601806640625, -0.0670318603515625, -0.028045654296875, 0.0109405517578125, 0.0499267578125, 0.0889129638671875, 0.127899169921875, 0.1668853759765625, 0.20587158203125, 0.2448577880859375, 0.283843994140625, 0.3228302001953125, 0.36181640625, 0.4008026123046875, 0.439788818359375, 0.4787750244140625, 0.51776123046875, 0.5567474365234375, 0.595733642578125, 0.6347198486328125, 0.6737060546875, 0.7126922607421875, 0.751678466796875, 0.7906646728515625, 0.82965087890625, 0.8686370849609375, 0.907623291015625, 0.9466094970703125, 0.985595703125, 1.0245819091796875, 1.063568115234375, 1.1025543212890625, 1.14154052734375, 1.1805267333984375, 1.219512939453125, 1.2584991455078125, 1.2974853515625, 1.3364715576171875, 1.375457763671875, 1.4144439697265625, 1.45343017578125, 1.4924163818359375, 1.531402587890625, 1.5703887939453125, 1.609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 12.0, 8.0, 24.0, 35.0, 54.0, 77.0, 71.0, 68.0, 59.0, 34.0, 13.0, 15.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21453857421875, -7.9825663566589355, -7.750594139099121, -7.518621921539307, -7.286649703979492, -7.054677486419678, -6.822705268859863, -6.590733051300049, -6.358760833740234, -6.12678861618042, -5.8948163986206055, -5.662844181060791, -5.430871963500977, -5.198899745941162, -4.966927528381348, -4.734955310821533, -4.502983093261719, -4.271010875701904, -4.03903865814209, -3.8070664405822754, -3.575094223022461, -3.3431220054626465, -3.111149787902832, -2.8791775703430176, -2.647205352783203, -2.4152331352233887, -2.183260917663574, -1.9512887001037598, -1.7193164825439453, -1.4873442649841309, -1.2553720474243164, -1.023399829864502, -0.7914276123046875, -0.559455394744873, -0.3274831771850586, -0.09551095962524414, 0.1364612579345703, 0.36843347549438477, 0.6004056930541992, 0.8323779106140137, 1.0643501281738281, 1.2963223457336426, 1.528294563293457, 1.7602667808532715, 1.992238998413086, 2.2242112159729004, 2.456183433532715, 2.6881556510925293, 2.9201278686523438, 3.152100086212158, 3.3840723037719727, 3.616044521331787, 3.8480167388916016, 4.079988956451416, 4.3119611740112305, 4.543933391571045, 4.775905609130859, 5.007877826690674, 5.239850044250488, 5.471822261810303, 5.703794479370117, 5.935766696929932, 6.167738914489746, 6.3997111320495605, 6.631683349609375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 5.0, 9.0, 23.0, 58.0, 135.0, 120.0, 51.0, 18.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.148806095123291, -5.946475028991699, -5.744144439697266, -5.541813373565674, -5.339482307434082, -5.137151718139648, -4.934820652008057, -4.732489585876465, -4.530158996582031, -4.3278279304504395, -4.125497341156006, -3.923166275024414, -3.7208352088928223, -3.5185043811798096, -3.316173553466797, -3.113842487335205, -2.9115114212036133, -2.7091805934906006, -2.506849527359009, -2.304518699645996, -2.1021876335144043, -1.8998568058013916, -1.697525978088379, -1.4951950311660767, -1.2928640842437744, -1.0905331373214722, -0.8882022500038147, -0.6858713626861572, -0.483540415763855, -0.28120946884155273, -0.07887864112854004, 0.12345230579376221, 0.32578277587890625, 0.5281137228012085, 0.730444610118866, 0.9327754974365234, 1.1351064443588257, 1.337437391281128, 1.5397682189941406, 1.7420991659164429, 1.9444301128387451, 2.146760940551758, 2.3490920066833496, 2.5514228343963623, 2.753753662109375, 2.956084728240967, 3.1584155559539795, 3.360746383666992, 3.563077449798584, 3.7654082775115967, 3.9677393436431885, 4.170070171356201, 4.372401237487793, 4.574731826782227, 4.777062892913818, 4.97939395904541, 5.181724548339844, 5.3840556144714355, 5.586386203765869, 5.788717269897461, 5.991048336029053, 6.1933794021606445, 6.395709991455078, 6.59804105758667, 6.800372123718262]}, "eval/loss": 5.364102363586426, "eval/wer": 1.4310574042105682, "eval/runtime": 1110.1846, "eval/samples_per_second": 2.38, "eval/steps_per_second": 0.298, "train/train_runtime": 28486.3453, "train/train_samples_per_second": 5.009, "train/train_steps_per_second": 0.157, "train/total_flos": 0.0, "train/train_loss": 6.089906092074955} \ No newline at end of file