diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.856, "train/learning_rate": 0.0001684185630143819, "train/epoch": 1.54, "train/global_step": 5000, "_runtime": 47341, "_timestamp": 1651721430, "_step": 5009, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 54.0, 967.0], "bins": [-162.1786346435547, -159.61509704589844, -157.0515594482422, -154.48802185058594, -151.9244842529297, -149.36093139648438, -146.79739379882812, -144.23385620117188, -141.67031860351562, -139.10678100585938, -136.54324340820312, -133.97970581054688, -131.41616821289062, -128.85263061523438, -126.2890853881836, -123.72554779052734, -121.1620101928711, -118.59847259521484, -116.0349349975586, -113.47138977050781, -110.90785217285156, -108.34431457519531, -105.78077697753906, -103.21723937988281, -100.65370178222656, -98.09016418457031, -95.52662658691406, -92.96308135986328, -90.39954376220703, -87.83600616455078, -85.27246856689453, -82.70893096923828, -80.1453857421875, -77.58184814453125, -75.018310546875, -72.45476531982422, -69.89122772216797, -67.32769012451172, -64.76415252685547, -62.20061492919922, -59.63706970214844, -57.07353210449219, -54.50999069213867, -51.94645309448242, -49.382911682128906, -46.819374084472656, -44.255836486816406, -41.692298889160156, -39.12875747680664, -36.56521987915039, -34.001678466796875, -31.438140869140625, -28.874601364135742, -26.31106185913086, -23.74752426147461, -21.183984756469727, -18.620445251464844, -16.05690574645996, -13.493367195129395, -10.929828643798828, -8.366289138793945, -5.8027496337890625, -3.239211082458496, -0.6756725311279297, 1.8878662586212158]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 10.0, 15.0, 17.0, 24.0, 23.0, 31.0, 26.0, 38.0, 42.0, 49.0, 52.0, 51.0, 47.0, 56.0, 62.0, 56.0, 55.0, 49.0, 42.0, 33.0, 41.0, 33.0, 26.0, 16.0, 18.0, 14.0, 10.0, 15.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.286391735076904, -7.084299564361572, -6.882206916809082, -6.68011474609375, -6.478022575378418, -6.275930404663086, -6.073838233947754, -5.871745586395264, -5.669653415679932, -5.4675612449646, -5.265468597412109, -5.063376426696777, -4.861284255981445, -4.659192085266113, -4.457099914550781, -4.255007266998291, -4.052915096282959, -3.850822925567627, -3.648730516433716, -3.4466381072998047, -3.2445459365844727, -3.0424537658691406, -2.8403613567352295, -2.6382689476013184, -2.4361767768859863, -2.2340846061706543, -2.031992197036743, -1.8298999071121216, -1.6278076171875, -1.4257153272628784, -1.2236230373382568, -1.0215307474136353, -0.8194384574890137, -0.6173461675643921, -0.4152538776397705, -0.21316158771514893, -0.011069297790527344, 0.19102299213409424, 0.3931152820587158, 0.5952075719833374, 0.797299861907959, 0.9993921518325806, 1.2014844417572021, 1.4035767316818237, 1.6056690216064453, 1.807761311531067, 2.0098536014556885, 2.2119460105895996, 2.4140381813049316, 2.6161303520202637, 2.818222761154175, 3.020315170288086, 3.222407341003418, 3.42449951171875, 3.626591920852661, 3.8286843299865723, 4.030776500701904, 4.232868671417236, 4.434961318969727, 4.637053489685059, 4.839145660400391, 5.041237831115723, 5.243330001831055, 5.445422649383545, 5.647514820098877]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 6.0, 7.0, 1.0, 13.0, 13.0, 16.0, 24.0, 33.0, 62.0, 61.0, 87.0, 147.0, 226.0, 350.0, 617.0, 993.0, 1666.0, 2917.0, 5495.0, 9986.0, 19120.0, 35183.0, 67868.0, 150003.0, 661350.0, 2750105.0, 279358.0, 100349.0, 49927.0, 26718.0, 14123.0, 7512.0, 4171.0, 2273.0, 1352.0, 781.0, 473.0, 293.0, 192.0, 122.0, 95.0, 57.0, 39.0, 31.0, 27.0, 20.0, 8.0, 8.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.3935546875, -2.314453125, -2.2353515625, -2.15625, -2.0771484375, -1.998046875, -1.9189453125, -1.83984375, -1.7607421875, -1.681640625, -1.6025390625, -1.5234375, -1.4443359375, -1.365234375, -1.2861328125, -1.20703125, -1.1279296875, -1.048828125, -0.9697265625, -0.890625, -0.8115234375, -0.732421875, -0.6533203125, -0.57421875, -0.4951171875, -0.416015625, -0.3369140625, -0.2578125, -0.1787109375, -0.099609375, -0.0205078125, 0.05859375, 0.1376953125, 0.216796875, 0.2958984375, 0.375, 0.4541015625, 0.533203125, 0.6123046875, 0.69140625, 0.7705078125, 0.849609375, 0.9287109375, 1.0078125, 1.0869140625, 1.166015625, 1.2451171875, 1.32421875, 1.4033203125, 1.482421875, 1.5615234375, 1.640625, 1.7197265625, 1.798828125, 1.8779296875, 1.95703125, 2.0361328125, 2.115234375, 2.1943359375, 2.2734375, 2.3525390625, 2.431640625, 2.5107421875, 2.58984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 10.0, 12.0, 13.0, 12.0, 24.0, 30.0, 28.0, 30.0, 42.0, 30.0, 41.0, 44.0, 47.0, 54.0, 46.0, 44.0, 47.0, 49.0, 58.0, 44.0, 40.0, 42.0, 26.0, 30.0, 18.0, 18.0, 20.0, 11.0, 12.0, 11.0, 7.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-5.74609375, -5.5877685546875, -5.429443359375, -5.2711181640625, -5.11279296875, -4.9544677734375, -4.796142578125, -4.6378173828125, -4.4794921875, -4.3211669921875, -4.162841796875, -4.0045166015625, -3.84619140625, -3.6878662109375, -3.529541015625, -3.3712158203125, -3.212890625, -3.0545654296875, -2.896240234375, -2.7379150390625, -2.57958984375, -2.4212646484375, -2.262939453125, -2.1046142578125, -1.9462890625, -1.7879638671875, -1.629638671875, -1.4713134765625, -1.31298828125, -1.1546630859375, -0.996337890625, -0.8380126953125, -0.6796875, -0.5213623046875, -0.363037109375, -0.2047119140625, -0.04638671875, 0.1119384765625, 0.270263671875, 0.4285888671875, 0.5869140625, 0.7452392578125, 0.903564453125, 1.0618896484375, 1.22021484375, 1.3785400390625, 1.536865234375, 1.6951904296875, 1.853515625, 2.0118408203125, 2.170166015625, 2.3284912109375, 2.48681640625, 2.6451416015625, 2.803466796875, 2.9617919921875, 3.1201171875, 3.2784423828125, 3.436767578125, 3.5950927734375, 3.75341796875, 3.9117431640625, 4.070068359375, 4.2283935546875, 4.38671875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 9.0, 7.0, 3.0, 16.0, 14.0, 22.0, 22.0, 48.0, 59.0, 112.0, 333.0, 4189877.0, 3321.0, 215.0, 86.0, 39.0, 37.0, 20.0, 8.0, 12.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.375, -156.73828125, -152.1015625, -147.46484375, -142.828125, -138.19140625, -133.5546875, -128.91796875, -124.28125, -119.64453125, -115.0078125, -110.37109375, -105.734375, -101.09765625, -96.4609375, -91.82421875, -87.1875, -82.55078125, -77.9140625, -73.27734375, -68.640625, -64.00390625, -59.3671875, -54.73046875, -50.09375, -45.45703125, -40.8203125, -36.18359375, -31.546875, -26.91015625, -22.2734375, -17.63671875, -13.0, -8.36328125, -3.7265625, 0.91015625, 5.546875, 10.18359375, 14.8203125, 19.45703125, 24.09375, 28.73046875, 33.3671875, 38.00390625, 42.640625, 47.27734375, 51.9140625, 56.55078125, 61.1875, 65.82421875, 70.4609375, 75.09765625, 79.734375, 84.37109375, 89.0078125, 93.64453125, 98.28125, 102.91796875, 107.5546875, 112.19140625, 116.828125, 121.46484375, 126.1015625, 130.73828125, 135.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 6.0, 6.0, 9.0, 15.0, 26.0, 24.0, 38.0, 57.0, 89.0, 149.0, 975.0, 2182.0, 225.0, 101.0, 51.0, 44.0, 17.0, 16.0, 8.0, 6.0, 4.0, 8.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.973297119140625, -2.88604736328125, -2.798797607421875, -2.7115478515625, -2.624298095703125, -2.53704833984375, -2.449798583984375, -2.362548828125, -2.275299072265625, -2.18804931640625, -2.100799560546875, -2.0135498046875, -1.926300048828125, -1.83905029296875, -1.751800537109375, -1.66455078125, -1.577301025390625, -1.49005126953125, -1.402801513671875, -1.3155517578125, -1.228302001953125, -1.14105224609375, -1.053802490234375, -0.966552734375, -0.879302978515625, -0.79205322265625, -0.704803466796875, -0.6175537109375, -0.530303955078125, -0.44305419921875, -0.355804443359375, -0.2685546875, -0.181304931640625, -0.09405517578125, -0.006805419921875, 0.0804443359375, 0.167694091796875, 0.25494384765625, 0.342193603515625, 0.429443359375, 0.516693115234375, 0.60394287109375, 0.691192626953125, 0.7784423828125, 0.865692138671875, 0.95294189453125, 1.040191650390625, 1.12744140625, 1.214691162109375, 1.30194091796875, 1.389190673828125, 1.4764404296875, 1.563690185546875, 1.65093994140625, 1.738189697265625, 1.825439453125, 1.912689208984375, 1.99993896484375, 2.087188720703125, 2.1744384765625, 2.261688232421875, 2.34893798828125, 2.436187744140625, 2.5234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 5.0, 4.0, 9.0, 11.0, 13.0, 20.0, 53.0, 73.0, 78.0, 113.0, 131.0, 141.0, 103.0, 78.0, 59.0, 37.0, 24.0, 16.0, 9.0, 8.0, 8.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.38481330871582, -9.143033981323242, -8.901254653930664, -8.659476280212402, -8.417696952819824, -8.175917625427246, -7.934138774871826, -7.692359924316406, -7.450580596923828, -7.20880126953125, -6.96702241897583, -6.72524356842041, -6.483464241027832, -6.241684913635254, -5.999906063079834, -5.758127212524414, -5.516347885131836, -5.274568557739258, -5.032789707183838, -4.791010856628418, -4.54923152923584, -4.307452201843262, -4.065673351287842, -3.8238942623138428, -3.5821151733398438, -3.3403360843658447, -3.0985569953918457, -2.8567779064178467, -2.6149988174438477, -2.3732197284698486, -2.1314406394958496, -1.8896615505218506, -1.6478829383850098, -1.4061038494110107, -1.1643247604370117, -0.9225456714630127, -0.6807665824890137, -0.43898749351501465, -0.19720840454101562, 0.0445706844329834, 0.2863497734069824, 0.5281288623809814, 0.7699079513549805, 1.0116870403289795, 1.2534661293029785, 1.4952452182769775, 1.7370243072509766, 1.9788033962249756, 2.2205824851989746, 2.4623615741729736, 2.7041406631469727, 2.9459197521209717, 3.1876988410949707, 3.4294779300689697, 3.6712570190429688, 3.9130361080169678, 4.154815196990967, 4.396594047546387, 4.638373374938965, 4.880152702331543, 5.121931552886963, 5.363710403442383, 5.605489730834961, 5.847269058227539, 6.089047908782959]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 6.0, 0.0, 5.0, 5.0, 10.0, 18.0, 11.0, 13.0, 15.0, 17.0, 14.0, 19.0, 34.0, 29.0, 27.0, 29.0, 39.0, 46.0, 48.0, 35.0, 48.0, 41.0, 46.0, 59.0, 32.0, 42.0, 40.0, 25.0, 29.0, 23.0, 25.0, 27.0, 23.0, 25.0, 8.0, 21.0, 15.0, 13.0, 5.0, 4.0, 7.0, 6.0, 2.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.468169212341309, -4.336191177368164, -4.2042131423950195, -4.072235584259033, -3.9402575492858887, -3.808279514312744, -3.6763017177581787, -3.5443239212036133, -3.4123458862304688, -3.280367851257324, -3.148390054702759, -3.0164122581481934, -2.884434223175049, -2.7524561882019043, -2.620478391647339, -2.4885005950927734, -2.356522560119629, -2.2245445251464844, -2.092566728591919, -1.960588812828064, -1.828610897064209, -1.696632981300354, -1.564655065536499, -1.432677149772644, -1.300699234008789, -1.168721318244934, -1.036743402481079, -0.9047654867172241, -0.7727875709533691, -0.6408096551895142, -0.5088317394256592, -0.3768538236618042, -0.24487590789794922, -0.11289799213409424, 0.019079923629760742, 0.15105783939361572, 0.2830357551574707, 0.4150136709213257, 0.5469915866851807, 0.6789695024490356, 0.8109474182128906, 0.9429253339767456, 1.0749032497406006, 1.2068811655044556, 1.3388590812683105, 1.4708369970321655, 1.6028149127960205, 1.7347928285598755, 1.8667707443237305, 1.9987486600875854, 2.1307265758514404, 2.262704372406006, 2.3946824073791504, 2.526660442352295, 2.6586382389068604, 2.790616035461426, 2.9225940704345703, 3.054572105407715, 3.1865499019622803, 3.3185276985168457, 3.4505057334899902, 3.5824837684631348, 3.7144615650177, 3.8464393615722656, 3.97841739654541]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 14.0, 28.0, 30.0, 60.0, 85.0, 133.0, 241.0, 403.0, 866.0, 2433.0, 8934.0, 44627.0, 333967.0, 557354.0, 79466.0, 14204.0, 3426.0, 1113.0, 483.0, 247.0, 156.0, 88.0, 58.0, 46.0, 22.0, 22.0, 11.0, 9.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2353515625, -1.196929931640625, -1.15850830078125, -1.120086669921875, -1.0816650390625, -1.043243408203125, -1.00482177734375, -0.966400146484375, -0.927978515625, -0.889556884765625, -0.85113525390625, -0.812713623046875, -0.7742919921875, -0.735870361328125, -0.69744873046875, -0.659027099609375, -0.62060546875, -0.582183837890625, -0.54376220703125, -0.505340576171875, -0.4669189453125, -0.428497314453125, -0.39007568359375, -0.351654052734375, -0.313232421875, -0.274810791015625, -0.23638916015625, -0.197967529296875, -0.1595458984375, -0.121124267578125, -0.08270263671875, -0.044281005859375, -0.005859375, 0.032562255859375, 0.07098388671875, 0.109405517578125, 0.1478271484375, 0.186248779296875, 0.22467041015625, 0.263092041015625, 0.301513671875, 0.339935302734375, 0.37835693359375, 0.416778564453125, 0.4552001953125, 0.493621826171875, 0.53204345703125, 0.570465087890625, 0.60888671875, 0.647308349609375, 0.68572998046875, 0.724151611328125, 0.7625732421875, 0.800994873046875, 0.83941650390625, 0.877838134765625, 0.916259765625, 0.954681396484375, 0.99310302734375, 1.031524658203125, 1.0699462890625, 1.108367919921875, 1.14678955078125, 1.185211181640625, 1.2236328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 7.0, 9.0, 17.0, 21.0, 14.0, 30.0, 35.0, 33.0, 49.0, 56.0, 46.0, 67.0, 65.0, 64.0, 69.0, 62.0, 59.0, 61.0, 38.0, 39.0, 35.0, 23.0, 23.0, 15.0, 19.0, 9.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-6.32421875, -6.174896240234375, -6.02557373046875, -5.876251220703125, -5.7269287109375, -5.577606201171875, -5.42828369140625, -5.278961181640625, -5.129638671875, -4.980316162109375, -4.83099365234375, -4.681671142578125, -4.5323486328125, -4.383026123046875, -4.23370361328125, -4.084381103515625, -3.93505859375, -3.785736083984375, -3.63641357421875, -3.487091064453125, -3.3377685546875, -3.188446044921875, -3.03912353515625, -2.889801025390625, -2.740478515625, -2.591156005859375, -2.44183349609375, -2.292510986328125, -2.1431884765625, -1.993865966796875, -1.84454345703125, -1.695220947265625, -1.5458984375, -1.396575927734375, -1.24725341796875, -1.097930908203125, -0.9486083984375, -0.799285888671875, -0.64996337890625, -0.500640869140625, -0.351318359375, -0.201995849609375, -0.05267333984375, 0.096649169921875, 0.2459716796875, 0.395294189453125, 0.54461669921875, 0.693939208984375, 0.84326171875, 0.992584228515625, 1.14190673828125, 1.291229248046875, 1.4405517578125, 1.589874267578125, 1.73919677734375, 1.888519287109375, 2.037841796875, 2.187164306640625, 2.33648681640625, 2.485809326171875, 2.6351318359375, 2.784454345703125, 2.93377685546875, 3.083099365234375, 3.232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 7.0, 18.0, 14.0, 26.0, 23.0, 17.0, 40.0, 34.0, 46.0, 60.0, 73.0, 73.0, 99.0, 117.0, 133.0, 205.0, 280.0, 408.0, 725.0, 2492.0, 15484.0, 172384.0, 731503.0, 109169.0, 10803.0, 1941.0, 676.0, 339.0, 300.0, 218.0, 143.0, 114.0, 113.0, 93.0, 79.0, 67.0, 51.0, 36.0, 33.0, 19.0, 27.0, 14.0, 13.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.77685546875, -0.7521209716796875, -0.727386474609375, -0.7026519775390625, -0.67791748046875, -0.6531829833984375, -0.628448486328125, -0.6037139892578125, -0.5789794921875, -0.5542449951171875, -0.529510498046875, -0.5047760009765625, -0.48004150390625, -0.4553070068359375, -0.430572509765625, -0.4058380126953125, -0.381103515625, -0.3563690185546875, -0.331634521484375, -0.3069000244140625, -0.28216552734375, -0.2574310302734375, -0.232696533203125, -0.2079620361328125, -0.1832275390625, -0.1584930419921875, -0.133758544921875, -0.1090240478515625, -0.08428955078125, -0.0595550537109375, -0.034820556640625, -0.0100860595703125, 0.0146484375, 0.0393829345703125, 0.064117431640625, 0.0888519287109375, 0.11358642578125, 0.1383209228515625, 0.163055419921875, 0.1877899169921875, 0.2125244140625, 0.2372589111328125, 0.261993408203125, 0.2867279052734375, 0.31146240234375, 0.3361968994140625, 0.360931396484375, 0.3856658935546875, 0.410400390625, 0.4351348876953125, 0.459869384765625, 0.4846038818359375, 0.50933837890625, 0.5340728759765625, 0.558807373046875, 0.5835418701171875, 0.6082763671875, 0.6330108642578125, 0.657745361328125, 0.6824798583984375, 0.70721435546875, 0.7319488525390625, 0.756683349609375, 0.7814178466796875, 0.80615234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 12.0, 8.0, 16.0, 17.0, 13.0, 20.0, 28.0, 30.0, 23.0, 36.0, 32.0, 46.0, 54.0, 44.0, 50.0, 50.0, 41.0, 61.0, 40.0, 43.0, 49.0, 46.0, 43.0, 24.0, 17.0, 19.0, 15.0, 23.0, 20.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.320068359375, -6.09716796875, -5.874267578125, -5.6513671875, -5.428466796875, -5.20556640625, -4.982666015625, -4.759765625, -4.536865234375, -4.31396484375, -4.091064453125, -3.8681640625, -3.645263671875, -3.42236328125, -3.199462890625, -2.9765625, -2.753662109375, -2.53076171875, -2.307861328125, -2.0849609375, -1.862060546875, -1.63916015625, -1.416259765625, -1.193359375, -0.970458984375, -0.74755859375, -0.524658203125, -0.3017578125, -0.078857421875, 0.14404296875, 0.366943359375, 0.58984375, 0.812744140625, 1.03564453125, 1.258544921875, 1.4814453125, 1.704345703125, 1.92724609375, 2.150146484375, 2.373046875, 2.595947265625, 2.81884765625, 3.041748046875, 3.2646484375, 3.487548828125, 3.71044921875, 3.933349609375, 4.15625, 4.379150390625, 4.60205078125, 4.824951171875, 5.0478515625, 5.270751953125, 5.49365234375, 5.716552734375, 5.939453125, 6.162353515625, 6.38525390625, 6.608154296875, 6.8310546875, 7.053955078125, 7.27685546875, 7.499755859375, 7.72265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 9.0, 13.0, 24.0, 30.0, 39.0, 74.0, 140.0, 349.0, 1437.0, 136529.0, 907201.0, 1910.0, 408.0, 144.0, 75.0, 51.0, 45.0, 12.0, 19.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39111328125, -0.3776664733886719, -0.36421966552734375, -0.3507728576660156, -0.3373260498046875, -0.3238792419433594, -0.31043243408203125, -0.2969856262207031, -0.283538818359375, -0.2700920104980469, -0.25664520263671875, -0.24319839477539062, -0.2297515869140625, -0.21630477905273438, -0.20285797119140625, -0.18941116333007812, -0.17596435546875, -0.16251754760742188, -0.14907073974609375, -0.13562393188476562, -0.1221771240234375, -0.10873031616210938, -0.09528350830078125, -0.08183670043945312, -0.068389892578125, -0.054943084716796875, -0.04149627685546875, -0.028049468994140625, -0.0146026611328125, -0.001155853271484375, 0.01229095458984375, 0.025737762451171875, 0.0391845703125, 0.052631378173828125, 0.06607818603515625, 0.07952499389648438, 0.0929718017578125, 0.10641860961914062, 0.11986541748046875, 0.13331222534179688, 0.146759033203125, 0.16020584106445312, 0.17365264892578125, 0.18709945678710938, 0.2005462646484375, 0.21399307250976562, 0.22743988037109375, 0.24088668823242188, 0.25433349609375, 0.2677803039550781, 0.28122711181640625, 0.2946739196777344, 0.3081207275390625, 0.3215675354003906, 0.33501434326171875, 0.3484611511230469, 0.361907958984375, 0.3753547668457031, 0.38880157470703125, 0.4022483825683594, 0.4156951904296875, 0.4291419982910156, 0.44258880615234375, 0.4560356140136719, 0.469482421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 14.0, 10.0, 26.0, 35.0, 37.0, 55.0, 50.0, 82.0, 98.0, 98.0, 108.0, 85.0, 84.0, 38.0, 44.0, 40.0, 32.0, 13.0, 7.0, 11.0, 3.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.857778549194336e-05, -4.6426430344581604e-05, -4.427507519721985e-05, -4.212372004985809e-05, -3.997236490249634e-05, -3.782100975513458e-05, -3.566965460777283e-05, -3.351829946041107e-05, -3.1366944313049316e-05, -2.921558916568756e-05, -2.7064234018325806e-05, -2.491287887096405e-05, -2.2761523723602295e-05, -2.061016857624054e-05, -1.8458813428878784e-05, -1.630745828151703e-05, -1.4156103134155273e-05, -1.2004747986793518e-05, -9.853392839431763e-06, -7.702037692070007e-06, -5.550682544708252e-06, -3.3993273973464966e-06, -1.2479722499847412e-06, 9.033828973770142e-07, 3.0547380447387695e-06, 5.206093192100525e-06, 7.35744833946228e-06, 9.508803486824036e-06, 1.1660158634185791e-05, 1.3811513781547546e-05, 1.5962868928909302e-05, 1.8114224076271057e-05, 2.0265579223632812e-05, 2.2416934370994568e-05, 2.4568289518356323e-05, 2.671964466571808e-05, 2.8870999813079834e-05, 3.102235496044159e-05, 3.3173710107803345e-05, 3.53250652551651e-05, 3.7476420402526855e-05, 3.962777554988861e-05, 4.1779130697250366e-05, 4.393048584461212e-05, 4.608184099197388e-05, 4.823319613933563e-05, 5.038455128669739e-05, 5.253590643405914e-05, 5.46872615814209e-05, 5.6838616728782654e-05, 5.898997187614441e-05, 6.114132702350616e-05, 6.329268217086792e-05, 6.544403731822968e-05, 6.759539246559143e-05, 6.974674761295319e-05, 7.189810276031494e-05, 7.40494579076767e-05, 7.620081305503845e-05, 7.835216820240021e-05, 8.050352334976196e-05, 8.265487849712372e-05, 8.480623364448547e-05, 8.695758879184723e-05, 8.910894393920898e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 10.0, 27.0, 30.0, 57.0, 109.0, 427.0, 10678.0, 1033168.0, 3550.0, 257.0, 83.0, 38.0, 34.0, 15.0, 5.0, 6.0, 7.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2236328125, -1.19000244140625, -1.1563720703125, -1.12274169921875, -1.089111328125, -1.05548095703125, -1.0218505859375, -0.98822021484375, -0.95458984375, -0.92095947265625, -0.8873291015625, -0.85369873046875, -0.820068359375, -0.78643798828125, -0.7528076171875, -0.71917724609375, -0.685546875, -0.65191650390625, -0.6182861328125, -0.58465576171875, -0.551025390625, -0.51739501953125, -0.4837646484375, -0.45013427734375, -0.41650390625, -0.38287353515625, -0.3492431640625, -0.31561279296875, -0.281982421875, -0.24835205078125, -0.2147216796875, -0.18109130859375, -0.1474609375, -0.11383056640625, -0.0802001953125, -0.04656982421875, -0.012939453125, 0.02069091796875, 0.0543212890625, 0.08795166015625, 0.12158203125, 0.15521240234375, 0.1888427734375, 0.22247314453125, 0.256103515625, 0.28973388671875, 0.3233642578125, 0.35699462890625, 0.390625, 0.42425537109375, 0.4578857421875, 0.49151611328125, 0.525146484375, 0.55877685546875, 0.5924072265625, 0.62603759765625, 0.65966796875, 0.69329833984375, 0.7269287109375, 0.76055908203125, 0.794189453125, 0.82781982421875, 0.8614501953125, 0.89508056640625, 0.9287109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 10.0, 15.0, 29.0, 39.0, 66.0, 111.0, 125.0, 231.0, 120.0, 74.0, 56.0, 31.0, 17.0, 12.0, 6.0, 8.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07989501953125, -0.0776987075805664, -0.07550239562988281, -0.07330608367919922, -0.07110977172851562, -0.06891345977783203, -0.06671714782714844, -0.06452083587646484, -0.06232452392578125, -0.060128211975097656, -0.05793190002441406, -0.05573558807373047, -0.053539276123046875, -0.05134296417236328, -0.04914665222167969, -0.046950340270996094, -0.0447540283203125, -0.042557716369628906, -0.04036140441894531, -0.03816509246826172, -0.035968780517578125, -0.03377246856689453, -0.03157615661621094, -0.029379844665527344, -0.02718353271484375, -0.024987220764160156, -0.022790908813476562, -0.02059459686279297, -0.018398284912109375, -0.01620197296142578, -0.014005661010742188, -0.011809349060058594, -0.009613037109375, -0.007416725158691406, -0.0052204132080078125, -0.0030241012573242188, -0.000827789306640625, 0.0013685226440429688, 0.0035648345947265625, 0.005761146545410156, 0.00795745849609375, 0.010153770446777344, 0.012350082397460938, 0.014546394348144531, 0.016742706298828125, 0.01893901824951172, 0.021135330200195312, 0.023331642150878906, 0.0255279541015625, 0.027724266052246094, 0.029920578002929688, 0.03211688995361328, 0.034313201904296875, 0.03650951385498047, 0.03870582580566406, 0.040902137756347656, 0.04309844970703125, 0.045294761657714844, 0.04749107360839844, 0.04968738555908203, 0.051883697509765625, 0.05408000946044922, 0.05627632141113281, 0.058472633361816406, 0.0606689453125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 10.0, 22.0, 60.0, 125.0, 197.0, 220.0, 158.0, 102.0, 47.0, 15.0, 8.0, 8.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.618609428405762, -11.289319038391113, -10.960028648376465, -10.630738258361816, -10.301447868347168, -9.97215747833252, -9.642867088317871, -9.313577651977539, -8.98428726196289, -8.654996871948242, -8.325706481933594, -7.996416091918945, -7.667125701904297, -7.337835311889648, -7.008545398712158, -6.67925500869751, -6.349964141845703, -6.020673751831055, -5.691383361816406, -5.362092971801758, -5.032802581787109, -4.703512191772461, -4.374222278594971, -4.044931888580322, -3.715641498565674, -3.3863511085510254, -3.057060718536377, -2.7277705669403076, -2.398480176925659, -2.0691897869110107, -1.7398995161056519, -1.410609245300293, -1.0813179016113281, -0.7520275712013245, -0.4227372407913208, -0.09344691038131714, 0.23584342002868652, 0.565133810043335, 0.8944240808486938, 1.2237143516540527, 1.5530047416687012, 1.8822951316833496, 2.211585521697998, 2.5408756732940674, 2.870166063308716, 3.1994564533233643, 3.5287466049194336, 3.858036994934082, 4.1873273849487305, 4.516617774963379, 4.845908164978027, 5.175198554992676, 5.504488945007324, 5.833779335021973, 6.163069248199463, 6.492359638214111, 6.82165002822876, 7.150940418243408, 7.480230808258057, 7.809521198272705, 8.138811111450195, 8.468101501464844, 8.797391891479492, 9.12668228149414, 9.455972671508789]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 19.0, 17.0, 19.0, 25.0, 33.0, 37.0, 50.0, 54.0, 69.0, 77.0, 62.0, 80.0, 80.0, 66.0, 48.0, 37.0, 41.0, 44.0, 32.0, 28.0, 20.0, 6.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.2737016677856445, -6.120598793029785, -5.967495918273926, -5.814392566680908, -5.661289691925049, -5.5081868171691895, -5.35508394241333, -5.2019805908203125, -5.048877716064453, -4.895774841308594, -4.742671966552734, -4.589568614959717, -4.436465740203857, -4.283362865447998, -4.130259990692139, -3.9771568775177, -3.824054002761841, -3.6709511280059814, -3.517848014831543, -3.3647451400756836, -3.211642026901245, -3.0585391521453857, -2.9054360389709473, -2.752333164215088, -2.5992302894592285, -2.446127414703369, -2.2930243015289307, -2.1399214267730713, -1.9868183135986328, -1.8337154388427734, -1.6806124448776245, -1.5275094509124756, -1.374406099319458, -1.221303105354309, -1.0682001113891602, -0.915097177028656, -0.7619941830635071, -0.6088911890983582, -0.455788254737854, -0.3026852607727051, -0.14958226680755615, 0.0035207122564315796, 0.1566236913204193, 0.30972665548324585, 0.4628296494483948, 0.6159326434135437, 0.7690355777740479, 0.9221385717391968, 1.0752415657043457, 1.2283445596694946, 1.3814475536346436, 1.534550428390503, 1.6876535415649414, 1.8407564163208008, 1.9938594102859497, 2.1469624042510986, 2.300065517425537, 2.4531683921813965, 2.606271505355835, 2.7593743801116943, 2.912477493286133, 3.065580368041992, 3.2186832427978516, 3.37178635597229, 3.5248892307281494]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 18.0, 15.0, 22.0, 52.0, 97.0, 159.0, 314.0, 562.0, 1073.0, 2124.0, 4714.0, 11488.0, 32148.0, 122632.0, 522296.0, 262699.0, 57124.0, 17839.0, 7006.0, 3025.0, 1451.0, 718.0, 419.0, 215.0, 117.0, 68.0, 49.0, 28.0, 13.0, 13.0, 11.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.669921875, -2.588348388671875, -2.50677490234375, -2.425201416015625, -2.3436279296875, -2.262054443359375, -2.18048095703125, -2.098907470703125, -2.017333984375, -1.935760498046875, -1.85418701171875, -1.772613525390625, -1.6910400390625, -1.609466552734375, -1.52789306640625, -1.446319580078125, -1.36474609375, -1.283172607421875, -1.20159912109375, -1.120025634765625, -1.0384521484375, -0.956878662109375, -0.87530517578125, -0.793731689453125, -0.712158203125, -0.630584716796875, -0.54901123046875, -0.467437744140625, -0.3858642578125, -0.304290771484375, -0.22271728515625, -0.141143798828125, -0.0595703125, 0.022003173828125, 0.10357666015625, 0.185150146484375, 0.2667236328125, 0.348297119140625, 0.42987060546875, 0.511444091796875, 0.593017578125, 0.674591064453125, 0.75616455078125, 0.837738037109375, 0.9193115234375, 1.000885009765625, 1.08245849609375, 1.164031982421875, 1.24560546875, 1.327178955078125, 1.40875244140625, 1.490325927734375, 1.5718994140625, 1.653472900390625, 1.73504638671875, 1.816619873046875, 1.898193359375, 1.979766845703125, 2.06134033203125, 2.142913818359375, 2.2244873046875, 2.306060791015625, 2.38763427734375, 2.469207763671875, 2.55078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 9.0, 6.0, 8.0, 12.0, 17.0, 19.0, 29.0, 47.0, 53.0, 54.0, 73.0, 87.0, 84.0, 71.0, 85.0, 62.0, 55.0, 49.0, 40.0, 36.0, 26.0, 32.0, 15.0, 13.0, 8.0, 8.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -19.034912109375, -18.50732421875, -17.979736328125, -17.4521484375, -16.924560546875, -16.39697265625, -15.869384765625, -15.341796875, -14.814208984375, -14.28662109375, -13.759033203125, -13.2314453125, -12.703857421875, -12.17626953125, -11.648681640625, -11.12109375, -10.593505859375, -10.06591796875, -9.538330078125, -9.0107421875, -8.483154296875, -7.95556640625, -7.427978515625, -6.900390625, -6.372802734375, -5.84521484375, -5.317626953125, -4.7900390625, -4.262451171875, -3.73486328125, -3.207275390625, -2.6796875, -2.152099609375, -1.62451171875, -1.096923828125, -0.5693359375, -0.041748046875, 0.48583984375, 1.013427734375, 1.541015625, 2.068603515625, 2.59619140625, 3.123779296875, 3.6513671875, 4.178955078125, 4.70654296875, 5.234130859375, 5.76171875, 6.289306640625, 6.81689453125, 7.344482421875, 7.8720703125, 8.399658203125, 8.92724609375, 9.454833984375, 9.982421875, 10.510009765625, 11.03759765625, 11.565185546875, 12.0927734375, 12.620361328125, 13.14794921875, 13.675537109375, 14.203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 9.0, 13.0, 35.0, 25.0, 42.0, 63.0, 96.0, 219.0, 697.0, 25221.0, 1018636.0, 2620.0, 376.0, 160.0, 99.0, 62.0, 37.0, 40.0, 18.0, 24.0, 15.0, 11.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.0625, -16.359375, -15.65625, -14.953125, -14.25, -13.546875, -12.84375, -12.140625, -11.4375, -10.734375, -10.03125, -9.328125, -8.625, -7.921875, -7.21875, -6.515625, -5.8125, -5.109375, -4.40625, -3.703125, -3.0, -2.296875, -1.59375, -0.890625, -0.1875, 0.515625, 1.21875, 1.921875, 2.625, 3.328125, 4.03125, 4.734375, 5.4375, 6.140625, 6.84375, 7.546875, 8.25, 8.953125, 9.65625, 10.359375, 11.0625, 11.765625, 12.46875, 13.171875, 13.875, 14.578125, 15.28125, 15.984375, 16.6875, 17.390625, 18.09375, 18.796875, 19.5, 20.203125, 20.90625, 21.609375, 22.3125, 23.015625, 23.71875, 24.421875, 25.125, 25.828125, 26.53125, 27.234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 2.0, 4.0, 6.0, 6.0, 16.0, 8.0, 10.0, 13.0, 16.0, 18.0, 24.0, 28.0, 33.0, 35.0, 24.0, 40.0, 51.0, 42.0, 46.0, 47.0, 35.0, 30.0, 38.0, 30.0, 34.0, 44.0, 28.0, 28.0, 33.0, 20.0, 35.0, 33.0, 15.0, 18.0, 19.0, 10.0, 7.0, 19.0, 7.0, 10.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.484375, -8.189208984375, -7.89404296875, -7.598876953125, -7.3037109375, -7.008544921875, -6.71337890625, -6.418212890625, -6.123046875, -5.827880859375, -5.53271484375, -5.237548828125, -4.9423828125, -4.647216796875, -4.35205078125, -4.056884765625, -3.76171875, -3.466552734375, -3.17138671875, -2.876220703125, -2.5810546875, -2.285888671875, -1.99072265625, -1.695556640625, -1.400390625, -1.105224609375, -0.81005859375, -0.514892578125, -0.2197265625, 0.075439453125, 0.37060546875, 0.665771484375, 0.9609375, 1.256103515625, 1.55126953125, 1.846435546875, 2.1416015625, 2.436767578125, 2.73193359375, 3.027099609375, 3.322265625, 3.617431640625, 3.91259765625, 4.207763671875, 4.5029296875, 4.798095703125, 5.09326171875, 5.388427734375, 5.68359375, 5.978759765625, 6.27392578125, 6.569091796875, 6.8642578125, 7.159423828125, 7.45458984375, 7.749755859375, 8.044921875, 8.340087890625, 8.63525390625, 8.930419921875, 9.2255859375, 9.520751953125, 9.81591796875, 10.111083984375, 10.40625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 9.0, 7.0, 6.0, 17.0, 20.0, 30.0, 66.0, 135.0, 376.0, 1338.0, 8068.0, 203800.0, 819380.0, 12747.0, 1745.0, 465.0, 148.0, 80.0, 35.0, 36.0, 9.0, 12.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9208526611328125, -1.866119384765625, -1.8113861083984375, -1.75665283203125, -1.7019195556640625, -1.647186279296875, -1.5924530029296875, -1.5377197265625, -1.4829864501953125, -1.428253173828125, -1.3735198974609375, -1.31878662109375, -1.2640533447265625, -1.209320068359375, -1.1545867919921875, -1.099853515625, -1.0451202392578125, -0.990386962890625, -0.9356536865234375, -0.88092041015625, -0.8261871337890625, -0.771453857421875, -0.7167205810546875, -0.6619873046875, -0.6072540283203125, -0.552520751953125, -0.4977874755859375, -0.44305419921875, -0.3883209228515625, -0.333587646484375, -0.2788543701171875, -0.22412109375, -0.1693878173828125, -0.114654541015625, -0.0599212646484375, -0.00518798828125, 0.0495452880859375, 0.104278564453125, 0.1590118408203125, 0.2137451171875, 0.2684783935546875, 0.323211669921875, 0.3779449462890625, 0.43267822265625, 0.4874114990234375, 0.542144775390625, 0.5968780517578125, 0.651611328125, 0.7063446044921875, 0.761077880859375, 0.8158111572265625, 0.87054443359375, 0.9252777099609375, 0.980010986328125, 1.0347442626953125, 1.0894775390625, 1.1442108154296875, 1.198944091796875, 1.2536773681640625, 1.30841064453125, 1.3631439208984375, 1.417877197265625, 1.4726104736328125, 1.52734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 9.0, 7.0, 6.0, 6.0, 11.0, 23.0, 29.0, 41.0, 74.0, 131.0, 281.0, 155.0, 71.0, 53.0, 25.0, 13.0, 13.0, 12.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018715858459472656, -0.0001813843846321106, -0.00017561018466949463, -0.00016983598470687866, -0.0001640617847442627, -0.00015828758478164673, -0.00015251338481903076, -0.0001467391848564148, -0.00014096498489379883, -0.00013519078493118286, -0.0001294165849685669, -0.00012364238500595093, -0.00011786818504333496, -0.000112093985080719, -0.00010631978511810303, -0.00010054558515548706, -9.47713851928711e-05, -8.899718523025513e-05, -8.322298526763916e-05, -7.74487853050232e-05, -7.167458534240723e-05, -6.590038537979126e-05, -6.012618541717529e-05, -5.4351985454559326e-05, -4.857778549194336e-05, -4.280358552932739e-05, -3.7029385566711426e-05, -3.125518560409546e-05, -2.5480985641479492e-05, -1.9706785678863525e-05, -1.3932585716247559e-05, -8.158385753631592e-06, -2.384185791015625e-06, 3.390014171600342e-06, 9.164214134216309e-06, 1.4938414096832275e-05, 2.0712614059448242e-05, 2.648681402206421e-05, 3.2261013984680176e-05, 3.803521394729614e-05, 4.380941390991211e-05, 4.9583613872528076e-05, 5.535781383514404e-05, 6.113201379776001e-05, 6.690621376037598e-05, 7.268041372299194e-05, 7.845461368560791e-05, 8.422881364822388e-05, 9.000301361083984e-05, 9.577721357345581e-05, 0.00010155141353607178, 0.00010732561349868774, 0.00011309981346130371, 0.00011887401342391968, 0.00012464821338653564, 0.0001304224133491516, 0.00013619661331176758, 0.00014197081327438354, 0.0001477450132369995, 0.00015351921319961548, 0.00015929341316223145, 0.0001650676131248474, 0.00017084181308746338, 0.00017661601305007935, 0.0001823902130126953]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 10.0, 6.0, 4.0, 14.0, 19.0, 48.0, 99.0, 233.0, 934.0, 7767.0, 814192.0, 218738.0, 5312.0, 770.0, 194.0, 91.0, 38.0, 26.0, 9.0, 10.0, 8.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.069793701171875, -2.00286865234375, -1.935943603515625, -1.8690185546875, -1.802093505859375, -1.73516845703125, -1.668243408203125, -1.601318359375, -1.534393310546875, -1.46746826171875, -1.400543212890625, -1.3336181640625, -1.266693115234375, -1.19976806640625, -1.132843017578125, -1.06591796875, -0.998992919921875, -0.93206787109375, -0.865142822265625, -0.7982177734375, -0.731292724609375, -0.66436767578125, -0.597442626953125, -0.530517578125, -0.463592529296875, -0.39666748046875, -0.329742431640625, -0.2628173828125, -0.195892333984375, -0.12896728515625, -0.062042236328125, 0.0048828125, 0.071807861328125, 0.13873291015625, 0.205657958984375, 0.2725830078125, 0.339508056640625, 0.40643310546875, 0.473358154296875, 0.540283203125, 0.607208251953125, 0.67413330078125, 0.741058349609375, 0.8079833984375, 0.874908447265625, 0.94183349609375, 1.008758544921875, 1.07568359375, 1.142608642578125, 1.20953369140625, 1.276458740234375, 1.3433837890625, 1.410308837890625, 1.47723388671875, 1.544158935546875, 1.611083984375, 1.678009033203125, 1.74493408203125, 1.811859130859375, 1.8787841796875, 1.945709228515625, 2.01263427734375, 2.079559326171875, 2.146484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 8.0, 11.0, 21.0, 28.0, 37.0, 55.0, 98.0, 373.0, 126.0, 65.0, 53.0, 24.0, 13.0, 18.0, 8.0, 12.0, 11.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.39269256591796875, -0.3798675537109375, -0.36704254150390625, -0.354217529296875, -0.34139251708984375, -0.3285675048828125, -0.31574249267578125, -0.30291748046875, -0.29009246826171875, -0.2772674560546875, -0.26444244384765625, -0.251617431640625, -0.23879241943359375, -0.2259674072265625, -0.21314239501953125, -0.2003173828125, -0.18749237060546875, -0.1746673583984375, -0.16184234619140625, -0.149017333984375, -0.13619232177734375, -0.1233673095703125, -0.11054229736328125, -0.09771728515625, -0.08489227294921875, -0.0720672607421875, -0.05924224853515625, -0.046417236328125, -0.03359222412109375, -0.0207672119140625, -0.00794219970703125, 0.0048828125, 0.01770782470703125, 0.0305328369140625, 0.04335784912109375, 0.056182861328125, 0.06900787353515625, 0.0818328857421875, 0.09465789794921875, 0.10748291015625, 0.12030792236328125, 0.1331329345703125, 0.14595794677734375, 0.158782958984375, 0.17160797119140625, 0.1844329833984375, 0.19725799560546875, 0.2100830078125, 0.22290802001953125, 0.2357330322265625, 0.24855804443359375, 0.261383056640625, 0.27420806884765625, 0.2870330810546875, 0.29985809326171875, 0.31268310546875, 0.32550811767578125, 0.3383331298828125, 0.35115814208984375, 0.363983154296875, 0.37680816650390625, 0.3896331787109375, 0.40245819091796875, 0.415283203125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 44.0, 778.0, 181.0, 10.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96755313873291, -10.187633514404297, -7.40771484375, -4.627795219421387, -1.8478765487670898, 0.932042121887207, 3.7119626998901367, 6.491881370544434, 9.27180004119873, 12.051719665527344, 14.83163833618164, 17.611557006835938, 20.391475677490234, 23.17139434814453, 25.951316833496094, 28.73123550415039, 31.511154174804688, 34.291072845458984, 37.07099151611328, 39.850914001464844, 42.630828857421875, 45.41075134277344, 48.190670013427734, 50.97058868408203, 53.75050735473633, 56.530426025390625, 59.31034469604492, 62.09026336669922, 64.87018585205078, 67.65010070800781, 70.43002319335938, 73.20994567871094, 75.98985290527344, 78.769775390625, 81.54969024658203, 84.3296127319336, 87.10952758789062, 89.88945007324219, 92.66937255859375, 95.44928741455078, 98.22920227050781, 101.00912475585938, 103.7890396118164, 106.56896209716797, 109.348876953125, 112.12879943847656, 114.90872192382812, 117.68863677978516, 120.46855926513672, 123.24848175048828, 126.02839660644531, 128.80831909179688, 131.58824157714844, 134.36814880371094, 137.1480712890625, 139.92799377441406, 142.70791625976562, 145.4878387451172, 148.26776123046875, 151.04766845703125, 153.8275909423828, 156.60751342773438, 159.38743591308594, 162.1673583984375, 164.947265625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 10.0, 6.0, 5.0, 17.0, 10.0, 15.0, 19.0, 21.0, 22.0, 27.0, 43.0, 40.0, 36.0, 28.0, 40.0, 35.0, 45.0, 60.0, 47.0, 49.0, 54.0, 40.0, 39.0, 51.0, 42.0, 29.0, 31.0, 27.0, 22.0, 15.0, 18.0, 15.0, 12.0, 9.0, 3.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.840543746948242, -17.29367446899414, -16.746807098388672, -16.19993782043457, -15.653068542480469, -15.106199264526367, -14.559330940246582, -14.012462615966797, -13.465593338012695, -12.918724060058594, -12.371855735778809, -11.824987411499023, -11.278118133544922, -10.73124885559082, -10.184380531311035, -9.63751220703125, -9.090642929077148, -8.543773651123047, -7.996905326843262, -7.450036525726318, -6.903167724609375, -6.356298923492432, -5.809430122375488, -5.262561321258545, -4.715692520141602, -4.168823719024658, -3.621954917907715, -3.0750861167907715, -2.528217315673828, -1.9813485145568848, -1.4344797134399414, -0.887610912322998, -0.3407402038574219, 0.20612859725952148, 0.7529973983764648, 1.2998661994934082, 1.8467350006103516, 2.393603801727295, 2.9404726028442383, 3.4873414039611816, 4.034210205078125, 4.581079006195068, 5.127947807312012, 5.674816608428955, 6.221685409545898, 6.768554210662842, 7.315423011779785, 7.8622918128967285, 8.409160614013672, 8.956029891967773, 9.502898216247559, 10.049766540527344, 10.596635818481445, 11.143505096435547, 11.690373420715332, 12.237241744995117, 12.784111022949219, 13.33098030090332, 13.877848625183105, 14.42471694946289, 14.971586227416992, 15.518455505371094, 16.065322875976562, 16.612192153930664, 17.159061431884766]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 8.0, 7.0, 6.0, 5.0, 14.0, 13.0, 18.0, 22.0, 31.0, 39.0, 47.0, 83.0, 128.0, 259.0, 509.0, 1387.0, 4100.0, 15033.0, 80942.0, 1408435.0, 2547408.0, 107887.0, 19495.0, 5254.0, 1755.0, 648.0, 317.0, 136.0, 76.0, 47.0, 33.0, 32.0, 32.0, 14.0, 8.0, 8.0, 8.0, 8.0, 11.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.13671875, -5.95660400390625, -5.7764892578125, -5.59637451171875, -5.416259765625, -5.23614501953125, -5.0560302734375, -4.87591552734375, -4.69580078125, -4.51568603515625, -4.3355712890625, -4.15545654296875, -3.975341796875, -3.79522705078125, -3.6151123046875, -3.43499755859375, -3.2548828125, -3.07476806640625, -2.8946533203125, -2.71453857421875, -2.534423828125, -2.35430908203125, -2.1741943359375, -1.99407958984375, -1.81396484375, -1.63385009765625, -1.4537353515625, -1.27362060546875, -1.093505859375, -0.91339111328125, -0.7332763671875, -0.55316162109375, -0.373046875, -0.19293212890625, -0.0128173828125, 0.16729736328125, 0.347412109375, 0.52752685546875, 0.7076416015625, 0.88775634765625, 1.06787109375, 1.24798583984375, 1.4281005859375, 1.60821533203125, 1.788330078125, 1.96844482421875, 2.1485595703125, 2.32867431640625, 2.5087890625, 2.68890380859375, 2.8690185546875, 3.04913330078125, 3.229248046875, 3.40936279296875, 3.5894775390625, 3.76959228515625, 3.94970703125, 4.12982177734375, 4.3099365234375, 4.49005126953125, 4.670166015625, 4.85028076171875, 5.0303955078125, 5.21051025390625, 5.390625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 13.0, 25.0, 29.0, 39.0, 45.0, 64.0, 84.0, 72.0, 90.0, 100.0, 88.0, 94.0, 65.0, 55.0, 39.0, 27.0, 17.0, 17.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5, -8.310943603515625, -8.12188720703125, -7.932830810546875, -7.7437744140625, -7.554718017578125, -7.36566162109375, -7.176605224609375, -6.987548828125, -6.798492431640625, -6.60943603515625, -6.420379638671875, -6.2313232421875, -6.042266845703125, -5.85321044921875, -5.664154052734375, -5.47509765625, -5.286041259765625, -5.09698486328125, -4.907928466796875, -4.7188720703125, -4.529815673828125, -4.34075927734375, -4.151702880859375, -3.962646484375, -3.773590087890625, -3.58453369140625, -3.395477294921875, -3.2064208984375, -3.017364501953125, -2.82830810546875, -2.639251708984375, -2.4501953125, -2.261138916015625, -2.07208251953125, -1.883026123046875, -1.6939697265625, -1.504913330078125, -1.31585693359375, -1.126800537109375, -0.937744140625, -0.748687744140625, -0.55963134765625, -0.370574951171875, -0.1815185546875, 0.007537841796875, 0.19659423828125, 0.385650634765625, 0.57470703125, 0.763763427734375, 0.95281982421875, 1.141876220703125, 1.3309326171875, 1.519989013671875, 1.70904541015625, 1.898101806640625, 2.087158203125, 2.276214599609375, 2.46527099609375, 2.654327392578125, 2.8433837890625, 3.032440185546875, 3.22149658203125, 3.410552978515625, 3.599609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 12.0, 19.0, 40.0, 105.0, 208.0, 1041.0, 4173731.0, 18334.0, 437.0, 146.0, 79.0, 43.0, 35.0, 12.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.82275390625, -47.3330078125, -45.84326171875, -44.353515625, -42.86376953125, -41.3740234375, -39.88427734375, -38.39453125, -36.90478515625, -35.4150390625, -33.92529296875, -32.435546875, -30.94580078125, -29.4560546875, -27.96630859375, -26.4765625, -24.98681640625, -23.4970703125, -22.00732421875, -20.517578125, -19.02783203125, -17.5380859375, -16.04833984375, -14.55859375, -13.06884765625, -11.5791015625, -10.08935546875, -8.599609375, -7.10986328125, -5.6201171875, -4.13037109375, -2.640625, -1.15087890625, 0.3388671875, 1.82861328125, 3.318359375, 4.80810546875, 6.2978515625, 7.78759765625, 9.27734375, 10.76708984375, 12.2568359375, 13.74658203125, 15.236328125, 16.72607421875, 18.2158203125, 19.70556640625, 21.1953125, 22.68505859375, 24.1748046875, 25.66455078125, 27.154296875, 28.64404296875, 30.1337890625, 31.62353515625, 33.11328125, 34.60302734375, 36.0927734375, 37.58251953125, 39.072265625, 40.56201171875, 42.0517578125, 43.54150390625, 45.03125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 6.0, 11.0, 17.0, 39.0, 56.0, 94.0, 136.0, 320.0, 827.0, 1428.0, 536.0, 253.0, 119.0, 67.0, 49.0, 40.0, 27.0, 10.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9691314697265625, -1.914825439453125, -1.8605194091796875, -1.80621337890625, -1.7519073486328125, -1.697601318359375, -1.6432952880859375, -1.5889892578125, -1.5346832275390625, -1.480377197265625, -1.4260711669921875, -1.37176513671875, -1.3174591064453125, -1.263153076171875, -1.2088470458984375, -1.154541015625, -1.1002349853515625, -1.045928955078125, -0.9916229248046875, -0.93731689453125, -0.8830108642578125, -0.828704833984375, -0.7743988037109375, -0.7200927734375, -0.6657867431640625, -0.611480712890625, -0.5571746826171875, -0.50286865234375, -0.4485626220703125, -0.394256591796875, -0.3399505615234375, -0.28564453125, -0.2313385009765625, -0.177032470703125, -0.1227264404296875, -0.06842041015625, -0.0141143798828125, 0.040191650390625, 0.0944976806640625, 0.1488037109375, 0.2031097412109375, 0.257415771484375, 0.3117218017578125, 0.36602783203125, 0.4203338623046875, 0.474639892578125, 0.5289459228515625, 0.583251953125, 0.6375579833984375, 0.691864013671875, 0.7461700439453125, 0.80047607421875, 0.8547821044921875, 0.909088134765625, 0.9633941650390625, 1.0177001953125, 1.0720062255859375, 1.126312255859375, 1.1806182861328125, 1.23492431640625, 1.2892303466796875, 1.343536376953125, 1.3978424072265625, 1.4521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 9.0, 27.0, 36.0, 104.0, 222.0, 253.0, 175.0, 81.0, 46.0, 14.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.656396865844727, -11.24353313446045, -10.830670356750488, -10.417806625366211, -10.004942893981934, -9.592079162597656, -9.179216384887695, -8.766352653503418, -8.35348892211914, -7.9406256675720215, -7.527761936187744, -7.114898681640625, -6.702034950256348, -6.2891716957092285, -5.876308441162109, -5.463444709777832, -5.050581932067871, -4.637718677520752, -4.224854946136475, -3.8119916915893555, -3.3991281986236572, -2.986264705657959, -2.57340145111084, -2.1605379581451416, -1.7476744651794434, -1.3348109722137451, -0.9219475984573364, -0.5090842247009277, -0.09622073173522949, 0.31664276123046875, 0.7295060157775879, 1.1423695087432861, 1.5552330017089844, 1.9680964946746826, 2.380959987640381, 2.7938232421875, 3.2066867351531982, 3.6195502281188965, 4.032413482666016, 4.445277214050293, 4.858140468597412, 5.271003723144531, 5.683867454528809, 6.096730709075928, 6.509593963623047, 6.922457695007324, 7.335320949554443, 7.7481842041015625, 8.16104793548584, 8.573911666870117, 8.986774444580078, 9.399638175964355, 9.812501907348633, 10.225364685058594, 10.638228416442871, 11.051092147827148, 11.46395492553711, 11.876818656921387, 12.289681434631348, 12.702545166015625, 13.115408897399902, 13.52827262878418, 13.94113540649414, 14.353999137878418, 14.766862869262695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 12.0, 12.0, 8.0, 15.0, 26.0, 35.0, 55.0, 58.0, 71.0, 69.0, 79.0, 65.0, 90.0, 84.0, 70.0, 58.0, 44.0, 39.0, 27.0, 22.0, 17.0, 15.0, 5.0, 10.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.451784610748291, -7.277875900268555, -7.103967189788818, -6.930058479309082, -6.7561492919921875, -6.582240581512451, -6.408331871032715, -6.2344231605529785, -6.060514450073242, -5.886605739593506, -5.7126970291137695, -5.538787841796875, -5.364879131317139, -5.190970420837402, -5.017061710357666, -4.84315299987793, -4.669243812561035, -4.495335102081299, -4.3214263916015625, -4.147517204284668, -3.9736084938049316, -3.7996997833251953, -3.625791072845459, -3.4518823623657227, -3.2779734134674072, -3.104064702987671, -2.9301557540893555, -2.756247043609619, -2.582338333129883, -2.4084293842315674, -2.234520673751831, -2.0606117248535156, -1.8867030143737793, -1.7127941846847534, -1.5388853549957275, -1.3649766445159912, -1.1910678148269653, -1.0171589851379395, -0.8432502746582031, -0.6693414449691772, -0.49543261528015137, -0.3215238153934479, -0.14761501550674438, 0.02629375457763672, 0.2002025842666626, 0.3741114139556885, 0.5480201244354248, 0.7219289541244507, 0.8958377838134766, 1.0697466135025024, 1.2436554431915283, 1.4175641536712646, 1.5914729833602905, 1.7653818130493164, 1.9392905235290527, 2.113199234008789, 2.2871081829071045, 2.461016893386841, 2.6349258422851562, 2.8088345527648926, 2.982743263244629, 3.1566522121429443, 3.3305609226226807, 3.504469871520996, 3.6783785820007324]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 14.0, 34.0, 48.0, 88.0, 153.0, 324.0, 640.0, 1421.0, 5328.0, 80386.0, 918648.0, 35488.0, 3666.0, 1162.0, 545.0, 282.0, 143.0, 69.0, 41.0, 27.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.716796875, -1.66961669921875, -1.6224365234375, -1.57525634765625, -1.528076171875, -1.48089599609375, -1.4337158203125, -1.38653564453125, -1.33935546875, -1.29217529296875, -1.2449951171875, -1.19781494140625, -1.150634765625, -1.10345458984375, -1.0562744140625, -1.00909423828125, -0.9619140625, -0.91473388671875, -0.8675537109375, -0.82037353515625, -0.773193359375, -0.72601318359375, -0.6788330078125, -0.63165283203125, -0.58447265625, -0.53729248046875, -0.4901123046875, -0.44293212890625, -0.395751953125, -0.34857177734375, -0.3013916015625, -0.25421142578125, -0.20703125, -0.15985107421875, -0.1126708984375, -0.06549072265625, -0.018310546875, 0.02886962890625, 0.0760498046875, 0.12322998046875, 0.17041015625, 0.21759033203125, 0.2647705078125, 0.31195068359375, 0.359130859375, 0.40631103515625, 0.4534912109375, 0.50067138671875, 0.5478515625, 0.59503173828125, 0.6422119140625, 0.68939208984375, 0.736572265625, 0.78375244140625, 0.8309326171875, 0.87811279296875, 0.92529296875, 0.97247314453125, 1.0196533203125, 1.06683349609375, 1.114013671875, 1.16119384765625, 1.2083740234375, 1.25555419921875, 1.302734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 12.0, 15.0, 9.0, 13.0, 22.0, 42.0, 46.0, 73.0, 83.0, 90.0, 101.0, 100.0, 75.0, 87.0, 61.0, 48.0, 36.0, 18.0, 24.0, 16.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.30859375, -6.164947509765625, -6.02130126953125, -5.877655029296875, -5.7340087890625, -5.590362548828125, -5.44671630859375, -5.303070068359375, -5.159423828125, -5.015777587890625, -4.87213134765625, -4.728485107421875, -4.5848388671875, -4.441192626953125, -4.29754638671875, -4.153900146484375, -4.01025390625, -3.866607666015625, -3.72296142578125, -3.579315185546875, -3.4356689453125, -3.292022705078125, -3.14837646484375, -3.004730224609375, -2.861083984375, -2.717437744140625, -2.57379150390625, -2.430145263671875, -2.2864990234375, -2.142852783203125, -1.99920654296875, -1.855560302734375, -1.7119140625, -1.568267822265625, -1.42462158203125, -1.280975341796875, -1.1373291015625, -0.993682861328125, -0.85003662109375, -0.706390380859375, -0.562744140625, -0.419097900390625, -0.27545166015625, -0.131805419921875, 0.0118408203125, 0.155487060546875, 0.29913330078125, 0.442779541015625, 0.58642578125, 0.730072021484375, 0.87371826171875, 1.017364501953125, 1.1610107421875, 1.304656982421875, 1.44830322265625, 1.591949462890625, 1.735595703125, 1.879241943359375, 2.02288818359375, 2.166534423828125, 2.3101806640625, 2.453826904296875, 2.59747314453125, 2.741119384765625, 2.884765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 21.0, 17.0, 40.0, 43.0, 55.0, 86.0, 121.0, 175.0, 236.0, 385.0, 847.0, 2960.0, 38411.0, 749366.0, 242263.0, 10467.0, 1399.0, 529.0, 349.0, 213.0, 145.0, 113.0, 78.0, 66.0, 46.0, 27.0, 24.0, 12.0, 13.0, 8.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.76416015625, -0.7449493408203125, -0.725738525390625, -0.7065277099609375, -0.68731689453125, -0.6681060791015625, -0.648895263671875, -0.6296844482421875, -0.6104736328125, -0.5912628173828125, -0.572052001953125, -0.5528411865234375, -0.53363037109375, -0.5144195556640625, -0.495208740234375, -0.4759979248046875, -0.456787109375, -0.4375762939453125, -0.418365478515625, -0.3991546630859375, -0.37994384765625, -0.3607330322265625, -0.341522216796875, -0.3223114013671875, -0.3031005859375, -0.2838897705078125, -0.264678955078125, -0.2454681396484375, -0.22625732421875, -0.2070465087890625, -0.187835693359375, -0.1686248779296875, -0.1494140625, -0.1302032470703125, -0.110992431640625, -0.0917816162109375, -0.07257080078125, -0.0533599853515625, -0.034149169921875, -0.0149383544921875, 0.0042724609375, 0.0234832763671875, 0.042694091796875, 0.0619049072265625, 0.08111572265625, 0.1003265380859375, 0.119537353515625, 0.1387481689453125, 0.157958984375, 0.1771697998046875, 0.196380615234375, 0.2155914306640625, 0.23480224609375, 0.2540130615234375, 0.273223876953125, 0.2924346923828125, 0.3116455078125, 0.3308563232421875, 0.350067138671875, 0.3692779541015625, 0.38848876953125, 0.4076995849609375, 0.426910400390625, 0.4461212158203125, 0.46533203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 7.0, 7.0, 15.0, 5.0, 14.0, 19.0, 19.0, 21.0, 25.0, 24.0, 27.0, 38.0, 31.0, 32.0, 41.0, 50.0, 45.0, 39.0, 45.0, 42.0, 48.0, 46.0, 43.0, 42.0, 31.0, 35.0, 27.0, 22.0, 16.0, 19.0, 26.0, 12.0, 15.0, 19.0, 8.0, 6.0, 11.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.7421875, -4.60552978515625, -4.4688720703125, -4.33221435546875, -4.195556640625, -4.05889892578125, -3.9222412109375, -3.78558349609375, -3.64892578125, -3.51226806640625, -3.3756103515625, -3.23895263671875, -3.102294921875, -2.96563720703125, -2.8289794921875, -2.69232177734375, -2.5556640625, -2.41900634765625, -2.2823486328125, -2.14569091796875, -2.009033203125, -1.87237548828125, -1.7357177734375, -1.59906005859375, -1.46240234375, -1.32574462890625, -1.1890869140625, -1.05242919921875, -0.915771484375, -0.77911376953125, -0.6424560546875, -0.50579833984375, -0.369140625, -0.23248291015625, -0.0958251953125, 0.04083251953125, 0.177490234375, 0.31414794921875, 0.4508056640625, 0.58746337890625, 0.72412109375, 0.86077880859375, 0.9974365234375, 1.13409423828125, 1.270751953125, 1.40740966796875, 1.5440673828125, 1.68072509765625, 1.8173828125, 1.95404052734375, 2.0906982421875, 2.22735595703125, 2.364013671875, 2.50067138671875, 2.6373291015625, 2.77398681640625, 2.91064453125, 3.04730224609375, 3.1839599609375, 3.32061767578125, 3.457275390625, 3.59393310546875, 3.7305908203125, 3.86724853515625, 4.00390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 16.0, 25.0, 23.0, 51.0, 74.0, 101.0, 159.0, 293.0, 471.0, 954.0, 3209.0, 27010.0, 927955.0, 80389.0, 5134.0, 1255.0, 551.0, 285.0, 181.0, 136.0, 84.0, 46.0, 41.0, 21.0, 13.0, 20.0, 6.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.0743112564086914, -0.07116889953613281, -0.06802654266357422, -0.06488418579101562, -0.06174182891845703, -0.05859947204589844, -0.055457115173339844, -0.05231475830078125, -0.049172401428222656, -0.04603004455566406, -0.04288768768310547, -0.039745330810546875, -0.03660297393798828, -0.03346061706542969, -0.030318260192871094, -0.0271759033203125, -0.024033546447753906, -0.020891189575195312, -0.01774883270263672, -0.014606475830078125, -0.011464118957519531, -0.008321762084960938, -0.005179405212402344, -0.00203704833984375, 0.0011053085327148438, 0.0042476654052734375, 0.007390022277832031, 0.010532379150390625, 0.013674736022949219, 0.016817092895507812, 0.019959449768066406, 0.023101806640625, 0.026244163513183594, 0.029386520385742188, 0.03252887725830078, 0.035671234130859375, 0.03881359100341797, 0.04195594787597656, 0.045098304748535156, 0.04824066162109375, 0.051383018493652344, 0.05452537536621094, 0.05766773223876953, 0.060810089111328125, 0.06395244598388672, 0.06709480285644531, 0.0702371597290039, 0.0733795166015625, 0.0765218734741211, 0.07966423034667969, 0.08280658721923828, 0.08594894409179688, 0.08909130096435547, 0.09223365783691406, 0.09537601470947266, 0.09851837158203125, 0.10166072845458984, 0.10480308532714844, 0.10794544219970703, 0.11108779907226562, 0.11423015594482422, 0.11737251281738281, 0.1205148696899414, 0.1236572265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 11.0, 19.0, 17.0, 36.0, 57.0, 46.0, 117.0, 115.0, 122.0, 107.0, 98.0, 80.0, 51.0, 34.0, 23.0, 15.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.758646875619888e-05, -5.5866315960884094e-05, -5.4146163165569305e-05, -5.2426010370254517e-05, -5.070585757493973e-05, -4.898570477962494e-05, -4.726555198431015e-05, -4.554539918899536e-05, -4.382524639368057e-05, -4.2105093598365784e-05, -4.0384940803050995e-05, -3.8664788007736206e-05, -3.694463521242142e-05, -3.522448241710663e-05, -3.350432962179184e-05, -3.178417682647705e-05, -3.0064024031162262e-05, -2.8343871235847473e-05, -2.6623718440532684e-05, -2.4903565645217896e-05, -2.3183412849903107e-05, -2.1463260054588318e-05, -1.974310725927353e-05, -1.802295446395874e-05, -1.630280166864395e-05, -1.4582648873329163e-05, -1.2862496078014374e-05, -1.1142343282699585e-05, -9.422190487384796e-06, -7.702037692070007e-06, -5.9818848967552185e-06, -4.26173210144043e-06, -2.541579306125641e-06, -8.21426510810852e-07, 8.987262845039368e-07, 2.6188790798187256e-06, 4.339031875133514e-06, 6.059184670448303e-06, 7.779337465763092e-06, 9.499490261077881e-06, 1.121964305639267e-05, 1.2939795851707458e-05, 1.4659948647022247e-05, 1.6380101442337036e-05, 1.8100254237651825e-05, 1.9820407032966614e-05, 2.1540559828281403e-05, 2.326071262359619e-05, 2.498086541891098e-05, 2.670101821422577e-05, 2.8421171009540558e-05, 3.0141323804855347e-05, 3.1861476600170135e-05, 3.3581629395484924e-05, 3.530178219079971e-05, 3.70219349861145e-05, 3.874208778142929e-05, 4.046224057674408e-05, 4.218239337205887e-05, 4.390254616737366e-05, 4.5622698962688446e-05, 4.7342851758003235e-05, 4.9063004553318024e-05, 5.078315734863281e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 5.0, 5.0, 8.0, 10.0, 17.0, 19.0, 29.0, 104.0, 293.0, 2497.0, 161262.0, 879322.0, 4323.0, 425.0, 97.0, 51.0, 16.0, 16.0, 9.0, 15.0, 5.0, 4.0, 9.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.37890625, -0.3670997619628906, -0.35529327392578125, -0.3434867858886719, -0.3316802978515625, -0.3198738098144531, -0.30806732177734375, -0.2962608337402344, -0.284454345703125, -0.2726478576660156, -0.26084136962890625, -0.24903488159179688, -0.2372283935546875, -0.22542190551757812, -0.21361541748046875, -0.20180892944335938, -0.19000244140625, -0.17819595336914062, -0.16638946533203125, -0.15458297729492188, -0.1427764892578125, -0.13097000122070312, -0.11916351318359375, -0.10735702514648438, -0.095550537109375, -0.08374404907226562, -0.07193756103515625, -0.060131072998046875, -0.0483245849609375, -0.036518096923828125, -0.02471160888671875, -0.012905120849609375, -0.0010986328125, 0.010707855224609375, 0.02251434326171875, 0.034320831298828125, 0.0461273193359375, 0.057933807373046875, 0.06974029541015625, 0.08154678344726562, 0.093353271484375, 0.10515975952148438, 0.11696624755859375, 0.12877273559570312, 0.1405792236328125, 0.15238571166992188, 0.16419219970703125, 0.17599868774414062, 0.18780517578125, 0.19961166381835938, 0.21141815185546875, 0.22322463989257812, 0.2350311279296875, 0.24683761596679688, 0.25864410400390625, 0.2704505920410156, 0.282257080078125, 0.2940635681152344, 0.30587005615234375, 0.3176765441894531, 0.3294830322265625, 0.3412895202636719, 0.35309600830078125, 0.3649024963378906, 0.376708984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 16.0, 11.0, 27.0, 55.0, 63.0, 120.0, 215.0, 210.0, 105.0, 54.0, 26.0, 25.0, 10.0, 16.0, 6.0, 4.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.027252197265625, -0.026397705078125, -0.025543212890625, -0.024688720703125, -0.023834228515625, -0.022979736328125, -0.022125244140625, -0.021270751953125, -0.020416259765625, -0.019561767578125, -0.018707275390625, -0.017852783203125, -0.016998291015625, -0.016143798828125, -0.015289306640625, -0.014434814453125, -0.013580322265625, -0.012725830078125, -0.011871337890625, -0.011016845703125, -0.010162353515625, -0.009307861328125, -0.008453369140625, -0.007598876953125, -0.006744384765625, -0.005889892578125, -0.005035400390625, -0.004180908203125, -0.003326416015625, -0.002471923828125, -0.001617431640625, -0.000762939453125, 9.1552734375e-05, 0.000946044921875, 0.001800537109375, 0.002655029296875, 0.003509521484375, 0.004364013671875, 0.005218505859375, 0.006072998046875, 0.006927490234375, 0.007781982421875, 0.008636474609375, 0.009490966796875, 0.010345458984375, 0.011199951171875, 0.012054443359375, 0.012908935546875, 0.013763427734375, 0.014617919921875, 0.015472412109375, 0.016326904296875, 0.017181396484375, 0.018035888671875, 0.018890380859375, 0.019744873046875, 0.020599365234375, 0.021453857421875, 0.022308349609375, 0.023162841796875, 0.024017333984375, 0.024871826171875, 0.025726318359375, 0.026580810546875, 0.027435302734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 9.0, 11.0, 16.0, 43.0, 170.0, 341.0, 253.0, 90.0, 37.0, 19.0, 10.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.284192085266113, -10.916738510131836, -10.549283981323242, -10.181829452514648, -9.814375877380371, -9.446922302246094, -9.0794677734375, -8.712013244628906, -8.344559669494629, -7.977105617523193, -7.609651565551758, -7.242197513580322, -6.874743461608887, -6.507289409637451, -6.139835357666016, -5.77238130569458, -5.4049272537231445, -5.037473201751709, -4.670019149780273, -4.302565097808838, -3.9351110458374023, -3.567656993865967, -3.2002029418945312, -2.8327488899230957, -2.46529483795166, -2.0978407859802246, -1.730386734008789, -1.3629326820373535, -0.995478630065918, -0.6280245780944824, -0.2605705261230469, 0.10688352584838867, 0.4743385314941406, 0.8417925834655762, 1.2092466354370117, 1.5767006874084473, 1.9441547393798828, 2.3116087913513184, 2.679062843322754, 3.0465168952941895, 3.413970947265625, 3.7814249992370605, 4.148879051208496, 4.516333103179932, 4.883787155151367, 5.251241207122803, 5.618695259094238, 5.986149311065674, 6.353603363037109, 6.721057415008545, 7.0885114669799805, 7.455965518951416, 7.823419570922852, 8.190874099731445, 8.558327674865723, 8.92578125, 9.293235778808594, 9.660690307617188, 10.028143882751465, 10.395597457885742, 10.763051986694336, 11.13050651550293, 11.497960090637207, 11.865413665771484, 12.232868194580078]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 7.0, 9.0, 8.0, 10.0, 13.0, 30.0, 46.0, 53.0, 88.0, 89.0, 88.0, 97.0, 108.0, 88.0, 70.0, 57.0, 41.0, 27.0, 23.0, 17.0, 14.0, 8.0, 2.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.077759742736816, -5.9345526695251465, -5.791345596313477, -5.648138046264648, -5.5049309730529785, -5.361723899841309, -5.2185163497924805, -5.0753092765808105, -4.932102203369141, -4.788895130157471, -4.645688056945801, -4.502480506896973, -4.359273433685303, -4.216066360473633, -4.072858810424805, -3.9296517372131348, -3.786444664001465, -3.643237590789795, -3.500030279159546, -3.356822967529297, -3.213615894317627, -3.070408821105957, -2.927201509475708, -2.783994197845459, -2.640787124633789, -2.497580051422119, -2.35437273979187, -2.211165428161621, -2.067958354949951, -1.9247511625289917, -1.7815439701080322, -1.6383367776870728, -1.4951298236846924, -1.351922631263733, -1.2087154388427734, -1.065508246421814, -0.9223010540008545, -0.779093861579895, -0.6358866691589355, -0.4926794767379761, -0.3494722843170166, -0.20626509189605713, -0.06305789947509766, 0.08014929294586182, 0.2233564853668213, 0.36656367778778076, 0.5097708702087402, 0.6529780626296997, 0.7961852550506592, 0.9393924474716187, 1.0825996398925781, 1.2258068323135376, 1.369014024734497, 1.5122212171554565, 1.655428409576416, 1.7986356019973755, 1.941842794418335, 2.085050106048584, 2.228257179260254, 2.371464252471924, 2.514671564102173, 2.657878875732422, 2.801085948944092, 2.9442930221557617, 3.0875003337860107]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 10.0, 11.0, 9.0, 26.0, 34.0, 43.0, 87.0, 191.0, 395.0, 844.0, 1998.0, 5573.0, 17582.0, 72958.0, 611438.0, 277180.0, 42254.0, 11428.0, 3780.0, 1436.0, 626.0, 290.0, 143.0, 80.0, 54.0, 43.0, 11.0, 17.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.04296875, -3.950714111328125, -3.85845947265625, -3.766204833984375, -3.6739501953125, -3.581695556640625, -3.48944091796875, -3.397186279296875, -3.304931640625, -3.212677001953125, -3.12042236328125, -3.028167724609375, -2.9359130859375, -2.843658447265625, -2.75140380859375, -2.659149169921875, -2.56689453125, -2.474639892578125, -2.38238525390625, -2.290130615234375, -2.1978759765625, -2.105621337890625, -2.01336669921875, -1.921112060546875, -1.828857421875, -1.736602783203125, -1.64434814453125, -1.552093505859375, -1.4598388671875, -1.367584228515625, -1.27532958984375, -1.183074951171875, -1.0908203125, -0.998565673828125, -0.90631103515625, -0.814056396484375, -0.7218017578125, -0.629547119140625, -0.53729248046875, -0.445037841796875, -0.352783203125, -0.260528564453125, -0.16827392578125, -0.076019287109375, 0.0162353515625, 0.108489990234375, 0.20074462890625, 0.292999267578125, 0.38525390625, 0.477508544921875, 0.56976318359375, 0.662017822265625, 0.7542724609375, 0.846527099609375, 0.93878173828125, 1.031036376953125, 1.123291015625, 1.215545654296875, 1.30780029296875, 1.400054931640625, 1.4923095703125, 1.584564208984375, 1.67681884765625, 1.769073486328125, 1.861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 2.0, 9.0, 7.0, 12.0, 17.0, 23.0, 23.0, 40.0, 37.0, 59.0, 56.0, 74.0, 78.0, 90.0, 98.0, 86.0, 56.0, 48.0, 44.0, 33.0, 20.0, 26.0, 13.0, 15.0, 14.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.1201171875, -9.857421875, -9.5947265625, -9.33203125, -9.0693359375, -8.806640625, -8.5439453125, -8.28125, -8.0185546875, -7.755859375, -7.4931640625, -7.23046875, -6.9677734375, -6.705078125, -6.4423828125, -6.1796875, -5.9169921875, -5.654296875, -5.3916015625, -5.12890625, -4.8662109375, -4.603515625, -4.3408203125, -4.078125, -3.8154296875, -3.552734375, -3.2900390625, -3.02734375, -2.7646484375, -2.501953125, -2.2392578125, -1.9765625, -1.7138671875, -1.451171875, -1.1884765625, -0.92578125, -0.6630859375, -0.400390625, -0.1376953125, 0.125, 0.3876953125, 0.650390625, 0.9130859375, 1.17578125, 1.4384765625, 1.701171875, 1.9638671875, 2.2265625, 2.4892578125, 2.751953125, 3.0146484375, 3.27734375, 3.5400390625, 3.802734375, 4.0654296875, 4.328125, 4.5908203125, 4.853515625, 5.1162109375, 5.37890625, 5.6416015625, 5.904296875, 6.1669921875, 6.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 16.0, 12.0, 14.0, 23.0, 27.0, 28.0, 39.0, 37.0, 41.0, 57.0, 60.0, 123.0, 802.0, 1041586.0, 5104.0, 178.0, 71.0, 51.0, 48.0, 46.0, 39.0, 26.0, 26.0, 23.0, 17.0, 10.0, 6.0, 12.0, 2.0, 3.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-26.890625, -26.176513671875, -25.46240234375, -24.748291015625, -24.0341796875, -23.320068359375, -22.60595703125, -21.891845703125, -21.177734375, -20.463623046875, -19.74951171875, -19.035400390625, -18.3212890625, -17.607177734375, -16.89306640625, -16.178955078125, -15.46484375, -14.750732421875, -14.03662109375, -13.322509765625, -12.6083984375, -11.894287109375, -11.18017578125, -10.466064453125, -9.751953125, -9.037841796875, -8.32373046875, -7.609619140625, -6.8955078125, -6.181396484375, -5.46728515625, -4.753173828125, -4.0390625, -3.324951171875, -2.61083984375, -1.896728515625, -1.1826171875, -0.468505859375, 0.24560546875, 0.959716796875, 1.673828125, 2.387939453125, 3.10205078125, 3.816162109375, 4.5302734375, 5.244384765625, 5.95849609375, 6.672607421875, 7.38671875, 8.100830078125, 8.81494140625, 9.529052734375, 10.2431640625, 10.957275390625, 11.67138671875, 12.385498046875, 13.099609375, 13.813720703125, 14.52783203125, 15.241943359375, 15.9560546875, 16.670166015625, 17.38427734375, 18.098388671875, 18.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 4.0, 9.0, 12.0, 9.0, 20.0, 21.0, 26.0, 28.0, 45.0, 41.0, 34.0, 47.0, 46.0, 46.0, 54.0, 62.0, 81.0, 49.0, 40.0, 47.0, 50.0, 42.0, 40.0, 25.0, 25.0, 19.0, 24.0, 12.0, 6.0, 12.0, 2.0, 2.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-9.40625, -9.15631103515625, -8.9063720703125, -8.65643310546875, -8.406494140625, -8.15655517578125, -7.9066162109375, -7.65667724609375, -7.40673828125, -7.15679931640625, -6.9068603515625, -6.65692138671875, -6.406982421875, -6.15704345703125, -5.9071044921875, -5.65716552734375, -5.4072265625, -5.15728759765625, -4.9073486328125, -4.65740966796875, -4.407470703125, -4.15753173828125, -3.9075927734375, -3.65765380859375, -3.40771484375, -3.15777587890625, -2.9078369140625, -2.65789794921875, -2.407958984375, -2.15802001953125, -1.9080810546875, -1.65814208984375, -1.408203125, -1.15826416015625, -0.9083251953125, -0.65838623046875, -0.408447265625, -0.15850830078125, 0.0914306640625, 0.34136962890625, 0.59130859375, 0.84124755859375, 1.0911865234375, 1.34112548828125, 1.591064453125, 1.84100341796875, 2.0909423828125, 2.34088134765625, 2.5908203125, 2.84075927734375, 3.0906982421875, 3.34063720703125, 3.590576171875, 3.84051513671875, 4.0904541015625, 4.34039306640625, 4.59033203125, 4.84027099609375, 5.0902099609375, 5.34014892578125, 5.590087890625, 5.84002685546875, 6.0899658203125, 6.33990478515625, 6.58984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 11.0, 27.0, 33.0, 59.0, 87.0, 205.0, 515.0, 1666.0, 9945.0, 179509.0, 832659.0, 19996.0, 2645.0, 678.0, 243.0, 120.0, 50.0, 35.0, 22.0, 7.0, 7.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53515625, -1.478607177734375, -1.42205810546875, -1.365509033203125, -1.3089599609375, -1.252410888671875, -1.19586181640625, -1.139312744140625, -1.082763671875, -1.026214599609375, -0.96966552734375, -0.913116455078125, -0.8565673828125, -0.800018310546875, -0.74346923828125, -0.686920166015625, -0.63037109375, -0.573822021484375, -0.51727294921875, -0.460723876953125, -0.4041748046875, -0.347625732421875, -0.29107666015625, -0.234527587890625, -0.177978515625, -0.121429443359375, -0.06488037109375, -0.008331298828125, 0.0482177734375, 0.104766845703125, 0.16131591796875, 0.217864990234375, 0.2744140625, 0.330963134765625, 0.38751220703125, 0.444061279296875, 0.5006103515625, 0.557159423828125, 0.61370849609375, 0.670257568359375, 0.726806640625, 0.783355712890625, 0.83990478515625, 0.896453857421875, 0.9530029296875, 1.009552001953125, 1.06610107421875, 1.122650146484375, 1.17919921875, 1.235748291015625, 1.29229736328125, 1.348846435546875, 1.4053955078125, 1.461944580078125, 1.51849365234375, 1.575042724609375, 1.631591796875, 1.688140869140625, 1.74468994140625, 1.801239013671875, 1.8577880859375, 1.914337158203125, 1.97088623046875, 2.027435302734375, 2.083984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 9.0, 7.0, 8.0, 14.0, 14.0, 21.0, 29.0, 46.0, 54.0, 78.0, 124.0, 197.0, 110.0, 72.0, 61.0, 33.0, 23.0, 19.0, 10.0, 10.0, 6.0, 6.0, 2.0, 11.0, 3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074671745300293, -0.00010381732136011124, -0.00010016746819019318, -9.651761502027512e-05, -9.286776185035706e-05, -8.9217908680439e-05, -8.556805551052094e-05, -8.191820234060287e-05, -7.826834917068481e-05, -7.461849600076675e-05, -7.09686428308487e-05, -6.731878966093063e-05, -6.366893649101257e-05, -6.001908332109451e-05, -5.636923015117645e-05, -5.271937698125839e-05, -4.906952381134033e-05, -4.541967064142227e-05, -4.176981747150421e-05, -3.811996430158615e-05, -3.447011113166809e-05, -3.082025796175003e-05, -2.717040479183197e-05, -2.352055162191391e-05, -1.987069845199585e-05, -1.622084528207779e-05, -1.2570992112159729e-05, -8.921138942241669e-06, -5.271285772323608e-06, -1.621432602405548e-06, 2.028420567512512e-06, 5.6782737374305725e-06, 9.328126907348633e-06, 1.2977980077266693e-05, 1.6627833247184753e-05, 2.0277686417102814e-05, 2.3927539587020874e-05, 2.7577392756938934e-05, 3.1227245926856995e-05, 3.4877099096775055e-05, 3.8526952266693115e-05, 4.2176805436611176e-05, 4.5826658606529236e-05, 4.9476511776447296e-05, 5.3126364946365356e-05, 5.677621811628342e-05, 6.042607128620148e-05, 6.407592445611954e-05, 6.77257776260376e-05, 7.137563079595566e-05, 7.502548396587372e-05, 7.867533713579178e-05, 8.232519030570984e-05, 8.59750434756279e-05, 8.962489664554596e-05, 9.327474981546402e-05, 9.692460298538208e-05, 0.00010057445615530014, 0.0001042243093252182, 0.00010787416249513626, 0.00011152401566505432, 0.00011517386883497238, 0.00011882372200489044, 0.0001224735751748085, 0.00012612342834472656]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 2.0, 10.0, 11.0, 5.0, 13.0, 20.0, 27.0, 36.0, 77.0, 128.0, 246.0, 382.0, 923.0, 2402.0, 8768.0, 45402.0, 746191.0, 209472.0, 25586.0, 5583.0, 1755.0, 680.0, 334.0, 171.0, 107.0, 57.0, 51.0, 22.0, 18.0, 19.0, 8.0, 13.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.33203125, -1.2958755493164062, -1.2597198486328125, -1.2235641479492188, -1.187408447265625, -1.1512527465820312, -1.1150970458984375, -1.0789413452148438, -1.04278564453125, -1.0066299438476562, -0.9704742431640625, -0.9343185424804688, -0.898162841796875, -0.8620071411132812, -0.8258514404296875, -0.7896957397460938, -0.7535400390625, -0.7173843383789062, -0.6812286376953125, -0.6450729370117188, -0.608917236328125, -0.5727615356445312, -0.5366058349609375, -0.5004501342773438, -0.46429443359375, -0.42813873291015625, -0.3919830322265625, -0.35582733154296875, -0.319671630859375, -0.28351593017578125, -0.2473602294921875, -0.21120452880859375, -0.175048828125, -0.13889312744140625, -0.1027374267578125, -0.06658172607421875, -0.030426025390625, 0.00572967529296875, 0.0418853759765625, 0.07804107666015625, 0.11419677734375, 0.15035247802734375, 0.1865081787109375, 0.22266387939453125, 0.258819580078125, 0.29497528076171875, 0.3311309814453125, 0.36728668212890625, 0.4034423828125, 0.43959808349609375, 0.4757537841796875, 0.5119094848632812, 0.548065185546875, 0.5842208862304688, 0.6203765869140625, 0.6565322875976562, 0.69268798828125, 0.7288436889648438, 0.7649993896484375, 0.8011550903320312, 0.837310791015625, 0.8734664916992188, 0.9096221923828125, 0.9457778930664062, 0.98193359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 10.0, 8.0, 17.0, 10.0, 11.0, 21.0, 32.0, 27.0, 27.0, 43.0, 86.0, 258.0, 131.0, 56.0, 40.0, 39.0, 31.0, 25.0, 19.0, 25.0, 12.0, 7.0, 8.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2874259948730469, -0.27773284912109375, -0.2680397033691406, -0.2583465576171875, -0.24865341186523438, -0.23896026611328125, -0.22926712036132812, -0.219573974609375, -0.20988082885742188, -0.20018768310546875, -0.19049453735351562, -0.1808013916015625, -0.17110824584960938, -0.16141510009765625, -0.15172195434570312, -0.14202880859375, -0.13233566284179688, -0.12264251708984375, -0.11294937133789062, -0.1032562255859375, -0.09356307983398438, -0.08386993408203125, -0.07417678833007812, -0.064483642578125, -0.054790496826171875, -0.04509735107421875, -0.035404205322265625, -0.0257110595703125, -0.016017913818359375, -0.00632476806640625, 0.003368377685546875, 0.0130615234375, 0.022754669189453125, 0.03244781494140625, 0.042140960693359375, 0.0518341064453125, 0.061527252197265625, 0.07122039794921875, 0.08091354370117188, 0.090606689453125, 0.10029983520507812, 0.10999298095703125, 0.11968612670898438, 0.1293792724609375, 0.13907241821289062, 0.14876556396484375, 0.15845870971679688, 0.16815185546875, 0.17784500122070312, 0.18753814697265625, 0.19723129272460938, 0.2069244384765625, 0.21661758422851562, 0.22631072998046875, 0.23600387573242188, 0.245697021484375, 0.2553901672363281, 0.26508331298828125, 0.2747764587402344, 0.2844696044921875, 0.2941627502441406, 0.30385589599609375, 0.3135490417480469, 0.3232421875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 10.0, 30.0, 272.0, 561.0, 109.0, 22.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.65773010253906, -73.20014190673828, -71.74256134033203, -70.28497314453125, -68.82738494873047, -67.36979675292969, -65.91221618652344, -64.45462799072266, -62.997039794921875, -61.53945541381836, -60.08186721801758, -58.62428283691406, -57.16669464111328, -55.709110260009766, -54.25152587890625, -52.79393768310547, -51.33635330200195, -49.87876892089844, -48.421180725097656, -46.96359634399414, -45.50600814819336, -44.048423767089844, -42.59083557128906, -41.13325119018555, -39.67566680908203, -38.218082427978516, -36.760494232177734, -35.30290985107422, -33.84532165527344, -32.38773727416992, -30.930150985717773, -29.472564697265625, -28.014978408813477, -26.557392120361328, -25.09980583190918, -23.64221954345703, -22.184635162353516, -20.727046966552734, -19.26946258544922, -17.81187629699707, -16.354290008544922, -14.896703720092773, -13.439117431640625, -11.981532096862793, -10.523945808410645, -9.066359519958496, -7.608774185180664, -6.151187896728516, -4.693601608276367, -3.236015558242798, -1.7784295082092285, -0.3208436965942383, 1.1367425918579102, 2.5943288803100586, 4.051914215087891, 5.509500503540039, 6.9670867919921875, 8.424673080444336, 9.882259368896484, 11.339844703674316, 12.797430992126465, 14.255017280578613, 15.712602615356445, 17.170188903808594, 18.627775192260742]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 5.0, 3.0, 11.0, 10.0, 15.0, 17.0, 16.0, 18.0, 32.0, 23.0, 23.0, 30.0, 27.0, 36.0, 37.0, 37.0, 41.0, 29.0, 28.0, 42.0, 41.0, 40.0, 44.0, 36.0, 36.0, 27.0, 33.0, 35.0, 33.0, 23.0, 21.0, 20.0, 17.0, 15.0, 14.0, 12.0, 8.0, 10.0, 6.0, 9.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.958179473876953, -9.668221473693848, -9.378263473510742, -9.088306427001953, -8.798348426818848, -8.508390426635742, -8.218432426452637, -7.9284749031066895, -7.638517379760742, -7.348559379577637, -7.0586018562316895, -6.768643856048584, -6.478686332702637, -6.188728332519531, -5.898770332336426, -5.6088128089904785, -5.318854808807373, -5.028896808624268, -4.73893928527832, -4.448981285095215, -4.159023761749268, -3.869065761566162, -3.5791079998016357, -3.2891502380371094, -2.999192476272583, -2.7092347145080566, -2.4192769527435303, -2.129319190979004, -1.839361310005188, -1.5494035482406616, -1.2594456672668457, -0.9694879055023193, -0.679530143737793, -0.3895723521709442, -0.09961456060409546, 0.19034326076507568, 0.48030102252960205, 0.7702587842941284, 1.0602166652679443, 1.3501744270324707, 1.640132188796997, 1.9300899505615234, 2.22004771232605, 2.510005474090576, 2.7999634742736816, 3.089920997619629, 3.3798789978027344, 3.6698367595672607, 3.959794521331787, 4.249752521514893, 4.53971004486084, 4.829668045043945, 5.119625568389893, 5.409583568572998, 5.699541091918945, 5.989499092102051, 6.279457092285156, 6.569415092468262, 6.859372615814209, 7.1493306159973145, 7.439288139343262, 7.729246139526367, 8.019204139709473, 8.309162139892578, 8.599119186401367]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 6.0, 6.0, 9.0, 20.0, 20.0, 24.0, 33.0, 57.0, 81.0, 121.0, 177.0, 352.0, 760.0, 1709.0, 5195.0, 19824.0, 134807.0, 3394674.0, 573729.0, 47341.0, 9940.0, 3078.0, 1181.0, 490.0, 213.0, 110.0, 87.0, 62.0, 36.0, 29.0, 22.0, 15.0, 13.0, 11.0, 6.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.875, -6.6771240234375, -6.479248046875, -6.2813720703125, -6.08349609375, -5.8856201171875, -5.687744140625, -5.4898681640625, -5.2919921875, -5.0941162109375, -4.896240234375, -4.6983642578125, -4.50048828125, -4.3026123046875, -4.104736328125, -3.9068603515625, -3.708984375, -3.5111083984375, -3.313232421875, -3.1153564453125, -2.91748046875, -2.7196044921875, -2.521728515625, -2.3238525390625, -2.1259765625, -1.9281005859375, -1.730224609375, -1.5323486328125, -1.33447265625, -1.1365966796875, -0.938720703125, -0.7408447265625, -0.54296875, -0.3450927734375, -0.147216796875, 0.0506591796875, 0.24853515625, 0.4464111328125, 0.644287109375, 0.8421630859375, 1.0400390625, 1.2379150390625, 1.435791015625, 1.6336669921875, 1.83154296875, 2.0294189453125, 2.227294921875, 2.4251708984375, 2.623046875, 2.8209228515625, 3.018798828125, 3.2166748046875, 3.41455078125, 3.6124267578125, 3.810302734375, 4.0081787109375, 4.2060546875, 4.4039306640625, 4.601806640625, 4.7996826171875, 4.99755859375, 5.1954345703125, 5.393310546875, 5.5911865234375, 5.7890625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 15.0, 20.0, 28.0, 36.0, 69.0, 89.0, 108.0, 86.0, 110.0, 107.0, 85.0, 89.0, 34.0, 35.0, 20.0, 17.0, 10.0, 7.0, 5.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.02734375, -6.860626220703125, -6.69390869140625, -6.527191162109375, -6.3604736328125, -6.193756103515625, -6.02703857421875, -5.860321044921875, -5.693603515625, -5.526885986328125, -5.36016845703125, -5.193450927734375, -5.0267333984375, -4.860015869140625, -4.69329833984375, -4.526580810546875, -4.35986328125, -4.193145751953125, -4.02642822265625, -3.859710693359375, -3.6929931640625, -3.526275634765625, -3.35955810546875, -3.192840576171875, -3.026123046875, -2.859405517578125, -2.69268798828125, -2.525970458984375, -2.3592529296875, -2.192535400390625, -2.02581787109375, -1.859100341796875, -1.6923828125, -1.525665283203125, -1.35894775390625, -1.192230224609375, -1.0255126953125, -0.858795166015625, -0.69207763671875, -0.525360107421875, -0.358642578125, -0.191925048828125, -0.02520751953125, 0.141510009765625, 0.3082275390625, 0.474945068359375, 0.64166259765625, 0.808380126953125, 0.97509765625, 1.141815185546875, 1.30853271484375, 1.475250244140625, 1.6419677734375, 1.808685302734375, 1.97540283203125, 2.142120361328125, 2.308837890625, 2.475555419921875, 2.64227294921875, 2.808990478515625, 2.9757080078125, 3.142425537109375, 3.30914306640625, 3.475860595703125, 3.642578125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 26.0, 38.0, 70.0, 214.0, 1390.0, 572027.0, 3618297.0, 1784.0, 260.0, 101.0, 26.0, 18.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.90625, -39.07568359375, -38.2451171875, -37.41455078125, -36.583984375, -35.75341796875, -34.9228515625, -34.09228515625, -33.26171875, -32.43115234375, -31.6005859375, -30.77001953125, -29.939453125, -29.10888671875, -28.2783203125, -27.44775390625, -26.6171875, -25.78662109375, -24.9560546875, -24.12548828125, -23.294921875, -22.46435546875, -21.6337890625, -20.80322265625, -19.97265625, -19.14208984375, -18.3115234375, -17.48095703125, -16.650390625, -15.81982421875, -14.9892578125, -14.15869140625, -13.328125, -12.49755859375, -11.6669921875, -10.83642578125, -10.005859375, -9.17529296875, -8.3447265625, -7.51416015625, -6.68359375, -5.85302734375, -5.0224609375, -4.19189453125, -3.361328125, -2.53076171875, -1.7001953125, -0.86962890625, -0.0390625, 0.79150390625, 1.6220703125, 2.45263671875, 3.283203125, 4.11376953125, 4.9443359375, 5.77490234375, 6.60546875, 7.43603515625, 8.2666015625, 9.09716796875, 9.927734375, 10.75830078125, 11.5888671875, 12.41943359375, 13.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 11.0, 2.0, 8.0, 8.0, 12.0, 16.0, 20.0, 35.0, 33.0, 41.0, 54.0, 76.0, 84.0, 156.0, 204.0, 376.0, 787.0, 874.0, 411.0, 241.0, 201.0, 96.0, 83.0, 64.0, 54.0, 32.0, 23.0, 17.0, 14.0, 6.0, 5.0, 4.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1403121948242188, -1.1077728271484375, -1.0752334594726562, -1.042694091796875, -1.0101547241210938, -0.9776153564453125, -0.9450759887695312, -0.91253662109375, -0.8799972534179688, -0.8474578857421875, -0.8149185180664062, -0.782379150390625, -0.7498397827148438, -0.7173004150390625, -0.6847610473632812, -0.6522216796875, -0.6196823120117188, -0.5871429443359375, -0.5546035766601562, -0.522064208984375, -0.48952484130859375, -0.4569854736328125, -0.42444610595703125, -0.39190673828125, -0.35936737060546875, -0.3268280029296875, -0.29428863525390625, -0.261749267578125, -0.22920989990234375, -0.1966705322265625, -0.16413116455078125, -0.131591796875, -0.09905242919921875, -0.0665130615234375, -0.03397369384765625, -0.001434326171875, 0.03110504150390625, 0.0636444091796875, 0.09618377685546875, 0.12872314453125, 0.16126251220703125, 0.1938018798828125, 0.22634124755859375, 0.258880615234375, 0.29141998291015625, 0.3239593505859375, 0.35649871826171875, 0.3890380859375, 0.42157745361328125, 0.4541168212890625, 0.48665618896484375, 0.519195556640625, 0.5517349243164062, 0.5842742919921875, 0.6168136596679688, 0.64935302734375, 0.6818923950195312, 0.7144317626953125, 0.7469711303710938, 0.779510498046875, 0.8120498657226562, 0.8445892333984375, 0.8771286010742188, 0.90966796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 2.0, 5.0, 9.0, 23.0, 33.0, 69.0, 109.0, 204.0, 222.0, 152.0, 74.0, 36.0, 21.0, 13.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.142258644104004, -8.839942932128906, -8.537628173828125, -8.235312461853027, -7.932997226715088, -7.630681991577148, -7.328366279602051, -7.026051044464111, -6.723735809326172, -6.421420574188232, -6.119105339050293, -5.816789627075195, -5.514474391937256, -5.212159156799316, -4.909843444824219, -4.607528209686279, -4.30521297454834, -4.0028977394104, -3.700582265853882, -3.3982667922973633, -3.095951557159424, -2.7936363220214844, -2.491320848464966, -2.1890053749084473, -1.8866901397705078, -1.5843747854232788, -1.2820594310760498, -0.9797440767288208, -0.6774287223815918, -0.3751133680343628, -0.07279801368713379, 0.22951745986938477, 0.5318336486816406, 0.8341490030288696, 1.1364643573760986, 1.4387797117233276, 1.7410950660705566, 2.043410301208496, 2.3457257747650146, 2.648041248321533, 2.9503564834594727, 3.252671718597412, 3.5549871921539307, 3.857302665710449, 4.159617900848389, 4.461933135986328, 4.764248847961426, 5.066564083099365, 5.368879318237305, 5.671194553375244, 5.973509788513184, 6.275825500488281, 6.578140735626221, 6.88045597076416, 7.182771682739258, 7.485086917877197, 7.787402153015137, 8.089717864990234, 8.392032623291016, 8.694348335266113, 8.996664047241211, 9.298978805541992, 9.60129451751709, 9.903610229492188, 10.205924987792969]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 15.0, 15.0, 27.0, 31.0, 38.0, 63.0, 95.0, 105.0, 103.0, 92.0, 93.0, 88.0, 69.0, 46.0, 49.0, 26.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.074833393096924, -6.884274482727051, -6.693715572357178, -6.5031561851501465, -6.312597274780273, -6.1220383644104, -5.931479454040527, -5.740920066833496, -5.550361156463623, -5.35980224609375, -5.169243335723877, -4.978683948516846, -4.788125038146973, -4.5975661277771, -4.407007217407227, -4.216447830200195, -4.0258893966674805, -3.8353304862976074, -3.6447713375091553, -3.4542124271392822, -3.26365327835083, -3.073094367980957, -2.882535457611084, -2.691976308822632, -2.5014171600341797, -2.3108582496643066, -2.1202991008758545, -1.9297401905059814, -1.7391810417175293, -1.5486221313476562, -1.3580631017684937, -1.167504072189331, -0.9769449234008789, -0.7863858938217163, -0.5958268642425537, -0.4052678942680359, -0.2147088646888733, -0.024149835109710693, 0.16640913486480713, 0.3569681644439697, 0.5475271940231323, 0.7380862236022949, 0.9286452531814575, 1.1192042827606201, 1.3097631931304932, 1.5003223419189453, 1.6908812522888184, 1.881440281867981, 2.0719993114471436, 2.2625582218170166, 2.4531173706054688, 2.643676280975342, 2.834235429763794, 3.024794340133667, 3.215353488922119, 3.405912399291992, 3.5964713096618652, 3.7870302200317383, 3.9775893688201904, 4.168148517608643, 4.358707427978516, 4.549266338348389, 4.739825248718262, 4.930384635925293, 5.120943546295166]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 16.0, 23.0, 40.0, 78.0, 194.0, 541.0, 1771.0, 15990.0, 1006834.0, 20107.0, 2002.0, 527.0, 196.0, 96.0, 48.0, 22.0, 18.0, 14.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.396209716796875, -1.33929443359375, -1.282379150390625, -1.2254638671875, -1.168548583984375, -1.11163330078125, -1.054718017578125, -0.997802734375, -0.940887451171875, -0.88397216796875, -0.827056884765625, -0.7701416015625, -0.713226318359375, -0.65631103515625, -0.599395751953125, -0.54248046875, -0.485565185546875, -0.42864990234375, -0.371734619140625, -0.3148193359375, -0.257904052734375, -0.20098876953125, -0.144073486328125, -0.087158203125, -0.030242919921875, 0.02667236328125, 0.083587646484375, 0.1405029296875, 0.197418212890625, 0.25433349609375, 0.311248779296875, 0.3681640625, 0.425079345703125, 0.48199462890625, 0.538909912109375, 0.5958251953125, 0.652740478515625, 0.70965576171875, 0.766571044921875, 0.823486328125, 0.880401611328125, 0.93731689453125, 0.994232177734375, 1.0511474609375, 1.108062744140625, 1.16497802734375, 1.221893310546875, 1.27880859375, 1.335723876953125, 1.39263916015625, 1.449554443359375, 1.5064697265625, 1.563385009765625, 1.62030029296875, 1.677215576171875, 1.734130859375, 1.791046142578125, 1.84796142578125, 1.904876708984375, 1.9617919921875, 2.018707275390625, 2.07562255859375, 2.132537841796875, 2.189453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 11.0, 11.0, 15.0, 33.0, 42.0, 63.0, 99.0, 126.0, 140.0, 127.0, 99.0, 90.0, 55.0, 31.0, 23.0, 16.0, 7.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.467803955078125, -5.31842041015625, -5.169036865234375, -5.0196533203125, -4.870269775390625, -4.72088623046875, -4.571502685546875, -4.422119140625, -4.272735595703125, -4.12335205078125, -3.973968505859375, -3.8245849609375, -3.675201416015625, -3.52581787109375, -3.376434326171875, -3.22705078125, -3.077667236328125, -2.92828369140625, -2.778900146484375, -2.6295166015625, -2.480133056640625, -2.33074951171875, -2.181365966796875, -2.031982421875, -1.882598876953125, -1.73321533203125, -1.583831787109375, -1.4344482421875, -1.285064697265625, -1.13568115234375, -0.986297607421875, -0.8369140625, -0.687530517578125, -0.53814697265625, -0.388763427734375, -0.2393798828125, -0.089996337890625, 0.05938720703125, 0.208770751953125, 0.358154296875, 0.507537841796875, 0.65692138671875, 0.806304931640625, 0.9556884765625, 1.105072021484375, 1.25445556640625, 1.403839111328125, 1.55322265625, 1.702606201171875, 1.85198974609375, 2.001373291015625, 2.1507568359375, 2.300140380859375, 2.44952392578125, 2.598907470703125, 2.748291015625, 2.897674560546875, 3.04705810546875, 3.196441650390625, 3.3458251953125, 3.495208740234375, 3.64459228515625, 3.793975830078125, 3.943359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 5.0, 5.0, 8.0, 11.0, 18.0, 17.0, 26.0, 37.0, 50.0, 68.0, 72.0, 111.0, 142.0, 193.0, 259.0, 421.0, 879.0, 4023.0, 45402.0, 653801.0, 319543.0, 19284.0, 2157.0, 691.0, 372.0, 241.0, 175.0, 158.0, 98.0, 71.0, 58.0, 37.0, 35.0, 32.0, 19.0, 11.0, 7.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.393798828125, -0.3828086853027344, -0.37181854248046875, -0.3608283996582031, -0.3498382568359375, -0.3388481140136719, -0.32785797119140625, -0.3168678283691406, -0.305877685546875, -0.2948875427246094, -0.28389739990234375, -0.2729072570800781, -0.2619171142578125, -0.2509269714355469, -0.23993682861328125, -0.22894668579101562, -0.21795654296875, -0.20696640014648438, -0.19597625732421875, -0.18498611450195312, -0.1739959716796875, -0.16300582885742188, -0.15201568603515625, -0.14102554321289062, -0.130035400390625, -0.11904525756835938, -0.10805511474609375, -0.09706497192382812, -0.0860748291015625, -0.07508468627929688, -0.06409454345703125, -0.053104400634765625, -0.0421142578125, -0.031124114990234375, -0.02013397216796875, -0.009143829345703125, 0.0018463134765625, 0.012836456298828125, 0.02382659912109375, 0.034816741943359375, 0.045806884765625, 0.056797027587890625, 0.06778717041015625, 0.07877731323242188, 0.0897674560546875, 0.10075759887695312, 0.11174774169921875, 0.12273788452148438, 0.13372802734375, 0.14471817016601562, 0.15570831298828125, 0.16669845581054688, 0.1776885986328125, 0.18867874145507812, 0.19966888427734375, 0.21065902709960938, 0.221649169921875, 0.23263931274414062, 0.24362945556640625, 0.2546195983886719, 0.2656097412109375, 0.2765998840332031, 0.28759002685546875, 0.2985801696777344, 0.3095703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 13.0, 10.0, 11.0, 22.0, 19.0, 22.0, 26.0, 41.0, 33.0, 37.0, 34.0, 47.0, 51.0, 40.0, 46.0, 55.0, 41.0, 46.0, 50.0, 40.0, 46.0, 40.0, 46.0, 18.0, 31.0, 25.0, 20.0, 16.0, 11.0, 17.0, 6.0, 6.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.92578125, -3.8170166015625, -3.708251953125, -3.5994873046875, -3.49072265625, -3.3819580078125, -3.273193359375, -3.1644287109375, -3.0556640625, -2.9468994140625, -2.838134765625, -2.7293701171875, -2.62060546875, -2.5118408203125, -2.403076171875, -2.2943115234375, -2.185546875, -2.0767822265625, -1.968017578125, -1.8592529296875, -1.75048828125, -1.6417236328125, -1.532958984375, -1.4241943359375, -1.3154296875, -1.2066650390625, -1.097900390625, -0.9891357421875, -0.88037109375, -0.7716064453125, -0.662841796875, -0.5540771484375, -0.4453125, -0.3365478515625, -0.227783203125, -0.1190185546875, -0.01025390625, 0.0985107421875, 0.207275390625, 0.3160400390625, 0.4248046875, 0.5335693359375, 0.642333984375, 0.7510986328125, 0.85986328125, 0.9686279296875, 1.077392578125, 1.1861572265625, 1.294921875, 1.4036865234375, 1.512451171875, 1.6212158203125, 1.72998046875, 1.8387451171875, 1.947509765625, 2.0562744140625, 2.1650390625, 2.2738037109375, 2.382568359375, 2.4913330078125, 2.60009765625, 2.7088623046875, 2.817626953125, 2.9263916015625, 3.03515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 19.0, 14.0, 19.0, 39.0, 43.0, 59.0, 90.0, 95.0, 152.0, 192.0, 311.0, 654.0, 1990.0, 15504.0, 847556.0, 172525.0, 6496.0, 1347.0, 463.0, 290.0, 173.0, 129.0, 86.0, 75.0, 50.0, 34.0, 27.0, 22.0, 14.0, 22.0, 8.0, 3.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12922382354736328, -0.12551307678222656, -0.12180233001708984, -0.11809158325195312, -0.1143808364868164, -0.11067008972167969, -0.10695934295654297, -0.10324859619140625, -0.09953784942626953, -0.09582710266113281, -0.0921163558959961, -0.08840560913085938, -0.08469486236572266, -0.08098411560058594, -0.07727336883544922, -0.0735626220703125, -0.06985187530517578, -0.06614112854003906, -0.062430381774902344, -0.058719635009765625, -0.055008888244628906, -0.05129814147949219, -0.04758739471435547, -0.04387664794921875, -0.04016590118408203, -0.03645515441894531, -0.032744407653808594, -0.029033660888671875, -0.025322914123535156, -0.021612167358398438, -0.01790142059326172, -0.014190673828125, -0.010479927062988281, -0.0067691802978515625, -0.0030584335327148438, 0.000652313232421875, 0.004363059997558594, 0.008073806762695312, 0.011784553527832031, 0.01549530029296875, 0.01920604705810547, 0.022916793823242188, 0.026627540588378906, 0.030338287353515625, 0.034049034118652344, 0.03775978088378906, 0.04147052764892578, 0.0451812744140625, 0.04889202117919922, 0.05260276794433594, 0.056313514709472656, 0.060024261474609375, 0.0637350082397461, 0.06744575500488281, 0.07115650177001953, 0.07486724853515625, 0.07857799530029297, 0.08228874206542969, 0.0859994888305664, 0.08971023559570312, 0.09342098236083984, 0.09713172912597656, 0.10084247589111328, 0.10455322265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 14.0, 18.0, 19.0, 45.0, 44.0, 69.0, 83.0, 115.0, 122.0, 114.0, 98.0, 85.0, 57.0, 29.0, 13.0, 21.0, 9.0, 7.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61611557006836e-05, -6.457231938838959e-05, -6.298348307609558e-05, -6.139464676380157e-05, -5.980581045150757e-05, -5.821697413921356e-05, -5.6628137826919556e-05, -5.503930151462555e-05, -5.345046520233154e-05, -5.186162889003754e-05, -5.027279257774353e-05, -4.8683956265449524e-05, -4.709511995315552e-05, -4.550628364086151e-05, -4.3917447328567505e-05, -4.23286110162735e-05, -4.073977470397949e-05, -3.9150938391685486e-05, -3.756210207939148e-05, -3.597326576709747e-05, -3.438442945480347e-05, -3.279559314250946e-05, -3.1206756830215454e-05, -2.9617920517921448e-05, -2.802908420562744e-05, -2.6440247893333435e-05, -2.485141158103943e-05, -2.3262575268745422e-05, -2.1673738956451416e-05, -2.008490264415741e-05, -1.8496066331863403e-05, -1.6907230019569397e-05, -1.531839370727539e-05, -1.3729557394981384e-05, -1.2140721082687378e-05, -1.0551884770393372e-05, -8.963048458099365e-06, -7.374212145805359e-06, -5.7853758335113525e-06, -4.196539521217346e-06, -2.60770320892334e-06, -1.0188668966293335e-06, 5.699694156646729e-07, 2.158805727958679e-06, 3.7476420402526855e-06, 5.336478352546692e-06, 6.925314664840698e-06, 8.514150977134705e-06, 1.0102987289428711e-05, 1.1691823601722717e-05, 1.3280659914016724e-05, 1.486949622631073e-05, 1.6458332538604736e-05, 1.8047168850898743e-05, 1.963600516319275e-05, 2.1224841475486755e-05, 2.2813677787780762e-05, 2.4402514100074768e-05, 2.5991350412368774e-05, 2.758018672466278e-05, 2.9169023036956787e-05, 3.0757859349250793e-05, 3.23466956615448e-05, 3.3935531973838806e-05, 3.552436828613281e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 13.0, 23.0, 46.0, 114.0, 251.0, 739.0, 3012.0, 23061.0, 960526.0, 54588.0, 4502.0, 1020.0, 331.0, 142.0, 69.0, 31.0, 25.0, 18.0, 12.0, 8.0, 6.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21875, -0.21083450317382812, -0.20291900634765625, -0.19500350952148438, -0.1870880126953125, -0.17917251586914062, -0.17125701904296875, -0.16334152221679688, -0.155426025390625, -0.14751052856445312, -0.13959503173828125, -0.13167953491210938, -0.1237640380859375, -0.11584854125976562, -0.10793304443359375, -0.10001754760742188, -0.09210205078125, -0.08418655395507812, -0.07627105712890625, -0.06835556030273438, -0.0604400634765625, -0.052524566650390625, -0.04460906982421875, -0.036693572998046875, -0.028778076171875, -0.020862579345703125, -0.01294708251953125, -0.005031585693359375, 0.0028839111328125, 0.010799407958984375, 0.01871490478515625, 0.026630401611328125, 0.0345458984375, 0.042461395263671875, 0.05037689208984375, 0.058292388916015625, 0.0662078857421875, 0.07412338256835938, 0.08203887939453125, 0.08995437622070312, 0.097869873046875, 0.10578536987304688, 0.11370086669921875, 0.12161636352539062, 0.1295318603515625, 0.13744735717773438, 0.14536285400390625, 0.15327835083007812, 0.16119384765625, 0.16910934448242188, 0.17702484130859375, 0.18494033813476562, 0.1928558349609375, 0.20077133178710938, 0.20868682861328125, 0.21660232543945312, 0.224517822265625, 0.23243331909179688, 0.24034881591796875, 0.24826431274414062, 0.2561798095703125, 0.2640953063964844, 0.27201080322265625, 0.2799263000488281, 0.287841796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 9.0, 11.0, 22.0, 24.0, 31.0, 65.0, 135.0, 213.0, 189.0, 94.0, 46.0, 33.0, 25.0, 15.0, 18.0, 4.0, 12.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014862060546875, -0.014307260513305664, -0.013752460479736328, -0.013197660446166992, -0.012642860412597656, -0.01208806037902832, -0.011533260345458984, -0.010978460311889648, -0.010423660278320312, -0.009868860244750977, -0.00931406021118164, -0.008759260177612305, -0.008204460144042969, -0.007649660110473633, -0.007094860076904297, -0.006540060043334961, -0.005985260009765625, -0.005430459976196289, -0.004875659942626953, -0.004320859909057617, -0.0037660598754882812, -0.0032112598419189453, -0.0026564598083496094, -0.0021016597747802734, -0.0015468597412109375, -0.0009920597076416016, -0.0004372596740722656, 0.00011754035949707031, 0.0006723403930664062, 0.0012271404266357422, 0.0017819404602050781, 0.002336740493774414, 0.00289154052734375, 0.003446340560913086, 0.004001140594482422, 0.004555940628051758, 0.005110740661621094, 0.00566554069519043, 0.006220340728759766, 0.0067751407623291016, 0.0073299407958984375, 0.007884740829467773, 0.00843954086303711, 0.008994340896606445, 0.009549140930175781, 0.010103940963745117, 0.010658740997314453, 0.011213541030883789, 0.011768341064453125, 0.012323141098022461, 0.012877941131591797, 0.013432741165161133, 0.013987541198730469, 0.014542341232299805, 0.01509714126586914, 0.015651941299438477, 0.016206741333007812, 0.01676154136657715, 0.017316341400146484, 0.01787114143371582, 0.018425941467285156, 0.018980741500854492, 0.019535541534423828, 0.020090341567993164, 0.0206451416015625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 29.0, 45.0, 96.0, 223.0, 285.0, 154.0, 70.0, 38.0, 12.0, 13.0, 2.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.319628715515137, -8.090072631835938, -7.86051607131958, -7.630959510803223, -7.401403427124023, -7.171846866607666, -6.942290306091309, -6.712734222412109, -6.483177661895752, -6.2536211013793945, -6.024065017700195, -5.794508457183838, -5.5649518966674805, -5.335395812988281, -5.105839252471924, -4.876282691955566, -4.646726608276367, -4.41717004776001, -4.1876139640808105, -3.958057403564453, -3.728501081466675, -3.4989447593688965, -3.269388198852539, -3.0398318767547607, -2.8102755546569824, -2.580719232559204, -2.351162910461426, -2.1216063499450684, -1.89205002784729, -1.6624937057495117, -1.4329372644424438, -1.203380823135376, -0.9738240242004395, -0.7442676424980164, -0.5147112607955933, -0.28515487909317017, -0.05559849739074707, 0.17395782470703125, 0.4035142660140991, 0.633070707321167, 0.8626270294189453, 1.0921833515167236, 1.3217397928237915, 1.5512962341308594, 1.7808525562286377, 2.010408878326416, 2.2399654388427734, 2.4695217609405518, 2.69907808303833, 2.9286344051361084, 3.1581907272338867, 3.387747287750244, 3.6173036098480225, 3.846859931945801, 4.076416492462158, 4.305973052978516, 4.535529136657715, 4.765085697174072, 4.9946417808532715, 5.224198341369629, 5.453754425048828, 5.6833109855651855, 5.912867546081543, 6.142423629760742, 6.3719801902771]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 22.0, 23.0, 28.0, 48.0, 78.0, 129.0, 127.0, 132.0, 113.0, 99.0, 68.0, 52.0, 33.0, 20.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.416303634643555, -5.270781517028809, -5.1252593994140625, -4.979737281799316, -4.83421516418457, -4.688693046569824, -4.543170928955078, -4.39764928817749, -4.252127170562744, -4.106605052947998, -3.961082935333252, -3.815560817718506, -3.670038938522339, -3.5245168209075928, -3.3789947032928467, -3.2334728240966797, -3.0879504680633545, -2.9424283504486084, -2.7969062328338623, -2.6513843536376953, -2.505862236022949, -2.360340118408203, -2.214818000793457, -2.069295883178711, -1.9237738847732544, -1.7782517671585083, -1.6327297687530518, -1.4872076511383057, -1.3416855335235596, -1.196163535118103, -1.050641417503357, -0.9051194190979004, -0.7595973014831543, -0.614075243473053, -0.4685531556606293, -0.32303106784820557, -0.17750900983810425, -0.03198695182800293, 0.11353516578674316, 0.2590571641921997, 0.4045792818069458, 0.5501013398170471, 0.6956233978271484, 0.8411455154418945, 0.9866675734519958, 1.1321896314620972, 1.2777117490768433, 1.4232337474822998, 1.568755865097046, 1.714277982711792, 1.8597999811172485, 2.005321979522705, 2.150844097137451, 2.2963662147521973, 2.4418883323669434, 2.5874104499816895, 2.7329325675964355, 2.8784546852111816, 3.0239768028259277, 3.169498920440674, 3.315020799636841, 3.460542917251587, 3.606065034866333, 3.7515869140625, 3.897109031677246]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 8.0, 16.0, 22.0, 53.0, 88.0, 162.0, 350.0, 782.0, 2258.0, 6334.0, 25270.0, 146881.0, 690872.0, 141034.0, 24570.0, 6246.0, 2154.0, 793.0, 322.0, 141.0, 82.0, 43.0, 17.0, 20.0, 12.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.39654541015625, -3.2813720703125, -3.16619873046875, -3.051025390625, -2.93585205078125, -2.8206787109375, -2.70550537109375, -2.59033203125, -2.47515869140625, -2.3599853515625, -2.24481201171875, -2.129638671875, -2.01446533203125, -1.8992919921875, -1.78411865234375, -1.6689453125, -1.55377197265625, -1.4385986328125, -1.32342529296875, -1.208251953125, -1.09307861328125, -0.9779052734375, -0.86273193359375, -0.74755859375, -0.63238525390625, -0.5172119140625, -0.40203857421875, -0.286865234375, -0.17169189453125, -0.0565185546875, 0.05865478515625, 0.173828125, 0.28900146484375, 0.4041748046875, 0.51934814453125, 0.634521484375, 0.74969482421875, 0.8648681640625, 0.98004150390625, 1.09521484375, 1.21038818359375, 1.3255615234375, 1.44073486328125, 1.555908203125, 1.67108154296875, 1.7862548828125, 1.90142822265625, 2.0166015625, 2.13177490234375, 2.2469482421875, 2.36212158203125, 2.477294921875, 2.59246826171875, 2.7076416015625, 2.82281494140625, 2.93798828125, 3.05316162109375, 3.1683349609375, 3.28350830078125, 3.398681640625, 3.51385498046875, 3.6290283203125, 3.74420166015625, 3.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 16.0, 16.0, 28.0, 32.0, 52.0, 71.0, 108.0, 115.0, 96.0, 103.0, 102.0, 80.0, 55.0, 32.0, 35.0, 14.0, 8.0, 9.0, 2.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -8.9964599609375, -8.727294921875, -8.4581298828125, -8.18896484375, -7.9197998046875, -7.650634765625, -7.3814697265625, -7.1123046875, -6.8431396484375, -6.573974609375, -6.3048095703125, -6.03564453125, -5.7664794921875, -5.497314453125, -5.2281494140625, -4.958984375, -4.6898193359375, -4.420654296875, -4.1514892578125, -3.88232421875, -3.6131591796875, -3.343994140625, -3.0748291015625, -2.8056640625, -2.5364990234375, -2.267333984375, -1.9981689453125, -1.72900390625, -1.4598388671875, -1.190673828125, -0.9215087890625, -0.65234375, -0.3831787109375, -0.114013671875, 0.1551513671875, 0.42431640625, 0.6934814453125, 0.962646484375, 1.2318115234375, 1.5009765625, 1.7701416015625, 2.039306640625, 2.3084716796875, 2.57763671875, 2.8468017578125, 3.115966796875, 3.3851318359375, 3.654296875, 3.9234619140625, 4.192626953125, 4.4617919921875, 4.73095703125, 5.0001220703125, 5.269287109375, 5.5384521484375, 5.8076171875, 6.0767822265625, 6.345947265625, 6.6151123046875, 6.88427734375, 7.1534423828125, 7.422607421875, 7.6917724609375, 7.9609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 11.0, 13.0, 19.0, 14.0, 18.0, 23.0, 29.0, 32.0, 24.0, 23.0, 43.0, 46.0, 67.0, 212.0, 3767.0, 1012381.0, 30751.0, 572.0, 116.0, 58.0, 43.0, 36.0, 36.0, 29.0, 25.0, 32.0, 18.0, 14.0, 18.0, 12.0, 12.0, 6.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.125, -14.7012939453125, -14.277587890625, -13.8538818359375, -13.43017578125, -13.0064697265625, -12.582763671875, -12.1590576171875, -11.7353515625, -11.3116455078125, -10.887939453125, -10.4642333984375, -10.04052734375, -9.6168212890625, -9.193115234375, -8.7694091796875, -8.345703125, -7.9219970703125, -7.498291015625, -7.0745849609375, -6.65087890625, -6.2271728515625, -5.803466796875, -5.3797607421875, -4.9560546875, -4.5323486328125, -4.108642578125, -3.6849365234375, -3.26123046875, -2.8375244140625, -2.413818359375, -1.9901123046875, -1.56640625, -1.1427001953125, -0.718994140625, -0.2952880859375, 0.12841796875, 0.5521240234375, 0.975830078125, 1.3995361328125, 1.8232421875, 2.2469482421875, 2.670654296875, 3.0943603515625, 3.51806640625, 3.9417724609375, 4.365478515625, 4.7891845703125, 5.212890625, 5.6365966796875, 6.060302734375, 6.4840087890625, 6.90771484375, 7.3314208984375, 7.755126953125, 8.1788330078125, 8.6025390625, 9.0262451171875, 9.449951171875, 9.8736572265625, 10.29736328125, 10.7210693359375, 11.144775390625, 11.5684814453125, 11.9921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 9.0, 6.0, 11.0, 11.0, 15.0, 23.0, 19.0, 26.0, 19.0, 23.0, 39.0, 25.0, 32.0, 37.0, 38.0, 52.0, 43.0, 52.0, 40.0, 35.0, 58.0, 34.0, 47.0, 37.0, 29.0, 31.0, 25.0, 30.0, 28.0, 20.0, 17.0, 11.0, 11.0, 11.0, 6.0, 15.0, 5.0, 4.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.890625, -4.7554931640625, -4.620361328125, -4.4852294921875, -4.35009765625, -4.2149658203125, -4.079833984375, -3.9447021484375, -3.8095703125, -3.6744384765625, -3.539306640625, -3.4041748046875, -3.26904296875, -3.1339111328125, -2.998779296875, -2.8636474609375, -2.728515625, -2.5933837890625, -2.458251953125, -2.3231201171875, -2.18798828125, -2.0528564453125, -1.917724609375, -1.7825927734375, -1.6474609375, -1.5123291015625, -1.377197265625, -1.2420654296875, -1.10693359375, -0.9718017578125, -0.836669921875, -0.7015380859375, -0.56640625, -0.4312744140625, -0.296142578125, -0.1610107421875, -0.02587890625, 0.1092529296875, 0.244384765625, 0.3795166015625, 0.5146484375, 0.6497802734375, 0.784912109375, 0.9200439453125, 1.05517578125, 1.1903076171875, 1.325439453125, 1.4605712890625, 1.595703125, 1.7308349609375, 1.865966796875, 2.0010986328125, 2.13623046875, 2.2713623046875, 2.406494140625, 2.5416259765625, 2.6767578125, 2.8118896484375, 2.947021484375, 3.0821533203125, 3.21728515625, 3.3524169921875, 3.487548828125, 3.6226806640625, 3.7578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 10.0, 6.0, 18.0, 17.0, 52.0, 64.0, 136.0, 247.0, 568.0, 1527.0, 5046.0, 23871.0, 201854.0, 728683.0, 70499.0, 11336.0, 2753.0, 1002.0, 389.0, 201.0, 104.0, 62.0, 31.0, 19.0, 15.0, 8.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.6279296875, -1.584259033203125, -1.54058837890625, -1.496917724609375, -1.4532470703125, -1.409576416015625, -1.36590576171875, -1.322235107421875, -1.278564453125, -1.234893798828125, -1.19122314453125, -1.147552490234375, -1.1038818359375, -1.060211181640625, -1.01654052734375, -0.972869873046875, -0.92919921875, -0.885528564453125, -0.84185791015625, -0.798187255859375, -0.7545166015625, -0.710845947265625, -0.66717529296875, -0.623504638671875, -0.579833984375, -0.536163330078125, -0.49249267578125, -0.448822021484375, -0.4051513671875, -0.361480712890625, -0.31781005859375, -0.274139404296875, -0.23046875, -0.186798095703125, -0.14312744140625, -0.099456787109375, -0.0557861328125, -0.012115478515625, 0.03155517578125, 0.075225830078125, 0.118896484375, 0.162567138671875, 0.20623779296875, 0.249908447265625, 0.2935791015625, 0.337249755859375, 0.38092041015625, 0.424591064453125, 0.46826171875, 0.511932373046875, 0.55560302734375, 0.599273681640625, 0.6429443359375, 0.686614990234375, 0.73028564453125, 0.773956298828125, 0.817626953125, 0.861297607421875, 0.90496826171875, 0.948638916015625, 0.9923095703125, 1.035980224609375, 1.07965087890625, 1.123321533203125, 1.1669921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 12.0, 16.0, 22.0, 38.0, 48.0, 55.0, 67.0, 75.0, 104.0, 105.0, 87.0, 58.0, 60.0, 49.0, 27.0, 27.0, 28.0, 13.0, 10.0, 17.0, 10.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00015115737915039062, -0.00014696363359689713, -0.00014276988804340363, -0.00013857614248991013, -0.00013438239693641663, -0.00013018865138292313, -0.00012599490582942963, -0.00012180116027593613, -0.00011760741472244263, -0.00011341366916894913, -0.00010921992361545563, -0.00010502617806196213, -0.00010083243250846863, -9.663868695497513e-05, -9.244494140148163e-05, -8.825119584798813e-05, -8.405745029449463e-05, -7.986370474100113e-05, -7.566995918750763e-05, -7.147621363401413e-05, -6.728246808052063e-05, -6.308872252702713e-05, -5.889497697353363e-05, -5.470123142004013e-05, -5.050748586654663e-05, -4.631374031305313e-05, -4.211999475955963e-05, -3.792624920606613e-05, -3.373250365257263e-05, -2.9538758099079132e-05, -2.5345012545585632e-05, -2.1151266992092133e-05, -1.6957521438598633e-05, -1.2763775885105133e-05, -8.570030331611633e-06, -4.3762847781181335e-06, -1.825392246246338e-07, 4.011206328868866e-06, 8.204951882362366e-06, 1.2398697435855865e-05, 1.6592442989349365e-05, 2.0786188542842865e-05, 2.4979934096336365e-05, 2.9173679649829865e-05, 3.3367425203323364e-05, 3.7561170756816864e-05, 4.1754916310310364e-05, 4.5948661863803864e-05, 5.014240741729736e-05, 5.433615297079086e-05, 5.852989852428436e-05, 6.272364407777786e-05, 6.691738963127136e-05, 7.111113518476486e-05, 7.530488073825836e-05, 7.949862629175186e-05, 8.369237184524536e-05, 8.788611739873886e-05, 9.207986295223236e-05, 9.627360850572586e-05, 0.00010046735405921936, 0.00010466109961271286, 0.00010885484516620636, 0.00011304859071969986, 0.00011724233627319336]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 13.0, 13.0, 26.0, 35.0, 46.0, 75.0, 102.0, 196.0, 392.0, 885.0, 2099.0, 6110.0, 22624.0, 121482.0, 703657.0, 152688.0, 26844.0, 7010.0, 2269.0, 984.0, 411.0, 238.0, 126.0, 86.0, 43.0, 37.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.939453125, -0.90655517578125, -0.8736572265625, -0.84075927734375, -0.807861328125, -0.77496337890625, -0.7420654296875, -0.70916748046875, -0.67626953125, -0.64337158203125, -0.6104736328125, -0.57757568359375, -0.544677734375, -0.51177978515625, -0.4788818359375, -0.44598388671875, -0.4130859375, -0.38018798828125, -0.3472900390625, -0.31439208984375, -0.281494140625, -0.24859619140625, -0.2156982421875, -0.18280029296875, -0.14990234375, -0.11700439453125, -0.0841064453125, -0.05120849609375, -0.018310546875, 0.01458740234375, 0.0474853515625, 0.08038330078125, 0.11328125, 0.14617919921875, 0.1790771484375, 0.21197509765625, 0.244873046875, 0.27777099609375, 0.3106689453125, 0.34356689453125, 0.37646484375, 0.40936279296875, 0.4422607421875, 0.47515869140625, 0.508056640625, 0.54095458984375, 0.5738525390625, 0.60675048828125, 0.6396484375, 0.67254638671875, 0.7054443359375, 0.73834228515625, 0.771240234375, 0.80413818359375, 0.8370361328125, 0.86993408203125, 0.90283203125, 0.93572998046875, 0.9686279296875, 1.00152587890625, 1.034423828125, 1.06732177734375, 1.1002197265625, 1.13311767578125, 1.166015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 28.0, 25.0, 46.0, 68.0, 107.0, 152.0, 152.0, 128.0, 84.0, 44.0, 42.0, 31.0, 18.0, 7.0, 5.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5000381469726562, -0.4810333251953125, -0.46202850341796875, -0.443023681640625, -0.42401885986328125, -0.4050140380859375, -0.38600921630859375, -0.36700439453125, -0.34799957275390625, -0.3289947509765625, -0.30998992919921875, -0.290985107421875, -0.27198028564453125, -0.2529754638671875, -0.23397064208984375, -0.2149658203125, -0.19596099853515625, -0.1769561767578125, -0.15795135498046875, -0.138946533203125, -0.11994171142578125, -0.1009368896484375, -0.08193206787109375, -0.06292724609375, -0.04392242431640625, -0.0249176025390625, -0.00591278076171875, 0.013092041015625, 0.03209686279296875, 0.0511016845703125, 0.07010650634765625, 0.089111328125, 0.10811614990234375, 0.1271209716796875, 0.14612579345703125, 0.165130615234375, 0.18413543701171875, 0.2031402587890625, 0.22214508056640625, 0.24114990234375, 0.26015472412109375, 0.2791595458984375, 0.29816436767578125, 0.317169189453125, 0.33617401123046875, 0.3551788330078125, 0.37418365478515625, 0.3931884765625, 0.41219329833984375, 0.4311981201171875, 0.45020294189453125, 0.469207763671875, 0.48821258544921875, 0.5072174072265625, 0.5262222290039062, 0.54522705078125, 0.5642318725585938, 0.5832366943359375, 0.6022415161132812, 0.621246337890625, 0.6402511596679688, 0.6592559814453125, 0.6782608032226562, 0.697265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 34.0, 185.0, 526.0, 197.0, 35.0, 13.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-55.455902099609375, -54.43771743774414, -53.41952896118164, -52.401344299316406, -51.383155822753906, -50.36497116088867, -49.34678649902344, -48.32859802246094, -47.3104133605957, -46.29222869873047, -45.27404022216797, -44.255855560302734, -43.2376708984375, -42.219482421875, -41.201297760009766, -40.183109283447266, -39.16492462158203, -38.1467399597168, -37.1285514831543, -36.11036682128906, -35.09217834472656, -34.07399368286133, -33.055809020996094, -32.037620544433594, -31.01943588256836, -30.001249313354492, -28.983062744140625, -27.96487808227539, -26.946691513061523, -25.928504943847656, -24.910320281982422, -23.892133712768555, -22.873950958251953, -21.855764389038086, -20.83757781982422, -19.819393157958984, -18.801206588745117, -17.78302001953125, -16.764835357666016, -15.746648788452148, -14.728461265563965, -13.710275650024414, -12.692089080810547, -11.67390251159668, -10.655716896057129, -9.637531280517578, -8.619344711303711, -7.601158618927002, -6.582972526550293, -5.564786434173584, -4.546600341796875, -3.528414249420166, -2.510228157043457, -1.492042064666748, -0.47385597229003906, 0.5443301200866699, 1.562516212463379, 2.580702304840088, 3.598888397216797, 4.617074489593506, 5.635260581970215, 6.653446674346924, 7.671632766723633, 8.6898193359375, 9.70800495147705]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 13.0, 8.0, 13.0, 15.0, 26.0, 31.0, 34.0, 46.0, 47.0, 58.0, 58.0, 63.0, 69.0, 68.0, 57.0, 53.0, 49.0, 58.0, 40.0, 23.0, 28.0, 25.0, 27.0, 25.0, 11.0, 8.0, 9.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.137054443359375, -8.83527660369873, -8.533498764038086, -8.231721878051758, -7.929944038391113, -7.628166198730469, -7.326388835906982, -7.024611473083496, -6.722833633422852, -6.421055793762207, -6.119278430938721, -5.817501068115234, -5.51572322845459, -5.213945388793945, -4.912168025970459, -4.610390663146973, -4.308612823486328, -4.006834983825684, -3.7050576210021973, -3.403280019760132, -3.1015024185180664, -2.799724817276001, -2.4979472160339355, -2.19616961479187, -1.8943920135498047, -1.5926144123077393, -1.2908368110656738, -0.9890592098236084, -0.687281608581543, -0.38550400733947754, -0.08372640609741211, 0.21805119514465332, 0.5198287963867188, 0.8216063976287842, 1.1233839988708496, 1.425161600112915, 1.7269392013549805, 2.028716802597046, 2.3304944038391113, 2.6322720050811768, 2.934049606323242, 3.2358272075653076, 3.537604808807373, 3.8393824100494385, 4.141160011291504, 4.442937850952148, 4.744715213775635, 5.046492576599121, 5.348270416259766, 5.65004825592041, 5.9518256187438965, 6.253602981567383, 6.555380821228027, 6.857158660888672, 7.158936023712158, 7.4607133865356445, 7.762491226196289, 8.064269065856934, 8.366046905517578, 8.667823791503906, 8.96960163116455, 9.271379470825195, 9.573156356811523, 9.874934196472168, 10.176712036132812]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 8.0, 14.0, 12.0, 8.0, 21.0, 16.0, 26.0, 34.0, 41.0, 44.0, 74.0, 155.0, 642.0, 3474.0, 42414.0, 3751925.0, 380710.0, 12305.0, 1595.0, 368.0, 115.0, 62.0, 34.0, 25.0, 26.0, 26.0, 22.0, 10.0, 10.0, 5.0, 7.0, 12.0, 6.0, 8.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1015625, -8.7738037109375, -8.446044921875, -8.1182861328125, -7.79052734375, -7.4627685546875, -7.135009765625, -6.8072509765625, -6.4794921875, -6.1517333984375, -5.823974609375, -5.4962158203125, -5.16845703125, -4.8406982421875, -4.512939453125, -4.1851806640625, -3.857421875, -3.5296630859375, -3.201904296875, -2.8741455078125, -2.54638671875, -2.2186279296875, -1.890869140625, -1.5631103515625, -1.2353515625, -0.9075927734375, -0.579833984375, -0.2520751953125, 0.07568359375, 0.4034423828125, 0.731201171875, 1.0589599609375, 1.38671875, 1.7144775390625, 2.042236328125, 2.3699951171875, 2.69775390625, 3.0255126953125, 3.353271484375, 3.6810302734375, 4.0087890625, 4.3365478515625, 4.664306640625, 4.9920654296875, 5.31982421875, 5.6475830078125, 5.975341796875, 6.3031005859375, 6.630859375, 6.9586181640625, 7.286376953125, 7.6141357421875, 7.94189453125, 8.2696533203125, 8.597412109375, 8.9251708984375, 9.2529296875, 9.5806884765625, 9.908447265625, 10.2362060546875, 10.56396484375, 10.8917236328125, 11.219482421875, 11.5472412109375, 11.875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 7.0, 9.0, 12.0, 20.0, 42.0, 64.0, 67.0, 101.0, 119.0, 133.0, 128.0, 98.0, 73.0, 49.0, 22.0, 29.0, 14.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.07904052734375, -6.9080810546875, -6.73712158203125, -6.566162109375, -6.39520263671875, -6.2242431640625, -6.05328369140625, -5.88232421875, -5.71136474609375, -5.5404052734375, -5.36944580078125, -5.198486328125, -5.02752685546875, -4.8565673828125, -4.68560791015625, -4.5146484375, -4.34368896484375, -4.1727294921875, -4.00177001953125, -3.830810546875, -3.65985107421875, -3.4888916015625, -3.31793212890625, -3.14697265625, -2.97601318359375, -2.8050537109375, -2.63409423828125, -2.463134765625, -2.29217529296875, -2.1212158203125, -1.95025634765625, -1.779296875, -1.60833740234375, -1.4373779296875, -1.26641845703125, -1.095458984375, -0.92449951171875, -0.7535400390625, -0.58258056640625, -0.41162109375, -0.24066162109375, -0.0697021484375, 0.10125732421875, 0.272216796875, 0.44317626953125, 0.6141357421875, 0.78509521484375, 0.9560546875, 1.12701416015625, 1.2979736328125, 1.46893310546875, 1.639892578125, 1.81085205078125, 1.9818115234375, 2.15277099609375, 2.32373046875, 2.49468994140625, 2.6656494140625, 2.83660888671875, 3.007568359375, 3.17852783203125, 3.3494873046875, 3.52044677734375, 3.69140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 18.0, 17.0, 55.0, 183.0, 956.0, 308804.0, 3882414.0, 1484.0, 207.0, 70.0, 29.0, 15.0, 12.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.171875, -27.2939453125, -26.416015625, -25.5380859375, -24.66015625, -23.7822265625, -22.904296875, -22.0263671875, -21.1484375, -20.2705078125, -19.392578125, -18.5146484375, -17.63671875, -16.7587890625, -15.880859375, -15.0029296875, -14.125, -13.2470703125, -12.369140625, -11.4912109375, -10.61328125, -9.7353515625, -8.857421875, -7.9794921875, -7.1015625, -6.2236328125, -5.345703125, -4.4677734375, -3.58984375, -2.7119140625, -1.833984375, -0.9560546875, -0.078125, 0.7998046875, 1.677734375, 2.5556640625, 3.43359375, 4.3115234375, 5.189453125, 6.0673828125, 6.9453125, 7.8232421875, 8.701171875, 9.5791015625, 10.45703125, 11.3349609375, 12.212890625, 13.0908203125, 13.96875, 14.8466796875, 15.724609375, 16.6025390625, 17.48046875, 18.3583984375, 19.236328125, 20.1142578125, 20.9921875, 21.8701171875, 22.748046875, 23.6259765625, 24.50390625, 25.3818359375, 26.259765625, 27.1376953125, 28.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 12.0, 23.0, 38.0, 59.0, 71.0, 92.0, 130.0, 186.0, 315.0, 608.0, 967.0, 533.0, 314.0, 218.0, 128.0, 95.0, 74.0, 39.0, 29.0, 24.0, 18.0, 13.0, 11.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.002532958984375, -0.96600341796875, -0.929473876953125, -0.8929443359375, -0.856414794921875, -0.81988525390625, -0.783355712890625, -0.746826171875, -0.710296630859375, -0.67376708984375, -0.637237548828125, -0.6007080078125, -0.564178466796875, -0.52764892578125, -0.491119384765625, -0.45458984375, -0.418060302734375, -0.38153076171875, -0.345001220703125, -0.3084716796875, -0.271942138671875, -0.23541259765625, -0.198883056640625, -0.162353515625, -0.125823974609375, -0.08929443359375, -0.052764892578125, -0.0162353515625, 0.020294189453125, 0.05682373046875, 0.093353271484375, 0.1298828125, 0.166412353515625, 0.20294189453125, 0.239471435546875, 0.2760009765625, 0.312530517578125, 0.34906005859375, 0.385589599609375, 0.422119140625, 0.458648681640625, 0.49517822265625, 0.531707763671875, 0.5682373046875, 0.604766845703125, 0.64129638671875, 0.677825927734375, 0.71435546875, 0.750885009765625, 0.78741455078125, 0.823944091796875, 0.8604736328125, 0.897003173828125, 0.93353271484375, 0.970062255859375, 1.006591796875, 1.043121337890625, 1.07965087890625, 1.116180419921875, 1.1527099609375, 1.189239501953125, 1.22576904296875, 1.262298583984375, 1.298828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 18.0, 23.0, 32.0, 53.0, 84.0, 113.0, 144.0, 138.0, 126.0, 72.0, 65.0, 37.0, 15.0, 16.0, 12.0, 7.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.720313549041748, -4.545834064483643, -4.371354579925537, -4.196875095367432, -4.022396087646484, -3.8479163646698, -3.6734371185302734, -3.498957633972168, -3.3244781494140625, -3.149998664855957, -2.9755191802978516, -2.801039934158325, -2.6265604496002197, -2.4520809650421143, -2.277601718902588, -2.1031222343444824, -1.928642749786377, -1.7541632652282715, -1.5796838998794556, -1.4052045345306396, -1.2307250499725342, -1.0562455654144287, -0.8817662000656128, -0.7072868347167969, -0.5328073501586914, -0.3583279252052307, -0.18384850025177002, -0.009369075298309326, 0.16511034965515137, 0.33958977460861206, 0.5140691995620728, 0.6885485649108887, 0.8630285263061523, 1.0375080108642578, 1.2119873762130737, 1.3864667415618896, 1.5609462261199951, 1.7354257106781006, 1.9099050760269165, 2.0843844413757324, 2.258863925933838, 2.4333434104919434, 2.607822895050049, 2.782302141189575, 2.9567816257476807, 3.131261110305786, 3.3057403564453125, 3.480219841003418, 3.6546993255615234, 3.829178810119629, 4.003658294677734, 4.17813777923584, 4.352617263793945, 4.527096271514893, 4.701575756072998, 4.8760552406311035, 5.050534725189209, 5.2250142097473145, 5.39949369430542, 5.573973178863525, 5.748452186584473, 5.922931671142578, 6.097411155700684, 6.271890640258789, 6.4463701248168945]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 6.0, 16.0, 29.0, 42.0, 60.0, 53.0, 93.0, 84.0, 111.0, 95.0, 90.0, 67.0, 78.0, 49.0, 31.0, 22.0, 25.0, 15.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.394373416900635, -6.220241546630859, -6.046109199523926, -5.87197732925415, -5.697845458984375, -5.523713111877441, -5.349581241607666, -5.175449371337891, -5.001317024230957, -4.827185153961182, -4.653052806854248, -4.478920936584473, -4.304789066314697, -4.130657196044922, -3.9565248489379883, -3.782392978668213, -3.6082611083984375, -3.434128999710083, -3.2599971294403076, -3.085865020751953, -2.9117331504821777, -2.7376010417938232, -2.5634689331054688, -2.3893370628356934, -2.215204954147339, -2.0410728454589844, -1.866940975189209, -1.6928088665008545, -1.5186768770217896, -1.3445448875427246, -1.1704127788543701, -0.9962807893753052, -0.8221492767333984, -0.6480172872543335, -0.4738852381706238, -0.29975318908691406, -0.12562119960784912, 0.04851078987121582, 0.2226428985595703, 0.39677488803863525, 0.5709068775177002, 0.7450388669967651, 0.9191709160804749, 1.0933029651641846, 1.2674349546432495, 1.4415669441223145, 1.615699052810669, 1.7898310422897339, 1.9639630317687988, 2.1380951404571533, 2.3122270107269287, 2.486359119415283, 2.6604909896850586, 2.834623098373413, 3.0087552070617676, 3.182887077331543, 3.3570191860198975, 3.531151294708252, 3.7052831649780273, 3.879415273666382, 4.053547382354736, 4.227679252624512, 4.401811599731445, 4.575943470001221, 4.750075340270996]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 13.0, 12.0, 14.0, 25.0, 43.0, 87.0, 179.0, 514.0, 1607.0, 14641.0, 980156.0, 47379.0, 2697.0, 671.0, 239.0, 111.0, 65.0, 31.0, 21.0, 21.0, 8.0, 6.0, 4.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3971710205078125, -1.356842041015625, -1.3165130615234375, -1.27618408203125, -1.2358551025390625, -1.195526123046875, -1.1551971435546875, -1.1148681640625, -1.0745391845703125, -1.034210205078125, -0.9938812255859375, -0.95355224609375, -0.9132232666015625, -0.872894287109375, -0.8325653076171875, -0.792236328125, -0.7519073486328125, -0.711578369140625, -0.6712493896484375, -0.63092041015625, -0.5905914306640625, -0.550262451171875, -0.5099334716796875, -0.4696044921875, -0.4292755126953125, -0.388946533203125, -0.3486175537109375, -0.30828857421875, -0.2679595947265625, -0.227630615234375, -0.1873016357421875, -0.14697265625, -0.1066436767578125, -0.066314697265625, -0.0259857177734375, 0.01434326171875, 0.0546722412109375, 0.095001220703125, 0.1353302001953125, 0.1756591796875, 0.2159881591796875, 0.256317138671875, 0.2966461181640625, 0.33697509765625, 0.3773040771484375, 0.417633056640625, 0.4579620361328125, 0.498291015625, 0.5386199951171875, 0.578948974609375, 0.6192779541015625, 0.65960693359375, 0.6999359130859375, 0.740264892578125, 0.7805938720703125, 0.8209228515625, 0.8612518310546875, 0.901580810546875, 0.9419097900390625, 0.98223876953125, 1.0225677490234375, 1.062896728515625, 1.1032257080078125, 1.1435546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 10.0, 13.0, 30.0, 46.0, 76.0, 79.0, 104.0, 129.0, 105.0, 113.0, 89.0, 55.0, 40.0, 28.0, 21.0, 15.0, 8.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.4813232421875, -4.353271484375, -4.2252197265625, -4.09716796875, -3.9691162109375, -3.841064453125, -3.7130126953125, -3.5849609375, -3.4569091796875, -3.328857421875, -3.2008056640625, -3.07275390625, -2.9447021484375, -2.816650390625, -2.6885986328125, -2.560546875, -2.4324951171875, -2.304443359375, -2.1763916015625, -2.04833984375, -1.9202880859375, -1.792236328125, -1.6641845703125, -1.5361328125, -1.4080810546875, -1.280029296875, -1.1519775390625, -1.02392578125, -0.8958740234375, -0.767822265625, -0.6397705078125, -0.51171875, -0.3836669921875, -0.255615234375, -0.1275634765625, 0.00048828125, 0.1285400390625, 0.256591796875, 0.3846435546875, 0.5126953125, 0.6407470703125, 0.768798828125, 0.8968505859375, 1.02490234375, 1.1529541015625, 1.281005859375, 1.4090576171875, 1.537109375, 1.6651611328125, 1.793212890625, 1.9212646484375, 2.04931640625, 2.1773681640625, 2.305419921875, 2.4334716796875, 2.5615234375, 2.6895751953125, 2.817626953125, 2.9456787109375, 3.07373046875, 3.2017822265625, 3.329833984375, 3.4578857421875, 3.5859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 15.0, 14.0, 22.0, 21.0, 37.0, 55.0, 65.0, 60.0, 99.0, 145.0, 199.0, 308.0, 449.0, 941.0, 3785.0, 40511.0, 622197.0, 354332.0, 20653.0, 2556.0, 721.0, 405.0, 281.0, 180.0, 114.0, 78.0, 64.0, 57.0, 38.0, 25.0, 22.0, 9.0, 20.0, 13.0, 12.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.384521484375, -0.37380218505859375, -0.3630828857421875, -0.35236358642578125, -0.341644287109375, -0.33092498779296875, -0.3202056884765625, -0.30948638916015625, -0.29876708984375, -0.28804779052734375, -0.2773284912109375, -0.26660919189453125, -0.255889892578125, -0.24517059326171875, -0.2344512939453125, -0.22373199462890625, -0.2130126953125, -0.20229339599609375, -0.1915740966796875, -0.18085479736328125, -0.170135498046875, -0.15941619873046875, -0.1486968994140625, -0.13797760009765625, -0.12725830078125, -0.11653900146484375, -0.1058197021484375, -0.09510040283203125, -0.084381103515625, -0.07366180419921875, -0.0629425048828125, -0.05222320556640625, -0.04150390625, -0.03078460693359375, -0.0200653076171875, -0.00934600830078125, 0.001373291015625, 0.01209259033203125, 0.0228118896484375, 0.03353118896484375, 0.04425048828125, 0.05496978759765625, 0.0656890869140625, 0.07640838623046875, 0.087127685546875, 0.09784698486328125, 0.1085662841796875, 0.11928558349609375, 0.1300048828125, 0.14072418212890625, 0.1514434814453125, 0.16216278076171875, 0.172882080078125, 0.18360137939453125, 0.1943206787109375, 0.20503997802734375, 0.21575927734375, 0.22647857666015625, 0.2371978759765625, 0.24791717529296875, 0.258636474609375, 0.26935577392578125, 0.2800750732421875, 0.29079437255859375, 0.301513671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 11.0, 6.0, 20.0, 11.0, 11.0, 18.0, 22.0, 32.0, 32.0, 32.0, 29.0, 48.0, 44.0, 38.0, 37.0, 41.0, 54.0, 43.0, 55.0, 50.0, 38.0, 43.0, 48.0, 34.0, 33.0, 25.0, 22.0, 16.0, 11.0, 11.0, 13.0, 13.0, 7.0, 13.0, 4.0, 5.0, 4.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.39453125, -3.292022705078125, -3.18951416015625, -3.087005615234375, -2.9844970703125, -2.881988525390625, -2.77947998046875, -2.676971435546875, -2.574462890625, -2.471954345703125, -2.36944580078125, -2.266937255859375, -2.1644287109375, -2.061920166015625, -1.95941162109375, -1.856903076171875, -1.75439453125, -1.651885986328125, -1.54937744140625, -1.446868896484375, -1.3443603515625, -1.241851806640625, -1.13934326171875, -1.036834716796875, -0.934326171875, -0.831817626953125, -0.72930908203125, -0.626800537109375, -0.5242919921875, -0.421783447265625, -0.31927490234375, -0.216766357421875, -0.1142578125, -0.011749267578125, 0.09075927734375, 0.193267822265625, 0.2957763671875, 0.398284912109375, 0.50079345703125, 0.603302001953125, 0.705810546875, 0.808319091796875, 0.91082763671875, 1.013336181640625, 1.1158447265625, 1.218353271484375, 1.32086181640625, 1.423370361328125, 1.52587890625, 1.628387451171875, 1.73089599609375, 1.833404541015625, 1.9359130859375, 2.038421630859375, 2.14093017578125, 2.243438720703125, 2.345947265625, 2.448455810546875, 2.55096435546875, 2.653472900390625, 2.7559814453125, 2.858489990234375, 2.96099853515625, 3.063507080078125, 3.166015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 18.0, 16.0, 31.0, 22.0, 40.0, 65.0, 78.0, 96.0, 208.0, 351.0, 838.0, 3102.0, 78108.0, 951016.0, 11870.0, 1404.0, 503.0, 248.0, 164.0, 94.0, 72.0, 51.0, 28.0, 17.0, 20.0, 6.0, 15.0, 7.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10089111328125, -0.09673404693603516, -0.09257698059082031, -0.08841991424560547, -0.08426284790039062, -0.08010578155517578, -0.07594871520996094, -0.0717916488647461, -0.06763458251953125, -0.0634775161743164, -0.05932044982910156, -0.05516338348388672, -0.051006317138671875, -0.04684925079345703, -0.04269218444824219, -0.038535118103027344, -0.0343780517578125, -0.030220985412597656, -0.026063919067382812, -0.02190685272216797, -0.017749786376953125, -0.013592720031738281, -0.009435653686523438, -0.005278587341308594, -0.00112152099609375, 0.0030355453491210938, 0.0071926116943359375, 0.011349678039550781, 0.015506744384765625, 0.01966381072998047, 0.023820877075195312, 0.027977943420410156, 0.032135009765625, 0.036292076110839844, 0.04044914245605469, 0.04460620880126953, 0.048763275146484375, 0.05292034149169922, 0.05707740783691406, 0.061234474182128906, 0.06539154052734375, 0.0695486068725586, 0.07370567321777344, 0.07786273956298828, 0.08201980590820312, 0.08617687225341797, 0.09033393859863281, 0.09449100494384766, 0.0986480712890625, 0.10280513763427734, 0.10696220397949219, 0.11111927032470703, 0.11527633666992188, 0.11943340301513672, 0.12359046936035156, 0.1277475357055664, 0.13190460205078125, 0.1360616683959961, 0.14021873474121094, 0.14437580108642578, 0.14853286743164062, 0.15268993377685547, 0.1568470001220703, 0.16100406646728516, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 7.0, 11.0, 12.0, 12.0, 11.0, 8.0, 23.0, 29.0, 22.0, 36.0, 43.0, 50.0, 64.0, 72.0, 78.0, 75.0, 60.0, 59.0, 53.0, 53.0, 44.0, 30.0, 23.0, 25.0, 24.0, 13.0, 8.0, 7.0, 2.0, 6.0, 0.0, 6.0, 6.0, 1.0, 4.0, 0.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.47955322265625e-05, -2.3974105715751648e-05, -2.3152679204940796e-05, -2.2331252694129944e-05, -2.1509826183319092e-05, -2.068839967250824e-05, -1.9866973161697388e-05, -1.9045546650886536e-05, -1.8224120140075684e-05, -1.740269362926483e-05, -1.658126711845398e-05, -1.5759840607643127e-05, -1.4938414096832275e-05, -1.4116987586021423e-05, -1.3295561075210571e-05, -1.247413456439972e-05, -1.1652708053588867e-05, -1.0831281542778015e-05, -1.0009855031967163e-05, -9.188428521156311e-06, -8.367002010345459e-06, -7.545575499534607e-06, -6.724148988723755e-06, -5.902722477912903e-06, -5.081295967102051e-06, -4.259869456291199e-06, -3.4384429454803467e-06, -2.6170164346694946e-06, -1.7955899238586426e-06, -9.741634130477905e-07, -1.5273690223693848e-07, 6.686896085739136e-07, 1.4901161193847656e-06, 2.3115426301956177e-06, 3.1329691410064697e-06, 3.954395651817322e-06, 4.775822162628174e-06, 5.597248673439026e-06, 6.418675184249878e-06, 7.24010169506073e-06, 8.061528205871582e-06, 8.882954716682434e-06, 9.704381227493286e-06, 1.0525807738304138e-05, 1.134723424911499e-05, 1.2168660759925842e-05, 1.2990087270736694e-05, 1.3811513781547546e-05, 1.4632940292358398e-05, 1.545436680316925e-05, 1.6275793313980103e-05, 1.7097219824790955e-05, 1.7918646335601807e-05, 1.874007284641266e-05, 1.956149935722351e-05, 2.0382925868034363e-05, 2.1204352378845215e-05, 2.2025778889656067e-05, 2.284720540046692e-05, 2.366863191127777e-05, 2.4490058422088623e-05, 2.5311484932899475e-05, 2.6132911443710327e-05, 2.695433795452118e-05, 2.777576446533203e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 9.0, 15.0, 20.0, 25.0, 48.0, 74.0, 114.0, 189.0, 350.0, 673.0, 1288.0, 2848.0, 7322.0, 27330.0, 260808.0, 683601.0, 46311.0, 10461.0, 3718.0, 1532.0, 770.0, 421.0, 250.0, 148.0, 69.0, 43.0, 25.0, 26.0, 13.0, 10.0, 11.0, 5.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.0767812728881836, -0.07372856140136719, -0.07067584991455078, -0.06762313842773438, -0.06457042694091797, -0.06151771545410156, -0.058465003967285156, -0.05541229248046875, -0.052359580993652344, -0.04930686950683594, -0.04625415802001953, -0.043201446533203125, -0.04014873504638672, -0.03709602355957031, -0.034043312072753906, -0.0309906005859375, -0.027937889099121094, -0.024885177612304688, -0.02183246612548828, -0.018779754638671875, -0.01572704315185547, -0.012674331665039062, -0.009621620178222656, -0.00656890869140625, -0.0035161972045898438, -0.0004634857177734375, 0.0025892257690429688, 0.005641937255859375, 0.008694648742675781, 0.011747360229492188, 0.014800071716308594, 0.017852783203125, 0.020905494689941406, 0.023958206176757812, 0.02701091766357422, 0.030063629150390625, 0.03311634063720703, 0.03616905212402344, 0.039221763610839844, 0.04227447509765625, 0.045327186584472656, 0.04837989807128906, 0.05143260955810547, 0.054485321044921875, 0.05753803253173828, 0.06059074401855469, 0.0636434555053711, 0.0666961669921875, 0.0697488784790039, 0.07280158996582031, 0.07585430145263672, 0.07890701293945312, 0.08195972442626953, 0.08501243591308594, 0.08806514739990234, 0.09111785888671875, 0.09417057037353516, 0.09722328186035156, 0.10027599334716797, 0.10332870483398438, 0.10638141632080078, 0.10943412780761719, 0.1124868392944336, 0.11553955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 12.0, 11.0, 5.0, 12.0, 24.0, 40.0, 68.0, 116.0, 222.0, 208.0, 117.0, 52.0, 22.0, 19.0, 20.0, 8.0, 10.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.033660888671875, -0.032837629318237305, -0.03201436996459961, -0.031191110610961914, -0.03036785125732422, -0.029544591903686523, -0.028721332550048828, -0.027898073196411133, -0.027074813842773438, -0.026251554489135742, -0.025428295135498047, -0.02460503578186035, -0.023781776428222656, -0.02295851707458496, -0.022135257720947266, -0.02131199836730957, -0.020488739013671875, -0.01966547966003418, -0.018842220306396484, -0.01801896095275879, -0.017195701599121094, -0.0163724422454834, -0.015549182891845703, -0.014725923538208008, -0.013902664184570312, -0.013079404830932617, -0.012256145477294922, -0.011432886123657227, -0.010609626770019531, -0.009786367416381836, -0.00896310806274414, -0.008139848709106445, -0.00731658935546875, -0.006493330001831055, -0.005670070648193359, -0.004846811294555664, -0.004023551940917969, -0.0032002925872802734, -0.002377033233642578, -0.0015537738800048828, -0.0007305145263671875, 9.274482727050781e-05, 0.0009160041809082031, 0.0017392635345458984, 0.0025625228881835938, 0.003385782241821289, 0.004209041595458984, 0.00503230094909668, 0.005855560302734375, 0.00667881965637207, 0.007502079010009766, 0.008325338363647461, 0.009148597717285156, 0.009971857070922852, 0.010795116424560547, 0.011618375778198242, 0.012441635131835938, 0.013264894485473633, 0.014088153839111328, 0.014911413192749023, 0.01573467254638672, 0.016557931900024414, 0.01738119125366211, 0.018204450607299805, 0.0190277099609375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 14.0, 32.0, 44.0, 75.0, 157.0, 184.0, 199.0, 105.0, 69.0, 33.0, 24.0, 14.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.593433856964111, -5.445555686950684, -5.297677516937256, -5.149799823760986, -5.001921653747559, -4.854043483734131, -4.706165313720703, -4.558287143707275, -4.410408973693848, -4.26253080368042, -4.114652633666992, -3.9667747020721436, -3.818896770477295, -3.671018600463867, -3.5231404304504395, -3.3752622604370117, -3.227384567260742, -3.0795063972473145, -2.931628465652466, -2.783750295639038, -2.6358723640441895, -2.4879941940307617, -2.340116024017334, -2.1922378540039062, -2.0443599224090576, -1.8964818716049194, -1.7486038208007812, -1.6007256507873535, -1.4528475999832153, -1.3049695491790771, -1.1570913791656494, -1.0092133283615112, -0.8613357543945312, -0.7134577035903931, -0.5655795931816101, -0.41770151257514954, -0.26982343196868896, -0.12194538116455078, 0.025932729244232178, 0.17381083965301514, 0.3216888904571533, 0.4695669710636139, 0.6174450516700745, 0.7653231620788574, 0.9132012128829956, 1.0610792636871338, 1.2089574337005615, 1.3568354845046997, 1.504713535308838, 1.652591586112976, 1.8004696369171143, 1.948347806930542, 2.0962257385253906, 2.2441039085388184, 2.391982078552246, 2.539860248565674, 2.6877381801605225, 2.83561635017395, 2.983494281768799, 3.1313724517822266, 3.2792506217956543, 3.427128553390503, 3.5750067234039307, 3.7228846549987793, 3.870762825012207]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 12.0, 13.0, 28.0, 49.0, 71.0, 90.0, 108.0, 140.0, 127.0, 103.0, 77.0, 56.0, 36.0, 26.0, 20.0, 11.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.927026271820068, -4.793264865875244, -4.659503936767578, -4.525742530822754, -4.39198112487793, -4.2582197189331055, -4.1244587898254395, -3.9906973838806152, -3.85693621635437, -3.723175048828125, -3.589413642883301, -3.4556524753570557, -3.3218913078308105, -3.1881299018859863, -3.054368734359741, -2.920607566833496, -2.786846160888672, -2.6530849933624268, -2.5193235874176025, -2.3855624198913574, -2.251801013946533, -2.118039846420288, -1.984278678894043, -1.8505173921585083, -1.7167561054229736, -1.582994818687439, -1.4492335319519043, -1.3154723644256592, -1.1817110776901245, -1.0479497909545898, -0.9141885638237, -0.7804273366928101, -0.6466658115386963, -0.5129045248031616, -0.37914329767227173, -0.24538204073905945, -0.11162078380584717, 0.0221405029296875, 0.1559017300605774, 0.2896629571914673, 0.42342424392700195, 0.5571855306625366, 0.6909467577934265, 0.8247079849243164, 0.9584692716598511, 1.0922305583953857, 1.2259917259216309, 1.3597530126571655, 1.4935142993927002, 1.6272755861282349, 1.7610368728637695, 1.8947980403900146, 2.0285592079162598, 2.162320613861084, 2.296081781387329, 2.429842948913574, 2.5636043548583984, 2.6973655223846436, 2.8311269283294678, 2.964888095855713, 3.098649501800537, 3.2324106693267822, 3.3661718368530273, 3.4999332427978516, 3.6336944103240967]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 21.0, 21.0, 30.0, 33.0, 42.0, 58.0, 122.0, 145.0, 265.0, 388.0, 579.0, 988.0, 1563.0, 2900.0, 5627.0, 11268.0, 25556.0, 66094.0, 210112.0, 441694.0, 178331.0, 57838.0, 22922.0, 10078.0, 5081.0, 2707.0, 1510.0, 907.0, 568.0, 312.0, 238.0, 139.0, 98.0, 80.0, 56.0, 36.0, 39.0, 33.0, 14.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.548828125, -2.467742919921875, -2.38665771484375, -2.305572509765625, -2.2244873046875, -2.143402099609375, -2.06231689453125, -1.981231689453125, -1.900146484375, -1.819061279296875, -1.73797607421875, -1.656890869140625, -1.5758056640625, -1.494720458984375, -1.41363525390625, -1.332550048828125, -1.25146484375, -1.170379638671875, -1.08929443359375, -1.008209228515625, -0.9271240234375, -0.846038818359375, -0.76495361328125, -0.683868408203125, -0.602783203125, -0.521697998046875, -0.44061279296875, -0.359527587890625, -0.2784423828125, -0.197357177734375, -0.11627197265625, -0.035186767578125, 0.0458984375, 0.126983642578125, 0.20806884765625, 0.289154052734375, 0.3702392578125, 0.451324462890625, 0.53240966796875, 0.613494873046875, 0.694580078125, 0.775665283203125, 0.85675048828125, 0.937835693359375, 1.0189208984375, 1.100006103515625, 1.18109130859375, 1.262176513671875, 1.34326171875, 1.424346923828125, 1.50543212890625, 1.586517333984375, 1.6676025390625, 1.748687744140625, 1.82977294921875, 1.910858154296875, 1.991943359375, 2.073028564453125, 2.15411376953125, 2.235198974609375, 2.3162841796875, 2.397369384765625, 2.47845458984375, 2.559539794921875, 2.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 13.0, 11.0, 10.0, 28.0, 34.0, 40.0, 59.0, 79.0, 106.0, 130.0, 112.0, 87.0, 82.0, 51.0, 46.0, 33.0, 16.0, 17.0, 14.0, 8.0, 8.0, 7.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.93939208984375, -8.6834716796875, -8.42755126953125, -8.171630859375, -7.91571044921875, -7.6597900390625, -7.40386962890625, -7.14794921875, -6.89202880859375, -6.6361083984375, -6.38018798828125, -6.124267578125, -5.86834716796875, -5.6124267578125, -5.35650634765625, -5.1005859375, -4.84466552734375, -4.5887451171875, -4.33282470703125, -4.076904296875, -3.82098388671875, -3.5650634765625, -3.30914306640625, -3.05322265625, -2.79730224609375, -2.5413818359375, -2.28546142578125, -2.029541015625, -1.77362060546875, -1.5177001953125, -1.26177978515625, -1.005859375, -0.74993896484375, -0.4940185546875, -0.23809814453125, 0.017822265625, 0.27374267578125, 0.5296630859375, 0.78558349609375, 1.04150390625, 1.29742431640625, 1.5533447265625, 1.80926513671875, 2.065185546875, 2.32110595703125, 2.5770263671875, 2.83294677734375, 3.0888671875, 3.34478759765625, 3.6007080078125, 3.85662841796875, 4.112548828125, 4.36846923828125, 4.6243896484375, 4.88031005859375, 5.13623046875, 5.39215087890625, 5.6480712890625, 5.90399169921875, 6.159912109375, 6.41583251953125, 6.6717529296875, 6.92767333984375, 7.18359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 2.0, 6.0, 4.0, 7.0, 16.0, 7.0, 15.0, 16.0, 24.0, 17.0, 25.0, 38.0, 36.0, 32.0, 33.0, 66.0, 84.0, 160.0, 754.0, 9691.0, 903580.0, 130462.0, 2618.0, 359.0, 98.0, 76.0, 33.0, 31.0, 46.0, 24.0, 30.0, 34.0, 16.0, 25.0, 9.0, 11.0, 19.0, 4.0, 11.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.4765625, -14.0604248046875, -13.644287109375, -13.2281494140625, -12.81201171875, -12.3958740234375, -11.979736328125, -11.5635986328125, -11.1474609375, -10.7313232421875, -10.315185546875, -9.8990478515625, -9.48291015625, -9.0667724609375, -8.650634765625, -8.2344970703125, -7.818359375, -7.4022216796875, -6.986083984375, -6.5699462890625, -6.15380859375, -5.7376708984375, -5.321533203125, -4.9053955078125, -4.4892578125, -4.0731201171875, -3.656982421875, -3.2408447265625, -2.82470703125, -2.4085693359375, -1.992431640625, -1.5762939453125, -1.16015625, -0.7440185546875, -0.327880859375, 0.0882568359375, 0.50439453125, 0.9205322265625, 1.336669921875, 1.7528076171875, 2.1689453125, 2.5850830078125, 3.001220703125, 3.4173583984375, 3.83349609375, 4.2496337890625, 4.665771484375, 5.0819091796875, 5.498046875, 5.9141845703125, 6.330322265625, 6.7464599609375, 7.16259765625, 7.5787353515625, 7.994873046875, 8.4110107421875, 8.8271484375, 9.2432861328125, 9.659423828125, 10.0755615234375, 10.49169921875, 10.9078369140625, 11.323974609375, 11.7401123046875, 12.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 5.0, 3.0, 4.0, 10.0, 8.0, 7.0, 13.0, 14.0, 19.0, 18.0, 27.0, 20.0, 14.0, 43.0, 31.0, 34.0, 38.0, 48.0, 37.0, 35.0, 38.0, 31.0, 48.0, 33.0, 38.0, 31.0, 36.0, 41.0, 37.0, 25.0, 29.0, 29.0, 28.0, 17.0, 13.0, 19.0, 14.0, 15.0, 12.0, 8.0, 4.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.32415771484375, -4.1834716796875, -4.04278564453125, -3.902099609375, -3.76141357421875, -3.6207275390625, -3.48004150390625, -3.33935546875, -3.19866943359375, -3.0579833984375, -2.91729736328125, -2.776611328125, -2.63592529296875, -2.4952392578125, -2.35455322265625, -2.2138671875, -2.07318115234375, -1.9324951171875, -1.79180908203125, -1.651123046875, -1.51043701171875, -1.3697509765625, -1.22906494140625, -1.08837890625, -0.94769287109375, -0.8070068359375, -0.66632080078125, -0.525634765625, -0.38494873046875, -0.2442626953125, -0.10357666015625, 0.037109375, 0.17779541015625, 0.3184814453125, 0.45916748046875, 0.599853515625, 0.74053955078125, 0.8812255859375, 1.02191162109375, 1.16259765625, 1.30328369140625, 1.4439697265625, 1.58465576171875, 1.725341796875, 1.86602783203125, 2.0067138671875, 2.14739990234375, 2.2880859375, 2.42877197265625, 2.5694580078125, 2.71014404296875, 2.850830078125, 2.99151611328125, 3.1322021484375, 3.27288818359375, 3.41357421875, 3.55426025390625, 3.6949462890625, 3.83563232421875, 3.976318359375, 4.11700439453125, 4.2576904296875, 4.39837646484375, 4.5390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 9.0, 9.0, 10.0, 11.0, 31.0, 35.0, 63.0, 82.0, 130.0, 194.0, 348.0, 630.0, 1248.0, 2883.0, 8048.0, 26874.0, 111628.0, 439180.0, 344895.0, 81006.0, 20042.0, 6313.0, 2399.0, 1046.0, 543.0, 337.0, 174.0, 112.0, 67.0, 47.0, 29.0, 31.0, 15.0, 15.0, 16.0, 15.0, 8.0, 6.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.033203125, -1.0044174194335938, -0.9756317138671875, -0.9468460083007812, -0.918060302734375, -0.8892745971679688, -0.8604888916015625, -0.8317031860351562, -0.80291748046875, -0.7741317749023438, -0.7453460693359375, -0.7165603637695312, -0.687774658203125, -0.6589889526367188, -0.6302032470703125, -0.6014175415039062, -0.5726318359375, -0.5438461303710938, -0.5150604248046875, -0.48627471923828125, -0.457489013671875, -0.42870330810546875, -0.3999176025390625, -0.37113189697265625, -0.34234619140625, -0.31356048583984375, -0.2847747802734375, -0.25598907470703125, -0.227203369140625, -0.19841766357421875, -0.1696319580078125, -0.14084625244140625, -0.112060546875, -0.08327484130859375, -0.0544891357421875, -0.02570343017578125, 0.003082275390625, 0.03186798095703125, 0.0606536865234375, 0.08943939208984375, 0.11822509765625, 0.14701080322265625, 0.1757965087890625, 0.20458221435546875, 0.233367919921875, 0.26215362548828125, 0.2909393310546875, 0.31972503662109375, 0.3485107421875, 0.37729644775390625, 0.4060821533203125, 0.43486785888671875, 0.463653564453125, 0.49243927001953125, 0.5212249755859375, 0.5500106811523438, 0.57879638671875, 0.6075820922851562, 0.6363677978515625, 0.6651535034179688, 0.693939208984375, 0.7227249145507812, 0.7515106201171875, 0.7802963256835938, 0.80908203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 15.0, 18.0, 26.0, 24.0, 18.0, 39.0, 21.0, 46.0, 48.0, 54.0, 52.0, 61.0, 58.0, 73.0, 63.0, 40.0, 52.0, 52.0, 41.0, 26.0, 29.0, 24.0, 16.0, 11.0, 15.0, 12.0, 14.0, 1.0, 5.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00014317035675048828, -0.00013899803161621094, -0.0001348257064819336, -0.00013065338134765625, -0.0001264810562133789, -0.00012230873107910156, -0.00011813640594482422, -0.00011396408081054688, -0.00010979175567626953, -0.00010561943054199219, -0.00010144710540771484, -9.72747802734375e-05, -9.310245513916016e-05, -8.893013000488281e-05, -8.475780487060547e-05, -8.058547973632812e-05, -7.641315460205078e-05, -7.224082946777344e-05, -6.80685043334961e-05, -6.389617919921875e-05, -5.9723854064941406e-05, -5.555152893066406e-05, -5.137920379638672e-05, -4.7206878662109375e-05, -4.303455352783203e-05, -3.886222839355469e-05, -3.4689903259277344e-05, -3.0517578125e-05, -2.6345252990722656e-05, -2.2172927856445312e-05, -1.800060272216797e-05, -1.3828277587890625e-05, -9.655952453613281e-06, -5.4836273193359375e-06, -1.3113021850585938e-06, 2.86102294921875e-06, 7.033348083496094e-06, 1.1205673217773438e-05, 1.537799835205078e-05, 1.9550323486328125e-05, 2.372264862060547e-05, 2.7894973754882812e-05, 3.2067298889160156e-05, 3.62396240234375e-05, 4.0411949157714844e-05, 4.458427429199219e-05, 4.875659942626953e-05, 5.2928924560546875e-05, 5.710124969482422e-05, 6.127357482910156e-05, 6.54458999633789e-05, 6.961822509765625e-05, 7.37905502319336e-05, 7.796287536621094e-05, 8.213520050048828e-05, 8.630752563476562e-05, 9.047985076904297e-05, 9.465217590332031e-05, 9.882450103759766e-05, 0.000102996826171875, 0.00010716915130615234, 0.00011134147644042969, 0.00011551380157470703, 0.00011968612670898438]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 15.0, 16.0, 51.0, 56.0, 74.0, 106.0, 135.0, 225.0, 394.0, 713.0, 1331.0, 2862.0, 6634.0, 17497.0, 55064.0, 190215.0, 444170.0, 227452.0, 66559.0, 20812.0, 7534.0, 3185.0, 1445.0, 767.0, 436.0, 250.0, 152.0, 105.0, 73.0, 63.0, 28.0, 33.0, 20.0, 16.0, 14.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6909942626953125, -0.667633056640625, -0.6442718505859375, -0.62091064453125, -0.5975494384765625, -0.574188232421875, -0.5508270263671875, -0.5274658203125, -0.5041046142578125, -0.480743408203125, -0.4573822021484375, -0.43402099609375, -0.4106597900390625, -0.387298583984375, -0.3639373779296875, -0.340576171875, -0.3172149658203125, -0.293853759765625, -0.2704925537109375, -0.24713134765625, -0.2237701416015625, -0.200408935546875, -0.1770477294921875, -0.1536865234375, -0.1303253173828125, -0.106964111328125, -0.0836029052734375, -0.06024169921875, -0.0368804931640625, -0.013519287109375, 0.0098419189453125, 0.033203125, 0.0565643310546875, 0.079925537109375, 0.1032867431640625, 0.12664794921875, 0.1500091552734375, 0.173370361328125, 0.1967315673828125, 0.2200927734375, 0.2434539794921875, 0.266815185546875, 0.2901763916015625, 0.31353759765625, 0.3368988037109375, 0.360260009765625, 0.3836212158203125, 0.406982421875, 0.4303436279296875, 0.453704833984375, 0.4770660400390625, 0.50042724609375, 0.5237884521484375, 0.547149658203125, 0.5705108642578125, 0.5938720703125, 0.6172332763671875, 0.640594482421875, 0.6639556884765625, 0.68731689453125, 0.7106781005859375, 0.734039306640625, 0.7574005126953125, 0.78076171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 10.0, 11.0, 14.0, 24.0, 31.0, 19.0, 31.0, 36.0, 24.0, 27.0, 32.0, 52.0, 56.0, 56.0, 63.0, 46.0, 63.0, 36.0, 45.0, 34.0, 36.0, 38.0, 33.0, 25.0, 24.0, 19.0, 19.0, 17.0, 13.0, 11.0, 7.0, 10.0, 4.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.360107421875, -0.3492851257324219, -0.33846282958984375, -0.3276405334472656, -0.3168182373046875, -0.3059959411621094, -0.29517364501953125, -0.2843513488769531, -0.273529052734375, -0.2627067565917969, -0.25188446044921875, -0.24106216430664062, -0.2302398681640625, -0.21941757202148438, -0.20859527587890625, -0.19777297973632812, -0.18695068359375, -0.17612838745117188, -0.16530609130859375, -0.15448379516601562, -0.1436614990234375, -0.13283920288085938, -0.12201690673828125, -0.11119461059570312, -0.100372314453125, -0.08955001831054688, -0.07872772216796875, -0.06790542602539062, -0.0570831298828125, -0.046260833740234375, -0.03543853759765625, -0.024616241455078125, -0.0137939453125, -0.002971649169921875, 0.00785064697265625, 0.018672943115234375, 0.0294952392578125, 0.040317535400390625, 0.05113983154296875, 0.061962127685546875, 0.072784423828125, 0.08360671997070312, 0.09442901611328125, 0.10525131225585938, 0.1160736083984375, 0.12689590454101562, 0.13771820068359375, 0.14854049682617188, 0.15936279296875, 0.17018508911132812, 0.18100738525390625, 0.19182968139648438, 0.2026519775390625, 0.21347427368164062, 0.22429656982421875, 0.23511886596679688, 0.245941162109375, 0.2567634582519531, 0.26758575439453125, 0.2784080505371094, 0.2892303466796875, 0.3000526428222656, 0.31087493896484375, 0.3216972351074219, 0.33251953125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 8.0, 6.0, 13.0, 22.0, 38.0, 74.0, 125.0, 143.0, 167.0, 140.0, 83.0, 67.0, 37.0, 21.0, 15.0, 10.0, 0.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4451904296875, -9.169502258300781, -8.893815040588379, -8.618127822875977, -8.342439651489258, -8.066751480102539, -7.791064262390137, -7.515376567840576, -7.239688873291016, -6.964001178741455, -6.6883134841918945, -6.412625789642334, -6.136938095092773, -5.861250400543213, -5.585562705993652, -5.309875011444092, -5.034187316894531, -4.758499622344971, -4.48281192779541, -4.20712423324585, -3.931436538696289, -3.6557488441467285, -3.380061149597168, -3.1043734550476074, -2.828685760498047, -2.5529980659484863, -2.277310371398926, -2.0016226768493652, -1.7259349822998047, -1.4502472877502441, -1.1745595932006836, -0.898871898651123, -0.6231842041015625, -0.34749650955200195, -0.0718088150024414, 0.20387887954711914, 0.4795665740966797, 0.7552542686462402, 1.0309419631958008, 1.3066296577453613, 1.5823173522949219, 1.8580050468444824, 2.133692741394043, 2.4093804359436035, 2.685068130493164, 2.9607558250427246, 3.236443519592285, 3.5121312141418457, 3.7878189086914062, 4.063506603240967, 4.339194297790527, 4.614881992340088, 4.890569686889648, 5.166257381439209, 5.4419450759887695, 5.71763277053833, 5.993320465087891, 6.269008159637451, 6.544695854187012, 6.820383548736572, 7.096071243286133, 7.371758937835693, 7.647446632385254, 7.9231343269348145, 8.198822021484375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 9.0, 3.0, 6.0, 6.0, 11.0, 14.0, 18.0, 20.0, 18.0, 30.0, 31.0, 42.0, 39.0, 49.0, 60.0, 60.0, 41.0, 42.0, 65.0, 56.0, 62.0, 55.0, 35.0, 32.0, 27.0, 22.0, 29.0, 31.0, 17.0, 22.0, 6.0, 13.0, 6.0, 8.0, 3.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.960089683532715, -10.629469871520996, -10.298850059509277, -9.968230247497559, -9.63761043548584, -9.306990623474121, -8.976370811462402, -8.645751953125, -8.315132141113281, -7.9845123291015625, -7.653892517089844, -7.323272705078125, -6.992652893066406, -6.6620330810546875, -6.331413745880127, -6.000793933868408, -5.670173645019531, -5.3395538330078125, -5.008934020996094, -4.678314208984375, -4.347694396972656, -4.0170745849609375, -3.686455249786377, -3.355835437774658, -3.0252156257629395, -2.6945958137512207, -2.363976001739502, -2.0333564281463623, -1.7027366161346436, -1.3721168041229248, -1.0414971113204956, -0.7108774185180664, -0.38025665283203125, -0.049636900424957275, 0.2809828519821167, 0.6116026043891907, 0.9422223567962646, 1.2728421688079834, 1.6034618616104126, 1.9340815544128418, 2.2647013664245605, 2.5953211784362793, 2.925940990447998, 3.2565605640411377, 3.5871803760528564, 3.917800188064575, 4.248419761657715, 4.579039573669434, 4.909659385681152, 5.240279197692871, 5.57089900970459, 5.901518821716309, 6.232138633728027, 6.562758445739746, 6.893377780914307, 7.223997592926025, 7.554617404937744, 7.885237216949463, 8.215856552124023, 8.546476364135742, 8.877096176147461, 9.20771598815918, 9.538335800170898, 9.868955612182617, 10.199575424194336]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 11.0, 11.0, 13.0, 25.0, 35.0, 42.0, 88.0, 109.0, 169.0, 255.0, 397.0, 646.0, 1199.0, 2344.0, 5146.0, 12345.0, 36239.0, 152473.0, 2058517.0, 1728635.0, 139049.0, 33906.0, 11915.0, 5117.0, 2498.0, 1163.0, 696.0, 447.0, 276.0, 183.0, 107.0, 77.0, 39.0, 33.0, 24.0, 9.0, 14.0, 8.0, 7.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.320556640625, -3.21337890625, -3.106201171875, -2.9990234375, -2.891845703125, -2.78466796875, -2.677490234375, -2.5703125, -2.463134765625, -2.35595703125, -2.248779296875, -2.1416015625, -2.034423828125, -1.92724609375, -1.820068359375, -1.712890625, -1.605712890625, -1.49853515625, -1.391357421875, -1.2841796875, -1.177001953125, -1.06982421875, -0.962646484375, -0.85546875, -0.748291015625, -0.64111328125, -0.533935546875, -0.4267578125, -0.319580078125, -0.21240234375, -0.105224609375, 0.001953125, 0.109130859375, 0.21630859375, 0.323486328125, 0.4306640625, 0.537841796875, 0.64501953125, 0.752197265625, 0.859375, 0.966552734375, 1.07373046875, 1.180908203125, 1.2880859375, 1.395263671875, 1.50244140625, 1.609619140625, 1.716796875, 1.823974609375, 1.93115234375, 2.038330078125, 2.1455078125, 2.252685546875, 2.35986328125, 2.467041015625, 2.57421875, 2.681396484375, 2.78857421875, 2.895751953125, 3.0029296875, 3.110107421875, 3.21728515625, 3.324462890625, 3.431640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 7.0, 13.0, 17.0, 24.0, 37.0, 63.0, 78.0, 110.0, 110.0, 145.0, 114.0, 78.0, 63.0, 38.0, 35.0, 20.0, 16.0, 14.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.49609375, -6.326171875, -6.15625, -5.986328125, -5.81640625, -5.646484375, -5.4765625, -5.306640625, -5.13671875, -4.966796875, -4.796875, -4.626953125, -4.45703125, -4.287109375, -4.1171875, -3.947265625, -3.77734375, -3.607421875, -3.4375, -3.267578125, -3.09765625, -2.927734375, -2.7578125, -2.587890625, -2.41796875, -2.248046875, -2.078125, -1.908203125, -1.73828125, -1.568359375, -1.3984375, -1.228515625, -1.05859375, -0.888671875, -0.71875, -0.548828125, -0.37890625, -0.208984375, -0.0390625, 0.130859375, 0.30078125, 0.470703125, 0.640625, 0.810546875, 0.98046875, 1.150390625, 1.3203125, 1.490234375, 1.66015625, 1.830078125, 2.0, 2.169921875, 2.33984375, 2.509765625, 2.6796875, 2.849609375, 3.01953125, 3.189453125, 3.359375, 3.529296875, 3.69921875, 3.869140625, 4.0390625, 4.208984375, 4.37890625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 14.0, 18.0, 32.0, 58.0, 93.0, 152.0, 424.0, 3227.0, 502408.0, 3681468.0, 5352.0, 572.0, 194.0, 85.0, 58.0, 37.0, 20.0, 16.0, 13.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.078125, -14.576904296875, -14.07568359375, -13.574462890625, -13.0732421875, -12.572021484375, -12.07080078125, -11.569580078125, -11.068359375, -10.567138671875, -10.06591796875, -9.564697265625, -9.0634765625, -8.562255859375, -8.06103515625, -7.559814453125, -7.05859375, -6.557373046875, -6.05615234375, -5.554931640625, -5.0537109375, -4.552490234375, -4.05126953125, -3.550048828125, -3.048828125, -2.547607421875, -2.04638671875, -1.545166015625, -1.0439453125, -0.542724609375, -0.04150390625, 0.459716796875, 0.9609375, 1.462158203125, 1.96337890625, 2.464599609375, 2.9658203125, 3.467041015625, 3.96826171875, 4.469482421875, 4.970703125, 5.471923828125, 5.97314453125, 6.474365234375, 6.9755859375, 7.476806640625, 7.97802734375, 8.479248046875, 8.98046875, 9.481689453125, 9.98291015625, 10.484130859375, 10.9853515625, 11.486572265625, 11.98779296875, 12.489013671875, 12.990234375, 13.491455078125, 13.99267578125, 14.493896484375, 14.9951171875, 15.496337890625, 15.99755859375, 16.498779296875, 17.0]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 9.0, 14.0, 19.0, 29.0, 33.0, 38.0, 49.0, 90.0, 128.0, 172.0, 312.0, 589.0, 1110.0, 565.0, 313.0, 175.0, 106.0, 74.0, 56.0, 47.0, 37.0, 25.0, 21.0, 9.0, 10.0, 6.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.849609375, -0.8175048828125, -0.785400390625, -0.7532958984375, -0.72119140625, -0.6890869140625, -0.656982421875, -0.6248779296875, -0.5927734375, -0.5606689453125, -0.528564453125, -0.4964599609375, -0.46435546875, -0.4322509765625, -0.400146484375, -0.3680419921875, -0.3359375, -0.3038330078125, -0.271728515625, -0.2396240234375, -0.20751953125, -0.1754150390625, -0.143310546875, -0.1112060546875, -0.0791015625, -0.0469970703125, -0.014892578125, 0.0172119140625, 0.04931640625, 0.0814208984375, 0.113525390625, 0.1456298828125, 0.177734375, 0.2098388671875, 0.241943359375, 0.2740478515625, 0.30615234375, 0.3382568359375, 0.370361328125, 0.4024658203125, 0.4345703125, 0.4666748046875, 0.498779296875, 0.5308837890625, 0.56298828125, 0.5950927734375, 0.627197265625, 0.6593017578125, 0.69140625, 0.7235107421875, 0.755615234375, 0.7877197265625, 0.81982421875, 0.8519287109375, 0.884033203125, 0.9161376953125, 0.9482421875, 0.9803466796875, 1.012451171875, 1.0445556640625, 1.07666015625, 1.1087646484375, 1.140869140625, 1.1729736328125, 1.205078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 17.0, 23.0, 44.0, 78.0, 100.0, 166.0, 150.0, 112.0, 104.0, 56.0, 40.0, 24.0, 15.0, 10.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.421330451965332, -5.24224853515625, -5.063167095184326, -4.884085178375244, -4.70500373840332, -4.525921821594238, -4.346839904785156, -4.167757987976074, -3.9886765480041504, -3.8095948696136475, -3.6305131912231445, -3.4514312744140625, -3.2723495960235596, -3.0932679176330566, -2.9141860008239746, -2.7351043224334717, -2.5560226440429688, -2.376940965652466, -2.197859287261963, -2.018777370452881, -1.839695692062378, -1.660614013671875, -1.4815322160720825, -1.30245041847229, -1.123368740081787, -0.9442870020866394, -0.7652052640914917, -0.586123526096344, -0.4070417881011963, -0.22796005010604858, -0.04887831211090088, 0.1302034854888916, 0.30928564071655273, 0.48836737871170044, 0.6674491167068481, 0.8465308547019958, 1.0256125926971436, 1.2046942710876465, 1.383776068687439, 1.5628578662872314, 1.7419395446777344, 1.9210212230682373, 2.1001029014587402, 2.2791848182678223, 2.458266496658325, 2.637348175048828, 2.81643009185791, 2.995511770248413, 3.174593448638916, 3.353675127029419, 3.532756805419922, 3.711838722229004, 3.890920400619507, 4.07000207901001, 4.249083995819092, 4.428165435791016, 4.607247352600098, 4.78632926940918, 4.9654107093811035, 5.1444926261901855, 5.323574066162109, 5.502655982971191, 5.681737899780273, 5.8608198165893555, 6.039901256561279]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 12.0, 12.0, 27.0, 28.0, 39.0, 64.0, 65.0, 80.0, 75.0, 91.0, 84.0, 76.0, 78.0, 59.0, 54.0, 37.0, 18.0, 21.0, 15.0, 14.0, 13.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.287173748016357, -5.141117095947266, -4.995060443878174, -4.849003791809082, -4.702946662902832, -4.55689001083374, -4.410833358764648, -4.264776706695557, -4.118720054626465, -3.972663402557373, -3.8266067504882812, -3.6805498600006104, -3.5344932079315186, -3.3884365558624268, -3.242379665374756, -3.096323013305664, -2.9502663612365723, -2.8042097091674805, -2.6581530570983887, -2.5120961666107178, -2.366039514541626, -2.219982862472534, -2.0739259719848633, -1.9278693199157715, -1.7818126678466797, -1.635756015777588, -1.4896992444992065, -1.3436424732208252, -1.1975858211517334, -1.0515291690826416, -0.9054723978042603, -0.7594156265258789, -0.6133584976196289, -0.46730178594589233, -0.32124507427215576, -0.1751883625984192, -0.029131650924682617, 0.11692506074905396, 0.2629817724227905, 0.4090385437011719, 0.5550951957702637, 0.7011519074440002, 0.8472086191177368, 0.9932653307914734, 1.13932204246521, 1.2853786945343018, 1.431435465812683, 1.5774922370910645, 1.7235488891601562, 1.869605541229248, 2.01566219329834, 2.1617190837860107, 2.3077757358551025, 2.4538323879241943, 2.5998892784118652, 2.745945930480957, 2.892002582550049, 3.0380592346191406, 3.1841158866882324, 3.3301727771759033, 3.476229429244995, 3.622286081314087, 3.768342971801758, 3.9143996238708496, 4.060456275939941]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 23.0, 23.0, 56.0, 94.0, 191.0, 373.0, 1004.0, 3102.0, 17310.0, 329059.0, 662840.0, 28047.0, 4240.0, 1249.0, 453.0, 200.0, 116.0, 60.0, 23.0, 22.0, 20.0, 7.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.492919921875, -0.4759864807128906, -0.45905303955078125, -0.4421195983886719, -0.4251861572265625, -0.4082527160644531, -0.39131927490234375, -0.3743858337402344, -0.357452392578125, -0.3405189514160156, -0.32358551025390625, -0.3066520690917969, -0.2897186279296875, -0.2727851867675781, -0.25585174560546875, -0.23891830444335938, -0.22198486328125, -0.20505142211914062, -0.18811798095703125, -0.17118453979492188, -0.1542510986328125, -0.13731765747070312, -0.12038421630859375, -0.10345077514648438, -0.086517333984375, -0.06958389282226562, -0.05265045166015625, -0.035717010498046875, -0.0187835693359375, -0.001850128173828125, 0.01508331298828125, 0.032016754150390625, 0.0489501953125, 0.06588363647460938, 0.08281707763671875, 0.09975051879882812, 0.1166839599609375, 0.13361740112304688, 0.15055084228515625, 0.16748428344726562, 0.184417724609375, 0.20135116577148438, 0.21828460693359375, 0.23521804809570312, 0.2521514892578125, 0.2690849304199219, 0.28601837158203125, 0.3029518127441406, 0.31988525390625, 0.3368186950683594, 0.35375213623046875, 0.3706855773925781, 0.3876190185546875, 0.4045524597167969, 0.42148590087890625, 0.4384193420410156, 0.455352783203125, 0.4722862243652344, 0.48921966552734375, 0.5061531066894531, 0.5230865478515625, 0.5400199890136719, 0.5569534301757812, 0.5738868713378906, 0.5908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 9.0, 18.0, 26.0, 48.0, 56.0, 99.0, 94.0, 108.0, 127.0, 113.0, 65.0, 57.0, 44.0, 28.0, 25.0, 18.0, 9.0, 12.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.91351318359375, -3.7918701171875, -3.67022705078125, -3.548583984375, -3.42694091796875, -3.3052978515625, -3.18365478515625, -3.06201171875, -2.94036865234375, -2.8187255859375, -2.69708251953125, -2.575439453125, -2.45379638671875, -2.3321533203125, -2.21051025390625, -2.0888671875, -1.96722412109375, -1.8455810546875, -1.72393798828125, -1.602294921875, -1.48065185546875, -1.3590087890625, -1.23736572265625, -1.11572265625, -0.99407958984375, -0.8724365234375, -0.75079345703125, -0.629150390625, -0.50750732421875, -0.3858642578125, -0.26422119140625, -0.142578125, -0.02093505859375, 0.1007080078125, 0.22235107421875, 0.343994140625, 0.46563720703125, 0.5872802734375, 0.70892333984375, 0.83056640625, 0.95220947265625, 1.0738525390625, 1.19549560546875, 1.317138671875, 1.43878173828125, 1.5604248046875, 1.68206787109375, 1.8037109375, 1.92535400390625, 2.0469970703125, 2.16864013671875, 2.290283203125, 2.41192626953125, 2.5335693359375, 2.65521240234375, 2.77685546875, 2.89849853515625, 3.0201416015625, 3.14178466796875, 3.263427734375, 3.38507080078125, 3.5067138671875, 3.62835693359375, 3.75]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 4.0, 4.0, 4.0, 6.0, 8.0, 10.0, 12.0, 14.0, 21.0, 26.0, 30.0, 41.0, 48.0, 65.0, 85.0, 119.0, 151.0, 256.0, 412.0, 821.0, 2903.0, 19390.0, 216499.0, 701208.0, 92551.0, 10062.0, 1908.0, 677.0, 372.0, 220.0, 140.0, 97.0, 75.0, 47.0, 50.0, 49.0, 29.0, 27.0, 26.0, 16.0, 14.0, 11.0, 7.0, 7.0, 9.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.3056640625, -0.2964935302734375, -0.287322998046875, -0.2781524658203125, -0.26898193359375, -0.2598114013671875, -0.250640869140625, -0.2414703369140625, -0.2322998046875, -0.2231292724609375, -0.213958740234375, -0.2047882080078125, -0.19561767578125, -0.1864471435546875, -0.177276611328125, -0.1681060791015625, -0.158935546875, -0.1497650146484375, -0.140594482421875, -0.1314239501953125, -0.12225341796875, -0.1130828857421875, -0.103912353515625, -0.0947418212890625, -0.0855712890625, -0.0764007568359375, -0.067230224609375, -0.0580596923828125, -0.04888916015625, -0.0397186279296875, -0.030548095703125, -0.0213775634765625, -0.01220703125, -0.0030364990234375, 0.006134033203125, 0.0153045654296875, 0.02447509765625, 0.0336456298828125, 0.042816162109375, 0.0519866943359375, 0.0611572265625, 0.0703277587890625, 0.079498291015625, 0.0886688232421875, 0.09783935546875, 0.1070098876953125, 0.116180419921875, 0.1253509521484375, 0.134521484375, 0.1436920166015625, 0.152862548828125, 0.1620330810546875, 0.17120361328125, 0.1803741455078125, 0.189544677734375, 0.1987152099609375, 0.2078857421875, 0.2170562744140625, 0.226226806640625, 0.2353973388671875, 0.24456787109375, 0.2537384033203125, 0.262908935546875, 0.2720794677734375, 0.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 8.0, 15.0, 13.0, 9.0, 13.0, 19.0, 23.0, 33.0, 35.0, 22.0, 42.0, 33.0, 47.0, 55.0, 46.0, 47.0, 49.0, 32.0, 39.0, 41.0, 53.0, 29.0, 38.0, 33.0, 32.0, 31.0, 24.0, 23.0, 15.0, 15.0, 17.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.118865966796875, -3.00921630859375, -2.899566650390625, -2.7899169921875, -2.680267333984375, -2.57061767578125, -2.460968017578125, -2.351318359375, -2.241668701171875, -2.13201904296875, -2.022369384765625, -1.9127197265625, -1.803070068359375, -1.69342041015625, -1.583770751953125, -1.47412109375, -1.364471435546875, -1.25482177734375, -1.145172119140625, -1.0355224609375, -0.925872802734375, -0.81622314453125, -0.706573486328125, -0.596923828125, -0.487274169921875, -0.37762451171875, -0.267974853515625, -0.1583251953125, -0.048675537109375, 0.06097412109375, 0.170623779296875, 0.2802734375, 0.389923095703125, 0.49957275390625, 0.609222412109375, 0.7188720703125, 0.828521728515625, 0.93817138671875, 1.047821044921875, 1.157470703125, 1.267120361328125, 1.37677001953125, 1.486419677734375, 1.5960693359375, 1.705718994140625, 1.81536865234375, 1.925018310546875, 2.03466796875, 2.144317626953125, 2.25396728515625, 2.363616943359375, 2.4732666015625, 2.582916259765625, 2.69256591796875, 2.802215576171875, 2.911865234375, 3.021514892578125, 3.13116455078125, 3.240814208984375, 3.3504638671875, 3.460113525390625, 3.56976318359375, 3.679412841796875, 3.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 26.0, 27.0, 65.0, 109.0, 271.0, 1052.0, 102597.0, 942429.0, 1327.0, 339.0, 119.0, 71.0, 34.0, 17.0, 15.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43359375, -0.4204826354980469, -0.40737152099609375, -0.3942604064941406, -0.3811492919921875, -0.3680381774902344, -0.35492706298828125, -0.3418159484863281, -0.328704833984375, -0.3155937194824219, -0.30248260498046875, -0.2893714904785156, -0.2762603759765625, -0.2631492614746094, -0.25003814697265625, -0.23692703247070312, -0.22381591796875, -0.21070480346679688, -0.19759368896484375, -0.18448257446289062, -0.1713714599609375, -0.15826034545898438, -0.14514923095703125, -0.13203811645507812, -0.118927001953125, -0.10581588745117188, -0.09270477294921875, -0.07959365844726562, -0.0664825439453125, -0.053371429443359375, -0.04026031494140625, -0.027149200439453125, -0.0140380859375, -0.000926971435546875, 0.01218414306640625, 0.025295257568359375, 0.0384063720703125, 0.051517486572265625, 0.06462860107421875, 0.07773971557617188, 0.090850830078125, 0.10396194458007812, 0.11707305908203125, 0.13018417358398438, 0.1432952880859375, 0.15640640258789062, 0.16951751708984375, 0.18262863159179688, 0.19573974609375, 0.20885086059570312, 0.22196197509765625, 0.23507308959960938, 0.2481842041015625, 0.2612953186035156, 0.27440643310546875, 0.2875175476074219, 0.300628662109375, 0.3137397766113281, 0.32685089111328125, 0.3399620056152344, 0.3530731201171875, 0.3661842346191406, 0.37929534912109375, 0.3924064636230469, 0.405517578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 15.0, 20.0, 34.0, 64.0, 116.0, 173.0, 189.0, 141.0, 80.0, 44.0, 24.0, 24.0, 15.0, 17.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.854534149169922e-05, -6.659794598817825e-05, -6.465055048465729e-05, -6.270315498113632e-05, -6.0755759477615356e-05, -5.880836397409439e-05, -5.6860968470573425e-05, -5.491357296705246e-05, -5.2966177463531494e-05, -5.101878196001053e-05, -4.907138645648956e-05, -4.71239909529686e-05, -4.517659544944763e-05, -4.3229199945926666e-05, -4.12818044424057e-05, -3.9334408938884735e-05, -3.738701343536377e-05, -3.5439617931842804e-05, -3.349222242832184e-05, -3.154482692480087e-05, -2.9597431421279907e-05, -2.765003591775894e-05, -2.5702640414237976e-05, -2.375524491071701e-05, -2.1807849407196045e-05, -1.986045390367508e-05, -1.7913058400154114e-05, -1.5965662896633148e-05, -1.4018267393112183e-05, -1.2070871889591217e-05, -1.0123476386070251e-05, -8.176080882549286e-06, -6.22868537902832e-06, -4.281289875507355e-06, -2.333894371986389e-06, -3.864988684654236e-07, 1.560896635055542e-06, 3.5082921385765076e-06, 5.455687642097473e-06, 7.403083145618439e-06, 9.350478649139404e-06, 1.129787415266037e-05, 1.3245269656181335e-05, 1.5192665159702301e-05, 1.7140060663223267e-05, 1.9087456166744232e-05, 2.1034851670265198e-05, 2.2982247173786163e-05, 2.492964267730713e-05, 2.6877038180828094e-05, 2.882443368434906e-05, 3.0771829187870026e-05, 3.271922469139099e-05, 3.466662019491196e-05, 3.661401569843292e-05, 3.856141120195389e-05, 4.0508806705474854e-05, 4.245620220899582e-05, 4.4403597712516785e-05, 4.635099321603775e-05, 4.8298388719558716e-05, 5.024578422307968e-05, 5.219317972660065e-05, 5.414057523012161e-05, 5.608797073364258e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 12.0, 11.0, 13.0, 15.0, 39.0, 84.0, 218.0, 619.0, 2915.0, 74654.0, 962355.0, 6172.0, 916.0, 280.0, 112.0, 58.0, 27.0, 21.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41943359375, -0.4078407287597656, -0.39624786376953125, -0.3846549987792969, -0.3730621337890625, -0.3614692687988281, -0.34987640380859375, -0.3382835388183594, -0.326690673828125, -0.3150978088378906, -0.30350494384765625, -0.2919120788574219, -0.2803192138671875, -0.2687263488769531, -0.25713348388671875, -0.24554061889648438, -0.23394775390625, -0.22235488891601562, -0.21076202392578125, -0.19916915893554688, -0.1875762939453125, -0.17598342895507812, -0.16439056396484375, -0.15279769897460938, -0.141204833984375, -0.12961196899414062, -0.11801910400390625, -0.10642623901367188, -0.0948333740234375, -0.08324050903320312, -0.07164764404296875, -0.060054779052734375, -0.0484619140625, -0.036869049072265625, -0.02527618408203125, -0.013683319091796875, -0.0020904541015625, 0.009502410888671875, 0.02109527587890625, 0.032688140869140625, 0.044281005859375, 0.055873870849609375, 0.06746673583984375, 0.07905960083007812, 0.0906524658203125, 0.10224533081054688, 0.11383819580078125, 0.12543106079101562, 0.13702392578125, 0.14861679077148438, 0.16020965576171875, 0.17180252075195312, 0.1833953857421875, 0.19498825073242188, 0.20658111572265625, 0.21817398071289062, 0.229766845703125, 0.24135971069335938, 0.25295257568359375, 0.2645454406738281, 0.2761383056640625, 0.2877311706542969, 0.29932403564453125, 0.3109169006347656, 0.322509765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 0.0, 4.0, 6.0, 12.0, 12.0, 18.0, 25.0, 33.0, 132.0, 415.0, 181.0, 71.0, 33.0, 13.0, 15.0, 7.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054351806640625, -0.0525212287902832, -0.050690650939941406, -0.04886007308959961, -0.04702949523925781, -0.045198917388916016, -0.04336833953857422, -0.04153776168823242, -0.039707183837890625, -0.03787660598754883, -0.03604602813720703, -0.034215450286865234, -0.03238487243652344, -0.03055429458618164, -0.028723716735839844, -0.026893138885498047, -0.02506256103515625, -0.023231983184814453, -0.021401405334472656, -0.01957082748413086, -0.017740249633789062, -0.015909671783447266, -0.014079093933105469, -0.012248516082763672, -0.010417938232421875, -0.008587360382080078, -0.006756782531738281, -0.004926204681396484, -0.0030956268310546875, -0.0012650489807128906, 0.0005655288696289062, 0.002396106719970703, 0.0042266845703125, 0.006057262420654297, 0.007887840270996094, 0.00971841812133789, 0.011548995971679688, 0.013379573822021484, 0.015210151672363281, 0.017040729522705078, 0.018871307373046875, 0.020701885223388672, 0.02253246307373047, 0.024363040924072266, 0.026193618774414062, 0.02802419662475586, 0.029854774475097656, 0.03168535232543945, 0.03351593017578125, 0.03534650802612305, 0.037177085876464844, 0.03900766372680664, 0.04083824157714844, 0.042668819427490234, 0.04449939727783203, 0.04632997512817383, 0.048160552978515625, 0.04999113082885742, 0.05182170867919922, 0.053652286529541016, 0.05548286437988281, 0.05731344223022461, 0.059144020080566406, 0.0609745979309082, 0.06280517578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 6.0, 8.0, 9.0, 21.0, 41.0, 71.0, 126.0, 203.0, 176.0, 141.0, 78.0, 38.0, 21.0, 14.0, 13.0, 5.0, 7.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.707956790924072, -4.5609540939331055, -4.4139509201049805, -4.2669477462768555, -4.119945049285889, -3.9729421138763428, -3.825939178466797, -3.678936243057251, -3.531933307647705, -3.384930372238159, -3.2379274368286133, -3.0909245014190674, -2.9439215660095215, -2.7969186305999756, -2.6499156951904297, -2.502912759780884, -2.355909824371338, -2.208906888961792, -2.061903953552246, -1.9149010181427002, -1.7678980827331543, -1.6208951473236084, -1.4738922119140625, -1.3268892765045166, -1.1798863410949707, -1.0328834056854248, -0.8858804702758789, -0.738877534866333, -0.5918745994567871, -0.4448716640472412, -0.2978687286376953, -0.15086579322814941, -0.0038628578186035156, 0.14314007759094238, 0.2901430130004883, 0.4371459484100342, 0.5841488838195801, 0.731151819229126, 0.8781547546386719, 1.0251576900482178, 1.1721606254577637, 1.3191635608673096, 1.4661664962768555, 1.6131694316864014, 1.7601723670959473, 1.9071753025054932, 2.054178237915039, 2.201181173324585, 2.348184108734131, 2.4951870441436768, 2.6421899795532227, 2.7891929149627686, 2.9361958503723145, 3.0831987857818604, 3.2302017211914062, 3.377204656600952, 3.524207592010498, 3.671210527420044, 3.81821346282959, 3.9652163982391357, 4.112219333648682, 4.259222030639648, 4.406225204467773, 4.553228378295898, 4.700231075286865]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 18.0, 26.0, 37.0, 50.0, 64.0, 96.0, 92.0, 116.0, 105.0, 97.0, 78.0, 59.0, 33.0, 26.0, 20.0, 15.0, 8.0, 13.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.16665506362915, -4.053471088409424, -3.940286636352539, -3.8271026611328125, -3.713918447494507, -3.600734233856201, -3.4875502586364746, -3.374366044998169, -3.2611818313598633, -3.1479976177215576, -3.034813404083252, -2.9216294288635254, -2.8084452152252197, -2.695261001586914, -2.5820770263671875, -2.468892812728882, -2.355708599090576, -2.2425243854522705, -2.129340171813965, -2.0161561965942383, -1.9029719829559326, -1.789787769317627, -1.6766036748886108, -1.5634195804595947, -1.450235366821289, -1.3370511531829834, -1.2238670587539673, -1.1106829643249512, -0.9974987506866455, -0.8843145966529846, -0.7711304426193237, -0.6579462885856628, -0.544762134552002, -0.43157798051834106, -0.3183938264846802, -0.2052096724510193, -0.0920255184173584, 0.02115863561630249, 0.13434278964996338, 0.24752694368362427, 0.36071109771728516, 0.47389525175094604, 0.5870794057846069, 0.7002635598182678, 0.8134477138519287, 0.9266318678855896, 1.0398160219192505, 1.1530001163482666, 1.2661843299865723, 1.379368543624878, 1.492552638053894, 1.6057367324829102, 1.7189209461212158, 1.8321051597595215, 1.9452892541885376, 2.0584733486175537, 2.1716575622558594, 2.284841775894165, 2.3980259895324707, 2.5112099647521973, 2.624394178390503, 2.7375783920288086, 2.850762367248535, 2.963946580886841, 3.0771307945251465]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 9.0, 14.0, 18.0, 32.0, 42.0, 58.0, 130.0, 206.0, 699.0, 2366.0, 9859.0, 58700.0, 534805.0, 388478.0, 42334.0, 7747.0, 1945.0, 569.0, 243.0, 104.0, 50.0, 44.0, 15.0, 13.0, 13.0, 18.0, 11.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.34375, -5.206451416015625, -5.06915283203125, -4.931854248046875, -4.7945556640625, -4.657257080078125, -4.51995849609375, -4.382659912109375, -4.245361328125, -4.108062744140625, -3.97076416015625, -3.833465576171875, -3.6961669921875, -3.558868408203125, -3.42156982421875, -3.284271240234375, -3.14697265625, -3.009674072265625, -2.87237548828125, -2.735076904296875, -2.5977783203125, -2.460479736328125, -2.32318115234375, -2.185882568359375, -2.048583984375, -1.911285400390625, -1.77398681640625, -1.636688232421875, -1.4993896484375, -1.362091064453125, -1.22479248046875, -1.087493896484375, -0.9501953125, -0.812896728515625, -0.67559814453125, -0.538299560546875, -0.4010009765625, -0.263702392578125, -0.12640380859375, 0.010894775390625, 0.148193359375, 0.285491943359375, 0.42279052734375, 0.560089111328125, 0.6973876953125, 0.834686279296875, 0.97198486328125, 1.109283447265625, 1.24658203125, 1.383880615234375, 1.52117919921875, 1.658477783203125, 1.7957763671875, 1.933074951171875, 2.07037353515625, 2.207672119140625, 2.344970703125, 2.482269287109375, 2.61956787109375, 2.756866455078125, 2.8941650390625, 3.031463623046875, 3.16876220703125, 3.306060791015625, 3.443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 8.0, 14.0, 29.0, 42.0, 75.0, 133.0, 175.0, 185.0, 134.0, 83.0, 43.0, 29.0, 19.0, 8.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-20.234375, -19.82220458984375, -19.4100341796875, -18.99786376953125, -18.585693359375, -18.17352294921875, -17.7613525390625, -17.34918212890625, -16.93701171875, -16.52484130859375, -16.1126708984375, -15.70050048828125, -15.288330078125, -14.87615966796875, -14.4639892578125, -14.05181884765625, -13.6396484375, -13.22747802734375, -12.8153076171875, -12.40313720703125, -11.990966796875, -11.57879638671875, -11.1666259765625, -10.75445556640625, -10.34228515625, -9.93011474609375, -9.5179443359375, -9.10577392578125, -8.693603515625, -8.28143310546875, -7.8692626953125, -7.45709228515625, -7.044921875, -6.63275146484375, -6.2205810546875, -5.80841064453125, -5.396240234375, -4.98406982421875, -4.5718994140625, -4.15972900390625, -3.74755859375, -3.33538818359375, -2.9232177734375, -2.51104736328125, -2.098876953125, -1.68670654296875, -1.2745361328125, -0.86236572265625, -0.4501953125, -0.03802490234375, 0.3741455078125, 0.78631591796875, 1.198486328125, 1.61065673828125, 2.0228271484375, 2.43499755859375, 2.84716796875, 3.25933837890625, 3.6715087890625, 4.08367919921875, 4.495849609375, 4.90802001953125, 5.3201904296875, 5.73236083984375, 6.14453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 11.0, 22.0, 16.0, 23.0, 24.0, 29.0, 39.0, 61.0, 61.0, 81.0, 103.0, 140.0, 336.0, 1275.0, 13816.0, 736234.0, 287578.0, 6944.0, 847.0, 286.0, 133.0, 95.0, 74.0, 62.0, 58.0, 49.0, 27.0, 23.0, 19.0, 20.0, 14.0, 14.0, 9.0, 8.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.92999267578125, -7.6959228515625, -7.46185302734375, -7.227783203125, -6.99371337890625, -6.7596435546875, -6.52557373046875, -6.29150390625, -6.05743408203125, -5.8233642578125, -5.58929443359375, -5.355224609375, -5.12115478515625, -4.8870849609375, -4.65301513671875, -4.4189453125, -4.18487548828125, -3.9508056640625, -3.71673583984375, -3.482666015625, -3.24859619140625, -3.0145263671875, -2.78045654296875, -2.54638671875, -2.31231689453125, -2.0782470703125, -1.84417724609375, -1.610107421875, -1.37603759765625, -1.1419677734375, -0.90789794921875, -0.673828125, -0.43975830078125, -0.2056884765625, 0.02838134765625, 0.262451171875, 0.49652099609375, 0.7305908203125, 0.96466064453125, 1.19873046875, 1.43280029296875, 1.6668701171875, 1.90093994140625, 2.135009765625, 2.36907958984375, 2.6031494140625, 2.83721923828125, 3.0712890625, 3.30535888671875, 3.5394287109375, 3.77349853515625, 4.007568359375, 4.24163818359375, 4.4757080078125, 4.70977783203125, 4.94384765625, 5.17791748046875, 5.4119873046875, 5.64605712890625, 5.880126953125, 6.11419677734375, 6.3482666015625, 6.58233642578125, 6.81640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 5.0, 11.0, 11.0, 9.0, 19.0, 24.0, 25.0, 32.0, 31.0, 36.0, 31.0, 30.0, 46.0, 54.0, 58.0, 47.0, 50.0, 57.0, 40.0, 56.0, 38.0, 33.0, 37.0, 32.0, 33.0, 34.0, 23.0, 6.0, 16.0, 15.0, 11.0, 16.0, 7.0, 8.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9610595703125, -5.781494140625, -5.6019287109375, -5.42236328125, -5.2427978515625, -5.063232421875, -4.8836669921875, -4.7041015625, -4.5245361328125, -4.344970703125, -4.1654052734375, -3.98583984375, -3.8062744140625, -3.626708984375, -3.4471435546875, -3.267578125, -3.0880126953125, -2.908447265625, -2.7288818359375, -2.54931640625, -2.3697509765625, -2.190185546875, -2.0106201171875, -1.8310546875, -1.6514892578125, -1.471923828125, -1.2923583984375, -1.11279296875, -0.9332275390625, -0.753662109375, -0.5740966796875, -0.39453125, -0.2149658203125, -0.035400390625, 0.1441650390625, 0.32373046875, 0.5032958984375, 0.682861328125, 0.8624267578125, 1.0419921875, 1.2215576171875, 1.401123046875, 1.5806884765625, 1.76025390625, 1.9398193359375, 2.119384765625, 2.2989501953125, 2.478515625, 2.6580810546875, 2.837646484375, 3.0172119140625, 3.19677734375, 3.3763427734375, 3.555908203125, 3.7354736328125, 3.9150390625, 4.0946044921875, 4.274169921875, 4.4537353515625, 4.63330078125, 4.8128662109375, 4.992431640625, 5.1719970703125, 5.3515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 8.0, 20.0, 23.0, 28.0, 46.0, 71.0, 99.0, 130.0, 223.0, 351.0, 546.0, 958.0, 1801.0, 3995.0, 9184.0, 25557.0, 89091.0, 349610.0, 406424.0, 110080.0, 30522.0, 10558.0, 4304.0, 2131.0, 1125.0, 584.0, 362.0, 233.0, 155.0, 84.0, 62.0, 45.0, 35.0, 19.0, 21.0, 14.0, 12.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62158203125, -0.6002044677734375, -0.578826904296875, -0.5574493408203125, -0.53607177734375, -0.5146942138671875, -0.493316650390625, -0.4719390869140625, -0.4505615234375, -0.4291839599609375, -0.407806396484375, -0.3864288330078125, -0.36505126953125, -0.3436737060546875, -0.322296142578125, -0.3009185791015625, -0.279541015625, -0.2581634521484375, -0.236785888671875, -0.2154083251953125, -0.19403076171875, -0.1726531982421875, -0.151275634765625, -0.1298980712890625, -0.1085205078125, -0.0871429443359375, -0.065765380859375, -0.0443878173828125, -0.02301025390625, -0.0016326904296875, 0.019744873046875, 0.0411224365234375, 0.0625, 0.0838775634765625, 0.105255126953125, 0.1266326904296875, 0.14801025390625, 0.1693878173828125, 0.190765380859375, 0.2121429443359375, 0.2335205078125, 0.2548980712890625, 0.276275634765625, 0.2976531982421875, 0.31903076171875, 0.3404083251953125, 0.361785888671875, 0.3831634521484375, 0.404541015625, 0.4259185791015625, 0.447296142578125, 0.4686737060546875, 0.49005126953125, 0.5114288330078125, 0.532806396484375, 0.5541839599609375, 0.5755615234375, 0.5969390869140625, 0.618316650390625, 0.6396942138671875, 0.66107177734375, 0.6824493408203125, 0.703826904296875, 0.7252044677734375, 0.74658203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 15.0, 13.0, 16.0, 13.0, 22.0, 16.0, 20.0, 27.0, 29.0, 59.0, 63.0, 59.0, 67.0, 83.0, 70.0, 70.0, 69.0, 51.0, 45.0, 44.0, 30.0, 27.0, 12.0, 19.0, 12.0, 10.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.0001506805419921875, -0.0001467997208237648, -0.0001429188996553421, -0.0001390380784869194, -0.0001351572573184967, -0.000131276436150074, -0.0001273956149816513, -0.0001235147938132286, -0.00011963397264480591, -0.00011575315147638321, -0.00011187233030796051, -0.00010799150913953781, -0.00010411068797111511, -0.00010022986680269241, -9.634904563426971e-05, -9.246822446584702e-05, -8.858740329742432e-05, -8.470658212900162e-05, -8.082576096057892e-05, -7.694493979215622e-05, -7.306411862373352e-05, -6.918329745531082e-05, -6.530247628688812e-05, -6.142165511846542e-05, -5.7540833950042725e-05, -5.3660012781620026e-05, -4.977919161319733e-05, -4.589837044477463e-05, -4.201754927635193e-05, -3.813672810792923e-05, -3.425590693950653e-05, -3.0375085771083832e-05, -2.6494264602661133e-05, -2.2613443434238434e-05, -1.8732622265815735e-05, -1.4851801097393036e-05, -1.0970979928970337e-05, -7.090158760547638e-06, -3.209337592124939e-06, 6.7148357629776e-07, 4.552304744720459e-06, 8.433125913143158e-06, 1.2313947081565857e-05, 1.6194768249988556e-05, 2.0075589418411255e-05, 2.3956410586833954e-05, 2.7837231755256653e-05, 3.171805292367935e-05, 3.559887409210205e-05, 3.947969526052475e-05, 4.336051642894745e-05, 4.724133759737015e-05, 5.112215876579285e-05, 5.5002979934215546e-05, 5.8883801102638245e-05, 6.276462227106094e-05, 6.664544343948364e-05, 7.052626460790634e-05, 7.440708577632904e-05, 7.828790694475174e-05, 8.216872811317444e-05, 8.604954928159714e-05, 8.993037045001984e-05, 9.381119161844254e-05, 9.769201278686523e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 14.0, 19.0, 29.0, 60.0, 93.0, 133.0, 231.0, 411.0, 888.0, 2141.0, 5887.0, 21092.0, 125070.0, 649186.0, 200632.0, 30300.0, 7507.0, 2590.0, 1078.0, 522.0, 300.0, 143.0, 76.0, 46.0, 35.0, 20.0, 13.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.912017822265625, -0.87774658203125, -0.843475341796875, -0.8092041015625, -0.774932861328125, -0.74066162109375, -0.706390380859375, -0.672119140625, -0.637847900390625, -0.60357666015625, -0.569305419921875, -0.5350341796875, -0.500762939453125, -0.46649169921875, -0.432220458984375, -0.39794921875, -0.363677978515625, -0.32940673828125, -0.295135498046875, -0.2608642578125, -0.226593017578125, -0.19232177734375, -0.158050537109375, -0.123779296875, -0.089508056640625, -0.05523681640625, -0.020965576171875, 0.0133056640625, 0.047576904296875, 0.08184814453125, 0.116119384765625, 0.150390625, 0.184661865234375, 0.21893310546875, 0.253204345703125, 0.2874755859375, 0.321746826171875, 0.35601806640625, 0.390289306640625, 0.424560546875, 0.458831787109375, 0.49310302734375, 0.527374267578125, 0.5616455078125, 0.595916748046875, 0.63018798828125, 0.664459228515625, 0.69873046875, 0.733001708984375, 0.76727294921875, 0.801544189453125, 0.8358154296875, 0.870086669921875, 0.90435791015625, 0.938629150390625, 0.972900390625, 1.007171630859375, 1.04144287109375, 1.075714111328125, 1.1099853515625, 1.144256591796875, 1.17852783203125, 1.212799072265625, 1.2470703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 3.0, 9.0, 8.0, 14.0, 22.0, 20.0, 28.0, 32.0, 31.0, 63.0, 80.0, 80.0, 84.0, 70.0, 74.0, 77.0, 51.0, 62.0, 29.0, 41.0, 24.0, 21.0, 19.0, 13.0, 8.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.505859375, -0.4915199279785156, -0.47718048095703125, -0.4628410339355469, -0.4485015869140625, -0.4341621398925781, -0.41982269287109375, -0.4054832458496094, -0.391143798828125, -0.3768043518066406, -0.36246490478515625, -0.3481254577636719, -0.3337860107421875, -0.3194465637207031, -0.30510711669921875, -0.2907676696777344, -0.27642822265625, -0.2620887756347656, -0.24774932861328125, -0.23340988159179688, -0.2190704345703125, -0.20473098754882812, -0.19039154052734375, -0.17605209350585938, -0.161712646484375, -0.14737319946289062, -0.13303375244140625, -0.11869430541992188, -0.1043548583984375, -0.09001541137695312, -0.07567596435546875, -0.061336517333984375, -0.0469970703125, -0.032657623291015625, -0.01831817626953125, -0.003978729248046875, 0.0103607177734375, 0.024700164794921875, 0.03903961181640625, 0.053379058837890625, 0.067718505859375, 0.08205795288085938, 0.09639739990234375, 0.11073684692382812, 0.1250762939453125, 0.13941574096679688, 0.15375518798828125, 0.16809463500976562, 0.18243408203125, 0.19677352905273438, 0.21111297607421875, 0.22545242309570312, 0.2397918701171875, 0.2541313171386719, 0.26847076416015625, 0.2828102111816406, 0.297149658203125, 0.3114891052246094, 0.32582855224609375, 0.3401679992675781, 0.3545074462890625, 0.3688468933105469, 0.38318634033203125, 0.3975257873535156, 0.411865234375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 6.0, 21.0, 63.0, 197.0, 344.0, 212.0, 82.0, 35.0, 17.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.076003074645996, -7.522428512573242, -6.96885347366333, -6.415278911590576, -5.861703872680664, -5.30812931060791, -4.754554748535156, -4.200980186462402, -3.6474051475524902, -3.0938303470611572, -2.540255546569824, -1.9866809844970703, -1.4331061840057373, -0.8795313835144043, -0.3259568214416504, 0.22761797904968262, 0.7811927795410156, 1.3347675800323486, 1.888342261314392, 2.4419169425964355, 2.9954917430877686, 3.5490665435791016, 4.1026411056518555, 4.656215667724609, 5.2097907066345215, 5.763365268707275, 6.3169403076171875, 6.870514869689941, 7.424089431762695, 7.977664470672607, 8.531238555908203, 9.084814071655273, 9.638389587402344, 10.191964149475098, 10.745538711547852, 11.299114227294922, 11.852688789367676, 12.40626335144043, 12.959837913513184, 13.513412475585938, 14.066987991333008, 14.620562553405762, 15.174137115478516, 15.727712631225586, 16.281286239624023, 16.834861755371094, 17.38843536376953, 17.9420108795166, 18.495586395263672, 19.049161911010742, 19.60273551940918, 20.15631103515625, 20.709884643554688, 21.263460159301758, 21.817035675048828, 22.370609283447266, 22.924182891845703, 23.477758407592773, 24.03133201599121, 24.58490753173828, 25.13848114013672, 25.69205665588379, 26.24563217163086, 26.799205780029297, 27.352781295776367]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 14.0, 15.0, 9.0, 28.0, 35.0, 36.0, 45.0, 57.0, 57.0, 74.0, 54.0, 71.0, 66.0, 71.0, 73.0, 58.0, 50.0, 39.0, 32.0, 24.0, 28.0, 17.0, 14.0, 12.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.78019905090332, -17.322389602661133, -16.864580154418945, -16.406770706176758, -15.948962211608887, -15.4911527633667, -15.033343315124512, -14.575533866882324, -14.117724418640137, -13.65991497039795, -13.202105522155762, -12.74429702758789, -12.286487579345703, -11.828678131103516, -11.370868682861328, -10.91305923461914, -10.455249786376953, -9.997440338134766, -9.539630889892578, -9.08182144165039, -8.62401294708252, -8.166203498840332, -7.7083940505981445, -7.250584602355957, -6.792776107788086, -6.334966659545898, -5.877157688140869, -5.419348239898682, -4.961538791656494, -4.503729820251465, -4.045920372009277, -3.58811092376709, -3.1303014755249023, -2.672492265701294, -2.2146828174591064, -1.756873607635498, -1.2990642786026, -0.8412549495697021, -0.38344573974609375, 0.07436370849609375, 0.5321729183197021, 0.9899822473526001, 1.447791576385498, 1.9056007862091064, 2.363409996032715, 2.8212194442749023, 3.2790286540985107, 3.7368381023406982, 4.194647312164307, 4.652456760406494, 5.110265731811523, 5.568075180053711, 6.025884628295898, 6.483694076538086, 6.941503047943115, 7.399312496185303, 7.857121467590332, 8.31493091583252, 8.772740364074707, 9.230548858642578, 9.688358306884766, 10.146167755126953, 10.60397720336914, 11.061786651611328, 11.519596099853516]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 11.0, 6.0, 20.0, 12.0, 25.0, 35.0, 52.0, 68.0, 126.0, 183.0, 345.0, 638.0, 1642.0, 4855.0, 20155.0, 161195.0, 3690687.0, 277232.0, 27255.0, 5952.0, 2039.0, 764.0, 351.0, 201.0, 113.0, 90.0, 55.0, 41.0, 29.0, 24.0, 14.0, 17.0, 14.0, 9.0, 5.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.23828125, -5.08233642578125, -4.9263916015625, -4.77044677734375, -4.614501953125, -4.45855712890625, -4.3026123046875, -4.14666748046875, -3.99072265625, -3.83477783203125, -3.6788330078125, -3.52288818359375, -3.366943359375, -3.21099853515625, -3.0550537109375, -2.89910888671875, -2.7431640625, -2.58721923828125, -2.4312744140625, -2.27532958984375, -2.119384765625, -1.96343994140625, -1.8074951171875, -1.65155029296875, -1.49560546875, -1.33966064453125, -1.1837158203125, -1.02777099609375, -0.871826171875, -0.71588134765625, -0.5599365234375, -0.40399169921875, -0.248046875, -0.09210205078125, 0.0638427734375, 0.21978759765625, 0.375732421875, 0.53167724609375, 0.6876220703125, 0.84356689453125, 0.99951171875, 1.15545654296875, 1.3114013671875, 1.46734619140625, 1.623291015625, 1.77923583984375, 1.9351806640625, 2.09112548828125, 2.2470703125, 2.40301513671875, 2.5589599609375, 2.71490478515625, 2.870849609375, 3.02679443359375, 3.1827392578125, 3.33868408203125, 3.49462890625, 3.65057373046875, 3.8065185546875, 3.96246337890625, 4.118408203125, 4.27435302734375, 4.4302978515625, 4.58624267578125, 4.7421875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 11.0, 11.0, 21.0, 22.0, 28.0, 65.0, 66.0, 83.0, 100.0, 115.0, 102.0, 111.0, 75.0, 55.0, 43.0, 29.0, 25.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.24700927734375, -5.0916748046875, -4.93634033203125, -4.781005859375, -4.62567138671875, -4.4703369140625, -4.31500244140625, -4.15966796875, -4.00433349609375, -3.8489990234375, -3.69366455078125, -3.538330078125, -3.38299560546875, -3.2276611328125, -3.07232666015625, -2.9169921875, -2.76165771484375, -2.6063232421875, -2.45098876953125, -2.295654296875, -2.14031982421875, -1.9849853515625, -1.82965087890625, -1.67431640625, -1.51898193359375, -1.3636474609375, -1.20831298828125, -1.052978515625, -0.89764404296875, -0.7423095703125, -0.58697509765625, -0.431640625, -0.27630615234375, -0.1209716796875, 0.03436279296875, 0.189697265625, 0.34503173828125, 0.5003662109375, 0.65570068359375, 0.81103515625, 0.96636962890625, 1.1217041015625, 1.27703857421875, 1.432373046875, 1.58770751953125, 1.7430419921875, 1.89837646484375, 2.0537109375, 2.20904541015625, 2.3643798828125, 2.51971435546875, 2.675048828125, 2.83038330078125, 2.9857177734375, 3.14105224609375, 3.29638671875, 3.45172119140625, 3.6070556640625, 3.76239013671875, 3.917724609375, 4.07305908203125, 4.2283935546875, 4.38372802734375, 4.5390625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 5.0, 10.0, 9.0, 15.0, 9.0, 16.0, 30.0, 46.0, 55.0, 94.0, 145.0, 241.0, 710.0, 3420.0, 40744.0, 4011846.0, 128973.0, 6085.0, 1024.0, 346.0, 145.0, 70.0, 51.0, 34.0, 32.0, 23.0, 10.0, 11.0, 9.0, 12.0, 7.0, 6.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7421875, -9.45263671875, -9.1630859375, -8.87353515625, -8.583984375, -8.29443359375, -8.0048828125, -7.71533203125, -7.42578125, -7.13623046875, -6.8466796875, -6.55712890625, -6.267578125, -5.97802734375, -5.6884765625, -5.39892578125, -5.109375, -4.81982421875, -4.5302734375, -4.24072265625, -3.951171875, -3.66162109375, -3.3720703125, -3.08251953125, -2.79296875, -2.50341796875, -2.2138671875, -1.92431640625, -1.634765625, -1.34521484375, -1.0556640625, -0.76611328125, -0.4765625, -0.18701171875, 0.1025390625, 0.39208984375, 0.681640625, 0.97119140625, 1.2607421875, 1.55029296875, 1.83984375, 2.12939453125, 2.4189453125, 2.70849609375, 2.998046875, 3.28759765625, 3.5771484375, 3.86669921875, 4.15625, 4.44580078125, 4.7353515625, 5.02490234375, 5.314453125, 5.60400390625, 5.8935546875, 6.18310546875, 6.47265625, 6.76220703125, 7.0517578125, 7.34130859375, 7.630859375, 7.92041015625, 8.2099609375, 8.49951171875, 8.7890625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 7.0, 4.0, 4.0, 19.0, 12.0, 13.0, 27.0, 26.0, 44.0, 49.0, 50.0, 75.0, 110.0, 158.0, 262.0, 480.0, 1117.0, 582.0, 304.0, 183.0, 116.0, 105.0, 55.0, 57.0, 46.0, 30.0, 31.0, 14.0, 19.0, 12.0, 5.0, 11.0, 3.0, 4.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6170501708984375, -0.592987060546875, -0.5689239501953125, -0.54486083984375, -0.5207977294921875, -0.496734619140625, -0.4726715087890625, -0.4486083984375, -0.4245452880859375, -0.400482177734375, -0.3764190673828125, -0.35235595703125, -0.3282928466796875, -0.304229736328125, -0.2801666259765625, -0.256103515625, -0.2320404052734375, -0.207977294921875, -0.1839141845703125, -0.15985107421875, -0.1357879638671875, -0.111724853515625, -0.0876617431640625, -0.0635986328125, -0.0395355224609375, -0.015472412109375, 0.0085906982421875, 0.03265380859375, 0.0567169189453125, 0.080780029296875, 0.1048431396484375, 0.12890625, 0.1529693603515625, 0.177032470703125, 0.2010955810546875, 0.22515869140625, 0.2492218017578125, 0.273284912109375, 0.2973480224609375, 0.3214111328125, 0.3454742431640625, 0.369537353515625, 0.3936004638671875, 0.41766357421875, 0.4417266845703125, 0.465789794921875, 0.4898529052734375, 0.513916015625, 0.5379791259765625, 0.562042236328125, 0.5861053466796875, 0.61016845703125, 0.6342315673828125, 0.658294677734375, 0.6823577880859375, 0.7064208984375, 0.7304840087890625, 0.754547119140625, 0.7786102294921875, 0.80267333984375, 0.8267364501953125, 0.850799560546875, 0.8748626708984375, 0.89892578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 17.0, 21.0, 40.0, 68.0, 152.0, 172.0, 186.0, 123.0, 78.0, 48.0, 26.0, 13.0, 12.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.059237003326416, -6.852049827575684, -6.644863128662109, -6.437675952911377, -6.2304887771606445, -6.023301601409912, -5.81611442565918, -5.6089277267456055, -5.401740550994873, -5.194553375244141, -4.987366676330566, -4.780179500579834, -4.572992324829102, -4.365805149078369, -4.158617973327637, -3.9514312744140625, -3.74424409866333, -3.5370569229125977, -3.3298699855804443, -3.122683048248291, -2.9154958724975586, -2.708308696746826, -2.501121759414673, -2.2939348220825195, -2.086747646331787, -1.8795605897903442, -1.6723735332489014, -1.4651864767074585, -1.2579994201660156, -1.0508123636245728, -0.8436253070831299, -0.636438250541687, -0.42925071716308594, -0.22206366062164307, -0.014876604080200195, 0.19231045246124268, 0.39949750900268555, 0.6066845655441284, 0.8138716220855713, 1.0210586786270142, 1.228245735168457, 1.4354327917099, 1.6426198482513428, 1.8498069047927856, 2.0569939613342285, 2.264181137084961, 2.4713680744171143, 2.6785550117492676, 2.8857421875, 3.0929293632507324, 3.3001163005828857, 3.507303237915039, 3.7144904136657715, 3.921677589416504, 4.128864288330078, 4.3360514640808105, 4.543238639831543, 4.750425815582275, 4.957612991333008, 5.164799690246582, 5.3719868659973145, 5.579174041748047, 5.786360740661621, 5.9935479164123535, 6.200735092163086]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 10.0, 11.0, 14.0, 17.0, 30.0, 40.0, 49.0, 49.0, 75.0, 83.0, 88.0, 83.0, 103.0, 63.0, 68.0, 65.0, 39.0, 29.0, 21.0, 13.0, 15.0, 9.0, 11.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.132678031921387, -4.987570285797119, -4.842462539672852, -4.697354793548584, -4.552247047424316, -4.407139301300049, -4.262031555175781, -4.1169233322143555, -3.971815824508667, -3.8267080783843994, -3.681600332260132, -3.5364925861358643, -3.3913846015930176, -3.24627685546875, -3.1011691093444824, -2.956061363220215, -2.8109536170959473, -2.6658458709716797, -2.520738124847412, -2.3756303787231445, -2.230522632598877, -2.0854148864746094, -1.9403069019317627, -1.7951991558074951, -1.6500914096832275, -1.50498366355896, -1.3598759174346924, -1.2147680521011353, -1.0696603059768677, -0.9245525598526001, -0.7794447541236877, -0.6343369483947754, -0.4892292022705078, -0.34412142634391785, -0.19901365041732788, -0.053905874490737915, 0.09120190143585205, 0.23630964756011963, 0.381417453289032, 0.5265252590179443, 0.6716330051422119, 0.8167407512664795, 0.9618485569953918, 1.1069563627243042, 1.2520641088485718, 1.3971718549728394, 1.5422797203063965, 1.687387466430664, 1.8324952125549316, 1.9776029586791992, 2.122710704803467, 2.2678184509277344, 2.412926197052002, 2.5580339431762695, 2.703141927719116, 2.848249673843384, 2.9933574199676514, 3.138465166091919, 3.2835729122161865, 3.428680658340454, 3.573788642883301, 3.7188963890075684, 3.864004135131836, 4.0091118812561035, 4.154219627380371]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 7.0, 10.0, 8.0, 17.0, 33.0, 39.0, 72.0, 128.0, 224.0, 386.0, 862.0, 2158.0, 6433.0, 27595.0, 249993.0, 671332.0, 70686.0, 12372.0, 3584.0, 1288.0, 573.0, 284.0, 162.0, 99.0, 55.0, 26.0, 25.0, 22.0, 10.0, 14.0, 5.0, 10.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.4443359375, -0.43271636962890625, -0.4210968017578125, -0.40947723388671875, -0.397857666015625, -0.38623809814453125, -0.3746185302734375, -0.36299896240234375, -0.35137939453125, -0.33975982666015625, -0.3281402587890625, -0.31652069091796875, -0.304901123046875, -0.29328155517578125, -0.2816619873046875, -0.27004241943359375, -0.2584228515625, -0.24680328369140625, -0.2351837158203125, -0.22356414794921875, -0.211944580078125, -0.20032501220703125, -0.1887054443359375, -0.17708587646484375, -0.16546630859375, -0.15384674072265625, -0.1422271728515625, -0.13060760498046875, -0.118988037109375, -0.10736846923828125, -0.0957489013671875, -0.08412933349609375, -0.072509765625, -0.06089019775390625, -0.0492706298828125, -0.03765106201171875, -0.026031494140625, -0.01441192626953125, -0.0027923583984375, 0.00882720947265625, 0.02044677734375, 0.03206634521484375, 0.0436859130859375, 0.05530548095703125, 0.066925048828125, 0.07854461669921875, 0.0901641845703125, 0.10178375244140625, 0.1134033203125, 0.12502288818359375, 0.1366424560546875, 0.14826202392578125, 0.159881591796875, 0.17150115966796875, 0.1831207275390625, 0.19474029541015625, 0.20635986328125, 0.21797943115234375, 0.2295989990234375, 0.24121856689453125, 0.252838134765625, 0.26445770263671875, 0.2760772705078125, 0.28769683837890625, 0.29931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 26.0, 37.0, 41.0, 59.0, 74.0, 104.0, 117.0, 123.0, 109.0, 97.0, 50.0, 52.0, 25.0, 18.0, 11.0, 11.0, 11.0, 5.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.614105224609375, -4.48602294921875, -4.357940673828125, -4.2298583984375, -4.101776123046875, -3.97369384765625, -3.845611572265625, -3.717529296875, -3.589447021484375, -3.46136474609375, -3.333282470703125, -3.2052001953125, -3.077117919921875, -2.94903564453125, -2.820953369140625, -2.69287109375, -2.564788818359375, -2.43670654296875, -2.308624267578125, -2.1805419921875, -2.052459716796875, -1.92437744140625, -1.796295166015625, -1.668212890625, -1.540130615234375, -1.41204833984375, -1.283966064453125, -1.1558837890625, -1.027801513671875, -0.89971923828125, -0.771636962890625, -0.6435546875, -0.515472412109375, -0.38739013671875, -0.259307861328125, -0.1312255859375, -0.003143310546875, 0.12493896484375, 0.253021240234375, 0.381103515625, 0.509185791015625, 0.63726806640625, 0.765350341796875, 0.8934326171875, 1.021514892578125, 1.14959716796875, 1.277679443359375, 1.40576171875, 1.533843994140625, 1.66192626953125, 1.790008544921875, 1.9180908203125, 2.046173095703125, 2.17425537109375, 2.302337646484375, 2.430419921875, 2.558502197265625, 2.68658447265625, 2.814666748046875, 2.9427490234375, 3.070831298828125, 3.19891357421875, 3.326995849609375, 3.455078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 17.0, 15.0, 14.0, 22.0, 29.0, 39.0, 56.0, 83.0, 131.0, 203.0, 364.0, 757.0, 2969.0, 34023.0, 692449.0, 300210.0, 13762.0, 1932.0, 587.0, 284.0, 156.0, 112.0, 87.0, 45.0, 46.0, 36.0, 26.0, 13.0, 13.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3572883605957031, -0.34397125244140625, -0.3306541442871094, -0.3173370361328125, -0.3040199279785156, -0.29070281982421875, -0.2773857116699219, -0.264068603515625, -0.2507514953613281, -0.23743438720703125, -0.22411727905273438, -0.2108001708984375, -0.19748306274414062, -0.18416595458984375, -0.17084884643554688, -0.15753173828125, -0.14421463012695312, -0.13089752197265625, -0.11758041381835938, -0.1042633056640625, -0.09094619750976562, -0.07762908935546875, -0.06431198120117188, -0.050994873046875, -0.037677764892578125, -0.02436065673828125, -0.011043548583984375, 0.0022735595703125, 0.015590667724609375, 0.02890777587890625, 0.042224884033203125, 0.0555419921875, 0.06885910034179688, 0.08217620849609375, 0.09549331665039062, 0.1088104248046875, 0.12212753295898438, 0.13544464111328125, 0.14876174926757812, 0.162078857421875, 0.17539596557617188, 0.18871307373046875, 0.20203018188476562, 0.2153472900390625, 0.22866439819335938, 0.24198150634765625, 0.2552986145019531, 0.26861572265625, 0.2819328308105469, 0.29524993896484375, 0.3085670471191406, 0.3218841552734375, 0.3352012634277344, 0.34851837158203125, 0.3618354797363281, 0.375152587890625, 0.3884696960449219, 0.40178680419921875, 0.4151039123535156, 0.4284210205078125, 0.4417381286621094, 0.45505523681640625, 0.4683723449707031, 0.481689453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 7.0, 6.0, 7.0, 6.0, 13.0, 12.0, 17.0, 16.0, 29.0, 37.0, 36.0, 32.0, 34.0, 49.0, 43.0, 63.0, 40.0, 57.0, 76.0, 37.0, 53.0, 46.0, 51.0, 40.0, 43.0, 36.0, 26.0, 17.0, 15.0, 16.0, 9.0, 5.0, 7.0, 4.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.73828125, -4.5946044921875, -4.450927734375, -4.3072509765625, -4.16357421875, -4.0198974609375, -3.876220703125, -3.7325439453125, -3.5888671875, -3.4451904296875, -3.301513671875, -3.1578369140625, -3.01416015625, -2.8704833984375, -2.726806640625, -2.5831298828125, -2.439453125, -2.2957763671875, -2.152099609375, -2.0084228515625, -1.86474609375, -1.7210693359375, -1.577392578125, -1.4337158203125, -1.2900390625, -1.1463623046875, -1.002685546875, -0.8590087890625, -0.71533203125, -0.5716552734375, -0.427978515625, -0.2843017578125, -0.140625, 0.0030517578125, 0.146728515625, 0.2904052734375, 0.43408203125, 0.5777587890625, 0.721435546875, 0.8651123046875, 1.0087890625, 1.1524658203125, 1.296142578125, 1.4398193359375, 1.58349609375, 1.7271728515625, 1.870849609375, 2.0145263671875, 2.158203125, 2.3018798828125, 2.445556640625, 2.5892333984375, 2.73291015625, 2.8765869140625, 3.020263671875, 3.1639404296875, 3.3076171875, 3.4512939453125, 3.594970703125, 3.7386474609375, 3.88232421875, 4.0260009765625, 4.169677734375, 4.3133544921875, 4.45703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 11.0, 5.0, 10.0, 16.0, 12.0, 33.0, 27.0, 53.0, 94.0, 182.0, 434.0, 1999.0, 128660.0, 913221.0, 2740.0, 531.0, 197.0, 105.0, 61.0, 36.0, 28.0, 11.0, 11.0, 13.0, 10.0, 6.0, 7.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.382080078125, -0.37230491638183594, -0.3625297546386719, -0.3527545928955078, -0.34297943115234375, -0.3332042694091797, -0.3234291076660156, -0.31365394592285156, -0.3038787841796875, -0.29410362243652344, -0.2843284606933594, -0.2745532989501953, -0.26477813720703125, -0.2550029754638672, -0.24522781372070312, -0.23545265197753906, -0.225677490234375, -0.21590232849121094, -0.20612716674804688, -0.1963520050048828, -0.18657684326171875, -0.1768016815185547, -0.16702651977539062, -0.15725135803222656, -0.1474761962890625, -0.13770103454589844, -0.12792587280273438, -0.11815071105957031, -0.10837554931640625, -0.09860038757324219, -0.08882522583007812, -0.07905006408691406, -0.06927490234375, -0.05949974060058594, -0.049724578857421875, -0.03994941711425781, -0.03017425537109375, -0.020399093627929688, -0.010623931884765625, -0.0008487701416015625, 0.0089263916015625, 0.018701553344726562, 0.028476715087890625, 0.03825187683105469, 0.04802703857421875, 0.05780220031738281, 0.06757736206054688, 0.07735252380371094, 0.087127685546875, 0.09690284729003906, 0.10667800903320312, 0.11645317077636719, 0.12622833251953125, 0.1360034942626953, 0.14577865600585938, 0.15555381774902344, 0.1653289794921875, 0.17510414123535156, 0.18487930297851562, 0.1946544647216797, 0.20442962646484375, 0.2142047882080078, 0.22397994995117188, 0.23375511169433594, 0.2435302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 6.0, 1.0, 8.0, 16.0, 10.0, 13.0, 16.0, 32.0, 33.0, 41.0, 53.0, 54.0, 78.0, 109.0, 89.0, 81.0, 59.0, 53.0, 44.0, 34.0, 27.0, 28.0, 28.0, 21.0, 8.0, 11.0, 11.0, 8.0, 4.0, 5.0, 1.0, 0.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2961368560791016e-05, -3.194250166416168e-05, -3.092363476753235e-05, -2.9904767870903015e-05, -2.888590097427368e-05, -2.7867034077644348e-05, -2.6848167181015015e-05, -2.582930028438568e-05, -2.4810433387756348e-05, -2.3791566491127014e-05, -2.277269959449768e-05, -2.1753832697868347e-05, -2.0734965801239014e-05, -1.971609890460968e-05, -1.8697232007980347e-05, -1.7678365111351013e-05, -1.665949821472168e-05, -1.5640631318092346e-05, -1.4621764421463013e-05, -1.360289752483368e-05, -1.2584030628204346e-05, -1.1565163731575012e-05, -1.0546296834945679e-05, -9.527429938316345e-06, -8.508563041687012e-06, -7.489696145057678e-06, -6.470829248428345e-06, -5.451962351799011e-06, -4.433095455169678e-06, -3.4142285585403442e-06, -2.3953616619110107e-06, -1.3764947652816772e-06, -3.5762786865234375e-07, 6.612390279769897e-07, 1.6801059246063232e-06, 2.6989728212356567e-06, 3.7178397178649902e-06, 4.736706614494324e-06, 5.755573511123657e-06, 6.774440407752991e-06, 7.793307304382324e-06, 8.812174201011658e-06, 9.831041097640991e-06, 1.0849907994270325e-05, 1.1868774890899658e-05, 1.2887641787528992e-05, 1.3906508684158325e-05, 1.4925375580787659e-05, 1.5944242477416992e-05, 1.6963109374046326e-05, 1.798197627067566e-05, 1.9000843167304993e-05, 2.0019710063934326e-05, 2.103857696056366e-05, 2.2057443857192993e-05, 2.3076310753822327e-05, 2.409517765045166e-05, 2.5114044547080994e-05, 2.6132911443710327e-05, 2.715177834033966e-05, 2.8170645236968994e-05, 2.9189512133598328e-05, 3.020837903022766e-05, 3.1227245926856995e-05, 3.224611282348633e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 10.0, 18.0, 19.0, 31.0, 55.0, 106.0, 246.0, 759.0, 3293.0, 39317.0, 977987.0, 23145.0, 2495.0, 616.0, 207.0, 93.0, 51.0, 33.0, 14.0, 15.0, 7.0, 5.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.30224609375, -0.29346466064453125, -0.2846832275390625, -0.27590179443359375, -0.267120361328125, -0.25833892822265625, -0.2495574951171875, -0.24077606201171875, -0.23199462890625, -0.22321319580078125, -0.2144317626953125, -0.20565032958984375, -0.196868896484375, -0.18808746337890625, -0.1793060302734375, -0.17052459716796875, -0.1617431640625, -0.15296173095703125, -0.1441802978515625, -0.13539886474609375, -0.126617431640625, -0.11783599853515625, -0.1090545654296875, -0.10027313232421875, -0.09149169921875, -0.08271026611328125, -0.0739288330078125, -0.06514739990234375, -0.056365966796875, -0.04758453369140625, -0.0388031005859375, -0.03002166748046875, -0.021240234375, -0.01245880126953125, -0.0036773681640625, 0.00510406494140625, 0.013885498046875, 0.02266693115234375, 0.0314483642578125, 0.04022979736328125, 0.04901123046875, 0.05779266357421875, 0.0665740966796875, 0.07535552978515625, 0.084136962890625, 0.09291839599609375, 0.1016998291015625, 0.11048126220703125, 0.1192626953125, 0.12804412841796875, 0.1368255615234375, 0.14560699462890625, 0.154388427734375, 0.16316986083984375, 0.1719512939453125, 0.18073272705078125, 0.18951416015625, 0.19829559326171875, 0.2070770263671875, 0.21585845947265625, 0.224639892578125, 0.23342132568359375, 0.2422027587890625, 0.25098419189453125, 0.259765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 9.0, 18.0, 9.0, 24.0, 51.0, 108.0, 269.0, 238.0, 93.0, 56.0, 22.0, 13.0, 17.0, 7.0, 11.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042510986328125, -0.041086673736572266, -0.03966236114501953, -0.0382380485534668, -0.03681373596191406, -0.03538942337036133, -0.033965110778808594, -0.03254079818725586, -0.031116485595703125, -0.02969217300415039, -0.028267860412597656, -0.026843547821044922, -0.025419235229492188, -0.023994922637939453, -0.02257061004638672, -0.021146297454833984, -0.01972198486328125, -0.018297672271728516, -0.01687335968017578, -0.015449047088623047, -0.014024734497070312, -0.012600421905517578, -0.011176109313964844, -0.00975179672241211, -0.008327484130859375, -0.006903171539306641, -0.005478858947753906, -0.004054546356201172, -0.0026302337646484375, -0.0012059211730957031, 0.00021839141845703125, 0.0016427040100097656, 0.0030670166015625, 0.004491329193115234, 0.005915641784667969, 0.007339954376220703, 0.008764266967773438, 0.010188579559326172, 0.011612892150878906, 0.01303720474243164, 0.014461517333984375, 0.01588582992553711, 0.017310142517089844, 0.018734455108642578, 0.020158767700195312, 0.021583080291748047, 0.02300739288330078, 0.024431705474853516, 0.02585601806640625, 0.027280330657958984, 0.02870464324951172, 0.030128955841064453, 0.03155326843261719, 0.03297758102416992, 0.034401893615722656, 0.03582620620727539, 0.037250518798828125, 0.03867483139038086, 0.040099143981933594, 0.04152345657348633, 0.04294776916503906, 0.0443720817565918, 0.04579639434814453, 0.047220706939697266, 0.04864501953125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 9.0, 10.0, 25.0, 38.0, 93.0, 198.0, 225.0, 194.0, 87.0, 41.0, 26.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8823747634887695, -5.711939811706543, -5.541504859924316, -5.37106990814209, -5.200634956359863, -5.030200481414795, -4.859765529632568, -4.689330577850342, -4.518895626068115, -4.348460674285889, -4.178025722503662, -4.0075907707214355, -3.837156057357788, -3.6667211055755615, -3.496286392211914, -3.3258514404296875, -3.155416488647461, -2.9849815368652344, -2.814546585083008, -2.6441118717193604, -2.473676919937134, -2.3032419681549072, -2.1328072547912598, -1.9623723030090332, -1.7919373512268066, -1.62150239944458, -1.451067566871643, -1.280632734298706, -1.1101977825164795, -0.9397628903388977, -0.7693279981613159, -0.5988931655883789, -0.42845869064331055, -0.25802379846572876, -0.08758890628814697, 0.08284598588943481, 0.2532808780670166, 0.4237157702445984, 0.5941506624221802, 0.7645854949951172, 0.9350204467773438, 1.1054553985595703, 1.2758902311325073, 1.4463250637054443, 1.616760015487671, 1.7871949672698975, 1.9576297998428345, 2.1280646324157715, 2.298499584197998, 2.4689345359802246, 2.639369487762451, 2.8098042011260986, 2.980239152908325, 3.1506741046905518, 3.321108818054199, 3.491543769836426, 3.6619787216186523, 3.832413673400879, 4.0028486251831055, 4.173283576965332, 4.343718528747559, 4.514153003692627, 4.6845879554748535, 4.85502290725708, 5.025457859039307]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 21.0, 16.0, 41.0, 49.0, 65.0, 73.0, 106.0, 103.0, 113.0, 104.0, 81.0, 59.0, 43.0, 30.0, 20.0, 13.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.253957748413086, -4.1391191482543945, -4.024280548095703, -3.909442186355591, -3.7946035861968994, -3.679764986038208, -3.5649266242980957, -3.4500880241394043, -3.335249423980713, -3.2204108238220215, -3.10557222366333, -2.9907338619232178, -2.8758952617645264, -2.761056661605835, -2.6462182998657227, -2.5313796997070312, -2.41654109954834, -2.3017024993896484, -2.186863899230957, -2.0720255374908447, -1.9571869373321533, -1.842348337173462, -1.72750985622406, -1.6126713752746582, -1.4978327751159668, -1.3829941749572754, -1.2681556940078735, -1.1533172130584717, -1.0384786128997803, -0.9236400723457336, -0.808801531791687, -0.6939629912376404, -0.5791242122650146, -0.464285671710968, -0.3494471311569214, -0.23460859060287476, -0.11977005004882812, -0.004931509494781494, 0.10990703105926514, 0.22474557161331177, 0.3395841121673584, 0.45442265272140503, 0.5692611932754517, 0.6840997338294983, 0.7989382743835449, 0.9137768149375916, 1.0286153554916382, 1.14345383644104, 1.2582924365997314, 1.3731310367584229, 1.4879695177078247, 1.6028079986572266, 1.717646598815918, 1.8324851989746094, 1.9473236799240112, 2.062162160873413, 2.1770007610321045, 2.291839361190796, 2.406677722930908, 2.5215163230895996, 2.636354923248291, 2.7511935234069824, 2.866032123565674, 2.980870485305786, 3.0957090854644775]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 13.0, 29.0, 76.0, 132.0, 358.0, 1330.0, 10804.0, 485835.0, 536622.0, 11331.0, 1404.0, 336.0, 126.0, 63.0, 30.0, 9.0, 15.0, 10.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.20391845703125, -5.9742431640625, -5.74456787109375, -5.514892578125, -5.28521728515625, -5.0555419921875, -4.82586669921875, -4.59619140625, -4.36651611328125, -4.1368408203125, -3.90716552734375, -3.677490234375, -3.44781494140625, -3.2181396484375, -2.98846435546875, -2.7587890625, -2.52911376953125, -2.2994384765625, -2.06976318359375, -1.840087890625, -1.61041259765625, -1.3807373046875, -1.15106201171875, -0.92138671875, -0.69171142578125, -0.4620361328125, -0.23236083984375, -0.002685546875, 0.22698974609375, 0.4566650390625, 0.68634033203125, 0.916015625, 1.14569091796875, 1.3753662109375, 1.60504150390625, 1.834716796875, 2.06439208984375, 2.2940673828125, 2.52374267578125, 2.75341796875, 2.98309326171875, 3.2127685546875, 3.44244384765625, 3.672119140625, 3.90179443359375, 4.1314697265625, 4.36114501953125, 4.5908203125, 4.82049560546875, 5.0501708984375, 5.27984619140625, 5.509521484375, 5.73919677734375, 5.9688720703125, 6.19854736328125, 6.42822265625, 6.65789794921875, 6.8875732421875, 7.11724853515625, 7.346923828125, 7.57659912109375, 7.8062744140625, 8.03594970703125, 8.265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 15.0, 26.0, 65.0, 124.0, 227.0, 268.0, 154.0, 64.0, 24.0, 19.0, 13.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -31.452880859375, -30.81201171875, -30.171142578125, -29.5302734375, -28.889404296875, -28.24853515625, -27.607666015625, -26.966796875, -26.325927734375, -25.68505859375, -25.044189453125, -24.4033203125, -23.762451171875, -23.12158203125, -22.480712890625, -21.83984375, -21.198974609375, -20.55810546875, -19.917236328125, -19.2763671875, -18.635498046875, -17.99462890625, -17.353759765625, -16.712890625, -16.072021484375, -15.43115234375, -14.790283203125, -14.1494140625, -13.508544921875, -12.86767578125, -12.226806640625, -11.5859375, -10.945068359375, -10.30419921875, -9.663330078125, -9.0224609375, -8.381591796875, -7.74072265625, -7.099853515625, -6.458984375, -5.818115234375, -5.17724609375, -4.536376953125, -3.8955078125, -3.254638671875, -2.61376953125, -1.972900390625, -1.33203125, -0.691162109375, -0.05029296875, 0.590576171875, 1.2314453125, 1.872314453125, 2.51318359375, 3.154052734375, 3.794921875, 4.435791015625, 5.07666015625, 5.717529296875, 6.3583984375, 6.999267578125, 7.64013671875, 8.281005859375, 8.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 6.0, 20.0, 15.0, 20.0, 29.0, 57.0, 76.0, 121.0, 225.0, 478.0, 1382.0, 6399.0, 88194.0, 879927.0, 63851.0, 5588.0, 1209.0, 431.0, 198.0, 115.0, 63.0, 45.0, 39.0, 23.0, 12.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.532470703125, -4.39697265625, -4.261474609375, -4.1259765625, -3.990478515625, -3.85498046875, -3.719482421875, -3.583984375, -3.448486328125, -3.31298828125, -3.177490234375, -3.0419921875, -2.906494140625, -2.77099609375, -2.635498046875, -2.5, -2.364501953125, -2.22900390625, -2.093505859375, -1.9580078125, -1.822509765625, -1.68701171875, -1.551513671875, -1.416015625, -1.280517578125, -1.14501953125, -1.009521484375, -0.8740234375, -0.738525390625, -0.60302734375, -0.467529296875, -0.33203125, -0.196533203125, -0.06103515625, 0.074462890625, 0.2099609375, 0.345458984375, 0.48095703125, 0.616455078125, 0.751953125, 0.887451171875, 1.02294921875, 1.158447265625, 1.2939453125, 1.429443359375, 1.56494140625, 1.700439453125, 1.8359375, 1.971435546875, 2.10693359375, 2.242431640625, 2.3779296875, 2.513427734375, 2.64892578125, 2.784423828125, 2.919921875, 3.055419921875, 3.19091796875, 3.326416015625, 3.4619140625, 3.597412109375, 3.73291015625, 3.868408203125, 4.00390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 9.0, 7.0, 16.0, 20.0, 15.0, 26.0, 26.0, 33.0, 27.0, 28.0, 40.0, 48.0, 50.0, 58.0, 47.0, 53.0, 62.0, 63.0, 47.0, 42.0, 39.0, 43.0, 35.0, 24.0, 28.0, 21.0, 13.0, 17.0, 14.0, 17.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.85546875, -7.634521484375, -7.41357421875, -7.192626953125, -6.9716796875, -6.750732421875, -6.52978515625, -6.308837890625, -6.087890625, -5.866943359375, -5.64599609375, -5.425048828125, -5.2041015625, -4.983154296875, -4.76220703125, -4.541259765625, -4.3203125, -4.099365234375, -3.87841796875, -3.657470703125, -3.4365234375, -3.215576171875, -2.99462890625, -2.773681640625, -2.552734375, -2.331787109375, -2.11083984375, -1.889892578125, -1.6689453125, -1.447998046875, -1.22705078125, -1.006103515625, -0.78515625, -0.564208984375, -0.34326171875, -0.122314453125, 0.0986328125, 0.319580078125, 0.54052734375, 0.761474609375, 0.982421875, 1.203369140625, 1.42431640625, 1.645263671875, 1.8662109375, 2.087158203125, 2.30810546875, 2.529052734375, 2.75, 2.970947265625, 3.19189453125, 3.412841796875, 3.6337890625, 3.854736328125, 4.07568359375, 4.296630859375, 4.517578125, 4.738525390625, 4.95947265625, 5.180419921875, 5.4013671875, 5.622314453125, 5.84326171875, 6.064208984375, 6.28515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 10.0, 4.0, 7.0, 7.0, 8.0, 8.0, 26.0, 41.0, 54.0, 87.0, 138.0, 252.0, 463.0, 956.0, 2028.0, 4962.0, 16019.0, 74633.0, 509867.0, 363708.0, 54674.0, 12805.0, 4212.0, 1785.0, 781.0, 395.0, 218.0, 147.0, 83.0, 53.0, 40.0, 24.0, 15.0, 7.0, 12.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8388671875, -0.8125762939453125, -0.786285400390625, -0.7599945068359375, -0.73370361328125, -0.7074127197265625, -0.681121826171875, -0.6548309326171875, -0.6285400390625, -0.6022491455078125, -0.575958251953125, -0.5496673583984375, -0.52337646484375, -0.4970855712890625, -0.470794677734375, -0.4445037841796875, -0.418212890625, -0.3919219970703125, -0.365631103515625, -0.3393402099609375, -0.31304931640625, -0.2867584228515625, -0.260467529296875, -0.2341766357421875, -0.2078857421875, -0.1815948486328125, -0.155303955078125, -0.1290130615234375, -0.10272216796875, -0.0764312744140625, -0.050140380859375, -0.0238494873046875, 0.00244140625, 0.0287322998046875, 0.055023193359375, 0.0813140869140625, 0.10760498046875, 0.1338958740234375, 0.160186767578125, 0.1864776611328125, 0.2127685546875, 0.2390594482421875, 0.265350341796875, 0.2916412353515625, 0.31793212890625, 0.3442230224609375, 0.370513916015625, 0.3968048095703125, 0.423095703125, 0.4493865966796875, 0.475677490234375, 0.5019683837890625, 0.52825927734375, 0.5545501708984375, 0.580841064453125, 0.6071319580078125, 0.6334228515625, 0.6597137451171875, 0.686004638671875, 0.7122955322265625, 0.73858642578125, 0.7648773193359375, 0.791168212890625, 0.8174591064453125, 0.84375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 18.0, 32.0, 29.0, 45.0, 70.0, 106.0, 117.0, 133.0, 114.0, 80.0, 62.0, 40.0, 36.0, 26.0, 13.0, 14.0, 17.0, 5.0, 7.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001277923583984375, -0.0001221001148223877, -0.00011640787124633789, -0.00011071562767028809, -0.00010502338409423828, -9.933114051818848e-05, -9.363889694213867e-05, -8.794665336608887e-05, -8.225440979003906e-05, -7.656216621398926e-05, -7.086992263793945e-05, -6.517767906188965e-05, -5.9485435485839844e-05, -5.379319190979004e-05, -4.8100948333740234e-05, -4.240870475769043e-05, -3.6716461181640625e-05, -3.102421760559082e-05, -2.5331974029541016e-05, -1.963973045349121e-05, -1.3947486877441406e-05, -8.255243301391602e-06, -2.562999725341797e-06, 3.129243850708008e-06, 8.821487426757812e-06, 1.4513731002807617e-05, 2.0205974578857422e-05, 2.5898218154907227e-05, 3.159046173095703e-05, 3.7282705307006836e-05, 4.297494888305664e-05, 4.8667192459106445e-05, 5.435943603515625e-05, 6.0051679611206055e-05, 6.574392318725586e-05, 7.143616676330566e-05, 7.712841033935547e-05, 8.282065391540527e-05, 8.851289749145508e-05, 9.420514106750488e-05, 9.989738464355469e-05, 0.00010558962821960449, 0.0001112818717956543, 0.0001169741153717041, 0.0001226663589477539, 0.0001283586025238037, 0.00013405084609985352, 0.00013974308967590332, 0.00014543533325195312, 0.00015112757682800293, 0.00015681982040405273, 0.00016251206398010254, 0.00016820430755615234, 0.00017389655113220215, 0.00017958879470825195, 0.00018528103828430176, 0.00019097328186035156, 0.00019666552543640137, 0.00020235776901245117, 0.00020805001258850098, 0.00021374225616455078, 0.00021943449974060059, 0.0002251267433166504, 0.0002308189868927002, 0.00023651123046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 8.0, 17.0, 20.0, 43.0, 73.0, 178.0, 339.0, 1100.0, 5205.0, 61074.0, 898416.0, 74366.0, 5804.0, 1194.0, 394.0, 137.0, 96.0, 36.0, 22.0, 11.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4159088134765625, -1.358184814453125, -1.3004608154296875, -1.24273681640625, -1.1850128173828125, -1.127288818359375, -1.0695648193359375, -1.0118408203125, -0.9541168212890625, -0.896392822265625, -0.8386688232421875, -0.78094482421875, -0.7232208251953125, -0.665496826171875, -0.6077728271484375, -0.550048828125, -0.4923248291015625, -0.434600830078125, -0.3768768310546875, -0.31915283203125, -0.2614288330078125, -0.203704833984375, -0.1459808349609375, -0.0882568359375, -0.0305328369140625, 0.027191162109375, 0.0849151611328125, 0.14263916015625, 0.2003631591796875, 0.258087158203125, 0.3158111572265625, 0.37353515625, 0.4312591552734375, 0.488983154296875, 0.5467071533203125, 0.60443115234375, 0.6621551513671875, 0.719879150390625, 0.7776031494140625, 0.8353271484375, 0.8930511474609375, 0.950775146484375, 1.0084991455078125, 1.06622314453125, 1.1239471435546875, 1.181671142578125, 1.2393951416015625, 1.297119140625, 1.3548431396484375, 1.412567138671875, 1.4702911376953125, 1.52801513671875, 1.5857391357421875, 1.643463134765625, 1.7011871337890625, 1.7589111328125, 1.8166351318359375, 1.874359130859375, 1.9320831298828125, 1.98980712890625, 2.0475311279296875, 2.105255126953125, 2.1629791259765625, 2.220703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 16.0, 12.0, 15.0, 30.0, 30.0, 29.0, 50.0, 72.0, 65.0, 101.0, 114.0, 108.0, 87.0, 54.0, 51.0, 41.0, 34.0, 15.0, 13.0, 16.0, 9.0, 3.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5504837036132812, -0.5335845947265625, -0.5166854858398438, -0.499786376953125, -0.48288726806640625, -0.4659881591796875, -0.44908905029296875, -0.43218994140625, -0.41529083251953125, -0.3983917236328125, -0.38149261474609375, -0.364593505859375, -0.34769439697265625, -0.3307952880859375, -0.31389617919921875, -0.2969970703125, -0.28009796142578125, -0.2631988525390625, -0.24629974365234375, -0.229400634765625, -0.21250152587890625, -0.1956024169921875, -0.17870330810546875, -0.16180419921875, -0.14490509033203125, -0.1280059814453125, -0.11110687255859375, -0.094207763671875, -0.07730865478515625, -0.0604095458984375, -0.04351043701171875, -0.026611328125, -0.00971221923828125, 0.0071868896484375, 0.02408599853515625, 0.040985107421875, 0.05788421630859375, 0.0747833251953125, 0.09168243408203125, 0.10858154296875, 0.12548065185546875, 0.1423797607421875, 0.15927886962890625, 0.176177978515625, 0.19307708740234375, 0.2099761962890625, 0.22687530517578125, 0.2437744140625, 0.26067352294921875, 0.2775726318359375, 0.29447174072265625, 0.311370849609375, 0.32826995849609375, 0.3451690673828125, 0.36206817626953125, 0.37896728515625, 0.39586639404296875, 0.4127655029296875, 0.42966461181640625, 0.446563720703125, 0.46346282958984375, 0.4803619384765625, 0.49726104736328125, 0.51416015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 7.0, 7.0, 14.0, 97.0, 538.0, 282.0, 45.0, 11.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.893657684326172, -27.88878631591797, -26.883914947509766, -25.879043579101562, -24.874170303344727, -23.869298934936523, -22.86442756652832, -21.859556198120117, -20.85468292236328, -19.849811553955078, -18.844940185546875, -17.840068817138672, -16.835195541381836, -15.830324172973633, -14.82545280456543, -13.820581436157227, -12.815710067749023, -11.81083869934082, -10.8059663772583, -9.801095008850098, -8.796222686767578, -7.791351318359375, -6.786479949951172, -5.7816081047058105, -4.776736259460449, -3.771864414215088, -2.7669928073883057, -1.7621212005615234, -0.7572493553161621, 0.24762248992919922, 1.2524938583374023, 2.2573657035827637, 3.262237548828125, 4.267109394073486, 5.271981239318848, 6.276852607727051, 7.281724452972412, 8.286596298217773, 9.291467666625977, 10.29633903503418, 11.3012113571167, 12.306082725524902, 13.310955047607422, 14.315826416015625, 15.320697784423828, 16.32556915283203, 17.330440521240234, 18.33531379699707, 19.340185165405273, 20.345056533813477, 21.34992790222168, 22.354801177978516, 23.35967254638672, 24.364543914794922, 25.369415283203125, 26.374286651611328, 27.37915802001953, 28.384029388427734, 29.388900756835938, 30.39377212524414, 31.398645401000977, 32.40351867675781, 33.40838623046875, 34.41326141357422, 35.41813278198242]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 14.0, 14.0, 15.0, 12.0, 19.0, 33.0, 30.0, 32.0, 55.0, 56.0, 53.0, 67.0, 66.0, 75.0, 57.0, 53.0, 43.0, 65.0, 54.0, 38.0, 38.0, 33.0, 20.0, 22.0, 6.0, 10.0, 12.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.108684539794922, -24.528242111206055, -23.94780158996582, -23.367359161376953, -22.786916732788086, -22.20647621154785, -21.626033782958984, -21.04559326171875, -20.465150833129883, -19.884708404541016, -19.30426788330078, -18.723825454711914, -18.143383026123047, -17.562942504882812, -16.982500076293945, -16.402057647705078, -15.821616172790527, -15.241174697875977, -14.66073226928711, -14.080290794372559, -13.499849319458008, -12.91940689086914, -12.33896541595459, -11.758523941040039, -11.178081512451172, -10.597640037536621, -10.017197608947754, -9.436756134033203, -8.856314659118652, -8.275873184204102, -7.695430755615234, -7.114989280700684, -6.534546852111816, -5.954104900360107, -5.373663425445557, -4.793221473693848, -4.212779998779297, -3.632338047027588, -3.051896095275879, -2.471454620361328, -1.8910126686096191, -1.3105709552764893, -0.7301291227340698, -0.1496872901916504, 0.4307544231414795, 1.0111961364746094, 1.5916380882263184, 2.172079563140869, 2.752521514892578, 3.332963228225708, 3.913404941558838, 4.493846893310547, 5.074288368225098, 5.654730319976807, 6.235172271728516, 6.815613746643066, 7.396055698394775, 7.976497650146484, 8.556939125061035, 9.137380599975586, 9.717823028564453, 10.298264503479004, 10.878705978393555, 11.459148406982422, 12.039589881896973]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 12.0, 16.0, 25.0, 48.0, 55.0, 107.0, 152.0, 259.0, 414.0, 780.0, 1636.0, 3916.0, 11351.0, 49052.0, 527904.0, 3406231.0, 154264.0, 25441.0, 7275.0, 2654.0, 1181.0, 580.0, 355.0, 190.0, 134.0, 87.0, 52.0, 29.0, 23.0, 14.0, 9.0, 8.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.8671875, -3.73046875, -3.59375, -3.45703125, -3.3203125, -3.18359375, -3.046875, -2.91015625, -2.7734375, -2.63671875, -2.5, -2.36328125, -2.2265625, -2.08984375, -1.953125, -1.81640625, -1.6796875, -1.54296875, -1.40625, -1.26953125, -1.1328125, -0.99609375, -0.859375, -0.72265625, -0.5859375, -0.44921875, -0.3125, -0.17578125, -0.0390625, 0.09765625, 0.234375, 0.37109375, 0.5078125, 0.64453125, 0.78125, 0.91796875, 1.0546875, 1.19140625, 1.328125, 1.46484375, 1.6015625, 1.73828125, 1.875, 2.01171875, 2.1484375, 2.28515625, 2.421875, 2.55859375, 2.6953125, 2.83203125, 2.96875, 3.10546875, 3.2421875, 3.37890625, 3.515625, 3.65234375, 3.7890625, 3.92578125, 4.0625, 4.19921875, 4.3359375, 4.47265625, 4.609375, 4.74609375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 7.0, 4.0, 12.0, 13.0, 37.0, 36.0, 43.0, 65.0, 75.0, 102.0, 106.0, 88.0, 97.0, 80.0, 57.0, 49.0, 31.0, 29.0, 15.0, 13.0, 10.0, 12.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.5877685546875, -4.456787109375, -4.3258056640625, -4.19482421875, -4.0638427734375, -3.932861328125, -3.8018798828125, -3.6708984375, -3.5399169921875, -3.408935546875, -3.2779541015625, -3.14697265625, -3.0159912109375, -2.885009765625, -2.7540283203125, -2.623046875, -2.4920654296875, -2.361083984375, -2.2301025390625, -2.09912109375, -1.9681396484375, -1.837158203125, -1.7061767578125, -1.5751953125, -1.4442138671875, -1.313232421875, -1.1822509765625, -1.05126953125, -0.9202880859375, -0.789306640625, -0.6583251953125, -0.52734375, -0.3963623046875, -0.265380859375, -0.1343994140625, -0.00341796875, 0.1275634765625, 0.258544921875, 0.3895263671875, 0.5205078125, 0.6514892578125, 0.782470703125, 0.9134521484375, 1.04443359375, 1.1754150390625, 1.306396484375, 1.4373779296875, 1.568359375, 1.6993408203125, 1.830322265625, 1.9613037109375, 2.09228515625, 2.2232666015625, 2.354248046875, 2.4852294921875, 2.6162109375, 2.7471923828125, 2.878173828125, 3.0091552734375, 3.14013671875, 3.2711181640625, 3.402099609375, 3.5330810546875, 3.6640625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 13.0, 16.0, 37.0, 54.0, 66.0, 96.0, 153.0, 299.0, 567.0, 1217.0, 3369.0, 13185.0, 89821.0, 3569648.0, 472981.0, 32055.0, 6722.0, 2136.0, 842.0, 349.0, 235.0, 119.0, 68.0, 51.0, 35.0, 22.0, 23.0, 15.0, 12.0, 13.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.79437255859375, -4.6434326171875, -4.49249267578125, -4.341552734375, -4.19061279296875, -4.0396728515625, -3.88873291015625, -3.73779296875, -3.58685302734375, -3.4359130859375, -3.28497314453125, -3.134033203125, -2.98309326171875, -2.8321533203125, -2.68121337890625, -2.5302734375, -2.37933349609375, -2.2283935546875, -2.07745361328125, -1.926513671875, -1.77557373046875, -1.6246337890625, -1.47369384765625, -1.32275390625, -1.17181396484375, -1.0208740234375, -0.86993408203125, -0.718994140625, -0.56805419921875, -0.4171142578125, -0.26617431640625, -0.115234375, 0.03570556640625, 0.1866455078125, 0.33758544921875, 0.488525390625, 0.63946533203125, 0.7904052734375, 0.94134521484375, 1.09228515625, 1.24322509765625, 1.3941650390625, 1.54510498046875, 1.696044921875, 1.84698486328125, 1.9979248046875, 2.14886474609375, 2.2998046875, 2.45074462890625, 2.6016845703125, 2.75262451171875, 2.903564453125, 3.05450439453125, 3.2054443359375, 3.35638427734375, 3.50732421875, 3.65826416015625, 3.8092041015625, 3.96014404296875, 4.111083984375, 4.26202392578125, 4.4129638671875, 4.56390380859375, 4.71484375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 8.0, 11.0, 13.0, 15.0, 16.0, 20.0, 44.0, 56.0, 63.0, 77.0, 114.0, 154.0, 216.0, 405.0, 710.0, 808.0, 415.0, 239.0, 140.0, 147.0, 89.0, 77.0, 53.0, 40.0, 36.0, 26.0, 11.0, 13.0, 9.0, 9.0, 7.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.73974609375, -0.7159500122070312, -0.6921539306640625, -0.6683578491210938, -0.644561767578125, -0.6207656860351562, -0.5969696044921875, -0.5731735229492188, -0.54937744140625, -0.5255813598632812, -0.5017852783203125, -0.47798919677734375, -0.454193115234375, -0.43039703369140625, -0.4066009521484375, -0.38280487060546875, -0.3590087890625, -0.33521270751953125, -0.3114166259765625, -0.28762054443359375, -0.263824462890625, -0.24002838134765625, -0.2162322998046875, -0.19243621826171875, -0.16864013671875, -0.14484405517578125, -0.1210479736328125, -0.09725189208984375, -0.073455810546875, -0.04965972900390625, -0.0258636474609375, -0.00206756591796875, 0.021728515625, 0.04552459716796875, 0.0693206787109375, 0.09311676025390625, 0.116912841796875, 0.14070892333984375, 0.1645050048828125, 0.18830108642578125, 0.21209716796875, 0.23589324951171875, 0.2596893310546875, 0.28348541259765625, 0.307281494140625, 0.33107757568359375, 0.3548736572265625, 0.37866973876953125, 0.4024658203125, 0.42626190185546875, 0.4500579833984375, 0.47385406494140625, 0.497650146484375, 0.5214462280273438, 0.5452423095703125, 0.5690383911132812, 0.59283447265625, 0.6166305541992188, 0.6404266357421875, 0.6642227172851562, 0.688018798828125, 0.7118148803710938, 0.7356109619140625, 0.7594070434570312, 0.783203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 9.0, 5.0, 13.0, 16.0, 14.0, 50.0, 53.0, 134.0, 145.0, 202.0, 147.0, 82.0, 49.0, 24.0, 11.0, 11.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.659629821777344, -5.472128391265869, -5.2846269607543945, -5.09712553024292, -4.909624099731445, -4.722122669219971, -4.534621238708496, -4.34712028503418, -4.159618377685547, -3.9721169471740723, -3.7846155166625977, -3.597114086151123, -3.4096126556396484, -3.222111225128174, -3.0346100330352783, -2.8471086025238037, -2.659607410430908, -2.4721059799194336, -2.284604549407959, -2.0971031188964844, -1.9096018075942993, -1.7221003770828247, -1.5345990657806396, -1.347097635269165, -1.1595962047576904, -0.9720947742462158, -0.784593403339386, -0.5970920324325562, -0.40959060192108154, -0.22208917140960693, -0.034587860107421875, 0.15291357040405273, 0.34041452407836914, 0.5279159545898438, 0.7154173254966736, 0.9029186964035034, 1.090420126914978, 1.2779215574264526, 1.4654228687286377, 1.6529242992401123, 1.840425729751587, 2.0279271602630615, 2.215428590774536, 2.4029297828674316, 2.5904312133789062, 2.777932643890381, 2.9654340744018555, 3.15293550491333, 3.3404369354248047, 3.5279383659362793, 3.715439796447754, 3.9029412269592285, 4.090442657470703, 4.277944087982178, 4.465445518493652, 4.652946472167969, 4.840448379516602, 5.027949810028076, 5.215451240539551, 5.402952671051025, 5.5904541015625, 5.777955532073975, 5.965456962585449, 6.152957916259766, 6.34045934677124]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 8.0, 8.0, 16.0, 14.0, 29.0, 22.0, 26.0, 49.0, 62.0, 61.0, 71.0, 78.0, 61.0, 62.0, 74.0, 80.0, 45.0, 49.0, 44.0, 26.0, 23.0, 23.0, 14.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03287935256958, -3.9171664714813232, -3.8014535903930664, -3.6857404708862305, -3.5700275897979736, -3.454314708709717, -3.33860182762146, -3.222888946533203, -3.1071760654449463, -2.9914631843566895, -2.8757503032684326, -2.760037422180176, -2.64432430267334, -2.528611421585083, -2.412898540496826, -2.2971856594085693, -2.1814727783203125, -2.0657598972320557, -1.9500468969345093, -1.8343340158462524, -1.7186211347579956, -1.6029081344604492, -1.4871952533721924, -1.3714823722839355, -1.2557692527770996, -1.1400563716888428, -1.0243433713912964, -0.9086304903030396, -0.7929176092147827, -0.6772046685218811, -0.5614917278289795, -0.44577884674072266, -0.3300659656524658, -0.2143530547618866, -0.09864012897014618, 0.01707279682159424, 0.13278570771217346, 0.24849861860275269, 0.3642115592956543, 0.47992444038391113, 0.5956373810768127, 0.7113503217697144, 0.8270632028579712, 0.9427761435508728, 1.0584890842437744, 1.1742019653320312, 1.289914846420288, 1.405627727508545, 1.5213407278060913, 1.6370536088943481, 1.7527666091918945, 1.8684794902801514, 1.9841923713684082, 2.099905252456665, 2.215618133544922, 2.331331253051758, 2.4470441341400146, 2.5627570152282715, 2.6784698963165283, 2.794182777404785, 2.909895896911621, 3.025608777999878, 3.1413216590881348, 3.2570345401763916, 3.3727474212646484]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 1.0, 7.0, 6.0, 14.0, 12.0, 14.0, 31.0, 43.0, 68.0, 131.0, 249.0, 564.0, 1545.0, 5964.0, 38001.0, 672701.0, 302556.0, 20716.0, 3851.0, 1173.0, 425.0, 180.0, 109.0, 63.0, 39.0, 23.0, 19.0, 10.0, 10.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.465087890625, -0.4504890441894531, -0.43589019775390625, -0.4212913513183594, -0.4066925048828125, -0.3920936584472656, -0.37749481201171875, -0.3628959655761719, -0.348297119140625, -0.3336982727050781, -0.31909942626953125, -0.3045005798339844, -0.2899017333984375, -0.2753028869628906, -0.26070404052734375, -0.24610519409179688, -0.23150634765625, -0.21690750122070312, -0.20230865478515625, -0.18770980834960938, -0.1731109619140625, -0.15851211547851562, -0.14391326904296875, -0.12931442260742188, -0.114715576171875, -0.10011672973632812, -0.08551788330078125, -0.07091903686523438, -0.0563201904296875, -0.041721343994140625, -0.02712249755859375, -0.012523651123046875, 0.0020751953125, 0.016674041748046875, 0.03127288818359375, 0.045871734619140625, 0.0604705810546875, 0.07506942749023438, 0.08966827392578125, 0.10426712036132812, 0.118865966796875, 0.13346481323242188, 0.14806365966796875, 0.16266250610351562, 0.1772613525390625, 0.19186019897460938, 0.20645904541015625, 0.22105789184570312, 0.23565673828125, 0.2502555847167969, 0.26485443115234375, 0.2794532775878906, 0.2940521240234375, 0.3086509704589844, 0.32324981689453125, 0.3378486633300781, 0.352447509765625, 0.3670463562011719, 0.38164520263671875, 0.3962440490722656, 0.4108428955078125, 0.4254417419433594, 0.44004058837890625, 0.4546394348144531, 0.46923828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 6.0, 13.0, 10.0, 11.0, 27.0, 19.0, 25.0, 55.0, 40.0, 78.0, 100.0, 82.0, 88.0, 83.0, 67.0, 70.0, 46.0, 42.0, 26.0, 29.0, 20.0, 17.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.953125, -2.866912841796875, -2.78070068359375, -2.694488525390625, -2.6082763671875, -2.522064208984375, -2.43585205078125, -2.349639892578125, -2.263427734375, -2.177215576171875, -2.09100341796875, -2.004791259765625, -1.9185791015625, -1.832366943359375, -1.74615478515625, -1.659942626953125, -1.57373046875, -1.487518310546875, -1.40130615234375, -1.315093994140625, -1.2288818359375, -1.142669677734375, -1.05645751953125, -0.970245361328125, -0.884033203125, -0.797821044921875, -0.71160888671875, -0.625396728515625, -0.5391845703125, -0.452972412109375, -0.36676025390625, -0.280548095703125, -0.1943359375, -0.108123779296875, -0.02191162109375, 0.064300537109375, 0.1505126953125, 0.236724853515625, 0.32293701171875, 0.409149169921875, 0.495361328125, 0.581573486328125, 0.66778564453125, 0.753997802734375, 0.8402099609375, 0.926422119140625, 1.01263427734375, 1.098846435546875, 1.18505859375, 1.271270751953125, 1.35748291015625, 1.443695068359375, 1.5299072265625, 1.616119384765625, 1.70233154296875, 1.788543701171875, 1.874755859375, 1.960968017578125, 2.04718017578125, 2.133392333984375, 2.2196044921875, 2.305816650390625, 2.39202880859375, 2.478240966796875, 2.564453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 8.0, 9.0, 12.0, 13.0, 23.0, 38.0, 45.0, 94.0, 87.0, 128.0, 193.0, 303.0, 476.0, 1192.0, 5836.0, 72054.0, 799457.0, 154916.0, 10416.0, 1578.0, 590.0, 327.0, 224.0, 136.0, 93.0, 79.0, 54.0, 45.0, 25.0, 18.0, 15.0, 8.0, 13.0, 10.0, 10.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3585357666015625, -0.347198486328125, -0.3358612060546875, -0.32452392578125, -0.3131866455078125, -0.301849365234375, -0.2905120849609375, -0.2791748046875, -0.2678375244140625, -0.256500244140625, -0.2451629638671875, -0.23382568359375, -0.2224884033203125, -0.211151123046875, -0.1998138427734375, -0.1884765625, -0.1771392822265625, -0.165802001953125, -0.1544647216796875, -0.14312744140625, -0.1317901611328125, -0.120452880859375, -0.1091156005859375, -0.0977783203125, -0.0864410400390625, -0.075103759765625, -0.0637664794921875, -0.05242919921875, -0.0410919189453125, -0.029754638671875, -0.0184173583984375, -0.007080078125, 0.0042572021484375, 0.015594482421875, 0.0269317626953125, 0.03826904296875, 0.0496063232421875, 0.060943603515625, 0.0722808837890625, 0.0836181640625, 0.0949554443359375, 0.106292724609375, 0.1176300048828125, 0.12896728515625, 0.1403045654296875, 0.151641845703125, 0.1629791259765625, 0.17431640625, 0.1856536865234375, 0.196990966796875, 0.2083282470703125, 0.21966552734375, 0.2310028076171875, 0.242340087890625, 0.2536773681640625, 0.2650146484375, 0.2763519287109375, 0.287689208984375, 0.2990264892578125, 0.31036376953125, 0.3217010498046875, 0.333038330078125, 0.3443756103515625, 0.355712890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 3.0, 11.0, 7.0, 13.0, 18.0, 27.0, 28.0, 33.0, 40.0, 57.0, 42.0, 50.0, 46.0, 67.0, 61.0, 51.0, 67.0, 57.0, 51.0, 33.0, 29.0, 32.0, 29.0, 30.0, 20.0, 17.0, 13.0, 12.0, 8.0, 6.0, 13.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74017333984375, -3.6053466796875, -3.47052001953125, -3.335693359375, -3.20086669921875, -3.0660400390625, -2.93121337890625, -2.79638671875, -2.66156005859375, -2.5267333984375, -2.39190673828125, -2.257080078125, -2.12225341796875, -1.9874267578125, -1.85260009765625, -1.7177734375, -1.58294677734375, -1.4481201171875, -1.31329345703125, -1.178466796875, -1.04364013671875, -0.9088134765625, -0.77398681640625, -0.63916015625, -0.50433349609375, -0.3695068359375, -0.23468017578125, -0.099853515625, 0.03497314453125, 0.1697998046875, 0.30462646484375, 0.439453125, 0.57427978515625, 0.7091064453125, 0.84393310546875, 0.978759765625, 1.11358642578125, 1.2484130859375, 1.38323974609375, 1.51806640625, 1.65289306640625, 1.7877197265625, 1.92254638671875, 2.057373046875, 2.19219970703125, 2.3270263671875, 2.46185302734375, 2.5966796875, 2.73150634765625, 2.8663330078125, 3.00115966796875, 3.135986328125, 3.27081298828125, 3.4056396484375, 3.54046630859375, 3.67529296875, 3.81011962890625, 3.9449462890625, 4.07977294921875, 4.214599609375, 4.34942626953125, 4.4842529296875, 4.61907958984375, 4.75390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 5.0, 7.0, 15.0, 13.0, 11.0, 22.0, 30.0, 37.0, 54.0, 49.0, 80.0, 105.0, 108.0, 173.0, 232.0, 317.0, 544.0, 1263.0, 6010.0, 87056.0, 913626.0, 32732.0, 3480.0, 933.0, 466.0, 314.0, 213.0, 159.0, 104.0, 81.0, 64.0, 40.0, 45.0, 29.0, 25.0, 31.0, 14.0, 15.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.06903076171875, -0.06702136993408203, -0.06501197814941406, -0.0630025863647461, -0.060993194580078125, -0.058983802795410156, -0.05697441101074219, -0.05496501922607422, -0.05295562744140625, -0.05094623565673828, -0.04893684387207031, -0.046927452087402344, -0.044918060302734375, -0.042908668518066406, -0.04089927673339844, -0.03888988494873047, -0.0368804931640625, -0.03487110137939453, -0.03286170959472656, -0.030852317810058594, -0.028842926025390625, -0.026833534240722656, -0.024824142456054688, -0.02281475067138672, -0.02080535888671875, -0.01879596710205078, -0.016786575317382812, -0.014777183532714844, -0.012767791748046875, -0.010758399963378906, -0.008749008178710938, -0.006739616394042969, -0.004730224609375, -0.0027208328247070312, -0.0007114410400390625, 0.0012979507446289062, 0.003307342529296875, 0.005316734313964844, 0.0073261260986328125, 0.009335517883300781, 0.01134490966796875, 0.013354301452636719, 0.015363693237304688, 0.017373085021972656, 0.019382476806640625, 0.021391868591308594, 0.023401260375976562, 0.02541065216064453, 0.0274200439453125, 0.02942943572998047, 0.03143882751464844, 0.033448219299316406, 0.035457611083984375, 0.037467002868652344, 0.03947639465332031, 0.04148578643798828, 0.04349517822265625, 0.04550457000732422, 0.04751396179199219, 0.049523353576660156, 0.051532745361328125, 0.053542137145996094, 0.05555152893066406, 0.05756092071533203, 0.0595703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 16.0, 14.0, 18.0, 28.0, 49.0, 59.0, 113.0, 115.0, 114.0, 126.0, 88.0, 68.0, 40.0, 26.0, 28.0, 15.0, 12.0, 17.0, 9.0, 9.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0159950256347656e-05, -2.9262155294418335e-05, -2.8364360332489014e-05, -2.7466565370559692e-05, -2.656877040863037e-05, -2.567097544670105e-05, -2.477318048477173e-05, -2.3875385522842407e-05, -2.2977590560913086e-05, -2.2079795598983765e-05, -2.1182000637054443e-05, -2.0284205675125122e-05, -1.93864107131958e-05, -1.848861575126648e-05, -1.7590820789337158e-05, -1.6693025827407837e-05, -1.5795230865478516e-05, -1.4897435903549194e-05, -1.3999640941619873e-05, -1.3101845979690552e-05, -1.220405101776123e-05, -1.130625605583191e-05, -1.0408461093902588e-05, -9.510666131973267e-06, -8.612871170043945e-06, -7.715076208114624e-06, -6.817281246185303e-06, -5.9194862842559814e-06, -5.02169132232666e-06, -4.123896360397339e-06, -3.2261013984680176e-06, -2.3283064365386963e-06, -1.430511474609375e-06, -5.327165126800537e-07, 3.650784492492676e-07, 1.2628734111785889e-06, 2.16066837310791e-06, 3.0584633350372314e-06, 3.956258296966553e-06, 4.854053258895874e-06, 5.751848220825195e-06, 6.649643182754517e-06, 7.547438144683838e-06, 8.44523310661316e-06, 9.34302806854248e-06, 1.0240823030471802e-05, 1.1138617992401123e-05, 1.2036412954330444e-05, 1.2934207916259766e-05, 1.3832002878189087e-05, 1.4729797840118408e-05, 1.562759280204773e-05, 1.652538776397705e-05, 1.7423182725906372e-05, 1.8320977687835693e-05, 1.9218772649765015e-05, 2.0116567611694336e-05, 2.1014362573623657e-05, 2.191215753555298e-05, 2.28099524974823e-05, 2.370774745941162e-05, 2.4605542421340942e-05, 2.5503337383270264e-05, 2.6401132345199585e-05, 2.7298927307128906e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 18.0, 10.0, 18.0, 44.0, 46.0, 70.0, 105.0, 202.0, 299.0, 593.0, 1243.0, 2918.0, 9477.0, 52007.0, 842430.0, 116637.0, 14824.0, 4207.0, 1668.0, 711.0, 400.0, 227.0, 122.0, 68.0, 49.0, 33.0, 18.0, 16.0, 16.0, 12.0, 2.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10235595703125, -0.09931468963623047, -0.09627342224121094, -0.0932321548461914, -0.09019088745117188, -0.08714962005615234, -0.08410835266113281, -0.08106708526611328, -0.07802581787109375, -0.07498455047607422, -0.07194328308105469, -0.06890201568603516, -0.06586074829101562, -0.0628194808959961, -0.05977821350097656, -0.05673694610595703, -0.0536956787109375, -0.05065441131591797, -0.04761314392089844, -0.044571876525878906, -0.041530609130859375, -0.038489341735839844, -0.03544807434082031, -0.03240680694580078, -0.02936553955078125, -0.02632427215576172, -0.023283004760742188, -0.020241737365722656, -0.017200469970703125, -0.014159202575683594, -0.011117935180664062, -0.008076667785644531, -0.005035400390625, -0.0019941329956054688, 0.0010471343994140625, 0.004088401794433594, 0.007129669189453125, 0.010170936584472656, 0.013212203979492188, 0.01625347137451172, 0.01929473876953125, 0.02233600616455078, 0.025377273559570312, 0.028418540954589844, 0.031459808349609375, 0.034501075744628906, 0.03754234313964844, 0.04058361053466797, 0.0436248779296875, 0.04666614532470703, 0.04970741271972656, 0.052748680114746094, 0.055789947509765625, 0.058831214904785156, 0.06187248229980469, 0.06491374969482422, 0.06795501708984375, 0.07099628448486328, 0.07403755187988281, 0.07707881927490234, 0.08012008666992188, 0.0831613540649414, 0.08620262145996094, 0.08924388885498047, 0.09228515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 7.0, 2.0, 5.0, 6.0, 15.0, 16.0, 30.0, 40.0, 63.0, 102.0, 197.0, 190.0, 83.0, 68.0, 35.0, 28.0, 21.0, 14.0, 8.0, 6.0, 11.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019195556640625, -0.018575668334960938, -0.017955780029296875, -0.017335891723632812, -0.01671600341796875, -0.016096115112304688, -0.015476226806640625, -0.014856338500976562, -0.0142364501953125, -0.013616561889648438, -0.012996673583984375, -0.012376785278320312, -0.01175689697265625, -0.011137008666992188, -0.010517120361328125, -0.009897232055664062, -0.00927734375, -0.008657455444335938, -0.008037567138671875, -0.0074176788330078125, -0.00679779052734375, -0.0061779022216796875, -0.005558013916015625, -0.0049381256103515625, -0.0043182373046875, -0.0036983489990234375, -0.003078460693359375, -0.0024585723876953125, -0.00183868408203125, -0.0012187957763671875, -0.000598907470703125, 2.09808349609375e-05, 0.000640869140625, 0.0012607574462890625, 0.001880645751953125, 0.0025005340576171875, 0.00312042236328125, 0.0037403106689453125, 0.004360198974609375, 0.0049800872802734375, 0.0055999755859375, 0.0062198638916015625, 0.006839752197265625, 0.0074596405029296875, 0.00807952880859375, 0.008699417114257812, 0.009319305419921875, 0.009939193725585938, 0.01055908203125, 0.011178970336914062, 0.011798858642578125, 0.012418746948242188, 0.01303863525390625, 0.013658523559570312, 0.014278411865234375, 0.014898300170898438, 0.0155181884765625, 0.016138076782226562, 0.016757965087890625, 0.017377853393554688, 0.01799774169921875, 0.018617630004882812, 0.019237518310546875, 0.019857406616210938, 0.020477294921875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 12.0, 21.0, 32.0, 84.0, 188.0, 278.0, 196.0, 84.0, 30.0, 21.0, 15.0, 4.0, 9.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39328145980835, -5.222194671630859, -5.051107406616211, -4.880020618438721, -4.7089338302612305, -4.537846565246582, -4.366759777069092, -4.195672988891602, -4.024585723876953, -3.853498697280884, -3.6824119091033936, -3.511324882507324, -3.340238094329834, -3.1691510677337646, -2.9980640411376953, -2.826977252960205, -2.655890464782715, -2.4848034381866455, -2.3137166500091553, -2.142629623413086, -1.9715427160263062, -1.8004558086395264, -1.629368782043457, -1.4582818746566772, -1.2871949672698975, -1.1161080598831177, -0.9450210928916931, -0.7739341259002686, -0.6028472185134888, -0.431760311126709, -0.26067328453063965, -0.08958637714385986, 0.08150053024291992, 0.2525874674320221, 0.42367440462112427, 0.5947613716125488, 0.7658482789993286, 0.9369351863861084, 1.1080222129821777, 1.2791091203689575, 1.4501960277557373, 1.621282935142517, 1.7923698425292969, 1.9634568691253662, 2.1345438957214355, 2.305630683898926, 2.476717710494995, 2.6478047370910645, 2.8188915252685547, 2.989978551864624, 3.1610653400421143, 3.3321523666381836, 3.503239154815674, 3.674326181411743, 3.8454132080078125, 4.016499996185303, 4.187586784362793, 4.358673572540283, 4.529760837554932, 4.700847625732422, 4.871934413909912, 5.043021202087402, 5.214108467102051, 5.385195255279541, 5.5562825202941895]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 8.0, 8.0, 6.0, 10.0, 12.0, 16.0, 19.0, 29.0, 37.0, 61.0, 69.0, 82.0, 75.0, 85.0, 86.0, 81.0, 65.0, 53.0, 49.0, 41.0, 29.0, 20.0, 17.0, 13.0, 1.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0085010528564453, -2.9245901107788086, -2.840679168701172, -2.756768226623535, -2.6728570461273193, -2.5889461040496826, -2.505035161972046, -2.421124219894409, -2.3372130393981934, -2.2533020973205566, -2.16939115524292, -2.085480213165283, -2.0015690326690674, -1.9176580905914307, -1.833747148513794, -1.7498362064361572, -1.6659252643585205, -1.5820143222808838, -1.4981032609939575, -1.4141923189163208, -1.3302812576293945, -1.2463703155517578, -1.162459373474121, -1.0785484313964844, -0.9946373701095581, -0.9107263684272766, -0.8268153667449951, -0.7429044246673584, -0.6589934229850769, -0.5750824213027954, -0.4911714792251587, -0.4072604775428772, -0.3233497142791748, -0.2394387274980545, -0.1555277407169342, -0.0716167688369751, 0.012294232845306396, 0.09620523452758789, 0.1801161766052246, 0.2640271782875061, 0.3479381799697876, 0.4318491816520691, 0.5157601833343506, 0.5996711254119873, 0.6835821270942688, 0.7674931287765503, 0.851404070854187, 0.9353150725364685, 1.01922607421875, 1.1031370162963867, 1.187048077583313, 1.2709590196609497, 1.354870080947876, 1.4387810230255127, 1.5226919651031494, 1.6066029071807861, 1.6905139684677124, 1.7744249105453491, 1.8583359718322754, 1.942246913909912, 2.026157855987549, 2.1100687980651855, 2.1939797401428223, 2.277890920639038, 2.361801862716675]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 23.0, 30.0, 36.0, 60.0, 98.0, 186.0, 322.0, 634.0, 1214.0, 2691.0, 6309.0, 17786.0, 62386.0, 297788.0, 501380.0, 112246.0, 28527.0, 9716.0, 3689.0, 1611.0, 813.0, 417.0, 245.0, 121.0, 80.0, 41.0, 37.0, 17.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.6116485595703125, -1.552398681640625, -1.4931488037109375, -1.43389892578125, -1.3746490478515625, -1.315399169921875, -1.2561492919921875, -1.1968994140625, -1.1376495361328125, -1.078399658203125, -1.0191497802734375, -0.95989990234375, -0.9006500244140625, -0.841400146484375, -0.7821502685546875, -0.722900390625, -0.6636505126953125, -0.604400634765625, -0.5451507568359375, -0.48590087890625, -0.4266510009765625, -0.367401123046875, -0.3081512451171875, -0.2489013671875, -0.1896514892578125, -0.130401611328125, -0.0711517333984375, -0.01190185546875, 0.0473480224609375, 0.106597900390625, 0.1658477783203125, 0.22509765625, 0.2843475341796875, 0.343597412109375, 0.4028472900390625, 0.46209716796875, 0.5213470458984375, 0.580596923828125, 0.6398468017578125, 0.6990966796875, 0.7583465576171875, 0.817596435546875, 0.8768463134765625, 0.93609619140625, 0.9953460693359375, 1.054595947265625, 1.1138458251953125, 1.173095703125, 1.2323455810546875, 1.291595458984375, 1.3508453369140625, 1.41009521484375, 1.4693450927734375, 1.528594970703125, 1.5878448486328125, 1.6470947265625, 1.7063446044921875, 1.765594482421875, 1.8248443603515625, 1.88409423828125, 1.9433441162109375, 2.002593994140625, 2.0618438720703125, 2.12109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 6.0, 7.0, 19.0, 21.0, 20.0, 28.0, 57.0, 61.0, 64.0, 81.0, 88.0, 95.0, 86.0, 58.0, 68.0, 48.0, 42.0, 32.0, 22.0, 24.0, 16.0, 7.0, 1.0, 6.0, 9.0, 1.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.29296875, -7.08709716796875, -6.8812255859375, -6.67535400390625, -6.469482421875, -6.26361083984375, -6.0577392578125, -5.85186767578125, -5.64599609375, -5.44012451171875, -5.2342529296875, -5.02838134765625, -4.822509765625, -4.61663818359375, -4.4107666015625, -4.20489501953125, -3.9990234375, -3.79315185546875, -3.5872802734375, -3.38140869140625, -3.175537109375, -2.96966552734375, -2.7637939453125, -2.55792236328125, -2.35205078125, -2.14617919921875, -1.9403076171875, -1.73443603515625, -1.528564453125, -1.32269287109375, -1.1168212890625, -0.91094970703125, -0.705078125, -0.49920654296875, -0.2933349609375, -0.08746337890625, 0.118408203125, 0.32427978515625, 0.5301513671875, 0.73602294921875, 0.94189453125, 1.14776611328125, 1.3536376953125, 1.55950927734375, 1.765380859375, 1.97125244140625, 2.1771240234375, 2.38299560546875, 2.5888671875, 2.79473876953125, 3.0006103515625, 3.20648193359375, 3.412353515625, 3.61822509765625, 3.8240966796875, 4.02996826171875, 4.23583984375, 4.44171142578125, 4.6475830078125, 4.85345458984375, 5.059326171875, 5.26519775390625, 5.4710693359375, 5.67694091796875, 5.8828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 10.0, 6.0, 16.0, 12.0, 20.0, 28.0, 47.0, 56.0, 70.0, 84.0, 135.0, 230.0, 437.0, 867.0, 2140.0, 6702.0, 31504.0, 256544.0, 641354.0, 87403.0, 14278.0, 3832.0, 1368.0, 574.0, 310.0, 168.0, 110.0, 79.0, 41.0, 34.0, 22.0, 20.0, 16.0, 7.0, 13.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.9011077880859375, -1.840301513671875, -1.7794952392578125, -1.71868896484375, -1.6578826904296875, -1.597076416015625, -1.5362701416015625, -1.4754638671875, -1.4146575927734375, -1.353851318359375, -1.2930450439453125, -1.23223876953125, -1.1714324951171875, -1.110626220703125, -1.0498199462890625, -0.989013671875, -0.9282073974609375, -0.867401123046875, -0.8065948486328125, -0.74578857421875, -0.6849822998046875, -0.624176025390625, -0.5633697509765625, -0.5025634765625, -0.4417572021484375, -0.380950927734375, -0.3201446533203125, -0.25933837890625, -0.1985321044921875, -0.137725830078125, -0.0769195556640625, -0.01611328125, 0.0446929931640625, 0.105499267578125, 0.1663055419921875, 0.22711181640625, 0.2879180908203125, 0.348724365234375, 0.4095306396484375, 0.4703369140625, 0.5311431884765625, 0.591949462890625, 0.6527557373046875, 0.71356201171875, 0.7743682861328125, 0.835174560546875, 0.8959808349609375, 0.956787109375, 1.0175933837890625, 1.078399658203125, 1.1392059326171875, 1.20001220703125, 1.2608184814453125, 1.321624755859375, 1.3824310302734375, 1.4432373046875, 1.5040435791015625, 1.564849853515625, 1.6256561279296875, 1.68646240234375, 1.7472686767578125, 1.808074951171875, 1.8688812255859375, 1.9296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 13.0, 10.0, 15.0, 12.0, 19.0, 31.0, 33.0, 41.0, 40.0, 45.0, 50.0, 44.0, 48.0, 46.0, 57.0, 56.0, 56.0, 61.0, 34.0, 44.0, 40.0, 45.0, 22.0, 27.0, 15.0, 20.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.05950927734375, -6.8416748046875, -6.62384033203125, -6.406005859375, -6.18817138671875, -5.9703369140625, -5.75250244140625, -5.53466796875, -5.31683349609375, -5.0989990234375, -4.88116455078125, -4.663330078125, -4.44549560546875, -4.2276611328125, -4.00982666015625, -3.7919921875, -3.57415771484375, -3.3563232421875, -3.13848876953125, -2.920654296875, -2.70281982421875, -2.4849853515625, -2.26715087890625, -2.04931640625, -1.83148193359375, -1.6136474609375, -1.39581298828125, -1.177978515625, -0.96014404296875, -0.7423095703125, -0.52447509765625, -0.306640625, -0.08880615234375, 0.1290283203125, 0.34686279296875, 0.564697265625, 0.78253173828125, 1.0003662109375, 1.21820068359375, 1.43603515625, 1.65386962890625, 1.8717041015625, 2.08953857421875, 2.307373046875, 2.52520751953125, 2.7430419921875, 2.96087646484375, 3.1787109375, 3.39654541015625, 3.6143798828125, 3.83221435546875, 4.050048828125, 4.26788330078125, 4.4857177734375, 4.70355224609375, 4.92138671875, 5.13922119140625, 5.3570556640625, 5.57489013671875, 5.792724609375, 6.01055908203125, 6.2283935546875, 6.44622802734375, 6.6640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 10.0, 14.0, 32.0, 46.0, 70.0, 139.0, 235.0, 429.0, 841.0, 2234.0, 7367.0, 45931.0, 708200.0, 255953.0, 19857.0, 4226.0, 1451.0, 654.0, 336.0, 184.0, 99.0, 80.0, 36.0, 21.0, 20.0, 9.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9049224853515625, -0.868438720703125, -0.8319549560546875, -0.79547119140625, -0.7589874267578125, -0.722503662109375, -0.6860198974609375, -0.6495361328125, -0.6130523681640625, -0.576568603515625, -0.5400848388671875, -0.50360107421875, -0.4671173095703125, -0.430633544921875, -0.3941497802734375, -0.357666015625, -0.3211822509765625, -0.284698486328125, -0.2482147216796875, -0.21173095703125, -0.1752471923828125, -0.138763427734375, -0.1022796630859375, -0.0657958984375, -0.0293121337890625, 0.007171630859375, 0.0436553955078125, 0.08013916015625, 0.1166229248046875, 0.153106689453125, 0.1895904541015625, 0.22607421875, 0.2625579833984375, 0.299041748046875, 0.3355255126953125, 0.37200927734375, 0.4084930419921875, 0.444976806640625, 0.4814605712890625, 0.5179443359375, 0.5544281005859375, 0.590911865234375, 0.6273956298828125, 0.66387939453125, 0.7003631591796875, 0.736846923828125, 0.7733306884765625, 0.809814453125, 0.8462982177734375, 0.882781982421875, 0.9192657470703125, 0.95574951171875, 0.9922332763671875, 1.028717041015625, 1.0652008056640625, 1.1016845703125, 1.1381683349609375, 1.174652099609375, 1.2111358642578125, 1.24761962890625, 1.2841033935546875, 1.320587158203125, 1.3570709228515625, 1.3935546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 7.0, 10.0, 16.0, 17.0, 27.0, 36.0, 53.0, 90.0, 84.0, 129.0, 118.0, 112.0, 90.0, 47.0, 43.0, 37.0, 17.0, 15.0, 12.0, 10.0, 5.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001647472381591797, -0.00015980564057826996, -0.00015486404299736023, -0.0001499224454164505, -0.00014498084783554077, -0.00014003925025463104, -0.0001350976526737213, -0.00013015605509281158, -0.00012521445751190186, -0.00012027285993099213, -0.0001153312623500824, -0.00011038966476917267, -0.00010544806718826294, -0.00010050646960735321, -9.556487202644348e-05, -9.062327444553375e-05, -8.568167686462402e-05, -8.07400792837143e-05, -7.579848170280457e-05, -7.085688412189484e-05, -6.591528654098511e-05, -6.097368896007538e-05, -5.603209137916565e-05, -5.109049379825592e-05, -4.614889621734619e-05, -4.120729863643646e-05, -3.6265701055526733e-05, -3.1324103474617004e-05, -2.6382505893707275e-05, -2.1440908312797546e-05, -1.6499310731887817e-05, -1.1557713150978088e-05, -6.616115570068359e-06, -1.6745179891586304e-06, 3.2670795917510986e-06, 8.208677172660828e-06, 1.3150274753570557e-05, 1.8091872334480286e-05, 2.3033469915390015e-05, 2.7975067496299744e-05, 3.291666507720947e-05, 3.78582626581192e-05, 4.279986023902893e-05, 4.774145781993866e-05, 5.268305540084839e-05, 5.762465298175812e-05, 6.256625056266785e-05, 6.750784814357758e-05, 7.24494457244873e-05, 7.739104330539703e-05, 8.233264088630676e-05, 8.727423846721649e-05, 9.221583604812622e-05, 9.715743362903595e-05, 0.00010209903120994568, 0.00010704062879085541, 0.00011198222637176514, 0.00011692382395267487, 0.0001218654215335846, 0.00012680701911449432, 0.00013174861669540405, 0.00013669021427631378, 0.0001416318118572235, 0.00014657340943813324, 0.00015151500701904297]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 14.0, 21.0, 20.0, 25.0, 34.0, 43.0, 72.0, 99.0, 144.0, 232.0, 428.0, 852.0, 1767.0, 4257.0, 12957.0, 63857.0, 557715.0, 347635.0, 41573.0, 9938.0, 3432.0, 1520.0, 767.0, 421.0, 226.0, 159.0, 95.0, 65.0, 48.0, 28.0, 15.0, 10.0, 18.0, 14.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6487350463867188, -0.6226654052734375, -0.5965957641601562, -0.570526123046875, -0.5444564819335938, -0.5183868408203125, -0.49231719970703125, -0.46624755859375, -0.44017791748046875, -0.4141082763671875, -0.38803863525390625, -0.361968994140625, -0.33589935302734375, -0.3098297119140625, -0.28376007080078125, -0.2576904296875, -0.23162078857421875, -0.2055511474609375, -0.17948150634765625, -0.153411865234375, -0.12734222412109375, -0.1012725830078125, -0.07520294189453125, -0.04913330078125, -0.02306365966796875, 0.0030059814453125, 0.02907562255859375, 0.055145263671875, 0.08121490478515625, 0.1072845458984375, 0.13335418701171875, 0.159423828125, 0.18549346923828125, 0.2115631103515625, 0.23763275146484375, 0.263702392578125, 0.28977203369140625, 0.3158416748046875, 0.34191131591796875, 0.36798095703125, 0.39405059814453125, 0.4201202392578125, 0.44618988037109375, 0.472259521484375, 0.49832916259765625, 0.5243988037109375, 0.5504684448242188, 0.5765380859375, 0.6026077270507812, 0.6286773681640625, 0.6547470092773438, 0.680816650390625, 0.7068862915039062, 0.7329559326171875, 0.7590255737304688, 0.78509521484375, 0.8111648559570312, 0.8372344970703125, 0.8633041381835938, 0.889373779296875, 0.9154434204101562, 0.9415130615234375, 0.9675827026367188, 0.99365234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 7.0, 18.0, 21.0, 17.0, 29.0, 35.0, 52.0, 58.0, 82.0, 78.0, 95.0, 96.0, 68.0, 73.0, 58.0, 40.0, 35.0, 35.0, 10.0, 19.0, 11.0, 3.0, 3.0, 8.0, 8.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3925323486328125, -0.381011962890625, -0.3694915771484375, -0.35797119140625, -0.3464508056640625, -0.334930419921875, -0.3234100341796875, -0.3118896484375, -0.3003692626953125, -0.288848876953125, -0.2773284912109375, -0.26580810546875, -0.2542877197265625, -0.242767333984375, -0.2312469482421875, -0.2197265625, -0.2082061767578125, -0.196685791015625, -0.1851654052734375, -0.17364501953125, -0.1621246337890625, -0.150604248046875, -0.1390838623046875, -0.1275634765625, -0.1160430908203125, -0.104522705078125, -0.0930023193359375, -0.08148193359375, -0.0699615478515625, -0.058441162109375, -0.0469207763671875, -0.035400390625, -0.0238800048828125, -0.012359619140625, -0.0008392333984375, 0.01068115234375, 0.0222015380859375, 0.033721923828125, 0.0452423095703125, 0.0567626953125, 0.0682830810546875, 0.079803466796875, 0.0913238525390625, 0.10284423828125, 0.1143646240234375, 0.125885009765625, 0.1374053955078125, 0.14892578125, 0.1604461669921875, 0.171966552734375, 0.1834869384765625, 0.19500732421875, 0.2065277099609375, 0.218048095703125, 0.2295684814453125, 0.2410888671875, 0.2526092529296875, 0.264129638671875, 0.2756500244140625, 0.28717041015625, 0.2986907958984375, 0.310211181640625, 0.3217315673828125, 0.333251953125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 10.0, 61.0, 160.0, 378.0, 248.0, 78.0, 28.0, 11.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.317737579345703, -20.76665496826172, -20.215572357177734, -19.66448974609375, -19.113407135009766, -18.56232452392578, -18.011241912841797, -17.460159301757812, -16.909076690673828, -16.357994079589844, -15.80691146850586, -15.255828857421875, -14.70474624633789, -14.153663635253906, -13.602581977844238, -13.051499366760254, -12.500417709350586, -11.949335098266602, -11.398252487182617, -10.847169876098633, -10.296087265014648, -9.745004653930664, -9.193922996520996, -8.642840385437012, -8.091757774353027, -7.540675163269043, -6.989592552185059, -6.438510417938232, -5.887427806854248, -5.336345195770264, -4.7852630615234375, -4.234180450439453, -3.6830968856811523, -3.132014274597168, -2.5809319019317627, -2.0298495292663574, -1.478766918182373, -0.9276843070983887, -0.3766019344329834, 0.17448043823242188, 0.7255630493164062, 1.276645541191101, 1.827728033065796, 2.378810405731201, 2.9298930168151855, 3.48097562789917, 4.032057762145996, 4.5831403732299805, 5.134222984313965, 5.685305595397949, 6.236388206481934, 6.78747034072876, 7.338552951812744, 7.8896355628967285, 8.440717697143555, 8.991800308227539, 9.542882919311523, 10.093965530395508, 10.645048141479492, 11.196130752563477, 11.747213363647461, 12.298295974731445, 12.849377632141113, 13.400460243225098, 13.951542854309082]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 7.0, 10.0, 14.0, 13.0, 17.0, 26.0, 30.0, 33.0, 26.0, 42.0, 43.0, 42.0, 41.0, 54.0, 56.0, 52.0, 65.0, 44.0, 49.0, 47.0, 37.0, 42.0, 28.0, 22.0, 33.0, 24.0, 16.0, 11.0, 7.0, 11.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.751856803894043, -15.308099746704102, -14.864343643188477, -14.420587539672852, -13.97683048248291, -13.533073425292969, -13.089317321777344, -12.645561218261719, -12.201804161071777, -11.758047103881836, -11.314291000366211, -10.870534896850586, -10.426777839660645, -9.983020782470703, -9.539264678955078, -9.095508575439453, -8.651751518249512, -8.20799446105957, -7.764238357543945, -7.320481777191162, -6.876725196838379, -6.432968616485596, -5.9892120361328125, -5.545455455780029, -5.101698875427246, -4.657942295074463, -4.21418571472168, -3.7704291343688965, -3.3266725540161133, -2.88291597366333, -2.439159393310547, -1.9954028129577637, -1.5516462326049805, -1.1078896522521973, -0.6641330718994141, -0.22037649154663086, 0.22338008880615234, 0.6671366691589355, 1.1108932495117188, 1.554649829864502, 1.9984064102172852, 2.4421629905700684, 2.8859195709228516, 3.3296761512756348, 3.773432731628418, 4.217189311981201, 4.660945892333984, 5.104702472686768, 5.548459053039551, 5.992215633392334, 6.435972213745117, 6.8797287940979, 7.323485374450684, 7.767241954803467, 8.21099853515625, 8.654754638671875, 9.098511695861816, 9.542268753051758, 9.986024856567383, 10.429780960083008, 10.87353801727295, 11.31729507446289, 11.761051177978516, 12.20480728149414, 12.648564338684082]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 8.0, 11.0, 13.0, 16.0, 29.0, 30.0, 50.0, 58.0, 78.0, 142.0, 187.0, 315.0, 499.0, 899.0, 1683.0, 3504.0, 9112.0, 31250.0, 180986.0, 3351689.0, 531582.0, 56456.0, 14892.0, 5512.0, 2422.0, 1142.0, 630.0, 363.0, 235.0, 136.0, 101.0, 66.0, 44.0, 29.0, 27.0, 14.0, 25.0, 5.0, 7.0, 10.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-3.947265625, -3.836700439453125, -3.72613525390625, -3.615570068359375, -3.5050048828125, -3.394439697265625, -3.28387451171875, -3.173309326171875, -3.062744140625, -2.952178955078125, -2.84161376953125, -2.731048583984375, -2.6204833984375, -2.509918212890625, -2.39935302734375, -2.288787841796875, -2.17822265625, -2.067657470703125, -1.95709228515625, -1.846527099609375, -1.7359619140625, -1.625396728515625, -1.51483154296875, -1.404266357421875, -1.293701171875, -1.183135986328125, -1.07257080078125, -0.962005615234375, -0.8514404296875, -0.740875244140625, -0.63031005859375, -0.519744873046875, -0.4091796875, -0.298614501953125, -0.18804931640625, -0.077484130859375, 0.0330810546875, 0.143646240234375, 0.25421142578125, 0.364776611328125, 0.475341796875, 0.585906982421875, 0.69647216796875, 0.807037353515625, 0.9176025390625, 1.028167724609375, 1.13873291015625, 1.249298095703125, 1.35986328125, 1.470428466796875, 1.58099365234375, 1.691558837890625, 1.8021240234375, 1.912689208984375, 2.02325439453125, 2.133819580078125, 2.244384765625, 2.354949951171875, 2.46551513671875, 2.576080322265625, 2.6866455078125, 2.797210693359375, 2.90777587890625, 3.018341064453125, 3.12890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 1.0, 9.0, 13.0, 14.0, 14.0, 27.0, 34.0, 43.0, 54.0, 75.0, 81.0, 83.0, 116.0, 101.0, 95.0, 62.0, 41.0, 29.0, 24.0, 23.0, 10.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.797210693359375, -3.68621826171875, -3.575225830078125, -3.4642333984375, -3.353240966796875, -3.24224853515625, -3.131256103515625, -3.020263671875, -2.909271240234375, -2.79827880859375, -2.687286376953125, -2.5762939453125, -2.465301513671875, -2.35430908203125, -2.243316650390625, -2.13232421875, -2.021331787109375, -1.91033935546875, -1.799346923828125, -1.6883544921875, -1.577362060546875, -1.46636962890625, -1.355377197265625, -1.244384765625, -1.133392333984375, -1.02239990234375, -0.911407470703125, -0.8004150390625, -0.689422607421875, -0.57843017578125, -0.467437744140625, -0.3564453125, -0.245452880859375, -0.13446044921875, -0.023468017578125, 0.0875244140625, 0.198516845703125, 0.30950927734375, 0.420501708984375, 0.531494140625, 0.642486572265625, 0.75347900390625, 0.864471435546875, 0.9754638671875, 1.086456298828125, 1.19744873046875, 1.308441162109375, 1.41943359375, 1.530426025390625, 1.64141845703125, 1.752410888671875, 1.8634033203125, 1.974395751953125, 2.08538818359375, 2.196380615234375, 2.307373046875, 2.418365478515625, 2.52935791015625, 2.640350341796875, 2.7513427734375, 2.862335205078125, 2.97332763671875, 3.084320068359375, 3.1953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 5.0, 6.0, 5.0, 17.0, 24.0, 53.0, 62.0, 133.0, 299.0, 940.0, 4331.0, 52093.0, 4009552.0, 118281.0, 6576.0, 1184.0, 381.0, 152.0, 65.0, 47.0, 30.0, 20.0, 12.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.02728271484375, -7.7733154296875, -7.51934814453125, -7.265380859375, -7.01141357421875, -6.7574462890625, -6.50347900390625, -6.24951171875, -5.99554443359375, -5.7415771484375, -5.48760986328125, -5.233642578125, -4.97967529296875, -4.7257080078125, -4.47174072265625, -4.2177734375, -3.96380615234375, -3.7098388671875, -3.45587158203125, -3.201904296875, -2.94793701171875, -2.6939697265625, -2.44000244140625, -2.18603515625, -1.93206787109375, -1.6781005859375, -1.42413330078125, -1.170166015625, -0.91619873046875, -0.6622314453125, -0.40826416015625, -0.154296875, 0.09967041015625, 0.3536376953125, 0.60760498046875, 0.861572265625, 1.11553955078125, 1.3695068359375, 1.62347412109375, 1.87744140625, 2.13140869140625, 2.3853759765625, 2.63934326171875, 2.893310546875, 3.14727783203125, 3.4012451171875, 3.65521240234375, 3.9091796875, 4.16314697265625, 4.4171142578125, 4.67108154296875, 4.925048828125, 5.17901611328125, 5.4329833984375, 5.68695068359375, 5.94091796875, 6.19488525390625, 6.4488525390625, 6.70281982421875, 6.956787109375, 7.21075439453125, 7.4647216796875, 7.71868896484375, 7.97265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 8.0, 9.0, 11.0, 22.0, 20.0, 39.0, 36.0, 84.0, 122.0, 208.0, 421.0, 1195.0, 960.0, 395.0, 188.0, 103.0, 56.0, 60.0, 48.0, 33.0, 18.0, 10.0, 6.0, 10.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0266876220703125, -0.989898681640625, -0.9531097412109375, -0.91632080078125, -0.8795318603515625, -0.842742919921875, -0.8059539794921875, -0.7691650390625, -0.7323760986328125, -0.695587158203125, -0.6587982177734375, -0.62200927734375, -0.5852203369140625, -0.548431396484375, -0.5116424560546875, -0.474853515625, -0.4380645751953125, -0.401275634765625, -0.3644866943359375, -0.32769775390625, -0.2909088134765625, -0.254119873046875, -0.2173309326171875, -0.1805419921875, -0.1437530517578125, -0.106964111328125, -0.0701751708984375, -0.03338623046875, 0.0034027099609375, 0.040191650390625, 0.0769805908203125, 0.11376953125, 0.1505584716796875, 0.187347412109375, 0.2241363525390625, 0.26092529296875, 0.2977142333984375, 0.334503173828125, 0.3712921142578125, 0.4080810546875, 0.4448699951171875, 0.481658935546875, 0.5184478759765625, 0.55523681640625, 0.5920257568359375, 0.628814697265625, 0.6656036376953125, 0.702392578125, 0.7391815185546875, 0.775970458984375, 0.8127593994140625, 0.84954833984375, 0.8863372802734375, 0.923126220703125, 0.9599151611328125, 0.9967041015625, 1.0334930419921875, 1.070281982421875, 1.1070709228515625, 1.14385986328125, 1.1806488037109375, 1.217437744140625, 1.2542266845703125, 1.291015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 7.0, 18.0, 21.0, 16.0, 28.0, 40.0, 94.0, 193.0, 196.0, 146.0, 99.0, 54.0, 26.0, 18.0, 12.0, 7.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.628277778625488, -5.443141937255859, -5.258006572723389, -5.07287073135376, -4.887734889984131, -4.702599048614502, -4.517463684082031, -4.332327842712402, -4.147192001342773, -3.9620563983917236, -3.7769205570220947, -3.591784954071045, -3.406649112701416, -3.221513509750366, -3.0363779067993164, -2.8512420654296875, -2.6661064624786377, -2.480970859527588, -2.295835018157959, -2.110699415206909, -1.9255635738372803, -1.7404279708862305, -1.5552922487258911, -1.3701565265655518, -1.1850208044052124, -0.999885082244873, -0.8147493600845337, -0.6296136975288391, -0.44447797536849976, -0.2593422532081604, -0.07420659065246582, 0.11092913150787354, 0.2960648536682129, 0.48120057582855225, 0.6663362979888916, 0.8514719605445862, 1.0366077423095703, 1.2217433452606201, 1.4068790674209595, 1.5920147895812988, 1.7771505117416382, 1.9622862339019775, 2.1474218368530273, 2.3325576782226562, 2.517693281173706, 2.702829122543335, 2.8879647254943848, 3.0731005668640137, 3.2582361698150635, 3.4433717727661133, 3.628507614135742, 3.813643217086792, 3.998779058456421, 4.183914661407471, 4.3690505027771, 4.55418586730957, 4.739321708679199, 4.924457550048828, 5.109592914581299, 5.294728755950928, 5.479864597320557, 5.6650004386901855, 5.850135803222656, 6.035271644592285, 6.220407485961914]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 7.0, 9.0, 5.0, 22.0, 20.0, 18.0, 30.0, 33.0, 46.0, 51.0, 61.0, 67.0, 67.0, 62.0, 72.0, 64.0, 57.0, 65.0, 43.0, 41.0, 35.0, 28.0, 14.0, 16.0, 19.0, 9.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.736663818359375, -3.6356585025787354, -3.5346531867980957, -3.433647871017456, -3.3326425552368164, -3.2316370010375977, -3.130631685256958, -3.0296263694763184, -2.9286210536956787, -2.827615737915039, -2.7266104221343994, -2.6256051063537598, -2.524599552154541, -2.4235944747924805, -2.3225889205932617, -2.221583604812622, -2.1205782890319824, -2.0195729732513428, -1.9185676574707031, -1.817562222480774, -1.7165569067001343, -1.6155515909194946, -1.5145461559295654, -1.4135408401489258, -1.3125355243682861, -1.2115302085876465, -1.1105248928070068, -1.0095194578170776, -0.908514142036438, -0.8075088262557983, -0.7065034508705139, -0.6054980754852295, -0.5044925212860107, -0.4034871757030487, -0.30248183012008667, -0.20147648453712463, -0.1004711389541626, 0.0005341768264770508, 0.10153955221176147, 0.2025449275970459, 0.30355024337768555, 0.4045555889606476, 0.5055609345436096, 0.606566309928894, 0.7075716257095337, 0.8085769414901733, 0.9095823168754578, 1.0105876922607422, 1.1115930080413818, 1.2125983238220215, 1.3136036396026611, 1.4146090745925903, 1.51561439037323, 1.6166197061538696, 1.7176251411437988, 1.8186304569244385, 1.9196357727050781, 2.0206410884857178, 2.1216464042663574, 2.222651720046997, 2.3236570358276367, 2.4246625900268555, 2.525667905807495, 2.6266732215881348, 2.7276785373687744]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 11.0, 17.0, 27.0, 38.0, 45.0, 81.0, 142.0, 299.0, 806.0, 3433.0, 33512.0, 869750.0, 131080.0, 7042.0, 1370.0, 392.0, 197.0, 92.0, 59.0, 27.0, 28.0, 22.0, 17.0, 13.0, 11.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6513671875, -0.6320343017578125, -0.612701416015625, -0.5933685302734375, -0.57403564453125, -0.5547027587890625, -0.535369873046875, -0.5160369873046875, -0.4967041015625, -0.4773712158203125, -0.458038330078125, -0.4387054443359375, -0.41937255859375, -0.4000396728515625, -0.380706787109375, -0.3613739013671875, -0.342041015625, -0.3227081298828125, -0.303375244140625, -0.2840423583984375, -0.26470947265625, -0.2453765869140625, -0.226043701171875, -0.2067108154296875, -0.1873779296875, -0.1680450439453125, -0.148712158203125, -0.1293792724609375, -0.11004638671875, -0.0907135009765625, -0.071380615234375, -0.0520477294921875, -0.03271484375, -0.0133819580078125, 0.005950927734375, 0.0252838134765625, 0.04461669921875, 0.0639495849609375, 0.083282470703125, 0.1026153564453125, 0.1219482421875, 0.1412811279296875, 0.160614013671875, 0.1799468994140625, 0.19927978515625, 0.2186126708984375, 0.237945556640625, 0.2572784423828125, 0.276611328125, 0.2959442138671875, 0.315277099609375, 0.3346099853515625, 0.35394287109375, 0.3732757568359375, 0.392608642578125, 0.4119415283203125, 0.4312744140625, 0.4506072998046875, 0.469940185546875, 0.4892730712890625, 0.50860595703125, 0.5279388427734375, 0.547271728515625, 0.5666046142578125, 0.5859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 2.0, 13.0, 14.0, 17.0, 23.0, 28.0, 31.0, 53.0, 54.0, 63.0, 72.0, 70.0, 92.0, 66.0, 73.0, 67.0, 56.0, 45.0, 42.0, 28.0, 14.0, 15.0, 14.0, 12.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.84375, -2.7613525390625, -2.678955078125, -2.5965576171875, -2.51416015625, -2.4317626953125, -2.349365234375, -2.2669677734375, -2.1845703125, -2.1021728515625, -2.019775390625, -1.9373779296875, -1.85498046875, -1.7725830078125, -1.690185546875, -1.6077880859375, -1.525390625, -1.4429931640625, -1.360595703125, -1.2781982421875, -1.19580078125, -1.1134033203125, -1.031005859375, -0.9486083984375, -0.8662109375, -0.7838134765625, -0.701416015625, -0.6190185546875, -0.53662109375, -0.4542236328125, -0.371826171875, -0.2894287109375, -0.20703125, -0.1246337890625, -0.042236328125, 0.0401611328125, 0.12255859375, 0.2049560546875, 0.287353515625, 0.3697509765625, 0.4521484375, 0.5345458984375, 0.616943359375, 0.6993408203125, 0.78173828125, 0.8641357421875, 0.946533203125, 1.0289306640625, 1.111328125, 1.1937255859375, 1.276123046875, 1.3585205078125, 1.44091796875, 1.5233154296875, 1.605712890625, 1.6881103515625, 1.7705078125, 1.8529052734375, 1.935302734375, 2.0177001953125, 2.10009765625, 2.1824951171875, 2.264892578125, 2.3472900390625, 2.4296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 5.0, 15.0, 15.0, 15.0, 25.0, 22.0, 30.0, 51.0, 47.0, 81.0, 118.0, 204.0, 317.0, 567.0, 1649.0, 10846.0, 121724.0, 730974.0, 163580.0, 14334.0, 2233.0, 653.0, 314.0, 177.0, 126.0, 107.0, 79.0, 50.0, 33.0, 35.0, 19.0, 21.0, 12.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2600440979003906, -0.25153350830078125, -0.24302291870117188, -0.2345123291015625, -0.22600173950195312, -0.21749114990234375, -0.20898056030273438, -0.200469970703125, -0.19195938110351562, -0.18344879150390625, -0.17493820190429688, -0.1664276123046875, -0.15791702270507812, -0.14940643310546875, -0.14089584350585938, -0.13238525390625, -0.12387466430664062, -0.11536407470703125, -0.10685348510742188, -0.0983428955078125, -0.08983230590820312, -0.08132171630859375, -0.07281112670898438, -0.064300537109375, -0.055789947509765625, -0.04727935791015625, -0.038768768310546875, -0.0302581787109375, -0.021747589111328125, -0.01323699951171875, -0.004726409912109375, 0.0037841796875, 0.012294769287109375, 0.02080535888671875, 0.029315948486328125, 0.0378265380859375, 0.046337127685546875, 0.05484771728515625, 0.06335830688476562, 0.071868896484375, 0.08037948608398438, 0.08889007568359375, 0.09740066528320312, 0.1059112548828125, 0.11442184448242188, 0.12293243408203125, 0.13144302368164062, 0.13995361328125, 0.14846420288085938, 0.15697479248046875, 0.16548538208007812, 0.1739959716796875, 0.18250656127929688, 0.19101715087890625, 0.19952774047851562, 0.208038330078125, 0.21654891967773438, 0.22505950927734375, 0.23357009887695312, 0.2420806884765625, 0.2505912780761719, 0.25910186767578125, 0.2676124572753906, 0.276123046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 9.0, 13.0, 15.0, 15.0, 15.0, 18.0, 29.0, 32.0, 35.0, 33.0, 41.0, 44.0, 33.0, 47.0, 45.0, 45.0, 46.0, 50.0, 45.0, 34.0, 33.0, 30.0, 32.0, 34.0, 30.0, 35.0, 26.0, 23.0, 19.0, 13.0, 10.0, 9.0, 14.0, 8.0, 10.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5703125, -3.466033935546875, -3.36175537109375, -3.257476806640625, -3.1531982421875, -3.048919677734375, -2.94464111328125, -2.840362548828125, -2.736083984375, -2.631805419921875, -2.52752685546875, -2.423248291015625, -2.3189697265625, -2.214691162109375, -2.11041259765625, -2.006134033203125, -1.90185546875, -1.797576904296875, -1.69329833984375, -1.589019775390625, -1.4847412109375, -1.380462646484375, -1.27618408203125, -1.171905517578125, -1.067626953125, -0.963348388671875, -0.85906982421875, -0.754791259765625, -0.6505126953125, -0.546234130859375, -0.44195556640625, -0.337677001953125, -0.2333984375, -0.129119873046875, -0.02484130859375, 0.079437255859375, 0.1837158203125, 0.287994384765625, 0.39227294921875, 0.496551513671875, 0.600830078125, 0.705108642578125, 0.80938720703125, 0.913665771484375, 1.0179443359375, 1.122222900390625, 1.22650146484375, 1.330780029296875, 1.43505859375, 1.539337158203125, 1.64361572265625, 1.747894287109375, 1.8521728515625, 1.956451416015625, 2.06072998046875, 2.165008544921875, 2.269287109375, 2.373565673828125, 2.47784423828125, 2.582122802734375, 2.6864013671875, 2.790679931640625, 2.89495849609375, 2.999237060546875, 3.103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 7.0, 5.0, 14.0, 17.0, 15.0, 26.0, 31.0, 35.0, 50.0, 85.0, 152.0, 418.0, 1526.0, 12634.0, 1009071.0, 21338.0, 2097.0, 474.0, 213.0, 99.0, 54.0, 36.0, 33.0, 19.0, 15.0, 14.0, 14.0, 11.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1253662109375, -0.12139701843261719, -0.11742782592773438, -0.11345863342285156, -0.10948944091796875, -0.10552024841308594, -0.10155105590820312, -0.09758186340332031, -0.0936126708984375, -0.08964347839355469, -0.08567428588867188, -0.08170509338378906, -0.07773590087890625, -0.07376670837402344, -0.06979751586914062, -0.06582832336425781, -0.061859130859375, -0.05788993835449219, -0.053920745849609375, -0.04995155334472656, -0.04598236083984375, -0.04201316833496094, -0.038043975830078125, -0.03407478332519531, -0.0301055908203125, -0.026136398315429688, -0.022167205810546875, -0.018198013305664062, -0.01422882080078125, -0.010259628295898438, -0.006290435791015625, -0.0023212432861328125, 0.00164794921875, 0.0056171417236328125, 0.009586334228515625, 0.013555526733398438, 0.01752471923828125, 0.021493911743164062, 0.025463104248046875, 0.029432296752929688, 0.0334014892578125, 0.03737068176269531, 0.041339874267578125, 0.04530906677246094, 0.04927825927734375, 0.05324745178222656, 0.057216644287109375, 0.06118583679199219, 0.065155029296875, 0.06912422180175781, 0.07309341430664062, 0.07706260681152344, 0.08103179931640625, 0.08500099182128906, 0.08897018432617188, 0.09293937683105469, 0.0969085693359375, 0.10087776184082031, 0.10484695434570312, 0.10881614685058594, 0.11278533935546875, 0.11675453186035156, 0.12072372436523438, 0.12469291687011719, 0.128662109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 2.0, 6.0, 12.0, 21.0, 55.0, 154.0, 304.0, 265.0, 104.0, 39.0, 20.0, 6.0, 4.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.273653030395508e-05, -4.0685757994651794e-05, -3.863498568534851e-05, -3.658421337604523e-05, -3.453344106674194e-05, -3.248266875743866e-05, -3.0431896448135376e-05, -2.8381124138832092e-05, -2.633035182952881e-05, -2.4279579520225525e-05, -2.222880721092224e-05, -2.0178034901618958e-05, -1.8127262592315674e-05, -1.607649028301239e-05, -1.4025717973709106e-05, -1.1974945664405823e-05, -9.924173355102539e-06, -7.873401045799255e-06, -5.822628736495972e-06, -3.771856427192688e-06, -1.7210841178894043e-06, 3.296881914138794e-07, 2.380460500717163e-06, 4.431232810020447e-06, 6.4820051193237305e-06, 8.532777428627014e-06, 1.0583549737930298e-05, 1.2634322047233582e-05, 1.4685094356536865e-05, 1.673586666584015e-05, 1.8786638975143433e-05, 2.0837411284446716e-05, 2.288818359375e-05, 2.4938955903053284e-05, 2.6989728212356567e-05, 2.904050052165985e-05, 3.1091272830963135e-05, 3.314204514026642e-05, 3.51928174495697e-05, 3.7243589758872986e-05, 3.929436206817627e-05, 4.134513437747955e-05, 4.339590668678284e-05, 4.544667899608612e-05, 4.7497451305389404e-05, 4.954822361469269e-05, 5.159899592399597e-05, 5.3649768233299255e-05, 5.570054054260254e-05, 5.775131285190582e-05, 5.9802085161209106e-05, 6.185285747051239e-05, 6.390362977981567e-05, 6.595440208911896e-05, 6.800517439842224e-05, 7.005594670772552e-05, 7.210671901702881e-05, 7.415749132633209e-05, 7.620826363563538e-05, 7.825903594493866e-05, 8.030980825424194e-05, 8.236058056354523e-05, 8.441135287284851e-05, 8.64621251821518e-05, 8.851289749145508e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 8.0, 6.0, 14.0, 18.0, 33.0, 33.0, 59.0, 83.0, 126.0, 224.0, 488.0, 1280.0, 4300.0, 37176.0, 980220.0, 19190.0, 3230.0, 1020.0, 430.0, 209.0, 131.0, 80.0, 54.0, 41.0, 22.0, 27.0, 11.0, 6.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.1349029541015625, -0.129791259765625, -0.1246795654296875, -0.11956787109375, -0.1144561767578125, -0.109344482421875, -0.1042327880859375, -0.09912109375, -0.0940093994140625, -0.088897705078125, -0.0837860107421875, -0.07867431640625, -0.0735626220703125, -0.068450927734375, -0.0633392333984375, -0.0582275390625, -0.0531158447265625, -0.048004150390625, -0.0428924560546875, -0.03778076171875, -0.0326690673828125, -0.027557373046875, -0.0224456787109375, -0.017333984375, -0.0122222900390625, -0.007110595703125, -0.0019989013671875, 0.00311279296875, 0.0082244873046875, 0.013336181640625, 0.0184478759765625, 0.0235595703125, 0.0286712646484375, 0.033782958984375, 0.0388946533203125, 0.04400634765625, 0.0491180419921875, 0.054229736328125, 0.0593414306640625, 0.064453125, 0.0695648193359375, 0.074676513671875, 0.0797882080078125, 0.08489990234375, 0.0900115966796875, 0.095123291015625, 0.1002349853515625, 0.1053466796875, 0.1104583740234375, 0.115570068359375, 0.1206817626953125, 0.12579345703125, 0.1309051513671875, 0.136016845703125, 0.1411285400390625, 0.146240234375, 0.1513519287109375, 0.156463623046875, 0.1615753173828125, 0.16668701171875, 0.1717987060546875, 0.176910400390625, 0.1820220947265625, 0.1871337890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 21.0, 27.0, 37.0, 68.0, 149.0, 344.0, 160.0, 80.0, 40.0, 24.0, 17.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035858154296875, -0.03482174873352051, -0.033785343170166016, -0.03274893760681152, -0.03171253204345703, -0.03067612648010254, -0.029639720916748047, -0.028603315353393555, -0.027566909790039062, -0.02653050422668457, -0.025494098663330078, -0.024457693099975586, -0.023421287536621094, -0.0223848819732666, -0.02134847640991211, -0.020312070846557617, -0.019275665283203125, -0.018239259719848633, -0.01720285415649414, -0.01616644859313965, -0.015130043029785156, -0.014093637466430664, -0.013057231903076172, -0.01202082633972168, -0.010984420776367188, -0.009948015213012695, -0.008911609649658203, -0.007875204086303711, -0.006838798522949219, -0.0058023929595947266, -0.004765987396240234, -0.003729581832885742, -0.00269317626953125, -0.0016567707061767578, -0.0006203651428222656, 0.00041604042053222656, 0.0014524459838867188, 0.002488851547241211, 0.003525257110595703, 0.004561662673950195, 0.0055980682373046875, 0.00663447380065918, 0.007670879364013672, 0.008707284927368164, 0.009743690490722656, 0.010780096054077148, 0.01181650161743164, 0.012852907180786133, 0.013889312744140625, 0.014925718307495117, 0.01596212387084961, 0.0169985294342041, 0.018034934997558594, 0.019071340560913086, 0.020107746124267578, 0.02114415168762207, 0.022180557250976562, 0.023216962814331055, 0.024253368377685547, 0.02528977394104004, 0.02632617950439453, 0.027362585067749023, 0.028398990631103516, 0.029435396194458008, 0.0304718017578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 11.0, 16.0, 26.0, 39.0, 86.0, 240.0, 285.0, 145.0, 73.0, 30.0, 14.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.954397201538086, -5.775512218475342, -5.596627235412598, -5.4177422523498535, -5.238857269287109, -5.059972286224365, -4.881087303161621, -4.702201843261719, -4.523317337036133, -4.344432353973389, -4.1655473709106445, -3.9866623878479004, -3.8077774047851562, -3.628892421722412, -3.450007200241089, -3.2711222171783447, -3.0922369956970215, -2.9133520126342773, -2.734467029571533, -2.555582046508789, -2.376697063446045, -2.197812080383301, -2.0189268589019775, -1.8400418758392334, -1.6611568927764893, -1.4822719097137451, -1.303386926651001, -1.1245018243789673, -0.9456168413162231, -0.766731858253479, -0.5878467559814453, -0.40896177291870117, -0.23007726669311523, -0.051192253828048706, 0.12769275903701782, 0.30657780170440674, 0.4854627847671509, 0.664347767829895, 0.8432328701019287, 1.0221178531646729, 1.201002836227417, 1.3798878192901611, 1.5587728023529053, 1.737657904624939, 1.916542887687683, 2.095427989959717, 2.274312973022461, 2.453197956085205, 2.632082939147949, 2.8109679222106934, 2.9898529052734375, 3.1687378883361816, 3.347622871398926, 3.52650785446167, 3.705393075942993, 3.8842780590057373, 4.063162803649902, 4.2420477867126465, 4.420932769775391, 4.599817752838135, 4.778702735900879, 4.957587718963623, 5.136472702026367, 5.3153581619262695, 5.494243144989014]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 13.0, 10.0, 23.0, 19.0, 25.0, 35.0, 53.0, 56.0, 67.0, 70.0, 78.0, 78.0, 79.0, 66.0, 63.0, 55.0, 39.0, 40.0, 19.0, 16.0, 24.0, 11.0, 8.0, 6.0, 10.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.8812129497528076, -2.804255485534668, -2.727297782897949, -2.6503403186798096, -2.57338285446167, -2.496425151824951, -2.4194676876068115, -2.342510223388672, -2.265552520751953, -2.1885950565338135, -2.1116373538970947, -2.034679889678955, -1.9577223062515259, -1.8807647228240967, -1.803807258605957, -1.7268496751785278, -1.6498920917510986, -1.5729345083236694, -1.4959769248962402, -1.4190194606781006, -1.3420618772506714, -1.2651042938232422, -1.1881468296051025, -1.1111892461776733, -1.0342316627502441, -0.9572740793228149, -0.8803165555000305, -0.8033590316772461, -0.7264014482498169, -0.6494438648223877, -0.5724863409996033, -0.49552881717681885, -0.41857123374938965, -0.34161368012428284, -0.264656126499176, -0.1876985728740692, -0.1107410192489624, -0.03378346562385559, 0.04317408800125122, 0.12013161182403564, 0.19708919525146484, 0.27404674887657166, 0.35100430250167847, 0.4279618561267853, 0.5049194097518921, 0.5818769931793213, 0.6588345170021057, 0.7357920408248901, 0.8127496242523193, 0.8897072076797485, 0.966664731502533, 1.0436222553253174, 1.1205798387527466, 1.1975374221801758, 1.2744948863983154, 1.3514524698257446, 1.4284100532531738, 1.505367636680603, 1.5823252201080322, 1.6592826843261719, 1.736240267753601, 1.8131978511810303, 1.89015531539917, 1.9671128988265991, 2.0440704822540283]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 9.0, 8.0, 14.0, 16.0, 24.0, 29.0, 40.0, 60.0, 87.0, 150.0, 184.0, 284.0, 422.0, 716.0, 1164.0, 2057.0, 4036.0, 8324.0, 20756.0, 69091.0, 473409.0, 372817.0, 59832.0, 18646.0, 7658.0, 3637.0, 1979.0, 1164.0, 683.0, 407.0, 273.0, 168.0, 128.0, 80.0, 51.0, 49.0, 22.0, 22.0, 14.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2890625, -1.2460174560546875, -1.202972412109375, -1.1599273681640625, -1.11688232421875, -1.0738372802734375, -1.030792236328125, -0.9877471923828125, -0.9447021484375, -0.9016571044921875, -0.858612060546875, -0.8155670166015625, -0.77252197265625, -0.7294769287109375, -0.686431884765625, -0.6433868408203125, -0.600341796875, -0.5572967529296875, -0.514251708984375, -0.4712066650390625, -0.42816162109375, -0.3851165771484375, -0.342071533203125, -0.2990264892578125, -0.2559814453125, -0.2129364013671875, -0.169891357421875, -0.1268463134765625, -0.08380126953125, -0.0407562255859375, 0.002288818359375, 0.0453338623046875, 0.08837890625, 0.1314239501953125, 0.174468994140625, 0.2175140380859375, 0.26055908203125, 0.3036041259765625, 0.346649169921875, 0.3896942138671875, 0.4327392578125, 0.4757843017578125, 0.518829345703125, 0.5618743896484375, 0.60491943359375, 0.6479644775390625, 0.691009521484375, 0.7340545654296875, 0.777099609375, 0.8201446533203125, 0.863189697265625, 0.9062347412109375, 0.94927978515625, 0.9923248291015625, 1.035369873046875, 1.0784149169921875, 1.1214599609375, 1.1645050048828125, 1.207550048828125, 1.2505950927734375, 1.29364013671875, 1.3366851806640625, 1.379730224609375, 1.4227752685546875, 1.4658203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 3.0, 7.0, 6.0, 10.0, 15.0, 11.0, 24.0, 24.0, 51.0, 39.0, 59.0, 74.0, 94.0, 74.0, 82.0, 80.0, 65.0, 60.0, 44.0, 44.0, 32.0, 20.0, 18.0, 14.0, 10.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.625, -6.44647216796875, -6.2679443359375, -6.08941650390625, -5.910888671875, -5.73236083984375, -5.5538330078125, -5.37530517578125, -5.19677734375, -5.01824951171875, -4.8397216796875, -4.66119384765625, -4.482666015625, -4.30413818359375, -4.1256103515625, -3.94708251953125, -3.7685546875, -3.59002685546875, -3.4114990234375, -3.23297119140625, -3.054443359375, -2.87591552734375, -2.6973876953125, -2.51885986328125, -2.34033203125, -2.16180419921875, -1.9832763671875, -1.80474853515625, -1.626220703125, -1.44769287109375, -1.2691650390625, -1.09063720703125, -0.912109375, -0.73358154296875, -0.5550537109375, -0.37652587890625, -0.197998046875, -0.01947021484375, 0.1590576171875, 0.33758544921875, 0.51611328125, 0.69464111328125, 0.8731689453125, 1.05169677734375, 1.230224609375, 1.40875244140625, 1.5872802734375, 1.76580810546875, 1.9443359375, 2.12286376953125, 2.3013916015625, 2.47991943359375, 2.658447265625, 2.83697509765625, 3.0155029296875, 3.19403076171875, 3.37255859375, 3.55108642578125, 3.7296142578125, 3.90814208984375, 4.086669921875, 4.26519775390625, 4.4437255859375, 4.62225341796875, 4.80078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 15.0, 31.0, 18.0, 38.0, 80.0, 155.0, 317.0, 1013.0, 4156.0, 46041.0, 957639.0, 33833.0, 3596.0, 929.0, 327.0, 148.0, 81.0, 50.0, 21.0, 20.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2840576171875, -4.169677734375, -4.0552978515625, -3.94091796875, -3.8265380859375, -3.712158203125, -3.5977783203125, -3.4833984375, -3.3690185546875, -3.254638671875, -3.1402587890625, -3.02587890625, -2.9114990234375, -2.797119140625, -2.6827392578125, -2.568359375, -2.4539794921875, -2.339599609375, -2.2252197265625, -2.11083984375, -1.9964599609375, -1.882080078125, -1.7677001953125, -1.6533203125, -1.5389404296875, -1.424560546875, -1.3101806640625, -1.19580078125, -1.0814208984375, -0.967041015625, -0.8526611328125, -0.73828125, -0.6239013671875, -0.509521484375, -0.3951416015625, -0.28076171875, -0.1663818359375, -0.052001953125, 0.0623779296875, 0.1767578125, 0.2911376953125, 0.405517578125, 0.5198974609375, 0.63427734375, 0.7486572265625, 0.863037109375, 0.9774169921875, 1.091796875, 1.2061767578125, 1.320556640625, 1.4349365234375, 1.54931640625, 1.6636962890625, 1.778076171875, 1.8924560546875, 2.0068359375, 2.1212158203125, 2.235595703125, 2.3499755859375, 2.46435546875, 2.5787353515625, 2.693115234375, 2.8074951171875, 2.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 10.0, 5.0, 11.0, 7.0, 15.0, 21.0, 15.0, 34.0, 30.0, 38.0, 44.0, 50.0, 45.0, 51.0, 60.0, 59.0, 61.0, 55.0, 59.0, 57.0, 39.0, 43.0, 30.0, 31.0, 31.0, 29.0, 14.0, 13.0, 15.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-8.5625, -8.357177734375, -8.15185546875, -7.946533203125, -7.7412109375, -7.535888671875, -7.33056640625, -7.125244140625, -6.919921875, -6.714599609375, -6.50927734375, -6.303955078125, -6.0986328125, -5.893310546875, -5.68798828125, -5.482666015625, -5.27734375, -5.072021484375, -4.86669921875, -4.661376953125, -4.4560546875, -4.250732421875, -4.04541015625, -3.840087890625, -3.634765625, -3.429443359375, -3.22412109375, -3.018798828125, -2.8134765625, -2.608154296875, -2.40283203125, -2.197509765625, -1.9921875, -1.786865234375, -1.58154296875, -1.376220703125, -1.1708984375, -0.965576171875, -0.76025390625, -0.554931640625, -0.349609375, -0.144287109375, 0.06103515625, 0.266357421875, 0.4716796875, 0.677001953125, 0.88232421875, 1.087646484375, 1.29296875, 1.498291015625, 1.70361328125, 1.908935546875, 2.1142578125, 2.319580078125, 2.52490234375, 2.730224609375, 2.935546875, 3.140869140625, 3.34619140625, 3.551513671875, 3.7568359375, 3.962158203125, 4.16748046875, 4.372802734375, 4.578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 8.0, 7.0, 16.0, 16.0, 34.0, 63.0, 88.0, 218.0, 497.0, 1613.0, 7467.0, 102176.0, 897916.0, 32676.0, 3981.0, 1044.0, 378.0, 153.0, 86.0, 31.0, 26.0, 18.0, 7.0, 8.0, 2.0, 7.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.5665435791015625, -1.525665283203125, -1.4847869873046875, -1.44390869140625, -1.4030303955078125, -1.362152099609375, -1.3212738037109375, -1.2803955078125, -1.2395172119140625, -1.198638916015625, -1.1577606201171875, -1.11688232421875, -1.0760040283203125, -1.035125732421875, -0.9942474365234375, -0.953369140625, -0.9124908447265625, -0.871612548828125, -0.8307342529296875, -0.78985595703125, -0.7489776611328125, -0.708099365234375, -0.6672210693359375, -0.6263427734375, -0.5854644775390625, -0.544586181640625, -0.5037078857421875, -0.46282958984375, -0.4219512939453125, -0.381072998046875, -0.3401947021484375, -0.29931640625, -0.2584381103515625, -0.217559814453125, -0.1766815185546875, -0.13580322265625, -0.0949249267578125, -0.054046630859375, -0.0131683349609375, 0.0277099609375, 0.0685882568359375, 0.109466552734375, 0.1503448486328125, 0.19122314453125, 0.2321014404296875, 0.272979736328125, 0.3138580322265625, 0.354736328125, 0.3956146240234375, 0.436492919921875, 0.4773712158203125, 0.51824951171875, 0.5591278076171875, 0.600006103515625, 0.6408843994140625, 0.6817626953125, 0.7226409912109375, 0.763519287109375, 0.8043975830078125, 0.84527587890625, 0.8861541748046875, 0.927032470703125, 0.9679107666015625, 1.0087890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 9.0, 15.0, 19.0, 21.0, 35.0, 49.0, 88.0, 151.0, 285.0, 95.0, 67.0, 49.0, 36.0, 26.0, 8.0, 6.0, 8.0, 11.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.801650255918503e-05, -8.370541036128998e-05, -7.939431816339493e-05, -7.508322596549988e-05, -7.077213376760483e-05, -6.646104156970978e-05, -6.214994937181473e-05, -5.783885717391968e-05, -5.352776497602463e-05, -4.921667277812958e-05, -4.490558058023453e-05, -4.059448838233948e-05, -3.628339618444443e-05, -3.197230398654938e-05, -2.7661211788654327e-05, -2.3350119590759277e-05, -1.9039027392864227e-05, -1.4727935194969177e-05, -1.0416842997074127e-05, -6.105750799179077e-06, -1.794658601284027e-06, 2.516433596611023e-06, 6.827525794506073e-06, 1.1138617992401123e-05, 1.5449710190296173e-05, 1.9760802388191223e-05, 2.4071894586086273e-05, 2.8382986783981323e-05, 3.269407898187637e-05, 3.700517117977142e-05, 4.1316263377666473e-05, 4.5627355575561523e-05, 4.9938447773456573e-05, 5.4249539971351624e-05, 5.8560632169246674e-05, 6.287172436714172e-05, 6.718281656503677e-05, 7.149390876293182e-05, 7.580500096082687e-05, 8.011609315872192e-05, 8.442718535661697e-05, 8.873827755451202e-05, 9.304936975240707e-05, 9.736046195030212e-05, 0.00010167155414819717, 0.00010598264634609222, 0.00011029373854398727, 0.00011460483074188232, 0.00011891592293977737, 0.00012322701513767242, 0.00012753810733556747, 0.00013184919953346252, 0.00013616029173135757, 0.00014047138392925262, 0.00014478247612714767, 0.00014909356832504272, 0.00015340466052293777, 0.00015771575272083282, 0.00016202684491872787, 0.00016633793711662292, 0.00017064902931451797, 0.00017496012151241302, 0.00017927121371030807, 0.00018358230590820312]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 10.0, 13.0, 15.0, 19.0, 28.0, 35.0, 89.0, 132.0, 263.0, 530.0, 1250.0, 3825.0, 15934.0, 136778.0, 819117.0, 57081.0, 9086.0, 2514.0, 885.0, 397.0, 192.0, 122.0, 64.0, 41.0, 35.0, 12.0, 19.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.9699935913085938, -0.9399871826171875, -0.9099807739257812, -0.879974365234375, -0.8499679565429688, -0.8199615478515625, -0.7899551391601562, -0.75994873046875, -0.7299423217773438, -0.6999359130859375, -0.6699295043945312, -0.639923095703125, -0.6099166870117188, -0.5799102783203125, -0.5499038696289062, -0.5198974609375, -0.48989105224609375, -0.4598846435546875, -0.42987823486328125, -0.399871826171875, -0.36986541748046875, -0.3398590087890625, -0.30985260009765625, -0.27984619140625, -0.24983978271484375, -0.2198333740234375, -0.18982696533203125, -0.159820556640625, -0.12981414794921875, -0.0998077392578125, -0.06980133056640625, -0.039794921875, -0.00978851318359375, 0.0202178955078125, 0.05022430419921875, 0.080230712890625, 0.11023712158203125, 0.1402435302734375, 0.17024993896484375, 0.20025634765625, 0.23026275634765625, 0.2602691650390625, 0.29027557373046875, 0.320281982421875, 0.35028839111328125, 0.3802947998046875, 0.41030120849609375, 0.4403076171875, 0.47031402587890625, 0.5003204345703125, 0.5303268432617188, 0.560333251953125, 0.5903396606445312, 0.6203460693359375, 0.6503524780273438, 0.68035888671875, 0.7103652954101562, 0.7403717041015625, 0.7703781127929688, 0.800384521484375, 0.8303909301757812, 0.8603973388671875, 0.8904037475585938, 0.92041015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 7.0, 9.0, 14.0, 21.0, 27.0, 42.0, 55.0, 75.0, 156.0, 249.0, 90.0, 64.0, 28.0, 38.0, 22.0, 17.0, 15.0, 14.0, 13.0, 6.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.467041015625, -0.45481109619140625, -0.4425811767578125, -0.43035125732421875, -0.418121337890625, -0.40589141845703125, -0.3936614990234375, -0.38143157958984375, -0.36920166015625, -0.35697174072265625, -0.3447418212890625, -0.33251190185546875, -0.320281982421875, -0.30805206298828125, -0.2958221435546875, -0.28359222412109375, -0.2713623046875, -0.25913238525390625, -0.2469024658203125, -0.23467254638671875, -0.222442626953125, -0.21021270751953125, -0.1979827880859375, -0.18575286865234375, -0.17352294921875, -0.16129302978515625, -0.1490631103515625, -0.13683319091796875, -0.124603271484375, -0.11237335205078125, -0.1001434326171875, -0.08791351318359375, -0.07568359375, -0.06345367431640625, -0.0512237548828125, -0.03899383544921875, -0.026763916015625, -0.01453399658203125, -0.0023040771484375, 0.00992584228515625, 0.02215576171875, 0.03438568115234375, 0.0466156005859375, 0.05884552001953125, 0.071075439453125, 0.08330535888671875, 0.0955352783203125, 0.10776519775390625, 0.1199951171875, 0.13222503662109375, 0.1444549560546875, 0.15668487548828125, 0.168914794921875, 0.18114471435546875, 0.1933746337890625, 0.20560455322265625, 0.21783447265625, 0.23006439208984375, 0.2422943115234375, 0.25452423095703125, 0.266754150390625, 0.27898406982421875, 0.2912139892578125, 0.30344390869140625, 0.315673828125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 1.0, 8.0, 18.0, 27.0, 77.0, 273.0, 363.0, 138.0, 58.0, 20.0, 9.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.589208126068115, -7.057093143463135, -6.5249786376953125, -5.992863655090332, -5.460748672485352, -4.928633689880371, -4.396518707275391, -3.8644042015075684, -3.332289218902588, -2.8001742362976074, -2.268059492111206, -1.7359446287155151, -1.2038297653198242, -0.6717147827148438, -0.13960003852844238, 0.392514705657959, 0.9246296882629395, 1.4567445516586304, 1.9888594150543213, 2.5209741592407227, 3.053089141845703, 3.5852041244506836, 4.117319107055664, 4.649433612823486, 5.181548595428467, 5.713663578033447, 6.2457780838012695, 6.77789306640625, 7.3100080490112305, 7.842123031616211, 8.374238014221191, 8.906352996826172, 9.438467025756836, 9.970582008361816, 10.502696990966797, 11.034811973571777, 11.566926956176758, 12.099040985107422, 12.631155967712402, 13.163270950317383, 13.695385932922363, 14.227500915527344, 14.759615898132324, 15.291730880737305, 15.823844909667969, 16.355960845947266, 16.88807487487793, 17.420188903808594, 17.95230484008789, 18.484418869018555, 19.01653480529785, 19.548648834228516, 20.080764770507812, 20.612878799438477, 21.144994735717773, 21.677108764648438, 22.209224700927734, 22.7413387298584, 23.273454666137695, 23.80556869506836, 24.337684631347656, 24.86979866027832, 25.401914596557617, 25.93402862548828, 26.466142654418945]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 16.0, 16.0, 23.0, 25.0, 39.0, 48.0, 54.0, 76.0, 70.0, 63.0, 66.0, 72.0, 60.0, 65.0, 64.0, 45.0, 40.0, 32.0, 26.0, 19.0, 22.0, 18.0, 10.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.230571746826172, -16.753639221191406, -16.276704788208008, -15.799771308898926, -15.322837829589844, -14.845904350280762, -14.36897087097168, -13.892038345336914, -13.415103912353516, -12.938170433044434, -12.461236953735352, -11.98430347442627, -11.507369995117188, -11.030436515808105, -10.553503036499023, -10.076570510864258, -9.599637031555176, -9.122703552246094, -8.645770072937012, -8.16883659362793, -7.691903114318848, -7.214969635009766, -6.738036632537842, -6.26110315322876, -5.784169673919678, -5.307236194610596, -4.830302715301514, -4.35336971282959, -3.8764359951019287, -3.3995025157928467, -2.9225692749023438, -2.4456357955932617, -1.9687023162841797, -1.4917688369750977, -1.0148354768753052, -0.5379021167755127, -0.060968637466430664, 0.41596484184265137, 0.8928980827331543, 1.3698315620422363, 1.8467650413513184, 2.3236985206604004, 2.8006319999694824, 3.2775652408599854, 3.7544987201690674, 4.23143196105957, 4.708365440368652, 5.185298919677734, 5.662232398986816, 6.139165878295898, 6.6160993576049805, 7.0930328369140625, 7.5699663162231445, 8.046899795532227, 8.523832321166992, 9.00076675415039, 9.477699279785156, 9.954632759094238, 10.43156623840332, 10.908499717712402, 11.385433197021484, 11.862366676330566, 12.339300155639648, 12.816232681274414, 13.293167114257812]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 12.0, 27.0, 34.0, 58.0, 154.0, 284.0, 757.0, 2727.0, 17440.0, 675521.0, 3461447.0, 30030.0, 3997.0, 1056.0, 372.0, 155.0, 83.0, 43.0, 35.0, 12.0, 13.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82421875, -7.5948486328125, -7.365478515625, -7.1361083984375, -6.90673828125, -6.6773681640625, -6.447998046875, -6.2186279296875, -5.9892578125, -5.7598876953125, -5.530517578125, -5.3011474609375, -5.07177734375, -4.8424072265625, -4.613037109375, -4.3836669921875, -4.154296875, -3.9249267578125, -3.695556640625, -3.4661865234375, -3.23681640625, -3.0074462890625, -2.778076171875, -2.5487060546875, -2.3193359375, -2.0899658203125, -1.860595703125, -1.6312255859375, -1.40185546875, -1.1724853515625, -0.943115234375, -0.7137451171875, -0.484375, -0.2550048828125, -0.025634765625, 0.2037353515625, 0.43310546875, 0.6624755859375, 0.891845703125, 1.1212158203125, 1.3505859375, 1.5799560546875, 1.809326171875, 2.0386962890625, 2.26806640625, 2.4974365234375, 2.726806640625, 2.9561767578125, 3.185546875, 3.4149169921875, 3.644287109375, 3.8736572265625, 4.10302734375, 4.3323974609375, 4.561767578125, 4.7911376953125, 5.0205078125, 5.2498779296875, 5.479248046875, 5.7086181640625, 5.93798828125, 6.1673583984375, 6.396728515625, 6.6260986328125, 6.85546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 11.0, 12.0, 19.0, 14.0, 30.0, 38.0, 66.0, 77.0, 105.0, 110.0, 118.0, 99.0, 86.0, 62.0, 31.0, 27.0, 21.0, 16.0, 9.0, 10.0, 11.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.921875, -3.806793212890625, -3.69171142578125, -3.576629638671875, -3.4615478515625, -3.346466064453125, -3.23138427734375, -3.116302490234375, -3.001220703125, -2.886138916015625, -2.77105712890625, -2.655975341796875, -2.5408935546875, -2.425811767578125, -2.31072998046875, -2.195648193359375, -2.08056640625, -1.965484619140625, -1.85040283203125, -1.735321044921875, -1.6202392578125, -1.505157470703125, -1.39007568359375, -1.274993896484375, -1.159912109375, -1.044830322265625, -0.92974853515625, -0.814666748046875, -0.6995849609375, -0.584503173828125, -0.46942138671875, -0.354339599609375, -0.2392578125, -0.124176025390625, -0.00909423828125, 0.105987548828125, 0.2210693359375, 0.336151123046875, 0.45123291015625, 0.566314697265625, 0.681396484375, 0.796478271484375, 0.91156005859375, 1.026641845703125, 1.1417236328125, 1.256805419921875, 1.37188720703125, 1.486968994140625, 1.60205078125, 1.717132568359375, 1.83221435546875, 1.947296142578125, 2.0623779296875, 2.177459716796875, 2.29254150390625, 2.407623291015625, 2.522705078125, 2.637786865234375, 2.75286865234375, 2.867950439453125, 2.9830322265625, 3.098114013671875, 3.21319580078125, 3.328277587890625, 3.443359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 21.0, 40.0, 65.0, 129.0, 286.0, 827.0, 3805.0, 53785.0, 4045245.0, 83654.0, 4847.0, 947.0, 296.0, 137.0, 65.0, 33.0, 27.0, 10.0, 5.0, 9.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0546875, -10.7821044921875, -10.509521484375, -10.2369384765625, -9.96435546875, -9.6917724609375, -9.419189453125, -9.1466064453125, -8.8740234375, -8.6014404296875, -8.328857421875, -8.0562744140625, -7.78369140625, -7.5111083984375, -7.238525390625, -6.9659423828125, -6.693359375, -6.4207763671875, -6.148193359375, -5.8756103515625, -5.60302734375, -5.3304443359375, -5.057861328125, -4.7852783203125, -4.5126953125, -4.2401123046875, -3.967529296875, -3.6949462890625, -3.42236328125, -3.1497802734375, -2.877197265625, -2.6046142578125, -2.33203125, -2.0594482421875, -1.786865234375, -1.5142822265625, -1.24169921875, -0.9691162109375, -0.696533203125, -0.4239501953125, -0.1513671875, 0.1212158203125, 0.393798828125, 0.6663818359375, 0.93896484375, 1.2115478515625, 1.484130859375, 1.7567138671875, 2.029296875, 2.3018798828125, 2.574462890625, 2.8470458984375, 3.11962890625, 3.3922119140625, 3.664794921875, 3.9373779296875, 4.2099609375, 4.4825439453125, 4.755126953125, 5.0277099609375, 5.30029296875, 5.5728759765625, 5.845458984375, 6.1180419921875, 6.390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 10.0, 9.0, 16.0, 18.0, 21.0, 32.0, 53.0, 74.0, 119.0, 145.0, 289.0, 591.0, 1315.0, 559.0, 303.0, 142.0, 117.0, 63.0, 48.0, 39.0, 28.0, 18.0, 11.0, 10.0, 11.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8154296875, -0.7846832275390625, -0.753936767578125, -0.7231903076171875, -0.69244384765625, -0.6616973876953125, -0.630950927734375, -0.6002044677734375, -0.5694580078125, -0.5387115478515625, -0.507965087890625, -0.4772186279296875, -0.44647216796875, -0.4157257080078125, -0.384979248046875, -0.3542327880859375, -0.323486328125, -0.2927398681640625, -0.261993408203125, -0.2312469482421875, -0.20050048828125, -0.1697540283203125, -0.139007568359375, -0.1082611083984375, -0.0775146484375, -0.0467681884765625, -0.016021728515625, 0.0147247314453125, 0.04547119140625, 0.0762176513671875, 0.106964111328125, 0.1377105712890625, 0.16845703125, 0.1992034912109375, 0.229949951171875, 0.2606964111328125, 0.29144287109375, 0.3221893310546875, 0.352935791015625, 0.3836822509765625, 0.4144287109375, 0.4451751708984375, 0.475921630859375, 0.5066680908203125, 0.53741455078125, 0.5681610107421875, 0.598907470703125, 0.6296539306640625, 0.660400390625, 0.6911468505859375, 0.721893310546875, 0.7526397705078125, 0.78338623046875, 0.8141326904296875, 0.844879150390625, 0.8756256103515625, 0.9063720703125, 0.9371185302734375, 0.967864990234375, 0.9986114501953125, 1.02935791015625, 1.0601043701171875, 1.090850830078125, 1.1215972900390625, 1.15234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 11.0, 8.0, 22.0, 40.0, 52.0, 94.0, 105.0, 141.0, 168.0, 103.0, 91.0, 43.0, 30.0, 25.0, 11.0, 7.0, 8.0, 6.0, 3.0, 0.0, 7.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.091717720031738, -4.932479381561279, -4.77324104309082, -4.614002704620361, -4.454764366149902, -4.295525550842285, -4.136287689208984, -3.977048873901367, -3.817810535430908, -3.658572196960449, -3.4993338584899902, -3.3400955200195312, -3.180856943130493, -3.021618604660034, -2.862380266189575, -2.703141689300537, -2.5439035892486572, -2.3846652507781982, -2.2254269123077393, -2.066188335418701, -1.9069499969482422, -1.7477116584777832, -1.5884733200073242, -1.4292348623275757, -1.2699965238571167, -1.1107581853866577, -0.9515197277069092, -0.7922813892364502, -0.6330429911613464, -0.4738045930862427, -0.3145662546157837, -0.15532779693603516, 0.003910541534423828, 0.1631489247083664, 0.32238730788230896, 0.48162567615509033, 0.6408640742301941, 0.8001024723052979, 0.9593408107757568, 1.1185792684555054, 1.2778176069259644, 1.4370559453964233, 1.5962944030761719, 1.7555327415466309, 1.9147710800170898, 2.074009418487549, 2.233247756958008, 2.392486333847046, 2.551724672317505, 2.710963010787964, 2.870201349258423, 3.029439926147461, 3.18867826461792, 3.347916603088379, 3.507154941558838, 3.666393280029297, 3.825631618499756, 3.984869956970215, 4.144108295440674, 4.303346633911133, 4.462584972381592, 4.621823310852051, 4.781062126159668, 4.940300464630127, 5.099538803100586]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 15.0, 18.0, 22.0, 36.0, 37.0, 54.0, 54.0, 61.0, 68.0, 74.0, 76.0, 97.0, 76.0, 65.0, 47.0, 36.0, 33.0, 22.0, 13.0, 20.0, 13.0, 11.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.7531285285949707, -3.6427433490753174, -3.532357931137085, -3.4219727516174316, -3.311587333679199, -3.201202154159546, -3.0908169746398926, -2.98043155670166, -2.8700461387634277, -2.7596609592437744, -2.649275541305542, -2.5388903617858887, -2.4285049438476562, -2.318119764328003, -2.2077345848083496, -2.097349166870117, -1.9869639873504639, -1.876578688621521, -1.7661933898925781, -1.6558082103729248, -1.5454227924346924, -1.435037612915039, -1.3246523141860962, -1.2142670154571533, -1.1038817167282104, -0.9934964179992676, -0.8831111192703247, -0.7727258801460266, -0.6623405814170837, -0.5519552826881409, -0.4415700435638428, -0.3311847448348999, -0.22079920768737793, -0.11041392385959625, -2.8640031814575195e-05, 0.11035662889480591, 0.22074192762374878, 0.33112722635269165, 0.44151246547698975, 0.5518977642059326, 0.6622830629348755, 0.7726683616638184, 0.8830536603927612, 0.9934388995170593, 1.1038241386413574, 1.2142095565795898, 1.3245947360992432, 1.434980034828186, 1.545365333557129, 1.6557506322860718, 1.7661359310150146, 1.876521110534668, 1.9869065284729004, 2.0972917079925537, 2.207676887512207, 2.3180623054504395, 2.428447723388672, 2.538832902908325, 2.6492183208465576, 2.759603500366211, 2.8699889183044434, 2.9803740978240967, 3.09075927734375, 3.2011446952819824, 3.3115298748016357]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 7.0, 13.0, 22.0, 18.0, 24.0, 53.0, 85.0, 103.0, 178.0, 313.0, 609.0, 1403.0, 4541.0, 20745.0, 343073.0, 637205.0, 31047.0, 5651.0, 1760.0, 754.0, 373.0, 210.0, 121.0, 64.0, 51.0, 36.0, 23.0, 16.0, 9.0, 10.0, 3.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.45671844482421875, -0.4424896240234375, -0.42826080322265625, -0.414031982421875, -0.39980316162109375, -0.3855743408203125, -0.37134552001953125, -0.35711669921875, -0.34288787841796875, -0.3286590576171875, -0.31443023681640625, -0.300201416015625, -0.28597259521484375, -0.2717437744140625, -0.25751495361328125, -0.2432861328125, -0.22905731201171875, -0.2148284912109375, -0.20059967041015625, -0.186370849609375, -0.17214202880859375, -0.1579132080078125, -0.14368438720703125, -0.12945556640625, -0.11522674560546875, -0.1009979248046875, -0.08676910400390625, -0.072540283203125, -0.05831146240234375, -0.0440826416015625, -0.02985382080078125, -0.015625, -0.00139617919921875, 0.0128326416015625, 0.02706146240234375, 0.041290283203125, 0.05551910400390625, 0.0697479248046875, 0.08397674560546875, 0.09820556640625, 0.11243438720703125, 0.1266632080078125, 0.14089202880859375, 0.155120849609375, 0.16934967041015625, 0.1835784912109375, 0.19780731201171875, 0.2120361328125, 0.22626495361328125, 0.2404937744140625, 0.25472259521484375, 0.268951416015625, 0.28318023681640625, 0.2974090576171875, 0.31163787841796875, 0.32586669921875, 0.34009552001953125, 0.3543243408203125, 0.36855316162109375, 0.382781982421875, 0.39701080322265625, 0.4112396240234375, 0.42546844482421875, 0.439697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 12.0, 26.0, 24.0, 44.0, 59.0, 72.0, 78.0, 92.0, 117.0, 100.0, 93.0, 68.0, 51.0, 46.0, 22.0, 14.0, 13.0, 11.0, 9.0, 11.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.811981201171875, -2.71380615234375, -2.615631103515625, -2.5174560546875, -2.419281005859375, -2.32110595703125, -2.222930908203125, -2.124755859375, -2.026580810546875, -1.92840576171875, -1.830230712890625, -1.7320556640625, -1.633880615234375, -1.53570556640625, -1.437530517578125, -1.33935546875, -1.241180419921875, -1.14300537109375, -1.044830322265625, -0.9466552734375, -0.848480224609375, -0.75030517578125, -0.652130126953125, -0.553955078125, -0.455780029296875, -0.35760498046875, -0.259429931640625, -0.1612548828125, -0.063079833984375, 0.03509521484375, 0.133270263671875, 0.2314453125, 0.329620361328125, 0.42779541015625, 0.525970458984375, 0.6241455078125, 0.722320556640625, 0.82049560546875, 0.918670654296875, 1.016845703125, 1.115020751953125, 1.21319580078125, 1.311370849609375, 1.4095458984375, 1.507720947265625, 1.60589599609375, 1.704071044921875, 1.80224609375, 1.900421142578125, 1.99859619140625, 2.096771240234375, 2.1949462890625, 2.293121337890625, 2.39129638671875, 2.489471435546875, 2.587646484375, 2.685821533203125, 2.78399658203125, 2.882171630859375, 2.9803466796875, 3.078521728515625, 3.17669677734375, 3.274871826171875, 3.373046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 15.0, 18.0, 24.0, 32.0, 48.0, 48.0, 59.0, 101.0, 159.0, 248.0, 470.0, 1520.0, 13970.0, 567435.0, 451236.0, 10684.0, 1297.0, 456.0, 202.0, 130.0, 93.0, 84.0, 48.0, 38.0, 22.0, 19.0, 15.0, 12.0, 8.0, 8.0, 7.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4151115417480469, -0.40077972412109375, -0.3864479064941406, -0.3721160888671875, -0.3577842712402344, -0.34345245361328125, -0.3291206359863281, -0.314788818359375, -0.3004570007324219, -0.28612518310546875, -0.2717933654785156, -0.2574615478515625, -0.24312973022460938, -0.22879791259765625, -0.21446609497070312, -0.20013427734375, -0.18580245971679688, -0.17147064208984375, -0.15713882446289062, -0.1428070068359375, -0.12847518920898438, -0.11414337158203125, -0.09981155395507812, -0.085479736328125, -0.07114791870117188, -0.05681610107421875, -0.042484283447265625, -0.0281524658203125, -0.013820648193359375, 0.00051116943359375, 0.014842987060546875, 0.0291748046875, 0.043506622314453125, 0.05783843994140625, 0.07217025756835938, 0.0865020751953125, 0.10083389282226562, 0.11516571044921875, 0.12949752807617188, 0.143829345703125, 0.15816116333007812, 0.17249298095703125, 0.18682479858398438, 0.2011566162109375, 0.21548843383789062, 0.22982025146484375, 0.24415206909179688, 0.25848388671875, 0.2728157043457031, 0.28714752197265625, 0.3014793395996094, 0.3158111572265625, 0.3301429748535156, 0.34447479248046875, 0.3588066101074219, 0.373138427734375, 0.3874702453613281, 0.40180206298828125, 0.4161338806152344, 0.4304656982421875, 0.4447975158691406, 0.45912933349609375, 0.4734611511230469, 0.48779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 12.0, 7.0, 7.0, 15.0, 24.0, 27.0, 25.0, 21.0, 30.0, 33.0, 30.0, 34.0, 31.0, 32.0, 42.0, 45.0, 40.0, 44.0, 46.0, 41.0, 40.0, 45.0, 37.0, 35.0, 20.0, 24.0, 24.0, 26.0, 17.0, 17.0, 22.0, 13.0, 11.0, 7.0, 8.0, 4.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.7933349609375, -2.701904296875, -2.6104736328125, -2.51904296875, -2.4276123046875, -2.336181640625, -2.2447509765625, -2.1533203125, -2.0618896484375, -1.970458984375, -1.8790283203125, -1.78759765625, -1.6961669921875, -1.604736328125, -1.5133056640625, -1.421875, -1.3304443359375, -1.239013671875, -1.1475830078125, -1.05615234375, -0.9647216796875, -0.873291015625, -0.7818603515625, -0.6904296875, -0.5989990234375, -0.507568359375, -0.4161376953125, -0.32470703125, -0.2332763671875, -0.141845703125, -0.0504150390625, 0.041015625, 0.1324462890625, 0.223876953125, 0.3153076171875, 0.40673828125, 0.4981689453125, 0.589599609375, 0.6810302734375, 0.7724609375, 0.8638916015625, 0.955322265625, 1.0467529296875, 1.13818359375, 1.2296142578125, 1.321044921875, 1.4124755859375, 1.50390625, 1.5953369140625, 1.686767578125, 1.7781982421875, 1.86962890625, 1.9610595703125, 2.052490234375, 2.1439208984375, 2.2353515625, 2.3267822265625, 2.418212890625, 2.5096435546875, 2.60107421875, 2.6925048828125, 2.783935546875, 2.8753662109375, 2.966796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 11.0, 17.0, 24.0, 53.0, 163.0, 471.0, 2773.0, 1041627.0, 2813.0, 388.0, 100.0, 43.0, 29.0, 14.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.30068206787109375, -0.2878875732421875, -0.27509307861328125, -0.262298583984375, -0.24950408935546875, -0.2367095947265625, -0.22391510009765625, -0.21112060546875, -0.19832611083984375, -0.1855316162109375, -0.17273712158203125, -0.159942626953125, -0.14714813232421875, -0.1343536376953125, -0.12155914306640625, -0.1087646484375, -0.09597015380859375, -0.0831756591796875, -0.07038116455078125, -0.057586669921875, -0.04479217529296875, -0.0319976806640625, -0.01920318603515625, -0.00640869140625, 0.00638580322265625, 0.0191802978515625, 0.03197479248046875, 0.044769287109375, 0.05756378173828125, 0.0703582763671875, 0.08315277099609375, 0.095947265625, 0.10874176025390625, 0.1215362548828125, 0.13433074951171875, 0.147125244140625, 0.15991973876953125, 0.1727142333984375, 0.18550872802734375, 0.19830322265625, 0.21109771728515625, 0.2238922119140625, 0.23668670654296875, 0.249481201171875, 0.26227569580078125, 0.2750701904296875, 0.28786468505859375, 0.3006591796875, 0.31345367431640625, 0.3262481689453125, 0.33904266357421875, 0.351837158203125, 0.36463165283203125, 0.3774261474609375, 0.39022064208984375, 0.40301513671875, 0.41580963134765625, 0.4286041259765625, 0.44139862060546875, 0.454193115234375, 0.46698760986328125, 0.4797821044921875, 0.49257659912109375, 0.50537109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 10.0, 8.0, 20.0, 33.0, 70.0, 136.0, 175.0, 192.0, 134.0, 77.0, 55.0, 25.0, 17.0, 15.0, 14.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.638599395751953e-05, -5.504675209522247e-05, -5.3707510232925415e-05, -5.236826837062836e-05, -5.10290265083313e-05, -4.968978464603424e-05, -4.835054278373718e-05, -4.7011300921440125e-05, -4.5672059059143066e-05, -4.433281719684601e-05, -4.299357533454895e-05, -4.165433347225189e-05, -4.0315091609954834e-05, -3.8975849747657776e-05, -3.763660788536072e-05, -3.629736602306366e-05, -3.49581241607666e-05, -3.3618882298469543e-05, -3.2279640436172485e-05, -3.094039857387543e-05, -2.960115671157837e-05, -2.826191484928131e-05, -2.6922672986984253e-05, -2.5583431124687195e-05, -2.4244189262390137e-05, -2.290494740009308e-05, -2.156570553779602e-05, -2.0226463675498962e-05, -1.8887221813201904e-05, -1.7547979950904846e-05, -1.6208738088607788e-05, -1.486949622631073e-05, -1.3530254364013672e-05, -1.2191012501716614e-05, -1.0851770639419556e-05, -9.512528777122498e-06, -8.17328691482544e-06, -6.834045052528381e-06, -5.494803190231323e-06, -4.155561327934265e-06, -2.816319465637207e-06, -1.477077603340149e-06, -1.3783574104309082e-07, 1.2014061212539673e-06, 2.5406479835510254e-06, 3.8798898458480835e-06, 5.219131708145142e-06, 6.5583735704422e-06, 7.897615432739258e-06, 9.236857295036316e-06, 1.0576099157333374e-05, 1.1915341019630432e-05, 1.325458288192749e-05, 1.4593824744224548e-05, 1.5933066606521606e-05, 1.7272308468818665e-05, 1.8611550331115723e-05, 1.995079219341278e-05, 2.129003405570984e-05, 2.2629275918006897e-05, 2.3968517780303955e-05, 2.5307759642601013e-05, 2.664700150489807e-05, 2.798624336719513e-05, 2.9325485229492188e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 8.0, 15.0, 24.0, 41.0, 55.0, 127.0, 214.0, 533.0, 2383.0, 152376.0, 888482.0, 3145.0, 593.0, 260.0, 127.0, 59.0, 39.0, 24.0, 17.0, 6.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2529296875, -0.24196243286132812, -0.23099517822265625, -0.22002792358398438, -0.2090606689453125, -0.19809341430664062, -0.18712615966796875, -0.17615890502929688, -0.165191650390625, -0.15422439575195312, -0.14325714111328125, -0.13228988647460938, -0.1213226318359375, -0.11035537719726562, -0.09938812255859375, -0.08842086791992188, -0.07745361328125, -0.06648635864257812, -0.05551910400390625, -0.044551849365234375, -0.0335845947265625, -0.022617340087890625, -0.01165008544921875, -0.000682830810546875, 0.010284423828125, 0.021251678466796875, 0.03221893310546875, 0.043186187744140625, 0.0541534423828125, 0.06512069702148438, 0.07608795166015625, 0.08705520629882812, 0.0980224609375, 0.10898971557617188, 0.11995697021484375, 0.13092422485351562, 0.1418914794921875, 0.15285873413085938, 0.16382598876953125, 0.17479324340820312, 0.185760498046875, 0.19672775268554688, 0.20769500732421875, 0.21866226196289062, 0.2296295166015625, 0.24059677124023438, 0.25156402587890625, 0.2625312805175781, 0.27349853515625, 0.2844657897949219, 0.29543304443359375, 0.3064002990722656, 0.3173675537109375, 0.3283348083496094, 0.33930206298828125, 0.3502693176269531, 0.361236572265625, 0.3722038269042969, 0.38317108154296875, 0.3941383361816406, 0.4051055908203125, 0.4160728454589844, 0.42704010009765625, 0.4380073547363281, 0.448974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 12.0, 19.0, 34.0, 334.0, 518.0, 36.0, 21.0, 12.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12443161010742188, -0.12178802490234375, -0.11914443969726562, -0.1165008544921875, -0.11385726928710938, -0.11121368408203125, -0.10857009887695312, -0.105926513671875, -0.10328292846679688, -0.10063934326171875, -0.09799575805664062, -0.0953521728515625, -0.09270858764648438, -0.09006500244140625, -0.08742141723632812, -0.08477783203125, -0.08213424682617188, -0.07949066162109375, -0.07684707641601562, -0.0742034912109375, -0.07155990600585938, -0.06891632080078125, -0.06627273559570312, -0.063629150390625, -0.060985565185546875, -0.05834197998046875, -0.055698394775390625, -0.0530548095703125, -0.050411224365234375, -0.04776763916015625, -0.045124053955078125, -0.04248046875, -0.039836883544921875, -0.03719329833984375, -0.034549713134765625, -0.0319061279296875, -0.029262542724609375, -0.02661895751953125, -0.023975372314453125, -0.021331787109375, -0.018688201904296875, -0.01604461669921875, -0.013401031494140625, -0.0107574462890625, -0.008113861083984375, -0.00547027587890625, -0.002826690673828125, -0.00018310546875, 0.002460479736328125, 0.00510406494140625, 0.007747650146484375, 0.0103912353515625, 0.013034820556640625, 0.01567840576171875, 0.018321990966796875, 0.020965576171875, 0.023609161376953125, 0.02625274658203125, 0.028896331787109375, 0.0315399169921875, 0.034183502197265625, 0.03682708740234375, 0.039470672607421875, 0.0421142578125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 16.0, 19.0, 46.0, 77.0, 121.0, 182.0, 194.0, 137.0, 68.0, 42.0, 33.0, 8.0, 9.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8529906272888184, -3.7201764583587646, -3.58736252784729, -3.4545483589172363, -3.3217344284057617, -3.188920259475708, -3.0561060905456543, -2.9232921600341797, -2.790477991104126, -2.6576638221740723, -2.5248498916625977, -2.392035722732544, -2.2592215538024902, -2.1264076232910156, -1.993593454360962, -1.8607794046401978, -1.7279653549194336, -1.5951513051986694, -1.4623372554779053, -1.3295230865478516, -1.1967090368270874, -1.0638949871063232, -0.9310808777809143, -0.7982667684555054, -0.6654527187347412, -0.532638669013977, -0.3998245596885681, -0.26701048016548157, -0.13419640064239502, -0.0013823509216308594, 0.13143175840377808, 0.264245867729187, 0.3970603942871094, 0.5298744440078735, 0.6626885533332825, 0.7955026626586914, 0.9283167123794556, 1.0611307621002197, 1.1939449310302734, 1.3267589807510376, 1.4595730304718018, 1.592387080192566, 1.72520112991333, 1.8580152988433838, 1.990829348564148, 2.123643398284912, 2.256457567214966, 2.3892717361450195, 2.522085666656494, 2.654899835586548, 2.7877137660980225, 2.920527935028076, 3.053341865539551, 3.1861560344696045, 3.318970203399658, 3.451784133911133, 3.5845983028411865, 3.7174124717712402, 3.850226402282715, 3.9830405712127686, 4.115854740142822, 4.248668670654297, 4.3814826011657715, 4.514297008514404, 4.647110939025879]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 12.0, 24.0, 16.0, 23.0, 40.0, 52.0, 62.0, 74.0, 75.0, 92.0, 90.0, 101.0, 89.0, 55.0, 37.0, 45.0, 17.0, 18.0, 15.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6858091354370117, -2.6021041870117188, -2.5183990001678467, -2.4346940517425537, -2.3509888648986816, -2.2672839164733887, -2.1835789680480957, -2.0998737812042236, -2.0161685943603516, -1.932463526725769, -1.8487584590911865, -1.7650535106658936, -1.6813483238220215, -1.5976433753967285, -1.513938307762146, -1.4302332401275635, -1.3465282917022705, -1.262823224067688, -1.1791181564331055, -1.0954132080078125, -1.0117080211639404, -0.9280030131340027, -0.8442980051040649, -0.7605929374694824, -0.6768878698348999, -0.5931828022003174, -0.5094777345657349, -0.4257727265357971, -0.3420676589012146, -0.2583625912666321, -0.17465758323669434, -0.09095251560211182, -0.007247447967529297, 0.07645760476589203, 0.16016265749931335, 0.2438676953315735, 0.327572762966156, 0.4112778306007385, 0.49498283863067627, 0.5786879062652588, 0.6623929738998413, 0.7460980415344238, 0.8298031091690063, 0.9135081171989441, 0.9972131848335266, 1.080918312072754, 1.1646232604980469, 1.2483283281326294, 1.332033395767212, 1.4157384634017944, 1.499443531036377, 1.58314847946167, 1.666853666305542, 1.750558614730835, 1.8342636823654175, 1.91796875, 2.001673698425293, 2.085378646850586, 2.169083833694458, 2.252788782119751, 2.336493968963623, 2.420198917388916, 2.503903865814209, 2.587609052658081, 2.671314239501953]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 5.0, 16.0, 12.0, 24.0, 18.0, 38.0, 62.0, 70.0, 103.0, 173.0, 240.0, 438.0, 661.0, 1159.0, 2052.0, 4002.0, 8342.0, 20316.0, 63052.0, 420412.0, 425919.0, 63402.0, 20504.0, 8459.0, 3986.0, 2064.0, 1166.0, 682.0, 369.0, 264.0, 164.0, 119.0, 65.0, 55.0, 35.0, 22.0, 18.0, 14.0, 16.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.701171875, -1.64447021484375, -1.5877685546875, -1.53106689453125, -1.474365234375, -1.41766357421875, -1.3609619140625, -1.30426025390625, -1.24755859375, -1.19085693359375, -1.1341552734375, -1.07745361328125, -1.020751953125, -0.96405029296875, -0.9073486328125, -0.85064697265625, -0.7939453125, -0.73724365234375, -0.6805419921875, -0.62384033203125, -0.567138671875, -0.51043701171875, -0.4537353515625, -0.39703369140625, -0.34033203125, -0.28363037109375, -0.2269287109375, -0.17022705078125, -0.113525390625, -0.05682373046875, -0.0001220703125, 0.05657958984375, 0.11328125, 0.16998291015625, 0.2266845703125, 0.28338623046875, 0.340087890625, 0.39678955078125, 0.4534912109375, 0.51019287109375, 0.56689453125, 0.62359619140625, 0.6802978515625, 0.73699951171875, 0.793701171875, 0.85040283203125, 0.9071044921875, 0.96380615234375, 1.0205078125, 1.07720947265625, 1.1339111328125, 1.19061279296875, 1.247314453125, 1.30401611328125, 1.3607177734375, 1.41741943359375, 1.47412109375, 1.53082275390625, 1.5875244140625, 1.64422607421875, 1.700927734375, 1.75762939453125, 1.8143310546875, 1.87103271484375, 1.927734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 17.0, 14.0, 28.0, 43.0, 54.0, 52.0, 68.0, 66.0, 90.0, 89.0, 92.0, 65.0, 73.0, 47.0, 35.0, 24.0, 23.0, 18.0, 13.0, 13.0, 9.0, 4.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39178466796875, -4.2366943359375, -4.08160400390625, -3.926513671875, -3.77142333984375, -3.6163330078125, -3.46124267578125, -3.30615234375, -3.15106201171875, -2.9959716796875, -2.84088134765625, -2.685791015625, -2.53070068359375, -2.3756103515625, -2.22052001953125, -2.0654296875, -1.91033935546875, -1.7552490234375, -1.60015869140625, -1.445068359375, -1.28997802734375, -1.1348876953125, -0.97979736328125, -0.82470703125, -0.66961669921875, -0.5145263671875, -0.35943603515625, -0.204345703125, -0.04925537109375, 0.1058349609375, 0.26092529296875, 0.416015625, 0.57110595703125, 0.7261962890625, 0.88128662109375, 1.036376953125, 1.19146728515625, 1.3465576171875, 1.50164794921875, 1.65673828125, 1.81182861328125, 1.9669189453125, 2.12200927734375, 2.277099609375, 2.43218994140625, 2.5872802734375, 2.74237060546875, 2.8974609375, 3.05255126953125, 3.2076416015625, 3.36273193359375, 3.517822265625, 3.67291259765625, 3.8280029296875, 3.98309326171875, 4.13818359375, 4.29327392578125, 4.4483642578125, 4.60345458984375, 4.758544921875, 4.91363525390625, 5.0687255859375, 5.22381591796875, 5.37890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 10.0, 18.0, 25.0, 29.0, 29.0, 46.0, 55.0, 85.0, 104.0, 137.0, 212.0, 342.0, 582.0, 1362.0, 5242.0, 37042.0, 851899.0, 135123.0, 11589.0, 2359.0, 842.0, 429.0, 287.0, 202.0, 134.0, 89.0, 74.0, 40.0, 40.0, 28.0, 31.0, 10.0, 12.0, 9.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.517578125, -3.416290283203125, -3.31500244140625, -3.213714599609375, -3.1124267578125, -3.011138916015625, -2.90985107421875, -2.808563232421875, -2.707275390625, -2.605987548828125, -2.50469970703125, -2.403411865234375, -2.3021240234375, -2.200836181640625, -2.09954833984375, -1.998260498046875, -1.89697265625, -1.795684814453125, -1.69439697265625, -1.593109130859375, -1.4918212890625, -1.390533447265625, -1.28924560546875, -1.187957763671875, -1.086669921875, -0.985382080078125, -0.88409423828125, -0.782806396484375, -0.6815185546875, -0.580230712890625, -0.47894287109375, -0.377655029296875, -0.2763671875, -0.175079345703125, -0.07379150390625, 0.027496337890625, 0.1287841796875, 0.230072021484375, 0.33135986328125, 0.432647705078125, 0.533935546875, 0.635223388671875, 0.73651123046875, 0.837799072265625, 0.9390869140625, 1.040374755859375, 1.14166259765625, 1.242950439453125, 1.34423828125, 1.445526123046875, 1.54681396484375, 1.648101806640625, 1.7493896484375, 1.850677490234375, 1.95196533203125, 2.053253173828125, 2.154541015625, 2.255828857421875, 2.35711669921875, 2.458404541015625, 2.5596923828125, 2.660980224609375, 2.76226806640625, 2.863555908203125, 2.96484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 7.0, 10.0, 6.0, 12.0, 8.0, 11.0, 23.0, 19.0, 24.0, 26.0, 37.0, 35.0, 40.0, 52.0, 55.0, 56.0, 58.0, 62.0, 54.0, 41.0, 62.0, 40.0, 48.0, 34.0, 37.0, 22.0, 18.0, 23.0, 23.0, 10.0, 14.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.79296875, -4.64007568359375, -4.4871826171875, -4.33428955078125, -4.181396484375, -4.02850341796875, -3.8756103515625, -3.72271728515625, -3.56982421875, -3.41693115234375, -3.2640380859375, -3.11114501953125, -2.958251953125, -2.80535888671875, -2.6524658203125, -2.49957275390625, -2.3466796875, -2.19378662109375, -2.0408935546875, -1.88800048828125, -1.735107421875, -1.58221435546875, -1.4293212890625, -1.27642822265625, -1.12353515625, -0.97064208984375, -0.8177490234375, -0.66485595703125, -0.511962890625, -0.35906982421875, -0.2061767578125, -0.05328369140625, 0.099609375, 0.25250244140625, 0.4053955078125, 0.55828857421875, 0.711181640625, 0.86407470703125, 1.0169677734375, 1.16986083984375, 1.32275390625, 1.47564697265625, 1.6285400390625, 1.78143310546875, 1.934326171875, 2.08721923828125, 2.2401123046875, 2.39300537109375, 2.5458984375, 2.69879150390625, 2.8516845703125, 3.00457763671875, 3.157470703125, 3.31036376953125, 3.4632568359375, 3.61614990234375, 3.76904296875, 3.92193603515625, 4.0748291015625, 4.22772216796875, 4.380615234375, 4.53350830078125, 4.6864013671875, 4.83929443359375, 4.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 15.0, 20.0, 35.0, 46.0, 120.0, 475.0, 2829.0, 131516.0, 907370.0, 5121.0, 677.0, 194.0, 50.0, 35.0, 17.0, 12.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.806793212890625, -4.68389892578125, -4.561004638671875, -4.4381103515625, -4.315216064453125, -4.19232177734375, -4.069427490234375, -3.946533203125, -3.823638916015625, -3.70074462890625, -3.577850341796875, -3.4549560546875, -3.332061767578125, -3.20916748046875, -3.086273193359375, -2.96337890625, -2.840484619140625, -2.71759033203125, -2.594696044921875, -2.4718017578125, -2.348907470703125, -2.22601318359375, -2.103118896484375, -1.980224609375, -1.857330322265625, -1.73443603515625, -1.611541748046875, -1.4886474609375, -1.365753173828125, -1.24285888671875, -1.119964599609375, -0.9970703125, -0.874176025390625, -0.75128173828125, -0.628387451171875, -0.5054931640625, -0.382598876953125, -0.25970458984375, -0.136810302734375, -0.013916015625, 0.108978271484375, 0.23187255859375, 0.354766845703125, 0.4776611328125, 0.600555419921875, 0.72344970703125, 0.846343994140625, 0.96923828125, 1.092132568359375, 1.21502685546875, 1.337921142578125, 1.4608154296875, 1.583709716796875, 1.70660400390625, 1.829498291015625, 1.952392578125, 2.075286865234375, 2.19818115234375, 2.321075439453125, 2.4439697265625, 2.566864013671875, 2.68975830078125, 2.812652587890625, 2.935546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 7.0, 16.0, 27.0, 28.0, 22.0, 33.0, 63.0, 130.0, 259.0, 159.0, 62.0, 40.0, 29.0, 21.0, 19.0, 20.0, 8.0, 13.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018334388732910156, -0.00017804093658924103, -0.0001727379858493805, -0.00016743503510951996, -0.00016213208436965942, -0.0001568291336297989, -0.00015152618288993835, -0.00014622323215007782, -0.00014092028141021729, -0.00013561733067035675, -0.00013031437993049622, -0.00012501142919063568, -0.00011970847845077515, -0.00011440552771091461, -0.00010910257697105408, -0.00010379962623119354, -9.849667549133301e-05, -9.319372475147247e-05, -8.789077401161194e-05, -8.25878232717514e-05, -7.728487253189087e-05, -7.198192179203033e-05, -6.66789710521698e-05, -6.137602031230927e-05, -5.607306957244873e-05, -5.0770118832588196e-05, -4.546716809272766e-05, -4.0164217352867126e-05, -3.486126661300659e-05, -2.9558315873146057e-05, -2.4255365133285522e-05, -1.8952414393424988e-05, -1.3649463653564453e-05, -8.346512913703918e-06, -3.043562173843384e-06, 2.259388566017151e-06, 7.5623393058776855e-06, 1.286529004573822e-05, 1.8168240785598755e-05, 2.347119152545929e-05, 2.8774142265319824e-05, 3.407709300518036e-05, 3.9380043745040894e-05, 4.468299448490143e-05, 4.998594522476196e-05, 5.52888959646225e-05, 6.059184670448303e-05, 6.589479744434357e-05, 7.11977481842041e-05, 7.650069892406464e-05, 8.180364966392517e-05, 8.71066004037857e-05, 9.240955114364624e-05, 9.771250188350677e-05, 0.00010301545262336731, 0.00010831840336322784, 0.00011362135410308838, 0.00011892430484294891, 0.00012422725558280945, 0.00012953020632266998, 0.00013483315706253052, 0.00014013610780239105, 0.0001454390585422516, 0.00015074200928211212, 0.00015604496002197266]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 15.0, 28.0, 60.0, 126.0, 326.0, 1337.0, 14282.0, 965597.0, 63070.0, 2884.0, 537.0, 148.0, 75.0, 27.0, 15.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.724853515625, -1.62158203125, -1.518310546875, -1.4150390625, -1.311767578125, -1.20849609375, -1.105224609375, -1.001953125, -0.898681640625, -0.79541015625, -0.692138671875, -0.5888671875, -0.485595703125, -0.38232421875, -0.279052734375, -0.17578125, -0.072509765625, 0.03076171875, 0.134033203125, 0.2373046875, 0.340576171875, 0.44384765625, 0.547119140625, 0.650390625, 0.753662109375, 0.85693359375, 0.960205078125, 1.0634765625, 1.166748046875, 1.27001953125, 1.373291015625, 1.4765625, 1.579833984375, 1.68310546875, 1.786376953125, 1.8896484375, 1.992919921875, 2.09619140625, 2.199462890625, 2.302734375, 2.406005859375, 2.50927734375, 2.612548828125, 2.7158203125, 2.819091796875, 2.92236328125, 3.025634765625, 3.12890625, 3.232177734375, 3.33544921875, 3.438720703125, 3.5419921875, 3.645263671875, 3.74853515625, 3.851806640625, 3.955078125, 4.058349609375, 4.16162109375, 4.264892578125, 4.3681640625, 4.471435546875, 4.57470703125, 4.677978515625, 4.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 22.0, 41.0, 41.0, 104.0, 529.0, 91.0, 54.0, 37.0, 26.0, 14.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.498046875, -1.4658050537109375, -1.433563232421875, -1.4013214111328125, -1.36907958984375, -1.3368377685546875, -1.304595947265625, -1.2723541259765625, -1.2401123046875, -1.2078704833984375, -1.175628662109375, -1.1433868408203125, -1.11114501953125, -1.0789031982421875, -1.046661376953125, -1.0144195556640625, -0.982177734375, -0.9499359130859375, -0.917694091796875, -0.8854522705078125, -0.85321044921875, -0.8209686279296875, -0.788726806640625, -0.7564849853515625, -0.7242431640625, -0.6920013427734375, -0.659759521484375, -0.6275177001953125, -0.59527587890625, -0.5630340576171875, -0.530792236328125, -0.4985504150390625, -0.46630859375, -0.4340667724609375, -0.401824951171875, -0.3695831298828125, -0.33734130859375, -0.3050994873046875, -0.272857666015625, -0.2406158447265625, -0.2083740234375, -0.1761322021484375, -0.143890380859375, -0.1116485595703125, -0.07940673828125, -0.0471649169921875, -0.014923095703125, 0.0173187255859375, 0.049560546875, 0.0818023681640625, 0.114044189453125, 0.1462860107421875, 0.17852783203125, 0.2107696533203125, 0.243011474609375, 0.2752532958984375, 0.3074951171875, 0.3397369384765625, 0.371978759765625, 0.4042205810546875, 0.43646240234375, 0.4687042236328125, 0.500946044921875, 0.5331878662109375, 0.5654296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 11.0, 10.0, 30.0, 74.0, 146.0, 263.0, 232.0, 111.0, 59.0, 30.0, 10.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.956765651702881, -7.55506706237793, -7.1533684730529785, -6.751669883728027, -6.349970817565918, -5.948272705078125, -5.546573638916016, -5.1448750495910645, -4.743176460266113, -4.341477870941162, -3.939779281616211, -3.5380804538726807, -3.1363818645477295, -2.7346832752227783, -2.332984447479248, -1.9312858581542969, -1.5295872688293457, -1.1278886795043945, -0.7261899709701538, -0.3244912624359131, 0.07720732688903809, 0.47890591621398926, 0.8806047439575195, 1.2823033332824707, 1.6840019226074219, 2.085700511932373, 2.487399101257324, 2.8890979290008545, 3.2907965183258057, 3.692495107650757, 4.094193935394287, 4.495892524719238, 4.897590637207031, 5.299289226531982, 5.700987815856934, 6.102686882019043, 6.504384994506836, 6.906084060668945, 7.3077826499938965, 7.709481239318848, 8.11117935180664, 8.51287841796875, 8.914576530456543, 9.316275596618652, 9.717973709106445, 10.119672775268555, 10.521371841430664, 10.923069953918457, 11.324769020080566, 11.726468086242676, 12.128166198730469, 12.529865264892578, 12.931563377380371, 13.33326244354248, 13.734960556030273, 14.136659622192383, 14.538358688354492, 14.940057754516602, 15.341755867004395, 15.743454933166504, 16.145153045654297, 16.546852111816406, 16.948551177978516, 17.350250244140625, 17.7519474029541]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 19.0, 12.0, 20.0, 10.0, 19.0, 18.0, 20.0, 24.0, 28.0, 40.0, 32.0, 40.0, 32.0, 41.0, 39.0, 34.0, 51.0, 43.0, 46.0, 35.0, 39.0, 48.0, 37.0, 32.0, 31.0, 25.0, 27.0, 18.0, 14.0, 15.0, 15.0, 16.0, 15.0, 4.0, 12.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.197763442993164, -5.985151290893555, -5.772539138793945, -5.559926509857178, -5.347314357757568, -5.134702205657959, -4.922089576721191, -4.709477424621582, -4.496865272521973, -4.284253120422363, -4.071640968322754, -3.8590283393859863, -3.646416187286377, -3.4338040351867676, -3.221191644668579, -3.0085792541503906, -2.7959671020507812, -2.583354949951172, -2.3707425594329834, -2.158130168914795, -1.9455180168151855, -1.7329057455062866, -1.5202934741973877, -1.3076812028884888, -1.0950689315795898, -0.8824566602706909, -0.669844388961792, -0.45723211765289307, -0.24461984634399414, -0.032007575035095215, 0.1806046962738037, 0.39321696758270264, 0.6058297157287598, 0.8184419870376587, 1.0310542583465576, 1.2436665296554565, 1.4562788009643555, 1.6688910722732544, 1.8815033435821533, 2.094115734100342, 2.306727886199951, 2.5193400382995605, 2.731952428817749, 2.9445648193359375, 3.157176971435547, 3.3697891235351562, 3.5824015140533447, 3.795013904571533, 4.007626056671143, 4.220238208770752, 4.4328508377075195, 4.645462989807129, 4.858075141906738, 5.070687294006348, 5.283299446105957, 5.495912075042725, 5.708524227142334, 5.921136379241943, 6.133749008178711, 6.34636116027832, 6.55897331237793, 6.771585464477539, 6.984197616577148, 7.196810245513916, 7.409422397613525]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 11.0, 16.0, 15.0, 14.0, 18.0, 30.0, 24.0, 35.0, 58.0, 92.0, 165.0, 356.0, 1154.0, 6310.0, 129744.0, 4008755.0, 42009.0, 3837.0, 872.0, 282.0, 130.0, 60.0, 57.0, 32.0, 21.0, 28.0, 18.0, 15.0, 14.0, 9.0, 9.0, 13.0, 7.0, 10.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4765625, -8.214599609375, -7.95263671875, -7.690673828125, -7.4287109375, -7.166748046875, -6.90478515625, -6.642822265625, -6.380859375, -6.118896484375, -5.85693359375, -5.594970703125, -5.3330078125, -5.071044921875, -4.80908203125, -4.547119140625, -4.28515625, -4.023193359375, -3.76123046875, -3.499267578125, -3.2373046875, -2.975341796875, -2.71337890625, -2.451416015625, -2.189453125, -1.927490234375, -1.66552734375, -1.403564453125, -1.1416015625, -0.879638671875, -0.61767578125, -0.355712890625, -0.09375, 0.168212890625, 0.43017578125, 0.692138671875, 0.9541015625, 1.216064453125, 1.47802734375, 1.739990234375, 2.001953125, 2.263916015625, 2.52587890625, 2.787841796875, 3.0498046875, 3.311767578125, 3.57373046875, 3.835693359375, 4.09765625, 4.359619140625, 4.62158203125, 4.883544921875, 5.1455078125, 5.407470703125, 5.66943359375, 5.931396484375, 6.193359375, 6.455322265625, 6.71728515625, 6.979248046875, 7.2412109375, 7.503173828125, 7.76513671875, 8.027099609375, 8.2890625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 19.0, 13.0, 19.0, 23.0, 29.0, 39.0, 49.0, 77.0, 87.0, 82.0, 94.0, 98.0, 93.0, 52.0, 49.0, 33.0, 31.0, 18.0, 18.0, 19.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.345703125, -3.253631591796875, -3.16156005859375, -3.069488525390625, -2.9774169921875, -2.885345458984375, -2.79327392578125, -2.701202392578125, -2.609130859375, -2.517059326171875, -2.42498779296875, -2.332916259765625, -2.2408447265625, -2.148773193359375, -2.05670166015625, -1.964630126953125, -1.87255859375, -1.780487060546875, -1.68841552734375, -1.596343994140625, -1.5042724609375, -1.412200927734375, -1.32012939453125, -1.228057861328125, -1.135986328125, -1.043914794921875, -0.95184326171875, -0.859771728515625, -0.7677001953125, -0.675628662109375, -0.58355712890625, -0.491485595703125, -0.3994140625, -0.307342529296875, -0.21527099609375, -0.123199462890625, -0.0311279296875, 0.060943603515625, 0.15301513671875, 0.245086669921875, 0.337158203125, 0.429229736328125, 0.52130126953125, 0.613372802734375, 0.7054443359375, 0.797515869140625, 0.88958740234375, 0.981658935546875, 1.07373046875, 1.165802001953125, 1.25787353515625, 1.349945068359375, 1.4420166015625, 1.534088134765625, 1.62615966796875, 1.718231201171875, 1.810302734375, 1.902374267578125, 1.99444580078125, 2.086517333984375, 2.1785888671875, 2.270660400390625, 2.36273193359375, 2.454803466796875, 2.546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 2.0, 11.0, 9.0, 17.0, 36.0, 61.0, 104.0, 250.0, 767.0, 3878.0, 53158.0, 3983295.0, 144280.0, 6655.0, 1133.0, 315.0, 149.0, 56.0, 35.0, 19.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.890625, -10.62255859375, -10.3544921875, -10.08642578125, -9.818359375, -9.55029296875, -9.2822265625, -9.01416015625, -8.74609375, -8.47802734375, -8.2099609375, -7.94189453125, -7.673828125, -7.40576171875, -7.1376953125, -6.86962890625, -6.6015625, -6.33349609375, -6.0654296875, -5.79736328125, -5.529296875, -5.26123046875, -4.9931640625, -4.72509765625, -4.45703125, -4.18896484375, -3.9208984375, -3.65283203125, -3.384765625, -3.11669921875, -2.8486328125, -2.58056640625, -2.3125, -2.04443359375, -1.7763671875, -1.50830078125, -1.240234375, -0.97216796875, -0.7041015625, -0.43603515625, -0.16796875, 0.10009765625, 0.3681640625, 0.63623046875, 0.904296875, 1.17236328125, 1.4404296875, 1.70849609375, 1.9765625, 2.24462890625, 2.5126953125, 2.78076171875, 3.048828125, 3.31689453125, 3.5849609375, 3.85302734375, 4.12109375, 4.38916015625, 4.6572265625, 4.92529296875, 5.193359375, 5.46142578125, 5.7294921875, 5.99755859375, 6.265625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 6.0, 5.0, 6.0, 8.0, 21.0, 27.0, 28.0, 30.0, 46.0, 54.0, 91.0, 111.0, 153.0, 227.0, 356.0, 705.0, 815.0, 442.0, 255.0, 186.0, 100.0, 109.0, 46.0, 46.0, 38.0, 30.0, 27.0, 15.0, 20.0, 16.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7553558349609375, -0.731903076171875, -0.7084503173828125, -0.68499755859375, -0.6615447998046875, -0.638092041015625, -0.6146392822265625, -0.5911865234375, -0.5677337646484375, -0.544281005859375, -0.5208282470703125, -0.49737548828125, -0.4739227294921875, -0.450469970703125, -0.4270172119140625, -0.403564453125, -0.3801116943359375, -0.356658935546875, -0.3332061767578125, -0.30975341796875, -0.2863006591796875, -0.262847900390625, -0.2393951416015625, -0.2159423828125, -0.1924896240234375, -0.169036865234375, -0.1455841064453125, -0.12213134765625, -0.0986785888671875, -0.075225830078125, -0.0517730712890625, -0.0283203125, -0.0048675537109375, 0.018585205078125, 0.0420379638671875, 0.06549072265625, 0.0889434814453125, 0.112396240234375, 0.1358489990234375, 0.1593017578125, 0.1827545166015625, 0.206207275390625, 0.2296600341796875, 0.25311279296875, 0.2765655517578125, 0.300018310546875, 0.3234710693359375, 0.346923828125, 0.3703765869140625, 0.393829345703125, 0.4172821044921875, 0.44073486328125, 0.4641876220703125, 0.487640380859375, 0.5110931396484375, 0.5345458984375, 0.5579986572265625, 0.581451416015625, 0.6049041748046875, 0.62835693359375, 0.6518096923828125, 0.675262451171875, 0.6987152099609375, 0.72216796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 7.0, 16.0, 14.0, 32.0, 47.0, 103.0, 94.0, 188.0, 147.0, 122.0, 83.0, 53.0, 38.0, 12.0, 17.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.128007411956787, -4.951148986816406, -4.774291038513184, -4.597433090209961, -4.42057466506958, -4.243716239929199, -4.066858291625977, -3.890000104904175, -3.713141918182373, -3.5362837314605713, -3.3594255447387695, -3.1825673580169678, -3.005709171295166, -2.8288509845733643, -2.6519927978515625, -2.4751346111297607, -2.298276424407959, -2.1214182376861572, -1.9445600509643555, -1.7677018642425537, -1.590843677520752, -1.4139854907989502, -1.2371273040771484, -1.0602691173553467, -0.8834109306335449, -0.7065527439117432, -0.5296945571899414, -0.35283637046813965, -0.1759781837463379, 0.0008800029754638672, 0.17773818969726562, 0.3545963764190674, 0.5314550399780273, 0.7083132266998291, 0.8851714134216309, 1.0620296001434326, 1.2388877868652344, 1.4157459735870361, 1.592604160308838, 1.7694623470306396, 1.9463205337524414, 2.123178720474243, 2.300036907196045, 2.4768950939178467, 2.6537532806396484, 2.83061146736145, 3.007469654083252, 3.1843278408050537, 3.3611860275268555, 3.5380442142486572, 3.714902400970459, 3.8917605876922607, 4.0686187744140625, 4.245476722717285, 4.422335147857666, 4.599193572998047, 4.7760515213012695, 4.952909469604492, 5.129767894744873, 5.306626319885254, 5.483484268188477, 5.660342216491699, 5.83720064163208, 6.014059066772461, 6.190917015075684]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 6.0, 10.0, 27.0, 25.0, 25.0, 41.0, 44.0, 54.0, 50.0, 57.0, 74.0, 67.0, 63.0, 64.0, 63.0, 53.0, 47.0, 41.0, 25.0, 33.0, 23.0, 18.0, 16.0, 21.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3691611289978027, -3.271679639816284, -3.1741981506347656, -3.076716899871826, -2.9792354106903076, -2.881753921508789, -2.7842724323272705, -2.686790943145752, -2.5893096923828125, -2.491828203201294, -2.3943467140197754, -2.296865463256836, -2.1993839740753174, -2.101902484893799, -2.0044209957122803, -1.9069395065307617, -1.8094580173492432, -1.7119765281677246, -1.6144951581954956, -1.517013669013977, -1.419532299041748, -1.3220508098602295, -1.224569320678711, -1.1270878314971924, -1.0296064615249634, -0.9321250319480896, -0.8346436023712158, -0.7371621131896973, -0.6396806836128235, -0.5421992540359497, -0.44471776485443115, -0.3472363352775574, -0.2497551441192627, -0.15227369964122772, -0.05479225516319275, 0.04268920421600342, 0.1401706337928772, 0.23765206336975098, 0.33513355255126953, 0.4326149821281433, 0.5300964117050171, 0.6275778412818909, 0.7250592708587646, 0.8225407600402832, 0.920022189617157, 1.0175036191940308, 1.1149851083755493, 1.2124664783477783, 1.3099479675292969, 1.4074294567108154, 1.5049108266830444, 1.602392315864563, 1.699873685836792, 1.7973551750183105, 1.894836664199829, 1.9923181533813477, 2.089799404144287, 2.1872808933258057, 2.284762382507324, 2.3822436332702637, 2.4797251224517822, 2.577206611633301, 2.6746881008148193, 2.772169589996338, 2.8696510791778564]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 3.0, 7.0, 2.0, 11.0, 9.0, 12.0, 20.0, 27.0, 21.0, 43.0, 54.0, 88.0, 125.0, 156.0, 243.0, 388.0, 677.0, 1202.0, 2827.0, 10487.0, 82099.0, 787532.0, 141285.0, 14280.0, 3578.0, 1322.0, 731.0, 444.0, 249.0, 170.0, 122.0, 84.0, 74.0, 46.0, 34.0, 24.0, 18.0, 13.0, 9.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.5146484375, -0.49835968017578125, -0.4820709228515625, -0.46578216552734375, -0.449493408203125, -0.43320465087890625, -0.4169158935546875, -0.40062713623046875, -0.38433837890625, -0.36804962158203125, -0.3517608642578125, -0.33547210693359375, -0.319183349609375, -0.30289459228515625, -0.2866058349609375, -0.27031707763671875, -0.2540283203125, -0.23773956298828125, -0.2214508056640625, -0.20516204833984375, -0.188873291015625, -0.17258453369140625, -0.1562957763671875, -0.14000701904296875, -0.12371826171875, -0.10742950439453125, -0.0911407470703125, -0.07485198974609375, -0.058563232421875, -0.04227447509765625, -0.0259857177734375, -0.00969696044921875, 0.006591796875, 0.02288055419921875, 0.0391693115234375, 0.05545806884765625, 0.071746826171875, 0.08803558349609375, 0.1043243408203125, 0.12061309814453125, 0.13690185546875, 0.15319061279296875, 0.1694793701171875, 0.18576812744140625, 0.202056884765625, 0.21834564208984375, 0.2346343994140625, 0.25092315673828125, 0.2672119140625, 0.28350067138671875, 0.2997894287109375, 0.31607818603515625, 0.332366943359375, 0.34865570068359375, 0.3649444580078125, 0.38123321533203125, 0.39752197265625, 0.41381072998046875, 0.4300994873046875, 0.44638824462890625, 0.462677001953125, 0.47896575927734375, 0.4952545166015625, 0.5115432739257812, 0.52783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 6.0, 17.0, 17.0, 22.0, 33.0, 36.0, 60.0, 53.0, 50.0, 79.0, 61.0, 67.0, 88.0, 59.0, 60.0, 49.0, 41.0, 35.0, 40.0, 21.0, 10.0, 24.0, 13.0, 16.0, 3.0, 8.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4765625, -2.395904541015625, -2.31524658203125, -2.234588623046875, -2.1539306640625, -2.073272705078125, -1.99261474609375, -1.911956787109375, -1.831298828125, -1.750640869140625, -1.66998291015625, -1.589324951171875, -1.5086669921875, -1.428009033203125, -1.34735107421875, -1.266693115234375, -1.18603515625, -1.105377197265625, -1.02471923828125, -0.944061279296875, -0.8634033203125, -0.782745361328125, -0.70208740234375, -0.621429443359375, -0.540771484375, -0.460113525390625, -0.37945556640625, -0.298797607421875, -0.2181396484375, -0.137481689453125, -0.05682373046875, 0.023834228515625, 0.1044921875, 0.185150146484375, 0.26580810546875, 0.346466064453125, 0.4271240234375, 0.507781982421875, 0.58843994140625, 0.669097900390625, 0.749755859375, 0.830413818359375, 0.91107177734375, 0.991729736328125, 1.0723876953125, 1.153045654296875, 1.23370361328125, 1.314361572265625, 1.39501953125, 1.475677490234375, 1.55633544921875, 1.636993408203125, 1.7176513671875, 1.798309326171875, 1.87896728515625, 1.959625244140625, 2.040283203125, 2.120941162109375, 2.20159912109375, 2.282257080078125, 2.3629150390625, 2.443572998046875, 2.52423095703125, 2.604888916015625, 2.685546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 12.0, 10.0, 30.0, 18.0, 37.0, 37.0, 55.0, 73.0, 109.0, 142.0, 193.0, 318.0, 453.0, 977.0, 3896.0, 44037.0, 605906.0, 365427.0, 22320.0, 2430.0, 738.0, 399.0, 262.0, 194.0, 123.0, 74.0, 61.0, 52.0, 44.0, 19.0, 29.0, 14.0, 15.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.35931396484375, -0.3472900390625, -0.33526611328125, -0.3232421875, -0.31121826171875, -0.2991943359375, -0.28717041015625, -0.275146484375, -0.26312255859375, -0.2510986328125, -0.23907470703125, -0.22705078125, -0.21502685546875, -0.2030029296875, -0.19097900390625, -0.178955078125, -0.16693115234375, -0.1549072265625, -0.14288330078125, -0.130859375, -0.11883544921875, -0.1068115234375, -0.09478759765625, -0.082763671875, -0.07073974609375, -0.0587158203125, -0.04669189453125, -0.03466796875, -0.02264404296875, -0.0106201171875, 0.00140380859375, 0.013427734375, 0.02545166015625, 0.0374755859375, 0.04949951171875, 0.0615234375, 0.07354736328125, 0.0855712890625, 0.09759521484375, 0.109619140625, 0.12164306640625, 0.1336669921875, 0.14569091796875, 0.15771484375, 0.16973876953125, 0.1817626953125, 0.19378662109375, 0.205810546875, 0.21783447265625, 0.2298583984375, 0.24188232421875, 0.25390625, 0.26593017578125, 0.2779541015625, 0.28997802734375, 0.302001953125, 0.31402587890625, 0.3260498046875, 0.33807373046875, 0.35009765625, 0.36212158203125, 0.3741455078125, 0.38616943359375, 0.398193359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 4.0, 9.0, 18.0, 15.0, 21.0, 28.0, 23.0, 26.0, 31.0, 38.0, 31.0, 34.0, 32.0, 31.0, 39.0, 42.0, 49.0, 58.0, 50.0, 45.0, 46.0, 39.0, 34.0, 34.0, 27.0, 24.0, 23.0, 20.0, 19.0, 20.0, 13.0, 11.0, 21.0, 2.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.17578125, -4.0543212890625, -3.932861328125, -3.8114013671875, -3.68994140625, -3.5684814453125, -3.447021484375, -3.3255615234375, -3.2041015625, -3.0826416015625, -2.961181640625, -2.8397216796875, -2.71826171875, -2.5968017578125, -2.475341796875, -2.3538818359375, -2.232421875, -2.1109619140625, -1.989501953125, -1.8680419921875, -1.74658203125, -1.6251220703125, -1.503662109375, -1.3822021484375, -1.2607421875, -1.1392822265625, -1.017822265625, -0.8963623046875, -0.77490234375, -0.6534423828125, -0.531982421875, -0.4105224609375, -0.2890625, -0.1676025390625, -0.046142578125, 0.0753173828125, 0.19677734375, 0.3182373046875, 0.439697265625, 0.5611572265625, 0.6826171875, 0.8040771484375, 0.925537109375, 1.0469970703125, 1.16845703125, 1.2899169921875, 1.411376953125, 1.5328369140625, 1.654296875, 1.7757568359375, 1.897216796875, 2.0186767578125, 2.14013671875, 2.2615966796875, 2.383056640625, 2.5045166015625, 2.6259765625, 2.7474365234375, 2.868896484375, 2.9903564453125, 3.11181640625, 3.2332763671875, 3.354736328125, 3.4761962890625, 3.59765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 3.0, 8.0, 8.0, 11.0, 14.0, 23.0, 19.0, 22.0, 32.0, 38.0, 50.0, 73.0, 103.0, 178.0, 398.0, 1437.0, 12721.0, 993715.0, 35986.0, 2423.0, 577.0, 225.0, 134.0, 91.0, 63.0, 37.0, 34.0, 21.0, 16.0, 15.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.14024066925048828, -0.13607215881347656, -0.13190364837646484, -0.12773513793945312, -0.1235666275024414, -0.11939811706542969, -0.11522960662841797, -0.11106109619140625, -0.10689258575439453, -0.10272407531738281, -0.0985555648803711, -0.09438705444335938, -0.09021854400634766, -0.08605003356933594, -0.08188152313232422, -0.0777130126953125, -0.07354450225830078, -0.06937599182128906, -0.06520748138427734, -0.061038970947265625, -0.056870460510253906, -0.05270195007324219, -0.04853343963623047, -0.04436492919921875, -0.04019641876220703, -0.03602790832519531, -0.031859397888183594, -0.027690887451171875, -0.023522377014160156, -0.019353866577148438, -0.015185356140136719, -0.011016845703125, -0.006848335266113281, -0.0026798248291015625, 0.0014886856079101562, 0.005657196044921875, 0.009825706481933594, 0.013994216918945312, 0.01816272735595703, 0.02233123779296875, 0.02649974822998047, 0.030668258666992188, 0.034836769104003906, 0.039005279541015625, 0.043173789978027344, 0.04734230041503906, 0.05151081085205078, 0.0556793212890625, 0.05984783172607422, 0.06401634216308594, 0.06818485260009766, 0.07235336303710938, 0.0765218734741211, 0.08069038391113281, 0.08485889434814453, 0.08902740478515625, 0.09319591522216797, 0.09736442565917969, 0.1015329360961914, 0.10570144653320312, 0.10986995697021484, 0.11403846740722656, 0.11820697784423828, 0.12237548828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 9.0, 4.0, 5.0, 13.0, 22.0, 25.0, 23.0, 36.0, 36.0, 63.0, 78.0, 111.0, 120.0, 124.0, 97.0, 69.0, 45.0, 23.0, 22.0, 12.0, 20.0, 7.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8312206268310547e-05, -2.734735608100891e-05, -2.6382505893707275e-05, -2.541765570640564e-05, -2.4452805519104004e-05, -2.3487955331802368e-05, -2.2523105144500732e-05, -2.1558254957199097e-05, -2.059340476989746e-05, -1.9628554582595825e-05, -1.866370439529419e-05, -1.7698854207992554e-05, -1.6734004020690918e-05, -1.5769153833389282e-05, -1.4804303646087646e-05, -1.383945345878601e-05, -1.2874603271484375e-05, -1.190975308418274e-05, -1.0944902896881104e-05, -9.980052709579468e-06, -9.015202522277832e-06, -8.050352334976196e-06, -7.0855021476745605e-06, -6.120651960372925e-06, -5.155801773071289e-06, -4.190951585769653e-06, -3.2261013984680176e-06, -2.261251211166382e-06, -1.296401023864746e-06, -3.3155083656311035e-07, 6.332993507385254e-07, 1.5981495380401611e-06, 2.562999725341797e-06, 3.5278499126434326e-06, 4.492700099945068e-06, 5.457550287246704e-06, 6.42240047454834e-06, 7.387250661849976e-06, 8.352100849151611e-06, 9.316951036453247e-06, 1.0281801223754883e-05, 1.1246651411056519e-05, 1.2211501598358154e-05, 1.317635178565979e-05, 1.4141201972961426e-05, 1.5106052160263062e-05, 1.6070902347564697e-05, 1.7035752534866333e-05, 1.800060272216797e-05, 1.8965452909469604e-05, 1.993030309677124e-05, 2.0895153284072876e-05, 2.1860003471374512e-05, 2.2824853658676147e-05, 2.3789703845977783e-05, 2.475455403327942e-05, 2.5719404220581055e-05, 2.668425440788269e-05, 2.7649104595184326e-05, 2.8613954782485962e-05, 2.9578804969787598e-05, 3.0543655157089233e-05, 3.150850534439087e-05, 3.2473355531692505e-05, 3.343820571899414e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 13.0, 20.0, 16.0, 29.0, 44.0, 72.0, 132.0, 174.0, 388.0, 731.0, 1692.0, 5169.0, 28057.0, 877363.0, 118427.0, 10979.0, 2899.0, 1080.0, 531.0, 297.0, 159.0, 95.0, 64.0, 45.0, 31.0, 14.0, 12.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14711952209472656, -0.14262771606445312, -0.1381359100341797, -0.13364410400390625, -0.1291522979736328, -0.12466049194335938, -0.12016868591308594, -0.1156768798828125, -0.11118507385253906, -0.10669326782226562, -0.10220146179199219, -0.09770965576171875, -0.09321784973144531, -0.08872604370117188, -0.08423423767089844, -0.079742431640625, -0.07525062561035156, -0.07075881958007812, -0.06626701354980469, -0.06177520751953125, -0.05728340148925781, -0.052791595458984375, -0.04829978942871094, -0.0438079833984375, -0.03931617736816406, -0.034824371337890625, -0.030332565307617188, -0.02584075927734375, -0.021348953247070312, -0.016857147216796875, -0.012365341186523438, -0.00787353515625, -0.0033817291259765625, 0.001110076904296875, 0.0056018829345703125, 0.01009368896484375, 0.014585494995117188, 0.019077301025390625, 0.023569107055664062, 0.0280609130859375, 0.03255271911621094, 0.037044525146484375, 0.04153633117675781, 0.04602813720703125, 0.05051994323730469, 0.055011749267578125, 0.05950355529785156, 0.063995361328125, 0.06848716735839844, 0.07297897338867188, 0.07747077941894531, 0.08196258544921875, 0.08645439147949219, 0.09094619750976562, 0.09543800354003906, 0.0999298095703125, 0.10442161560058594, 0.10891342163085938, 0.11340522766113281, 0.11789703369140625, 0.12238883972167969, 0.12688064575195312, 0.13137245178222656, 0.1358642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 8.0, 12.0, 15.0, 23.0, 39.0, 98.0, 268.0, 270.0, 106.0, 48.0, 32.0, 15.0, 13.0, 9.0, 6.0, 5.0, 1.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0355224609375, -0.034297943115234375, -0.03307342529296875, -0.031848907470703125, -0.0306243896484375, -0.029399871826171875, -0.02817535400390625, -0.026950836181640625, -0.025726318359375, -0.024501800537109375, -0.02327728271484375, -0.022052764892578125, -0.0208282470703125, -0.019603729248046875, -0.01837921142578125, -0.017154693603515625, -0.01593017578125, -0.014705657958984375, -0.01348114013671875, -0.012256622314453125, -0.0110321044921875, -0.009807586669921875, -0.00858306884765625, -0.007358551025390625, -0.006134033203125, -0.004909515380859375, -0.00368499755859375, -0.002460479736328125, -0.0012359619140625, -1.1444091796875e-05, 0.00121307373046875, 0.002437591552734375, 0.003662109375, 0.004886627197265625, 0.00611114501953125, 0.007335662841796875, 0.0085601806640625, 0.009784698486328125, 0.01100921630859375, 0.012233734130859375, 0.013458251953125, 0.014682769775390625, 0.01590728759765625, 0.017131805419921875, 0.0183563232421875, 0.019580841064453125, 0.02080535888671875, 0.022029876708984375, 0.02325439453125, 0.024478912353515625, 0.02570343017578125, 0.026927947998046875, 0.0281524658203125, 0.029376983642578125, 0.03060150146484375, 0.031826019287109375, 0.033050537109375, 0.034275054931640625, 0.03549957275390625, 0.036724090576171875, 0.0379486083984375, 0.039173126220703125, 0.04039764404296875, 0.041622161865234375, 0.0428466796875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 40.0, 65.0, 106.0, 134.0, 198.0, 147.0, 99.0, 69.0, 41.0, 20.0, 10.0, 12.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455575704574585, -3.3145558834075928, -3.1735360622406006, -3.0325162410736084, -2.891496181488037, -2.750476360321045, -2.6094565391540527, -2.4684367179870605, -2.3274168968200684, -2.186397075653076, -2.045377254486084, -1.9043573141098022, -1.76333749294281, -1.6223176717758179, -1.4812977313995361, -1.340277910232544, -1.1992580890655518, -1.0582382678985596, -0.9172183871269226, -0.7761985063552856, -0.6351786851882935, -0.49415886402130127, -0.3531389832496643, -0.21211910247802734, -0.07109928131103516, 0.06992056965827942, 0.210940420627594, 0.35196027159690857, 0.49298012256622314, 0.6339999437332153, 0.7750198245048523, 0.9160397052764893, 1.0570592880249023, 1.1980791091918945, 1.3390989303588867, 1.4801188707351685, 1.6211386919021606, 1.7621585130691528, 1.9031784534454346, 2.0441982746124268, 2.185218095779419, 2.326237916946411, 2.4672577381134033, 2.6082775592803955, 2.749297618865967, 2.890317440032959, 3.031337261199951, 3.1723570823669434, 3.3133769035339355, 3.4543967247009277, 3.59541654586792, 3.736436367034912, 3.8774561882019043, 4.0184760093688965, 4.159495830535889, 4.300516128540039, 4.441535949707031, 4.582555770874023, 4.723575592041016, 4.864595413208008, 5.005615234375, 5.146635055541992, 5.287654876708984, 5.428674697875977, 5.569694519042969]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 10.0, 7.0, 20.0, 21.0, 28.0, 41.0, 49.0, 52.0, 44.0, 72.0, 70.0, 78.0, 86.0, 55.0, 58.0, 64.0, 45.0, 36.0, 31.0, 28.0, 16.0, 20.0, 14.0, 11.0, 11.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5668931007385254, -2.4891254901885986, -2.411357879638672, -2.333590269088745, -2.2558226585388184, -2.1780550479888916, -2.100287437438965, -2.022520065307617, -1.9447523355484009, -1.8669847249984741, -1.7892171144485474, -1.7114495038986206, -1.6336820125579834, -1.5559144020080566, -1.4781467914581299, -1.4003791809082031, -1.3226115703582764, -1.2448439598083496, -1.1670763492584229, -1.089308738708496, -1.0115411281585693, -0.9337735772132874, -0.8560060262680054, -0.7782384157180786, -0.7004708051681519, -0.6227031946182251, -0.5449355840682983, -0.46716803312301636, -0.3894004225730896, -0.31163281202316284, -0.23386523127555847, -0.1560976505279541, -0.07833027839660645, -0.0005626827478408813, 0.07720491290092468, 0.15497250854969025, 0.2327401041984558, 0.31050771474838257, 0.38827529549598694, 0.4660428762435913, 0.5438104867935181, 0.6215780973434448, 0.6993457078933716, 0.7771132588386536, 0.8548808693885803, 0.9326484799385071, 1.010416030883789, 1.0881836414337158, 1.1659512519836426, 1.2437188625335693, 1.321486473083496, 1.3992540836334229, 1.4770216941833496, 1.5547893047332764, 1.6325567960739136, 1.7103244066238403, 1.788092017173767, 1.8658596277236938, 1.9436272382736206, 2.021394729614258, 2.0991623401641846, 2.1769299507141113, 2.254697561264038, 2.332465171813965, 2.4102327823638916]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 14.0, 15.0, 21.0, 29.0, 68.0, 99.0, 160.0, 229.0, 436.0, 766.0, 1539.0, 3103.0, 7016.0, 18436.0, 59039.0, 312341.0, 521738.0, 82709.0, 24174.0, 8938.0, 3760.0, 1758.0, 898.0, 474.0, 284.0, 191.0, 107.0, 66.0, 41.0, 31.0, 17.0, 18.0, 9.0, 1.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.17828369140625, -2.1104736328125, -2.04266357421875, -1.974853515625, -1.90704345703125, -1.8392333984375, -1.77142333984375, -1.70361328125, -1.63580322265625, -1.5679931640625, -1.50018310546875, -1.432373046875, -1.36456298828125, -1.2967529296875, -1.22894287109375, -1.1611328125, -1.09332275390625, -1.0255126953125, -0.95770263671875, -0.889892578125, -0.82208251953125, -0.7542724609375, -0.68646240234375, -0.61865234375, -0.55084228515625, -0.4830322265625, -0.41522216796875, -0.347412109375, -0.27960205078125, -0.2117919921875, -0.14398193359375, -0.076171875, -0.00836181640625, 0.0594482421875, 0.12725830078125, 0.195068359375, 0.26287841796875, 0.3306884765625, 0.39849853515625, 0.46630859375, 0.53411865234375, 0.6019287109375, 0.66973876953125, 0.737548828125, 0.80535888671875, 0.8731689453125, 0.94097900390625, 1.0087890625, 1.07659912109375, 1.1444091796875, 1.21221923828125, 1.280029296875, 1.34783935546875, 1.4156494140625, 1.48345947265625, 1.55126953125, 1.61907958984375, 1.6868896484375, 1.75469970703125, 1.822509765625, 1.89031982421875, 1.9581298828125, 2.02593994140625, 2.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 9.0, 10.0, 13.0, 18.0, 28.0, 36.0, 24.0, 57.0, 54.0, 67.0, 74.0, 73.0, 81.0, 80.0, 89.0, 55.0, 54.0, 38.0, 32.0, 23.0, 25.0, 12.0, 14.0, 10.0, 4.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.890625, -5.723388671875, -5.55615234375, -5.388916015625, -5.2216796875, -5.054443359375, -4.88720703125, -4.719970703125, -4.552734375, -4.385498046875, -4.21826171875, -4.051025390625, -3.8837890625, -3.716552734375, -3.54931640625, -3.382080078125, -3.21484375, -3.047607421875, -2.88037109375, -2.713134765625, -2.5458984375, -2.378662109375, -2.21142578125, -2.044189453125, -1.876953125, -1.709716796875, -1.54248046875, -1.375244140625, -1.2080078125, -1.040771484375, -0.87353515625, -0.706298828125, -0.5390625, -0.371826171875, -0.20458984375, -0.037353515625, 0.1298828125, 0.297119140625, 0.46435546875, 0.631591796875, 0.798828125, 0.966064453125, 1.13330078125, 1.300537109375, 1.4677734375, 1.635009765625, 1.80224609375, 1.969482421875, 2.13671875, 2.303955078125, 2.47119140625, 2.638427734375, 2.8056640625, 2.972900390625, 3.14013671875, 3.307373046875, 3.474609375, 3.641845703125, 3.80908203125, 3.976318359375, 4.1435546875, 4.310791015625, 4.47802734375, 4.645263671875, 4.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 17.0, 17.0, 26.0, 36.0, 52.0, 69.0, 84.0, 167.0, 265.0, 596.0, 2942.0, 64487.0, 946373.0, 30370.0, 1848.0, 461.0, 247.0, 138.0, 99.0, 69.0, 50.0, 33.0, 33.0, 23.0, 12.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.3359375, -7.1226806640625, -6.909423828125, -6.6961669921875, -6.48291015625, -6.2696533203125, -6.056396484375, -5.8431396484375, -5.6298828125, -5.4166259765625, -5.203369140625, -4.9901123046875, -4.77685546875, -4.5635986328125, -4.350341796875, -4.1370849609375, -3.923828125, -3.7105712890625, -3.497314453125, -3.2840576171875, -3.07080078125, -2.8575439453125, -2.644287109375, -2.4310302734375, -2.2177734375, -2.0045166015625, -1.791259765625, -1.5780029296875, -1.36474609375, -1.1514892578125, -0.938232421875, -0.7249755859375, -0.51171875, -0.2984619140625, -0.085205078125, 0.1280517578125, 0.34130859375, 0.5545654296875, 0.767822265625, 0.9810791015625, 1.1943359375, 1.4075927734375, 1.620849609375, 1.8341064453125, 2.04736328125, 2.2606201171875, 2.473876953125, 2.6871337890625, 2.900390625, 3.1136474609375, 3.326904296875, 3.5401611328125, 3.75341796875, 3.9666748046875, 4.179931640625, 4.3931884765625, 4.6064453125, 4.8197021484375, 5.032958984375, 5.2462158203125, 5.45947265625, 5.6727294921875, 5.885986328125, 6.0992431640625, 6.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 11.0, 16.0, 27.0, 19.0, 22.0, 25.0, 22.0, 36.0, 39.0, 49.0, 44.0, 48.0, 56.0, 48.0, 46.0, 44.0, 37.0, 43.0, 42.0, 42.0, 44.0, 34.0, 23.0, 25.0, 15.0, 25.0, 21.0, 16.0, 4.0, 10.0, 12.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.3046875, -5.14898681640625, -4.9932861328125, -4.83758544921875, -4.681884765625, -4.52618408203125, -4.3704833984375, -4.21478271484375, -4.05908203125, -3.90338134765625, -3.7476806640625, -3.59197998046875, -3.436279296875, -3.28057861328125, -3.1248779296875, -2.96917724609375, -2.8134765625, -2.65777587890625, -2.5020751953125, -2.34637451171875, -2.190673828125, -2.03497314453125, -1.8792724609375, -1.72357177734375, -1.56787109375, -1.41217041015625, -1.2564697265625, -1.10076904296875, -0.945068359375, -0.78936767578125, -0.6336669921875, -0.47796630859375, -0.322265625, -0.16656494140625, -0.0108642578125, 0.14483642578125, 0.300537109375, 0.45623779296875, 0.6119384765625, 0.76763916015625, 0.92333984375, 1.07904052734375, 1.2347412109375, 1.39044189453125, 1.546142578125, 1.70184326171875, 1.8575439453125, 2.01324462890625, 2.1689453125, 2.32464599609375, 2.4803466796875, 2.63604736328125, 2.791748046875, 2.94744873046875, 3.1031494140625, 3.25885009765625, 3.41455078125, 3.57025146484375, 3.7259521484375, 3.88165283203125, 4.037353515625, 4.19305419921875, 4.3487548828125, 4.50445556640625, 4.66015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 14.0, 20.0, 23.0, 25.0, 69.0, 102.0, 153.0, 290.0, 663.0, 1721.0, 6887.0, 42876.0, 559776.0, 391368.0, 35843.0, 5926.0, 1536.0, 579.0, 267.0, 135.0, 95.0, 58.0, 30.0, 20.0, 14.0, 12.0, 6.0, 8.0, 0.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.00189208984375, -0.9647216796875, -0.92755126953125, -0.890380859375, -0.85321044921875, -0.8160400390625, -0.77886962890625, -0.74169921875, -0.70452880859375, -0.6673583984375, -0.63018798828125, -0.593017578125, -0.55584716796875, -0.5186767578125, -0.48150634765625, -0.4443359375, -0.40716552734375, -0.3699951171875, -0.33282470703125, -0.295654296875, -0.25848388671875, -0.2213134765625, -0.18414306640625, -0.14697265625, -0.10980224609375, -0.0726318359375, -0.03546142578125, 0.001708984375, 0.03887939453125, 0.0760498046875, 0.11322021484375, 0.150390625, 0.18756103515625, 0.2247314453125, 0.26190185546875, 0.299072265625, 0.33624267578125, 0.3734130859375, 0.41058349609375, 0.44775390625, 0.48492431640625, 0.5220947265625, 0.55926513671875, 0.596435546875, 0.63360595703125, 0.6707763671875, 0.70794677734375, 0.7451171875, 0.78228759765625, 0.8194580078125, 0.85662841796875, 0.893798828125, 0.93096923828125, 0.9681396484375, 1.00531005859375, 1.04248046875, 1.07965087890625, 1.1168212890625, 1.15399169921875, 1.191162109375, 1.22833251953125, 1.2655029296875, 1.30267333984375, 1.33984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 31.0, 27.0, 38.0, 66.0, 74.0, 120.0, 206.0, 123.0, 84.0, 43.0, 38.0, 29.0, 20.0, 13.0, 12.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015592575073242188, -0.0001504272222518921, -0.0001449286937713623, -0.00013943016529083252, -0.00013393163681030273, -0.00012843310832977295, -0.00012293457984924316, -0.00011743605136871338, -0.0001119375228881836, -0.00010643899440765381, -0.00010094046592712402, -9.544193744659424e-05, -8.994340896606445e-05, -8.444488048553467e-05, -7.894635200500488e-05, -7.34478235244751e-05, -6.794929504394531e-05, -6.245076656341553e-05, -5.695223808288574e-05, -5.145370960235596e-05, -4.595518112182617e-05, -4.045665264129639e-05, -3.49581241607666e-05, -2.9459595680236816e-05, -2.396106719970703e-05, -1.8462538719177246e-05, -1.2964010238647461e-05, -7.465481758117676e-06, -1.9669532775878906e-06, 3.5315752029418945e-06, 9.03010368347168e-06, 1.4528632164001465e-05, 2.002716064453125e-05, 2.5525689125061035e-05, 3.102421760559082e-05, 3.6522746086120605e-05, 4.202127456665039e-05, 4.7519803047180176e-05, 5.301833152770996e-05, 5.8516860008239746e-05, 6.401538848876953e-05, 6.951391696929932e-05, 7.50124454498291e-05, 8.051097393035889e-05, 8.600950241088867e-05, 9.150803089141846e-05, 9.700655937194824e-05, 0.00010250508785247803, 0.00010800361633300781, 0.0001135021448135376, 0.00011900067329406738, 0.00012449920177459717, 0.00012999773025512695, 0.00013549625873565674, 0.00014099478721618652, 0.0001464933156967163, 0.0001519918441772461, 0.00015749037265777588, 0.00016298890113830566, 0.00016848742961883545, 0.00017398595809936523, 0.00017948448657989502, 0.0001849830150604248, 0.0001904815435409546, 0.00019598007202148438]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 10.0, 4.0, 5.0, 16.0, 19.0, 19.0, 35.0, 86.0, 176.0, 510.0, 1764.0, 10758.0, 149510.0, 825689.0, 52930.0, 5290.0, 1093.0, 339.0, 151.0, 57.0, 33.0, 22.0, 13.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4168701171875, -1.363037109375, -1.3092041015625, -1.25537109375, -1.2015380859375, -1.147705078125, -1.0938720703125, -1.0400390625, -0.9862060546875, -0.932373046875, -0.8785400390625, -0.82470703125, -0.7708740234375, -0.717041015625, -0.6632080078125, -0.609375, -0.5555419921875, -0.501708984375, -0.4478759765625, -0.39404296875, -0.3402099609375, -0.286376953125, -0.2325439453125, -0.1787109375, -0.1248779296875, -0.071044921875, -0.0172119140625, 0.03662109375, 0.0904541015625, 0.144287109375, 0.1981201171875, 0.251953125, 0.3057861328125, 0.359619140625, 0.4134521484375, 0.46728515625, 0.5211181640625, 0.574951171875, 0.6287841796875, 0.6826171875, 0.7364501953125, 0.790283203125, 0.8441162109375, 0.89794921875, 0.9517822265625, 1.005615234375, 1.0594482421875, 1.11328125, 1.1671142578125, 1.220947265625, 1.2747802734375, 1.32861328125, 1.3824462890625, 1.436279296875, 1.4901123046875, 1.5439453125, 1.5977783203125, 1.651611328125, 1.7054443359375, 1.75927734375, 1.8131103515625, 1.866943359375, 1.9207763671875, 1.974609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 8.0, 14.0, 16.0, 27.0, 47.0, 51.0, 91.0, 119.0, 196.0, 129.0, 95.0, 60.0, 46.0, 24.0, 20.0, 18.0, 12.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4609375, -0.44217681884765625, -0.4234161376953125, -0.40465545654296875, -0.385894775390625, -0.36713409423828125, -0.3483734130859375, -0.32961273193359375, -0.31085205078125, -0.29209136962890625, -0.2733306884765625, -0.25457000732421875, -0.235809326171875, -0.21704864501953125, -0.1982879638671875, -0.17952728271484375, -0.1607666015625, -0.14200592041015625, -0.1232452392578125, -0.10448455810546875, -0.085723876953125, -0.06696319580078125, -0.0482025146484375, -0.02944183349609375, -0.01068115234375, 0.00807952880859375, 0.0268402099609375, 0.04560089111328125, 0.064361572265625, 0.08312225341796875, 0.1018829345703125, 0.12064361572265625, 0.139404296875, 0.15816497802734375, 0.1769256591796875, 0.19568634033203125, 0.214447021484375, 0.23320770263671875, 0.2519683837890625, 0.27072906494140625, 0.28948974609375, 0.30825042724609375, 0.3270111083984375, 0.34577178955078125, 0.364532470703125, 0.38329315185546875, 0.4020538330078125, 0.42081451416015625, 0.4395751953125, 0.45833587646484375, 0.4770965576171875, 0.49585723876953125, 0.514617919921875, 0.5333786010742188, 0.5521392822265625, 0.5708999633789062, 0.58966064453125, 0.6084213256835938, 0.6271820068359375, 0.6459426879882812, 0.664703369140625, 0.6834640502929688, 0.7022247314453125, 0.7209854125976562, 0.73974609375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 13.0, 29.0, 119.0, 324.0, 331.0, 137.0, 33.0, 13.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.941051483154297, -31.231830596923828, -30.52260971069336, -29.81338882446289, -29.104167938232422, -28.394948959350586, -27.685728073120117, -26.97650718688965, -26.26728630065918, -25.55806541442871, -24.848844528198242, -24.139623641967773, -23.430404663085938, -22.72118377685547, -22.011962890625, -21.30274200439453, -20.593521118164062, -19.884300231933594, -19.175079345703125, -18.465858459472656, -17.756637573242188, -17.04741859436035, -16.338197708129883, -15.628976821899414, -14.919755935668945, -14.210535049438477, -13.501314163208008, -12.792094230651855, -12.082873344421387, -11.373652458190918, -10.664432525634766, -9.955211639404297, -9.245990753173828, -8.53676986694336, -7.827549457550049, -7.118329048156738, -6.4091081619262695, -5.699887275695801, -4.99066686630249, -4.28144645690918, -3.572225570678711, -2.8630049228668213, -2.1537842750549316, -1.444563627243042, -0.7353429794311523, -0.026122331619262695, 0.683098316192627, 1.3923187255859375, 2.1015396118164062, 2.810760259628296, 3.5199809074401855, 4.229201316833496, 4.938422203063965, 5.647643089294434, 6.356863498687744, 7.066083908081055, 7.775304794311523, 8.484525680541992, 9.193746566772461, 9.902966499328613, 10.612187385559082, 11.32140827178955, 12.030628204345703, 12.739849090576172, 13.44906997680664]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 13.0, 6.0, 14.0, 10.0, 18.0, 15.0, 24.0, 25.0, 26.0, 33.0, 26.0, 31.0, 37.0, 37.0, 31.0, 52.0, 39.0, 36.0, 44.0, 44.0, 43.0, 44.0, 30.0, 40.0, 28.0, 28.0, 30.0, 18.0, 27.0, 15.0, 20.0, 19.0, 15.0, 14.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.344343185424805, -8.106801986694336, -7.869259834289551, -7.631718158721924, -7.394176483154297, -7.156635284423828, -6.919093132019043, -6.681551933288574, -6.444010257720947, -6.20646858215332, -5.968926906585693, -5.731385231018066, -5.4938435554504395, -5.2563018798828125, -5.018760681152344, -4.781219005584717, -4.54367733001709, -4.306135654449463, -4.068593978881836, -3.831052303314209, -3.593510866165161, -3.355969190597534, -3.1184275150299072, -2.8808860778808594, -2.643343925476074, -2.4058022499084473, -2.1682605743408203, -1.930719017982483, -1.6931774616241455, -1.4556357860565186, -1.2180941104888916, -0.9805525541305542, -0.7430109977722168, -0.5054693818092346, -0.26792773604393005, -0.03038609027862549, 0.2071555256843567, 0.44469714164733887, 0.6822388172149658, 0.9197803735733032, 1.1573220491409302, 1.3948637247085571, 1.6324052810668945, 1.8699469566345215, 2.1074886322021484, 2.3450303077697754, 2.5825719833374023, 2.82011342048645, 3.057655096054077, 3.295196771621704, 3.532738447189331, 3.770279884338379, 4.007821559906006, 4.245363235473633, 4.48290491104126, 4.720446586608887, 4.957988262176514, 5.195529937744141, 5.433071613311768, 5.6706132888793945, 5.9081549644470215, 6.145696640014648, 6.383237838745117, 6.620779514312744, 6.858321189880371]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 8.0, 15.0, 16.0, 20.0, 26.0, 36.0, 51.0, 56.0, 68.0, 97.0, 144.0, 195.0, 342.0, 600.0, 1406.0, 3536.0, 12440.0, 68072.0, 1622412.0, 2382369.0, 80353.0, 14476.0, 4140.0, 1488.0, 737.0, 363.0, 243.0, 149.0, 111.0, 65.0, 63.0, 33.0, 28.0, 27.0, 22.0, 9.0, 12.0, 8.0, 9.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.1112060546875, -3.964599609375, -3.8179931640625, -3.67138671875, -3.5247802734375, -3.378173828125, -3.2315673828125, -3.0849609375, -2.9383544921875, -2.791748046875, -2.6451416015625, -2.49853515625, -2.3519287109375, -2.205322265625, -2.0587158203125, -1.912109375, -1.7655029296875, -1.618896484375, -1.4722900390625, -1.32568359375, -1.1790771484375, -1.032470703125, -0.8858642578125, -0.7392578125, -0.5926513671875, -0.446044921875, -0.2994384765625, -0.15283203125, -0.0062255859375, 0.140380859375, 0.2869873046875, 0.43359375, 0.5802001953125, 0.726806640625, 0.8734130859375, 1.02001953125, 1.1666259765625, 1.313232421875, 1.4598388671875, 1.6064453125, 1.7530517578125, 1.899658203125, 2.0462646484375, 2.19287109375, 2.3394775390625, 2.486083984375, 2.6326904296875, 2.779296875, 2.9259033203125, 3.072509765625, 3.2191162109375, 3.36572265625, 3.5123291015625, 3.658935546875, 3.8055419921875, 3.9521484375, 4.0987548828125, 4.245361328125, 4.3919677734375, 4.53857421875, 4.6851806640625, 4.831787109375, 4.9783935546875, 5.125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 9.0, 14.0, 18.0, 26.0, 28.0, 57.0, 56.0, 56.0, 71.0, 88.0, 88.0, 80.0, 78.0, 68.0, 57.0, 52.0, 29.0, 32.0, 17.0, 21.0, 7.0, 12.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.115234375, -3.030364990234375, -2.94549560546875, -2.860626220703125, -2.7757568359375, -2.690887451171875, -2.60601806640625, -2.521148681640625, -2.436279296875, -2.351409912109375, -2.26654052734375, -2.181671142578125, -2.0968017578125, -2.011932373046875, -1.92706298828125, -1.842193603515625, -1.75732421875, -1.672454833984375, -1.58758544921875, -1.502716064453125, -1.4178466796875, -1.332977294921875, -1.24810791015625, -1.163238525390625, -1.078369140625, -0.993499755859375, -0.90863037109375, -0.823760986328125, -0.7388916015625, -0.654022216796875, -0.56915283203125, -0.484283447265625, -0.3994140625, -0.314544677734375, -0.22967529296875, -0.144805908203125, -0.0599365234375, 0.024932861328125, 0.10980224609375, 0.194671630859375, 0.279541015625, 0.364410400390625, 0.44927978515625, 0.534149169921875, 0.6190185546875, 0.703887939453125, 0.78875732421875, 0.873626708984375, 0.95849609375, 1.043365478515625, 1.12823486328125, 1.213104248046875, 1.2979736328125, 1.382843017578125, 1.46771240234375, 1.552581787109375, 1.637451171875, 1.722320556640625, 1.80718994140625, 1.892059326171875, 1.9769287109375, 2.061798095703125, 2.14666748046875, 2.231536865234375, 2.31640625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 10.0, 8.0, 23.0, 23.0, 52.0, 78.0, 89.0, 199.0, 467.0, 1752.0, 13068.0, 423458.0, 3698368.0, 50967.0, 4186.0, 827.0, 296.0, 151.0, 78.0, 51.0, 41.0, 31.0, 13.0, 12.0, 8.0, 7.0, 9.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.5703125, -10.29388427734375, -10.0174560546875, -9.74102783203125, -9.464599609375, -9.18817138671875, -8.9117431640625, -8.63531494140625, -8.35888671875, -8.08245849609375, -7.8060302734375, -7.52960205078125, -7.253173828125, -6.97674560546875, -6.7003173828125, -6.42388916015625, -6.1474609375, -5.87103271484375, -5.5946044921875, -5.31817626953125, -5.041748046875, -4.76531982421875, -4.4888916015625, -4.21246337890625, -3.93603515625, -3.65960693359375, -3.3831787109375, -3.10675048828125, -2.830322265625, -2.55389404296875, -2.2774658203125, -2.00103759765625, -1.724609375, -1.44818115234375, -1.1717529296875, -0.89532470703125, -0.618896484375, -0.34246826171875, -0.0660400390625, 0.21038818359375, 0.48681640625, 0.76324462890625, 1.0396728515625, 1.31610107421875, 1.592529296875, 1.86895751953125, 2.1453857421875, 2.42181396484375, 2.6982421875, 2.97467041015625, 3.2510986328125, 3.52752685546875, 3.803955078125, 4.08038330078125, 4.3568115234375, 4.63323974609375, 4.90966796875, 5.18609619140625, 5.4625244140625, 5.73895263671875, 6.015380859375, 6.29180908203125, 6.5682373046875, 6.84466552734375, 7.12109375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 2.0, 9.0, 11.0, 13.0, 19.0, 25.0, 25.0, 39.0, 49.0, 70.0, 108.0, 150.0, 235.0, 363.0, 579.0, 749.0, 525.0, 329.0, 221.0, 155.0, 108.0, 76.0, 52.0, 41.0, 27.0, 22.0, 19.0, 12.0, 8.0, 6.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.16015625, -1.1254730224609375, -1.090789794921875, -1.0561065673828125, -1.02142333984375, -0.9867401123046875, -0.952056884765625, -0.9173736572265625, -0.8826904296875, -0.8480072021484375, -0.813323974609375, -0.7786407470703125, -0.74395751953125, -0.7092742919921875, -0.674591064453125, -0.6399078369140625, -0.605224609375, -0.5705413818359375, -0.535858154296875, -0.5011749267578125, -0.46649169921875, -0.4318084716796875, -0.397125244140625, -0.3624420166015625, -0.3277587890625, -0.2930755615234375, -0.258392333984375, -0.2237091064453125, -0.18902587890625, -0.1543426513671875, -0.119659423828125, -0.0849761962890625, -0.05029296875, -0.0156097412109375, 0.019073486328125, 0.0537567138671875, 0.08843994140625, 0.1231231689453125, 0.157806396484375, 0.1924896240234375, 0.2271728515625, 0.2618560791015625, 0.296539306640625, 0.3312225341796875, 0.36590576171875, 0.4005889892578125, 0.435272216796875, 0.4699554443359375, 0.504638671875, 0.5393218994140625, 0.574005126953125, 0.6086883544921875, 0.64337158203125, 0.6780548095703125, 0.712738037109375, 0.7474212646484375, 0.7821044921875, 0.8167877197265625, 0.851470947265625, 0.8861541748046875, 0.92083740234375, 0.9555206298828125, 0.990203857421875, 1.0248870849609375, 1.0595703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 11.0, 10.0, 17.0, 27.0, 21.0, 36.0, 46.0, 61.0, 77.0, 81.0, 70.0, 81.0, 83.0, 71.0, 80.0, 59.0, 38.0, 25.0, 20.0, 18.0, 16.0, 16.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.030686855316162, -3.9129021167755127, -3.7951176166534424, -3.677332878112793, -3.5595483779907227, -3.4417636394500732, -3.323978900909424, -3.2061944007873535, -3.088409662246704, -2.9706249237060547, -2.8528404235839844, -2.735055685043335, -2.6172709465026855, -2.4994864463806152, -2.381701707839966, -2.2639169692993164, -2.146132469177246, -2.0283477306365967, -1.9105632305145264, -1.792778491973877, -1.674993872642517, -1.5572092533111572, -1.4394245147705078, -1.321639895439148, -1.203855276107788, -1.0860706567764282, -0.9682859778404236, -0.850501298904419, -0.7327166795730591, -0.6149320602416992, -0.4971473813056946, -0.37936270236968994, -0.261577844619751, -0.14379319548606873, -0.026008546352386475, 0.09177610278129578, 0.20956075191497803, 0.3273453712463379, 0.44513005018234253, 0.5629147291183472, 0.680699348449707, 0.7984839677810669, 0.9162686467170715, 1.0340533256530762, 1.151837944984436, 1.269622564315796, 1.3874073028564453, 1.5051919221878052, 1.622976541519165, 1.740761160850525, 1.8585457801818848, 1.9763305187225342, 2.0941152572631836, 2.211899757385254, 2.3296844959259033, 2.4474692344665527, 2.565253734588623, 2.6830384731292725, 2.8008229732513428, 2.918607711791992, 3.0363922119140625, 3.154176950454712, 3.2719616889953613, 3.3897461891174316, 3.507530927658081]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 4.0, 7.0, 11.0, 13.0, 13.0, 24.0, 26.0, 26.0, 22.0, 35.0, 39.0, 32.0, 57.0, 44.0, 49.0, 37.0, 42.0, 48.0, 47.0, 46.0, 46.0, 39.0, 36.0, 22.0, 39.0, 35.0, 24.0, 36.0, 15.0, 18.0, 10.0, 15.0, 9.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8297390937805176, -2.747905731201172, -2.6660726070404053, -2.5842392444610596, -2.502406120300293, -2.4205727577209473, -2.3387393951416016, -2.256906032562256, -2.1750729084014893, -2.0932395458221436, -2.011406421661377, -1.9295730590820312, -1.847739815711975, -1.765906572341919, -1.6840732097625732, -1.602239966392517, -1.520406723022461, -1.4385734796524048, -1.3567402362823486, -1.274906873703003, -1.1930736303329468, -1.1112403869628906, -1.029407024383545, -0.9475737810134888, -0.8657405376434326, -0.7839072942733765, -0.7020739912986755, -0.6202406883239746, -0.5384074449539185, -0.4565741717815399, -0.3747408986091614, -0.29290759563446045, -0.2110745906829834, -0.12924131751060486, -0.04740804433822632, 0.03442522883415222, 0.11625850200653076, 0.1980917751789093, 0.27992504835128784, 0.36175835132598877, 0.4435915946960449, 0.5254248380661011, 0.607258141040802, 0.6890914440155029, 0.7709246873855591, 0.8527579307556152, 0.9345912337303162, 1.016424536705017, 1.0982577800750732, 1.1800910234451294, 1.2619242668151855, 1.3437576293945312, 1.4255908727645874, 1.5074241161346436, 1.5892574787139893, 1.6710907220840454, 1.7529239654541016, 1.8347572088241577, 1.9165904521942139, 1.9984238147735596, 2.080256938934326, 2.162090301513672, 2.2439236640930176, 2.3257570266723633, 2.40759015083313]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 8.0, 15.0, 14.0, 11.0, 28.0, 43.0, 73.0, 92.0, 147.0, 216.0, 453.0, 1133.0, 3461.0, 15577.0, 163361.0, 770657.0, 79017.0, 9986.0, 2393.0, 862.0, 418.0, 219.0, 129.0, 74.0, 44.0, 35.0, 20.0, 18.0, 10.0, 10.0, 5.0, 7.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6796875, -0.6614990234375, -0.643310546875, -0.6251220703125, -0.60693359375, -0.5887451171875, -0.570556640625, -0.5523681640625, -0.5341796875, -0.5159912109375, -0.497802734375, -0.4796142578125, -0.46142578125, -0.4432373046875, -0.425048828125, -0.4068603515625, -0.388671875, -0.3704833984375, -0.352294921875, -0.3341064453125, -0.31591796875, -0.2977294921875, -0.279541015625, -0.2613525390625, -0.2431640625, -0.2249755859375, -0.206787109375, -0.1885986328125, -0.17041015625, -0.1522216796875, -0.134033203125, -0.1158447265625, -0.09765625, -0.0794677734375, -0.061279296875, -0.0430908203125, -0.02490234375, -0.0067138671875, 0.011474609375, 0.0296630859375, 0.0478515625, 0.0660400390625, 0.084228515625, 0.1024169921875, 0.12060546875, 0.1387939453125, 0.156982421875, 0.1751708984375, 0.193359375, 0.2115478515625, 0.229736328125, 0.2479248046875, 0.26611328125, 0.2843017578125, 0.302490234375, 0.3206787109375, 0.3388671875, 0.3570556640625, 0.375244140625, 0.3934326171875, 0.41162109375, 0.4298095703125, 0.447998046875, 0.4661865234375, 0.484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 14.0, 16.0, 20.0, 27.0, 31.0, 35.0, 39.0, 40.0, 70.0, 61.0, 57.0, 57.0, 53.0, 49.0, 49.0, 56.0, 42.0, 39.0, 52.0, 39.0, 34.0, 25.0, 19.0, 11.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.375, -2.3097686767578125, -2.244537353515625, -2.1793060302734375, -2.11407470703125, -2.0488433837890625, -1.983612060546875, -1.9183807373046875, -1.8531494140625, -1.7879180908203125, -1.722686767578125, -1.6574554443359375, -1.59222412109375, -1.5269927978515625, -1.461761474609375, -1.3965301513671875, -1.331298828125, -1.2660675048828125, -1.200836181640625, -1.1356048583984375, -1.07037353515625, -1.0051422119140625, -0.939910888671875, -0.8746795654296875, -0.8094482421875, -0.7442169189453125, -0.678985595703125, -0.6137542724609375, -0.54852294921875, -0.4832916259765625, -0.418060302734375, -0.3528289794921875, -0.28759765625, -0.2223663330078125, -0.157135009765625, -0.0919036865234375, -0.02667236328125, 0.0385589599609375, 0.103790283203125, 0.1690216064453125, 0.2342529296875, 0.2994842529296875, 0.364715576171875, 0.4299468994140625, 0.49517822265625, 0.5604095458984375, 0.625640869140625, 0.6908721923828125, 0.756103515625, 0.8213348388671875, 0.886566162109375, 0.9517974853515625, 1.01702880859375, 1.0822601318359375, 1.147491455078125, 1.2127227783203125, 1.2779541015625, 1.3431854248046875, 1.408416748046875, 1.4736480712890625, 1.53887939453125, 1.6041107177734375, 1.669342041015625, 1.7345733642578125, 1.7998046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 12.0, 17.0, 19.0, 20.0, 22.0, 42.0, 43.0, 71.0, 104.0, 124.0, 186.0, 247.0, 421.0, 649.0, 1958.0, 16362.0, 364427.0, 628969.0, 29768.0, 2769.0, 805.0, 482.0, 269.0, 222.0, 144.0, 105.0, 76.0, 61.0, 44.0, 22.0, 17.0, 15.0, 13.0, 9.0, 8.0, 6.0, 2.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.3927574157714844, -0.37926483154296875, -0.3657722473144531, -0.3522796630859375, -0.3387870788574219, -0.32529449462890625, -0.3118019104003906, -0.298309326171875, -0.2848167419433594, -0.27132415771484375, -0.2578315734863281, -0.2443389892578125, -0.23084640502929688, -0.21735382080078125, -0.20386123657226562, -0.19036865234375, -0.17687606811523438, -0.16338348388671875, -0.14989089965820312, -0.1363983154296875, -0.12290573120117188, -0.10941314697265625, -0.09592056274414062, -0.082427978515625, -0.06893539428710938, -0.05544281005859375, -0.041950225830078125, -0.0284576416015625, -0.014965057373046875, -0.00147247314453125, 0.012020111083984375, 0.0255126953125, 0.039005279541015625, 0.05249786376953125, 0.06599044799804688, 0.0794830322265625, 0.09297561645507812, 0.10646820068359375, 0.11996078491210938, 0.133453369140625, 0.14694595336914062, 0.16043853759765625, 0.17393112182617188, 0.1874237060546875, 0.20091629028320312, 0.21440887451171875, 0.22790145874023438, 0.24139404296875, 0.2548866271972656, 0.26837921142578125, 0.2818717956542969, 0.2953643798828125, 0.3088569641113281, 0.32234954833984375, 0.3358421325683594, 0.349334716796875, 0.3628273010253906, 0.37631988525390625, 0.3898124694824219, 0.4033050537109375, 0.4167976379394531, 0.43029022216796875, 0.4437828063964844, 0.457275390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 16.0, 13.0, 13.0, 11.0, 15.0, 10.0, 26.0, 20.0, 22.0, 27.0, 34.0, 38.0, 44.0, 46.0, 56.0, 46.0, 53.0, 44.0, 50.0, 52.0, 38.0, 39.0, 34.0, 27.0, 31.0, 31.0, 24.0, 20.0, 19.0, 18.0, 12.0, 10.0, 8.0, 6.0, 8.0, 6.0, 2.0, 4.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.11328125, -3.012359619140625, -2.91143798828125, -2.810516357421875, -2.7095947265625, -2.608673095703125, -2.50775146484375, -2.406829833984375, -2.305908203125, -2.204986572265625, -2.10406494140625, -2.003143310546875, -1.9022216796875, -1.801300048828125, -1.70037841796875, -1.599456787109375, -1.49853515625, -1.397613525390625, -1.29669189453125, -1.195770263671875, -1.0948486328125, -0.993927001953125, -0.89300537109375, -0.792083740234375, -0.691162109375, -0.590240478515625, -0.48931884765625, -0.388397216796875, -0.2874755859375, -0.186553955078125, -0.08563232421875, 0.015289306640625, 0.1162109375, 0.217132568359375, 0.31805419921875, 0.418975830078125, 0.5198974609375, 0.620819091796875, 0.72174072265625, 0.822662353515625, 0.923583984375, 1.024505615234375, 1.12542724609375, 1.226348876953125, 1.3272705078125, 1.428192138671875, 1.52911376953125, 1.630035400390625, 1.73095703125, 1.831878662109375, 1.93280029296875, 2.033721923828125, 2.1346435546875, 2.235565185546875, 2.33648681640625, 2.437408447265625, 2.538330078125, 2.639251708984375, 2.74017333984375, 2.841094970703125, 2.9420166015625, 3.042938232421875, 3.14385986328125, 3.244781494140625, 3.345703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 7.0, 11.0, 23.0, 13.0, 30.0, 33.0, 43.0, 73.0, 79.0, 101.0, 129.0, 188.0, 337.0, 758.0, 3397.0, 48043.0, 957843.0, 32812.0, 2943.0, 698.0, 271.0, 176.0, 137.0, 100.0, 70.0, 48.0, 42.0, 27.0, 24.0, 18.0, 15.0, 11.0, 5.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1070556640625, -0.10385417938232422, -0.10065269470214844, -0.09745121002197266, -0.09424972534179688, -0.0910482406616211, -0.08784675598144531, -0.08464527130126953, -0.08144378662109375, -0.07824230194091797, -0.07504081726074219, -0.0718393325805664, -0.06863784790039062, -0.06543636322021484, -0.06223487854003906, -0.05903339385986328, -0.0558319091796875, -0.05263042449951172, -0.04942893981933594, -0.046227455139160156, -0.043025970458984375, -0.039824485778808594, -0.03662300109863281, -0.03342151641845703, -0.03022003173828125, -0.02701854705810547, -0.023817062377929688, -0.020615577697753906, -0.017414093017578125, -0.014212608337402344, -0.011011123657226562, -0.007809638977050781, -0.004608154296875, -0.0014066696166992188, 0.0017948150634765625, 0.004996299743652344, 0.008197784423828125, 0.011399269104003906, 0.014600753784179688, 0.01780223846435547, 0.02100372314453125, 0.02420520782470703, 0.027406692504882812, 0.030608177185058594, 0.033809661865234375, 0.037011146545410156, 0.04021263122558594, 0.04341411590576172, 0.0466156005859375, 0.04981708526611328, 0.05301856994628906, 0.056220054626464844, 0.059421539306640625, 0.0626230239868164, 0.06582450866699219, 0.06902599334716797, 0.07222747802734375, 0.07542896270751953, 0.07863044738769531, 0.0818319320678711, 0.08503341674804688, 0.08823490142822266, 0.09143638610839844, 0.09463787078857422, 0.09783935546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 3.0, 8.0, 12.0, 16.0, 12.0, 29.0, 46.0, 65.0, 99.0, 135.0, 145.0, 123.0, 92.0, 57.0, 51.0, 25.0, 17.0, 15.0, 10.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.286823630332947e-05, -3.1463801860809326e-05, -3.0059367418289185e-05, -2.8654932975769043e-05, -2.72504985332489e-05, -2.584606409072876e-05, -2.4441629648208618e-05, -2.3037195205688477e-05, -2.1632760763168335e-05, -2.0228326320648193e-05, -1.8823891878128052e-05, -1.741945743560791e-05, -1.601502299308777e-05, -1.4610588550567627e-05, -1.3206154108047485e-05, -1.1801719665527344e-05, -1.0397285223007202e-05, -8.99285078048706e-06, -7.588416337966919e-06, -6.183981895446777e-06, -4.779547452926636e-06, -3.375113010406494e-06, -1.9706785678863525e-06, -5.662441253662109e-07, 8.381903171539307e-07, 2.2426247596740723e-06, 3.647059202194214e-06, 5.0514936447143555e-06, 6.455928087234497e-06, 7.860362529754639e-06, 9.26479697227478e-06, 1.0669231414794922e-05, 1.2073665857315063e-05, 1.3478100299835205e-05, 1.4882534742355347e-05, 1.6286969184875488e-05, 1.769140362739563e-05, 1.909583806991577e-05, 2.0500272512435913e-05, 2.1904706954956055e-05, 2.3309141397476196e-05, 2.4713575839996338e-05, 2.611801028251648e-05, 2.752244472503662e-05, 2.8926879167556763e-05, 3.0331313610076904e-05, 3.1735748052597046e-05, 3.314018249511719e-05, 3.454461693763733e-05, 3.594905138015747e-05, 3.735348582267761e-05, 3.8757920265197754e-05, 4.0162354707717896e-05, 4.156678915023804e-05, 4.297122359275818e-05, 4.437565803527832e-05, 4.578009247779846e-05, 4.7184526920318604e-05, 4.8588961362838745e-05, 4.999339580535889e-05, 5.139783024787903e-05, 5.280226469039917e-05, 5.420669913291931e-05, 5.561113357543945e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 15.0, 20.0, 32.0, 38.0, 58.0, 98.0, 107.0, 169.0, 270.0, 394.0, 591.0, 950.0, 1776.0, 3961.0, 11438.0, 49538.0, 733485.0, 206628.0, 25215.0, 7246.0, 2778.0, 1416.0, 805.0, 462.0, 333.0, 204.0, 159.0, 113.0, 71.0, 53.0, 28.0, 23.0, 12.0, 14.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.0985250473022461, -0.09542655944824219, -0.09232807159423828, -0.08922958374023438, -0.08613109588623047, -0.08303260803222656, -0.07993412017822266, -0.07683563232421875, -0.07373714447021484, -0.07063865661621094, -0.06754016876220703, -0.06444168090820312, -0.06134319305419922, -0.05824470520019531, -0.055146217346191406, -0.0520477294921875, -0.048949241638183594, -0.04585075378417969, -0.04275226593017578, -0.039653778076171875, -0.03655529022216797, -0.03345680236816406, -0.030358314514160156, -0.02725982666015625, -0.024161338806152344, -0.021062850952148438, -0.01796436309814453, -0.014865875244140625, -0.011767387390136719, -0.008668899536132812, -0.005570411682128906, -0.002471923828125, 0.0006265640258789062, 0.0037250518798828125, 0.006823539733886719, 0.009922027587890625, 0.013020515441894531, 0.016119003295898438, 0.019217491149902344, 0.02231597900390625, 0.025414466857910156, 0.028512954711914062, 0.03161144256591797, 0.034709930419921875, 0.03780841827392578, 0.04090690612792969, 0.044005393981933594, 0.0471038818359375, 0.050202369689941406, 0.05330085754394531, 0.05639934539794922, 0.059497833251953125, 0.06259632110595703, 0.06569480895996094, 0.06879329681396484, 0.07189178466796875, 0.07499027252197266, 0.07808876037597656, 0.08118724822998047, 0.08428573608398438, 0.08738422393798828, 0.09048271179199219, 0.0935811996459961, 0.0966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 13.0, 9.0, 19.0, 19.0, 28.0, 44.0, 73.0, 150.0, 313.0, 124.0, 73.0, 40.0, 20.0, 23.0, 10.0, 11.0, 6.0, 7.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.020904541015625, -0.020277976989746094, -0.019651412963867188, -0.01902484893798828, -0.018398284912109375, -0.01777172088623047, -0.017145156860351562, -0.016518592834472656, -0.01589202880859375, -0.015265464782714844, -0.014638900756835938, -0.014012336730957031, -0.013385772705078125, -0.012759208679199219, -0.012132644653320312, -0.011506080627441406, -0.0108795166015625, -0.010252952575683594, -0.009626388549804688, -0.008999824523925781, -0.008373260498046875, -0.007746696472167969, -0.0071201324462890625, -0.006493568420410156, -0.00586700439453125, -0.005240440368652344, -0.0046138763427734375, -0.003987312316894531, -0.003360748291015625, -0.0027341842651367188, -0.0021076202392578125, -0.0014810562133789062, -0.0008544921875, -0.00022792816162109375, 0.0003986358642578125, 0.0010251998901367188, 0.001651763916015625, 0.0022783279418945312, 0.0029048919677734375, 0.0035314559936523438, 0.00415802001953125, 0.004784584045410156, 0.0054111480712890625, 0.006037712097167969, 0.006664276123046875, 0.007290840148925781, 0.007917404174804688, 0.008543968200683594, 0.0091705322265625, 0.009797096252441406, 0.010423660278320312, 0.011050224304199219, 0.011676788330078125, 0.012303352355957031, 0.012929916381835938, 0.013556480407714844, 0.01418304443359375, 0.014809608459472656, 0.015436172485351562, 0.01606273651123047, 0.016689300537109375, 0.01731586456298828, 0.017942428588867188, 0.018568992614746094, 0.019195556640625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 10.0, 12.0, 15.0, 19.0, 24.0, 26.0, 40.0, 60.0, 73.0, 71.0, 67.0, 82.0, 84.0, 73.0, 78.0, 69.0, 43.0, 36.0, 16.0, 20.0, 14.0, 15.0, 11.0, 11.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5374808311462402, -2.4661457538604736, -2.394810438156128, -2.3234753608703613, -2.2521400451660156, -2.180804967880249, -2.1094696521759033, -2.0381345748901367, -1.9667993783950806, -1.8954641819000244, -1.8241289854049683, -1.752793788909912, -1.6814587116241455, -1.6101233959197998, -1.5387883186340332, -1.467453122138977, -1.396117925643921, -1.3247827291488647, -1.2534475326538086, -1.1821123361587524, -1.1107771396636963, -1.0394420623779297, -0.9681068658828735, -0.8967716693878174, -0.8254364728927612, -0.7541012763977051, -0.6827660799026489, -0.6114309430122375, -0.5400957465171814, -0.46876055002212524, -0.3974253833293915, -0.3260902166366577, -0.25475478172302246, -0.1834196001291275, -0.11208441853523254, -0.040749236941337585, 0.030585944652557373, 0.10192114114761353, 0.1732563078403473, 0.24459147453308105, 0.3159266710281372, 0.38726186752319336, 0.4585970342159271, 0.5299322009086609, 0.601267397403717, 0.6726025938987732, 0.7439377307891846, 0.8152729272842407, 0.8866081237792969, 0.957943320274353, 1.0292785167694092, 1.1006137132644653, 1.1719489097595215, 1.243283987045288, 1.3146191835403442, 1.3859543800354004, 1.4572895765304565, 1.5286247730255127, 1.5999599695205688, 1.671295166015625, 1.7426302433013916, 1.8139655590057373, 1.885300636291504, 1.95663583278656, 2.027971029281616]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 11.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 28.0, 28.0, 46.0, 48.0, 49.0, 55.0, 55.0, 38.0, 51.0, 55.0, 52.0, 59.0, 40.0, 34.0, 37.0, 35.0, 28.0, 40.0, 24.0, 20.0, 14.0, 13.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.021963596343994, -1.965125560760498, -1.908287525177002, -1.8514493703842163, -1.7946113348007202, -1.7377732992172241, -1.680935263633728, -1.6240971088409424, -1.5672590732574463, -1.5104210376739502, -1.453583002090454, -1.3967448472976685, -1.3399068117141724, -1.2830687761306763, -1.2262307405471802, -1.1693925857543945, -1.1125545501708984, -1.0557165145874023, -0.9988784193992615, -0.9420403838157654, -0.8852022886276245, -0.8283642530441284, -0.7715262174606323, -0.7146881222724915, -0.6578501462936401, -0.601012110710144, -0.5441740155220032, -0.4873359799385071, -0.4304978847503662, -0.3736598491668701, -0.31682178378105164, -0.25998371839523315, -0.20314562320709229, -0.1463075578212738, -0.08946949988603592, -0.032631441950798035, 0.024206623435020447, 0.08104467391967773, 0.13788273930549622, 0.1947208046913147, 0.2515588700771332, 0.30839693546295166, 0.36523500084877014, 0.4220730662345886, 0.4789111018180847, 0.5357491970062256, 0.5925872325897217, 0.6494252681732178, 0.7062633633613586, 0.7631013989448547, 0.8199394941329956, 0.8767775297164917, 0.9336156249046326, 0.9904536604881287, 1.0472917556762695, 1.1041297912597656, 1.1609678268432617, 1.2178058624267578, 1.274643898010254, 1.3314820528030396, 1.3883200883865356, 1.4451581239700317, 1.5019961595535278, 1.5588343143463135, 1.6156723499298096]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 10.0, 12.0, 23.0, 34.0, 54.0, 81.0, 134.0, 217.0, 370.0, 702.0, 1362.0, 2771.0, 5869.0, 13882.0, 34635.0, 95545.0, 393401.0, 354280.0, 88529.0, 32467.0, 13193.0, 5569.0, 2573.0, 1231.0, 683.0, 377.0, 206.0, 128.0, 77.0, 47.0, 37.0, 18.0, 12.0, 6.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.3515625, -3.269744873046875, -3.18792724609375, -3.106109619140625, -3.0242919921875, -2.942474365234375, -2.86065673828125, -2.778839111328125, -2.697021484375, -2.615203857421875, -2.53338623046875, -2.451568603515625, -2.3697509765625, -2.287933349609375, -2.20611572265625, -2.124298095703125, -2.04248046875, -1.960662841796875, -1.87884521484375, -1.797027587890625, -1.7152099609375, -1.633392333984375, -1.55157470703125, -1.469757080078125, -1.387939453125, -1.306121826171875, -1.22430419921875, -1.142486572265625, -1.0606689453125, -0.978851318359375, -0.89703369140625, -0.815216064453125, -0.7333984375, -0.651580810546875, -0.56976318359375, -0.487945556640625, -0.4061279296875, -0.324310302734375, -0.24249267578125, -0.160675048828125, -0.078857421875, 0.002960205078125, 0.08477783203125, 0.166595458984375, 0.2484130859375, 0.330230712890625, 0.41204833984375, 0.493865966796875, 0.57568359375, 0.657501220703125, 0.73931884765625, 0.821136474609375, 0.9029541015625, 0.984771728515625, 1.06658935546875, 1.148406982421875, 1.230224609375, 1.312042236328125, 1.39385986328125, 1.475677490234375, 1.5574951171875, 1.639312744140625, 1.72113037109375, 1.802947998046875, 1.884765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 12.0, 9.0, 15.0, 20.0, 20.0, 29.0, 38.0, 43.0, 47.0, 59.0, 50.0, 67.0, 75.0, 54.0, 65.0, 60.0, 45.0, 48.0, 36.0, 36.0, 42.0, 16.0, 22.0, 18.0, 12.0, 8.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.57232666015625, -4.4337158203125, -4.29510498046875, -4.156494140625, -4.01788330078125, -3.8792724609375, -3.74066162109375, -3.60205078125, -3.46343994140625, -3.3248291015625, -3.18621826171875, -3.047607421875, -2.90899658203125, -2.7703857421875, -2.63177490234375, -2.4931640625, -2.35455322265625, -2.2159423828125, -2.07733154296875, -1.938720703125, -1.80010986328125, -1.6614990234375, -1.52288818359375, -1.38427734375, -1.24566650390625, -1.1070556640625, -0.96844482421875, -0.829833984375, -0.69122314453125, -0.5526123046875, -0.41400146484375, -0.275390625, -0.13677978515625, 0.0018310546875, 0.14044189453125, 0.279052734375, 0.41766357421875, 0.5562744140625, 0.69488525390625, 0.83349609375, 0.97210693359375, 1.1107177734375, 1.24932861328125, 1.387939453125, 1.52655029296875, 1.6651611328125, 1.80377197265625, 1.9423828125, 2.08099365234375, 2.2196044921875, 2.35821533203125, 2.496826171875, 2.63543701171875, 2.7740478515625, 2.91265869140625, 3.05126953125, 3.18988037109375, 3.3284912109375, 3.46710205078125, 3.605712890625, 3.74432373046875, 3.8829345703125, 4.02154541015625, 4.16015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 10.0, 7.0, 12.0, 21.0, 31.0, 42.0, 89.0, 164.0, 336.0, 861.0, 3169.0, 16124.0, 107810.0, 764585.0, 130658.0, 19225.0, 3662.0, 992.0, 320.0, 159.0, 96.0, 59.0, 33.0, 24.0, 14.0, 9.0, 7.0, 8.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.22314453125, -4.0751953125, -3.92724609375, -3.779296875, -3.63134765625, -3.4833984375, -3.33544921875, -3.1875, -3.03955078125, -2.8916015625, -2.74365234375, -2.595703125, -2.44775390625, -2.2998046875, -2.15185546875, -2.00390625, -1.85595703125, -1.7080078125, -1.56005859375, -1.412109375, -1.26416015625, -1.1162109375, -0.96826171875, -0.8203125, -0.67236328125, -0.5244140625, -0.37646484375, -0.228515625, -0.08056640625, 0.0673828125, 0.21533203125, 0.36328125, 0.51123046875, 0.6591796875, 0.80712890625, 0.955078125, 1.10302734375, 1.2509765625, 1.39892578125, 1.546875, 1.69482421875, 1.8427734375, 1.99072265625, 2.138671875, 2.28662109375, 2.4345703125, 2.58251953125, 2.73046875, 2.87841796875, 3.0263671875, 3.17431640625, 3.322265625, 3.47021484375, 3.6181640625, 3.76611328125, 3.9140625, 4.06201171875, 4.2099609375, 4.35791015625, 4.505859375, 4.65380859375, 4.8017578125, 4.94970703125, 5.09765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 8.0, 5.0, 3.0, 5.0, 10.0, 12.0, 15.0, 19.0, 19.0, 29.0, 20.0, 24.0, 32.0, 32.0, 38.0, 34.0, 37.0, 41.0, 45.0, 45.0, 45.0, 35.0, 50.0, 40.0, 41.0, 50.0, 44.0, 35.0, 23.0, 25.0, 20.0, 30.0, 14.0, 10.0, 12.0, 11.0, 3.0, 12.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0], "bins": [-4.8984375, -4.76483154296875, -4.6312255859375, -4.49761962890625, -4.364013671875, -4.23040771484375, -4.0968017578125, -3.96319580078125, -3.82958984375, -3.69598388671875, -3.5623779296875, -3.42877197265625, -3.295166015625, -3.16156005859375, -3.0279541015625, -2.89434814453125, -2.7607421875, -2.62713623046875, -2.4935302734375, -2.35992431640625, -2.226318359375, -2.09271240234375, -1.9591064453125, -1.82550048828125, -1.69189453125, -1.55828857421875, -1.4246826171875, -1.29107666015625, -1.157470703125, -1.02386474609375, -0.8902587890625, -0.75665283203125, -0.623046875, -0.48944091796875, -0.3558349609375, -0.22222900390625, -0.088623046875, 0.04498291015625, 0.1785888671875, 0.31219482421875, 0.44580078125, 0.57940673828125, 0.7130126953125, 0.84661865234375, 0.980224609375, 1.11383056640625, 1.2474365234375, 1.38104248046875, 1.5146484375, 1.64825439453125, 1.7818603515625, 1.91546630859375, 2.049072265625, 2.18267822265625, 2.3162841796875, 2.44989013671875, 2.58349609375, 2.71710205078125, 2.8507080078125, 2.98431396484375, 3.117919921875, 3.25152587890625, 3.3851318359375, 3.51873779296875, 3.65234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 11.0, 10.0, 14.0, 24.0, 54.0, 88.0, 237.0, 796.0, 3262.0, 19248.0, 298202.0, 681017.0, 38633.0, 5137.0, 1263.0, 325.0, 121.0, 51.0, 25.0, 19.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.9510345458984375, -1.888397216796875, -1.8257598876953125, -1.76312255859375, -1.7004852294921875, -1.637847900390625, -1.5752105712890625, -1.5125732421875, -1.4499359130859375, -1.387298583984375, -1.3246612548828125, -1.26202392578125, -1.1993865966796875, -1.136749267578125, -1.0741119384765625, -1.011474609375, -0.9488372802734375, -0.886199951171875, -0.8235626220703125, -0.76092529296875, -0.6982879638671875, -0.635650634765625, -0.5730133056640625, -0.5103759765625, -0.4477386474609375, -0.385101318359375, -0.3224639892578125, -0.25982666015625, -0.1971893310546875, -0.134552001953125, -0.0719146728515625, -0.00927734375, 0.0533599853515625, 0.115997314453125, 0.1786346435546875, 0.24127197265625, 0.3039093017578125, 0.366546630859375, 0.4291839599609375, 0.4918212890625, 0.5544586181640625, 0.617095947265625, 0.6797332763671875, 0.74237060546875, 0.8050079345703125, 0.867645263671875, 0.9302825927734375, 0.992919921875, 1.0555572509765625, 1.118194580078125, 1.1808319091796875, 1.24346923828125, 1.3061065673828125, 1.368743896484375, 1.4313812255859375, 1.4940185546875, 1.5566558837890625, 1.619293212890625, 1.6819305419921875, 1.74456787109375, 1.8072052001953125, 1.869842529296875, 1.9324798583984375, 1.9951171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 9.0, 3.0, 4.0, 17.0, 14.0, 21.0, 50.0, 44.0, 67.0, 86.0, 121.0, 149.0, 98.0, 91.0, 54.0, 54.0, 35.0, 17.0, 18.0, 10.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002124309539794922, -0.00020492449402809143, -0.00019741803407669067, -0.00018991157412528992, -0.00018240511417388916, -0.0001748986542224884, -0.00016739219427108765, -0.0001598857343196869, -0.00015237927436828613, -0.00014487281441688538, -0.00013736635446548462, -0.00012985989451408386, -0.0001223534345626831, -0.00011484697461128235, -0.00010734051465988159, -9.983405470848083e-05, -9.232759475708008e-05, -8.482113480567932e-05, -7.731467485427856e-05, -6.980821490287781e-05, -6.230175495147705e-05, -5.4795295000076294e-05, -4.728883504867554e-05, -3.978237509727478e-05, -3.2275915145874023e-05, -2.4769455194473267e-05, -1.726299524307251e-05, -9.756535291671753e-06, -2.250075340270996e-06, 5.256384611129761e-06, 1.2762844562530518e-05, 2.0269304513931274e-05, 2.777576446533203e-05, 3.528222441673279e-05, 4.2788684368133545e-05, 5.02951443195343e-05, 5.780160427093506e-05, 6.530806422233582e-05, 7.281452417373657e-05, 8.032098412513733e-05, 8.782744407653809e-05, 9.533390402793884e-05, 0.0001028403639793396, 0.00011034682393074036, 0.00011785328388214111, 0.00012535974383354187, 0.00013286620378494263, 0.00014037266373634338, 0.00014787912368774414, 0.0001553855836391449, 0.00016289204359054565, 0.0001703985035419464, 0.00017790496349334717, 0.00018541142344474792, 0.00019291788339614868, 0.00020042434334754944, 0.0002079308032989502, 0.00021543726325035095, 0.0002229437232017517, 0.00023045018315315247, 0.00023795664310455322, 0.000245463103055954, 0.00025296956300735474, 0.0002604760229587555, 0.00026798248291015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 5.0, 15.0, 16.0, 23.0, 26.0, 50.0, 59.0, 99.0, 171.0, 373.0, 742.0, 1611.0, 3779.0, 10657.0, 38340.0, 188881.0, 596461.0, 157847.0, 33429.0, 9475.0, 3485.0, 1523.0, 680.0, 322.0, 171.0, 112.0, 59.0, 42.0, 31.0, 21.0, 12.0, 8.0, 7.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9521484375, -0.91473388671875, -0.8773193359375, -0.83990478515625, -0.802490234375, -0.76507568359375, -0.7276611328125, -0.69024658203125, -0.65283203125, -0.61541748046875, -0.5780029296875, -0.54058837890625, -0.503173828125, -0.46575927734375, -0.4283447265625, -0.39093017578125, -0.353515625, -0.31610107421875, -0.2786865234375, -0.24127197265625, -0.203857421875, -0.16644287109375, -0.1290283203125, -0.09161376953125, -0.05419921875, -0.01678466796875, 0.0206298828125, 0.05804443359375, 0.095458984375, 0.13287353515625, 0.1702880859375, 0.20770263671875, 0.2451171875, 0.28253173828125, 0.3199462890625, 0.35736083984375, 0.394775390625, 0.43218994140625, 0.4696044921875, 0.50701904296875, 0.54443359375, 0.58184814453125, 0.6192626953125, 0.65667724609375, 0.694091796875, 0.73150634765625, 0.7689208984375, 0.80633544921875, 0.84375, 0.88116455078125, 0.9185791015625, 0.95599365234375, 0.993408203125, 1.03082275390625, 1.0682373046875, 1.10565185546875, 1.14306640625, 1.18048095703125, 1.2178955078125, 1.25531005859375, 1.292724609375, 1.33013916015625, 1.3675537109375, 1.40496826171875, 1.4423828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 8.0, 15.0, 7.0, 18.0, 17.0, 20.0, 36.0, 39.0, 34.0, 51.0, 67.0, 86.0, 79.0, 104.0, 86.0, 71.0, 50.0, 43.0, 45.0, 22.0, 25.0, 24.0, 9.0, 6.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4755973815917969, -0.45925140380859375, -0.4429054260253906, -0.4265594482421875, -0.4102134704589844, -0.39386749267578125, -0.3775215148925781, -0.361175537109375, -0.3448295593261719, -0.32848358154296875, -0.3121376037597656, -0.2957916259765625, -0.2794456481933594, -0.26309967041015625, -0.24675369262695312, -0.23040771484375, -0.21406173706054688, -0.19771575927734375, -0.18136978149414062, -0.1650238037109375, -0.14867782592773438, -0.13233184814453125, -0.11598587036132812, -0.099639892578125, -0.08329391479492188, -0.06694793701171875, -0.050601959228515625, -0.0342559814453125, -0.017910003662109375, -0.00156402587890625, 0.014781951904296875, 0.0311279296875, 0.047473907470703125, 0.06381988525390625, 0.08016586303710938, 0.0965118408203125, 0.11285781860351562, 0.12920379638671875, 0.14554977416992188, 0.161895751953125, 0.17824172973632812, 0.19458770751953125, 0.21093368530273438, 0.2272796630859375, 0.24362564086914062, 0.25997161865234375, 0.2763175964355469, 0.29266357421875, 0.3090095520019531, 0.32535552978515625, 0.3417015075683594, 0.3580474853515625, 0.3743934631347656, 0.39073944091796875, 0.4070854187011719, 0.423431396484375, 0.4397773742675781, 0.45612335205078125, 0.4724693298339844, 0.4888153076171875, 0.5051612854003906, 0.5215072631835938, 0.5378532409667969, 0.55419921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 10.0, 34.0, 139.0, 350.0, 345.0, 107.0, 25.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12266731262207, -3.290733575820923, -2.4587998390197754, -1.626866102218628, -0.7949323654174805, 0.037001609802246094, 0.8689351081848145, 1.7008686065673828, 2.5328025817871094, 3.364736318588257, 4.196670055389404, 5.028603553771973, 5.860537528991699, 6.692471504211426, 7.524405002593994, 8.356338500976562, 9.188272476196289, 10.020206451416016, 10.852140426635742, 11.684073448181152, 12.516007423400879, 13.347941398620605, 14.179874420166016, 15.011808395385742, 15.843742370605469, 16.675676345825195, 17.507610321044922, 18.33954429626465, 19.171478271484375, 20.00341033935547, 20.835344314575195, 21.667278289794922, 22.499210357666016, 23.331144332885742, 24.16307830810547, 24.995012283325195, 25.826946258544922, 26.658878326416016, 27.490812301635742, 28.32274627685547, 29.154680252075195, 29.986614227294922, 30.81854820251465, 31.650482177734375, 32.48241424560547, 33.31435012817383, 34.14628219604492, 34.97821807861328, 35.810150146484375, 36.64208221435547, 37.47401809692383, 38.30595016479492, 39.13788604736328, 39.969818115234375, 40.801753997802734, 41.63368606567383, 42.46562194824219, 43.29755401611328, 44.12948989868164, 44.961421966552734, 45.793357849121094, 46.62528991699219, 47.45722579956055, 48.28915786743164, 49.121089935302734]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 9.0, 6.0, 5.0, 9.0, 5.0, 10.0, 8.0, 21.0, 20.0, 21.0, 27.0, 26.0, 33.0, 28.0, 26.0, 25.0, 28.0, 36.0, 25.0, 32.0, 40.0, 45.0, 45.0, 33.0, 33.0, 29.0, 36.0, 38.0, 38.0, 24.0, 31.0, 38.0, 21.0, 22.0, 21.0, 22.0, 11.0, 16.0, 10.0, 13.0, 9.0, 11.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.895088195800781, -6.673768997192383, -6.452449321746826, -6.231130123138428, -6.009810447692871, -5.788491249084473, -5.567172050476074, -5.345852851867676, -5.124533176422119, -4.903213977813721, -4.681894302368164, -4.460575103759766, -4.239255905151367, -4.0179362297058105, -3.796617031097412, -3.5752975940704346, -3.353978157043457, -3.1326587200164795, -2.911339282989502, -2.6900200843811035, -2.468700647354126, -2.2473812103271484, -2.02606201171875, -1.8047425746917725, -1.583423137664795, -1.3621037006378174, -1.1407843828201294, -0.9194650053977966, -0.6981456279754639, -0.47682619094848633, -0.25550687313079834, -0.03418755531311035, 0.1871318817138672, 0.40845125913619995, 0.6297706365585327, 0.8510900139808655, 1.0724093914031982, 1.2937288284301758, 1.5150481462478638, 1.7363674640655518, 1.9576869010925293, 2.179006338119507, 2.4003257751464844, 2.621644973754883, 2.8429644107818604, 3.064283847808838, 3.2856030464172363, 3.506922483444214, 3.7282419204711914, 3.949561357498169, 4.1708807945251465, 4.392199993133545, 4.613519668579102, 4.8348388671875, 5.056158065795898, 5.277477264404297, 5.4987969398498535, 5.720116138458252, 5.941435813903809, 6.162755012512207, 6.3840742111206055, 6.605393886566162, 6.8267130851745605, 7.048032760620117, 7.269351959228516]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 3.0, 4.0, 12.0, 10.0, 14.0, 18.0, 19.0, 32.0, 37.0, 42.0, 77.0, 113.0, 249.0, 529.0, 1460.0, 5537.0, 31550.0, 481842.0, 3501949.0, 149303.0, 16097.0, 3361.0, 1030.0, 427.0, 171.0, 118.0, 60.0, 50.0, 37.0, 27.0, 23.0, 18.0, 16.0, 13.0, 7.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-7.06640625, -6.88671875, -6.70703125, -6.52734375, -6.34765625, -6.16796875, -5.98828125, -5.80859375, -5.62890625, -5.44921875, -5.26953125, -5.08984375, -4.91015625, -4.73046875, -4.55078125, -4.37109375, -4.19140625, -4.01171875, -3.83203125, -3.65234375, -3.47265625, -3.29296875, -3.11328125, -2.93359375, -2.75390625, -2.57421875, -2.39453125, -2.21484375, -2.03515625, -1.85546875, -1.67578125, -1.49609375, -1.31640625, -1.13671875, -0.95703125, -0.77734375, -0.59765625, -0.41796875, -0.23828125, -0.05859375, 0.12109375, 0.30078125, 0.48046875, 0.66015625, 0.83984375, 1.01953125, 1.19921875, 1.37890625, 1.55859375, 1.73828125, 1.91796875, 2.09765625, 2.27734375, 2.45703125, 2.63671875, 2.81640625, 2.99609375, 3.17578125, 3.35546875, 3.53515625, 3.71484375, 3.89453125, 4.07421875, 4.25390625, 4.43359375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 8.0, 7.0, 6.0, 5.0, 11.0, 13.0, 18.0, 13.0, 15.0, 18.0, 39.0, 37.0, 37.0, 30.0, 49.0, 45.0, 36.0, 41.0, 38.0, 50.0, 52.0, 57.0, 42.0, 37.0, 40.0, 31.0, 33.0, 27.0, 28.0, 23.0, 17.0, 19.0, 15.0, 18.0, 7.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.457000732421875, -1.41204833984375, -1.367095947265625, -1.3221435546875, -1.277191162109375, -1.23223876953125, -1.187286376953125, -1.142333984375, -1.097381591796875, -1.05242919921875, -1.007476806640625, -0.9625244140625, -0.917572021484375, -0.87261962890625, -0.827667236328125, -0.78271484375, -0.737762451171875, -0.69281005859375, -0.647857666015625, -0.6029052734375, -0.557952880859375, -0.51300048828125, -0.468048095703125, -0.423095703125, -0.378143310546875, -0.33319091796875, -0.288238525390625, -0.2432861328125, -0.198333740234375, -0.15338134765625, -0.108428955078125, -0.0634765625, -0.018524169921875, 0.02642822265625, 0.071380615234375, 0.1163330078125, 0.161285400390625, 0.20623779296875, 0.251190185546875, 0.296142578125, 0.341094970703125, 0.38604736328125, 0.430999755859375, 0.4759521484375, 0.520904541015625, 0.56585693359375, 0.610809326171875, 0.65576171875, 0.700714111328125, 0.74566650390625, 0.790618896484375, 0.8355712890625, 0.880523681640625, 0.92547607421875, 0.970428466796875, 1.015380859375, 1.060333251953125, 1.10528564453125, 1.150238037109375, 1.1951904296875, 1.240142822265625, 1.28509521484375, 1.330047607421875, 1.375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 11.0, 8.0, 13.0, 20.0, 16.0, 36.0, 46.0, 60.0, 105.0, 148.0, 273.0, 661.0, 2364.0, 11201.0, 87820.0, 1748714.0, 2222833.0, 103102.0, 12791.0, 2518.0, 717.0, 329.0, 175.0, 89.0, 66.0, 40.0, 32.0, 16.0, 18.0, 11.0, 7.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.35235595703125, -4.1851806640625, -4.01800537109375, -3.850830078125, -3.68365478515625, -3.5164794921875, -3.34930419921875, -3.18212890625, -3.01495361328125, -2.8477783203125, -2.68060302734375, -2.513427734375, -2.34625244140625, -2.1790771484375, -2.01190185546875, -1.8447265625, -1.67755126953125, -1.5103759765625, -1.34320068359375, -1.176025390625, -1.00885009765625, -0.8416748046875, -0.67449951171875, -0.50732421875, -0.34014892578125, -0.1729736328125, -0.00579833984375, 0.161376953125, 0.32855224609375, 0.4957275390625, 0.66290283203125, 0.830078125, 0.99725341796875, 1.1644287109375, 1.33160400390625, 1.498779296875, 1.66595458984375, 1.8331298828125, 2.00030517578125, 2.16748046875, 2.33465576171875, 2.5018310546875, 2.66900634765625, 2.836181640625, 3.00335693359375, 3.1705322265625, 3.33770751953125, 3.5048828125, 3.67205810546875, 3.8392333984375, 4.00640869140625, 4.173583984375, 4.34075927734375, 4.5079345703125, 4.67510986328125, 4.84228515625, 5.00946044921875, 5.1766357421875, 5.34381103515625, 5.510986328125, 5.67816162109375, 5.8453369140625, 6.01251220703125, 6.1796875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 11.0, 16.0, 24.0, 34.0, 47.0, 55.0, 72.0, 122.0, 139.0, 189.0, 244.0, 346.0, 470.0, 551.0, 442.0, 326.0, 270.0, 163.0, 132.0, 95.0, 74.0, 48.0, 38.0, 28.0, 23.0, 16.0, 12.0, 15.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.1943359375, -1.1624298095703125, -1.130523681640625, -1.0986175537109375, -1.06671142578125, -1.0348052978515625, -1.002899169921875, -0.9709930419921875, -0.9390869140625, -0.9071807861328125, -0.875274658203125, -0.8433685302734375, -0.81146240234375, -0.7795562744140625, -0.747650146484375, -0.7157440185546875, -0.683837890625, -0.6519317626953125, -0.620025634765625, -0.5881195068359375, -0.55621337890625, -0.5243072509765625, -0.492401123046875, -0.4604949951171875, -0.4285888671875, -0.3966827392578125, -0.364776611328125, -0.3328704833984375, -0.30096435546875, -0.2690582275390625, -0.237152099609375, -0.2052459716796875, -0.17333984375, -0.1414337158203125, -0.109527587890625, -0.0776214599609375, -0.04571533203125, -0.0138092041015625, 0.018096923828125, 0.0500030517578125, 0.0819091796875, 0.1138153076171875, 0.145721435546875, 0.1776275634765625, 0.20953369140625, 0.2414398193359375, 0.273345947265625, 0.3052520751953125, 0.337158203125, 0.3690643310546875, 0.400970458984375, 0.4328765869140625, 0.46478271484375, 0.4966888427734375, 0.528594970703125, 0.5605010986328125, 0.5924072265625, 0.6243133544921875, 0.656219482421875, 0.6881256103515625, 0.72003173828125, 0.7519378662109375, 0.783843994140625, 0.8157501220703125, 0.84765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 5.0, 5.0, 8.0, 11.0, 14.0, 17.0, 13.0, 18.0, 19.0, 28.0, 38.0, 27.0, 34.0, 27.0, 42.0, 31.0, 46.0, 42.0, 37.0, 42.0, 40.0, 46.0, 50.0, 43.0, 42.0, 37.0, 36.0, 32.0, 21.0, 21.0, 13.0, 21.0, 9.0, 13.0, 13.0, 5.0, 8.0, 4.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.2177224159240723, -2.1481213569641113, -2.0785205364227295, -2.0089194774627686, -1.9393186569213867, -1.8697177171707153, -1.800116777420044, -1.730515718460083, -1.6609148979187012, -1.5913139581680298, -1.5217130184173584, -1.452112078666687, -1.3825111389160156, -1.3129101991653442, -1.2433092594146729, -1.173708200454712, -1.1041072607040405, -1.0345063209533691, -0.9649053812026978, -0.8953044414520264, -0.825703501701355, -0.7561025619506836, -0.6865015625953674, -0.616900622844696, -0.5472996830940247, -0.47769874334335327, -0.4080978035926819, -0.3384968340396881, -0.2688958942890167, -0.19929495453834534, -0.12969398498535156, -0.060093045234680176, 0.009507894515991211, 0.0791088417172432, 0.14870978891849518, 0.21831074357032776, 0.28791168332099915, 0.35751262307167053, 0.4271135926246643, 0.4967145323753357, 0.5663154721260071, 0.6359164118766785, 0.7055173516273499, 0.775118350982666, 0.8447192907333374, 0.9143202304840088, 0.9839211702346802, 1.0535221099853516, 1.123123049736023, 1.1927239894866943, 1.2623249292373657, 1.331925868988037, 1.4015268087387085, 1.4711277484893799, 1.5407288074493408, 1.6103296279907227, 1.6799306869506836, 1.749531626701355, 1.8191325664520264, 1.8887335062026978, 1.9583344459533691, 2.02793550491333, 2.097536325454712, 2.167137384414673, 2.2367382049560547]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 1.0, 0.0, 6.0, 8.0, 9.0, 20.0, 17.0, 19.0, 25.0, 28.0, 26.0, 38.0, 37.0, 42.0, 27.0, 27.0, 38.0, 27.0, 51.0, 41.0, 31.0, 42.0, 40.0, 39.0, 42.0, 30.0, 28.0, 35.0, 51.0, 29.0, 18.0, 18.0, 20.0, 21.0, 11.0, 14.0, 6.0, 11.0, 5.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.814331531524658, -2.73667573928833, -2.659019947052002, -2.581364393234253, -2.503708600997925, -2.4260528087615967, -2.3483972549438477, -2.2707414627075195, -2.1930856704711914, -2.1154298782348633, -2.037774085998535, -1.9601185321807861, -1.882462739944458, -1.8048069477081299, -1.7271512746810913, -1.6494956016540527, -1.5718398094177246, -1.4941840171813965, -1.416528344154358, -1.3388726711273193, -1.2612168788909912, -1.183561086654663, -1.1059054136276245, -1.028249740600586, -0.9505939483642578, -0.8729382157325745, -0.7952824831008911, -0.7176267504692078, -0.6399710178375244, -0.5623152852058411, -0.4846595525741577, -0.40700381994247437, -0.3293483257293701, -0.25169259309768677, -0.17403686046600342, -0.09638112783432007, -0.01872539520263672, 0.05893033742904663, 0.13658607006072998, 0.21424180269241333, 0.2918975353240967, 0.36955326795578003, 0.4472090005874634, 0.5248647332191467, 0.6025204658508301, 0.6801761984825134, 0.7578319311141968, 0.8354876637458801, 0.9131433963775635, 0.9907991290092468, 1.0684548616409302, 1.1461105346679688, 1.2237663269042969, 1.301422119140625, 1.3790777921676636, 1.4567334651947021, 1.5343892574310303, 1.6120450496673584, 1.689700722694397, 1.7673563957214355, 1.8450121879577637, 1.9226679801940918, 2.00032377243042, 2.077979326248169, 2.155635118484497]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 5.0, 8.0, 12.0, 10.0, 25.0, 30.0, 39.0, 48.0, 63.0, 92.0, 113.0, 159.0, 254.0, 388.0, 695.0, 1503.0, 10324.0, 612096.0, 411642.0, 7783.0, 1380.0, 656.0, 349.0, 262.0, 172.0, 105.0, 82.0, 65.0, 46.0, 28.0, 28.0, 18.0, 17.0, 17.0, 11.0, 5.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94580078125, -0.9142227172851562, -0.8826446533203125, -0.8510665893554688, -0.819488525390625, -0.7879104614257812, -0.7563323974609375, -0.7247543334960938, -0.69317626953125, -0.6615982055664062, -0.6300201416015625, -0.5984420776367188, -0.566864013671875, -0.5352859497070312, -0.5037078857421875, -0.47212982177734375, -0.4405517578125, -0.40897369384765625, -0.3773956298828125, -0.34581756591796875, -0.314239501953125, -0.28266143798828125, -0.2510833740234375, -0.21950531005859375, -0.18792724609375, -0.15634918212890625, -0.1247711181640625, -0.09319305419921875, -0.061614990234375, -0.03003692626953125, 0.0015411376953125, 0.03311920166015625, 0.064697265625, 0.09627532958984375, 0.1278533935546875, 0.15943145751953125, 0.191009521484375, 0.22258758544921875, 0.2541656494140625, 0.28574371337890625, 0.31732177734375, 0.34889984130859375, 0.3804779052734375, 0.41205596923828125, 0.443634033203125, 0.47521209716796875, 0.5067901611328125, 0.5383682250976562, 0.5699462890625, 0.6015243530273438, 0.6331024169921875, 0.6646804809570312, 0.696258544921875, 0.7278366088867188, 0.7594146728515625, 0.7909927368164062, 0.82257080078125, 0.8541488647460938, 0.8857269287109375, 0.9173049926757812, 0.948883056640625, 0.9804611206054688, 1.0120391845703125, 1.0436172485351562, 1.0751953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 5.0, 8.0, 11.0, 14.0, 14.0, 15.0, 21.0, 28.0, 25.0, 26.0, 32.0, 44.0, 39.0, 37.0, 44.0, 44.0, 36.0, 42.0, 36.0, 39.0, 46.0, 44.0, 36.0, 40.0, 34.0, 30.0, 33.0, 32.0, 23.0, 23.0, 21.0, 21.0, 14.0, 8.0, 11.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.02734375, -1.9683074951171875, -1.909271240234375, -1.8502349853515625, -1.79119873046875, -1.7321624755859375, -1.673126220703125, -1.6140899658203125, -1.5550537109375, -1.4960174560546875, -1.436981201171875, -1.3779449462890625, -1.31890869140625, -1.2598724365234375, -1.200836181640625, -1.1417999267578125, -1.082763671875, -1.0237274169921875, -0.964691162109375, -0.9056549072265625, -0.84661865234375, -0.7875823974609375, -0.728546142578125, -0.6695098876953125, -0.6104736328125, -0.5514373779296875, -0.492401123046875, -0.4333648681640625, -0.37432861328125, -0.3152923583984375, -0.256256103515625, -0.1972198486328125, -0.13818359375, -0.0791473388671875, -0.020111083984375, 0.0389251708984375, 0.09796142578125, 0.1569976806640625, 0.216033935546875, 0.2750701904296875, 0.3341064453125, 0.3931427001953125, 0.452178955078125, 0.5112152099609375, 0.57025146484375, 0.6292877197265625, 0.688323974609375, 0.7473602294921875, 0.806396484375, 0.8654327392578125, 0.924468994140625, 0.9835052490234375, 1.04254150390625, 1.1015777587890625, 1.160614013671875, 1.2196502685546875, 1.2786865234375, 1.3377227783203125, 1.396759033203125, 1.4557952880859375, 1.51483154296875, 1.5738677978515625, 1.632904052734375, 1.6919403076171875, 1.7509765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 1.0, 6.0, 4.0, 7.0, 8.0, 10.0, 15.0, 9.0, 17.0, 20.0, 22.0, 41.0, 36.0, 57.0, 85.0, 104.0, 144.0, 199.0, 324.0, 599.0, 1770.0, 10051.0, 106609.0, 756260.0, 155296.0, 12789.0, 2191.0, 726.0, 351.0, 217.0, 146.0, 110.0, 78.0, 59.0, 42.0, 41.0, 25.0, 25.0, 17.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.417236328125, -0.40358734130859375, -0.3899383544921875, -0.37628936767578125, -0.362640380859375, -0.34899139404296875, -0.3353424072265625, -0.32169342041015625, -0.30804443359375, -0.29439544677734375, -0.2807464599609375, -0.26709747314453125, -0.253448486328125, -0.23979949951171875, -0.2261505126953125, -0.21250152587890625, -0.1988525390625, -0.18520355224609375, -0.1715545654296875, -0.15790557861328125, -0.144256591796875, -0.13060760498046875, -0.1169586181640625, -0.10330963134765625, -0.08966064453125, -0.07601165771484375, -0.0623626708984375, -0.04871368408203125, -0.035064697265625, -0.02141571044921875, -0.0077667236328125, 0.00588226318359375, 0.01953125, 0.03318023681640625, 0.0468292236328125, 0.06047821044921875, 0.074127197265625, 0.08777618408203125, 0.1014251708984375, 0.11507415771484375, 0.12872314453125, 0.14237213134765625, 0.1560211181640625, 0.16967010498046875, 0.183319091796875, 0.19696807861328125, 0.2106170654296875, 0.22426605224609375, 0.2379150390625, 0.25156402587890625, 0.2652130126953125, 0.27886199951171875, 0.292510986328125, 0.30615997314453125, 0.3198089599609375, 0.33345794677734375, 0.34710693359375, 0.36075592041015625, 0.3744049072265625, 0.38805389404296875, 0.401702880859375, 0.41535186767578125, 0.4290008544921875, 0.44264984130859375, 0.456298828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 7.0, 8.0, 16.0, 16.0, 17.0, 26.0, 19.0, 30.0, 27.0, 35.0, 37.0, 48.0, 47.0, 42.0, 60.0, 46.0, 50.0, 67.0, 45.0, 52.0, 52.0, 34.0, 43.0, 25.0, 28.0, 27.0, 20.0, 13.0, 14.0, 9.0, 5.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.6053466796875, -4.441162109375, -4.2769775390625, -4.11279296875, -3.9486083984375, -3.784423828125, -3.6202392578125, -3.4560546875, -3.2918701171875, -3.127685546875, -2.9635009765625, -2.79931640625, -2.6351318359375, -2.470947265625, -2.3067626953125, -2.142578125, -1.9783935546875, -1.814208984375, -1.6500244140625, -1.48583984375, -1.3216552734375, -1.157470703125, -0.9932861328125, -0.8291015625, -0.6649169921875, -0.500732421875, -0.3365478515625, -0.17236328125, -0.0081787109375, 0.156005859375, 0.3201904296875, 0.484375, 0.6485595703125, 0.812744140625, 0.9769287109375, 1.14111328125, 1.3052978515625, 1.469482421875, 1.6336669921875, 1.7978515625, 1.9620361328125, 2.126220703125, 2.2904052734375, 2.45458984375, 2.6187744140625, 2.782958984375, 2.9471435546875, 3.111328125, 3.2755126953125, 3.439697265625, 3.6038818359375, 3.76806640625, 3.9322509765625, 4.096435546875, 4.2606201171875, 4.4248046875, 4.5889892578125, 4.753173828125, 4.9173583984375, 5.08154296875, 5.2457275390625, 5.409912109375, 5.5740966796875, 5.73828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 3.0, 8.0, 9.0, 10.0, 17.0, 22.0, 29.0, 27.0, 49.0, 72.0, 109.0, 175.0, 341.0, 772.0, 2832.0, 41238.0, 979586.0, 19584.0, 2113.0, 740.0, 313.0, 147.0, 103.0, 58.0, 51.0, 28.0, 34.0, 16.0, 18.0, 11.0, 11.0, 4.0, 5.0, 2.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.14269065856933594, -0.13828659057617188, -0.1338825225830078, -0.12947845458984375, -0.1250743865966797, -0.12067031860351562, -0.11626625061035156, -0.1118621826171875, -0.10745811462402344, -0.10305404663085938, -0.09864997863769531, -0.09424591064453125, -0.08984184265136719, -0.08543777465820312, -0.08103370666503906, -0.076629638671875, -0.07222557067871094, -0.06782150268554688, -0.06341743469238281, -0.05901336669921875, -0.05460929870605469, -0.050205230712890625, -0.04580116271972656, -0.0413970947265625, -0.03699302673339844, -0.032588958740234375, -0.028184890747070312, -0.02378082275390625, -0.019376754760742188, -0.014972686767578125, -0.010568618774414062, -0.00616455078125, -0.0017604827880859375, 0.002643585205078125, 0.0070476531982421875, 0.01145172119140625, 0.015855789184570312, 0.020259857177734375, 0.024663925170898438, 0.0290679931640625, 0.03347206115722656, 0.037876129150390625, 0.04228019714355469, 0.04668426513671875, 0.05108833312988281, 0.055492401123046875, 0.05989646911621094, 0.064300537109375, 0.06870460510253906, 0.07310867309570312, 0.07751274108886719, 0.08191680908203125, 0.08632087707519531, 0.09072494506835938, 0.09512901306152344, 0.0995330810546875, 0.10393714904785156, 0.10834121704101562, 0.11274528503417969, 0.11714935302734375, 0.12155342102050781, 0.12595748901367188, 0.13036155700683594, 0.134765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 20.0, 27.0, 32.0, 63.0, 61.0, 89.0, 119.0, 111.0, 107.0, 95.0, 72.0, 48.0, 38.0, 26.0, 14.0, 15.0, 9.0, 6.0, 7.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.458427429199219e-05, -4.312768578529358e-05, -4.167109727859497e-05, -4.021450877189636e-05, -3.8757920265197754e-05, -3.7301331758499146e-05, -3.584474325180054e-05, -3.438815474510193e-05, -3.293156623840332e-05, -3.147497773170471e-05, -3.0018389225006104e-05, -2.8561800718307495e-05, -2.7105212211608887e-05, -2.564862370491028e-05, -2.419203519821167e-05, -2.273544669151306e-05, -2.1278858184814453e-05, -1.9822269678115845e-05, -1.8365681171417236e-05, -1.6909092664718628e-05, -1.545250415802002e-05, -1.3995915651321411e-05, -1.2539327144622803e-05, -1.1082738637924194e-05, -9.626150131225586e-06, -8.169561624526978e-06, -6.712973117828369e-06, -5.256384611129761e-06, -3.7997961044311523e-06, -2.343207597732544e-06, -8.866190910339355e-07, 5.699694156646729e-07, 2.0265579223632812e-06, 3.4831464290618896e-06, 4.939734935760498e-06, 6.3963234424591064e-06, 7.852911949157715e-06, 9.309500455856323e-06, 1.0766088962554932e-05, 1.222267746925354e-05, 1.3679265975952148e-05, 1.5135854482650757e-05, 1.6592442989349365e-05, 1.8049031496047974e-05, 1.9505620002746582e-05, 2.096220850944519e-05, 2.24187970161438e-05, 2.3875385522842407e-05, 2.5331974029541016e-05, 2.6788562536239624e-05, 2.8245151042938232e-05, 2.970173954963684e-05, 3.115832805633545e-05, 3.261491656303406e-05, 3.4071505069732666e-05, 3.5528093576431274e-05, 3.698468208312988e-05, 3.844127058982849e-05, 3.98978590965271e-05, 4.135444760322571e-05, 4.2811036109924316e-05, 4.4267624616622925e-05, 4.572421312332153e-05, 4.718080163002014e-05, 4.863739013671875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 15.0, 20.0, 27.0, 31.0, 44.0, 42.0, 68.0, 86.0, 126.0, 151.0, 209.0, 302.0, 390.0, 593.0, 852.0, 1523.0, 2442.0, 4342.0, 8595.0, 20762.0, 69702.0, 583233.0, 278408.0, 44790.0, 15116.0, 6961.0, 3673.0, 2106.0, 1284.0, 816.0, 522.0, 354.0, 251.0, 174.0, 116.0, 103.0, 67.0, 65.0, 47.0, 17.0, 25.0, 24.0, 22.0, 11.0, 8.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.07769775390625, -0.07540225982666016, -0.07310676574707031, -0.07081127166748047, -0.06851577758789062, -0.06622028350830078, -0.06392478942871094, -0.061629295349121094, -0.05933380126953125, -0.057038307189941406, -0.05474281311035156, -0.05244731903076172, -0.050151824951171875, -0.04785633087158203, -0.04556083679199219, -0.043265342712402344, -0.0409698486328125, -0.038674354553222656, -0.03637886047363281, -0.03408336639404297, -0.031787872314453125, -0.02949237823486328, -0.027196884155273438, -0.024901390075683594, -0.02260589599609375, -0.020310401916503906, -0.018014907836914062, -0.01571941375732422, -0.013423919677734375, -0.011128425598144531, -0.008832931518554688, -0.006537437438964844, -0.004241943359375, -0.0019464492797851562, 0.0003490447998046875, 0.0026445388793945312, 0.004940032958984375, 0.007235527038574219, 0.009531021118164062, 0.011826515197753906, 0.01412200927734375, 0.016417503356933594, 0.018712997436523438, 0.02100849151611328, 0.023303985595703125, 0.02559947967529297, 0.027894973754882812, 0.030190467834472656, 0.0324859619140625, 0.034781455993652344, 0.03707695007324219, 0.03937244415283203, 0.041667938232421875, 0.04396343231201172, 0.04625892639160156, 0.048554420471191406, 0.05084991455078125, 0.053145408630371094, 0.05544090270996094, 0.05773639678955078, 0.060031890869140625, 0.06232738494873047, 0.06462287902832031, 0.06691837310791016, 0.0692138671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 10.0, 12.0, 19.0, 11.0, 24.0, 53.0, 75.0, 154.0, 271.0, 137.0, 79.0, 44.0, 32.0, 10.0, 9.0, 11.0, 3.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026171207427978516, -0.02536487579345703, -0.024558544158935547, -0.023752212524414062, -0.022945880889892578, -0.022139549255371094, -0.02133321762084961, -0.020526885986328125, -0.01972055435180664, -0.018914222717285156, -0.018107891082763672, -0.017301559448242188, -0.016495227813720703, -0.01568889617919922, -0.014882564544677734, -0.01407623291015625, -0.013269901275634766, -0.012463569641113281, -0.011657238006591797, -0.010850906372070312, -0.010044574737548828, -0.009238243103027344, -0.00843191146850586, -0.007625579833984375, -0.006819248199462891, -0.006012916564941406, -0.005206584930419922, -0.0044002532958984375, -0.003593921661376953, -0.0027875900268554688, -0.0019812583923339844, -0.0011749267578125, -0.0003685951232910156, 0.00043773651123046875, 0.0012440681457519531, 0.0020503997802734375, 0.002856731414794922, 0.0036630630493164062, 0.004469394683837891, 0.005275726318359375, 0.006082057952880859, 0.006888389587402344, 0.007694721221923828, 0.008501052856445312, 0.009307384490966797, 0.010113716125488281, 0.010920047760009766, 0.01172637939453125, 0.012532711029052734, 0.013339042663574219, 0.014145374298095703, 0.014951705932617188, 0.015758037567138672, 0.016564369201660156, 0.01737070083618164, 0.018177032470703125, 0.01898336410522461, 0.019789695739746094, 0.020596027374267578, 0.021402359008789062, 0.022208690643310547, 0.02301502227783203, 0.023821353912353516, 0.024627685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 7.0, 5.0, 13.0, 19.0, 14.0, 22.0, 24.0, 23.0, 24.0, 41.0, 32.0, 38.0, 44.0, 38.0, 31.0, 47.0, 52.0, 41.0, 42.0, 39.0, 56.0, 48.0, 43.0, 42.0, 28.0, 31.0, 24.0, 27.0, 11.0, 8.0, 9.0, 6.0, 12.0, 8.0, 6.0, 4.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4931228160858154, -1.4449156522750854, -1.3967084884643555, -1.348501443862915, -1.300294280052185, -1.252087116241455, -1.2038800716400146, -1.1556729078292847, -1.1074657440185547, -1.0592585802078247, -1.0110514163970947, -0.9628443717956543, -0.9146372079849243, -0.8664300441741943, -0.8182229399681091, -0.7700158357620239, -0.721808671951294, -0.673601508140564, -0.6253944039344788, -0.5771872997283936, -0.5289801359176636, -0.480773001909256, -0.4325658679008484, -0.3843587338924408, -0.3361515998840332, -0.2879444658756256, -0.23973733186721802, -0.19153019785881042, -0.14332306385040283, -0.09511592984199524, -0.046908795833587646, 0.0012983381748199463, 0.04950559139251709, 0.09771272540092468, 0.14591985940933228, 0.19412699341773987, 0.24233412742614746, 0.29054126143455505, 0.33874839544296265, 0.38695552945137024, 0.43516266345977783, 0.4833697974681854, 0.531576931476593, 0.5797840356826782, 0.6279911994934082, 0.6761983633041382, 0.7244054675102234, 0.7726125717163086, 0.8208197355270386, 0.8690268993377686, 0.9172340035438538, 0.965441107749939, 1.013648271560669, 1.061855435371399, 1.110062599182129, 1.1582696437835693, 1.2064768075942993, 1.2546839714050293, 1.3028910160064697, 1.3510981798171997, 1.3993053436279297, 1.4475125074386597, 1.4957196712493896, 1.54392671585083, 1.59213387966156]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 20.0, 17.0, 15.0, 28.0, 23.0, 27.0, 47.0, 41.0, 48.0, 24.0, 43.0, 33.0, 37.0, 49.0, 42.0, 47.0, 35.0, 45.0, 42.0, 35.0, 40.0, 38.0, 41.0, 25.0, 19.0, 17.0, 21.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.1137325763702393, -2.0571537017822266, -2.000574827194214, -1.9439959526062012, -1.887417197227478, -1.8308383226394653, -1.7742594480514526, -1.71768057346344, -1.6611018180847168, -1.604522943496704, -1.5479440689086914, -1.4913651943206787, -1.4347864389419556, -1.3782075643539429, -1.3216286897659302, -1.2650498151779175, -1.2084709405899048, -1.151892066001892, -1.0953131914138794, -1.0387344360351562, -0.9821555614471436, -0.9255766868591309, -0.8689978122711182, -0.8124189376831055, -0.7558401226997375, -0.6992612481117249, -0.6426824331283569, -0.5861035585403442, -0.5295246839523315, -0.4729458689689636, -0.4163669943809509, -0.3597881495952606, -0.3032093048095703, -0.24663046002388, -0.1900516003370285, -0.133472740650177, -0.0768938958644867, -0.020315051078796387, 0.03626382350921631, 0.09284266829490662, 0.14942151308059692, 0.20600035786628723, 0.26257920265197754, 0.31915807723999023, 0.37573692202568054, 0.43231576681137085, 0.48889464139938354, 0.5454734563827515, 0.6020523309707642, 0.6586312055587769, 0.7152100205421448, 0.7717888951301575, 0.8283677101135254, 0.8849465847015381, 0.9415254592895508, 0.9981043338775635, 1.0546832084655762, 1.1112620830535889, 1.1678409576416016, 1.2244198322296143, 1.2809985876083374, 1.33757746219635, 1.3941563367843628, 1.4507352113723755, 1.5073139667510986]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 11.0, 11.0, 11.0, 21.0, 36.0, 74.0, 87.0, 151.0, 260.0, 424.0, 903.0, 1820.0, 3947.0, 9477.0, 25303.0, 75614.0, 238026.0, 431038.0, 173132.0, 55413.0, 19025.0, 7268.0, 3260.0, 1529.0, 754.0, 382.0, 223.0, 137.0, 92.0, 44.0, 36.0, 10.0, 12.0, 14.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.586090087890625, -3.48468017578125, -3.383270263671875, -3.2818603515625, -3.180450439453125, -3.07904052734375, -2.977630615234375, -2.876220703125, -2.774810791015625, -2.67340087890625, -2.571990966796875, -2.4705810546875, -2.369171142578125, -2.26776123046875, -2.166351318359375, -2.06494140625, -1.963531494140625, -1.86212158203125, -1.760711669921875, -1.6593017578125, -1.557891845703125, -1.45648193359375, -1.355072021484375, -1.253662109375, -1.152252197265625, -1.05084228515625, -0.949432373046875, -0.8480224609375, -0.746612548828125, -0.64520263671875, -0.543792724609375, -0.4423828125, -0.340972900390625, -0.23956298828125, -0.138153076171875, -0.0367431640625, 0.064666748046875, 0.16607666015625, 0.267486572265625, 0.368896484375, 0.470306396484375, 0.57171630859375, 0.673126220703125, 0.7745361328125, 0.875946044921875, 0.97735595703125, 1.078765869140625, 1.18017578125, 1.281585693359375, 1.38299560546875, 1.484405517578125, 1.5858154296875, 1.687225341796875, 1.78863525390625, 1.890045166015625, 1.991455078125, 2.092864990234375, 2.19427490234375, 2.295684814453125, 2.3970947265625, 2.498504638671875, 2.59991455078125, 2.701324462890625, 2.802734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 4.0, 12.0, 12.0, 16.0, 16.0, 23.0, 24.0, 23.0, 39.0, 28.0, 37.0, 38.0, 49.0, 39.0, 49.0, 38.0, 33.0, 49.0, 41.0, 48.0, 42.0, 42.0, 34.0, 36.0, 31.0, 29.0, 34.0, 25.0, 17.0, 11.0, 11.0, 15.0, 11.0, 13.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.064453125, -2.971832275390625, -2.87921142578125, -2.786590576171875, -2.6939697265625, -2.601348876953125, -2.50872802734375, -2.416107177734375, -2.323486328125, -2.230865478515625, -2.13824462890625, -2.045623779296875, -1.9530029296875, -1.860382080078125, -1.76776123046875, -1.675140380859375, -1.58251953125, -1.489898681640625, -1.39727783203125, -1.304656982421875, -1.2120361328125, -1.119415283203125, -1.02679443359375, -0.934173583984375, -0.841552734375, -0.748931884765625, -0.65631103515625, -0.563690185546875, -0.4710693359375, -0.378448486328125, -0.28582763671875, -0.193206787109375, -0.1005859375, -0.007965087890625, 0.08465576171875, 0.177276611328125, 0.2698974609375, 0.362518310546875, 0.45513916015625, 0.547760009765625, 0.640380859375, 0.733001708984375, 0.82562255859375, 0.918243408203125, 1.0108642578125, 1.103485107421875, 1.19610595703125, 1.288726806640625, 1.38134765625, 1.473968505859375, 1.56658935546875, 1.659210205078125, 1.7518310546875, 1.844451904296875, 1.93707275390625, 2.029693603515625, 2.122314453125, 2.214935302734375, 2.30755615234375, 2.400177001953125, 2.4927978515625, 2.585418701171875, 2.67803955078125, 2.770660400390625, 2.86328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 10.0, 21.0, 22.0, 23.0, 36.0, 42.0, 90.0, 113.0, 181.0, 279.0, 440.0, 769.0, 1249.0, 2252.0, 4063.0, 7739.0, 15297.0, 31272.0, 65920.0, 137460.0, 276749.0, 259481.0, 125250.0, 59939.0, 29237.0, 14348.0, 7230.0, 3926.0, 2081.0, 1200.0, 670.0, 403.0, 240.0, 169.0, 110.0, 58.0, 62.0, 36.0, 22.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9814453125, -1.9174041748046875, -1.853363037109375, -1.7893218994140625, -1.72528076171875, -1.6612396240234375, -1.597198486328125, -1.5331573486328125, -1.4691162109375, -1.4050750732421875, -1.341033935546875, -1.2769927978515625, -1.21295166015625, -1.1489105224609375, -1.084869384765625, -1.0208282470703125, -0.956787109375, -0.8927459716796875, -0.828704833984375, -0.7646636962890625, -0.70062255859375, -0.6365814208984375, -0.572540283203125, -0.5084991455078125, -0.4444580078125, -0.3804168701171875, -0.316375732421875, -0.2523345947265625, -0.18829345703125, -0.1242523193359375, -0.060211181640625, 0.0038299560546875, 0.06787109375, 0.1319122314453125, 0.195953369140625, 0.2599945068359375, 0.32403564453125, 0.3880767822265625, 0.452117919921875, 0.5161590576171875, 0.5802001953125, 0.6442413330078125, 0.708282470703125, 0.7723236083984375, 0.83636474609375, 0.9004058837890625, 0.964447021484375, 1.0284881591796875, 1.092529296875, 1.1565704345703125, 1.220611572265625, 1.2846527099609375, 1.34869384765625, 1.4127349853515625, 1.476776123046875, 1.5408172607421875, 1.6048583984375, 1.6688995361328125, 1.732940673828125, 1.7969818115234375, 1.86102294921875, 1.9250640869140625, 1.989105224609375, 2.0531463623046875, 2.1171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 7.0, 10.0, 11.0, 9.0, 12.0, 19.0, 22.0, 20.0, 20.0, 25.0, 36.0, 29.0, 27.0, 28.0, 32.0, 47.0, 49.0, 43.0, 51.0, 43.0, 42.0, 38.0, 37.0, 33.0, 45.0, 28.0, 33.0, 30.0, 19.0, 20.0, 14.0, 20.0, 14.0, 10.0, 11.0, 6.0, 10.0, 7.0, 4.0, 10.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.890625, -3.774749755859375, -3.65887451171875, -3.542999267578125, -3.4271240234375, -3.311248779296875, -3.19537353515625, -3.079498291015625, -2.963623046875, -2.847747802734375, -2.73187255859375, -2.615997314453125, -2.5001220703125, -2.384246826171875, -2.26837158203125, -2.152496337890625, -2.03662109375, -1.920745849609375, -1.80487060546875, -1.688995361328125, -1.5731201171875, -1.457244873046875, -1.34136962890625, -1.225494384765625, -1.109619140625, -0.993743896484375, -0.87786865234375, -0.761993408203125, -0.6461181640625, -0.530242919921875, -0.41436767578125, -0.298492431640625, -0.1826171875, -0.066741943359375, 0.04913330078125, 0.165008544921875, 0.2808837890625, 0.396759033203125, 0.51263427734375, 0.628509521484375, 0.744384765625, 0.860260009765625, 0.97613525390625, 1.092010498046875, 1.2078857421875, 1.323760986328125, 1.43963623046875, 1.555511474609375, 1.67138671875, 1.787261962890625, 1.90313720703125, 2.019012451171875, 2.1348876953125, 2.250762939453125, 2.36663818359375, 2.482513427734375, 2.598388671875, 2.714263916015625, 2.83013916015625, 2.946014404296875, 3.0618896484375, 3.177764892578125, 3.29364013671875, 3.409515380859375, 3.525390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 8.0, 14.0, 29.0, 38.0, 46.0, 68.0, 101.0, 137.0, 200.0, 353.0, 536.0, 852.0, 1353.0, 2184.0, 3600.0, 6010.0, 10157.0, 17796.0, 30975.0, 56903.0, 104562.0, 189649.0, 263425.0, 161248.0, 87277.0, 47779.0, 26319.0, 14996.0, 8619.0, 5065.0, 3034.0, 1917.0, 1204.0, 732.0, 445.0, 306.0, 191.0, 147.0, 81.0, 64.0, 38.0, 33.0, 15.0, 17.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.4150390625, -0.40259552001953125, -0.3901519775390625, -0.37770843505859375, -0.365264892578125, -0.35282135009765625, -0.3403778076171875, -0.32793426513671875, -0.31549072265625, -0.30304718017578125, -0.2906036376953125, -0.27816009521484375, -0.265716552734375, -0.25327301025390625, -0.2408294677734375, -0.22838592529296875, -0.2159423828125, -0.20349884033203125, -0.1910552978515625, -0.17861175537109375, -0.166168212890625, -0.15372467041015625, -0.1412811279296875, -0.12883758544921875, -0.11639404296875, -0.10395050048828125, -0.0915069580078125, -0.07906341552734375, -0.066619873046875, -0.05417633056640625, -0.0417327880859375, -0.02928924560546875, -0.016845703125, -0.00440216064453125, 0.0080413818359375, 0.02048492431640625, 0.032928466796875, 0.04537200927734375, 0.0578155517578125, 0.07025909423828125, 0.08270263671875, 0.09514617919921875, 0.1075897216796875, 0.12003326416015625, 0.132476806640625, 0.14492034912109375, 0.1573638916015625, 0.16980743408203125, 0.1822509765625, 0.19469451904296875, 0.2071380615234375, 0.21958160400390625, 0.232025146484375, 0.24446868896484375, 0.2569122314453125, 0.26935577392578125, 0.28179931640625, 0.29424285888671875, 0.3066864013671875, 0.31912994384765625, 0.331573486328125, 0.34401702880859375, 0.3564605712890625, 0.36890411376953125, 0.38134765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 8.0, 8.0, 16.0, 19.0, 19.0, 38.0, 27.0, 47.0, 64.0, 73.0, 84.0, 79.0, 94.0, 90.0, 58.0, 68.0, 55.0, 38.0, 29.0, 22.0, 12.0, 12.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019443035125732422, -0.00018889643251895905, -0.00018336251378059387, -0.0001778285950422287, -0.00017229467630386353, -0.00016676075756549835, -0.00016122683882713318, -0.000155692920088768, -0.00015015900135040283, -0.00014462508261203766, -0.00013909116387367249, -0.0001335572451353073, -0.00012802332639694214, -0.00012248940765857697, -0.00011695548892021179, -0.00011142157018184662, -0.00010588765144348145, -0.00010035373270511627, -9.48198139667511e-05, -8.928589522838593e-05, -8.375197649002075e-05, -7.821805775165558e-05, -7.26841390132904e-05, -6.715022027492523e-05, -6.161630153656006e-05, -5.6082382798194885e-05, -5.054846405982971e-05, -4.501454532146454e-05, -3.9480626583099365e-05, -3.394670784473419e-05, -2.841278910636902e-05, -2.2878870368003845e-05, -1.7344951629638672e-05, -1.1811032891273499e-05, -6.277114152908325e-06, -7.431954145431519e-07, 4.7907233238220215e-06, 1.0324642062187195e-05, 1.5858560800552368e-05, 2.139247953891754e-05, 2.6926398277282715e-05, 3.246031701564789e-05, 3.799423575401306e-05, 4.3528154492378235e-05, 4.906207323074341e-05, 5.459599196910858e-05, 6.0129910707473755e-05, 6.566382944583893e-05, 7.11977481842041e-05, 7.673166692256927e-05, 8.226558566093445e-05, 8.779950439929962e-05, 9.33334231376648e-05, 9.886734187602997e-05, 0.00010440126061439514, 0.00010993517935276031, 0.00011546909809112549, 0.00012100301682949066, 0.00012653693556785583, 0.000132070854306221, 0.00013760477304458618, 0.00014313869178295135, 0.00014867261052131653, 0.0001542065292596817, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 13.0, 31.0, 25.0, 42.0, 64.0, 77.0, 105.0, 148.0, 203.0, 361.0, 474.0, 686.0, 1104.0, 1820.0, 2984.0, 5049.0, 9232.0, 17438.0, 34470.0, 69575.0, 141133.0, 278618.0, 238383.0, 121779.0, 59923.0, 29633.0, 15254.0, 8159.0, 4469.0, 2657.0, 1638.0, 957.0, 630.0, 414.0, 322.0, 209.0, 141.0, 98.0, 75.0, 37.0, 32.0, 33.0, 18.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.52978515625, -0.5136795043945312, -0.4975738525390625, -0.48146820068359375, -0.465362548828125, -0.44925689697265625, -0.4331512451171875, -0.41704559326171875, -0.40093994140625, -0.38483428955078125, -0.3687286376953125, -0.35262298583984375, -0.336517333984375, -0.32041168212890625, -0.3043060302734375, -0.28820037841796875, -0.2720947265625, -0.25598907470703125, -0.2398834228515625, -0.22377777099609375, -0.207672119140625, -0.19156646728515625, -0.1754608154296875, -0.15935516357421875, -0.14324951171875, -0.12714385986328125, -0.1110382080078125, -0.09493255615234375, -0.078826904296875, -0.06272125244140625, -0.0466156005859375, -0.03050994873046875, -0.014404296875, 0.00170135498046875, 0.0178070068359375, 0.03391265869140625, 0.050018310546875, 0.06612396240234375, 0.0822296142578125, 0.09833526611328125, 0.11444091796875, 0.13054656982421875, 0.1466522216796875, 0.16275787353515625, 0.178863525390625, 0.19496917724609375, 0.2110748291015625, 0.22718048095703125, 0.2432861328125, 0.25939178466796875, 0.2754974365234375, 0.29160308837890625, 0.307708740234375, 0.32381439208984375, 0.3399200439453125, 0.35602569580078125, 0.37213134765625, 0.38823699951171875, 0.4043426513671875, 0.42044830322265625, 0.436553955078125, 0.45265960693359375, 0.4687652587890625, 0.48487091064453125, 0.5009765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 6.0, 6.0, 15.0, 14.0, 29.0, 25.0, 14.0, 30.0, 42.0, 38.0, 60.0, 57.0, 79.0, 78.0, 83.0, 86.0, 52.0, 34.0, 45.0, 36.0, 31.0, 28.0, 16.0, 17.0, 12.0, 7.0, 11.0, 8.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.49462890625, -0.48003387451171875, -0.4654388427734375, -0.45084381103515625, -0.436248779296875, -0.42165374755859375, -0.4070587158203125, -0.39246368408203125, -0.37786865234375, -0.36327362060546875, -0.3486785888671875, -0.33408355712890625, -0.319488525390625, -0.30489349365234375, -0.2902984619140625, -0.27570343017578125, -0.2611083984375, -0.24651336669921875, -0.2319183349609375, -0.21732330322265625, -0.202728271484375, -0.18813323974609375, -0.1735382080078125, -0.15894317626953125, -0.14434814453125, -0.12975311279296875, -0.1151580810546875, -0.10056304931640625, -0.085968017578125, -0.07137298583984375, -0.0567779541015625, -0.04218292236328125, -0.027587890625, -0.01299285888671875, 0.0016021728515625, 0.01619720458984375, 0.030792236328125, 0.04538726806640625, 0.0599822998046875, 0.07457733154296875, 0.08917236328125, 0.10376739501953125, 0.1183624267578125, 0.13295745849609375, 0.147552490234375, 0.16214752197265625, 0.1767425537109375, 0.19133758544921875, 0.2059326171875, 0.22052764892578125, 0.2351226806640625, 0.24971771240234375, 0.264312744140625, 0.27890777587890625, 0.2935028076171875, 0.30809783935546875, 0.32269287109375, 0.33728790283203125, 0.3518829345703125, 0.36647796630859375, 0.381072998046875, 0.39566802978515625, 0.4102630615234375, 0.42485809326171875, 0.439453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 10.0, 26.0, 34.0, 59.0, 79.0, 125.0, 151.0, 108.0, 126.0, 101.0, 61.0, 43.0, 32.0, 21.0, 5.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.081125259399414, -5.7800140380859375, -5.478902816772461, -5.177792072296143, -4.876680850982666, -4.5755696296691895, -4.274458885192871, -3.9733476638793945, -3.672236442565918, -3.3711252212524414, -3.070014238357544, -2.7689032554626465, -2.46779203414917, -2.1666808128356934, -1.865569829940796, -1.5644588470458984, -1.2633476257324219, -0.9622365236282349, -0.6611254215240479, -0.36001431941986084, -0.05890321731567383, 0.24220788478851318, 0.5433189868927002, 0.8444299697875977, 1.1455411911010742, 1.4466522932052612, 1.7477633953094482, 2.0488743782043457, 2.3499855995178223, 2.651096820831299, 2.9522078037261963, 3.2533187866210938, 3.5544309616088867, 3.8555421829223633, 4.15665340423584, 4.457764148712158, 4.758875370025635, 5.059986591339111, 5.36109733581543, 5.662208557128906, 5.963319778442383, 6.264430999755859, 6.565542221069336, 6.866652965545654, 7.167764186859131, 7.468875408172607, 7.769986152648926, 8.071097373962402, 8.372208595275879, 8.673319816589355, 8.974431037902832, 9.275542259216309, 9.576652526855469, 9.877763748168945, 10.178874969482422, 10.479986190795898, 10.781097412109375, 11.082208633422852, 11.383319854736328, 11.684431076049805, 11.985542297363281, 12.286652565002441, 12.587763786315918, 12.888875007629395, 13.189986228942871]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 14.0, 10.0, 14.0, 13.0, 22.0, 16.0, 19.0, 26.0, 28.0, 34.0, 29.0, 36.0, 31.0, 41.0, 47.0, 46.0, 42.0, 33.0, 52.0, 41.0, 40.0, 39.0, 36.0, 39.0, 33.0, 34.0, 21.0, 31.0, 20.0, 24.0, 11.0, 15.0, 12.0, 9.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.644021034240723, -7.400257110595703, -7.156493186950684, -6.912729263305664, -6.668964862823486, -6.425200939178467, -6.181437015533447, -5.937673091888428, -5.69390869140625, -5.4501447677612305, -5.206380844116211, -4.962616920471191, -4.718852519989014, -4.475088596343994, -4.231324672698975, -3.987560749053955, -3.7437968254089355, -3.500032901763916, -3.2562687397003174, -3.012504816055298, -2.768740653991699, -2.5249767303466797, -2.28121280670166, -2.0374488830566406, -1.793684720993042, -1.549920678138733, -1.3061566352844238, -1.0623927116394043, -0.8186286687850952, -0.5748646259307861, -0.3311007022857666, -0.08733665943145752, 0.15642786026000977, 0.40019187331199646, 0.6439558863639832, 0.8877198696136475, 1.1314839124679565, 1.3752479553222656, 1.6190118789672852, 1.8627759218215942, 2.1065399646759033, 2.350303888320923, 2.5940680503845215, 2.837831974029541, 3.0815958976745605, 3.325360059738159, 3.5691239833831787, 3.8128881454467773, 4.056652069091797, 4.300415992736816, 4.544179916381836, 4.7879438400268555, 5.031708240509033, 5.275472164154053, 5.519236087799072, 5.763000011444092, 6.0067644119262695, 6.250528335571289, 6.494292259216309, 6.738056182861328, 6.981820583343506, 7.225584506988525, 7.469348430633545, 7.7131123542785645, 7.956876277923584]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 18.0, 9.0, 17.0, 22.0, 25.0, 38.0, 51.0, 53.0, 89.0, 112.0, 159.0, 216.0, 309.0, 414.0, 558.0, 785.0, 1176.0, 1706.0, 3094.0, 1034804.0, 2120.0, 1373.0, 917.0, 671.0, 493.0, 356.0, 263.0, 195.0, 140.0, 101.0, 67.0, 68.0, 42.0, 36.0, 22.0, 21.0, 10.0, 15.0, 5.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.278793334960938, -8.005146980285645, -7.731500625610352, -7.457854270935059, -7.184207916259766, -6.910561561584473, -6.6369147300720215, -6.3632683753967285, -6.0896220207214355, -5.815975666046143, -5.54232931137085, -5.268682956695557, -4.9950361251831055, -4.7213897705078125, -4.4477434158325195, -4.174097061157227, -3.9004507064819336, -3.6268043518066406, -3.3531579971313477, -3.0795114040374756, -2.8058650493621826, -2.5322186946868896, -2.2585721015930176, -1.9849257469177246, -1.7112793922424316, -1.4376330375671387, -1.1639865636825562, -0.8903401494026184, -0.6166937351226807, -0.3430473804473877, -0.06940090656280518, 0.20424556732177734, 0.4778909683227539, 0.7515373826026917, 1.0251837968826294, 1.298830270767212, 1.5724766254425049, 1.8461229801177979, 2.11976957321167, 2.393415927886963, 2.667062282562256, 2.940708637237549, 3.214354991912842, 3.488001585006714, 3.761647939682007, 4.035294532775879, 4.308940887451172, 4.582587242126465, 4.856233596801758, 5.129879951477051, 5.403526306152344, 5.677172660827637, 5.95081901550293, 6.224465370178223, 6.498112201690674, 6.771758556365967, 7.04540491104126, 7.319051265716553, 7.592697620391846, 7.866343975067139, 8.13999080657959, 8.413637161254883, 8.687283515930176, 8.960929870605469, 9.234576225280762]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 42.0, 78.0, 130.0, 316.0, 1672.0, 12631.0, 51434052.0, 18995.0, 2572.0, 504.0, 165.0, 58.0, 25.0, 18.0, 7.0, 9.0, 12.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.34563446044922, -30.972518920898438, -29.599403381347656, -28.226289749145508, -26.853174209594727, -25.480058670043945, -24.106945037841797, -22.733829498291016, -21.360713958740234, -19.987598419189453, -18.614482879638672, -17.241369247436523, -15.868253707885742, -14.495138168334961, -13.122023582458496, -11.748907089233398, -10.375791549682617, -9.002676963806152, -7.629561424255371, -6.256446361541748, -4.883331298828125, -3.5102157592773438, -2.137101173400879, -0.7639856338500977, 0.6091295480728149, 1.9822447299957275, 3.3553600311279297, 4.728475093841553, 6.101590156555176, 7.474705696105957, 8.847820281982422, 10.220935821533203, 11.594051361083984, 12.96716594696045, 14.34028148651123, 15.713396072387695, 17.086511611938477, 18.459627151489258, 19.832740783691406, 21.205856323242188, 22.57897186279297, 23.95208740234375, 25.32520294189453, 26.69831657409668, 28.07143211364746, 29.444547653198242, 30.81766128540039, 32.19078063964844, 33.56389617919922, 34.93701171875, 36.31012725830078, 37.68324279785156, 39.056358337402344, 40.429473876953125, 41.80258560180664, 43.17570114135742, 44.5488166809082, 45.921932220458984, 47.295047760009766, 48.66816329956055, 50.04127502441406, 51.414390563964844, 52.787506103515625, 54.160621643066406]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 3.0, 11.0, 8.0, 13.0, 15.0, 27.0, 25.0, 53.0, 71.0, 111.0, 153.0, 230.0, 356.0, 484.0, 757.0, 1270.0, 2343.0, 4923.0, 12286.0, 39192.0, 147367.0, 592249.0, 4509129.0, 723973.0, 183102.0, 47266.0, 14737.0, 5358.0, 2528.0, 1241.0, 764.0, 502.0, 310.0, 186.0, 143.0, 80.0, 52.0, 27.0, 33.0, 15.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.63037109375, -0.6144447326660156, -0.5985183715820312, -0.5825920104980469, -0.5666656494140625, -0.5507392883300781, -0.5348129272460938, -0.5188865661621094, -0.502960205078125, -0.4870338439941406, -0.47110748291015625, -0.4551811218261719, -0.4392547607421875, -0.4233283996582031, -0.40740203857421875, -0.3914756774902344, -0.37554931640625, -0.3596229553222656, -0.34369659423828125, -0.3277702331542969, -0.3118438720703125, -0.2959175109863281, -0.27999114990234375, -0.2640647888183594, -0.248138427734375, -0.23221206665039062, -0.21628570556640625, -0.20035934448242188, -0.1844329833984375, -0.16850662231445312, -0.15258026123046875, -0.13665390014648438, -0.1207275390625, -0.10480117797851562, -0.08887481689453125, -0.07294845581054688, -0.0570220947265625, -0.041095733642578125, -0.02516937255859375, -0.009243011474609375, 0.006683349609375, 0.022609710693359375, 0.03853607177734375, 0.054462432861328125, 0.0703887939453125, 0.08631515502929688, 0.10224151611328125, 0.11816787719726562, 0.13409423828125, 0.15002059936523438, 0.16594696044921875, 0.18187332153320312, 0.1977996826171875, 0.21372604370117188, 0.22965240478515625, 0.24557876586914062, 0.261505126953125, 0.2774314880371094, 0.29335784912109375, 0.3092842102050781, 0.3252105712890625, 0.3411369323730469, 0.35706329345703125, 0.3729896545410156, 0.388916015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 10.0, 16.0, 10.0, 17.0, 22.0, 25.0, 18.0, 34.0, 44.0, 39.0, 55.0, 52.0, 53.0, 105.0, 1006.0, 59.0, 59.0, 54.0, 46.0, 40.0, 38.0, 33.0, 30.0, 27.0, 21.0, 21.0, 18.0, 14.0, 9.0, 4.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.15625, -17.552734375, -16.94921875, -16.345703125, -15.7421875, -15.138671875, -14.53515625, -13.931640625, -13.328125, -12.724609375, -12.12109375, -11.517578125, -10.9140625, -10.310546875, -9.70703125, -9.103515625, -8.5, -7.896484375, -7.29296875, -6.689453125, -6.0859375, -5.482421875, -4.87890625, -4.275390625, -3.671875, -3.068359375, -2.46484375, -1.861328125, -1.2578125, -0.654296875, -0.05078125, 0.552734375, 1.15625, 1.759765625, 2.36328125, 2.966796875, 3.5703125, 4.173828125, 4.77734375, 5.380859375, 5.984375, 6.587890625, 7.19140625, 7.794921875, 8.3984375, 9.001953125, 9.60546875, 10.208984375, 10.8125, 11.416015625, 12.01953125, 12.623046875, 13.2265625, 13.830078125, 14.43359375, 15.037109375, 15.640625, 16.244140625, 16.84765625, 17.451171875, 18.0546875, 18.658203125, 19.26171875, 19.865234375, 20.46875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 0.0, 17.0, 20.0, 16.0, 20.0, 30.0, 43.0, 49.0, 40.0, 49.0, 65.0, 80.0, 119.0, 150.0, 198.0, 249.0, 337.0, 394.0, 523.0, 771.0, 1212.0, 1986.0, 3713.0, 7658.0, 17265.0, 46175.0, 138520.0, 445342.0, 4206059.0, 920655.0, 331574.0, 103870.0, 35495.0, 13785.0, 6042.0, 3165.0, 1670.0, 1146.0, 761.0, 516.0, 354.0, 292.0, 214.0, 167.0, 133.0, 106.0, 90.0, 72.0, 74.0, 44.0, 25.0, 21.0, 14.0, 21.0, 15.0, 4.0, 7.0, 3.0, 5.0, 2.0], "bins": [-0.322265625, -0.31246185302734375, -0.3026580810546875, -0.29285430908203125, -0.283050537109375, -0.27324676513671875, -0.2634429931640625, -0.25363922119140625, -0.24383544921875, -0.23403167724609375, -0.2242279052734375, -0.21442413330078125, -0.204620361328125, -0.19481658935546875, -0.1850128173828125, -0.17520904541015625, -0.1654052734375, -0.15560150146484375, -0.1457977294921875, -0.13599395751953125, -0.126190185546875, -0.11638641357421875, -0.1065826416015625, -0.09677886962890625, -0.08697509765625, -0.07717132568359375, -0.0673675537109375, -0.05756378173828125, -0.047760009765625, -0.03795623779296875, -0.0281524658203125, -0.01834869384765625, -0.008544921875, 0.00125885009765625, 0.0110626220703125, 0.02086639404296875, 0.030670166015625, 0.04047393798828125, 0.0502777099609375, 0.06008148193359375, 0.06988525390625, 0.07968902587890625, 0.0894927978515625, 0.09929656982421875, 0.109100341796875, 0.11890411376953125, 0.1287078857421875, 0.13851165771484375, 0.1483154296875, 0.15811920166015625, 0.1679229736328125, 0.17772674560546875, 0.187530517578125, 0.19733428955078125, 0.2071380615234375, 0.21694183349609375, 0.22674560546875, 0.23654937744140625, 0.2463531494140625, 0.25615692138671875, 0.265960693359375, 0.27576446533203125, 0.2855682373046875, 0.29537200927734375, 0.30517578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 17.0, 16.0, 14.0, 23.0, 35.0, 28.0, 35.0, 59.0, 49.0, 47.0, 61.0, 56.0, 1076.0, 72.0, 71.0, 61.0, 50.0, 51.0, 38.0, 32.0, 23.0, 17.0, 10.0, 20.0, 14.0, 9.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.1875, -22.515380859375, -21.84326171875, -21.171142578125, -20.4990234375, -19.826904296875, -19.15478515625, -18.482666015625, -17.810546875, -17.138427734375, -16.46630859375, -15.794189453125, -15.1220703125, -14.449951171875, -13.77783203125, -13.105712890625, -12.43359375, -11.761474609375, -11.08935546875, -10.417236328125, -9.7451171875, -9.072998046875, -8.40087890625, -7.728759765625, -7.056640625, -6.384521484375, -5.71240234375, -5.040283203125, -4.3681640625, -3.696044921875, -3.02392578125, -2.351806640625, -1.6796875, -1.007568359375, -0.33544921875, 0.336669921875, 1.0087890625, 1.680908203125, 2.35302734375, 3.025146484375, 3.697265625, 4.369384765625, 5.04150390625, 5.713623046875, 6.3857421875, 7.057861328125, 7.72998046875, 8.402099609375, 9.07421875, 9.746337890625, 10.41845703125, 11.090576171875, 11.7626953125, 12.434814453125, 13.10693359375, 13.779052734375, 14.451171875, 15.123291015625, 15.79541015625, 16.467529296875, 17.1396484375, 17.811767578125, 18.48388671875, 19.156005859375, 19.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 13.0, 11.0, 20.0, 23.0, 43.0, 60.0, 98.0, 228.0, 409.0, 729.0, 1565.0, 3940.0, 23214.0, 6129902.0, 119443.0, 6912.0, 2549.0, 1022.0, 553.0, 243.0, 184.0, 74.0, 55.0, 36.0, 28.0, 23.0, 12.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.4609375, -2.3989410400390625, -2.336944580078125, -2.2749481201171875, -2.21295166015625, -2.1509552001953125, -2.088958740234375, -2.0269622802734375, -1.9649658203125, -1.9029693603515625, -1.840972900390625, -1.7789764404296875, -1.71697998046875, -1.6549835205078125, -1.592987060546875, -1.5309906005859375, -1.468994140625, -1.4069976806640625, -1.345001220703125, -1.2830047607421875, -1.22100830078125, -1.1590118408203125, -1.097015380859375, -1.0350189208984375, -0.9730224609375, -0.9110260009765625, -0.849029541015625, -0.7870330810546875, -0.72503662109375, -0.6630401611328125, -0.601043701171875, -0.5390472412109375, -0.47705078125, -0.4150543212890625, -0.353057861328125, -0.2910614013671875, -0.22906494140625, -0.1670684814453125, -0.105072021484375, -0.0430755615234375, 0.0189208984375, 0.0809173583984375, 0.142913818359375, 0.2049102783203125, 0.26690673828125, 0.3289031982421875, 0.390899658203125, 0.4528961181640625, 0.514892578125, 0.5768890380859375, 0.638885498046875, 0.7008819580078125, 0.76287841796875, 0.8248748779296875, 0.886871337890625, 0.9488677978515625, 1.0108642578125, 1.0728607177734375, 1.134857177734375, 1.1968536376953125, 1.25885009765625, 1.3208465576171875, 1.382843017578125, 1.4448394775390625, 1.5068359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 8.0, 11.0, 15.0, 38.0, 56.0, 83.0, 94.0, 120.0, 1152.0, 106.0, 100.0, 67.0, 71.0, 47.0, 18.0, 15.0, 8.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.40625, -14.3388671875, -13.271484375, -12.2041015625, -11.13671875, -10.0693359375, -9.001953125, -7.9345703125, -6.8671875, -5.7998046875, -4.732421875, -3.6650390625, -2.59765625, -1.5302734375, -0.462890625, 0.6044921875, 1.671875, 2.7392578125, 3.806640625, 4.8740234375, 5.94140625, 7.0087890625, 8.076171875, 9.1435546875, 10.2109375, 11.2783203125, 12.345703125, 13.4130859375, 14.48046875, 15.5478515625, 16.615234375, 17.6826171875, 18.75, 19.8173828125, 20.884765625, 21.9521484375, 23.01953125, 24.0869140625, 25.154296875, 26.2216796875, 27.2890625, 28.3564453125, 29.423828125, 30.4912109375, 31.55859375, 32.6259765625, 33.693359375, 34.7607421875, 35.828125, 36.8955078125, 37.962890625, 39.0302734375, 40.09765625, 41.1650390625, 42.232421875, 43.2998046875, 44.3671875, 45.4345703125, 46.501953125, 47.5693359375, 48.63671875, 49.7041015625, 50.771484375, 51.8388671875, 52.90625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 16.0, 883.0, 107.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4377670288086, -85.56261444091797, -82.68745422363281, -79.81230163574219, -76.93714904785156, -74.0619888305664, -71.18683624267578, -68.31167602539062, -65.4365234375, -62.56136703491211, -59.68621063232422, -56.811058044433594, -53.9359016418457, -51.06074523925781, -48.18559265136719, -45.3104362487793, -42.435279846191406, -39.560123443603516, -36.684967041015625, -33.809814453125, -30.93465805053711, -28.05950164794922, -25.18434715270996, -22.309192657470703, -19.434036254882812, -16.558879852294922, -13.683725357055664, -10.80856990814209, -7.933414459228516, -5.058259010314941, -2.183103561401367, 0.6920509338378906, 3.56719970703125, 6.442355155944824, 9.317510604858398, 12.192666053771973, 15.067821502685547, 17.942977905273438, 20.818132400512695, 23.693286895751953, 26.568443298339844, 29.443599700927734, 32.318756103515625, 35.19390869140625, 38.06906509399414, 40.94422149658203, 43.819374084472656, 46.69453048706055, 49.56968688964844, 52.44484329223633, 55.31999969482422, 58.195152282714844, 61.070308685302734, 63.945465087890625, 66.82061767578125, 69.69577026367188, 72.57093048095703, 75.44608306884766, 78.32124328613281, 81.19639587402344, 84.07154846191406, 86.94670867919922, 89.82186126708984, 92.697021484375, 95.57217407226562]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 21.0, 56.0, 118.0, 186.0, 207.0, 182.0, 117.0, 58.0, 24.0, 16.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.10977935791016, -93.33302307128906, -90.55626678466797, -87.7795181274414, -85.00276184082031, -82.22600555419922, -79.44924926757812, -76.67250061035156, -73.89574432373047, -71.11898803710938, -68.34223175048828, -65.56548309326172, -62.788726806640625, -60.01197052001953, -57.23521423339844, -54.45846176147461, -51.681705474853516, -48.90494918823242, -46.128196716308594, -43.3514404296875, -40.57468795776367, -37.79793167114258, -35.02117919921875, -32.244422912597656, -29.467668533325195, -26.690914154052734, -23.914159774780273, -21.137405395507812, -18.36064910888672, -15.583895683288574, -12.807140350341797, -10.030385971069336, -7.253631591796875, -4.476877212524414, -1.700122356414795, 1.0766324996948242, 3.853386878967285, 6.630141258239746, 9.406896591186523, 12.183650970458984, 14.960405349731445, 17.737159729003906, 20.513914108276367, 23.290668487548828, 26.067424774169922, 28.84417724609375, 31.620933532714844, 34.39768981933594, 37.174442291259766, 39.95119857788086, 42.72795104980469, 45.50470733642578, 48.28145980834961, 51.0582160949707, 53.83496856689453, 56.611724853515625, 59.38848114013672, 62.16523742675781, 64.9419937133789, 67.71874237060547, 70.49549865722656, 73.27225494384766, 76.04901123046875, 78.82575988769531, 81.6025161743164]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 21.0, 25.0, 3286.0, 6444.0, 134530.0, 4041061.0, 6289.0, 1330.0, 1236.0, 18.0, 8.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1585693359375, -0.15392494201660156, -0.14928054809570312, -0.1446361541748047, -0.13999176025390625, -0.1353473663330078, -0.13070297241210938, -0.12605857849121094, -0.1214141845703125, -0.11676979064941406, -0.11212539672851562, -0.10748100280761719, -0.10283660888671875, -0.09819221496582031, -0.09354782104492188, -0.08890342712402344, -0.084259033203125, -0.07961463928222656, -0.07497024536132812, -0.07032585144042969, -0.06568145751953125, -0.06103706359863281, -0.056392669677734375, -0.05174827575683594, -0.0471038818359375, -0.04245948791503906, -0.037815093994140625, -0.03317070007324219, -0.02852630615234375, -0.023881912231445312, -0.019237518310546875, -0.014593124389648438, -0.00994873046875, -0.0053043365478515625, -0.000659942626953125, 0.0039844512939453125, 0.00862884521484375, 0.013273239135742188, 0.017917633056640625, 0.022562026977539062, 0.0272064208984375, 0.03185081481933594, 0.036495208740234375, 0.04113960266113281, 0.04578399658203125, 0.05042839050292969, 0.055072784423828125, 0.05971717834472656, 0.064361572265625, 0.06900596618652344, 0.07365036010742188, 0.07829475402832031, 0.08293914794921875, 0.08758354187011719, 0.09222793579101562, 0.09687232971191406, 0.1015167236328125, 0.10616111755371094, 0.11080551147460938, 0.11544990539550781, 0.12009429931640625, 0.12473869323730469, 0.12938308715820312, 0.13402748107910156, 0.138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 59.0, 225.0, 579.0, 90.0, 28.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0906982421875, -0.08805465698242188, -0.08541107177734375, -0.08276748657226562, -0.0801239013671875, -0.07748031616210938, -0.07483673095703125, -0.07219314575195312, -0.069549560546875, -0.06690597534179688, -0.06426239013671875, -0.061618804931640625, -0.0589752197265625, -0.056331634521484375, -0.05368804931640625, -0.051044464111328125, -0.04840087890625, -0.045757293701171875, -0.04311370849609375, -0.040470123291015625, -0.0378265380859375, -0.035182952880859375, -0.03253936767578125, -0.029895782470703125, -0.027252197265625, -0.024608612060546875, -0.02196502685546875, -0.019321441650390625, -0.0166778564453125, -0.014034271240234375, -0.01139068603515625, -0.008747100830078125, -0.006103515625, -0.003459930419921875, -0.00081634521484375, 0.001827239990234375, 0.0044708251953125, 0.007114410400390625, 0.00975799560546875, 0.012401580810546875, 0.015045166015625, 0.017688751220703125, 0.02033233642578125, 0.022975921630859375, 0.0256195068359375, 0.028263092041015625, 0.03090667724609375, 0.033550262451171875, 0.03619384765625, 0.038837432861328125, 0.04148101806640625, 0.044124603271484375, 0.0467681884765625, 0.049411773681640625, 0.05205535888671875, 0.054698944091796875, 0.057342529296875, 0.059986114501953125, 0.06262969970703125, 0.06527328491210938, 0.0679168701171875, 0.07056045532226562, 0.07320404052734375, 0.07584762573242188, 0.0784912109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 9.0, 21.0, 31.0, 56.0, 70.0, 160.0, 351.0, 1695.0, 4187705.0, 3402.0, 390.0, 138.0, 65.0, 49.0, 28.0, 23.0, 12.0, 12.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1494140625, -0.1446819305419922, -0.13994979858398438, -0.13521766662597656, -0.13048553466796875, -0.12575340270996094, -0.12102127075195312, -0.11628913879394531, -0.1115570068359375, -0.10682487487792969, -0.10209274291992188, -0.09736061096191406, -0.09262847900390625, -0.08789634704589844, -0.08316421508789062, -0.07843208312988281, -0.073699951171875, -0.06896781921386719, -0.06423568725585938, -0.05950355529785156, -0.05477142333984375, -0.05003929138183594, -0.045307159423828125, -0.04057502746582031, -0.0358428955078125, -0.031110763549804688, -0.026378631591796875, -0.021646499633789062, -0.01691436767578125, -0.012182235717773438, -0.007450103759765625, -0.0027179718017578125, 0.00201416015625, 0.0067462921142578125, 0.011478424072265625, 0.016210556030273438, 0.02094268798828125, 0.025674819946289062, 0.030406951904296875, 0.03513908386230469, 0.0398712158203125, 0.04460334777832031, 0.049335479736328125, 0.05406761169433594, 0.05879974365234375, 0.06353187561035156, 0.06826400756835938, 0.07299613952636719, 0.077728271484375, 0.08246040344238281, 0.08719253540039062, 0.09192466735839844, 0.09665679931640625, 0.10138893127441406, 0.10612106323242188, 0.11085319519042969, 0.1155853271484375, 0.12031745910644531, 0.12504959106445312, 0.12978172302246094, 0.13451385498046875, 0.13924598693847656, 0.14397811889648438, 0.1487102508544922, 0.1534423828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 10.0, 20.0, 30.0, 51.0, 75.0, 154.0, 299.0, 710.0, 1325.0, 740.0, 294.0, 118.0, 67.0, 46.0, 26.0, 21.0, 13.0, 11.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032379150390625, -0.031352996826171875, -0.03032684326171875, -0.029300689697265625, -0.0282745361328125, -0.027248382568359375, -0.02622222900390625, -0.025196075439453125, -0.024169921875, -0.023143768310546875, -0.02211761474609375, -0.021091461181640625, -0.0200653076171875, -0.019039154052734375, -0.01801300048828125, -0.016986846923828125, -0.015960693359375, -0.014934539794921875, -0.01390838623046875, -0.012882232666015625, -0.0118560791015625, -0.010829925537109375, -0.00980377197265625, -0.008777618408203125, -0.00775146484375, -0.006725311279296875, -0.00569915771484375, -0.004673004150390625, -0.0036468505859375, -0.002620697021484375, -0.00159454345703125, -0.000568389892578125, 0.000457763671875, 0.001483917236328125, 0.00251007080078125, 0.003536224365234375, 0.0045623779296875, 0.005588531494140625, 0.00661468505859375, 0.007640838623046875, 0.0086669921875, 0.009693145751953125, 0.01071929931640625, 0.011745452880859375, 0.0127716064453125, 0.013797760009765625, 0.01482391357421875, 0.015850067138671875, 0.016876220703125, 0.017902374267578125, 0.01892852783203125, 0.019954681396484375, 0.0209808349609375, 0.022006988525390625, 0.02303314208984375, 0.024059295654296875, 0.02508544921875, 0.026111602783203125, 0.02713775634765625, 0.028163909912109375, 0.0291900634765625, 0.030216217041015625, 0.03124237060546875, 0.032268524169921875, 0.033294677734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 957.0, 59.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13312101364135742, -0.12063343077898026, -0.10814584791660309, -0.09565827250480652, -0.08317068964242935, -0.07068310678005219, -0.058195531368255615, -0.04570794850587845, -0.03322036564350128, -0.020732784643769264, -0.008245203644037247, 0.004242375493049622, 0.01672995835542679, 0.029217541217803955, 0.041705116629600525, 0.05419269949197769, 0.06668028235435486, 0.07916786521673203, 0.09165544807910919, 0.10414302349090576, 0.11663060635328293, 0.1291181892156601, 0.14160576462745667, 0.15409335494041443, 0.166580930352211, 0.17906850576400757, 0.19155609607696533, 0.2040436714887619, 0.21653124690055847, 0.22901883721351624, 0.2415064126253128, 0.2539939880371094, 0.26648157835006714, 0.2789691686630249, 0.2914567291736603, 0.30394431948661804, 0.3164319097995758, 0.3289194703102112, 0.34140706062316895, 0.3538946509361267, 0.3663822412490845, 0.37886983156204224, 0.3913573920726776, 0.4038449823856354, 0.41633257269859314, 0.4288201332092285, 0.4413077235221863, 0.45379531383514404, 0.4662828743457794, 0.4787704646587372, 0.49125802516937256, 0.5037456154823303, 0.5162332057952881, 0.5287207961082458, 0.5412083864212036, 0.5536959171295166, 0.5661835074424744, 0.5786710977554321, 0.5911586880683899, 0.6036462783813477, 0.6161338090896606, 0.6286213994026184, 0.6411089897155762, 0.6535965800285339, 0.6660841703414917]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 15.0, 14.0, 9.0, 12.0, 18.0, 17.0, 19.0, 27.0, 28.0, 28.0, 25.0, 23.0, 32.0, 42.0, 34.0, 32.0, 38.0, 40.0, 46.0, 36.0, 43.0, 46.0, 43.0, 25.0, 31.0, 36.0, 37.0, 30.0, 24.0, 24.0, 20.0, 20.0, 16.0, 12.0, 5.0, 12.0, 8.0, 5.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.051763057708740234, -0.050176411867141724, -0.048589762300252914, -0.047003112733364105, -0.045416466891765594, -0.043829821050167084, -0.042243171483278275, -0.040656521916389465, -0.039069876074790955, -0.037483230233192444, -0.035896580666303635, -0.034309931099414825, -0.032723285257816315, -0.031136637553572655, -0.029549989849328995, -0.027963342145085335, -0.026376694440841675, -0.024790046736598015, -0.023203399032354355, -0.021616751328110695, -0.020030103623867035, -0.018443455919623375, -0.016856808215379715, -0.015270160511136055, -0.013683512806892395, -0.012096865102648735, -0.010510217398405075, -0.008923569694161415, -0.007336921989917755, -0.005750274285674095, -0.004163626581430435, -0.002576978877186775, -0.0009903311729431152, 0.0005963165313005447, 0.0021829642355442047, 0.0037696119397878647, 0.005356259644031525, 0.006942907348275185, 0.008529555052518845, 0.010116202756762505, 0.011702850461006165, 0.013289498165249825, 0.014876145869493484, 0.016462793573737144, 0.018049441277980804, 0.019636088982224464, 0.021222736686468124, 0.022809384390711784, 0.024396032094955444, 0.025982679799199104, 0.027569327503442764, 0.029155975207686424, 0.030742622911930084, 0.032329268753528595, 0.033915918320417404, 0.03550256788730621, 0.037089213728904724, 0.038675859570503235, 0.040262509137392044, 0.04184915870428085, 0.043435804545879364, 0.045022450387477875, 0.046609099954366684, 0.04819574952125549, 0.049782395362854004]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 6.0, 7.0, 20.0, 30.0, 26.0, 37.0, 76.0, 96.0, 144.0, 251.0, 458.0, 1097.0, 7143.0, 1020429.0, 15718.0, 1636.0, 584.0, 280.0, 162.0, 86.0, 71.0, 38.0, 40.0, 17.0, 17.0, 11.0, 13.0, 12.0, 3.0, 1.0, 7.0, 7.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.21484375, -4.093109130859375, -3.97137451171875, -3.849639892578125, -3.7279052734375, -3.606170654296875, -3.48443603515625, -3.362701416015625, -3.240966796875, -3.119232177734375, -2.99749755859375, -2.875762939453125, -2.7540283203125, -2.632293701171875, -2.51055908203125, -2.388824462890625, -2.26708984375, -2.145355224609375, -2.02362060546875, -1.901885986328125, -1.7801513671875, -1.658416748046875, -1.53668212890625, -1.414947509765625, -1.293212890625, -1.171478271484375, -1.04974365234375, -0.928009033203125, -0.8062744140625, -0.684539794921875, -0.56280517578125, -0.441070556640625, -0.3193359375, -0.197601318359375, -0.07586669921875, 0.045867919921875, 0.1676025390625, 0.289337158203125, 0.41107177734375, 0.532806396484375, 0.654541015625, 0.776275634765625, 0.89801025390625, 1.019744873046875, 1.1414794921875, 1.263214111328125, 1.38494873046875, 1.506683349609375, 1.62841796875, 1.750152587890625, 1.87188720703125, 1.993621826171875, 2.1153564453125, 2.237091064453125, 2.35882568359375, 2.480560302734375, 2.602294921875, 2.724029541015625, 2.84576416015625, 2.967498779296875, 3.0892333984375, 3.210968017578125, 3.33270263671875, 3.454437255859375, 3.576171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 56.0, 203.0, 589.0, 101.0, 29.0, 11.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0897216796875, -0.08711051940917969, -0.08449935913085938, -0.08188819885253906, -0.07927703857421875, -0.07666587829589844, -0.07405471801757812, -0.07144355773925781, -0.0688323974609375, -0.06622123718261719, -0.06361007690429688, -0.06099891662597656, -0.05838775634765625, -0.05577659606933594, -0.053165435791015625, -0.05055427551269531, -0.047943115234375, -0.04533195495605469, -0.042720794677734375, -0.04010963439941406, -0.03749847412109375, -0.03488731384277344, -0.032276153564453125, -0.029664993286132812, -0.0270538330078125, -0.024442672729492188, -0.021831512451171875, -0.019220352172851562, -0.01660919189453125, -0.013998031616210938, -0.011386871337890625, -0.008775711059570312, -0.00616455078125, -0.0035533905029296875, -0.000942230224609375, 0.0016689300537109375, 0.00428009033203125, 0.0068912506103515625, 0.009502410888671875, 0.012113571166992188, 0.0147247314453125, 0.017335891723632812, 0.019947052001953125, 0.022558212280273438, 0.02516937255859375, 0.027780532836914062, 0.030391693115234375, 0.03300285339355469, 0.035614013671875, 0.03822517395019531, 0.040836334228515625, 0.04344749450683594, 0.04605865478515625, 0.04866981506347656, 0.051280975341796875, 0.05389213562011719, 0.0565032958984375, 0.05911445617675781, 0.061725616455078125, 0.06433677673339844, 0.06694793701171875, 0.06955909729003906, 0.07217025756835938, 0.07478141784667969, 0.077392578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 8.0, 4.0, 3.0, 8.0, 13.0, 17.0, 17.0, 21.0, 44.0, 77.0, 103.0, 156.0, 258.0, 567.0, 987.0, 1779.0, 3790.0, 8231.0, 19052.0, 49265.0, 178620.0, 589486.0, 127358.0, 39589.0, 15393.0, 6871.0, 3307.0, 1572.0, 836.0, 432.0, 261.0, 151.0, 85.0, 54.0, 39.0, 31.0, 14.0, 19.0, 11.0, 12.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09325122833251953, -0.09037208557128906, -0.0874929428100586, -0.08461380004882812, -0.08173465728759766, -0.07885551452636719, -0.07597637176513672, -0.07309722900390625, -0.07021808624267578, -0.06733894348144531, -0.06445980072021484, -0.061580657958984375, -0.058701515197753906, -0.05582237243652344, -0.05294322967529297, -0.0500640869140625, -0.04718494415283203, -0.04430580139160156, -0.041426658630371094, -0.038547515869140625, -0.035668373107910156, -0.03278923034667969, -0.02991008758544922, -0.02703094482421875, -0.02415180206298828, -0.021272659301757812, -0.018393516540527344, -0.015514373779296875, -0.012635231018066406, -0.009756088256835938, -0.006876945495605469, -0.003997802734375, -0.0011186599731445312, 0.0017604827880859375, 0.004639625549316406, 0.007518768310546875, 0.010397911071777344, 0.013277053833007812, 0.01615619659423828, 0.01903533935546875, 0.02191448211669922, 0.024793624877929688, 0.027672767639160156, 0.030551910400390625, 0.033431053161621094, 0.03631019592285156, 0.03918933868408203, 0.0420684814453125, 0.04494762420654297, 0.04782676696777344, 0.050705909729003906, 0.053585052490234375, 0.056464195251464844, 0.05934333801269531, 0.06222248077392578, 0.06510162353515625, 0.06798076629638672, 0.07085990905761719, 0.07373905181884766, 0.07661819458007812, 0.0794973373413086, 0.08237648010253906, 0.08525562286376953, 0.088134765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 8.0, 10.0, 24.0, 22.0, 21.0, 31.0, 24.0, 29.0, 36.0, 31.0, 42.0, 42.0, 52.0, 37.0, 43.0, 55.0, 49.0, 46.0, 37.0, 43.0, 41.0, 38.0, 33.0, 24.0, 26.0, 32.0, 14.0, 16.0, 6.0, 8.0, 12.0, 6.0, 7.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04718017578125, -0.0456395149230957, -0.044098854064941406, -0.04255819320678711, -0.04101753234863281, -0.039476871490478516, -0.03793621063232422, -0.03639554977416992, -0.034854888916015625, -0.03331422805786133, -0.03177356719970703, -0.030232906341552734, -0.028692245483398438, -0.02715158462524414, -0.025610923767089844, -0.024070262908935547, -0.02252960205078125, -0.020988941192626953, -0.019448280334472656, -0.01790761947631836, -0.016366958618164062, -0.014826297760009766, -0.013285636901855469, -0.011744976043701172, -0.010204315185546875, -0.008663654327392578, -0.007122993469238281, -0.005582332611083984, -0.0040416717529296875, -0.0025010108947753906, -0.0009603500366210938, 0.0005803108215332031, 0.0021209716796875, 0.003661632537841797, 0.005202293395996094, 0.006742954254150391, 0.008283615112304688, 0.009824275970458984, 0.011364936828613281, 0.012905597686767578, 0.014446258544921875, 0.015986919403076172, 0.01752758026123047, 0.019068241119384766, 0.020608901977539062, 0.02214956283569336, 0.023690223693847656, 0.025230884552001953, 0.02677154541015625, 0.028312206268310547, 0.029852867126464844, 0.03139352798461914, 0.03293418884277344, 0.034474849700927734, 0.03601551055908203, 0.03755617141723633, 0.039096832275390625, 0.04063749313354492, 0.04217815399169922, 0.043718814849853516, 0.04525947570800781, 0.04680013656616211, 0.048340797424316406, 0.0498814582824707, 0.051422119140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 7.0, 13.0, 16.0, 28.0, 59.0, 117.0, 224.0, 538.0, 1460.0, 5541.0, 38235.0, 881458.0, 107268.0, 9936.0, 2226.0, 792.0, 303.0, 152.0, 73.0, 45.0, 24.0, 16.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198211669921875, -0.01912999153137207, -0.01843881607055664, -0.01774764060974121, -0.01705646514892578, -0.01636528968811035, -0.015674114227294922, -0.014982938766479492, -0.014291763305664062, -0.013600587844848633, -0.012909412384033203, -0.012218236923217773, -0.011527061462402344, -0.010835886001586914, -0.010144710540771484, -0.009453535079956055, -0.008762359619140625, -0.008071184158325195, -0.007380008697509766, -0.006688833236694336, -0.005997657775878906, -0.0053064823150634766, -0.004615306854248047, -0.003924131393432617, -0.0032329559326171875, -0.002541780471801758, -0.0018506050109863281, -0.0011594295501708984, -0.00046825408935546875, 0.00022292137145996094, 0.0009140968322753906, 0.0016052722930908203, 0.00229644775390625, 0.0029876232147216797, 0.0036787986755371094, 0.004369974136352539, 0.005061149597167969, 0.0057523250579833984, 0.006443500518798828, 0.007134675979614258, 0.007825851440429688, 0.008517026901245117, 0.009208202362060547, 0.009899377822875977, 0.010590553283691406, 0.011281728744506836, 0.011972904205322266, 0.012664079666137695, 0.013355255126953125, 0.014046430587768555, 0.014737606048583984, 0.015428781509399414, 0.016119956970214844, 0.016811132431030273, 0.017502307891845703, 0.018193483352661133, 0.018884658813476562, 0.019575834274291992, 0.020267009735107422, 0.02095818519592285, 0.02164936065673828, 0.02234053611755371, 0.02303171157836914, 0.02372288703918457, 0.0244140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 17.0, 17.0, 41.0, 77.0, 174.0, 283.0, 190.0, 98.0, 47.0, 24.0, 6.0, 3.0, 0.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.27195292711258e-05, -6.735697388648987e-05, -6.199441850185394e-05, -5.663186311721802e-05, -5.126930773258209e-05, -4.590675234794617e-05, -4.054419696331024e-05, -3.5181641578674316e-05, -2.981908619403839e-05, -2.4456530809402466e-05, -1.909397542476654e-05, -1.3731420040130615e-05, -8.36886465549469e-06, -3.0063092708587646e-06, 2.3562461137771606e-06, 7.718801498413086e-06, 1.3081356883049011e-05, 1.8443912267684937e-05, 2.3806467652320862e-05, 2.9169023036956787e-05, 3.453157842159271e-05, 3.989413380622864e-05, 4.525668919086456e-05, 5.061924457550049e-05, 5.5981799960136414e-05, 6.134435534477234e-05, 6.670691072940826e-05, 7.206946611404419e-05, 7.743202149868011e-05, 8.279457688331604e-05, 8.815713226795197e-05, 9.351968765258789e-05, 9.888224303722382e-05, 0.00010424479842185974, 0.00010960735380649567, 0.00011496990919113159, 0.00012033246457576752, 0.00012569501996040344, 0.00013105757534503937, 0.0001364201307296753, 0.00014178268611431122, 0.00014714524149894714, 0.00015250779688358307, 0.000157870352268219, 0.00016323290765285492, 0.00016859546303749084, 0.00017395801842212677, 0.0001793205738067627, 0.00018468312919139862, 0.00019004568457603455, 0.00019540823996067047, 0.0002007707953453064, 0.00020613335072994232, 0.00021149590611457825, 0.00021685846149921417, 0.0002222210168838501, 0.00022758357226848602, 0.00023294612765312195, 0.00023830868303775787, 0.0002436712384223938, 0.0002490337938070297, 0.00025439634919166565, 0.0002597589045763016, 0.0002651214599609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 13.0, 11.0, 15.0, 24.0, 32.0, 48.0, 78.0, 198.0, 423.0, 994.0, 2920.0, 11055.0, 105368.0, 884654.0, 33311.0, 6210.0, 1903.0, 664.0, 283.0, 127.0, 73.0, 41.0, 26.0, 22.0, 16.0, 16.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195465087890625, -0.018901348114013672, -0.018256187438964844, -0.017611026763916016, -0.016965866088867188, -0.01632070541381836, -0.01567554473876953, -0.015030384063720703, -0.014385223388671875, -0.013740062713623047, -0.013094902038574219, -0.01244974136352539, -0.011804580688476562, -0.011159420013427734, -0.010514259338378906, -0.009869098663330078, -0.00922393798828125, -0.008578777313232422, -0.007933616638183594, -0.007288455963134766, -0.0066432952880859375, -0.005998134613037109, -0.005352973937988281, -0.004707813262939453, -0.004062652587890625, -0.003417491912841797, -0.0027723312377929688, -0.0021271705627441406, -0.0014820098876953125, -0.0008368492126464844, -0.00019168853759765625, 0.0004534721374511719, 0.0010986328125, 0.0017437934875488281, 0.0023889541625976562, 0.0030341148376464844, 0.0036792755126953125, 0.004324436187744141, 0.004969596862792969, 0.005614757537841797, 0.006259918212890625, 0.006905078887939453, 0.007550239562988281, 0.00819540023803711, 0.008840560913085938, 0.009485721588134766, 0.010130882263183594, 0.010776042938232422, 0.01142120361328125, 0.012066364288330078, 0.012711524963378906, 0.013356685638427734, 0.014001846313476562, 0.01464700698852539, 0.015292167663574219, 0.015937328338623047, 0.016582489013671875, 0.017227649688720703, 0.01787281036376953, 0.01851797103881836, 0.019163131713867188, 0.019808292388916016, 0.020453453063964844, 0.021098613739013672, 0.0217437744140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 8.0, 6.0, 9.0, 8.0, 17.0, 21.0, 24.0, 30.0, 68.0, 91.0, 173.0, 210.0, 101.0, 62.0, 54.0, 27.0, 24.0, 12.0, 7.0, 5.0, 5.0, 3.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.008989214897155762, -0.008632421493530273, -0.008275628089904785, -0.007918834686279297, -0.007562041282653809, -0.00720524787902832, -0.006848454475402832, -0.006491661071777344, -0.0061348676681518555, -0.005778074264526367, -0.005421280860900879, -0.005064487457275391, -0.004707694053649902, -0.004350900650024414, -0.003994107246398926, -0.0036373138427734375, -0.0032805204391479492, -0.002923727035522461, -0.0025669336318969727, -0.0022101402282714844, -0.001853346824645996, -0.0014965534210205078, -0.0011397600173950195, -0.0007829666137695312, -0.00042617321014404297, -6.937980651855469e-05, 0.0002874135971069336, 0.0006442070007324219, 0.0010010004043579102, 0.0013577938079833984, 0.0017145872116088867, 0.002071380615234375, 0.0024281740188598633, 0.0027849674224853516, 0.00314176082611084, 0.003498554229736328, 0.0038553476333618164, 0.004212141036987305, 0.004568934440612793, 0.004925727844238281, 0.0052825212478637695, 0.005639314651489258, 0.005996108055114746, 0.006352901458740234, 0.006709694862365723, 0.007066488265991211, 0.007423281669616699, 0.0077800750732421875, 0.008136868476867676, 0.008493661880493164, 0.008850455284118652, 0.00920724868774414, 0.009564042091369629, 0.009920835494995117, 0.010277628898620605, 0.010634422302246094, 0.010991215705871582, 0.01134800910949707, 0.011704802513122559, 0.012061595916748047, 0.012418389320373535, 0.012775182723999023, 0.013131976127624512, 0.01348876953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 10.0, 17.0, 31.0, 87.0, 304.0, 266.0, 130.0, 50.0, 42.0, 19.0, 20.0, 4.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4709995985031128, -0.453492671251297, -0.4359857439994812, -0.4184788465499878, -0.400971919298172, -0.3834649920463562, -0.3659580647945404, -0.3484511375427246, -0.3309442400932312, -0.3134373128414154, -0.2959303855895996, -0.2784234881401062, -0.2609165608882904, -0.2434096336364746, -0.2259027063846588, -0.20839577913284302, -0.19088885188102722, -0.17338192462921143, -0.15587501227855682, -0.13836808502674103, -0.12086116522550583, -0.10335424542427063, -0.08584731817245483, -0.06834039837121964, -0.050833478569984436, -0.03332655876874924, -0.01581963524222374, 0.0016872882843017578, 0.019194208085536957, 0.036701127886772156, 0.05420805513858795, 0.07171497493982315, 0.08922189474105835, 0.10672881454229355, 0.12423573434352875, 0.14174266159534454, 0.15924957394599915, 0.17675650119781494, 0.19426342844963074, 0.21177035570144653, 0.22927726805210114, 0.24678419530391693, 0.26429110765457153, 0.28179803490638733, 0.2993049621582031, 0.31681185960769653, 0.3343188166618347, 0.3518257141113281, 0.3693326413631439, 0.3868395686149597, 0.4043464958667755, 0.4218534231185913, 0.4393603205680847, 0.4568672478199005, 0.4743741750717163, 0.4918811023235321, 0.5093880295753479, 0.5268949270248413, 0.5444018840789795, 0.5619087815284729, 0.5794157385826111, 0.5969226360321045, 0.6144295930862427, 0.6319364905357361, 0.6494433879852295]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 20.0, 42.0, 62.0, 83.0, 120.0, 108.0, 133.0, 127.0, 84.0, 78.0, 58.0, 28.0, 20.0, 11.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5549145936965942, -0.535903811454773, -0.5168930888175964, -0.49788230657577515, -0.47887152433395386, -0.45986077189445496, -0.44085001945495605, -0.42183923721313477, -0.40282848477363586, -0.38381773233413696, -0.3648069500923157, -0.3457961976528168, -0.32678544521331787, -0.3077746629714966, -0.2887639105319977, -0.2697531580924988, -0.2507423758506775, -0.2317316085100174, -0.2127208411693573, -0.1937100887298584, -0.1746993213891983, -0.1556885540485382, -0.1366778016090393, -0.11766703426837921, -0.09865626692771912, -0.07964549958705902, -0.06063473969697952, -0.041623976081609726, -0.02261321246623993, -0.003602445125579834, 0.015408314764499664, 0.03441907465457916, 0.05342990159988403, 0.07244066894054413, 0.09145142883062363, 0.11046218872070312, 0.12947295606136322, 0.14848372340202332, 0.16749447584152222, 0.1865052431821823, 0.2055160105228424, 0.2245267778635025, 0.2435375452041626, 0.2625482976436615, 0.2815590500831604, 0.3005698323249817, 0.3195805847644806, 0.3385913372039795, 0.3576021194458008, 0.3766128718852997, 0.39562365412712097, 0.4146344065666199, 0.43364518880844116, 0.45265594124794006, 0.47166669368743896, 0.49067747592926025, 0.5096882581710815, 0.5286990404129028, 0.5477097630500793, 0.5667205452919006, 0.5857313275337219, 0.6047420501708984, 0.6237528324127197, 0.642763614654541, 0.6617743372917175]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 11.0, 14.0, 9.0, 19.0, 25.0, 30.0, 47.0, 54.0, 86.0, 102.0, 207.0, 592.0, 4910.0, 4169072.0, 17017.0, 1136.0, 328.0, 152.0, 118.0, 89.0, 67.0, 41.0, 37.0, 29.0, 18.0, 21.0, 10.0, 11.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4951171875, -0.48040771484375, -0.4656982421875, -0.45098876953125, -0.436279296875, -0.42156982421875, -0.4068603515625, -0.39215087890625, -0.37744140625, -0.36273193359375, -0.3480224609375, -0.33331298828125, -0.318603515625, -0.30389404296875, -0.2891845703125, -0.27447509765625, -0.259765625, -0.24505615234375, -0.2303466796875, -0.21563720703125, -0.200927734375, -0.18621826171875, -0.1715087890625, -0.15679931640625, -0.14208984375, -0.12738037109375, -0.1126708984375, -0.09796142578125, -0.083251953125, -0.06854248046875, -0.0538330078125, -0.03912353515625, -0.0244140625, -0.00970458984375, 0.0050048828125, 0.01971435546875, 0.034423828125, 0.04913330078125, 0.0638427734375, 0.07855224609375, 0.09326171875, 0.10797119140625, 0.1226806640625, 0.13739013671875, 0.152099609375, 0.16680908203125, 0.1815185546875, 0.19622802734375, 0.2109375, 0.22564697265625, 0.2403564453125, 0.25506591796875, 0.269775390625, 0.28448486328125, 0.2991943359375, 0.31390380859375, 0.32861328125, 0.34332275390625, 0.3580322265625, 0.37274169921875, 0.387451171875, 0.40216064453125, 0.4168701171875, 0.43157958984375, 0.4462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 18.0, 94.0, 396.0, 395.0, 63.0, 22.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0830078125, -0.0805673599243164, -0.07812690734863281, -0.07568645477294922, -0.07324600219726562, -0.07080554962158203, -0.06836509704589844, -0.06592464447021484, -0.06348419189453125, -0.061043739318847656, -0.05860328674316406, -0.05616283416748047, -0.053722381591796875, -0.05128192901611328, -0.04884147644042969, -0.046401023864746094, -0.0439605712890625, -0.041520118713378906, -0.03907966613769531, -0.03663921356201172, -0.034198760986328125, -0.03175830841064453, -0.029317855834960938, -0.026877403259277344, -0.02443695068359375, -0.021996498107910156, -0.019556045532226562, -0.01711559295654297, -0.014675140380859375, -0.012234687805175781, -0.009794235229492188, -0.007353782653808594, -0.004913330078125, -0.0024728775024414062, -3.24249267578125e-05, 0.0024080276489257812, 0.004848480224609375, 0.007288932800292969, 0.009729385375976562, 0.012169837951660156, 0.01461029052734375, 0.017050743103027344, 0.019491195678710938, 0.02193164825439453, 0.024372100830078125, 0.02681255340576172, 0.029253005981445312, 0.031693458557128906, 0.0341339111328125, 0.036574363708496094, 0.03901481628417969, 0.04145526885986328, 0.043895721435546875, 0.04633617401123047, 0.04877662658691406, 0.051217079162597656, 0.05365753173828125, 0.056097984313964844, 0.05853843688964844, 0.06097888946533203, 0.06341934204101562, 0.06585979461669922, 0.06830024719238281, 0.0707406997680664, 0.07318115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 24.0, 34.0, 56.0, 137.0, 424.0, 2334.0, 114974.0, 4069200.0, 6006.0, 705.0, 210.0, 79.0, 38.0, 26.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2739429473876953, -0.2671241760253906, -0.26030540466308594, -0.25348663330078125, -0.24666786193847656, -0.23984909057617188, -0.2330303192138672, -0.2262115478515625, -0.2193927764892578, -0.21257400512695312, -0.20575523376464844, -0.19893646240234375, -0.19211769104003906, -0.18529891967773438, -0.1784801483154297, -0.171661376953125, -0.1648426055908203, -0.15802383422851562, -0.15120506286621094, -0.14438629150390625, -0.13756752014160156, -0.13074874877929688, -0.12392997741699219, -0.1171112060546875, -0.11029243469238281, -0.10347366333007812, -0.09665489196777344, -0.08983612060546875, -0.08301734924316406, -0.07619857788085938, -0.06937980651855469, -0.06256103515625, -0.05574226379394531, -0.048923492431640625, -0.04210472106933594, -0.03528594970703125, -0.028467178344726562, -0.021648406982421875, -0.014829635620117188, -0.0080108642578125, -0.0011920928955078125, 0.005626678466796875, 0.012445449829101562, 0.01926422119140625, 0.026082992553710938, 0.032901763916015625, 0.03972053527832031, 0.046539306640625, 0.05335807800292969, 0.060176849365234375, 0.06699562072753906, 0.07381439208984375, 0.08063316345214844, 0.08745193481445312, 0.09427070617675781, 0.1010894775390625, 0.10790824890136719, 0.11472702026367188, 0.12154579162597656, 0.12836456298828125, 0.13518333435058594, 0.14200210571289062, 0.1488208770751953, 0.1556396484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 9.0, 9.0, 20.0, 31.0, 50.0, 111.0, 260.0, 1941.0, 1222.0, 236.0, 89.0, 41.0, 26.0, 13.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09160423278808594, -0.08951950073242188, -0.08743476867675781, -0.08535003662109375, -0.08326530456542969, -0.08118057250976562, -0.07909584045410156, -0.0770111083984375, -0.07492637634277344, -0.07284164428710938, -0.07075691223144531, -0.06867218017578125, -0.06658744812011719, -0.06450271606445312, -0.06241798400878906, -0.060333251953125, -0.05824851989746094, -0.056163787841796875, -0.05407905578613281, -0.05199432373046875, -0.04990959167480469, -0.047824859619140625, -0.04574012756347656, -0.0436553955078125, -0.04157066345214844, -0.039485931396484375, -0.03740119934082031, -0.03531646728515625, -0.03323173522949219, -0.031147003173828125, -0.029062271118164062, -0.0269775390625, -0.024892807006835938, -0.022808074951171875, -0.020723342895507812, -0.01863861083984375, -0.016553878784179688, -0.014469146728515625, -0.012384414672851562, -0.0102996826171875, -0.008214950561523438, -0.006130218505859375, -0.0040454864501953125, -0.00196075439453125, 0.0001239776611328125, 0.002208709716796875, 0.0042934417724609375, 0.006378173828125, 0.008462905883789062, 0.010547637939453125, 0.012632369995117188, 0.01471710205078125, 0.016801834106445312, 0.018886566162109375, 0.020971298217773438, 0.0230560302734375, 0.025140762329101562, 0.027225494384765625, 0.029310226440429688, 0.03139495849609375, 0.03347969055175781, 0.035564422607421875, 0.03764915466308594, 0.03973388671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 43.0, 657.0, 303.0, 8.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47507214546203613, -0.4534001350402832, -0.4317281246185303, -0.41005611419677734, -0.3883841037750244, -0.3667120933532715, -0.34504005312919617, -0.32336804270744324, -0.3016960322856903, -0.2800240218639374, -0.25835201144218445, -0.23667998611927032, -0.2150079756975174, -0.19333596527576447, -0.17166393995285034, -0.1499919295310974, -0.12831991910934448, -0.10664790868759155, -0.08497589081525803, -0.0633038729429245, -0.04163186252117157, -0.01995985209941864, 0.0017121732234954834, 0.023384183645248413, 0.04505619406700134, 0.06672820448875427, 0.0884002223610878, 0.11007224023342133, 0.13174425065517426, 0.15341626107692719, 0.1750882863998413, 0.19676029682159424, 0.21843230724334717, 0.2401043176651001, 0.261776328086853, 0.28344833850860596, 0.3051203489303589, 0.3267923593521118, 0.34846439957618713, 0.37013640999794006, 0.391808420419693, 0.4134804308414459, 0.43515244126319885, 0.45682448148727417, 0.4784964919090271, 0.50016850233078, 0.521840512752533, 0.5435125231742859, 0.5651845335960388, 0.5868565440177917, 0.6085285544395447, 0.6302005648612976, 0.6518725752830505, 0.6735445857048035, 0.6952166557312012, 0.7168886661529541, 0.738560676574707, 0.76023268699646, 0.7819046974182129, 0.8035767078399658, 0.8252487182617188, 0.8469207286834717, 0.8685927391052246, 0.8902647495269775, 0.9119367599487305]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 13.0, 20.0, 21.0, 22.0, 18.0, 19.0, 32.0, 38.0, 26.0, 30.0, 33.0, 46.0, 25.0, 25.0, 34.0, 37.0, 43.0, 42.0, 41.0, 33.0, 45.0, 38.0, 40.0, 33.0, 23.0, 27.0, 19.0, 16.0, 17.0, 16.0, 17.0, 10.0, 15.0, 13.0, 6.0, 6.0, 5.0, 9.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06899738311767578, -0.06689704954624176, -0.06479671597480774, -0.06269637495279312, -0.0605960413813591, -0.05849570780992508, -0.05639537051320076, -0.05429503321647644, -0.05219469964504242, -0.0500943660736084, -0.04799402877688408, -0.04589369148015976, -0.04379335790872574, -0.04169302433729172, -0.0395926870405674, -0.03749234974384308, -0.03539201617240906, -0.03329168260097504, -0.031191345304250717, -0.029091009870171547, -0.026990674436092377, -0.024890339002013206, -0.022790003567934036, -0.020689668133854866, -0.018589332699775696, -0.016488997265696526, -0.014388661831617355, -0.012288326397538185, -0.010187990963459015, -0.008087655529379845, -0.0059873200953006744, -0.003886984661221504, -0.001786649227142334, 0.00031368620693683624, 0.0024140216410160065, 0.004514357075095177, 0.006614692509174347, 0.008715027943253517, 0.010815363377332687, 0.012915698811411858, 0.015016034245491028, 0.017116369679570198, 0.01921670511364937, 0.02131704054772854, 0.02341737598180771, 0.02551771141588688, 0.02761804684996605, 0.02971838228404522, 0.03181871771812439, 0.03391905128955841, 0.03601938858628273, 0.03811972588300705, 0.04022005945444107, 0.04232039302587509, 0.04442073032259941, 0.04652106761932373, 0.04862140119075775, 0.05072173476219177, 0.05282207205891609, 0.05492240935564041, 0.05702274292707443, 0.05912307649850845, 0.06122341379523277, 0.06332375109195709, 0.06542408466339111]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 7.0, 5.0, 9.0, 7.0, 13.0, 14.0, 18.0, 27.0, 46.0, 41.0, 51.0, 82.0, 106.0, 131.0, 171.0, 270.0, 358.0, 517.0, 967.0, 3441.0, 52973.0, 964744.0, 19763.0, 2274.0, 836.0, 507.0, 293.0, 235.0, 138.0, 126.0, 65.0, 88.0, 52.0, 40.0, 29.0, 28.0, 15.0, 18.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1611328125, -0.15599632263183594, -0.15085983276367188, -0.1457233428955078, -0.14058685302734375, -0.1354503631591797, -0.13031387329101562, -0.12517738342285156, -0.1200408935546875, -0.11490440368652344, -0.10976791381835938, -0.10463142395019531, -0.09949493408203125, -0.09435844421386719, -0.08922195434570312, -0.08408546447753906, -0.078948974609375, -0.07381248474121094, -0.06867599487304688, -0.06353950500488281, -0.05840301513671875, -0.05326652526855469, -0.048130035400390625, -0.04299354553222656, -0.0378570556640625, -0.03272056579589844, -0.027584075927734375, -0.022447586059570312, -0.01731109619140625, -0.012174606323242188, -0.007038116455078125, -0.0019016265869140625, 0.00323486328125, 0.008371353149414062, 0.013507843017578125, 0.018644332885742188, 0.02378082275390625, 0.028917312622070312, 0.034053802490234375, 0.03919029235839844, 0.0443267822265625, 0.04946327209472656, 0.054599761962890625, 0.05973625183105469, 0.06487274169921875, 0.07000923156738281, 0.07514572143554688, 0.08028221130371094, 0.085418701171875, 0.09055519104003906, 0.09569168090820312, 0.10082817077636719, 0.10596466064453125, 0.11110115051269531, 0.11623764038085938, 0.12137413024902344, 0.1265106201171875, 0.13164710998535156, 0.13678359985351562, 0.1419200897216797, 0.14705657958984375, 0.1521930694580078, 0.15732955932617188, 0.16246604919433594, 0.1676025390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 30.0, 129.0, 493.0, 273.0, 48.0, 16.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08514404296875, -0.08269500732421875, -0.0802459716796875, -0.07779693603515625, -0.075347900390625, -0.07289886474609375, -0.0704498291015625, -0.06800079345703125, -0.0655517578125, -0.06310272216796875, -0.0606536865234375, -0.05820465087890625, -0.055755615234375, -0.05330657958984375, -0.0508575439453125, -0.04840850830078125, -0.04595947265625, -0.04351043701171875, -0.0410614013671875, -0.03861236572265625, -0.036163330078125, -0.03371429443359375, -0.0312652587890625, -0.02881622314453125, -0.0263671875, -0.02391815185546875, -0.0214691162109375, -0.01902008056640625, -0.016571044921875, -0.01412200927734375, -0.0116729736328125, -0.00922393798828125, -0.00677490234375, -0.00432586669921875, -0.0018768310546875, 0.00057220458984375, 0.003021240234375, 0.00547027587890625, 0.0079193115234375, 0.01036834716796875, 0.0128173828125, 0.01526641845703125, 0.0177154541015625, 0.02016448974609375, 0.022613525390625, 0.02506256103515625, 0.0275115966796875, 0.02996063232421875, 0.03240966796875, 0.03485870361328125, 0.0373077392578125, 0.03975677490234375, 0.042205810546875, 0.04465484619140625, 0.0471038818359375, 0.04955291748046875, 0.052001953125, 0.05445098876953125, 0.0569000244140625, 0.05934906005859375, 0.061798095703125, 0.06424713134765625, 0.0666961669921875, 0.06914520263671875, 0.07159423828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 7.0, 8.0, 11.0, 16.0, 16.0, 16.0, 21.0, 32.0, 26.0, 41.0, 43.0, 56.0, 91.0, 128.0, 265.0, 651.0, 3801.0, 866813.0, 173457.0, 1763.0, 519.0, 216.0, 129.0, 77.0, 64.0, 59.0, 38.0, 48.0, 20.0, 20.0, 25.0, 16.0, 11.0, 8.0, 9.0, 4.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.24755859375, -0.2402477264404297, -0.23293685913085938, -0.22562599182128906, -0.21831512451171875, -0.21100425720214844, -0.20369338989257812, -0.1963825225830078, -0.1890716552734375, -0.1817607879638672, -0.17444992065429688, -0.16713905334472656, -0.15982818603515625, -0.15251731872558594, -0.14520645141601562, -0.1378955841064453, -0.130584716796875, -0.12327384948730469, -0.11596298217773438, -0.10865211486816406, -0.10134124755859375, -0.09403038024902344, -0.08671951293945312, -0.07940864562988281, -0.0720977783203125, -0.06478691101074219, -0.057476043701171875, -0.05016517639160156, -0.04285430908203125, -0.03554344177246094, -0.028232574462890625, -0.020921707153320312, -0.01361083984375, -0.0062999725341796875, 0.001010894775390625, 0.008321762084960938, 0.01563262939453125, 0.022943496704101562, 0.030254364013671875, 0.03756523132324219, 0.0448760986328125, 0.05218696594238281, 0.059497833251953125, 0.06680870056152344, 0.07411956787109375, 0.08143043518066406, 0.08874130249023438, 0.09605216979980469, 0.103363037109375, 0.11067390441894531, 0.11798477172851562, 0.12529563903808594, 0.13260650634765625, 0.13991737365722656, 0.14722824096679688, 0.1545391082763672, 0.1618499755859375, 0.1691608428955078, 0.17647171020507812, 0.18378257751464844, 0.19109344482421875, 0.19840431213378906, 0.20571517944335938, 0.2130260467529297, 0.2203369140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 13.0, 16.0, 14.0, 14.0, 26.0, 17.0, 21.0, 23.0, 34.0, 33.0, 36.0, 32.0, 40.0, 52.0, 51.0, 54.0, 42.0, 45.0, 57.0, 47.0, 44.0, 45.0, 31.0, 34.0, 27.0, 23.0, 22.0, 20.0, 13.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.040172576904296875, -0.03896331787109375, -0.037754058837890625, -0.0365447998046875, -0.035335540771484375, -0.03412628173828125, -0.032917022705078125, -0.031707763671875, -0.030498504638671875, -0.02928924560546875, -0.028079986572265625, -0.0268707275390625, -0.025661468505859375, -0.02445220947265625, -0.023242950439453125, -0.02203369140625, -0.020824432373046875, -0.01961517333984375, -0.018405914306640625, -0.0171966552734375, -0.015987396240234375, -0.01477813720703125, -0.013568878173828125, -0.012359619140625, -0.011150360107421875, -0.00994110107421875, -0.008731842041015625, -0.0075225830078125, -0.006313323974609375, -0.00510406494140625, -0.003894805908203125, -0.002685546875, -0.001476287841796875, -0.00026702880859375, 0.000942230224609375, 0.0021514892578125, 0.003360748291015625, 0.00457000732421875, 0.005779266357421875, 0.006988525390625, 0.008197784423828125, 0.00940704345703125, 0.010616302490234375, 0.0118255615234375, 0.013034820556640625, 0.01424407958984375, 0.015453338623046875, 0.01666259765625, 0.017871856689453125, 0.01908111572265625, 0.020290374755859375, 0.0214996337890625, 0.022708892822265625, 0.02391815185546875, 0.025127410888671875, 0.026336669921875, 0.027545928955078125, 0.02875518798828125, 0.029964447021484375, 0.0311737060546875, 0.032382965087890625, 0.03359222412109375, 0.034801483154296875, 0.0360107421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 8.0, 10.0, 20.0, 18.0, 27.0, 24.0, 43.0, 75.0, 123.0, 246.0, 488.0, 1234.0, 4017.0, 26051.0, 929898.0, 76278.0, 6837.0, 1821.0, 631.0, 287.0, 146.0, 86.0, 44.0, 23.0, 17.0, 13.0, 14.0, 11.0, 8.0, 4.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0382080078125, -0.03707313537597656, -0.035938262939453125, -0.03480339050292969, -0.03366851806640625, -0.03253364562988281, -0.031398773193359375, -0.030263900756835938, -0.0291290283203125, -0.027994155883789062, -0.026859283447265625, -0.025724411010742188, -0.02458953857421875, -0.023454666137695312, -0.022319793701171875, -0.021184921264648438, -0.020050048828125, -0.018915176391601562, -0.017780303955078125, -0.016645431518554688, -0.01551055908203125, -0.014375686645507812, -0.013240814208984375, -0.012105941772460938, -0.0109710693359375, -0.009836196899414062, -0.008701324462890625, -0.0075664520263671875, -0.00643157958984375, -0.0052967071533203125, -0.004161834716796875, -0.0030269622802734375, -0.00189208984375, -0.0007572174072265625, 0.000377655029296875, 0.0015125274658203125, 0.00264739990234375, 0.0037822723388671875, 0.004917144775390625, 0.0060520172119140625, 0.0071868896484375, 0.008321762084960938, 0.009456634521484375, 0.010591506958007812, 0.01172637939453125, 0.012861251831054688, 0.013996124267578125, 0.015130996704101562, 0.016265869140625, 0.017400741577148438, 0.018535614013671875, 0.019670486450195312, 0.02080535888671875, 0.021940231323242188, 0.023075103759765625, 0.024209976196289062, 0.0253448486328125, 0.026479721069335938, 0.027614593505859375, 0.028749465942382812, 0.02988433837890625, 0.031019210815429688, 0.032154083251953125, 0.03328895568847656, 0.034423828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 1.0, 4.0, 10.0, 4.0, 4.0, 12.0, 10.0, 16.0, 17.0, 22.0, 23.0, 34.0, 50.0, 45.0, 73.0, 81.0, 106.0, 108.0, 74.0, 54.0, 43.0, 46.0, 35.0, 21.0, 20.0, 16.0, 10.0, 13.0, 11.0, 9.0, 10.0, 2.0, 4.0, 3.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.086992263793945e-05, -6.801262497901917e-05, -6.515532732009888e-05, -6.229802966117859e-05, -5.94407320022583e-05, -5.658343434333801e-05, -5.3726136684417725e-05, -5.0868839025497437e-05, -4.801154136657715e-05, -4.515424370765686e-05, -4.229694604873657e-05, -3.9439648389816284e-05, -3.6582350730895996e-05, -3.372505307197571e-05, -3.086775541305542e-05, -2.8010457754135132e-05, -2.5153160095214844e-05, -2.2295862436294556e-05, -1.9438564777374268e-05, -1.658126711845398e-05, -1.3723969459533691e-05, -1.0866671800613403e-05, -8.009374141693115e-06, -5.152076482772827e-06, -2.294778823852539e-06, 5.62518835067749e-07, 3.419816493988037e-06, 6.277114152908325e-06, 9.134411811828613e-06, 1.1991709470748901e-05, 1.484900712966919e-05, 1.7706304788589478e-05, 2.0563602447509766e-05, 2.3420900106430054e-05, 2.6278197765350342e-05, 2.913549542427063e-05, 3.199279308319092e-05, 3.4850090742111206e-05, 3.7707388401031494e-05, 4.056468605995178e-05, 4.342198371887207e-05, 4.627928137779236e-05, 4.9136579036712646e-05, 5.1993876695632935e-05, 5.485117435455322e-05, 5.770847201347351e-05, 6.05657696723938e-05, 6.342306733131409e-05, 6.628036499023438e-05, 6.913766264915466e-05, 7.199496030807495e-05, 7.485225796699524e-05, 7.770955562591553e-05, 8.056685328483582e-05, 8.34241509437561e-05, 8.628144860267639e-05, 8.913874626159668e-05, 9.199604392051697e-05, 9.485334157943726e-05, 9.771063923835754e-05, 0.00010056793689727783, 0.00010342523455619812, 0.00010628253221511841, 0.0001091398298740387, 0.00011199712753295898]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 1.0, 7.0, 5.0, 15.0, 14.0, 28.0, 39.0, 51.0, 65.0, 115.0, 548.0, 27765.0, 1016880.0, 2502.0, 226.0, 78.0, 45.0, 37.0, 27.0, 19.0, 25.0, 9.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04498291015625, -0.04363059997558594, -0.042278289794921875, -0.04092597961425781, -0.03957366943359375, -0.03822135925292969, -0.036869049072265625, -0.03551673889160156, -0.0341644287109375, -0.03281211853027344, -0.031459808349609375, -0.030107498168945312, -0.02875518798828125, -0.027402877807617188, -0.026050567626953125, -0.024698257446289062, -0.023345947265625, -0.021993637084960938, -0.020641326904296875, -0.019289016723632812, -0.01793670654296875, -0.016584396362304688, -0.015232086181640625, -0.013879776000976562, -0.0125274658203125, -0.011175155639648438, -0.009822845458984375, -0.008470535278320312, -0.00711822509765625, -0.0057659149169921875, -0.004413604736328125, -0.0030612945556640625, -0.001708984375, -0.0003566741943359375, 0.000995635986328125, 0.0023479461669921875, 0.00370025634765625, 0.0050525665283203125, 0.006404876708984375, 0.0077571868896484375, 0.0091094970703125, 0.010461807250976562, 0.011814117431640625, 0.013166427612304688, 0.01451873779296875, 0.015871047973632812, 0.017223358154296875, 0.018575668334960938, 0.019927978515625, 0.021280288696289062, 0.022632598876953125, 0.023984909057617188, 0.02533721923828125, 0.026689529418945312, 0.028041839599609375, 0.029394149780273438, 0.0307464599609375, 0.03209877014160156, 0.033451080322265625, 0.03480339050292969, 0.03615570068359375, 0.03750801086425781, 0.038860321044921875, 0.04021263122558594, 0.04156494140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 2.0, 6.0, 5.0, 13.0, 15.0, 24.0, 37.0, 51.0, 49.0, 56.0, 77.0, 107.0, 126.0, 96.0, 82.0, 55.0, 41.0, 35.0, 21.0, 21.0, 24.0, 7.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00722503662109375, -0.007008254528045654, -0.006791472434997559, -0.006574690341949463, -0.006357908248901367, -0.0061411261558532715, -0.005924344062805176, -0.00570756196975708, -0.005490779876708984, -0.005273997783660889, -0.005057215690612793, -0.004840433597564697, -0.0046236515045166016, -0.004406869411468506, -0.00419008731842041, -0.0039733052253723145, -0.0037565231323242188, -0.003539741039276123, -0.0033229589462280273, -0.0031061768531799316, -0.002889394760131836, -0.0026726126670837402, -0.0024558305740356445, -0.002239048480987549, -0.002022266387939453, -0.0018054842948913574, -0.0015887022018432617, -0.001371920108795166, -0.0011551380157470703, -0.0009383559226989746, -0.0007215738296508789, -0.0005047917366027832, -0.0002880096435546875, -7.12275505065918e-05, 0.0001455545425415039, 0.0003623366355895996, 0.0005791187286376953, 0.000795900821685791, 0.0010126829147338867, 0.0012294650077819824, 0.0014462471008300781, 0.0016630291938781738, 0.0018798112869262695, 0.0020965933799743652, 0.002313375473022461, 0.0025301575660705566, 0.0027469396591186523, 0.002963721752166748, 0.0031805038452148438, 0.0033972859382629395, 0.003614068031311035, 0.003830850124359131, 0.0040476322174072266, 0.004264414310455322, 0.004481196403503418, 0.004697978496551514, 0.004914760589599609, 0.005131542682647705, 0.005348324775695801, 0.0055651068687438965, 0.005781888961791992, 0.005998671054840088, 0.006215453147888184, 0.006432235240936279, 0.006649017333984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 45.0, 841.0, 106.0, 12.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0873236656188965, -1.0519155263900757, -1.0165073871612549, -0.9810993075370789, -0.9456911683082581, -0.9102830290794373, -0.8748749494552612, -0.8394668102264404, -0.8040586709976196, -0.7686505317687988, -0.733242392539978, -0.697834312915802, -0.6624261736869812, -0.6270180344581604, -0.5916099548339844, -0.5562018156051636, -0.5207936763763428, -0.485385537147522, -0.44997742772102356, -0.41456931829452515, -0.37916117906570435, -0.34375303983688354, -0.30834493041038513, -0.2729368209838867, -0.23752868175506592, -0.2021205574274063, -0.1667124330997467, -0.1313043087720871, -0.09589618444442749, -0.06048806011676788, -0.025079935789108276, 0.01032818853855133, 0.04573643207550049, 0.0811445564031601, 0.1165526807308197, 0.1519608050584793, 0.18736892938613892, 0.22277705371379852, 0.25818517804145813, 0.29359328746795654, 0.32900142669677734, 0.36440956592559814, 0.39981767535209656, 0.43522578477859497, 0.47063392400741577, 0.5060420632362366, 0.5414501428604126, 0.5768582820892334, 0.6122664213180542, 0.647674560546875, 0.6830826997756958, 0.7184907793998718, 0.7538989186286926, 0.7893070578575134, 0.8247151374816895, 0.8601232767105103, 0.895531415939331, 0.9309395551681519, 0.9663476943969727, 1.0017558336257935, 1.0371639728546143, 1.0725719928741455, 1.1079801321029663, 1.143388271331787, 1.178796410560608]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 12.0, 19.0, 23.0, 28.0, 35.0, 55.0, 81.0, 81.0, 104.0, 111.0, 96.0, 89.0, 85.0, 63.0, 51.0, 33.0, 10.0, 10.0, 10.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27862876653671265, -0.2688198685646057, -0.25901100039482117, -0.24920211732387543, -0.2393932342529297, -0.22958433628082275, -0.21977545320987701, -0.20996657013893127, -0.20015768706798553, -0.1903488039970398, -0.18053992092609406, -0.17073103785514832, -0.16092213988304138, -0.15111327171325684, -0.1413043737411499, -0.13149549067020416, -0.12168660759925842, -0.11187772452831268, -0.10206884145736694, -0.0922599509358406, -0.08245106786489487, -0.07264218479394913, -0.06283329427242279, -0.05302441120147705, -0.04321552813053131, -0.03340664505958557, -0.023597758263349533, -0.013788873329758644, -0.003979988396167755, 0.005828894674777985, 0.015637781471014023, 0.02544666826725006, 0.0352555513381958, 0.04506443440914154, 0.05487332120537758, 0.06468220800161362, 0.07449109107255936, 0.0842999741435051, 0.09410886466503143, 0.10391774773597717, 0.11372663080692291, 0.12353551387786865, 0.1333443969488144, 0.14315328001976013, 0.15296217799186707, 0.1627710461616516, 0.17257994413375854, 0.18238882720470428, 0.19219771027565002, 0.20200659334659576, 0.2118154764175415, 0.22162435948848724, 0.23143324255943298, 0.24124214053153992, 0.25105100870132446, 0.2608599066734314, 0.27066880464553833, 0.28047770261764526, 0.2902865707874298, 0.30009546875953674, 0.3099043369293213, 0.3197132349014282, 0.32952210307121277, 0.3393310010433197, 0.34913986921310425]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 9.0, 22.0, 38.0, 105.0, 460.0, 92433.0, 4100118.0, 774.0, 181.0, 68.0, 28.0, 14.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.43389892578125, -0.4207763671875, -0.40765380859375, -0.39453125, -0.38140869140625, -0.3682861328125, -0.35516357421875, -0.342041015625, -0.32891845703125, -0.3157958984375, -0.30267333984375, -0.28955078125, -0.27642822265625, -0.2633056640625, -0.25018310546875, -0.237060546875, -0.22393798828125, -0.2108154296875, -0.19769287109375, -0.1845703125, -0.17144775390625, -0.1583251953125, -0.14520263671875, -0.132080078125, -0.11895751953125, -0.1058349609375, -0.09271240234375, -0.07958984375, -0.06646728515625, -0.0533447265625, -0.04022216796875, -0.027099609375, -0.01397705078125, -0.0008544921875, 0.01226806640625, 0.025390625, 0.03851318359375, 0.0516357421875, 0.06475830078125, 0.077880859375, 0.09100341796875, 0.1041259765625, 0.11724853515625, 0.13037109375, 0.14349365234375, 0.1566162109375, 0.16973876953125, 0.182861328125, 0.19598388671875, 0.2091064453125, 0.22222900390625, 0.2353515625, 0.24847412109375, 0.2615966796875, 0.27471923828125, 0.287841796875, 0.30096435546875, 0.3140869140625, 0.32720947265625, 0.34033203125, 0.35345458984375, 0.3665771484375, 0.37969970703125, 0.392822265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 66.0, 250.0, 491.0, 140.0, 30.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07952880859375, -0.07721328735351562, -0.07489776611328125, -0.07258224487304688, -0.0702667236328125, -0.06795120239257812, -0.06563568115234375, -0.06332015991210938, -0.061004638671875, -0.058689117431640625, -0.05637359619140625, -0.054058074951171875, -0.0517425537109375, -0.049427032470703125, -0.04711151123046875, -0.044795989990234375, -0.04248046875, -0.040164947509765625, -0.03784942626953125, -0.035533905029296875, -0.0332183837890625, -0.030902862548828125, -0.02858734130859375, -0.026271820068359375, -0.023956298828125, -0.021640777587890625, -0.01932525634765625, -0.017009735107421875, -0.0146942138671875, -0.012378692626953125, -0.01006317138671875, -0.007747650146484375, -0.00543212890625, -0.003116607666015625, -0.00080108642578125, 0.001514434814453125, 0.0038299560546875, 0.006145477294921875, 0.00846099853515625, 0.010776519775390625, 0.013092041015625, 0.015407562255859375, 0.01772308349609375, 0.020038604736328125, 0.0223541259765625, 0.024669647216796875, 0.02698516845703125, 0.029300689697265625, 0.0316162109375, 0.033931732177734375, 0.03624725341796875, 0.038562774658203125, 0.0408782958984375, 0.043193817138671875, 0.04550933837890625, 0.047824859619140625, 0.050140380859375, 0.052455902099609375, 0.05477142333984375, 0.057086944580078125, 0.0594024658203125, 0.061717987060546875, 0.06403350830078125, 0.06634902954101562, 0.06866455078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 10.0, 14.0, 18.0, 28.0, 32.0, 45.0, 78.0, 131.0, 205.0, 341.0, 767.0, 2001.0, 8505.0, 93442.0, 3876830.0, 194966.0, 12529.0, 2470.0, 802.0, 388.0, 230.0, 124.0, 77.0, 73.0, 45.0, 21.0, 15.0, 20.0, 14.0, 5.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.061309814453125, -0.059369564056396484, -0.05742931365966797, -0.05548906326293945, -0.05354881286621094, -0.05160856246948242, -0.049668312072753906, -0.04772806167602539, -0.045787811279296875, -0.04384756088256836, -0.041907310485839844, -0.03996706008911133, -0.03802680969238281, -0.0360865592956543, -0.03414630889892578, -0.032206058502197266, -0.03026580810546875, -0.028325557708740234, -0.02638530731201172, -0.024445056915283203, -0.022504806518554688, -0.020564556121826172, -0.018624305725097656, -0.01668405532836914, -0.014743804931640625, -0.01280355453491211, -0.010863304138183594, -0.008923053741455078, -0.0069828033447265625, -0.005042552947998047, -0.0031023025512695312, -0.0011620521545410156, 0.0007781982421875, 0.0027184486389160156, 0.004658699035644531, 0.006598949432373047, 0.008539199829101562, 0.010479450225830078, 0.012419700622558594, 0.01435995101928711, 0.016300201416015625, 0.01824045181274414, 0.020180702209472656, 0.022120952606201172, 0.024061203002929688, 0.026001453399658203, 0.02794170379638672, 0.029881954193115234, 0.03182220458984375, 0.033762454986572266, 0.03570270538330078, 0.0376429557800293, 0.03958320617675781, 0.04152345657348633, 0.043463706970214844, 0.04540395736694336, 0.047344207763671875, 0.04928445816040039, 0.051224708557128906, 0.05316495895385742, 0.05510520935058594, 0.05704545974731445, 0.05898571014404297, 0.060925960540771484, 0.0628662109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 13.0, 10.0, 11.0, 21.0, 29.0, 48.0, 58.0, 74.0, 118.0, 149.0, 296.0, 420.0, 628.0, 748.0, 470.0, 274.0, 185.0, 110.0, 105.0, 72.0, 46.0, 41.0, 35.0, 19.0, 17.0, 10.0, 14.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0232086181640625, -0.022531509399414062, -0.021854400634765625, -0.021177291870117188, -0.02050018310546875, -0.019823074340820312, -0.019145965576171875, -0.018468856811523438, -0.017791748046875, -0.017114639282226562, -0.016437530517578125, -0.015760421752929688, -0.01508331298828125, -0.014406204223632812, -0.013729095458984375, -0.013051986694335938, -0.0123748779296875, -0.011697769165039062, -0.011020660400390625, -0.010343551635742188, -0.00966644287109375, -0.008989334106445312, -0.008312225341796875, -0.0076351165771484375, -0.0069580078125, -0.0062808990478515625, -0.005603790283203125, -0.0049266815185546875, -0.00424957275390625, -0.0035724639892578125, -0.002895355224609375, -0.0022182464599609375, -0.0015411376953125, -0.0008640289306640625, -0.000186920166015625, 0.0004901885986328125, 0.00116729736328125, 0.0018444061279296875, 0.002521514892578125, 0.0031986236572265625, 0.003875732421875, 0.0045528411865234375, 0.005229949951171875, 0.0059070587158203125, 0.00658416748046875, 0.0072612762451171875, 0.007938385009765625, 0.008615493774414062, 0.0092926025390625, 0.009969711303710938, 0.010646820068359375, 0.011323928833007812, 0.01200103759765625, 0.012678146362304688, 0.013355255126953125, 0.014032363891601562, 0.01470947265625, 0.015386581420898438, 0.016063690185546875, 0.016740798950195312, 0.01741790771484375, 0.018095016479492188, 0.018772125244140625, 0.019449234008789062, 0.0201263427734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 33.0, 909.0, 62.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9128276705741882, -0.8871968388557434, -0.8615660071372986, -0.8359351754188538, -0.8103043437004089, -0.7846734523773193, -0.7590426206588745, -0.7334117889404297, -0.7077809572219849, -0.68215012550354, -0.6565192937850952, -0.6308884620666504, -0.6052576303482056, -0.5796267986297607, -0.5539959669113159, -0.5283650755882263, -0.5027343034744263, -0.47710347175598145, -0.4514726400375366, -0.4258418083190918, -0.4002109467983246, -0.37458011507987976, -0.34894928336143494, -0.3233184218406677, -0.2976875901222229, -0.2720567584037781, -0.24642591178417206, -0.22079508006572723, -0.19516423344612122, -0.1695334017276764, -0.14390257000923157, -0.11827172338962555, -0.09264087677001953, -0.06701003760099411, -0.04137920215725899, -0.015748366713523865, 0.009882472455501556, 0.03551331162452698, 0.0611441433429718, 0.08677498996257782, 0.11240582168102264, 0.13803665339946747, 0.1636675000190735, 0.1892983317375183, 0.21492916345596313, 0.24056001007556915, 0.2661908268928528, 0.29182168841362, 0.3174525201320648, 0.34308335185050964, 0.36871418356895447, 0.3943450450897217, 0.4199758768081665, 0.44560670852661133, 0.47123754024505615, 0.496868371963501, 0.5224992036819458, 0.5481300354003906, 0.5737608671188354, 0.5993916988372803, 0.6250225305557251, 0.6506533622741699, 0.6762841939926147, 0.7019150853157043, 0.7275459170341492]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 15.0, 15.0, 15.0, 29.0, 36.0, 47.0, 67.0, 83.0, 90.0, 63.0, 95.0, 85.0, 70.0, 67.0, 52.0, 44.0, 42.0, 16.0, 19.0, 15.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10208785533905029, -0.09830343723297119, -0.09451901912689209, -0.09073460102081299, -0.08695018291473389, -0.08316576480865479, -0.07938135415315628, -0.07559693604707718, -0.07181251794099808, -0.06802809983491898, -0.06424368172883987, -0.06045926734805107, -0.05667484924197197, -0.05289043113589287, -0.049106016755104065, -0.04532159864902496, -0.04153718054294586, -0.03775276243686676, -0.03396834433078766, -0.030183929949998856, -0.026399511843919754, -0.022615093737840652, -0.0188306774944067, -0.015046261250972748, -0.011261843144893646, -0.007477425970137119, -0.0036930087953805923, 9.14083793759346e-05, 0.0038758255541324615, 0.007660243660211563, 0.011444659903645515, 0.015229076147079468, 0.01901349425315857, 0.02279791235923767, 0.026582328602671623, 0.030366744846105576, 0.03415116295218468, 0.03793558105826378, 0.04171999543905258, 0.04550441354513168, 0.049288831651210785, 0.053073249757289886, 0.05685766786336899, 0.06064208224415779, 0.0644264966249466, 0.0682109147310257, 0.0719953328371048, 0.0757797509431839, 0.079564169049263, 0.0833485871553421, 0.0871330052614212, 0.0909174233675003, 0.0947018414735794, 0.09848625957965851, 0.10227067023515701, 0.10605508834123611, 0.10983950644731522, 0.11362392455339432, 0.11740834265947342, 0.12119276076555252, 0.12497717142105103, 0.12876158952713013, 0.13254600763320923, 0.13633042573928833, 0.14011484384536743]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 13.0, 9.0, 17.0, 19.0, 17.0, 21.0, 31.0, 36.0, 47.0, 65.0, 81.0, 116.0, 158.0, 217.0, 338.0, 596.0, 1404.0, 7648.0, 885982.0, 144987.0, 4071.0, 1074.0, 508.0, 282.0, 189.0, 146.0, 109.0, 74.0, 63.0, 48.0, 33.0, 35.0, 18.0, 16.0, 14.0, 15.0, 13.0, 5.0, 7.0, 4.0, 6.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.303955078125, -0.2949790954589844, -0.28600311279296875, -0.2770271301269531, -0.2680511474609375, -0.2590751647949219, -0.25009918212890625, -0.24112319946289062, -0.232147216796875, -0.22317123413085938, -0.21419525146484375, -0.20521926879882812, -0.1962432861328125, -0.18726730346679688, -0.17829132080078125, -0.16931533813476562, -0.16033935546875, -0.15136337280273438, -0.14238739013671875, -0.13341140747070312, -0.1244354248046875, -0.11545944213867188, -0.10648345947265625, -0.09750747680664062, -0.088531494140625, -0.07955551147460938, -0.07057952880859375, -0.061603546142578125, -0.0526275634765625, -0.043651580810546875, -0.03467559814453125, -0.025699615478515625, -0.0167236328125, -0.007747650146484375, 0.00122833251953125, 0.010204315185546875, 0.0191802978515625, 0.028156280517578125, 0.03713226318359375, 0.046108245849609375, 0.055084228515625, 0.06406021118164062, 0.07303619384765625, 0.08201217651367188, 0.0909881591796875, 0.09996414184570312, 0.10894012451171875, 0.11791610717773438, 0.12689208984375, 0.13586807250976562, 0.14484405517578125, 0.15382003784179688, 0.1627960205078125, 0.17177200317382812, 0.18074798583984375, 0.18972396850585938, 0.198699951171875, 0.20767593383789062, 0.21665191650390625, 0.22562789916992188, 0.2346038818359375, 0.24357986450195312, 0.25255584716796875, 0.2615318298339844, 0.2705078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 61.0, 245.0, 481.0, 164.0, 29.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07940673828125, -0.07709980010986328, -0.07479286193847656, -0.07248592376708984, -0.07017898559570312, -0.0678720474243164, -0.06556510925292969, -0.06325817108154297, -0.06095123291015625, -0.05864429473876953, -0.05633735656738281, -0.054030418395996094, -0.051723480224609375, -0.049416542053222656, -0.04710960388183594, -0.04480266571044922, -0.0424957275390625, -0.04018878936767578, -0.03788185119628906, -0.035574913024902344, -0.033267974853515625, -0.030961036682128906, -0.028654098510742188, -0.02634716033935547, -0.02404022216796875, -0.02173328399658203, -0.019426345825195312, -0.017119407653808594, -0.014812469482421875, -0.012505531311035156, -0.010198593139648438, -0.007891654968261719, -0.005584716796875, -0.0032777786254882812, -0.0009708404541015625, 0.0013360977172851562, 0.003643035888671875, 0.005949974060058594, 0.008256912231445312, 0.010563850402832031, 0.01287078857421875, 0.015177726745605469, 0.017484664916992188, 0.019791603088378906, 0.022098541259765625, 0.024405479431152344, 0.026712417602539062, 0.02901935577392578, 0.0313262939453125, 0.03363323211669922, 0.03594017028808594, 0.038247108459472656, 0.040554046630859375, 0.042860984802246094, 0.04516792297363281, 0.04747486114501953, 0.04978179931640625, 0.05208873748779297, 0.05439567565917969, 0.056702613830566406, 0.059009552001953125, 0.061316490173339844, 0.06362342834472656, 0.06593036651611328, 0.0682373046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 13.0, 9.0, 14.0, 15.0, 24.0, 44.0, 47.0, 64.0, 119.0, 162.0, 242.0, 435.0, 1039.0, 5065.0, 102889.0, 915724.0, 18672.0, 2223.0, 701.0, 363.0, 199.0, 129.0, 88.0, 57.0, 51.0, 36.0, 24.0, 17.0, 11.0, 15.0, 8.0, 4.0, 3.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2166748046875, -0.21035194396972656, -0.20402908325195312, -0.1977062225341797, -0.19138336181640625, -0.1850605010986328, -0.17873764038085938, -0.17241477966308594, -0.1660919189453125, -0.15976905822753906, -0.15344619750976562, -0.1471233367919922, -0.14080047607421875, -0.1344776153564453, -0.12815475463867188, -0.12183189392089844, -0.115509033203125, -0.10918617248535156, -0.10286331176757812, -0.09654045104980469, -0.09021759033203125, -0.08389472961425781, -0.07757186889648438, -0.07124900817871094, -0.0649261474609375, -0.05860328674316406, -0.052280426025390625, -0.04595756530761719, -0.03963470458984375, -0.03331184387207031, -0.026988983154296875, -0.020666122436523438, -0.01434326171875, -0.008020401000976562, -0.001697540283203125, 0.0046253204345703125, 0.01094818115234375, 0.017271041870117188, 0.023593902587890625, 0.029916763305664062, 0.0362396240234375, 0.04256248474121094, 0.048885345458984375, 0.05520820617675781, 0.06153106689453125, 0.06785392761230469, 0.07417678833007812, 0.08049964904785156, 0.086822509765625, 0.09314537048339844, 0.09946823120117188, 0.10579109191894531, 0.11211395263671875, 0.11843681335449219, 0.12475967407226562, 0.13108253479003906, 0.1374053955078125, 0.14372825622558594, 0.15005111694335938, 0.1563739776611328, 0.16269683837890625, 0.1690196990966797, 0.17534255981445312, 0.18166542053222656, 0.18798828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 11.0, 7.0, 9.0, 34.0, 32.0, 40.0, 53.0, 71.0, 82.0, 78.0, 102.0, 82.0, 74.0, 74.0, 49.0, 42.0, 28.0, 25.0, 22.0, 14.0, 12.0, 12.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055694580078125, -0.053815364837646484, -0.05193614959716797, -0.05005693435668945, -0.04817771911621094, -0.04629850387573242, -0.044419288635253906, -0.04254007339477539, -0.040660858154296875, -0.03878164291381836, -0.036902427673339844, -0.03502321243286133, -0.03314399719238281, -0.0312647819519043, -0.02938556671142578, -0.027506351470947266, -0.02562713623046875, -0.023747920989990234, -0.02186870574951172, -0.019989490509033203, -0.018110275268554688, -0.016231060028076172, -0.014351844787597656, -0.01247262954711914, -0.010593414306640625, -0.00871419906616211, -0.006834983825683594, -0.004955768585205078, -0.0030765533447265625, -0.0011973381042480469, 0.0006818771362304688, 0.0025610923767089844, 0.0044403076171875, 0.006319522857666016, 0.008198738098144531, 0.010077953338623047, 0.011957168579101562, 0.013836383819580078, 0.015715599060058594, 0.01759481430053711, 0.019474029541015625, 0.02135324478149414, 0.023232460021972656, 0.025111675262451172, 0.026990890502929688, 0.028870105743408203, 0.03074932098388672, 0.032628536224365234, 0.03450775146484375, 0.036386966705322266, 0.03826618194580078, 0.0401453971862793, 0.04202461242675781, 0.04390382766723633, 0.045783042907714844, 0.04766225814819336, 0.049541473388671875, 0.05142068862915039, 0.053299903869628906, 0.05517911911010742, 0.05705833435058594, 0.05893754959106445, 0.06081676483154297, 0.06269598007202148, 0.0645751953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 12.0, 17.0, 37.0, 56.0, 114.0, 210.0, 476.0, 1138.0, 3117.0, 11576.0, 881010.0, 138055.0, 8414.0, 2461.0, 935.0, 439.0, 206.0, 121.0, 51.0, 25.0, 26.0, 14.0, 10.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14318466186523438, -0.13805389404296875, -0.13292312622070312, -0.1277923583984375, -0.12266159057617188, -0.11753082275390625, -0.11240005493164062, -0.107269287109375, -0.10213851928710938, -0.09700775146484375, -0.09187698364257812, -0.0867462158203125, -0.08161544799804688, -0.07648468017578125, -0.07135391235351562, -0.06622314453125, -0.061092376708984375, -0.05596160888671875, -0.050830841064453125, -0.0457000732421875, -0.040569305419921875, -0.03543853759765625, -0.030307769775390625, -0.025177001953125, -0.020046234130859375, -0.01491546630859375, -0.009784698486328125, -0.0046539306640625, 0.000476837158203125, 0.00560760498046875, 0.010738372802734375, 0.015869140625, 0.020999908447265625, 0.02613067626953125, 0.031261444091796875, 0.0363922119140625, 0.041522979736328125, 0.04665374755859375, 0.051784515380859375, 0.056915283203125, 0.062046051025390625, 0.06717681884765625, 0.07230758666992188, 0.0774383544921875, 0.08256912231445312, 0.08769989013671875, 0.09283065795898438, 0.09796142578125, 0.10309219360351562, 0.10822296142578125, 0.11335372924804688, 0.1184844970703125, 0.12361526489257812, 0.12874603271484375, 0.13387680053710938, 0.139007568359375, 0.14413833618164062, 0.14926910400390625, 0.15439987182617188, 0.1595306396484375, 0.16466140747070312, 0.16979217529296875, 0.17492294311523438, 0.1800537109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 5.0, 8.0, 5.0, 7.0, 11.0, 17.0, 25.0, 41.0, 67.0, 135.0, 152.0, 183.0, 125.0, 69.0, 31.0, 21.0, 20.0, 13.0, 12.0, 4.0, 4.0, 6.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021266937255859375, -0.00020641088485717773, -0.00020015239715576172, -0.0001938939094543457, -0.0001876354217529297, -0.00018137693405151367, -0.00017511844635009766, -0.00016885995864868164, -0.00016260147094726562, -0.0001563429832458496, -0.0001500844955444336, -0.00014382600784301758, -0.00013756752014160156, -0.00013130903244018555, -0.00012505054473876953, -0.00011879205703735352, -0.0001125335693359375, -0.00010627508163452148, -0.00010001659393310547, -9.375810623168945e-05, -8.749961853027344e-05, -8.124113082885742e-05, -7.49826431274414e-05, -6.872415542602539e-05, -6.246566772460938e-05, -5.620718002319336e-05, -4.9948692321777344e-05, -4.369020462036133e-05, -3.743171691894531e-05, -3.11732292175293e-05, -2.491474151611328e-05, -1.8656253814697266e-05, -1.239776611328125e-05, -6.139278411865234e-06, 1.1920928955078125e-07, 6.377696990966797e-06, 1.2636184692382812e-05, 1.8894672393798828e-05, 2.5153160095214844e-05, 3.141164779663086e-05, 3.7670135498046875e-05, 4.392862319946289e-05, 5.0187110900878906e-05, 5.644559860229492e-05, 6.270408630371094e-05, 6.896257400512695e-05, 7.522106170654297e-05, 8.147954940795898e-05, 8.7738037109375e-05, 9.399652481079102e-05, 0.00010025501251220703, 0.00010651350021362305, 0.00011277198791503906, 0.00011903047561645508, 0.0001252889633178711, 0.0001315474510192871, 0.00013780593872070312, 0.00014406442642211914, 0.00015032291412353516, 0.00015658140182495117, 0.0001628398895263672, 0.0001690983772277832, 0.00017535686492919922, 0.00018161535263061523, 0.00018787384033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 13.0, 17.0, 15.0, 30.0, 35.0, 66.0, 128.0, 355.0, 1164.0, 5463.0, 426027.0, 607688.0, 5639.0, 1138.0, 368.0, 166.0, 66.0, 44.0, 28.0, 21.0, 11.0, 9.0, 7.0, 10.0, 5.0, 1.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.13186931610107422, -0.12787437438964844, -0.12387943267822266, -0.11988449096679688, -0.1158895492553711, -0.11189460754394531, -0.10789966583251953, -0.10390472412109375, -0.09990978240966797, -0.09591484069824219, -0.0919198989868164, -0.08792495727539062, -0.08393001556396484, -0.07993507385253906, -0.07594013214111328, -0.0719451904296875, -0.06795024871826172, -0.06395530700683594, -0.059960365295410156, -0.055965423583984375, -0.051970481872558594, -0.04797554016113281, -0.04398059844970703, -0.03998565673828125, -0.03599071502685547, -0.03199577331542969, -0.028000831604003906, -0.024005889892578125, -0.020010948181152344, -0.016016006469726562, -0.012021064758300781, -0.008026123046875, -0.004031181335449219, -3.62396240234375e-05, 0.003958702087402344, 0.007953643798828125, 0.011948585510253906, 0.015943527221679688, 0.01993846893310547, 0.02393341064453125, 0.02792835235595703, 0.03192329406738281, 0.035918235778808594, 0.039913177490234375, 0.043908119201660156, 0.04790306091308594, 0.05189800262451172, 0.0558929443359375, 0.05988788604736328, 0.06388282775878906, 0.06787776947021484, 0.07187271118164062, 0.0758676528930664, 0.07986259460449219, 0.08385753631591797, 0.08785247802734375, 0.09184741973876953, 0.09584236145019531, 0.0998373031616211, 0.10383224487304688, 0.10782718658447266, 0.11182212829589844, 0.11581707000732422, 0.11981201171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 16.0, 14.0, 32.0, 53.0, 208.0, 400.0, 143.0, 39.0, 23.0, 18.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.04864501953125, -0.04747152328491211, -0.04629802703857422, -0.04512453079223633, -0.04395103454589844, -0.04277753829956055, -0.041604042053222656, -0.040430545806884766, -0.039257049560546875, -0.038083553314208984, -0.036910057067871094, -0.0357365608215332, -0.03456306457519531, -0.03338956832885742, -0.03221607208251953, -0.03104257583618164, -0.02986907958984375, -0.02869558334350586, -0.02752208709716797, -0.026348590850830078, -0.025175094604492188, -0.024001598358154297, -0.022828102111816406, -0.021654605865478516, -0.020481109619140625, -0.019307613372802734, -0.018134117126464844, -0.016960620880126953, -0.015787124633789062, -0.014613628387451172, -0.013440132141113281, -0.01226663589477539, -0.0110931396484375, -0.00991964340209961, -0.008746147155761719, -0.007572650909423828, -0.0063991546630859375, -0.005225658416748047, -0.004052162170410156, -0.0028786659240722656, -0.001705169677734375, -0.0005316734313964844, 0.0006418228149414062, 0.0018153190612792969, 0.0029888153076171875, 0.004162311553955078, 0.005335807800292969, 0.006509304046630859, 0.00768280029296875, 0.00885629653930664, 0.010029792785644531, 0.011203289031982422, 0.012376785278320312, 0.013550281524658203, 0.014723777770996094, 0.015897274017333984, 0.017070770263671875, 0.018244266510009766, 0.019417762756347656, 0.020591259002685547, 0.021764755249023438, 0.022938251495361328, 0.02411174774169922, 0.02528524398803711, 0.026458740234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 35.0, 745.0, 220.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.697610855102539, -1.6559439897537231, -1.6142770051956177, -1.5726101398468018, -1.5309431552886963, -1.4892762899398804, -1.447609305381775, -1.405942440032959, -1.3642754554748535, -1.3226085901260376, -1.2809416055679321, -1.2392747402191162, -1.1976077556610107, -1.1559408903121948, -1.1142739057540894, -1.0726070404052734, -1.030940055847168, -0.9892731308937073, -0.9476062059402466, -0.9059392809867859, -0.8642723560333252, -0.8226054310798645, -0.7809385061264038, -0.7392716407775879, -0.697604775428772, -0.6559378504753113, -0.6142709255218506, -0.5726040005683899, -0.5309370756149292, -0.4892701506614685, -0.4476032555103302, -0.4059363305568695, -0.3642693758010864, -0.32260245084762573, -0.28093552589416504, -0.23926861584186554, -0.19760169088840485, -0.15593476593494415, -0.11426785588264465, -0.07260093092918396, -0.030934005975723267, 0.010732915252447128, 0.05239983648061752, 0.09406675398349762, 0.1357336789369583, 0.177400603890419, 0.2190675139427185, 0.2607344388961792, 0.3024013638496399, 0.3440682888031006, 0.3857352137565613, 0.427402138710022, 0.46906906366348267, 0.5107359886169434, 0.5524028539657593, 0.5940698385238647, 0.6357367038726807, 0.6774036288261414, 0.719070553779602, 0.7607374787330627, 0.8024044036865234, 0.8440713286399841, 0.8857382535934448, 0.9274051189422607, 0.9690721035003662]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 11.0, 6.0, 12.0, 11.0, 9.0, 17.0, 31.0, 19.0, 34.0, 35.0, 31.0, 46.0, 49.0, 40.0, 45.0, 48.0, 40.0, 51.0, 48.0, 59.0, 52.0, 48.0, 50.0, 35.0, 22.0, 32.0, 24.0, 21.0, 20.0, 15.0, 12.0, 13.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13452327251434326, -0.13065354526042938, -0.1267838180065155, -0.12291409075260162, -0.11904436349868774, -0.11517463624477386, -0.11130491644144058, -0.1074351891875267, -0.10356546193361282, -0.09969573467969894, -0.09582600742578506, -0.09195628017187119, -0.0880865603685379, -0.08421683311462402, -0.08034710586071014, -0.07647737860679626, -0.07260765135288239, -0.0687379240989685, -0.06486819684505463, -0.060998473316431046, -0.057128746062517166, -0.05325901880860329, -0.049389295279979706, -0.045519568026065826, -0.04164984077215195, -0.03778011351823807, -0.03391038626432419, -0.030040662735700607, -0.026170935481786728, -0.02230120822787285, -0.01843148283660412, -0.014561757445335388, -0.010692030191421509, -0.006822303868830204, -0.0029525775462388992, 0.0009171487763524055, 0.00478687509894371, 0.00865660235285759, 0.01252632774412632, 0.01639605313539505, 0.02026578038930893, 0.02413550764322281, 0.02800523303449154, 0.03187495842576027, 0.03574468567967415, 0.03961441293358803, 0.04348413646221161, 0.04735386371612549, 0.05122359097003937, 0.05509331822395325, 0.058963045477867126, 0.062832772731781, 0.06670249998569489, 0.07057222723960876, 0.07444194704294205, 0.07831167429685593, 0.0821814015507698, 0.08605112880468369, 0.08992085605859756, 0.09379058331251144, 0.09766030311584473, 0.1015300303697586, 0.10539975762367249, 0.10926948487758636, 0.11313921213150024]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 6.0, 8.0, 13.0, 28.0, 27.0, 44.0, 85.0, 157.0, 378.0, 2529.0, 11305.0, 4143417.0, 31615.0, 3164.0, 795.0, 300.0, 151.0, 91.0, 65.0, 31.0, 22.0, 15.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10597896575927734, -0.10130119323730469, -0.09662342071533203, -0.09194564819335938, -0.08726787567138672, -0.08259010314941406, -0.0779123306274414, -0.07323455810546875, -0.0685567855834961, -0.06387901306152344, -0.05920124053955078, -0.054523468017578125, -0.04984569549560547, -0.04516792297363281, -0.040490150451660156, -0.0358123779296875, -0.031134605407714844, -0.026456832885742188, -0.02177906036376953, -0.017101287841796875, -0.012423515319824219, -0.0077457427978515625, -0.0030679702758789062, 0.00160980224609375, 0.006287574768066406, 0.010965347290039062, 0.01564311981201172, 0.020320892333984375, 0.02499866485595703, 0.029676437377929688, 0.034354209899902344, 0.039031982421875, 0.043709754943847656, 0.04838752746582031, 0.05306529998779297, 0.057743072509765625, 0.06242084503173828, 0.06709861755371094, 0.0717763900756836, 0.07645416259765625, 0.0811319351196289, 0.08580970764160156, 0.09048748016357422, 0.09516525268554688, 0.09984302520751953, 0.10452079772949219, 0.10919857025146484, 0.1138763427734375, 0.11855411529541016, 0.12323188781738281, 0.12790966033935547, 0.13258743286132812, 0.13726520538330078, 0.14194297790527344, 0.1466207504272461, 0.15129852294921875, 0.1559762954711914, 0.16065406799316406, 0.16533184051513672, 0.17000961303710938, 0.17468738555908203, 0.1793651580810547, 0.18404293060302734, 0.188720703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 21.0, 133.0, 426.0, 314.0, 76.0, 21.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07568359375, -0.07345008850097656, -0.07121658325195312, -0.06898307800292969, -0.06674957275390625, -0.06451606750488281, -0.062282562255859375, -0.06004905700683594, -0.0578155517578125, -0.05558204650878906, -0.053348541259765625, -0.05111503601074219, -0.04888153076171875, -0.04664802551269531, -0.044414520263671875, -0.04218101501464844, -0.039947509765625, -0.03771400451660156, -0.035480499267578125, -0.03324699401855469, -0.03101348876953125, -0.028779983520507812, -0.026546478271484375, -0.024312973022460938, -0.0220794677734375, -0.019845962524414062, -0.017612457275390625, -0.015378952026367188, -0.01314544677734375, -0.010911941528320312, -0.008678436279296875, -0.0064449310302734375, -0.00421142578125, -0.0019779205322265625, 0.000255584716796875, 0.0024890899658203125, 0.00472259521484375, 0.0069561004638671875, 0.009189605712890625, 0.011423110961914062, 0.0136566162109375, 0.015890121459960938, 0.018123626708984375, 0.020357131958007812, 0.02259063720703125, 0.024824142456054688, 0.027057647705078125, 0.029291152954101562, 0.031524658203125, 0.03375816345214844, 0.035991668701171875, 0.03822517395019531, 0.04045867919921875, 0.04269218444824219, 0.044925689697265625, 0.04715919494628906, 0.0493927001953125, 0.05162620544433594, 0.053859710693359375, 0.05609321594238281, 0.05832672119140625, 0.06056022644042969, 0.06279373168945312, 0.06502723693847656, 0.0672607421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 20.0, 42.0, 61.0, 113.0, 174.0, 370.0, 890.0, 2974.0, 42384.0, 4027327.0, 113647.0, 4288.0, 1068.0, 427.0, 215.0, 92.0, 62.0, 35.0, 21.0, 10.0, 13.0, 8.0, 10.0, 3.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06265735626220703, -0.05988502502441406, -0.057112693786621094, -0.054340362548828125, -0.051568031311035156, -0.04879570007324219, -0.04602336883544922, -0.04325103759765625, -0.04047870635986328, -0.03770637512207031, -0.034934043884277344, -0.032161712646484375, -0.029389381408691406, -0.026617050170898438, -0.02384471893310547, -0.0210723876953125, -0.01830005645751953, -0.015527725219726562, -0.012755393981933594, -0.009983062744140625, -0.007210731506347656, -0.0044384002685546875, -0.0016660690307617188, 0.00110626220703125, 0.0038785934448242188, 0.0066509246826171875, 0.009423255920410156, 0.012195587158203125, 0.014967918395996094, 0.017740249633789062, 0.02051258087158203, 0.023284912109375, 0.02605724334716797, 0.028829574584960938, 0.031601905822753906, 0.034374237060546875, 0.037146568298339844, 0.03991889953613281, 0.04269123077392578, 0.04546356201171875, 0.04823589324951172, 0.05100822448730469, 0.053780555725097656, 0.056552886962890625, 0.059325218200683594, 0.06209754943847656, 0.06486988067626953, 0.0676422119140625, 0.07041454315185547, 0.07318687438964844, 0.0759592056274414, 0.07873153686523438, 0.08150386810302734, 0.08427619934082031, 0.08704853057861328, 0.08982086181640625, 0.09259319305419922, 0.09536552429199219, 0.09813785552978516, 0.10091018676757812, 0.1036825180053711, 0.10645484924316406, 0.10922718048095703, 0.11199951171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 14.0, 7.0, 13.0, 29.0, 42.0, 61.0, 93.0, 169.0, 243.0, 360.0, 663.0, 826.0, 529.0, 328.0, 253.0, 142.0, 94.0, 84.0, 33.0, 28.0, 19.0, 12.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045318603515625, -0.044165849685668945, -0.04301309585571289, -0.041860342025756836, -0.04070758819580078, -0.03955483436584473, -0.03840208053588867, -0.03724932670593262, -0.03609657287597656, -0.03494381904602051, -0.03379106521606445, -0.0326383113861084, -0.031485557556152344, -0.03033280372619629, -0.029180049896240234, -0.02802729606628418, -0.026874542236328125, -0.02572178840637207, -0.024569034576416016, -0.02341628074645996, -0.022263526916503906, -0.02111077308654785, -0.019958019256591797, -0.018805265426635742, -0.017652511596679688, -0.016499757766723633, -0.015347003936767578, -0.014194250106811523, -0.013041496276855469, -0.011888742446899414, -0.01073598861694336, -0.009583234786987305, -0.00843048095703125, -0.007277727127075195, -0.006124973297119141, -0.004972219467163086, -0.0038194656372070312, -0.0026667118072509766, -0.0015139579772949219, -0.0003612041473388672, 0.0007915496826171875, 0.0019443035125732422, 0.003097057342529297, 0.0042498111724853516, 0.005402565002441406, 0.006555318832397461, 0.007708072662353516, 0.00886082649230957, 0.010013580322265625, 0.01116633415222168, 0.012319087982177734, 0.013471841812133789, 0.014624595642089844, 0.0157773494720459, 0.016930103302001953, 0.018082857131958008, 0.019235610961914062, 0.020388364791870117, 0.021541118621826172, 0.022693872451782227, 0.02384662628173828, 0.024999380111694336, 0.02615213394165039, 0.027304887771606445, 0.0284576416015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 11.0, 52.0, 685.0, 251.0, 11.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6076231598854065, -0.5864946246147156, -0.5653660297393799, -0.544237494468689, -0.523108959197998, -0.5019804239273071, -0.48085182905197144, -0.4597232937812805, -0.4385947287082672, -0.4174661636352539, -0.396337628364563, -0.3752090632915497, -0.3540804982185364, -0.33295196294784546, -0.31182339787483215, -0.29069483280181885, -0.26956629753112793, -0.24843774735927582, -0.2273091971874237, -0.2061806321144104, -0.1850520819425583, -0.16392353177070618, -0.14279496669769287, -0.12166641652584076, -0.10053786635398865, -0.07940931618213654, -0.05828075855970383, -0.03715220093727112, -0.016023650765419006, 0.0051048994064331055, 0.02623346447944641, 0.04736201465129852, 0.06849062442779541, 0.08961917459964752, 0.11074773222208023, 0.13187628984451294, 0.15300484001636505, 0.17413339018821716, 0.19526195526123047, 0.21639050543308258, 0.2375190556049347, 0.258647620677948, 0.2797761559486389, 0.3009047210216522, 0.3220332860946655, 0.34316182136535645, 0.36429038643836975, 0.38541895151138306, 0.406547486782074, 0.4276760518550873, 0.4488045871257782, 0.4699331521987915, 0.4910616874694824, 0.5121902227401733, 0.533318817615509, 0.5544473528862, 0.5755759477615356, 0.5967044830322266, 0.6178330779075623, 0.6389616131782532, 0.6600901484489441, 0.6812187433242798, 0.7023472785949707, 0.7234758138656616, 0.7446043491363525]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 7.0, 13.0, 18.0, 23.0, 40.0, 48.0, 52.0, 80.0, 79.0, 87.0, 81.0, 88.0, 91.0, 62.0, 64.0, 52.0, 31.0, 28.0, 16.0, 19.0, 12.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16862046718597412, -0.16302843391895294, -0.15743640065193176, -0.15184436738491058, -0.1462523341178894, -0.14066031575202942, -0.13506828248500824, -0.12947624921798706, -0.12388421595096588, -0.1182921826839447, -0.11270014941692352, -0.10710812360048294, -0.10151609033346176, -0.09592405706644058, -0.09033203125, -0.08473999798297882, -0.07914796471595764, -0.07355593144893646, -0.06796389818191528, -0.0623718723654747, -0.05677983909845352, -0.05118780583143234, -0.04559577628970146, -0.04000374674797058, -0.0344117134809494, -0.028819682076573372, -0.023227650672197342, -0.017635619267821312, -0.012043587863445282, -0.006451556459069252, -0.000859525054693222, 0.004732504487037659, 0.010324537754058838, 0.015916569158434868, 0.021508600562810898, 0.027100631967186928, 0.03269266337156296, 0.03828469663858414, 0.04387672618031502, 0.0494687557220459, 0.05506078898906708, 0.06065282225608826, 0.06624485552310944, 0.07183688133955002, 0.0774289146065712, 0.08302094787359238, 0.08861297369003296, 0.09420500695705414, 0.09979704022407532, 0.1053890734910965, 0.11098110675811768, 0.11657313257455826, 0.12216516584157944, 0.12775719165802002, 0.1333492249250412, 0.13894125819206238, 0.14453329145908356, 0.15012532472610474, 0.15571735799312592, 0.1613093912601471, 0.16690140962600708, 0.17249344289302826, 0.17808547616004944, 0.18367750942707062, 0.1892695426940918]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 6.0, 7.0, 10.0, 11.0, 12.0, 15.0, 19.0, 26.0, 27.0, 64.0, 58.0, 102.0, 134.0, 178.0, 298.0, 437.0, 810.0, 2454.0, 26684.0, 972716.0, 39185.0, 2867.0, 952.0, 476.0, 252.0, 219.0, 124.0, 108.0, 57.0, 53.0, 34.0, 28.0, 28.0, 22.0, 18.0, 6.0, 12.0, 16.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1678466796875, -0.16298866271972656, -0.15813064575195312, -0.1532726287841797, -0.14841461181640625, -0.1435565948486328, -0.13869857788085938, -0.13384056091308594, -0.1289825439453125, -0.12412452697753906, -0.11926651000976562, -0.11440849304199219, -0.10955047607421875, -0.10469245910644531, -0.09983444213867188, -0.09497642517089844, -0.090118408203125, -0.08526039123535156, -0.08040237426757812, -0.07554435729980469, -0.07068634033203125, -0.06582832336425781, -0.060970306396484375, -0.05611228942871094, -0.0512542724609375, -0.04639625549316406, -0.041538238525390625, -0.03668022155761719, -0.03182220458984375, -0.026964187622070312, -0.022106170654296875, -0.017248153686523438, -0.01239013671875, -0.0075321197509765625, -0.002674102783203125, 0.0021839141845703125, 0.00704193115234375, 0.011899948120117188, 0.016757965087890625, 0.021615982055664062, 0.0264739990234375, 0.03133201599121094, 0.036190032958984375, 0.04104804992675781, 0.04590606689453125, 0.05076408386230469, 0.055622100830078125, 0.06048011779785156, 0.065338134765625, 0.07019615173339844, 0.07505416870117188, 0.07991218566894531, 0.08477020263671875, 0.08962821960449219, 0.09448623657226562, 0.09934425354003906, 0.1042022705078125, 0.10906028747558594, 0.11391830444335938, 0.11877632141113281, 0.12363433837890625, 0.1284923553466797, 0.13335037231445312, 0.13820838928222656, 0.14306640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 34.0, 163.0, 447.0, 283.0, 51.0, 15.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0745849609375, -0.0723714828491211, -0.07015800476074219, -0.06794452667236328, -0.06573104858398438, -0.06351757049560547, -0.06130409240722656, -0.059090614318847656, -0.05687713623046875, -0.054663658142089844, -0.05245018005371094, -0.05023670196533203, -0.048023223876953125, -0.04580974578857422, -0.04359626770019531, -0.041382789611816406, -0.0391693115234375, -0.036955833435058594, -0.03474235534667969, -0.03252887725830078, -0.030315399169921875, -0.02810192108154297, -0.025888442993164062, -0.023674964904785156, -0.02146148681640625, -0.019248008728027344, -0.017034530639648438, -0.014821052551269531, -0.012607574462890625, -0.010394096374511719, -0.008180618286132812, -0.005967140197753906, -0.003753662109375, -0.0015401840209960938, 0.0006732940673828125, 0.0028867721557617188, 0.005100250244140625, 0.007313728332519531, 0.009527206420898438, 0.011740684509277344, 0.01395416259765625, 0.016167640686035156, 0.018381118774414062, 0.02059459686279297, 0.022808074951171875, 0.02502155303955078, 0.027235031127929688, 0.029448509216308594, 0.0316619873046875, 0.033875465393066406, 0.03608894348144531, 0.03830242156982422, 0.040515899658203125, 0.04272937774658203, 0.04494285583496094, 0.047156333923339844, 0.04936981201171875, 0.051583290100097656, 0.05379676818847656, 0.05601024627685547, 0.058223724365234375, 0.06043720245361328, 0.06265068054199219, 0.0648641586303711, 0.06707763671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 11.0, 18.0, 9.0, 13.0, 17.0, 28.0, 39.0, 52.0, 83.0, 148.0, 203.0, 404.0, 771.0, 2583.0, 32257.0, 948247.0, 58399.0, 3232.0, 905.0, 432.0, 228.0, 138.0, 80.0, 56.0, 60.0, 31.0, 31.0, 18.0, 9.0, 13.0, 7.0, 6.0, 2.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1583251953125, -0.1529712677001953, -0.14761734008789062, -0.14226341247558594, -0.13690948486328125, -0.13155555725097656, -0.12620162963867188, -0.12084770202636719, -0.1154937744140625, -0.11013984680175781, -0.10478591918945312, -0.09943199157714844, -0.09407806396484375, -0.08872413635253906, -0.08337020874023438, -0.07801628112792969, -0.072662353515625, -0.06730842590332031, -0.061954498291015625, -0.05660057067871094, -0.05124664306640625, -0.04589271545410156, -0.040538787841796875, -0.03518486022949219, -0.0298309326171875, -0.024477005004882812, -0.019123077392578125, -0.013769149780273438, -0.00841522216796875, -0.0030612945556640625, 0.002292633056640625, 0.0076465606689453125, 0.01300048828125, 0.018354415893554688, 0.023708343505859375, 0.029062271118164062, 0.03441619873046875, 0.03977012634277344, 0.045124053955078125, 0.05047798156738281, 0.0558319091796875, 0.06118583679199219, 0.06653976440429688, 0.07189369201660156, 0.07724761962890625, 0.08260154724121094, 0.08795547485351562, 0.09330940246582031, 0.098663330078125, 0.10401725769042969, 0.10937118530273438, 0.11472511291503906, 0.12007904052734375, 0.12543296813964844, 0.13078689575195312, 0.1361408233642578, 0.1414947509765625, 0.1468486785888672, 0.15220260620117188, 0.15755653381347656, 0.16291046142578125, 0.16826438903808594, 0.17361831665039062, 0.1789722442626953, 0.184326171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 12.0, 24.0, 7.0, 13.0, 18.0, 22.0, 20.0, 22.0, 42.0, 48.0, 53.0, 48.0, 60.0, 70.0, 62.0, 46.0, 64.0, 56.0, 51.0, 45.0, 36.0, 41.0, 29.0, 17.0, 16.0, 11.0, 16.0, 7.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.048259735107421875, -0.04674530029296875, -0.045230865478515625, -0.0437164306640625, -0.042201995849609375, -0.04068756103515625, -0.039173126220703125, -0.03765869140625, -0.036144256591796875, -0.03462982177734375, -0.033115386962890625, -0.0316009521484375, -0.030086517333984375, -0.02857208251953125, -0.027057647705078125, -0.025543212890625, -0.024028778076171875, -0.02251434326171875, -0.020999908447265625, -0.0194854736328125, -0.017971038818359375, -0.01645660400390625, -0.014942169189453125, -0.013427734375, -0.011913299560546875, -0.01039886474609375, -0.008884429931640625, -0.0073699951171875, -0.005855560302734375, -0.00434112548828125, -0.002826690673828125, -0.001312255859375, 0.000202178955078125, 0.00171661376953125, 0.003231048583984375, 0.0047454833984375, 0.006259918212890625, 0.00777435302734375, 0.009288787841796875, 0.01080322265625, 0.012317657470703125, 0.01383209228515625, 0.015346527099609375, 0.0168609619140625, 0.018375396728515625, 0.01988983154296875, 0.021404266357421875, 0.022918701171875, 0.024433135986328125, 0.02594757080078125, 0.027462005615234375, 0.0289764404296875, 0.030490875244140625, 0.03200531005859375, 0.033519744873046875, 0.0350341796875, 0.036548614501953125, 0.03806304931640625, 0.039577484130859375, 0.0410919189453125, 0.042606353759765625, 0.04412078857421875, 0.045635223388671875, 0.047149658203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 6.0, 6.0, 13.0, 14.0, 31.0, 51.0, 45.0, 71.0, 145.0, 262.0, 493.0, 1082.0, 2448.0, 6817.0, 20758.0, 158628.0, 801286.0, 38751.0, 10810.0, 3821.0, 1462.0, 702.0, 327.0, 154.0, 128.0, 73.0, 42.0, 31.0, 19.0, 15.0, 12.0, 16.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054473876953125, -0.052472591400146484, -0.05047130584716797, -0.04847002029418945, -0.04646873474121094, -0.04446744918823242, -0.042466163635253906, -0.04046487808227539, -0.038463592529296875, -0.03646230697631836, -0.034461021423339844, -0.03245973587036133, -0.030458450317382812, -0.028457164764404297, -0.02645587921142578, -0.024454593658447266, -0.02245330810546875, -0.020452022552490234, -0.01845073699951172, -0.016449451446533203, -0.014448165893554688, -0.012446880340576172, -0.010445594787597656, -0.00844430923461914, -0.006443023681640625, -0.004441738128662109, -0.0024404525756835938, -0.0004391670227050781, 0.0015621185302734375, 0.003563404083251953, 0.005564689636230469, 0.007565975189208984, 0.0095672607421875, 0.011568546295166016, 0.013569831848144531, 0.015571117401123047, 0.017572402954101562, 0.019573688507080078, 0.021574974060058594, 0.02357625961303711, 0.025577545166015625, 0.02757883071899414, 0.029580116271972656, 0.03158140182495117, 0.03358268737792969, 0.0355839729309082, 0.03758525848388672, 0.039586544036865234, 0.04158782958984375, 0.043589115142822266, 0.04559040069580078, 0.0475916862487793, 0.04959297180175781, 0.05159425735473633, 0.053595542907714844, 0.05559682846069336, 0.057598114013671875, 0.05959939956665039, 0.061600685119628906, 0.06360197067260742, 0.06560325622558594, 0.06760454177856445, 0.06960582733154297, 0.07160711288452148, 0.0736083984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 8.0, 10.0, 13.0, 14.0, 21.0, 35.0, 40.0, 46.0, 71.0, 100.0, 106.0, 115.0, 117.0, 66.0, 40.0, 41.0, 21.0, 35.0, 21.0, 16.0, 16.0, 11.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.976483225822449e-05, -5.7481229305267334e-05, -5.519762635231018e-05, -5.291402339935303e-05, -5.0630420446395874e-05, -4.834681749343872e-05, -4.606321454048157e-05, -4.3779611587524414e-05, -4.149600863456726e-05, -3.921240568161011e-05, -3.6928802728652954e-05, -3.46451997756958e-05, -3.236159682273865e-05, -3.0077993869781494e-05, -2.779439091682434e-05, -2.5510787963867188e-05, -2.3227185010910034e-05, -2.094358205795288e-05, -1.8659979104995728e-05, -1.6376376152038574e-05, -1.4092773199081421e-05, -1.1809170246124268e-05, -9.525567293167114e-06, -7.241964340209961e-06, -4.958361387252808e-06, -2.6747584342956543e-06, -3.91155481338501e-07, 1.8924474716186523e-06, 4.176050424575806e-06, 6.459653377532959e-06, 8.743256330490112e-06, 1.1026859283447266e-05, 1.3310462236404419e-05, 1.5594065189361572e-05, 1.7877668142318726e-05, 2.016127109527588e-05, 2.2444874048233032e-05, 2.4728477001190186e-05, 2.701207995414734e-05, 2.9295682907104492e-05, 3.1579285860061646e-05, 3.38628888130188e-05, 3.614649176597595e-05, 3.8430094718933105e-05, 4.071369767189026e-05, 4.299730062484741e-05, 4.5280903577804565e-05, 4.756450653076172e-05, 4.984810948371887e-05, 5.2131712436676025e-05, 5.441531538963318e-05, 5.669891834259033e-05, 5.8982521295547485e-05, 6.126612424850464e-05, 6.354972720146179e-05, 6.583333015441895e-05, 6.81169331073761e-05, 7.040053606033325e-05, 7.26841390132904e-05, 7.496774196624756e-05, 7.725134491920471e-05, 7.953494787216187e-05, 8.181855082511902e-05, 8.410215377807617e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 10.0, 13.0, 19.0, 30.0, 34.0, 40.0, 96.0, 186.0, 372.0, 1653.0, 13398.0, 919667.0, 106165.0, 5385.0, 811.0, 277.0, 139.0, 86.0, 59.0, 28.0, 19.0, 17.0, 14.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1241455078125, -0.1207742691040039, -0.11740303039550781, -0.11403179168701172, -0.11066055297851562, -0.10728931427001953, -0.10391807556152344, -0.10054683685302734, -0.09717559814453125, -0.09380435943603516, -0.09043312072753906, -0.08706188201904297, -0.08369064331054688, -0.08031940460205078, -0.07694816589355469, -0.0735769271850586, -0.0702056884765625, -0.0668344497680664, -0.06346321105957031, -0.06009197235107422, -0.056720733642578125, -0.05334949493408203, -0.04997825622558594, -0.046607017517089844, -0.04323577880859375, -0.039864540100097656, -0.03649330139160156, -0.03312206268310547, -0.029750823974609375, -0.02637958526611328, -0.023008346557617188, -0.019637107849121094, -0.016265869140625, -0.012894630432128906, -0.009523391723632812, -0.006152153015136719, -0.002780914306640625, 0.0005903244018554688, 0.0039615631103515625, 0.007332801818847656, 0.01070404052734375, 0.014075279235839844, 0.017446517944335938, 0.02081775665283203, 0.024188995361328125, 0.02756023406982422, 0.030931472778320312, 0.034302711486816406, 0.0376739501953125, 0.041045188903808594, 0.04441642761230469, 0.04778766632080078, 0.051158905029296875, 0.05453014373779297, 0.05790138244628906, 0.061272621154785156, 0.06464385986328125, 0.06801509857177734, 0.07138633728027344, 0.07475757598876953, 0.07812881469726562, 0.08150005340576172, 0.08487129211425781, 0.0882425308227539, 0.09161376953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 9.0, 15.0, 14.0, 14.0, 32.0, 49.0, 100.0, 171.0, 196.0, 140.0, 77.0, 50.0, 23.0, 13.0, 13.0, 13.0, 5.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.026153564453125, -0.025314807891845703, -0.024476051330566406, -0.02363729476928711, -0.022798538208007812, -0.021959781646728516, -0.02112102508544922, -0.020282268524169922, -0.019443511962890625, -0.018604755401611328, -0.01776599884033203, -0.016927242279052734, -0.016088485717773438, -0.01524972915649414, -0.014410972595214844, -0.013572216033935547, -0.01273345947265625, -0.011894702911376953, -0.011055946350097656, -0.01021718978881836, -0.009378433227539062, -0.008539676666259766, -0.007700920104980469, -0.006862163543701172, -0.006023406982421875, -0.005184650421142578, -0.004345893859863281, -0.0035071372985839844, -0.0026683807373046875, -0.0018296241760253906, -0.0009908676147460938, -0.00015211105346679688, 0.0006866455078125, 0.0015254020690917969, 0.0023641586303710938, 0.0032029151916503906, 0.0040416717529296875, 0.004880428314208984, 0.005719184875488281, 0.006557941436767578, 0.007396697998046875, 0.008235454559326172, 0.009074211120605469, 0.009912967681884766, 0.010751724243164062, 0.01159048080444336, 0.012429237365722656, 0.013267993927001953, 0.01410675048828125, 0.014945507049560547, 0.015784263610839844, 0.01662302017211914, 0.017461776733398438, 0.018300533294677734, 0.01913928985595703, 0.019978046417236328, 0.020816802978515625, 0.021655559539794922, 0.02249431610107422, 0.023333072662353516, 0.024171829223632812, 0.02501058578491211, 0.025849342346191406, 0.026688098907470703, 0.02752685546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 13.0, 54.0, 203.0, 425.0, 229.0, 52.0, 16.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5034151077270508, -0.48789334297180176, -0.4723716080188751, -0.4568498432636261, -0.4413280785083771, -0.42580634355545044, -0.4102845788002014, -0.3947628140449524, -0.37924107909202576, -0.36371931433677673, -0.3481975793838501, -0.3326758146286011, -0.31715404987335205, -0.3016323149204254, -0.2861105501651764, -0.27058881521224976, -0.25506705045700073, -0.2395453006029129, -0.22402353584766388, -0.20850178599357605, -0.19298003613948822, -0.1774582862854004, -0.16193652153015137, -0.14641477167606354, -0.13089299201965332, -0.1153712347149849, -0.09984948486089706, -0.08432772755622864, -0.06880597770214081, -0.05328422039747238, -0.037762463092803955, -0.022240713238716125, -0.006718963384628296, 0.008802791126072407, 0.02432454563677311, 0.03984630107879639, 0.055368054658174515, 0.07088980823755264, 0.08641156554222107, 0.1019333153963089, 0.11745507270097733, 0.13297683000564575, 0.14849857985973358, 0.1640203297138214, 0.17954209446907043, 0.19506384432315826, 0.2105855941772461, 0.22610735893249512, 0.24162910878658295, 0.2571508586406708, 0.2726726233959198, 0.28819435834884644, 0.30371612310409546, 0.3192378878593445, 0.3347596526145935, 0.35028138756752014, 0.36580315232276917, 0.3813249170780182, 0.3968466520309448, 0.41236841678619385, 0.42789018154144287, 0.4434119164943695, 0.45893368124961853, 0.47445541620254517, 0.4899771809577942]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 3.0, 10.0, 12.0, 15.0, 16.0, 34.0, 22.0, 31.0, 56.0, 49.0, 60.0, 73.0, 65.0, 75.0, 59.0, 55.0, 55.0, 58.0, 43.0, 47.0, 44.0, 24.0, 22.0, 12.0, 16.0, 13.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17116987705230713, -0.16502514481544495, -0.15888041257858276, -0.1527356654405594, -0.1465909332036972, -0.14044620096683502, -0.13430145382881165, -0.12815672159194946, -0.12201198935508728, -0.1158672571182251, -0.10972251743078232, -0.10357777774333954, -0.09743304550647736, -0.09128831326961517, -0.0851435735821724, -0.07899883389472961, -0.07285410165786743, -0.06670936942100525, -0.06056462973356247, -0.05441989377140999, -0.04827515780925751, -0.042130421847105026, -0.035985685884952545, -0.029840949922800064, -0.023696213960647583, -0.017551477998495102, -0.01140674203634262, -0.00526200607419014, 0.0008827298879623413, 0.007027465850114822, 0.013172201812267303, 0.019316937774419785, 0.025461673736572266, 0.03160640969872475, 0.03775114566087723, 0.04389588162302971, 0.05004061758518219, 0.05618535354733467, 0.06233008950948715, 0.06847482919692993, 0.07461956143379211, 0.0807642936706543, 0.08690903335809708, 0.09305377304553986, 0.09919850528240204, 0.10534323751926422, 0.111487977206707, 0.11763271689414978, 0.12377744913101196, 0.12992218136787415, 0.13606691360473633, 0.1422116607427597, 0.1483563929796219, 0.15450112521648407, 0.16064587235450745, 0.16679060459136963, 0.1729353368282318, 0.179080069065094, 0.18522480130195618, 0.19136954843997955, 0.19751428067684174, 0.20365901291370392, 0.2098037600517273, 0.21594849228858948, 0.22209322452545166]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 12.0, 7.0, 9.0, 25.0, 16.0, 40.0, 43.0, 90.0, 132.0, 303.0, 1189.0, 3513.0, 6270.0, 147583.0, 4008577.0, 19415.0, 3939.0, 1581.0, 805.0, 267.0, 150.0, 93.0, 65.0, 44.0, 29.0, 28.0, 14.0, 14.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.06729793548583984, -0.06483268737792969, -0.06236743927001953, -0.059902191162109375, -0.05743694305419922, -0.05497169494628906, -0.052506446838378906, -0.05004119873046875, -0.047575950622558594, -0.04511070251464844, -0.04264545440673828, -0.040180206298828125, -0.03771495819091797, -0.03524971008300781, -0.032784461975097656, -0.0303192138671875, -0.027853965759277344, -0.025388717651367188, -0.02292346954345703, -0.020458221435546875, -0.01799297332763672, -0.015527725219726562, -0.013062477111816406, -0.01059722900390625, -0.008131980895996094, -0.0056667327880859375, -0.0032014846801757812, -0.000736236572265625, 0.0017290115356445312, 0.0041942596435546875, 0.006659507751464844, 0.009124755859375, 0.011590003967285156, 0.014055252075195312, 0.01652050018310547, 0.018985748291015625, 0.02145099639892578, 0.023916244506835938, 0.026381492614746094, 0.02884674072265625, 0.031311988830566406, 0.03377723693847656, 0.03624248504638672, 0.038707733154296875, 0.04117298126220703, 0.04363822937011719, 0.046103477478027344, 0.0485687255859375, 0.051033973693847656, 0.05349922180175781, 0.05596446990966797, 0.058429718017578125, 0.06089496612548828, 0.06336021423339844, 0.0658254623413086, 0.06829071044921875, 0.0707559585571289, 0.07322120666503906, 0.07568645477294922, 0.07815170288085938, 0.08061695098876953, 0.08308219909667969, 0.08554744720458984, 0.0880126953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 36.0, 158.0, 392.0, 302.0, 79.0, 19.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0699462890625, -0.06787872314453125, -0.0658111572265625, -0.06374359130859375, -0.061676025390625, -0.05960845947265625, -0.0575408935546875, -0.05547332763671875, -0.05340576171875, -0.05133819580078125, -0.0492706298828125, -0.04720306396484375, -0.045135498046875, -0.04306793212890625, -0.0410003662109375, -0.03893280029296875, -0.036865234375, -0.03479766845703125, -0.0327301025390625, -0.03066253662109375, -0.028594970703125, -0.02652740478515625, -0.0244598388671875, -0.02239227294921875, -0.02032470703125, -0.01825714111328125, -0.0161895751953125, -0.01412200927734375, -0.012054443359375, -0.00998687744140625, -0.0079193115234375, -0.00585174560546875, -0.0037841796875, -0.00171661376953125, 0.0003509521484375, 0.00241851806640625, 0.004486083984375, 0.00655364990234375, 0.0086212158203125, 0.01068878173828125, 0.01275634765625, 0.01482391357421875, 0.0168914794921875, 0.01895904541015625, 0.021026611328125, 0.02309417724609375, 0.0251617431640625, 0.02722930908203125, 0.029296875, 0.03136444091796875, 0.0334320068359375, 0.03549957275390625, 0.037567138671875, 0.03963470458984375, 0.0417022705078125, 0.04376983642578125, 0.04583740234375, 0.04790496826171875, 0.0499725341796875, 0.05204010009765625, 0.054107666015625, 0.05617523193359375, 0.0582427978515625, 0.06031036376953125, 0.0623779296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 13.0, 11.0, 21.0, 27.0, 44.0, 77.0, 113.0, 243.0, 413.0, 1055.0, 3805.0, 33861.0, 3652893.0, 487478.0, 10804.0, 2012.0, 688.0, 316.0, 151.0, 87.0, 60.0, 29.0, 22.0, 15.0, 9.0, 9.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06700801849365234, -0.06468009948730469, -0.06235218048095703, -0.060024261474609375, -0.05769634246826172, -0.05536842346191406, -0.053040504455566406, -0.05071258544921875, -0.048384666442871094, -0.04605674743652344, -0.04372882843017578, -0.041400909423828125, -0.03907299041748047, -0.03674507141113281, -0.034417152404785156, -0.0320892333984375, -0.029761314392089844, -0.027433395385742188, -0.02510547637939453, -0.022777557373046875, -0.02044963836669922, -0.018121719360351562, -0.015793800354003906, -0.01346588134765625, -0.011137962341308594, -0.008810043334960938, -0.006482124328613281, -0.004154205322265625, -0.0018262863159179688, 0.0005016326904296875, 0.0028295516967773438, 0.005157470703125, 0.007485389709472656, 0.009813308715820312, 0.012141227722167969, 0.014469146728515625, 0.01679706573486328, 0.019124984741210938, 0.021452903747558594, 0.02378082275390625, 0.026108741760253906, 0.028436660766601562, 0.03076457977294922, 0.033092498779296875, 0.03542041778564453, 0.03774833679199219, 0.040076255798339844, 0.0424041748046875, 0.044732093811035156, 0.04706001281738281, 0.04938793182373047, 0.051715850830078125, 0.05404376983642578, 0.05637168884277344, 0.058699607849121094, 0.06102752685546875, 0.0633554458618164, 0.06568336486816406, 0.06801128387451172, 0.07033920288085938, 0.07266712188720703, 0.07499504089355469, 0.07732295989990234, 0.07965087890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 5.0, 14.0, 18.0, 26.0, 33.0, 48.0, 73.0, 133.0, 179.0, 243.0, 378.0, 508.0, 591.0, 544.0, 376.0, 276.0, 194.0, 138.0, 73.0, 70.0, 42.0, 39.0, 27.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027923583984375, -0.027040958404541016, -0.02615833282470703, -0.025275707244873047, -0.024393081665039062, -0.023510456085205078, -0.022627830505371094, -0.02174520492553711, -0.020862579345703125, -0.01997995376586914, -0.019097328186035156, -0.018214702606201172, -0.017332077026367188, -0.016449451446533203, -0.015566825866699219, -0.014684200286865234, -0.01380157470703125, -0.012918949127197266, -0.012036323547363281, -0.011153697967529297, -0.010271072387695312, -0.009388446807861328, -0.008505821228027344, -0.007623195648193359, -0.006740570068359375, -0.005857944488525391, -0.004975318908691406, -0.004092693328857422, -0.0032100677490234375, -0.002327442169189453, -0.0014448165893554688, -0.0005621910095214844, 0.0003204345703125, 0.0012030601501464844, 0.0020856857299804688, 0.002968311309814453, 0.0038509368896484375, 0.004733562469482422, 0.005616188049316406, 0.006498813629150391, 0.007381439208984375, 0.00826406478881836, 0.009146690368652344, 0.010029315948486328, 0.010911941528320312, 0.011794567108154297, 0.012677192687988281, 0.013559818267822266, 0.01444244384765625, 0.015325069427490234, 0.01620769500732422, 0.017090320587158203, 0.017972946166992188, 0.018855571746826172, 0.019738197326660156, 0.02062082290649414, 0.021503448486328125, 0.02238607406616211, 0.023268699645996094, 0.024151325225830078, 0.025033950805664062, 0.025916576385498047, 0.02679920196533203, 0.027681827545166016, 0.028564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 35.0, 154.0, 408.0, 299.0, 85.0, 14.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29196077585220337, -0.28144949674606323, -0.2709381878376007, -0.2604268789291382, -0.24991559982299805, -0.23940430581569672, -0.22889301180839539, -0.21838171780109406, -0.20787042379379272, -0.1973591297864914, -0.18684783577919006, -0.17633654177188873, -0.1658252477645874, -0.15531395375728607, -0.14480265974998474, -0.1342913657426834, -0.12378007173538208, -0.11326877772808075, -0.10275748372077942, -0.09224618971347809, -0.08173489570617676, -0.07122360169887543, -0.0607123076915741, -0.050201013684272766, -0.039689719676971436, -0.029178425669670105, -0.018667131662368774, -0.008155837655067444, 0.0023554563522338867, 0.012866750359535217, 0.023378044366836548, 0.03388933837413788, 0.04440063238143921, 0.05491192638874054, 0.06542322039604187, 0.0759345144033432, 0.08644580841064453, 0.09695710241794586, 0.10746839642524719, 0.11797969043254852, 0.12849098443984985, 0.13900227844715118, 0.14951357245445251, 0.16002486646175385, 0.17053616046905518, 0.1810474544763565, 0.19155874848365784, 0.20207004249095917, 0.2125813364982605, 0.22309263050556183, 0.23360392451286316, 0.2441152185201645, 0.2546265125274658, 0.26513779163360596, 0.2756491005420685, 0.286160409450531, 0.29667168855667114, 0.3071829676628113, 0.3176942765712738, 0.32820558547973633, 0.33871686458587646, 0.3492281436920166, 0.3597394526004791, 0.37025076150894165, 0.3807620406150818]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 16.0, 12.0, 30.0, 26.0, 31.0, 34.0, 35.0, 47.0, 56.0, 62.0, 49.0, 65.0, 46.0, 55.0, 45.0, 37.0, 62.0, 46.0, 41.0, 34.0, 34.0, 27.0, 21.0, 16.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11320865154266357, -0.10996858775615692, -0.10672852396965027, -0.10348846018314362, -0.10024839639663696, -0.09700833261013031, -0.09376827627420425, -0.0905282124876976, -0.08728814870119095, -0.0840480849146843, -0.08080802112817764, -0.07756795734167099, -0.07432790100574493, -0.07108783721923828, -0.06784777343273163, -0.06460770964622498, -0.06136764585971832, -0.05812758207321167, -0.05488751828670502, -0.05164745822548866, -0.04840739443898201, -0.04516733065247536, -0.041927270591259, -0.03868720680475235, -0.0354471430182457, -0.032207079231739044, -0.02896701730787754, -0.025726955384016037, -0.022486891597509384, -0.01924682781100273, -0.016006765887141228, -0.012766703963279724, -0.009526640176773071, -0.006286577321588993, -0.003046514466404915, 0.00019354838877916336, 0.0034336112439632416, 0.006673675030469894, 0.009913736954331398, 0.013153798878192902, 0.016393862664699554, 0.019633926451206207, 0.02287398837506771, 0.026114050298929214, 0.029354114085435867, 0.03259417787194252, 0.035834237933158875, 0.03907430171966553, 0.04231436550617218, 0.04555442929267883, 0.048794493079185486, 0.05203455314040184, 0.05527461692690849, 0.058514680713415146, 0.0617547407746315, 0.06499480456113815, 0.0682348683476448, 0.07147493213415146, 0.07471499592065811, 0.07795505970716476, 0.08119511604309082, 0.08443517982959747, 0.08767524361610413, 0.09091530740261078, 0.09415537118911743]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 10.0, 11.0, 12.0, 17.0, 25.0, 19.0, 26.0, 33.0, 38.0, 45.0, 52.0, 88.0, 111.0, 117.0, 185.0, 258.0, 330.0, 518.0, 873.0, 2107.0, 14428.0, 567752.0, 444861.0, 12059.0, 1932.0, 823.0, 471.0, 326.0, 227.0, 182.0, 126.0, 105.0, 67.0, 62.0, 50.0, 40.0, 34.0, 20.0, 27.0, 22.0, 17.0, 10.0, 9.0, 8.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.094970703125, -0.09208965301513672, -0.08920860290527344, -0.08632755279541016, -0.08344650268554688, -0.0805654525756836, -0.07768440246582031, -0.07480335235595703, -0.07192230224609375, -0.06904125213623047, -0.06616020202636719, -0.0632791519165039, -0.060398101806640625, -0.057517051696777344, -0.05463600158691406, -0.05175495147705078, -0.0488739013671875, -0.04599285125732422, -0.04311180114746094, -0.040230751037597656, -0.037349700927734375, -0.034468650817871094, -0.03158760070800781, -0.02870655059814453, -0.02582550048828125, -0.02294445037841797, -0.020063400268554688, -0.017182350158691406, -0.014301300048828125, -0.011420249938964844, -0.008539199829101562, -0.005658149719238281, -0.002777099609375, 0.00010395050048828125, 0.0029850006103515625, 0.005866050720214844, 0.008747100830078125, 0.011628150939941406, 0.014509201049804688, 0.01739025115966797, 0.02027130126953125, 0.02315235137939453, 0.026033401489257812, 0.028914451599121094, 0.031795501708984375, 0.034676551818847656, 0.03755760192871094, 0.04043865203857422, 0.0433197021484375, 0.04620075225830078, 0.04908180236816406, 0.051962852478027344, 0.054843902587890625, 0.057724952697753906, 0.06060600280761719, 0.06348705291748047, 0.06636810302734375, 0.06924915313720703, 0.07213020324707031, 0.0750112533569336, 0.07789230346679688, 0.08077335357666016, 0.08365440368652344, 0.08653545379638672, 0.08941650390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 23.0, 112.0, 355.0, 367.0, 109.0, 27.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0677490234375, -0.06569957733154297, -0.06365013122558594, -0.061600685119628906, -0.059551239013671875, -0.057501792907714844, -0.05545234680175781, -0.05340290069580078, -0.05135345458984375, -0.04930400848388672, -0.04725456237792969, -0.045205116271972656, -0.043155670166015625, -0.041106224060058594, -0.03905677795410156, -0.03700733184814453, -0.0349578857421875, -0.03290843963623047, -0.030858993530273438, -0.028809547424316406, -0.026760101318359375, -0.024710655212402344, -0.022661209106445312, -0.02061176300048828, -0.01856231689453125, -0.01651287078857422, -0.014463424682617188, -0.012413978576660156, -0.010364532470703125, -0.008315086364746094, -0.0062656402587890625, -0.004216194152832031, -0.002166748046875, -0.00011730194091796875, 0.0019321441650390625, 0.003981590270996094, 0.006031036376953125, 0.008080482482910156, 0.010129928588867188, 0.012179374694824219, 0.01422882080078125, 0.01627826690673828, 0.018327713012695312, 0.020377159118652344, 0.022426605224609375, 0.024476051330566406, 0.026525497436523438, 0.02857494354248047, 0.0306243896484375, 0.03267383575439453, 0.03472328186035156, 0.036772727966308594, 0.038822174072265625, 0.040871620178222656, 0.04292106628417969, 0.04497051239013672, 0.04701995849609375, 0.04906940460205078, 0.05111885070800781, 0.053168296813964844, 0.055217742919921875, 0.057267189025878906, 0.05931663513183594, 0.06136608123779297, 0.06341552734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 2.0, 7.0, 9.0, 10.0, 16.0, 15.0, 25.0, 24.0, 44.0, 73.0, 125.0, 177.0, 423.0, 928.0, 3032.0, 69056.0, 957748.0, 13518.0, 1865.0, 676.0, 318.0, 158.0, 82.0, 58.0, 36.0, 20.0, 25.0, 13.0, 15.0, 10.0, 10.0, 6.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1761474609375, -0.17101478576660156, -0.16588211059570312, -0.1607494354248047, -0.15561676025390625, -0.1504840850830078, -0.14535140991210938, -0.14021873474121094, -0.1350860595703125, -0.12995338439941406, -0.12482070922851562, -0.11968803405761719, -0.11455535888671875, -0.10942268371582031, -0.10429000854492188, -0.09915733337402344, -0.094024658203125, -0.08889198303222656, -0.08375930786132812, -0.07862663269042969, -0.07349395751953125, -0.06836128234863281, -0.06322860717773438, -0.05809593200683594, -0.0529632568359375, -0.04783058166503906, -0.042697906494140625, -0.03756523132324219, -0.03243255615234375, -0.027299880981445312, -0.022167205810546875, -0.017034530639648438, -0.01190185546875, -0.0067691802978515625, -0.001636505126953125, 0.0034961700439453125, 0.00862884521484375, 0.013761520385742188, 0.018894195556640625, 0.024026870727539062, 0.0291595458984375, 0.03429222106933594, 0.039424896240234375, 0.04455757141113281, 0.04969024658203125, 0.05482292175292969, 0.059955596923828125, 0.06508827209472656, 0.070220947265625, 0.07535362243652344, 0.08048629760742188, 0.08561897277832031, 0.09075164794921875, 0.09588432312011719, 0.10101699829101562, 0.10614967346191406, 0.1112823486328125, 0.11641502380371094, 0.12154769897460938, 0.1266803741455078, 0.13181304931640625, 0.1369457244873047, 0.14207839965820312, 0.14721107482910156, 0.15234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 9.0, 17.0, 9.0, 14.0, 21.0, 24.0, 25.0, 28.0, 33.0, 34.0, 38.0, 51.0, 49.0, 47.0, 46.0, 57.0, 43.0, 48.0, 52.0, 37.0, 49.0, 37.0, 40.0, 28.0, 25.0, 23.0, 16.0, 18.0, 13.0, 9.0, 11.0, 5.0, 9.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.03936767578125, -0.03816032409667969, -0.036952972412109375, -0.03574562072753906, -0.03453826904296875, -0.03333091735839844, -0.032123565673828125, -0.030916213989257812, -0.0297088623046875, -0.028501510620117188, -0.027294158935546875, -0.026086807250976562, -0.02487945556640625, -0.023672103881835938, -0.022464752197265625, -0.021257400512695312, -0.020050048828125, -0.018842697143554688, -0.017635345458984375, -0.016427993774414062, -0.01522064208984375, -0.014013290405273438, -0.012805938720703125, -0.011598587036132812, -0.0103912353515625, -0.009183883666992188, -0.007976531982421875, -0.0067691802978515625, -0.00556182861328125, -0.0043544769287109375, -0.003147125244140625, -0.0019397735595703125, -0.000732421875, 0.0004749298095703125, 0.001682281494140625, 0.0028896331787109375, 0.00409698486328125, 0.0053043365478515625, 0.006511688232421875, 0.0077190399169921875, 0.0089263916015625, 0.010133743286132812, 0.011341094970703125, 0.012548446655273438, 0.01375579833984375, 0.014963150024414062, 0.016170501708984375, 0.017377853393554688, 0.018585205078125, 0.019792556762695312, 0.020999908447265625, 0.022207260131835938, 0.02341461181640625, 0.024621963500976562, 0.025829315185546875, 0.027036666870117188, 0.0282440185546875, 0.029451370239257812, 0.030658721923828125, 0.03186607360839844, 0.03307342529296875, 0.03428077697753906, 0.035488128662109375, 0.03669548034667969, 0.03790283203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 13.0, 16.0, 16.0, 30.0, 53.0, 57.0, 90.0, 139.0, 241.0, 388.0, 684.0, 1309.0, 3046.0, 9108.0, 45347.0, 528133.0, 409452.0, 36764.0, 8083.0, 2733.0, 1197.0, 637.0, 363.0, 234.0, 139.0, 77.0, 55.0, 41.0, 33.0, 23.0, 14.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0216827392578125, -0.020906925201416016, -0.02013111114501953, -0.019355297088623047, -0.018579483032226562, -0.017803668975830078, -0.017027854919433594, -0.01625204086303711, -0.015476226806640625, -0.01470041275024414, -0.013924598693847656, -0.013148784637451172, -0.012372970581054688, -0.011597156524658203, -0.010821342468261719, -0.010045528411865234, -0.00926971435546875, -0.008493900299072266, -0.007718086242675781, -0.006942272186279297, -0.0061664581298828125, -0.005390644073486328, -0.004614830017089844, -0.0038390159606933594, -0.003063201904296875, -0.0022873878479003906, -0.0015115737915039062, -0.0007357597351074219, 4.00543212890625e-05, 0.0008158683776855469, 0.0015916824340820312, 0.0023674964904785156, 0.003143310546875, 0.003919124603271484, 0.004694938659667969, 0.005470752716064453, 0.0062465667724609375, 0.007022380828857422, 0.007798194885253906, 0.00857400894165039, 0.009349822998046875, 0.01012563705444336, 0.010901451110839844, 0.011677265167236328, 0.012453079223632812, 0.013228893280029297, 0.014004707336425781, 0.014780521392822266, 0.01555633544921875, 0.016332149505615234, 0.01710796356201172, 0.017883777618408203, 0.018659591674804688, 0.019435405731201172, 0.020211219787597656, 0.02098703384399414, 0.021762847900390625, 0.02253866195678711, 0.023314476013183594, 0.024090290069580078, 0.024866104125976562, 0.025641918182373047, 0.02641773223876953, 0.027193546295166016, 0.0279693603515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 15.0, 10.0, 12.0, 12.0, 22.0, 28.0, 35.0, 45.0, 71.0, 78.0, 107.0, 113.0, 106.0, 95.0, 63.0, 38.0, 32.0, 25.0, 18.0, 12.0, 7.0, 6.0, 8.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -7.059238851070404e-05, -6.852671504020691e-05, -6.646104156970978e-05, -6.439536809921265e-05, -6.232969462871552e-05, -6.0264021158218384e-05, -5.819834768772125e-05, -5.613267421722412e-05, -5.406700074672699e-05, -5.200132727622986e-05, -4.993565380573273e-05, -4.7869980335235596e-05, -4.5804306864738464e-05, -4.373863339424133e-05, -4.16729599237442e-05, -3.960728645324707e-05, -3.754161298274994e-05, -3.547593951225281e-05, -3.3410266041755676e-05, -3.1344592571258545e-05, -2.9278919100761414e-05, -2.7213245630264282e-05, -2.514757215976715e-05, -2.308189868927002e-05, -2.1016225218772888e-05, -1.8950551748275757e-05, -1.6884878277778625e-05, -1.4819204807281494e-05, -1.2753531336784363e-05, -1.0687857866287231e-05, -8.6221843957901e-06, -6.556510925292969e-06, -4.490837454795837e-06, -2.425163984298706e-06, -3.594905138015747e-07, 1.7061829566955566e-06, 3.771856427192688e-06, 5.837529897689819e-06, 7.90320336818695e-06, 9.968876838684082e-06, 1.2034550309181213e-05, 1.4100223779678345e-05, 1.6165897250175476e-05, 1.8231570720672607e-05, 2.029724419116974e-05, 2.236291766166687e-05, 2.4428591132164e-05, 2.6494264602661133e-05, 2.8559938073158264e-05, 3.0625611543655396e-05, 3.269128501415253e-05, 3.475695848464966e-05, 3.682263195514679e-05, 3.888830542564392e-05, 4.095397889614105e-05, 4.3019652366638184e-05, 4.5085325837135315e-05, 4.7150999307632446e-05, 4.921667277812958e-05, 5.128234624862671e-05, 5.334801971912384e-05, 5.541369318962097e-05, 5.74793666601181e-05, 5.9545040130615234e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 14.0, 11.0, 12.0, 29.0, 30.0, 58.0, 91.0, 174.0, 341.0, 798.0, 2575.0, 23682.0, 886254.0, 126727.0, 5463.0, 1258.0, 431.0, 218.0, 149.0, 67.0, 60.0, 28.0, 19.0, 7.0, 9.0, 9.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050323486328125, -0.048914432525634766, -0.04750537872314453, -0.0460963249206543, -0.04468727111816406, -0.04327821731567383, -0.041869163513183594, -0.04046010971069336, -0.039051055908203125, -0.03764200210571289, -0.036232948303222656, -0.03482389450073242, -0.03341484069824219, -0.03200578689575195, -0.03059673309326172, -0.029187679290771484, -0.02777862548828125, -0.026369571685791016, -0.02496051788330078, -0.023551464080810547, -0.022142410278320312, -0.020733356475830078, -0.019324302673339844, -0.01791524887084961, -0.016506195068359375, -0.01509714126586914, -0.013688087463378906, -0.012279033660888672, -0.010869979858398438, -0.009460926055908203, -0.008051872253417969, -0.006642818450927734, -0.0052337646484375, -0.0038247108459472656, -0.0024156570434570312, -0.0010066032409667969, 0.0004024505615234375, 0.0018115043640136719, 0.0032205581665039062, 0.004629611968994141, 0.006038665771484375, 0.007447719573974609, 0.008856773376464844, 0.010265827178955078, 0.011674880981445312, 0.013083934783935547, 0.014492988586425781, 0.015902042388916016, 0.01731109619140625, 0.018720149993896484, 0.02012920379638672, 0.021538257598876953, 0.022947311401367188, 0.024356365203857422, 0.025765419006347656, 0.02717447280883789, 0.028583526611328125, 0.02999258041381836, 0.031401634216308594, 0.03281068801879883, 0.03421974182128906, 0.0356287956237793, 0.03703784942626953, 0.038446903228759766, 0.03985595703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 6.0, 9.0, 10.0, 19.0, 23.0, 29.0, 41.0, 47.0, 55.0, 79.0, 72.0, 113.0, 107.0, 90.0, 70.0, 51.0, 22.0, 36.0, 26.0, 10.0, 14.0, 15.0, 17.0, 12.0, 11.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01297760009765625, -0.012528538703918457, -0.012079477310180664, -0.011630415916442871, -0.011181354522705078, -0.010732293128967285, -0.010283231735229492, -0.0098341703414917, -0.009385108947753906, -0.008936047554016113, -0.00848698616027832, -0.008037924766540527, -0.007588863372802734, -0.007139801979064941, -0.0066907405853271484, -0.0062416791915893555, -0.0057926177978515625, -0.0053435564041137695, -0.0048944950103759766, -0.004445433616638184, -0.003996372222900391, -0.0035473108291625977, -0.0030982494354248047, -0.0026491880416870117, -0.0022001266479492188, -0.0017510652542114258, -0.0013020038604736328, -0.0008529424667358398, -0.0004038810729980469, 4.5180320739746094e-05, 0.0004942417144775391, 0.000943303108215332, 0.001392364501953125, 0.001841425895690918, 0.002290487289428711, 0.002739548683166504, 0.003188610076904297, 0.00363767147064209, 0.004086732864379883, 0.004535794258117676, 0.004984855651855469, 0.005433917045593262, 0.005882978439331055, 0.006332039833068848, 0.006781101226806641, 0.007230162620544434, 0.0076792240142822266, 0.00812828540802002, 0.008577346801757812, 0.009026408195495605, 0.009475469589233398, 0.009924530982971191, 0.010373592376708984, 0.010822653770446777, 0.01127171516418457, 0.011720776557922363, 0.012169837951660156, 0.01261889934539795, 0.013067960739135742, 0.013517022132873535, 0.013966083526611328, 0.014415144920349121, 0.014864206314086914, 0.015313267707824707, 0.0157623291015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 14.0, 49.0, 158.0, 346.0, 250.0, 132.0, 31.0, 16.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32951870560646057, -0.32184770703315735, -0.3141767382621765, -0.3065057396888733, -0.29883474111557007, -0.29116377234458923, -0.283492773771286, -0.2758217751979828, -0.26815080642700195, -0.26047980785369873, -0.2528088390827179, -0.24513784050941467, -0.23746685683727264, -0.22979587316513062, -0.2221248745918274, -0.21445389091968536, -0.20678289234638214, -0.1991119086742401, -0.1914409101009369, -0.18376992642879486, -0.17609894275665283, -0.1684279441833496, -0.16075696051120758, -0.15308597683906555, -0.14541497826576233, -0.1377439945936203, -0.13007299602031708, -0.12240201234817505, -0.11473102867603302, -0.1070600375533104, -0.09938904643058777, -0.09171806275844574, -0.0840470939874649, -0.07637610286474228, -0.06870511919260025, -0.061034128069877625, -0.0533631406724453, -0.04569215327501297, -0.038021162152290344, -0.030350174754858017, -0.02267918735742569, -0.015008199028670788, -0.007337210699915886, 0.0003337785601615906, 0.008004765957593918, 0.015675753355026245, 0.02334674447774887, 0.031017731875181198, 0.038688719272613525, 0.04635970667004585, 0.05403069406747818, 0.061701685190200806, 0.06937266886234283, 0.07704365998506546, 0.08471465110778809, 0.09238563477993011, 0.10005662590265274, 0.10772761702537537, 0.1153986006975174, 0.12306959182024002, 0.13074058294296265, 0.13841156661510468, 0.1460825502872467, 0.15375354886054993, 0.16142453253269196]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 9.0, 16.0, 11.0, 18.0, 25.0, 28.0, 35.0, 48.0, 44.0, 59.0, 63.0, 65.0, 55.0, 67.0, 57.0, 57.0, 58.0, 57.0, 37.0, 36.0, 34.0, 18.0, 30.0, 25.0, 13.0, 6.0, 9.0, 3.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16439300775527954, -0.15996703505516052, -0.1555410623550415, -0.1511150747537613, -0.14668910205364227, -0.14226312935352325, -0.13783714175224304, -0.13341116905212402, -0.128985196352005, -0.12455922365188599, -0.12013324350118637, -0.11570726335048676, -0.11128129065036774, -0.10685531795024872, -0.1024293377995491, -0.09800335764884949, -0.09357738494873047, -0.08915141224861145, -0.08472543209791183, -0.08029945194721222, -0.0758734792470932, -0.07144750654697418, -0.06702152639627457, -0.06259554624557495, -0.05816957354545593, -0.053743597120046616, -0.0493176206946373, -0.04489164426922798, -0.040465667843818665, -0.03603969141840935, -0.03161371499300003, -0.027187738567590714, -0.022761762142181396, -0.01833578571677208, -0.013909809291362762, -0.009483832865953445, -0.005057856440544128, -0.0006318800151348114, 0.0037940964102745056, 0.008220072835683823, 0.01264604926109314, 0.017072025686502457, 0.021498002111911774, 0.02592397853732109, 0.030349954962730408, 0.034775931388139725, 0.03920190781354904, 0.04362788423895836, 0.048053860664367676, 0.05247983708977699, 0.05690581351518631, 0.06133178994059563, 0.06575776636600494, 0.07018373906612396, 0.07460971921682358, 0.0790356993675232, 0.08346167206764221, 0.08788764476776123, 0.09231362491846085, 0.09673960506916046, 0.10116557776927948, 0.1055915504693985, 0.11001753062009811, 0.11444351077079773, 0.11886948347091675]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 17.0, 15.0, 26.0, 30.0, 50.0, 48.0, 87.0, 152.0, 262.0, 831.0, 2281.0, 4356.0, 7403.0, 64382.0, 3981059.0, 117434.0, 9033.0, 3226.0, 1392.0, 1049.0, 424.0, 207.0, 150.0, 72.0, 57.0, 53.0, 40.0, 28.0, 26.0, 11.0, 15.0, 11.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.055850982666015625, -0.05396270751953125, -0.052074432373046875, -0.0501861572265625, -0.048297882080078125, -0.04640960693359375, -0.044521331787109375, -0.042633056640625, -0.040744781494140625, -0.03885650634765625, -0.036968231201171875, -0.0350799560546875, -0.033191680908203125, -0.03130340576171875, -0.029415130615234375, -0.02752685546875, -0.025638580322265625, -0.02375030517578125, -0.021862030029296875, -0.0199737548828125, -0.018085479736328125, -0.01619720458984375, -0.014308929443359375, -0.012420654296875, -0.010532379150390625, -0.00864410400390625, -0.006755828857421875, -0.0048675537109375, -0.002979278564453125, -0.00109100341796875, 0.000797271728515625, 0.002685546875, 0.004573822021484375, 0.00646209716796875, 0.008350372314453125, 0.0102386474609375, 0.012126922607421875, 0.01401519775390625, 0.015903472900390625, 0.017791748046875, 0.019680023193359375, 0.02156829833984375, 0.023456573486328125, 0.0253448486328125, 0.027233123779296875, 0.02912139892578125, 0.031009674072265625, 0.03289794921875, 0.034786224365234375, 0.03667449951171875, 0.038562774658203125, 0.0404510498046875, 0.042339324951171875, 0.04422760009765625, 0.046115875244140625, 0.048004150390625, 0.049892425537109375, 0.05178070068359375, 0.053668975830078125, 0.0555572509765625, 0.057445526123046875, 0.05933380126953125, 0.061222076416015625, 0.0631103515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 12.0, 99.0, 281.0, 396.0, 172.0, 30.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06506109237670898, -0.06304454803466797, -0.06102800369262695, -0.05901145935058594, -0.05699491500854492, -0.054978370666503906, -0.05296182632446289, -0.050945281982421875, -0.04892873764038086, -0.046912193298339844, -0.04489564895629883, -0.04287910461425781, -0.0408625602722168, -0.03884601593017578, -0.036829471588134766, -0.03481292724609375, -0.032796382904052734, -0.03077983856201172, -0.028763294219970703, -0.026746749877929688, -0.024730205535888672, -0.022713661193847656, -0.02069711685180664, -0.018680572509765625, -0.01666402816772461, -0.014647483825683594, -0.012630939483642578, -0.010614395141601562, -0.008597850799560547, -0.006581306457519531, -0.004564762115478516, -0.0025482177734375, -0.0005316734313964844, 0.0014848709106445312, 0.003501415252685547, 0.0055179595947265625, 0.007534503936767578, 0.009551048278808594, 0.01156759262084961, 0.013584136962890625, 0.01560068130493164, 0.017617225646972656, 0.019633769989013672, 0.021650314331054688, 0.023666858673095703, 0.02568340301513672, 0.027699947357177734, 0.02971649169921875, 0.031733036041259766, 0.03374958038330078, 0.0357661247253418, 0.03778266906738281, 0.03979921340942383, 0.041815757751464844, 0.04383230209350586, 0.045848846435546875, 0.04786539077758789, 0.049881935119628906, 0.05189847946166992, 0.05391502380371094, 0.05593156814575195, 0.05794811248779297, 0.059964656829833984, 0.061981201171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 11.0, 17.0, 13.0, 19.0, 47.0, 62.0, 80.0, 130.0, 243.0, 570.0, 2417.0, 71162.0, 4098435.0, 18316.0, 1746.0, 476.0, 217.0, 119.0, 70.0, 29.0, 27.0, 23.0, 14.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06658935546875, -0.06347370147705078, -0.06035804748535156, -0.057242393493652344, -0.054126739501953125, -0.051011085510253906, -0.04789543151855469, -0.04477977752685547, -0.04166412353515625, -0.03854846954345703, -0.03543281555175781, -0.032317161560058594, -0.029201507568359375, -0.026085853576660156, -0.022970199584960938, -0.01985454559326172, -0.0167388916015625, -0.013623237609863281, -0.010507583618164062, -0.007391929626464844, -0.004276275634765625, -0.0011606216430664062, 0.0019550323486328125, 0.005070686340332031, 0.00818634033203125, 0.011301994323730469, 0.014417648315429688, 0.017533302307128906, 0.020648956298828125, 0.023764610290527344, 0.026880264282226562, 0.02999591827392578, 0.033111572265625, 0.03622722625732422, 0.03934288024902344, 0.042458534240722656, 0.045574188232421875, 0.048689842224121094, 0.05180549621582031, 0.05492115020751953, 0.05803680419921875, 0.06115245819091797, 0.06426811218261719, 0.0673837661743164, 0.07049942016601562, 0.07361507415771484, 0.07673072814941406, 0.07984638214111328, 0.0829620361328125, 0.08607769012451172, 0.08919334411621094, 0.09230899810791016, 0.09542465209960938, 0.0985403060913086, 0.10165596008300781, 0.10477161407470703, 0.10788726806640625, 0.11100292205810547, 0.11411857604980469, 0.1172342300415039, 0.12034988403320312, 0.12346553802490234, 0.12658119201660156, 0.12969684600830078, 0.1328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 22.0, 24.0, 46.0, 82.0, 114.0, 166.0, 276.0, 508.0, 779.0, 745.0, 487.0, 243.0, 165.0, 100.0, 82.0, 67.0, 38.0, 27.0, 14.0, 16.0, 11.0, 5.0, 8.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036224365234375, -0.035361289978027344, -0.03449821472167969, -0.03363513946533203, -0.032772064208984375, -0.03190898895263672, -0.031045913696289062, -0.030182838439941406, -0.02931976318359375, -0.028456687927246094, -0.027593612670898438, -0.02673053741455078, -0.025867462158203125, -0.02500438690185547, -0.024141311645507812, -0.023278236389160156, -0.0224151611328125, -0.021552085876464844, -0.020689010620117188, -0.01982593536376953, -0.018962860107421875, -0.01809978485107422, -0.017236709594726562, -0.016373634338378906, -0.01551055908203125, -0.014647483825683594, -0.013784408569335938, -0.012921333312988281, -0.012058258056640625, -0.011195182800292969, -0.010332107543945312, -0.009469032287597656, -0.00860595703125, -0.007742881774902344, -0.0068798065185546875, -0.006016731262207031, -0.005153656005859375, -0.004290580749511719, -0.0034275054931640625, -0.0025644302368164062, -0.00170135498046875, -0.0008382797241210938, 2.47955322265625e-05, 0.0008878707885742188, 0.001750946044921875, 0.0026140213012695312, 0.0034770965576171875, 0.004340171813964844, 0.0052032470703125, 0.006066322326660156, 0.0069293975830078125, 0.007792472839355469, 0.008655548095703125, 0.009518623352050781, 0.010381698608398438, 0.011244773864746094, 0.01210784912109375, 0.012970924377441406, 0.013833999633789062, 0.014697074890136719, 0.015560150146484375, 0.01642322540283203, 0.017286300659179688, 0.018149375915527344, 0.019012451171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 35.0, 183.0, 396.0, 271.0, 82.0, 21.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3306017816066742, -0.32248300313949585, -0.3143642246723175, -0.30624544620513916, -0.2981266677379608, -0.29000788927078247, -0.2818891108036041, -0.2737703323364258, -0.26565152406692505, -0.2575327455997467, -0.24941396713256836, -0.24129518866539001, -0.23317641019821167, -0.22505763173103333, -0.2169388383626938, -0.20882005989551544, -0.2007012963294983, -0.19258251786231995, -0.1844637393951416, -0.17634496092796326, -0.1682261824607849, -0.16010740399360657, -0.15198861062526703, -0.14386983215808868, -0.13575105369091034, -0.127632275223732, -0.11951349675655365, -0.11139471083879471, -0.10327593237161636, -0.09515715390443802, -0.08703836798667908, -0.07891958951950073, -0.07080078125, -0.06268200278282166, -0.05456322059035301, -0.04644443839788437, -0.038325659930706024, -0.03020688146352768, -0.022088099271059036, -0.013969317078590393, -0.005850538611412048, 0.0022682417184114456, 0.01038702204823494, 0.018505802378058434, 0.026624582707881927, 0.03474336117506027, 0.042862143367528915, 0.05098092555999756, 0.0590997040271759, 0.06721848249435425, 0.07533726096153259, 0.08345604687929153, 0.09157482534646988, 0.09969360381364822, 0.10781238973140717, 0.11593116819858551, 0.12404994666576385, 0.1321687251329422, 0.14028750360012054, 0.1484062820672989, 0.15652507543563843, 0.16464385390281677, 0.17276263236999512, 0.18088141083717346, 0.1890001893043518]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 20.0, 20.0, 29.0, 28.0, 39.0, 46.0, 49.0, 67.0, 55.0, 58.0, 66.0, 81.0, 54.0, 70.0, 62.0, 51.0, 44.0, 38.0, 34.0, 33.0, 13.0, 14.0, 9.0, 8.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11437290906906128, -0.11101101338863373, -0.10764911770820618, -0.10428722202777863, -0.10092532634735107, -0.09756343066692352, -0.09420154243707657, -0.09083964675664902, -0.08747775107622147, -0.08411585539579391, -0.08075395971536636, -0.07739206403493881, -0.07403017580509186, -0.0706682801246643, -0.06730638444423676, -0.0639444887638092, -0.06058259308338165, -0.0572206974029541, -0.05385880172252655, -0.0504969097673893, -0.047135014086961746, -0.043773118406534195, -0.04041122645139694, -0.03704933077096939, -0.03368743509054184, -0.03032553941011429, -0.026963645592331886, -0.023601751774549484, -0.020239856094121933, -0.01687796041369438, -0.01351606659591198, -0.010154172778129578, -0.006792277097702026, -0.0034303823485970497, -6.848759949207306e-05, 0.0032934071496129036, 0.00665530189871788, 0.010017197579145432, 0.013379091396927834, 0.016740985214710236, 0.020102880895137787, 0.023464776575565338, 0.02682667039334774, 0.030188564211130142, 0.033550459891557693, 0.036912355571985245, 0.0402742475271225, 0.04363614320755005, 0.0469980388879776, 0.05035993456840515, 0.0537218302488327, 0.057083722203969955, 0.06044561788439751, 0.06380751729011536, 0.06716940551996231, 0.07053130120038986, 0.07389319688081741, 0.07725509256124496, 0.08061698824167252, 0.08397888392210007, 0.08734077215194702, 0.09070266783237457, 0.09406456351280212, 0.09742645919322968, 0.10078835487365723]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 5.0, 16.0, 24.0, 14.0, 25.0, 27.0, 37.0, 56.0, 75.0, 99.0, 106.0, 154.0, 246.0, 342.0, 455.0, 861.0, 2063.0, 11319.0, 385453.0, 625560.0, 16362.0, 2405.0, 939.0, 587.0, 319.0, 241.0, 180.0, 145.0, 105.0, 85.0, 54.0, 38.0, 36.0, 31.0, 17.0, 9.0, 11.0, 6.0, 12.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 5.0], "bins": [-0.08221435546875, -0.07993507385253906, -0.07765579223632812, -0.07537651062011719, -0.07309722900390625, -0.07081794738769531, -0.06853866577148438, -0.06625938415527344, -0.0639801025390625, -0.06170082092285156, -0.059421539306640625, -0.05714225769042969, -0.05486297607421875, -0.05258369445800781, -0.050304412841796875, -0.04802513122558594, -0.045745849609375, -0.04346656799316406, -0.041187286376953125, -0.03890800476074219, -0.03662872314453125, -0.03434944152832031, -0.032070159912109375, -0.029790878295898438, -0.0275115966796875, -0.025232315063476562, -0.022953033447265625, -0.020673751831054688, -0.01839447021484375, -0.016115188598632812, -0.013835906982421875, -0.011556625366210938, -0.00927734375, -0.0069980621337890625, -0.004718780517578125, -0.0024394989013671875, -0.00016021728515625, 0.0021190643310546875, 0.004398345947265625, 0.0066776275634765625, 0.0089569091796875, 0.011236190795898438, 0.013515472412109375, 0.015794754028320312, 0.01807403564453125, 0.020353317260742188, 0.022632598876953125, 0.024911880493164062, 0.027191162109375, 0.029470443725585938, 0.031749725341796875, 0.03402900695800781, 0.03630828857421875, 0.03858757019042969, 0.040866851806640625, 0.04314613342285156, 0.0454254150390625, 0.04770469665527344, 0.049983978271484375, 0.05226325988769531, 0.05454254150390625, 0.05682182312011719, 0.059101104736328125, 0.06138038635253906, 0.06365966796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 92.0, 277.0, 403.0, 175.0, 33.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0645751953125, -0.06263542175292969, -0.060695648193359375, -0.05875587463378906, -0.05681610107421875, -0.05487632751464844, -0.052936553955078125, -0.05099678039550781, -0.0490570068359375, -0.04711723327636719, -0.045177459716796875, -0.04323768615722656, -0.04129791259765625, -0.03935813903808594, -0.037418365478515625, -0.03547859191894531, -0.033538818359375, -0.03159904479980469, -0.029659271240234375, -0.027719497680664062, -0.02577972412109375, -0.023839950561523438, -0.021900177001953125, -0.019960403442382812, -0.0180206298828125, -0.016080856323242188, -0.014141082763671875, -0.012201309204101562, -0.01026153564453125, -0.008321762084960938, -0.006381988525390625, -0.0044422149658203125, -0.00250244140625, -0.0005626678466796875, 0.001377105712890625, 0.0033168792724609375, 0.00525665283203125, 0.0071964263916015625, 0.009136199951171875, 0.011075973510742188, 0.0130157470703125, 0.014955520629882812, 0.016895294189453125, 0.018835067749023438, 0.02077484130859375, 0.022714614868164062, 0.024654388427734375, 0.026594161987304688, 0.028533935546875, 0.030473709106445312, 0.032413482666015625, 0.03435325622558594, 0.03629302978515625, 0.03823280334472656, 0.040172576904296875, 0.04211235046386719, 0.0440521240234375, 0.04599189758300781, 0.047931671142578125, 0.04987144470214844, 0.05181121826171875, 0.05375099182128906, 0.055690765380859375, 0.05763053894042969, 0.0595703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 10.0, 16.0, 19.0, 21.0, 25.0, 29.0, 27.0, 36.0, 48.0, 43.0, 71.0, 91.0, 121.0, 227.0, 328.0, 613.0, 1336.0, 4568.0, 26274.0, 294981.0, 637482.0, 68752.0, 9067.0, 2160.0, 855.0, 450.0, 273.0, 160.0, 111.0, 79.0, 68.0, 29.0, 41.0, 28.0, 29.0, 19.0, 16.0, 23.0, 6.0, 2.0, 10.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0455322265625, -0.044161319732666016, -0.04279041290283203, -0.04141950607299805, -0.04004859924316406, -0.03867769241333008, -0.037306785583496094, -0.03593587875366211, -0.034564971923828125, -0.03319406509399414, -0.031823158264160156, -0.030452251434326172, -0.029081344604492188, -0.027710437774658203, -0.02633953094482422, -0.024968624114990234, -0.02359771728515625, -0.022226810455322266, -0.02085590362548828, -0.019484996795654297, -0.018114089965820312, -0.016743183135986328, -0.015372276306152344, -0.01400136947631836, -0.012630462646484375, -0.01125955581665039, -0.009888648986816406, -0.008517742156982422, -0.0071468353271484375, -0.005775928497314453, -0.004405021667480469, -0.0030341148376464844, -0.0016632080078125, -0.0002923011779785156, 0.0010786056518554688, 0.002449512481689453, 0.0038204193115234375, 0.005191326141357422, 0.006562232971191406, 0.00793313980102539, 0.009304046630859375, 0.01067495346069336, 0.012045860290527344, 0.013416767120361328, 0.014787673950195312, 0.016158580780029297, 0.01752948760986328, 0.018900394439697266, 0.02027130126953125, 0.021642208099365234, 0.02301311492919922, 0.024384021759033203, 0.025754928588867188, 0.027125835418701172, 0.028496742248535156, 0.02986764907836914, 0.031238555908203125, 0.03260946273803711, 0.033980369567871094, 0.03535127639770508, 0.03672218322753906, 0.03809309005737305, 0.03946399688720703, 0.040834903717041016, 0.042205810546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 7.0, 9.0, 14.0, 12.0, 7.0, 25.0, 24.0, 24.0, 28.0, 30.0, 36.0, 33.0, 41.0, 40.0, 43.0, 32.0, 50.0, 33.0, 43.0, 40.0, 33.0, 38.0, 26.0, 30.0, 43.0, 29.0, 25.0, 27.0, 18.0, 16.0, 19.0, 19.0, 10.0, 10.0, 15.0, 11.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0254974365234375, -0.02466559410095215, -0.023833751678466797, -0.023001909255981445, -0.022170066833496094, -0.021338224411010742, -0.02050638198852539, -0.01967453956604004, -0.018842697143554688, -0.018010854721069336, -0.017179012298583984, -0.016347169876098633, -0.015515327453613281, -0.01468348503112793, -0.013851642608642578, -0.013019800186157227, -0.012187957763671875, -0.011356115341186523, -0.010524272918701172, -0.00969243049621582, -0.008860588073730469, -0.008028745651245117, -0.007196903228759766, -0.006365060806274414, -0.0055332183837890625, -0.004701375961303711, -0.0038695335388183594, -0.003037691116333008, -0.0022058486938476562, -0.0013740062713623047, -0.0005421638488769531, 0.00028967857360839844, 0.00112152099609375, 0.0019533634185791016, 0.002785205841064453, 0.0036170482635498047, 0.004448890686035156, 0.005280733108520508, 0.006112575531005859, 0.006944417953491211, 0.0077762603759765625, 0.008608102798461914, 0.009439945220947266, 0.010271787643432617, 0.011103630065917969, 0.01193547248840332, 0.012767314910888672, 0.013599157333374023, 0.014430999755859375, 0.015262842178344727, 0.016094684600830078, 0.01692652702331543, 0.01775836944580078, 0.018590211868286133, 0.019422054290771484, 0.020253896713256836, 0.021085739135742188, 0.02191758155822754, 0.02274942398071289, 0.023581266403198242, 0.024413108825683594, 0.025244951248168945, 0.026076793670654297, 0.02690863609313965, 0.027740478515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 7.0, 9.0, 14.0, 13.0, 19.0, 30.0, 50.0, 62.0, 94.0, 173.0, 236.0, 288.0, 458.0, 723.0, 1119.0, 1737.0, 3087.0, 6507.0, 17019.0, 88354.0, 752327.0, 138333.0, 21427.0, 7471.0, 3592.0, 1973.0, 1119.0, 728.0, 508.0, 333.0, 218.0, 164.0, 97.0, 87.0, 58.0, 34.0, 23.0, 19.0, 14.0, 10.0, 9.0, 8.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019012451171875, -0.01836991310119629, -0.017727375030517578, -0.017084836959838867, -0.016442298889160156, -0.015799760818481445, -0.015157222747802734, -0.014514684677124023, -0.013872146606445312, -0.013229608535766602, -0.01258707046508789, -0.01194453239440918, -0.011301994323730469, -0.010659456253051758, -0.010016918182373047, -0.009374380111694336, -0.008731842041015625, -0.008089303970336914, -0.007446765899658203, -0.006804227828979492, -0.006161689758300781, -0.00551915168762207, -0.004876613616943359, -0.0042340755462646484, -0.0035915374755859375, -0.0029489994049072266, -0.0023064613342285156, -0.0016639232635498047, -0.0010213851928710938, -0.0003788471221923828, 0.0002636909484863281, 0.0009062290191650391, 0.00154876708984375, 0.002191305160522461, 0.002833843231201172, 0.003476381301879883, 0.004118919372558594, 0.004761457443237305, 0.005403995513916016, 0.0060465335845947266, 0.0066890716552734375, 0.0073316097259521484, 0.00797414779663086, 0.00861668586730957, 0.009259223937988281, 0.009901762008666992, 0.010544300079345703, 0.011186838150024414, 0.011829376220703125, 0.012471914291381836, 0.013114452362060547, 0.013756990432739258, 0.014399528503417969, 0.01504206657409668, 0.01568460464477539, 0.0163271427154541, 0.016969680786132812, 0.017612218856811523, 0.018254756927490234, 0.018897294998168945, 0.019539833068847656, 0.020182371139526367, 0.020824909210205078, 0.02146744728088379, 0.0221099853515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 7.0, 9.0, 19.0, 17.0, 18.0, 23.0, 29.0, 29.0, 66.0, 60.0, 138.0, 154.0, 107.0, 74.0, 56.0, 31.0, 23.0, 18.0, 16.0, 14.0, 15.0, 9.0, 9.0, 5.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.395578384399414e-05, -6.152968853712082e-05, -5.91035932302475e-05, -5.6677497923374176e-05, -5.4251402616500854e-05, -5.182530730962753e-05, -4.939921200275421e-05, -4.697311669588089e-05, -4.454702138900757e-05, -4.212092608213425e-05, -3.9694830775260925e-05, -3.7268735468387604e-05, -3.484264016151428e-05, -3.241654485464096e-05, -2.999044954776764e-05, -2.7564354240894318e-05, -2.5138258934020996e-05, -2.2712163627147675e-05, -2.0286068320274353e-05, -1.785997301340103e-05, -1.543387770652771e-05, -1.3007782399654388e-05, -1.0581687092781067e-05, -8.155591785907745e-06, -5.729496479034424e-06, -3.3034011721611023e-06, -8.773058652877808e-07, 1.5487894415855408e-06, 3.974884748458862e-06, 6.400980055332184e-06, 8.827075362205505e-06, 1.1253170669078827e-05, 1.3679265975952148e-05, 1.610536128282547e-05, 1.853145658969879e-05, 2.0957551896572113e-05, 2.3383647203445435e-05, 2.5809742510318756e-05, 2.8235837817192078e-05, 3.06619331240654e-05, 3.308802843093872e-05, 3.551412373781204e-05, 3.7940219044685364e-05, 4.0366314351558685e-05, 4.279240965843201e-05, 4.521850496530533e-05, 4.764460027217865e-05, 5.007069557905197e-05, 5.249679088592529e-05, 5.4922886192798615e-05, 5.7348981499671936e-05, 5.977507680654526e-05, 6.220117211341858e-05, 6.46272674202919e-05, 6.705336272716522e-05, 6.947945803403854e-05, 7.190555334091187e-05, 7.433164864778519e-05, 7.675774395465851e-05, 7.918383926153183e-05, 8.160993456840515e-05, 8.403602987527847e-05, 8.64621251821518e-05, 8.888822048902512e-05, 9.131431579589844e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 11.0, 25.0, 27.0, 26.0, 58.0, 79.0, 147.0, 238.0, 473.0, 961.0, 2164.0, 5702.0, 22963.0, 236618.0, 707359.0, 55458.0, 10180.0, 3337.0, 1326.0, 578.0, 329.0, 166.0, 110.0, 60.0, 39.0, 21.0, 19.0, 12.0, 8.0, 10.0, 3.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.018902063369750977, -0.018181324005126953, -0.01746058464050293, -0.016739845275878906, -0.016019105911254883, -0.01529836654663086, -0.014577627182006836, -0.013856887817382812, -0.013136148452758789, -0.012415409088134766, -0.011694669723510742, -0.010973930358886719, -0.010253190994262695, -0.009532451629638672, -0.008811712265014648, -0.008090972900390625, -0.0073702335357666016, -0.006649494171142578, -0.005928754806518555, -0.005208015441894531, -0.004487276077270508, -0.0037665367126464844, -0.003045797348022461, -0.0023250579833984375, -0.001604318618774414, -0.0008835792541503906, -0.0001628398895263672, 0.0005578994750976562, 0.0012786388397216797, 0.001999378204345703, 0.0027201175689697266, 0.00344085693359375, 0.0041615962982177734, 0.004882335662841797, 0.00560307502746582, 0.006323814392089844, 0.007044553756713867, 0.007765293121337891, 0.008486032485961914, 0.009206771850585938, 0.009927511215209961, 0.010648250579833984, 0.011368989944458008, 0.012089729309082031, 0.012810468673706055, 0.013531208038330078, 0.014251947402954102, 0.014972686767578125, 0.01569342613220215, 0.016414165496826172, 0.017134904861450195, 0.01785564422607422, 0.018576383590698242, 0.019297122955322266, 0.02001786231994629, 0.020738601684570312, 0.021459341049194336, 0.02218008041381836, 0.022900819778442383, 0.023621559143066406, 0.02434229850769043, 0.025063037872314453, 0.025783777236938477, 0.0265045166015625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 8.0, 9.0, 7.0, 27.0, 26.0, 40.0, 68.0, 118.0, 157.0, 169.0, 103.0, 93.0, 53.0, 38.0, 18.0, 16.0, 11.0, 3.0, 10.0, 6.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0193328857421875, -0.018838882446289062, -0.018344879150390625, -0.017850875854492188, -0.01735687255859375, -0.016862869262695312, -0.016368865966796875, -0.015874862670898438, -0.015380859375, -0.014886856079101562, -0.014392852783203125, -0.013898849487304688, -0.01340484619140625, -0.012910842895507812, -0.012416839599609375, -0.011922836303710938, -0.0114288330078125, -0.010934829711914062, -0.010440826416015625, -0.009946823120117188, -0.00945281982421875, -0.008958816528320312, -0.008464813232421875, -0.007970809936523438, -0.007476806640625, -0.0069828033447265625, -0.006488800048828125, -0.0059947967529296875, -0.00550079345703125, -0.0050067901611328125, -0.004512786865234375, -0.0040187835693359375, -0.0035247802734375, -0.0030307769775390625, -0.002536773681640625, -0.0020427703857421875, -0.00154876708984375, -0.0010547637939453125, -0.000560760498046875, -6.67572021484375e-05, 0.00042724609375, 0.0009212493896484375, 0.001415252685546875, 0.0019092559814453125, 0.00240325927734375, 0.0028972625732421875, 0.003391265869140625, 0.0038852691650390625, 0.0043792724609375, 0.0048732757568359375, 0.005367279052734375, 0.0058612823486328125, 0.00635528564453125, 0.0068492889404296875, 0.007343292236328125, 0.007837295532226562, 0.008331298828125, 0.008825302124023438, 0.009319305419921875, 0.009813308715820312, 0.01030731201171875, 0.010801315307617188, 0.011295318603515625, 0.011789321899414062, 0.0122833251953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 18.0, 303.0, 621.0, 55.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7951155304908752, -0.7753276228904724, -0.7555397152900696, -0.735751748085022, -0.7159638404846191, -0.6961759328842163, -0.6763880252838135, -0.6566001176834106, -0.636812150478363, -0.6170242428779602, -0.5972363352775574, -0.5774483680725098, -0.5576604604721069, -0.5378725528717041, -0.5180846452713013, -0.49829670786857605, -0.4785088002681732, -0.4587208926677704, -0.43893295526504517, -0.41914504766464233, -0.3993571102619171, -0.3795692026615143, -0.35978126525878906, -0.33999335765838623, -0.3202054500579834, -0.30041754245758057, -0.28062960505485535, -0.2608416974544525, -0.2410537600517273, -0.22126585245132446, -0.20147792994976044, -0.1816900074481964, -0.1619020402431488, -0.14211411774158478, -0.12232619524002075, -0.10253828018903732, -0.0827503576874733, -0.06296243518590927, -0.04317452013492584, -0.023386597633361816, -0.0035986751317977905, 0.016189245507121086, 0.03597716614603996, 0.05576508492231369, 0.07555300742387772, 0.09534092992544174, 0.11512884497642517, 0.1349167674779892, 0.15470468997955322, 0.17449261248111725, 0.19428053498268127, 0.2140684425830841, 0.23385637998580933, 0.25364428758621216, 0.273432195186615, 0.2932201325893402, 0.31300806999206543, 0.33279597759246826, 0.3525839149951935, 0.3723718225955963, 0.39215975999832153, 0.41194766759872437, 0.4317355751991272, 0.4515235126018524, 0.47131142020225525]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 5.0, 10.0, 6.0, 15.0, 17.0, 26.0, 19.0, 35.0, 31.0, 38.0, 56.0, 44.0, 46.0, 55.0, 80.0, 67.0, 69.0, 54.0, 51.0, 46.0, 47.0, 32.0, 39.0, 22.0, 32.0, 22.0, 12.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.16861772537231445, -0.16424690186977386, -0.15987607836723328, -0.1555052548646927, -0.1511344313621521, -0.1467636078596115, -0.14239278435707092, -0.13802196085453033, -0.13365113735198975, -0.12928031384944916, -0.12490949034690857, -0.12053866684436798, -0.11616784334182739, -0.1117970198392868, -0.10742619633674622, -0.10305537283420563, -0.09868454933166504, -0.09431372582912445, -0.08994290232658386, -0.08557207882404327, -0.08120125532150269, -0.0768304318189621, -0.07245960831642151, -0.06808878481388092, -0.06371796131134033, -0.059347137808799744, -0.054976314306259155, -0.05060549080371857, -0.04623466730117798, -0.04186384379863739, -0.0374930202960968, -0.03312219679355621, -0.028751373291015625, -0.024380549788475037, -0.020009726285934448, -0.01563890278339386, -0.011268079280853271, -0.006897255778312683, -0.0025264322757720947, 0.0018443912267684937, 0.006215214729309082, 0.01058603823184967, 0.014956861734390259, 0.019327685236930847, 0.023698508739471436, 0.028069332242012024, 0.03244015574455261, 0.0368109792470932, 0.04118180274963379, 0.04555262625217438, 0.049923449754714966, 0.054294273257255554, 0.05866509675979614, 0.06303592026233673, 0.06740674376487732, 0.07177756726741791, 0.0761483907699585, 0.08051921427249908, 0.08489003777503967, 0.08926086127758026, 0.09363168478012085, 0.09800250828266144, 0.10237333178520203, 0.10674415528774261, 0.1111149787902832]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 13.0, 11.0, 28.0, 54.0, 100.0, 150.0, 470.0, 2084.0, 5914.0, 20152.0, 3985124.0, 168290.0, 8094.0, 1905.0, 1134.0, 312.0, 171.0, 88.0, 65.0, 38.0, 25.0, 15.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08563232421875, -0.08301639556884766, -0.08040046691894531, -0.07778453826904297, -0.07516860961914062, -0.07255268096923828, -0.06993675231933594, -0.0673208236694336, -0.06470489501953125, -0.062088966369628906, -0.05947303771972656, -0.05685710906982422, -0.054241180419921875, -0.05162525177001953, -0.04900932312011719, -0.046393394470214844, -0.0437774658203125, -0.041161537170410156, -0.03854560852050781, -0.03592967987060547, -0.033313751220703125, -0.03069782257080078, -0.028081893920898438, -0.025465965270996094, -0.02285003662109375, -0.020234107971191406, -0.017618179321289062, -0.015002250671386719, -0.012386322021484375, -0.009770393371582031, -0.0071544647216796875, -0.004538536071777344, -0.001922607421875, 0.0006933212280273438, 0.0033092498779296875, 0.005925178527832031, 0.008541107177734375, 0.011157035827636719, 0.013772964477539062, 0.016388893127441406, 0.01900482177734375, 0.021620750427246094, 0.024236679077148438, 0.02685260772705078, 0.029468536376953125, 0.03208446502685547, 0.03470039367675781, 0.037316322326660156, 0.0399322509765625, 0.042548179626464844, 0.04516410827636719, 0.04778003692626953, 0.050395965576171875, 0.05301189422607422, 0.05562782287597656, 0.058243751525878906, 0.06085968017578125, 0.0634756088256836, 0.06609153747558594, 0.06870746612548828, 0.07132339477539062, 0.07393932342529297, 0.07655525207519531, 0.07917118072509766, 0.081787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 12.0, 83.0, 283.0, 387.0, 195.0, 27.0, 11.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.06530046463012695, -0.0632791519165039, -0.06125783920288086, -0.05923652648925781, -0.057215213775634766, -0.05519390106201172, -0.05317258834838867, -0.051151275634765625, -0.04912996292114258, -0.04710865020751953, -0.045087337493896484, -0.04306602478027344, -0.04104471206665039, -0.039023399353027344, -0.0370020866394043, -0.03498077392578125, -0.0329594612121582, -0.030938148498535156, -0.02891683578491211, -0.026895523071289062, -0.024874210357666016, -0.02285289764404297, -0.020831584930419922, -0.018810272216796875, -0.016788959503173828, -0.014767646789550781, -0.012746334075927734, -0.010725021362304688, -0.00870370864868164, -0.006682395935058594, -0.004661083221435547, -0.0026397705078125, -0.0006184577941894531, 0.0014028549194335938, 0.0034241676330566406, 0.0054454803466796875, 0.007466793060302734, 0.009488105773925781, 0.011509418487548828, 0.013530731201171875, 0.015552043914794922, 0.01757335662841797, 0.019594669342041016, 0.021615982055664062, 0.02363729476928711, 0.025658607482910156, 0.027679920196533203, 0.02970123291015625, 0.0317225456237793, 0.033743858337402344, 0.03576517105102539, 0.03778648376464844, 0.039807796478271484, 0.04182910919189453, 0.04385042190551758, 0.045871734619140625, 0.04789304733276367, 0.04991436004638672, 0.051935672760009766, 0.05395698547363281, 0.05597829818725586, 0.057999610900878906, 0.06002092361450195, 0.062042236328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 11.0, 21.0, 14.0, 29.0, 52.0, 104.0, 233.0, 771.0, 9480.0, 4152151.0, 29621.0, 1286.0, 272.0, 111.0, 51.0, 22.0, 16.0, 9.0, 11.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11166858673095703, -0.10730934143066406, -0.1029500961303711, -0.09859085083007812, -0.09423160552978516, -0.08987236022949219, -0.08551311492919922, -0.08115386962890625, -0.07679462432861328, -0.07243537902832031, -0.06807613372802734, -0.06371688842773438, -0.059357643127441406, -0.05499839782714844, -0.05063915252685547, -0.0462799072265625, -0.04192066192626953, -0.03756141662597656, -0.033202171325683594, -0.028842926025390625, -0.024483680725097656, -0.020124435424804688, -0.01576519012451172, -0.01140594482421875, -0.007046699523925781, -0.0026874542236328125, 0.0016717910766601562, 0.006031036376953125, 0.010390281677246094, 0.014749526977539062, 0.01910877227783203, 0.023468017578125, 0.02782726287841797, 0.03218650817871094, 0.036545753479003906, 0.040904998779296875, 0.045264244079589844, 0.04962348937988281, 0.05398273468017578, 0.05834197998046875, 0.06270122528076172, 0.06706047058105469, 0.07141971588134766, 0.07577896118164062, 0.0801382064819336, 0.08449745178222656, 0.08885669708251953, 0.0932159423828125, 0.09757518768310547, 0.10193443298339844, 0.1062936782836914, 0.11065292358398438, 0.11501216888427734, 0.11937141418457031, 0.12373065948486328, 0.12808990478515625, 0.13244915008544922, 0.1368083953857422, 0.14116764068603516, 0.14552688598632812, 0.1498861312866211, 0.15424537658691406, 0.15860462188720703, 0.1629638671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 2.0, 9.0, 19.0, 28.0, 46.0, 107.0, 182.0, 453.0, 1002.0, 1158.0, 500.0, 240.0, 129.0, 72.0, 49.0, 23.0, 20.0, 11.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045379638671875, -0.04418826103210449, -0.042996883392333984, -0.04180550575256348, -0.04061412811279297, -0.03942275047302246, -0.03823137283325195, -0.037039995193481445, -0.03584861755371094, -0.03465723991394043, -0.03346586227416992, -0.032274484634399414, -0.031083106994628906, -0.0298917293548584, -0.02870035171508789, -0.027508974075317383, -0.026317596435546875, -0.025126218795776367, -0.02393484115600586, -0.02274346351623535, -0.021552085876464844, -0.020360708236694336, -0.019169330596923828, -0.01797795295715332, -0.016786575317382812, -0.015595197677612305, -0.014403820037841797, -0.013212442398071289, -0.012021064758300781, -0.010829687118530273, -0.009638309478759766, -0.008446931838989258, -0.00725555419921875, -0.006064176559448242, -0.004872798919677734, -0.0036814212799072266, -0.0024900436401367188, -0.001298666000366211, -0.00010728836059570312, 0.0010840892791748047, 0.0022754669189453125, 0.0034668445587158203, 0.004658222198486328, 0.005849599838256836, 0.007040977478027344, 0.008232355117797852, 0.00942373275756836, 0.010615110397338867, 0.011806488037109375, 0.012997865676879883, 0.01418924331665039, 0.015380620956420898, 0.016571998596191406, 0.017763376235961914, 0.018954753875732422, 0.02014613151550293, 0.021337509155273438, 0.022528886795043945, 0.023720264434814453, 0.02491164207458496, 0.02610301971435547, 0.027294397354125977, 0.028485774993896484, 0.029677152633666992, 0.0308685302734375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 73.0, 430.0, 402.0, 71.0, 16.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5248697400093079, -0.5129035115242004, -0.5009373426437378, -0.48897111415863037, -0.47700491547584534, -0.4650387167930603, -0.4530724883079529, -0.44110628962516785, -0.4291400909423828, -0.4171738922595978, -0.40520766377449036, -0.3932414650917053, -0.3812752664089203, -0.36930906772613525, -0.35734283924102783, -0.3453766405582428, -0.3334104120731354, -0.32144421339035034, -0.3094779849052429, -0.2975117862224579, -0.28554558753967285, -0.27357935905456543, -0.2616131603717804, -0.24964696168899536, -0.23768074810504913, -0.2257145345211029, -0.21374833583831787, -0.20178212225437164, -0.18981590867042542, -0.17784970998764038, -0.16588349640369415, -0.15391728281974792, -0.14195111393928528, -0.12998490035533905, -0.11801870167255402, -0.10605248808860779, -0.09408628195524216, -0.08212007582187653, -0.0701538622379303, -0.05818765610456467, -0.046221449971199036, -0.034255243837833405, -0.022289033979177475, -0.010322824120521545, 0.0016433820128440857, 0.013609588146209717, 0.025575801730155945, 0.037542007863521576, 0.04950821399688721, 0.06147442013025284, 0.07344062626361847, 0.0854068398475647, 0.09737304598093033, 0.10933925211429596, 0.12130546569824219, 0.13327166438102722, 0.14523787796497345, 0.15720409154891968, 0.1691702902317047, 0.18113650381565094, 0.19310271739959717, 0.2050689160823822, 0.21703512966632843, 0.22900134325027466, 0.2409675419330597]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 8.0, 8.0, 17.0, 29.0, 22.0, 19.0, 29.0, 40.0, 32.0, 45.0, 23.0, 37.0, 41.0, 37.0, 40.0, 47.0, 45.0, 40.0, 39.0, 37.0, 48.0, 45.0, 34.0, 21.0, 33.0, 27.0, 21.0, 24.0, 17.0, 13.0, 11.0, 9.0, 11.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07431608438491821, -0.0722103863954544, -0.0701046958565712, -0.06799899786710739, -0.06589330732822418, -0.06378760933876038, -0.06168191134929657, -0.05957621708512306, -0.057470522820949554, -0.05536482855677605, -0.05325913429260254, -0.05115343630313873, -0.049047742038965225, -0.04694204777479172, -0.04483634978532791, -0.042730655521154404, -0.040624961256980896, -0.03851926699280739, -0.03641357272863388, -0.034307874739170074, -0.03220218047499657, -0.03009648621082306, -0.027990790084004402, -0.025885093957185745, -0.023779399693012238, -0.02167370542883873, -0.019568009302020073, -0.017462313175201416, -0.015356618911027908, -0.013250923715531826, -0.011145228520035744, -0.009039533324539661, -0.006933838129043579, -0.004828142933547497, -0.0027224477380514145, -0.0006167525425553322, 0.0014889426529407501, 0.0035946378484368324, 0.005700333043932915, 0.007806028239428997, 0.00991172343492508, 0.012017418630421162, 0.014123113825917244, 0.0162288099527359, 0.01833450421690941, 0.020440198481082916, 0.022545894607901573, 0.02465159073472023, 0.026757284998893738, 0.028862979263067245, 0.030968675389885902, 0.03307437151670456, 0.03518006578087807, 0.037285760045051575, 0.03939145803451538, 0.04149715229868889, 0.043602846562862396, 0.045708540827035904, 0.04781423509120941, 0.04991993308067322, 0.052025627344846725, 0.05413132160902023, 0.05623701959848404, 0.05834271386265755, 0.060448408126831055]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 7.0, 8.0, 9.0, 16.0, 18.0, 23.0, 34.0, 45.0, 59.0, 71.0, 104.0, 155.0, 215.0, 321.0, 550.0, 955.0, 2365.0, 17855.0, 763281.0, 251188.0, 7543.0, 1560.0, 787.0, 455.0, 291.0, 171.0, 127.0, 99.0, 64.0, 57.0, 39.0, 16.0, 17.0, 15.0, 10.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0982666015625, -0.09485816955566406, -0.09144973754882812, -0.08804130554199219, -0.08463287353515625, -0.08122444152832031, -0.07781600952148438, -0.07440757751464844, -0.0709991455078125, -0.06759071350097656, -0.06418228149414062, -0.06077384948730469, -0.05736541748046875, -0.05395698547363281, -0.050548553466796875, -0.04714012145996094, -0.043731689453125, -0.04032325744628906, -0.036914825439453125, -0.03350639343261719, -0.03009796142578125, -0.026689529418945312, -0.023281097412109375, -0.019872665405273438, -0.0164642333984375, -0.013055801391601562, -0.009647369384765625, -0.0062389373779296875, -0.00283050537109375, 0.0005779266357421875, 0.003986358642578125, 0.0073947906494140625, 0.01080322265625, 0.014211654663085938, 0.017620086669921875, 0.021028518676757812, 0.02443695068359375, 0.027845382690429688, 0.031253814697265625, 0.03466224670410156, 0.0380706787109375, 0.04147911071777344, 0.044887542724609375, 0.04829597473144531, 0.05170440673828125, 0.05511283874511719, 0.058521270751953125, 0.06192970275878906, 0.065338134765625, 0.06874656677246094, 0.07215499877929688, 0.07556343078613281, 0.07897186279296875, 0.08238029479980469, 0.08578872680664062, 0.08919715881347656, 0.0926055908203125, 0.09601402282714844, 0.09942245483398438, 0.10283088684082031, 0.10623931884765625, 0.10964775085449219, 0.11305618286132812, 0.11646461486816406, 0.119873046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 67.0, 249.0, 407.0, 222.0, 31.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.0642404556274414, -0.06225776672363281, -0.06027507781982422, -0.058292388916015625, -0.05630970001220703, -0.05432701110839844, -0.052344322204589844, -0.05036163330078125, -0.048378944396972656, -0.04639625549316406, -0.04441356658935547, -0.042430877685546875, -0.04044818878173828, -0.03846549987792969, -0.036482810974121094, -0.0345001220703125, -0.032517433166503906, -0.030534744262695312, -0.02855205535888672, -0.026569366455078125, -0.02458667755126953, -0.022603988647460938, -0.020621299743652344, -0.01863861083984375, -0.016655921936035156, -0.014673233032226562, -0.012690544128417969, -0.010707855224609375, -0.008725166320800781, -0.0067424774169921875, -0.004759788513183594, -0.002777099609375, -0.0007944107055664062, 0.0011882781982421875, 0.0031709671020507812, 0.005153656005859375, 0.007136344909667969, 0.009119033813476562, 0.011101722717285156, 0.01308441162109375, 0.015067100524902344, 0.017049789428710938, 0.01903247833251953, 0.021015167236328125, 0.02299785614013672, 0.024980545043945312, 0.026963233947753906, 0.0289459228515625, 0.030928611755371094, 0.03291130065917969, 0.03489398956298828, 0.036876678466796875, 0.03885936737060547, 0.04084205627441406, 0.042824745178222656, 0.04480743408203125, 0.046790122985839844, 0.04877281188964844, 0.05075550079345703, 0.052738189697265625, 0.05472087860107422, 0.05670356750488281, 0.058686256408691406, 0.0606689453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 10.0, 10.0, 9.0, 22.0, 31.0, 36.0, 42.0, 102.0, 152.0, 230.0, 392.0, 769.0, 1880.0, 11754.0, 458502.0, 556445.0, 14299.0, 2026.0, 771.0, 420.0, 199.0, 150.0, 103.0, 60.0, 33.0, 28.0, 22.0, 9.0, 17.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07078075408935547, -0.06795310974121094, -0.0651254653930664, -0.062297821044921875, -0.059470176696777344, -0.05664253234863281, -0.05381488800048828, -0.05098724365234375, -0.04815959930419922, -0.04533195495605469, -0.042504310607910156, -0.039676666259765625, -0.036849021911621094, -0.03402137756347656, -0.03119373321533203, -0.0283660888671875, -0.02553844451904297, -0.022710800170898438, -0.019883155822753906, -0.017055511474609375, -0.014227867126464844, -0.011400222778320312, -0.008572578430175781, -0.00574493408203125, -0.0029172897338867188, -8.96453857421875e-05, 0.0027379989624023438, 0.005565643310546875, 0.008393287658691406, 0.011220932006835938, 0.014048576354980469, 0.016876220703125, 0.01970386505126953, 0.022531509399414062, 0.025359153747558594, 0.028186798095703125, 0.031014442443847656, 0.03384208679199219, 0.03666973114013672, 0.03949737548828125, 0.04232501983642578, 0.04515266418457031, 0.047980308532714844, 0.050807952880859375, 0.053635597229003906, 0.05646324157714844, 0.05929088592529297, 0.0621185302734375, 0.06494617462158203, 0.06777381896972656, 0.0706014633178711, 0.07342910766601562, 0.07625675201416016, 0.07908439636230469, 0.08191204071044922, 0.08473968505859375, 0.08756732940673828, 0.09039497375488281, 0.09322261810302734, 0.09605026245117188, 0.0988779067993164, 0.10170555114746094, 0.10453319549560547, 0.10736083984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 3.0, 14.0, 12.0, 12.0, 18.0, 16.0, 23.0, 32.0, 36.0, 46.0, 40.0, 47.0, 44.0, 53.0, 59.0, 49.0, 54.0, 54.0, 50.0, 57.0, 54.0, 35.0, 40.0, 33.0, 22.0, 17.0, 21.0, 9.0, 14.0, 5.0, 5.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.04265475273132324, -0.041486263275146484, -0.04031777381896973, -0.03914928436279297, -0.03798079490661621, -0.03681230545043945, -0.035643815994262695, -0.03447532653808594, -0.03330683708190918, -0.03213834762573242, -0.030969858169555664, -0.029801368713378906, -0.02863287925720215, -0.02746438980102539, -0.026295900344848633, -0.025127410888671875, -0.023958921432495117, -0.02279043197631836, -0.0216219425201416, -0.020453453063964844, -0.019284963607788086, -0.018116474151611328, -0.01694798469543457, -0.015779495239257812, -0.014611005783081055, -0.013442516326904297, -0.012274026870727539, -0.011105537414550781, -0.009937047958374023, -0.008768558502197266, -0.007600069046020508, -0.00643157958984375, -0.005263090133666992, -0.004094600677490234, -0.0029261112213134766, -0.0017576217651367188, -0.0005891323089599609, 0.0005793571472167969, 0.0017478466033935547, 0.0029163360595703125, 0.00408482551574707, 0.005253314971923828, 0.006421804428100586, 0.007590293884277344, 0.008758783340454102, 0.00992727279663086, 0.011095762252807617, 0.012264251708984375, 0.013432741165161133, 0.01460123062133789, 0.01576972007751465, 0.016938209533691406, 0.018106698989868164, 0.019275188446044922, 0.02044367790222168, 0.021612167358398438, 0.022780656814575195, 0.023949146270751953, 0.02511763572692871, 0.02628612518310547, 0.027454614639282227, 0.028623104095458984, 0.029791593551635742, 0.0309600830078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 16.0, 19.0, 18.0, 34.0, 61.0, 70.0, 105.0, 157.0, 262.0, 491.0, 1066.0, 2303.0, 6208.0, 21194.0, 114599.0, 693563.0, 167753.0, 27657.0, 7586.0, 2747.0, 1235.0, 573.0, 301.0, 183.0, 119.0, 61.0, 46.0, 32.0, 20.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0293426513671875, -0.02849435806274414, -0.02764606475830078, -0.026797771453857422, -0.025949478149414062, -0.025101184844970703, -0.024252891540527344, -0.023404598236083984, -0.022556304931640625, -0.021708011627197266, -0.020859718322753906, -0.020011425018310547, -0.019163131713867188, -0.018314838409423828, -0.01746654510498047, -0.01661825180053711, -0.01576995849609375, -0.01492166519165039, -0.014073371887207031, -0.013225078582763672, -0.012376785278320312, -0.011528491973876953, -0.010680198669433594, -0.009831905364990234, -0.008983612060546875, -0.008135318756103516, -0.007287025451660156, -0.006438732147216797, -0.0055904388427734375, -0.004742145538330078, -0.0038938522338867188, -0.0030455589294433594, -0.002197265625, -0.0013489723205566406, -0.0005006790161132812, 0.0003476142883300781, 0.0011959075927734375, 0.002044200897216797, 0.0028924942016601562, 0.0037407875061035156, 0.004589080810546875, 0.005437374114990234, 0.006285667419433594, 0.007133960723876953, 0.007982254028320312, 0.008830547332763672, 0.009678840637207031, 0.01052713394165039, 0.01137542724609375, 0.01222372055053711, 0.013072013854980469, 0.013920307159423828, 0.014768600463867188, 0.015616893768310547, 0.016465187072753906, 0.017313480377197266, 0.018161773681640625, 0.019010066986083984, 0.019858360290527344, 0.020706653594970703, 0.021554946899414062, 0.022403240203857422, 0.02325153350830078, 0.02409982681274414, 0.0249481201171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 19.0, 12.0, 26.0, 39.0, 52.0, 89.0, 157.0, 214.0, 128.0, 76.0, 44.0, 36.0, 27.0, 10.0, 9.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016164779663085938, -0.0001577325165271759, -0.00015381723642349243, -0.00014990195631980896, -0.0001459866762161255, -0.00014207139611244202, -0.00013815611600875854, -0.00013424083590507507, -0.0001303255558013916, -0.00012641027569770813, -0.00012249499559402466, -0.00011857971549034119, -0.00011466443538665771, -0.00011074915528297424, -0.00010683387517929077, -0.0001029185950756073, -9.900331497192383e-05, -9.508803486824036e-05, -9.117275476455688e-05, -8.725747466087341e-05, -8.334219455718994e-05, -7.942691445350647e-05, -7.5511634349823e-05, -7.159635424613953e-05, -6.768107414245605e-05, -6.376579403877258e-05, -5.985051393508911e-05, -5.593523383140564e-05, -5.201995372772217e-05, -4.8104673624038696e-05, -4.4189393520355225e-05, -4.027411341667175e-05, -3.635883331298828e-05, -3.244355320930481e-05, -2.8528273105621338e-05, -2.4612993001937866e-05, -2.0697712898254395e-05, -1.6782432794570923e-05, -1.2867152690887451e-05, -8.95187258720398e-06, -5.036592483520508e-06, -1.1213123798370361e-06, 2.7939677238464355e-06, 6.709247827529907e-06, 1.0624527931213379e-05, 1.453980803489685e-05, 1.8455088138580322e-05, 2.2370368242263794e-05, 2.6285648345947266e-05, 3.0200928449630737e-05, 3.411620855331421e-05, 3.803148865699768e-05, 4.194676876068115e-05, 4.5862048864364624e-05, 4.9777328968048096e-05, 5.369260907173157e-05, 5.760788917541504e-05, 6.152316927909851e-05, 6.543844938278198e-05, 6.935372948646545e-05, 7.326900959014893e-05, 7.71842896938324e-05, 8.109956979751587e-05, 8.501484990119934e-05, 8.893013000488281e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 9.0, 14.0, 19.0, 28.0, 41.0, 37.0, 60.0, 71.0, 109.0, 200.0, 324.0, 549.0, 1232.0, 3243.0, 12490.0, 84662.0, 766053.0, 153276.0, 18482.0, 4315.0, 1482.0, 746.0, 371.0, 241.0, 134.0, 106.0, 64.0, 45.0, 31.0, 24.0, 18.0, 10.0, 12.0, 3.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029815673828125, -0.028809070587158203, -0.027802467346191406, -0.02679586410522461, -0.025789260864257812, -0.024782657623291016, -0.02377605438232422, -0.022769451141357422, -0.021762847900390625, -0.020756244659423828, -0.01974964141845703, -0.018743038177490234, -0.017736434936523438, -0.01672983169555664, -0.015723228454589844, -0.014716625213623047, -0.01371002197265625, -0.012703418731689453, -0.011696815490722656, -0.01069021224975586, -0.009683609008789062, -0.008677005767822266, -0.007670402526855469, -0.006663799285888672, -0.005657196044921875, -0.004650592803955078, -0.0036439895629882812, -0.0026373863220214844, -0.0016307830810546875, -0.0006241798400878906, 0.00038242340087890625, 0.0013890266418457031, 0.0023956298828125, 0.003402233123779297, 0.004408836364746094, 0.005415439605712891, 0.0064220428466796875, 0.007428646087646484, 0.008435249328613281, 0.009441852569580078, 0.010448455810546875, 0.011455059051513672, 0.012461662292480469, 0.013468265533447266, 0.014474868774414062, 0.01548147201538086, 0.016488075256347656, 0.017494678497314453, 0.01850128173828125, 0.019507884979248047, 0.020514488220214844, 0.02152109146118164, 0.022527694702148438, 0.023534297943115234, 0.02454090118408203, 0.025547504425048828, 0.026554107666015625, 0.027560710906982422, 0.02856731414794922, 0.029573917388916016, 0.030580520629882812, 0.03158712387084961, 0.032593727111816406, 0.0336003303527832, 0.03460693359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 18.0, 13.0, 23.0, 22.0, 20.0, 36.0, 36.0, 66.0, 91.0, 122.0, 128.0, 84.0, 81.0, 49.0, 27.0, 31.0, 17.0, 23.0, 18.0, 7.0, 13.0, 12.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147705078125, -0.014266252517700195, -0.01376199722290039, -0.013257741928100586, -0.012753486633300781, -0.012249231338500977, -0.011744976043701172, -0.011240720748901367, -0.010736465454101562, -0.010232210159301758, -0.009727954864501953, -0.009223699569702148, -0.008719444274902344, -0.008215188980102539, -0.007710933685302734, -0.00720667839050293, -0.006702423095703125, -0.00619816780090332, -0.005693912506103516, -0.005189657211303711, -0.004685401916503906, -0.0041811466217041016, -0.003676891326904297, -0.003172636032104492, -0.0026683807373046875, -0.002164125442504883, -0.0016598701477050781, -0.0011556148529052734, -0.0006513595581054688, -0.00014710426330566406, 0.0003571510314941406, 0.0008614063262939453, 0.00136566162109375, 0.0018699169158935547, 0.0023741722106933594, 0.002878427505493164, 0.0033826828002929688, 0.0038869380950927734, 0.004391193389892578, 0.004895448684692383, 0.0053997039794921875, 0.005903959274291992, 0.006408214569091797, 0.0069124698638916016, 0.007416725158691406, 0.007920980453491211, 0.008425235748291016, 0.00892949104309082, 0.009433746337890625, 0.00993800163269043, 0.010442256927490234, 0.010946512222290039, 0.011450767517089844, 0.011955022811889648, 0.012459278106689453, 0.012963533401489258, 0.013467788696289062, 0.013972043991088867, 0.014476299285888672, 0.014980554580688477, 0.015484809875488281, 0.015989065170288086, 0.01649332046508789, 0.016997575759887695, 0.0175018310546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 322.0, 632.0, 45.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41871970891952515, -0.3891350328922272, -0.3595503568649292, -0.32996565103530884, -0.30038100481033325, -0.2707962989807129, -0.24121162295341492, -0.21162694692611694, -0.18204227089881897, -0.152457594871521, -0.12287291139364243, -0.09328822791576385, -0.06370355188846588, -0.03411887586116791, -0.00453418493270874, 0.025050491094589233, 0.05463516712188721, 0.08421984314918518, 0.11380452662706375, 0.14338921010494232, 0.1729738861322403, 0.20255856215953827, 0.23214325308799744, 0.2617279291152954, 0.2913126051425934, 0.32089728116989136, 0.35048195719718933, 0.3800666332244873, 0.40965133905410767, 0.43923598527908325, 0.4688206911087036, 0.4984053671360016, 0.5279901027679443, 0.5575748085975647, 0.5871594548225403, 0.6167441606521606, 0.6463288068771362, 0.6759135127067566, 0.705498218536377, 0.7350828647613525, 0.7646675109863281, 0.7942522168159485, 0.8238368630409241, 0.8534215688705444, 0.88300621509552, 0.9125909209251404, 0.9421756267547607, 0.9717602729797363, 1.001344919204712, 1.0309295654296875, 1.0605143308639526, 1.0900989770889282, 1.1196836233139038, 1.1492682695388794, 1.1788530349731445, 1.2084376811981201, 1.2380224466323853, 1.2676070928573608, 1.297191858291626, 1.3267765045166016, 1.3563611507415771, 1.3859457969665527, 1.4155305624008179, 1.4451152086257935, 1.474699854850769]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 6.0, 5.0, 14.0, 21.0, 27.0, 39.0, 46.0, 65.0, 66.0, 84.0, 64.0, 99.0, 69.0, 85.0, 71.0, 40.0, 48.0, 41.0, 32.0, 26.0, 13.0, 12.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22911089658737183, -0.22271935641765594, -0.21632781624794006, -0.20993627607822418, -0.2035447359085083, -0.19715319573879242, -0.19076165556907654, -0.18437010049819946, -0.17797857522964478, -0.1715870350599289, -0.165195494890213, -0.15880395472049713, -0.15241241455078125, -0.14602087438106537, -0.1396293342113495, -0.1332377791404724, -0.12684623897075653, -0.12045469880104065, -0.11406315863132477, -0.10767161846160889, -0.101280078291893, -0.09488853812217712, -0.08849699050188065, -0.08210545033216476, -0.07571391016244888, -0.069322369992733, -0.06293082982301712, -0.05653928592801094, -0.05014774575829506, -0.04375620558857918, -0.037364661693573, -0.030973121523857117, -0.024581581354141235, -0.018190041184425354, -0.011798499152064323, -0.005406957119703293, 0.0009845830500125885, 0.00737612321972847, 0.01376766711473465, 0.02015920728445053, 0.026550747454166412, 0.032942287623882294, 0.039333827793598175, 0.045725371688604355, 0.052116911858320236, 0.05850845202803612, 0.0648999959230423, 0.07129153609275818, 0.07768307626247406, 0.08407461643218994, 0.09046615660190582, 0.0968576967716217, 0.10324923694133759, 0.10964077711105347, 0.11603232473134995, 0.12242386490106583, 0.1288154125213623, 0.13520695269107819, 0.14159849286079407, 0.14799003303050995, 0.15438157320022583, 0.1607731133699417, 0.1671646535396576, 0.17355620861053467, 0.17994773387908936]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 15.0, 20.0, 34.0, 46.0, 86.0, 172.0, 733.0, 2365.0, 4818.0, 13080.0, 2224695.0, 1929919.0, 11970.0, 3779.0, 1183.0, 824.0, 239.0, 101.0, 60.0, 37.0, 28.0, 12.0, 12.0, 13.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06900978088378906, -0.06685256958007812, -0.06469535827636719, -0.06253814697265625, -0.06038093566894531, -0.058223724365234375, -0.05606651306152344, -0.0539093017578125, -0.05175209045410156, -0.049594879150390625, -0.04743766784667969, -0.04528045654296875, -0.04312324523925781, -0.040966033935546875, -0.03880882263183594, -0.036651611328125, -0.03449440002441406, -0.032337188720703125, -0.030179977416992188, -0.02802276611328125, -0.025865554809570312, -0.023708343505859375, -0.021551132202148438, -0.0193939208984375, -0.017236709594726562, -0.015079498291015625, -0.012922286987304688, -0.01076507568359375, -0.008607864379882812, -0.006450653076171875, -0.0042934417724609375, -0.00213623046875, 2.09808349609375e-05, 0.002178192138671875, 0.0043354034423828125, 0.00649261474609375, 0.008649826049804688, 0.010807037353515625, 0.012964248657226562, 0.0151214599609375, 0.017278671264648438, 0.019435882568359375, 0.021593093872070312, 0.02375030517578125, 0.025907516479492188, 0.028064727783203125, 0.030221939086914062, 0.032379150390625, 0.03453636169433594, 0.036693572998046875, 0.03885078430175781, 0.04100799560546875, 0.04316520690917969, 0.045322418212890625, 0.04747962951660156, 0.0496368408203125, 0.05179405212402344, 0.053951263427734375, 0.05610847473144531, 0.05826568603515625, 0.06042289733886719, 0.06258010864257812, 0.06473731994628906, 0.06689453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 23.0, 106.0, 303.0, 363.0, 166.0, 24.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06588459014892578, -0.06383705139160156, -0.061789512634277344, -0.059741973876953125, -0.057694435119628906, -0.05564689636230469, -0.05359935760498047, -0.05155181884765625, -0.04950428009033203, -0.04745674133300781, -0.045409202575683594, -0.043361663818359375, -0.041314125061035156, -0.03926658630371094, -0.03721904754638672, -0.0351715087890625, -0.03312397003173828, -0.031076431274414062, -0.029028892517089844, -0.026981353759765625, -0.024933815002441406, -0.022886276245117188, -0.02083873748779297, -0.01879119873046875, -0.01674365997314453, -0.014696121215820312, -0.012648582458496094, -0.010601043701171875, -0.008553504943847656, -0.0065059661865234375, -0.004458427429199219, -0.002410888671875, -0.00036334991455078125, 0.0016841888427734375, 0.0037317276000976562, 0.005779266357421875, 0.007826805114746094, 0.009874343872070312, 0.011921882629394531, 0.01396942138671875, 0.01601696014404297, 0.018064498901367188, 0.020112037658691406, 0.022159576416015625, 0.024207115173339844, 0.026254653930664062, 0.02830219268798828, 0.0303497314453125, 0.03239727020263672, 0.03444480895996094, 0.036492347717285156, 0.038539886474609375, 0.040587425231933594, 0.04263496398925781, 0.04468250274658203, 0.04673004150390625, 0.04877758026123047, 0.05082511901855469, 0.052872657775878906, 0.054920196533203125, 0.056967735290527344, 0.05901527404785156, 0.06106281280517578, 0.0631103515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 9.0, 8.0, 12.0, 13.0, 31.0, 43.0, 47.0, 139.0, 421.0, 1859.0, 36526.0, 4105475.0, 46853.0, 2120.0, 437.0, 147.0, 57.0, 26.0, 24.0, 12.0, 7.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.07347393035888672, -0.07089805603027344, -0.06832218170166016, -0.06574630737304688, -0.0631704330444336, -0.06059455871582031, -0.05801868438720703, -0.05544281005859375, -0.05286693572998047, -0.05029106140136719, -0.047715187072753906, -0.045139312744140625, -0.042563438415527344, -0.03998756408691406, -0.03741168975830078, -0.0348358154296875, -0.03225994110107422, -0.029684066772460938, -0.027108192443847656, -0.024532318115234375, -0.021956443786621094, -0.019380569458007812, -0.01680469512939453, -0.01422882080078125, -0.011652946472167969, -0.009077072143554688, -0.006501197814941406, -0.003925323486328125, -0.0013494491577148438, 0.0012264251708984375, 0.0038022994995117188, 0.006378173828125, 0.008954048156738281, 0.011529922485351562, 0.014105796813964844, 0.016681671142578125, 0.019257545471191406, 0.021833419799804688, 0.02440929412841797, 0.02698516845703125, 0.02956104278564453, 0.03213691711425781, 0.034712791442871094, 0.037288665771484375, 0.039864540100097656, 0.04244041442871094, 0.04501628875732422, 0.0475921630859375, 0.05016803741455078, 0.05274391174316406, 0.055319786071777344, 0.057895660400390625, 0.060471534729003906, 0.06304740905761719, 0.06562328338623047, 0.06819915771484375, 0.07077503204345703, 0.07335090637207031, 0.0759267807006836, 0.07850265502929688, 0.08107852935791016, 0.08365440368652344, 0.08623027801513672, 0.08880615234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 12.0, 19.0, 23.0, 62.0, 92.0, 143.0, 327.0, 745.0, 1167.0, 740.0, 301.0, 169.0, 93.0, 55.0, 39.0, 24.0, 15.0, 11.0, 5.0, 3.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035369873046875, -0.03445100784301758, -0.033532142639160156, -0.032613277435302734, -0.03169441223144531, -0.03077554702758789, -0.02985668182373047, -0.028937816619873047, -0.028018951416015625, -0.027100086212158203, -0.02618122100830078, -0.02526235580444336, -0.024343490600585938, -0.023424625396728516, -0.022505760192871094, -0.021586894989013672, -0.02066802978515625, -0.019749164581298828, -0.018830299377441406, -0.017911434173583984, -0.016992568969726562, -0.01607370376586914, -0.015154838562011719, -0.014235973358154297, -0.013317108154296875, -0.012398242950439453, -0.011479377746582031, -0.01056051254272461, -0.009641647338867188, -0.008722782135009766, -0.007803916931152344, -0.006885051727294922, -0.0059661865234375, -0.005047321319580078, -0.004128456115722656, -0.0032095909118652344, -0.0022907257080078125, -0.0013718605041503906, -0.00045299530029296875, 0.0004658699035644531, 0.001384735107421875, 0.002303600311279297, 0.0032224655151367188, 0.004141330718994141, 0.0050601959228515625, 0.005979061126708984, 0.006897926330566406, 0.007816791534423828, 0.00873565673828125, 0.009654521942138672, 0.010573387145996094, 0.011492252349853516, 0.012411117553710938, 0.01332998275756836, 0.014248847961425781, 0.015167713165283203, 0.016086578369140625, 0.017005443572998047, 0.01792430877685547, 0.01884317398071289, 0.019762039184570312, 0.020680904388427734, 0.021599769592285156, 0.022518634796142578, 0.0234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 155.0, 718.0, 108.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6978673934936523, -0.6817833185195923, -0.665699303150177, -0.6496152281761169, -0.6335312128067017, -0.6174471378326416, -0.6013630628585815, -0.5852790474891663, -0.5691949725151062, -0.5531108975410461, -0.5370268821716309, -0.5209428071975708, -0.5048587918281555, -0.48877471685409546, -0.4726906716823578, -0.4566066265106201, -0.44052258133888245, -0.4244385361671448, -0.4083544909954071, -0.39227044582366943, -0.3761863708496094, -0.3601023256778717, -0.34401828050613403, -0.32793423533439636, -0.3118501901626587, -0.295766144990921, -0.27968209981918335, -0.2635980248451233, -0.24751397967338562, -0.23142993450164795, -0.21534588932991028, -0.1992618441581726, -0.18317779898643494, -0.16709375381469727, -0.1510096937417984, -0.13492564857006073, -0.11884159594774246, -0.1027575433254242, -0.08667349815368652, -0.07058944553136826, -0.05450539290904999, -0.03842134028673172, -0.02233729138970375, -0.006253242492675781, 0.009830810129642487, 0.025914862751960754, 0.041998907923698425, 0.05808296054601669, 0.07416701316833496, 0.09025106579065323, 0.1063351184129715, 0.12241916358470917, 0.13850322365760803, 0.1545872688293457, 0.17067131400108337, 0.18675535917282104, 0.2028394192457199, 0.21892346441745758, 0.23500752449035645, 0.2510915696620941, 0.2671756148338318, 0.28325968980789185, 0.29934370517730713, 0.3154277801513672, 0.33151182532310486]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 10.0, 10.0, 15.0, 18.0, 29.0, 43.0, 42.0, 58.0, 63.0, 76.0, 82.0, 66.0, 74.0, 73.0, 62.0, 67.0, 48.0, 40.0, 37.0, 26.0, 24.0, 17.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11094796657562256, -0.10793082416057587, -0.10491368174552917, -0.10189653187990189, -0.0988793894648552, -0.0958622470498085, -0.09284509718418121, -0.08982795476913452, -0.08681081235408783, -0.08379366993904114, -0.08077652752399445, -0.07775937765836716, -0.07474223524332047, -0.07172509282827377, -0.06870794296264648, -0.06569080054759979, -0.0626736581325531, -0.05965651571750641, -0.05663936957716942, -0.05362222343683243, -0.050605081021785736, -0.047587938606739044, -0.044570792466402054, -0.041553646326065063, -0.03853650391101837, -0.03551936149597168, -0.03250221535563469, -0.029485071077942848, -0.026467926800251007, -0.023450782522559166, -0.020433638244867325, -0.017416493967175484, -0.014399349689483643, -0.011382205411791801, -0.00836506113409996, -0.005347916856408119, -0.002330772578716278, 0.000686371698975563, 0.003703515976667404, 0.006720660254359245, 0.009737804532051086, 0.012754948809742928, 0.01577209308743477, 0.01878923736512661, 0.02180638164281845, 0.024823525920510292, 0.027840670198202133, 0.030857814475893974, 0.033874958753585815, 0.03689210116863251, 0.0399092473089695, 0.04292639344930649, 0.04594353586435318, 0.04896067827939987, 0.05197782441973686, 0.05499497056007385, 0.058012112975120544, 0.061029255390167236, 0.06404639780521393, 0.06706354767084122, 0.07008069008588791, 0.0730978325009346, 0.07611498236656189, 0.07913212478160858, 0.08214926719665527]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 10.0, 10.0, 17.0, 17.0, 24.0, 33.0, 52.0, 84.0, 128.0, 144.0, 280.0, 435.0, 852.0, 2335.0, 32368.0, 953041.0, 53686.0, 2731.0, 899.0, 471.0, 301.0, 215.0, 151.0, 86.0, 54.0, 35.0, 28.0, 17.0, 17.0, 10.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.089111328125, -0.0862874984741211, -0.08346366882324219, -0.08063983917236328, -0.07781600952148438, -0.07499217987060547, -0.07216835021972656, -0.06934452056884766, -0.06652069091796875, -0.06369686126708984, -0.06087303161621094, -0.05804920196533203, -0.055225372314453125, -0.05240154266357422, -0.04957771301269531, -0.046753883361816406, -0.0439300537109375, -0.041106224060058594, -0.03828239440917969, -0.03545856475830078, -0.032634735107421875, -0.02981090545654297, -0.026987075805664062, -0.024163246154785156, -0.02133941650390625, -0.018515586853027344, -0.015691757202148438, -0.012867927551269531, -0.010044097900390625, -0.007220268249511719, -0.0043964385986328125, -0.0015726089477539062, 0.001251220703125, 0.004075050354003906, 0.0068988800048828125, 0.009722709655761719, 0.012546539306640625, 0.015370368957519531, 0.018194198608398438, 0.021018028259277344, 0.02384185791015625, 0.026665687561035156, 0.029489517211914062, 0.03231334686279297, 0.035137176513671875, 0.03796100616455078, 0.04078483581542969, 0.043608665466308594, 0.0464324951171875, 0.049256324768066406, 0.05208015441894531, 0.05490398406982422, 0.057727813720703125, 0.06055164337158203, 0.06337547302246094, 0.06619930267333984, 0.06902313232421875, 0.07184696197509766, 0.07467079162597656, 0.07749462127685547, 0.08031845092773438, 0.08314228057861328, 0.08596611022949219, 0.0887899398803711, 0.09161376953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 20.0, 65.0, 248.0, 378.0, 224.0, 50.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06388711929321289, -0.06191730499267578, -0.05994749069213867, -0.05797767639160156, -0.05600786209106445, -0.054038047790527344, -0.052068233489990234, -0.050098419189453125, -0.048128604888916016, -0.046158790588378906, -0.0441889762878418, -0.04221916198730469, -0.04024934768676758, -0.03827953338623047, -0.03630971908569336, -0.03433990478515625, -0.03237009048461914, -0.03040027618408203, -0.028430461883544922, -0.026460647583007812, -0.024490833282470703, -0.022521018981933594, -0.020551204681396484, -0.018581390380859375, -0.016611576080322266, -0.014641761779785156, -0.012671947479248047, -0.010702133178710938, -0.008732318878173828, -0.006762504577636719, -0.004792690277099609, -0.0028228759765625, -0.0008530616760253906, 0.0011167526245117188, 0.003086566925048828, 0.0050563812255859375, 0.007026195526123047, 0.008996009826660156, 0.010965824127197266, 0.012935638427734375, 0.014905452728271484, 0.016875267028808594, 0.018845081329345703, 0.020814895629882812, 0.022784709930419922, 0.02475452423095703, 0.02672433853149414, 0.02869415283203125, 0.03066396713256836, 0.03263378143310547, 0.03460359573364258, 0.03657341003417969, 0.0385432243347168, 0.040513038635253906, 0.042482852935791016, 0.044452667236328125, 0.046422481536865234, 0.048392295837402344, 0.05036211013793945, 0.05233192443847656, 0.05430173873901367, 0.05627155303955078, 0.05824136734008789, 0.060211181640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 9.0, 8.0, 9.0, 13.0, 11.0, 24.0, 12.0, 23.0, 33.0, 45.0, 78.0, 119.0, 167.0, 349.0, 699.0, 2239.0, 27655.0, 895745.0, 115222.0, 3950.0, 1003.0, 418.0, 236.0, 125.0, 82.0, 65.0, 41.0, 29.0, 30.0, 12.0, 15.0, 19.0, 16.0, 14.0, 6.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07220458984375, -0.06992435455322266, -0.06764411926269531, -0.06536388397216797, -0.06308364868164062, -0.06080341339111328, -0.05852317810058594, -0.056242942810058594, -0.05396270751953125, -0.051682472229003906, -0.04940223693847656, -0.04712200164794922, -0.044841766357421875, -0.04256153106689453, -0.04028129577636719, -0.038001060485839844, -0.0357208251953125, -0.033440589904785156, -0.031160354614257812, -0.02888011932373047, -0.026599884033203125, -0.02431964874267578, -0.022039413452148438, -0.019759178161621094, -0.01747894287109375, -0.015198707580566406, -0.012918472290039062, -0.010638236999511719, -0.008358001708984375, -0.006077766418457031, -0.0037975311279296875, -0.0015172958374023438, 0.000762939453125, 0.0030431747436523438, 0.0053234100341796875, 0.007603645324707031, 0.009883880615234375, 0.012164115905761719, 0.014444351196289062, 0.016724586486816406, 0.01900482177734375, 0.021285057067871094, 0.023565292358398438, 0.02584552764892578, 0.028125762939453125, 0.03040599822998047, 0.03268623352050781, 0.034966468811035156, 0.0372467041015625, 0.039526939392089844, 0.04180717468261719, 0.04408740997314453, 0.046367645263671875, 0.04864788055419922, 0.05092811584472656, 0.053208351135253906, 0.05548858642578125, 0.057768821716308594, 0.06004905700683594, 0.06232929229736328, 0.06460952758789062, 0.06688976287841797, 0.06916999816894531, 0.07145023345947266, 0.07373046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 10.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 9.0, 16.0, 15.0, 25.0, 30.0, 31.0, 24.0, 35.0, 47.0, 37.0, 40.0, 45.0, 37.0, 43.0, 40.0, 50.0, 38.0, 44.0, 47.0, 31.0, 32.0, 31.0, 22.0, 35.0, 25.0, 20.0, 16.0, 15.0, 7.0, 12.0, 13.0, 10.0, 9.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.025805950164794922, -0.024939537048339844, -0.024073123931884766, -0.023206710815429688, -0.02234029769897461, -0.02147388458251953, -0.020607471466064453, -0.019741058349609375, -0.018874645233154297, -0.01800823211669922, -0.01714181900024414, -0.016275405883789062, -0.015408992767333984, -0.014542579650878906, -0.013676166534423828, -0.01280975341796875, -0.011943340301513672, -0.011076927185058594, -0.010210514068603516, -0.009344100952148438, -0.00847768783569336, -0.007611274719238281, -0.006744861602783203, -0.005878448486328125, -0.005012035369873047, -0.004145622253417969, -0.0032792091369628906, -0.0024127960205078125, -0.0015463829040527344, -0.0006799697875976562, 0.00018644332885742188, 0.0010528564453125, 0.0019192695617675781, 0.0027856826782226562, 0.0036520957946777344, 0.0045185089111328125, 0.005384922027587891, 0.006251335144042969, 0.007117748260498047, 0.007984161376953125, 0.008850574493408203, 0.009716987609863281, 0.01058340072631836, 0.011449813842773438, 0.012316226959228516, 0.013182640075683594, 0.014049053192138672, 0.01491546630859375, 0.015781879425048828, 0.016648292541503906, 0.017514705657958984, 0.018381118774414062, 0.01924753189086914, 0.02011394500732422, 0.020980358123779297, 0.021846771240234375, 0.022713184356689453, 0.02357959747314453, 0.02444601058959961, 0.025312423706054688, 0.026178836822509766, 0.027045249938964844, 0.027911663055419922, 0.028778076171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 6.0, 10.0, 18.0, 24.0, 54.0, 99.0, 155.0, 327.0, 737.0, 1976.0, 6289.0, 26062.0, 215041.0, 692552.0, 84184.0, 14567.0, 4059.0, 1317.0, 525.0, 238.0, 112.0, 53.0, 43.0, 28.0, 18.0, 17.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.02099609375, -0.02043330669403076, -0.019870519638061523, -0.019307732582092285, -0.018744945526123047, -0.01818215847015381, -0.01761937141418457, -0.017056584358215332, -0.016493797302246094, -0.015931010246276855, -0.015368223190307617, -0.014805436134338379, -0.01424264907836914, -0.013679862022399902, -0.013117074966430664, -0.012554287910461426, -0.011991500854492188, -0.01142871379852295, -0.010865926742553711, -0.010303139686584473, -0.009740352630615234, -0.009177565574645996, -0.008614778518676758, -0.00805199146270752, -0.007489204406738281, -0.006926417350769043, -0.006363630294799805, -0.005800843238830566, -0.005238056182861328, -0.00467526912689209, -0.0041124820709228516, -0.0035496950149536133, -0.002986907958984375, -0.0024241209030151367, -0.0018613338470458984, -0.0012985467910766602, -0.0007357597351074219, -0.0001729726791381836, 0.0003898143768310547, 0.000952601432800293, 0.0015153884887695312, 0.0020781755447387695, 0.002640962600708008, 0.003203749656677246, 0.0037665367126464844, 0.004329323768615723, 0.004892110824584961, 0.005454897880554199, 0.0060176849365234375, 0.006580471992492676, 0.007143259048461914, 0.007706046104431152, 0.00826883316040039, 0.008831620216369629, 0.009394407272338867, 0.009957194328308105, 0.010519981384277344, 0.011082768440246582, 0.01164555549621582, 0.012208342552185059, 0.012771129608154297, 0.013333916664123535, 0.013896703720092773, 0.014459490776062012, 0.01502227783203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 22.0, 27.0, 35.0, 53.0, 61.0, 76.0, 109.0, 122.0, 100.0, 72.0, 75.0, 59.0, 28.0, 19.0, 19.0, 12.0, 14.0, 8.0, 5.0, 12.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.702278137207031e-05, -8.457992225885391e-05, -8.213706314563751e-05, -7.969420403242111e-05, -7.725134491920471e-05, -7.480848580598831e-05, -7.236562669277191e-05, -6.992276757955551e-05, -6.747990846633911e-05, -6.503704935312271e-05, -6.259419023990631e-05, -6.015133112668991e-05, -5.770847201347351e-05, -5.526561290025711e-05, -5.282275378704071e-05, -5.037989467382431e-05, -4.793703556060791e-05, -4.549417644739151e-05, -4.305131733417511e-05, -4.060845822095871e-05, -3.816559910774231e-05, -3.572273999452591e-05, -3.327988088130951e-05, -3.083702176809311e-05, -2.839416265487671e-05, -2.595130354166031e-05, -2.350844442844391e-05, -2.106558531522751e-05, -1.862272620201111e-05, -1.6179867088794708e-05, -1.3737007975578308e-05, -1.1294148862361908e-05, -8.851289749145508e-06, -6.408430635929108e-06, -3.9655715227127075e-06, -1.5227124094963074e-06, 9.201467037200928e-07, 3.363005816936493e-06, 5.805864930152893e-06, 8.248724043369293e-06, 1.0691583156585693e-05, 1.3134442269802094e-05, 1.5577301383018494e-05, 1.8020160496234894e-05, 2.0463019609451294e-05, 2.2905878722667694e-05, 2.5348737835884094e-05, 2.7791596949100494e-05, 3.0234456062316895e-05, 3.2677315175533295e-05, 3.5120174288749695e-05, 3.7563033401966095e-05, 4.0005892515182495e-05, 4.2448751628398895e-05, 4.4891610741615295e-05, 4.7334469854831696e-05, 4.9777328968048096e-05, 5.2220188081264496e-05, 5.4663047194480896e-05, 5.7105906307697296e-05, 5.9548765420913696e-05, 6.19916245341301e-05, 6.44344836473465e-05, 6.68773427605629e-05, 6.93202018737793e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 15.0, 16.0, 23.0, 30.0, 44.0, 67.0, 93.0, 156.0, 245.0, 516.0, 1011.0, 2311.0, 5744.0, 15550.0, 55009.0, 467893.0, 424148.0, 50959.0, 15030.0, 5339.0, 2209.0, 947.0, 451.0, 268.0, 150.0, 91.0, 68.0, 36.0, 35.0, 18.0, 11.0, 10.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0149078369140625, -0.014374971389770508, -0.013842105865478516, -0.013309240341186523, -0.012776374816894531, -0.012243509292602539, -0.011710643768310547, -0.011177778244018555, -0.010644912719726562, -0.01011204719543457, -0.009579181671142578, -0.009046316146850586, -0.008513450622558594, -0.007980585098266602, -0.007447719573974609, -0.006914854049682617, -0.006381988525390625, -0.005849123001098633, -0.005316257476806641, -0.0047833919525146484, -0.004250526428222656, -0.003717660903930664, -0.003184795379638672, -0.0026519298553466797, -0.0021190643310546875, -0.0015861988067626953, -0.0010533332824707031, -0.0005204677581787109, 1.239776611328125e-05, 0.0005452632904052734, 0.0010781288146972656, 0.0016109943389892578, 0.00214385986328125, 0.002676725387573242, 0.0032095909118652344, 0.0037424564361572266, 0.004275321960449219, 0.004808187484741211, 0.005341053009033203, 0.005873918533325195, 0.0064067840576171875, 0.00693964958190918, 0.007472515106201172, 0.008005380630493164, 0.008538246154785156, 0.009071111679077148, 0.00960397720336914, 0.010136842727661133, 0.010669708251953125, 0.011202573776245117, 0.01173543930053711, 0.012268304824829102, 0.012801170349121094, 0.013334035873413086, 0.013866901397705078, 0.01439976692199707, 0.014932632446289062, 0.015465497970581055, 0.015998363494873047, 0.01653122901916504, 0.01706409454345703, 0.017596960067749023, 0.018129825592041016, 0.018662691116333008, 0.019195556640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 7.0, 7.0, 7.0, 30.0, 30.0, 29.0, 47.0, 45.0, 66.0, 67.0, 98.0, 91.0, 88.0, 75.0, 48.0, 43.0, 39.0, 18.0, 22.0, 17.0, 14.0, 16.0, 11.0, 10.0, 11.0, 8.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008575439453125, -0.008283019065856934, -0.007990598678588867, -0.007698178291320801, -0.007405757904052734, -0.007113337516784668, -0.0068209171295166016, -0.006528496742248535, -0.006236076354980469, -0.005943655967712402, -0.005651235580444336, -0.0053588151931762695, -0.005066394805908203, -0.004773974418640137, -0.00448155403137207, -0.004189133644104004, -0.0038967132568359375, -0.003604292869567871, -0.0033118724822998047, -0.0030194520950317383, -0.002727031707763672, -0.0024346113204956055, -0.002142190933227539, -0.0018497705459594727, -0.0015573501586914062, -0.0012649297714233398, -0.0009725093841552734, -0.000680088996887207, -0.0003876686096191406, -9.524822235107422e-05, 0.0001971721649169922, 0.0004895925521850586, 0.000782012939453125, 0.0010744333267211914, 0.0013668537139892578, 0.0016592741012573242, 0.0019516944885253906, 0.002244114875793457, 0.0025365352630615234, 0.00282895565032959, 0.0031213760375976562, 0.0034137964248657227, 0.003706216812133789, 0.0039986371994018555, 0.004291057586669922, 0.004583477973937988, 0.004875898361206055, 0.005168318748474121, 0.0054607391357421875, 0.005753159523010254, 0.00604557991027832, 0.006338000297546387, 0.006630420684814453, 0.0069228410720825195, 0.007215261459350586, 0.007507681846618652, 0.007800102233886719, 0.008092522621154785, 0.008384943008422852, 0.008677363395690918, 0.008969783782958984, 0.00926220417022705, 0.009554624557495117, 0.009847044944763184, 0.01013946533203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 11.0, 19.0, 294.0, 635.0, 48.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12614059448242188, -0.10892495512962341, -0.09170930832624435, -0.0744936615228653, -0.057278022170066833, -0.04006238281726837, -0.022846736013889313, -0.005631089210510254, 0.011584550142288208, 0.02880019322037697, 0.04601583629846573, 0.06323148310184479, 0.08044712245464325, 0.09766276180744171, 0.11487840861082077, 0.13209405541419983, 0.1493096947669983, 0.16652533411979675, 0.18374097347259521, 0.20095662772655487, 0.21817226707935333, 0.2353879064321518, 0.25260356068611145, 0.2698192000389099, 0.2870348393917084, 0.30425047874450684, 0.3214661180973053, 0.33868175745010376, 0.3558974266052246, 0.3731130361557007, 0.39032870531082153, 0.40754434466362, 0.42475998401641846, 0.4419756233692169, 0.4591912627220154, 0.47640690207481384, 0.4936225414276123, 0.5108382105827332, 0.5280538201332092, 0.5452694892883301, 0.5624850988388062, 0.579700767993927, 0.5969163775444031, 0.6141320466995239, 0.63134765625, 0.6485633254051208, 0.6657789349555969, 0.6829946041107178, 0.7002102732658386, 0.7174259424209595, 0.7346415519714355, 0.7518572211265564, 0.7690728306770325, 0.7862884998321533, 0.8035041093826294, 0.8207197785377502, 0.8379354476928711, 0.8551511168479919, 0.872366726398468, 0.8895823955535889, 0.9067980051040649, 0.9240136742591858, 0.9412292838096619, 0.9584449529647827, 0.9756605625152588]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 5.0, 12.0, 7.0, 8.0, 14.0, 17.0, 11.0, 15.0, 21.0, 20.0, 20.0, 26.0, 38.0, 33.0, 34.0, 35.0, 38.0, 33.0, 50.0, 36.0, 37.0, 50.0, 41.0, 35.0, 40.0, 43.0, 34.0, 34.0, 32.0, 29.0, 20.0, 18.0, 30.0, 15.0, 11.0, 6.0, 11.0, 10.0, 8.0, 11.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08181983232498169, -0.07927834987640381, -0.07673685997724533, -0.07419537752866745, -0.07165388762950897, -0.06911240518093109, -0.06657092273235321, -0.06402944028377533, -0.06148795038461685, -0.05894646421074867, -0.05640497803688049, -0.05386349558830261, -0.05132200941443443, -0.048780523240566254, -0.04623904079198837, -0.043697554618120193, -0.041156068444252014, -0.038614582270383835, -0.036073096096515656, -0.033531613647937775, -0.030990127474069595, -0.028448641300201416, -0.025907156988978386, -0.023365672677755356, -0.020824186503887177, -0.018282700330018997, -0.015741216018795967, -0.013199730776250362, -0.010658245533704758, -0.008116760291159153, -0.005575275048613548, -0.003033790737390518, -0.0004923045635223389, 0.002049180679023266, 0.0045906659215688705, 0.007132151164114475, 0.00967363640666008, 0.012215121649205685, 0.01475660689175129, 0.01729809120297432, 0.0198395773768425, 0.022381063550710678, 0.024922547861933708, 0.02746403217315674, 0.030005518347024918, 0.0325470045208931, 0.03508848696947098, 0.03762997314333916, 0.040171459317207336, 0.042712945491075516, 0.045254431664943695, 0.047795914113521576, 0.050337400287389755, 0.052878886461257935, 0.055420368909835815, 0.057961855083703995, 0.060503341257572174, 0.06304482370615005, 0.06558631360530853, 0.06812779605388641, 0.0706692785024643, 0.07321076840162277, 0.07575225085020065, 0.07829374074935913, 0.08083522319793701]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 11.0, 19.0, 42.0, 72.0, 129.0, 464.0, 1304.0, 3211.0, 6013.0, 29229.0, 3872487.0, 265261.0, 10142.0, 3340.0, 1143.0, 787.0, 273.0, 134.0, 58.0, 45.0, 21.0, 22.0, 16.0, 8.0, 11.0, 2.0, 10.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06610107421875, -0.06414270401000977, -0.06218433380126953, -0.0602259635925293, -0.05826759338378906, -0.05630922317504883, -0.054350852966308594, -0.05239248275756836, -0.050434112548828125, -0.04847574234008789, -0.046517372131347656, -0.04455900192260742, -0.04260063171386719, -0.04064226150512695, -0.03868389129638672, -0.036725521087646484, -0.03476715087890625, -0.032808780670166016, -0.03085041046142578, -0.028892040252685547, -0.026933670043945312, -0.024975299835205078, -0.023016929626464844, -0.02105855941772461, -0.019100189208984375, -0.01714181900024414, -0.015183448791503906, -0.013225078582763672, -0.011266708374023438, -0.009308338165283203, -0.007349967956542969, -0.005391597747802734, -0.0034332275390625, -0.0014748573303222656, 0.00048351287841796875, 0.002441883087158203, 0.0044002532958984375, 0.006358623504638672, 0.008316993713378906, 0.01027536392211914, 0.012233734130859375, 0.01419210433959961, 0.016150474548339844, 0.018108844757080078, 0.020067214965820312, 0.022025585174560547, 0.02398395538330078, 0.025942325592041016, 0.02790069580078125, 0.029859066009521484, 0.03181743621826172, 0.03377580642700195, 0.03573417663574219, 0.03769254684448242, 0.039650917053222656, 0.04160928726196289, 0.043567657470703125, 0.04552602767944336, 0.047484397888183594, 0.04944276809692383, 0.05140113830566406, 0.0533595085144043, 0.05531787872314453, 0.057276248931884766, 0.059234619140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 13.0, 47.0, 213.0, 406.0, 245.0, 62.0, 12.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06490135192871094, -0.06284713745117188, -0.06079292297363281, -0.05873870849609375, -0.05668449401855469, -0.054630279541015625, -0.05257606506347656, -0.0505218505859375, -0.04846763610839844, -0.046413421630859375, -0.04435920715332031, -0.04230499267578125, -0.04025077819824219, -0.038196563720703125, -0.03614234924316406, -0.034088134765625, -0.03203392028808594, -0.029979705810546875, -0.027925491333007812, -0.02587127685546875, -0.023817062377929688, -0.021762847900390625, -0.019708633422851562, -0.0176544189453125, -0.015600204467773438, -0.013545989990234375, -0.011491775512695312, -0.00943756103515625, -0.0073833465576171875, -0.005329132080078125, -0.0032749176025390625, -0.001220703125, 0.0008335113525390625, 0.002887725830078125, 0.0049419403076171875, 0.00699615478515625, 0.009050369262695312, 0.011104583740234375, 0.013158798217773438, 0.0152130126953125, 0.017267227172851562, 0.019321441650390625, 0.021375656127929688, 0.02342987060546875, 0.025484085083007812, 0.027538299560546875, 0.029592514038085938, 0.031646728515625, 0.03370094299316406, 0.035755157470703125, 0.03780937194824219, 0.03986358642578125, 0.04191780090332031, 0.043972015380859375, 0.04602622985839844, 0.0480804443359375, 0.05013465881347656, 0.052188873291015625, 0.05424308776855469, 0.05629730224609375, 0.05835151672363281, 0.060405731201171875, 0.06245994567871094, 0.06451416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 26.0, 46.0, 74.0, 202.0, 581.0, 2281.0, 23919.0, 3407433.0, 745327.0, 12177.0, 1522.0, 413.0, 160.0, 58.0, 28.0, 14.0, 9.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.045223236083984375, -0.04354095458984375, -0.041858673095703125, -0.0401763916015625, -0.038494110107421875, -0.03681182861328125, -0.035129547119140625, -0.033447265625, -0.031764984130859375, -0.03008270263671875, -0.028400421142578125, -0.0267181396484375, -0.025035858154296875, -0.02335357666015625, -0.021671295166015625, -0.019989013671875, -0.018306732177734375, -0.01662445068359375, -0.014942169189453125, -0.0132598876953125, -0.011577606201171875, -0.00989532470703125, -0.008213043212890625, -0.00653076171875, -0.004848480224609375, -0.00316619873046875, -0.001483917236328125, 0.0001983642578125, 0.001880645751953125, 0.00356292724609375, 0.005245208740234375, 0.006927490234375, 0.008609771728515625, 0.01029205322265625, 0.011974334716796875, 0.0136566162109375, 0.015338897705078125, 0.01702117919921875, 0.018703460693359375, 0.0203857421875, 0.022068023681640625, 0.02375030517578125, 0.025432586669921875, 0.0271148681640625, 0.028797149658203125, 0.03047943115234375, 0.032161712646484375, 0.033843994140625, 0.035526275634765625, 0.03720855712890625, 0.038890838623046875, 0.0405731201171875, 0.042255401611328125, 0.04393768310546875, 0.045619964599609375, 0.04730224609375, 0.048984527587890625, 0.05066680908203125, 0.052349090576171875, 0.0540313720703125, 0.055713653564453125, 0.05739593505859375, 0.059078216552734375, 0.060760498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 12.0, 25.0, 61.0, 131.0, 338.0, 1127.0, 1467.0, 514.0, 204.0, 89.0, 52.0, 23.0, 13.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.04829120635986328, -0.04699134826660156, -0.045691490173339844, -0.044391632080078125, -0.043091773986816406, -0.04179191589355469, -0.04049205780029297, -0.03919219970703125, -0.03789234161376953, -0.03659248352050781, -0.035292625427246094, -0.033992767333984375, -0.032692909240722656, -0.03139305114746094, -0.03009319305419922, -0.0287933349609375, -0.02749347686767578, -0.026193618774414062, -0.024893760681152344, -0.023593902587890625, -0.022294044494628906, -0.020994186401367188, -0.01969432830810547, -0.01839447021484375, -0.01709461212158203, -0.015794754028320312, -0.014494895935058594, -0.013195037841796875, -0.011895179748535156, -0.010595321655273438, -0.009295463562011719, -0.00799560546875, -0.006695747375488281, -0.0053958892822265625, -0.004096031188964844, -0.002796173095703125, -0.0014963150024414062, -0.0001964569091796875, 0.0011034011840820312, 0.00240325927734375, 0.0037031173706054688, 0.0050029754638671875, 0.006302833557128906, 0.007602691650390625, 0.008902549743652344, 0.010202407836914062, 0.011502265930175781, 0.0128021240234375, 0.014101982116699219, 0.015401840209960938, 0.016701698303222656, 0.018001556396484375, 0.019301414489746094, 0.020601272583007812, 0.02190113067626953, 0.02320098876953125, 0.02450084686279297, 0.025800704956054688, 0.027100563049316406, 0.028400421142578125, 0.029700279235839844, 0.031000137329101562, 0.03229999542236328, 0.033599853515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 13.0, 184.0, 698.0, 102.0, 9.0, 2.0, 2.0, 2.0], "bins": [-0.8547520041465759, -0.840095043182373, -0.8254380226135254, -0.8107810616493225, -0.7961240410804749, -0.781467080116272, -0.7668100595474243, -0.7521530985832214, -0.7374961376190186, -0.7228391766548157, -0.708182156085968, -0.6935251951217651, -0.6788681745529175, -0.6642112135887146, -0.6495541930198669, -0.6348972320556641, -0.6202402114868164, -0.6055832505226135, -0.5909262299537659, -0.576269268989563, -0.5616122484207153, -0.5469552874565125, -0.5322982668876648, -0.5176413059234619, -0.5029842853546143, -0.488327294588089, -0.4736703038215637, -0.45901331305503845, -0.4443563222885132, -0.4296993613243103, -0.41504237055778503, -0.40038537979125977, -0.3857284486293793, -0.371071457862854, -0.35641446709632874, -0.34175747632980347, -0.3271005153656006, -0.31244349479675293, -0.29778653383255005, -0.2831295430660248, -0.2684725522994995, -0.25381556153297424, -0.23915857076644897, -0.2245015949010849, -0.20984460413455963, -0.19518761336803436, -0.1805306375026703, -0.16587364673614502, -0.15121665596961975, -0.13655966520309448, -0.12190268188714981, -0.10724569857120514, -0.09258870780467987, -0.0779317170381546, -0.06327473372220993, -0.04861775040626526, -0.03396075963973999, -0.01930377259850502, -0.00464678555727005, 0.01001020148396492, 0.02466718852519989, 0.03932417929172516, 0.05398116260766983, 0.0686381459236145, 0.08329513669013977]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 5.0, 8.0, 15.0, 22.0, 21.0, 28.0, 30.0, 18.0, 35.0, 43.0, 52.0, 58.0, 46.0, 49.0, 59.0, 65.0, 52.0, 42.0, 41.0, 53.0, 42.0, 36.0, 33.0, 35.0, 19.0, 25.0, 11.0, 13.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06521707773208618, -0.06319104135036469, -0.06116500496864319, -0.05913896486163139, -0.0571129284799099, -0.0550868920981884, -0.053060851991176605, -0.05103481560945511, -0.04900877922773361, -0.046982742846012115, -0.04495670646429062, -0.042930666357278824, -0.04090462997555733, -0.03887859359383583, -0.036852553486824036, -0.03482651710510254, -0.03280048072338104, -0.030774444341659546, -0.0287484060972929, -0.026722367852926254, -0.024696331471204758, -0.02267029508948326, -0.020644256845116615, -0.01861821860074997, -0.016592182219028473, -0.014566144905984402, -0.01254010759294033, -0.01051407027989626, -0.008488032966852188, -0.006461995653808117, -0.004435958340764046, -0.0024099210277199745, -0.0003838837146759033, 0.0016421535983681679, 0.003668190911412239, 0.00569422822445631, 0.0077202655375003815, 0.009746302850544453, 0.011772340163588524, 0.013798377476632595, 0.015824414789676666, 0.017850451171398163, 0.01987648941576481, 0.021902527660131454, 0.02392856404185295, 0.025954600423574448, 0.027980638667941093, 0.03000667691230774, 0.032032713294029236, 0.03405874967575073, 0.03608478605747223, 0.038110826164484024, 0.04013686254620552, 0.04216289892792702, 0.04418893903493881, 0.04621497541666031, 0.048241011798381805, 0.0502670481801033, 0.0522930845618248, 0.054319124668836594, 0.05634516105055809, 0.05837119743227959, 0.06039723753929138, 0.06242327392101288, 0.06444931030273438]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 11.0, 13.0, 16.0, 15.0, 23.0, 33.0, 47.0, 62.0, 62.0, 87.0, 141.0, 179.0, 265.0, 394.0, 588.0, 1060.0, 2630.0, 20877.0, 507024.0, 489384.0, 19998.0, 2688.0, 1035.0, 564.0, 364.0, 248.0, 174.0, 121.0, 114.0, 75.0, 72.0, 51.0, 43.0, 30.0, 14.0, 11.0, 14.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06298828125, -0.061135292053222656, -0.05928230285644531, -0.05742931365966797, -0.055576324462890625, -0.05372333526611328, -0.05187034606933594, -0.050017356872558594, -0.04816436767578125, -0.046311378479003906, -0.04445838928222656, -0.04260540008544922, -0.040752410888671875, -0.03889942169189453, -0.03704643249511719, -0.035193443298339844, -0.0333404541015625, -0.031487464904785156, -0.029634475708007812, -0.02778148651123047, -0.025928497314453125, -0.02407550811767578, -0.022222518920898438, -0.020369529724121094, -0.01851654052734375, -0.016663551330566406, -0.014810562133789062, -0.012957572937011719, -0.011104583740234375, -0.009251594543457031, -0.0073986053466796875, -0.005545616149902344, -0.003692626953125, -0.0018396377563476562, 1.33514404296875e-05, 0.0018663406372070312, 0.003719329833984375, 0.005572319030761719, 0.0074253082275390625, 0.009278297424316406, 0.01113128662109375, 0.012984275817871094, 0.014837265014648438, 0.01669025421142578, 0.018543243408203125, 0.02039623260498047, 0.022249221801757812, 0.024102210998535156, 0.0259552001953125, 0.027808189392089844, 0.029661178588867188, 0.03151416778564453, 0.033367156982421875, 0.03522014617919922, 0.03707313537597656, 0.038926124572753906, 0.04077911376953125, 0.042632102966308594, 0.04448509216308594, 0.04633808135986328, 0.048191070556640625, 0.05004405975341797, 0.05189704895019531, 0.053750038146972656, 0.05560302734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 36.0, 138.0, 356.0, 326.0, 117.0, 15.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.0637974739074707, -0.061799049377441406, -0.05980062484741211, -0.05780220031738281, -0.055803775787353516, -0.05380535125732422, -0.05180692672729492, -0.049808502197265625, -0.04781007766723633, -0.04581165313720703, -0.043813228607177734, -0.04181480407714844, -0.03981637954711914, -0.037817955017089844, -0.03581953048706055, -0.03382110595703125, -0.03182268142700195, -0.029824256896972656, -0.02782583236694336, -0.025827407836914062, -0.023828983306884766, -0.02183055877685547, -0.019832134246826172, -0.017833709716796875, -0.015835285186767578, -0.013836860656738281, -0.011838436126708984, -0.009840011596679688, -0.00784158706665039, -0.005843162536621094, -0.003844738006591797, -0.0018463134765625, 0.00015211105346679688, 0.0021505355834960938, 0.004148960113525391, 0.0061473846435546875, 0.008145809173583984, 0.010144233703613281, 0.012142658233642578, 0.014141082763671875, 0.016139507293701172, 0.01813793182373047, 0.020136356353759766, 0.022134780883789062, 0.02413320541381836, 0.026131629943847656, 0.028130054473876953, 0.03012847900390625, 0.03212690353393555, 0.034125328063964844, 0.03612375259399414, 0.03812217712402344, 0.040120601654052734, 0.04211902618408203, 0.04411745071411133, 0.046115875244140625, 0.04811429977416992, 0.05011272430419922, 0.052111148834228516, 0.05410957336425781, 0.05610799789428711, 0.058106422424316406, 0.0601048469543457, 0.062103271484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 8.0, 10.0, 9.0, 35.0, 25.0, 44.0, 35.0, 72.0, 81.0, 106.0, 160.0, 322.0, 699.0, 2612.0, 21797.0, 308368.0, 642027.0, 64184.0, 5609.0, 1144.0, 422.0, 252.0, 124.0, 97.0, 74.0, 37.0, 37.0, 39.0, 23.0, 15.0, 19.0, 18.0, 7.0, 8.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.03753042221069336, -0.03615093231201172, -0.03477144241333008, -0.03339195251464844, -0.0320124626159668, -0.030632972717285156, -0.029253482818603516, -0.027873992919921875, -0.026494503021240234, -0.025115013122558594, -0.023735523223876953, -0.022356033325195312, -0.020976543426513672, -0.01959705352783203, -0.01821756362915039, -0.01683807373046875, -0.01545858383178711, -0.014079093933105469, -0.012699604034423828, -0.011320114135742188, -0.009940624237060547, -0.008561134338378906, -0.007181644439697266, -0.005802154541015625, -0.004422664642333984, -0.0030431747436523438, -0.0016636848449707031, -0.0002841949462890625, 0.0010952949523925781, 0.0024747848510742188, 0.0038542747497558594, 0.0052337646484375, 0.006613254547119141, 0.007992744445800781, 0.009372234344482422, 0.010751724243164062, 0.012131214141845703, 0.013510704040527344, 0.014890193939208984, 0.016269683837890625, 0.017649173736572266, 0.019028663635253906, 0.020408153533935547, 0.021787643432617188, 0.023167133331298828, 0.02454662322998047, 0.02592611312866211, 0.02730560302734375, 0.02868509292602539, 0.03006458282470703, 0.03144407272338867, 0.03282356262207031, 0.03420305252075195, 0.035582542419433594, 0.036962032318115234, 0.038341522216796875, 0.039721012115478516, 0.041100502014160156, 0.0424799919128418, 0.04385948181152344, 0.04523897171020508, 0.04661846160888672, 0.04799795150756836, 0.04937744140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 10.0, 6.0, 13.0, 14.0, 12.0, 24.0, 25.0, 25.0, 38.0, 43.0, 42.0, 45.0, 40.0, 42.0, 59.0, 54.0, 59.0, 45.0, 46.0, 49.0, 46.0, 34.0, 37.0, 34.0, 32.0, 21.0, 15.0, 23.0, 11.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.033660888671875, -0.03272652626037598, -0.03179216384887695, -0.03085780143737793, -0.029923439025878906, -0.028989076614379883, -0.02805471420288086, -0.027120351791381836, -0.026185989379882812, -0.02525162696838379, -0.024317264556884766, -0.023382902145385742, -0.02244853973388672, -0.021514177322387695, -0.020579814910888672, -0.01964545249938965, -0.018711090087890625, -0.0177767276763916, -0.016842365264892578, -0.015908002853393555, -0.014973640441894531, -0.014039278030395508, -0.013104915618896484, -0.012170553207397461, -0.011236190795898438, -0.010301828384399414, -0.00936746597290039, -0.008433103561401367, -0.007498741149902344, -0.00656437873840332, -0.005630016326904297, -0.0046956539154052734, -0.00376129150390625, -0.0028269290924072266, -0.0018925666809082031, -0.0009582042694091797, -2.384185791015625e-05, 0.0009105205535888672, 0.0018448829650878906, 0.002779245376586914, 0.0037136077880859375, 0.004647970199584961, 0.005582332611083984, 0.006516695022583008, 0.007451057434082031, 0.008385419845581055, 0.009319782257080078, 0.010254144668579102, 0.011188507080078125, 0.012122869491577148, 0.013057231903076172, 0.013991594314575195, 0.014925956726074219, 0.015860319137573242, 0.016794681549072266, 0.01772904396057129, 0.018663406372070312, 0.019597768783569336, 0.02053213119506836, 0.021466493606567383, 0.022400856018066406, 0.02333521842956543, 0.024269580841064453, 0.025203943252563477, 0.0261383056640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 19.0, 22.0, 42.0, 78.0, 161.0, 310.0, 702.0, 1620.0, 4639.0, 14851.0, 74813.0, 653321.0, 252636.0, 32245.0, 8290.0, 2733.0, 1079.0, 470.0, 224.0, 132.0, 64.0, 33.0, 15.0, 10.0, 12.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0175323486328125, -0.017013072967529297, -0.016493797302246094, -0.01597452163696289, -0.015455245971679688, -0.014935970306396484, -0.014416694641113281, -0.013897418975830078, -0.013378143310546875, -0.012858867645263672, -0.012339591979980469, -0.011820316314697266, -0.011301040649414062, -0.01078176498413086, -0.010262489318847656, -0.009743213653564453, -0.00922393798828125, -0.008704662322998047, -0.008185386657714844, -0.007666110992431641, -0.0071468353271484375, -0.006627559661865234, -0.006108283996582031, -0.005589008331298828, -0.005069732666015625, -0.004550457000732422, -0.004031181335449219, -0.0035119056701660156, -0.0029926300048828125, -0.0024733543395996094, -0.0019540786743164062, -0.0014348030090332031, -0.00091552734375, -0.0003962516784667969, 0.00012302398681640625, 0.0006422996520996094, 0.0011615753173828125, 0.0016808509826660156, 0.0022001266479492188, 0.002719402313232422, 0.003238677978515625, 0.003757953643798828, 0.004277229309082031, 0.004796504974365234, 0.0053157806396484375, 0.005835056304931641, 0.006354331970214844, 0.006873607635498047, 0.00739288330078125, 0.007912158966064453, 0.008431434631347656, 0.00895071029663086, 0.009469985961914062, 0.009989261627197266, 0.010508537292480469, 0.011027812957763672, 0.011547088623046875, 0.012066364288330078, 0.012585639953613281, 0.013104915618896484, 0.013624191284179688, 0.01414346694946289, 0.014662742614746094, 0.015182018280029297, 0.0157012939453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 4.0, 8.0, 8.0, 13.0, 18.0, 24.0, 30.0, 41.0, 32.0, 61.0, 80.0, 80.0, 79.0, 79.0, 77.0, 77.0, 53.0, 47.0, 47.0, 38.0, 23.0, 18.0, 12.0, 15.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4836273193359375e-05, -5.3009018301963806e-05, -5.118176341056824e-05, -4.935450851917267e-05, -4.75272536277771e-05, -4.569999873638153e-05, -4.387274384498596e-05, -4.204548895359039e-05, -4.0218234062194824e-05, -3.8390979170799255e-05, -3.6563724279403687e-05, -3.473646938800812e-05, -3.290921449661255e-05, -3.108195960521698e-05, -2.925470471382141e-05, -2.7427449822425842e-05, -2.5600194931030273e-05, -2.3772940039634705e-05, -2.1945685148239136e-05, -2.0118430256843567e-05, -1.8291175365447998e-05, -1.646392047405243e-05, -1.463666558265686e-05, -1.2809410691261292e-05, -1.0982155799865723e-05, -9.154900908470154e-06, -7.327646017074585e-06, -5.500391125679016e-06, -3.6731362342834473e-06, -1.8458813428878784e-06, -1.862645149230957e-08, 1.8086284399032593e-06, 3.635883331298828e-06, 5.463138222694397e-06, 7.290393114089966e-06, 9.117648005485535e-06, 1.0944902896881104e-05, 1.2772157788276672e-05, 1.4599412679672241e-05, 1.642666757106781e-05, 1.825392246246338e-05, 2.0081177353858948e-05, 2.1908432245254517e-05, 2.3735687136650085e-05, 2.5562942028045654e-05, 2.7390196919441223e-05, 2.9217451810836792e-05, 3.104470670223236e-05, 3.287196159362793e-05, 3.46992164850235e-05, 3.652647137641907e-05, 3.8353726267814636e-05, 4.0180981159210205e-05, 4.2008236050605774e-05, 4.383549094200134e-05, 4.566274583339691e-05, 4.749000072479248e-05, 4.931725561618805e-05, 5.114451050758362e-05, 5.297176539897919e-05, 5.4799020290374756e-05, 5.6626275181770325e-05, 5.8453530073165894e-05, 6.028078496456146e-05, 6.210803985595703e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 9.0, 8.0, 14.0, 25.0, 31.0, 41.0, 74.0, 138.0, 251.0, 733.0, 1864.0, 5236.0, 18493.0, 132331.0, 768799.0, 97500.0, 15409.0, 4660.0, 1642.0, 673.0, 283.0, 138.0, 78.0, 44.0, 22.0, 10.0, 15.0, 5.0, 6.0, 1.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185089111328125, -0.01788020133972168, -0.01725149154663086, -0.01662278175354004, -0.01599407196044922, -0.015365362167358398, -0.014736652374267578, -0.014107942581176758, -0.013479232788085938, -0.012850522994995117, -0.012221813201904297, -0.011593103408813477, -0.010964393615722656, -0.010335683822631836, -0.009706974029541016, -0.009078264236450195, -0.008449554443359375, -0.007820844650268555, -0.007192134857177734, -0.006563425064086914, -0.005934715270996094, -0.0053060054779052734, -0.004677295684814453, -0.004048585891723633, -0.0034198760986328125, -0.002791166305541992, -0.002162456512451172, -0.0015337467193603516, -0.0009050369262695312, -0.00027632713317871094, 0.0003523826599121094, 0.0009810924530029297, 0.00160980224609375, 0.0022385120391845703, 0.0028672218322753906, 0.003495931625366211, 0.004124641418457031, 0.0047533512115478516, 0.005382061004638672, 0.006010770797729492, 0.0066394805908203125, 0.007268190383911133, 0.007896900177001953, 0.008525609970092773, 0.009154319763183594, 0.009783029556274414, 0.010411739349365234, 0.011040449142456055, 0.011669158935546875, 0.012297868728637695, 0.012926578521728516, 0.013555288314819336, 0.014183998107910156, 0.014812707901000977, 0.015441417694091797, 0.016070127487182617, 0.016698837280273438, 0.017327547073364258, 0.017956256866455078, 0.0185849666595459, 0.01921367645263672, 0.01984238624572754, 0.02047109603881836, 0.02109980583190918, 0.021728515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 8.0, 9.0, 8.0, 19.0, 18.0, 19.0, 34.0, 43.0, 58.0, 72.0, 96.0, 107.0, 123.0, 103.0, 62.0, 46.0, 49.0, 25.0, 13.0, 18.0, 13.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01291656494140625, -0.01257479190826416, -0.01223301887512207, -0.01189124584197998, -0.01154947280883789, -0.0112076997756958, -0.010865926742553711, -0.010524153709411621, -0.010182380676269531, -0.009840607643127441, -0.009498834609985352, -0.009157061576843262, -0.008815288543701172, -0.008473515510559082, -0.008131742477416992, -0.007789969444274902, -0.0074481964111328125, -0.007106423377990723, -0.006764650344848633, -0.006422877311706543, -0.006081104278564453, -0.005739331245422363, -0.0053975582122802734, -0.005055785179138184, -0.004714012145996094, -0.004372239112854004, -0.004030466079711914, -0.0036886930465698242, -0.0033469200134277344, -0.0030051469802856445, -0.0026633739471435547, -0.002321600914001465, -0.001979827880859375, -0.0016380548477172852, -0.0012962818145751953, -0.0009545087814331055, -0.0006127357482910156, -0.0002709627151489258, 7.081031799316406e-05, 0.0004125833511352539, 0.0007543563842773438, 0.0010961294174194336, 0.0014379024505615234, 0.0017796754837036133, 0.002121448516845703, 0.002463221549987793, 0.002804994583129883, 0.0031467676162719727, 0.0034885406494140625, 0.0038303136825561523, 0.004172086715698242, 0.004513859748840332, 0.004855632781982422, 0.005197405815124512, 0.0055391788482666016, 0.005880951881408691, 0.006222724914550781, 0.006564497947692871, 0.006906270980834961, 0.007248044013977051, 0.007589817047119141, 0.00793159008026123, 0.00827336311340332, 0.00861513614654541, 0.0089569091796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 46.0, 428.0, 467.0, 50.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8015698194503784, -0.7867310047149658, -0.7718921303749084, -0.7570532560348511, -0.7422144412994385, -0.7273756265640259, -0.7125367522239685, -0.6976978778839111, -0.6828590631484985, -0.6680202484130859, -0.6531813740730286, -0.6383424997329712, -0.6235036849975586, -0.608664870262146, -0.5938259959220886, -0.5789871215820312, -0.5641483068466187, -0.549309492111206, -0.5344706177711487, -0.5196317434310913, -0.5047929286956787, -0.4899540841579437, -0.47511523962020874, -0.46027639508247375, -0.44543755054473877, -0.4305987060070038, -0.4157598614692688, -0.4009210169315338, -0.38608217239379883, -0.37124332785606384, -0.35640448331832886, -0.34156563878059387, -0.3267267942428589, -0.3118879497051239, -0.2970491051673889, -0.28221026062965393, -0.26737141609191895, -0.25253257155418396, -0.23769372701644897, -0.222854882478714, -0.2080160528421402, -0.1931772083044052, -0.17833836376667023, -0.16349951922893524, -0.14866067469120026, -0.13382183015346527, -0.11898298561573029, -0.1041441410779953, -0.08930529654026031, -0.07446645200252533, -0.059627607464790344, -0.04478876292705536, -0.029949918389320374, -0.015111073851585388, -0.00027222931385040283, 0.014566615223884583, 0.029405459761619568, 0.04424430429935455, 0.05908314883708954, 0.07392199337482452, 0.08876083791255951, 0.1035996824502945, 0.11843852698802948, 0.13327737152576447, 0.14811621606349945]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 8.0, 2.0, 11.0, 13.0, 17.0, 11.0, 17.0, 11.0, 21.0, 23.0, 27.0, 37.0, 32.0, 35.0, 29.0, 33.0, 38.0, 33.0, 49.0, 53.0, 32.0, 28.0, 34.0, 37.0, 32.0, 37.0, 33.0, 26.0, 25.0, 33.0, 20.0, 30.0, 25.0, 14.0, 15.0, 17.0, 9.0, 3.0, 8.0, 8.0, 2.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061264991760253906, -0.05924972519278526, -0.05723445862531662, -0.05521918833255768, -0.053203921765089035, -0.05118865519762039, -0.04917338490486145, -0.04715811833739281, -0.045142851769924164, -0.04312758520245552, -0.04111231863498688, -0.039097048342227936, -0.03708178177475929, -0.03506651520729065, -0.03305124491453171, -0.031035978347063065, -0.02902071177959442, -0.027005445212125778, -0.024990176782011986, -0.022974908351898193, -0.02095964178442955, -0.018944375216960907, -0.016929106786847115, -0.014913839288055897, -0.012898571789264679, -0.010883304290473461, -0.008868036791682243, -0.0068527692928910255, -0.004837501794099808, -0.00282223429530859, -0.0008069667965173721, 0.0012083007022738457, 0.0032235682010650635, 0.005238835699856281, 0.007254103198647499, 0.009269370697438717, 0.011284638196229935, 0.013299905695021152, 0.01531517319381237, 0.017330441623926163, 0.019345708191394806, 0.02136097475886345, 0.02337624318897724, 0.025391511619091034, 0.027406778186559677, 0.02942204475402832, 0.03143731504678726, 0.033452581614255905, 0.03546784818172455, 0.03748311474919319, 0.039498381316661835, 0.041513651609420776, 0.04352891817688942, 0.04554418474435806, 0.047559455037117004, 0.04957472160458565, 0.05158998817205429, 0.053605254739522934, 0.05562052130699158, 0.05763579159975052, 0.05965105816721916, 0.061666324734687805, 0.06368159502744675, 0.06569685786962509, 0.06771212816238403]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 16.0, 10.0, 20.0, 50.0, 78.0, 216.0, 759.0, 1824.0, 2917.0, 5687.0, 47698.0, 4042111.0, 81639.0, 6369.0, 2646.0, 853.0, 597.0, 450.0, 143.0, 59.0, 44.0, 15.0, 18.0, 16.0, 9.0, 4.0, 5.0, 8.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.050330162048339844, -0.04862785339355469, -0.04692554473876953, -0.045223236083984375, -0.04352092742919922, -0.04181861877441406, -0.040116310119628906, -0.03841400146484375, -0.036711692810058594, -0.03500938415527344, -0.03330707550048828, -0.031604766845703125, -0.02990245819091797, -0.028200149536132812, -0.026497840881347656, -0.0247955322265625, -0.023093223571777344, -0.021390914916992188, -0.01968860626220703, -0.017986297607421875, -0.01628398895263672, -0.014581680297851562, -0.012879371643066406, -0.01117706298828125, -0.009474754333496094, -0.0077724456787109375, -0.006070137023925781, -0.004367828369140625, -0.0026655197143554688, -0.0009632110595703125, 0.0007390975952148438, 0.00244140625, 0.004143714904785156, 0.0058460235595703125, 0.007548332214355469, 0.009250640869140625, 0.010952949523925781, 0.012655258178710938, 0.014357566833496094, 0.01605987548828125, 0.017762184143066406, 0.019464492797851562, 0.02116680145263672, 0.022869110107421875, 0.02457141876220703, 0.026273727416992188, 0.027976036071777344, 0.0296783447265625, 0.031380653381347656, 0.03308296203613281, 0.03478527069091797, 0.036487579345703125, 0.03818988800048828, 0.03989219665527344, 0.041594505310058594, 0.04329681396484375, 0.044999122619628906, 0.04670143127441406, 0.04840373992919922, 0.050106048583984375, 0.05180835723876953, 0.05351066589355469, 0.055212974548339844, 0.056915283203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 28.0, 114.0, 327.0, 352.0, 143.0, 26.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06903076171875, -0.06700563430786133, -0.06498050689697266, -0.06295537948608398, -0.06093025207519531, -0.05890512466430664, -0.05687999725341797, -0.0548548698425293, -0.052829742431640625, -0.05080461502075195, -0.04877948760986328, -0.04675436019897461, -0.04472923278808594, -0.042704105377197266, -0.040678977966308594, -0.03865385055541992, -0.03662872314453125, -0.03460359573364258, -0.032578468322753906, -0.030553340911865234, -0.028528213500976562, -0.02650308609008789, -0.02447795867919922, -0.022452831268310547, -0.020427703857421875, -0.018402576446533203, -0.01637744903564453, -0.01435232162475586, -0.012327194213867188, -0.010302066802978516, -0.008276939392089844, -0.006251811981201172, -0.0042266845703125, -0.002201557159423828, -0.00017642974853515625, 0.0018486976623535156, 0.0038738250732421875, 0.005898952484130859, 0.007924079895019531, 0.009949207305908203, 0.011974334716796875, 0.013999462127685547, 0.01602458953857422, 0.01804971694946289, 0.020074844360351562, 0.022099971771240234, 0.024125099182128906, 0.026150226593017578, 0.02817535400390625, 0.030200481414794922, 0.032225608825683594, 0.034250736236572266, 0.03627586364746094, 0.03830099105834961, 0.04032611846923828, 0.04235124588012695, 0.044376373291015625, 0.0464015007019043, 0.04842662811279297, 0.05045175552368164, 0.05247688293457031, 0.054502010345458984, 0.056527137756347656, 0.05855226516723633, 0.060577392578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 7.0, 32.0, 73.0, 109.0, 320.0, 1448.0, 24329.0, 4005485.0, 158030.0, 3655.0, 522.0, 157.0, 63.0, 23.0, 10.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.028659343719482422, -0.026709556579589844, -0.024759769439697266, -0.022809982299804688, -0.02086019515991211, -0.01891040802001953, -0.016960620880126953, -0.015010833740234375, -0.013061046600341797, -0.011111259460449219, -0.00916147232055664, -0.0072116851806640625, -0.005261898040771484, -0.0033121109008789062, -0.0013623237609863281, 0.00058746337890625, 0.002537250518798828, 0.004487037658691406, 0.006436824798583984, 0.008386611938476562, 0.01033639907836914, 0.012286186218261719, 0.014235973358154297, 0.016185760498046875, 0.018135547637939453, 0.02008533477783203, 0.02203512191772461, 0.023984909057617188, 0.025934696197509766, 0.027884483337402344, 0.029834270477294922, 0.0317840576171875, 0.03373384475708008, 0.035683631896972656, 0.037633419036865234, 0.03958320617675781, 0.04153299331665039, 0.04348278045654297, 0.04543256759643555, 0.047382354736328125, 0.0493321418762207, 0.05128192901611328, 0.05323171615600586, 0.05518150329589844, 0.057131290435791016, 0.059081077575683594, 0.06103086471557617, 0.06298065185546875, 0.06493043899536133, 0.0668802261352539, 0.06883001327514648, 0.07077980041503906, 0.07272958755493164, 0.07467937469482422, 0.0766291618347168, 0.07857894897460938, 0.08052873611450195, 0.08247852325439453, 0.08442831039428711, 0.08637809753417969, 0.08832788467407227, 0.09027767181396484, 0.09222745895385742, 0.09417724609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 22.0, 54.0, 89.0, 209.0, 715.0, 1823.0, 724.0, 206.0, 97.0, 49.0, 31.0, 16.0, 13.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.041153669357299805, -0.04016256332397461, -0.039171457290649414, -0.03818035125732422, -0.03718924522399902, -0.03619813919067383, -0.03520703315734863, -0.03421592712402344, -0.03322482109069824, -0.03223371505737305, -0.03124260902404785, -0.030251502990722656, -0.02926039695739746, -0.028269290924072266, -0.02727818489074707, -0.026287078857421875, -0.02529597282409668, -0.024304866790771484, -0.02331376075744629, -0.022322654724121094, -0.0213315486907959, -0.020340442657470703, -0.019349336624145508, -0.018358230590820312, -0.017367124557495117, -0.016376018524169922, -0.015384912490844727, -0.014393806457519531, -0.013402700424194336, -0.01241159439086914, -0.011420488357543945, -0.01042938232421875, -0.009438276290893555, -0.00844717025756836, -0.007456064224243164, -0.006464958190917969, -0.0054738521575927734, -0.004482746124267578, -0.003491640090942383, -0.0025005340576171875, -0.0015094280242919922, -0.0005183219909667969, 0.00047278404235839844, 0.0014638900756835938, 0.002454996109008789, 0.0034461021423339844, 0.00443720817565918, 0.005428314208984375, 0.00641942024230957, 0.007410526275634766, 0.008401632308959961, 0.009392738342285156, 0.010383844375610352, 0.011374950408935547, 0.012366056442260742, 0.013357162475585938, 0.014348268508911133, 0.015339374542236328, 0.016330480575561523, 0.01732158660888672, 0.018312692642211914, 0.01930379867553711, 0.020294904708862305, 0.0212860107421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 26.0, 92.0, 252.0, 346.0, 190.0, 63.0, 19.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307908296585083, -0.12615326046943665, -0.12151569128036499, -0.11687812209129333, -0.11224055290222168, -0.10760298371315002, -0.10296542197465897, -0.09832785278558731, -0.09369028359651566, -0.089052714407444, -0.08441514521837234, -0.07977757602930069, -0.07514001429080963, -0.07050244510173798, -0.06586487591266632, -0.061227306723594666, -0.05658973753452301, -0.051952168345451355, -0.0473145991563797, -0.04267703369259834, -0.03803946450352669, -0.03340189531445503, -0.028764327988028526, -0.02412676066160202, -0.019489191472530365, -0.014851623214781284, -0.010214054957032204, -0.005576486699283123, -0.0009389184415340424, 0.003698650747537613, 0.008336218073964119, 0.012973785400390625, 0.01761135458946228, 0.022248923778533936, 0.02688649110496044, 0.03152405843138695, 0.0361616276204586, 0.04079919680953026, 0.045436762273311615, 0.05007433146238327, 0.054711900651454926, 0.05934946984052658, 0.06398703902959824, 0.06862460821866989, 0.07326216995716095, 0.0778997391462326, 0.08253730833530426, 0.08717487752437592, 0.09181244671344757, 0.09645001590251923, 0.10108758509159088, 0.10572515428066254, 0.11036272346973419, 0.11500029265880585, 0.1196378543972969, 0.12427542358636856, 0.12891298532485962, 0.13355055451393127, 0.13818812370300293, 0.14282569289207458, 0.14746326208114624, 0.1521008312702179, 0.15673840045928955, 0.1613759696483612, 0.16601353883743286]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 2.0, 4.0, 11.0, 6.0, 13.0, 21.0, 19.0, 17.0, 26.0, 17.0, 30.0, 24.0, 30.0, 45.0, 39.0, 51.0, 40.0, 42.0, 44.0, 42.0, 41.0, 32.0, 54.0, 30.0, 34.0, 32.0, 36.0, 29.0, 24.0, 29.0, 23.0, 26.0, 15.0, 11.0, 13.0, 11.0, 11.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0357244610786438, -0.03455135226249695, -0.0333782434463501, -0.03220513090491295, -0.031032022088766098, -0.029858913272619247, -0.028685802593827248, -0.027512691915035248, -0.026339583098888397, -0.025166474282741547, -0.023993363603949547, -0.022820252925157547, -0.021647144109010696, -0.020474035292863846, -0.019300924614071846, -0.018127813935279846, -0.016954705119132996, -0.015781596302986145, -0.014608485624194145, -0.01343537587672472, -0.012262266129255295, -0.01108915638178587, -0.009916046634316444, -0.00874293688684702, -0.007569827139377594, -0.006396717391908169, -0.005223607644438744, -0.004050497896969318, -0.002877388149499893, -0.001704278402030468, -0.0005311686545610428, 0.0006419410929083824, 0.0018150508403778076, 0.002988160587847233, 0.004161270335316658, 0.005334380082786083, 0.006507489830255508, 0.007680599577724934, 0.008853709325194359, 0.010026819072663784, 0.01119992882013321, 0.012373038567602634, 0.01354614831507206, 0.014719258062541485, 0.01589236781001091, 0.01706547662615776, 0.01823858730494976, 0.01941169798374176, 0.02058480679988861, 0.02175791561603546, 0.02293102629482746, 0.02410413697361946, 0.02527724578976631, 0.026450354605913162, 0.027623465284705162, 0.028796575963497162, 0.029969684779644012, 0.031142793595790863, 0.032315902411937714, 0.03348901495337486, 0.03466212376952171, 0.035835232585668564, 0.03700834512710571, 0.038181453943252563, 0.039354562759399414]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 4.0, 6.0, 18.0, 21.0, 24.0, 36.0, 51.0, 68.0, 73.0, 105.0, 181.0, 224.0, 324.0, 486.0, 701.0, 1285.0, 4094.0, 37281.0, 729895.0, 255639.0, 12761.0, 2290.0, 932.0, 593.0, 372.0, 285.0, 211.0, 147.0, 114.0, 82.0, 71.0, 58.0, 22.0, 19.0, 20.0, 7.0, 12.0, 4.0, 3.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.044921875, -0.04359245300292969, -0.042263031005859375, -0.04093360900878906, -0.03960418701171875, -0.03827476501464844, -0.036945343017578125, -0.03561592102050781, -0.0342864990234375, -0.03295707702636719, -0.031627655029296875, -0.030298233032226562, -0.02896881103515625, -0.027639389038085938, -0.026309967041015625, -0.024980545043945312, -0.023651123046875, -0.022321701049804688, -0.020992279052734375, -0.019662857055664062, -0.01833343505859375, -0.017004013061523438, -0.015674591064453125, -0.014345169067382812, -0.0130157470703125, -0.011686325073242188, -0.010356903076171875, -0.009027481079101562, -0.00769805908203125, -0.0063686370849609375, -0.005039215087890625, -0.0037097930908203125, -0.00238037109375, -0.0010509490966796875, 0.000278472900390625, 0.0016078948974609375, 0.00293731689453125, 0.0042667388916015625, 0.005596160888671875, 0.0069255828857421875, 0.0082550048828125, 0.009584426879882812, 0.010913848876953125, 0.012243270874023438, 0.01357269287109375, 0.014902114868164062, 0.016231536865234375, 0.017560958862304688, 0.018890380859375, 0.020219802856445312, 0.021549224853515625, 0.022878646850585938, 0.02420806884765625, 0.025537490844726562, 0.026866912841796875, 0.028196334838867188, 0.0295257568359375, 0.030855178833007812, 0.032184600830078125, 0.03351402282714844, 0.03484344482421875, 0.03617286682128906, 0.037502288818359375, 0.03883171081542969, 0.0401611328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 16.0, 84.0, 274.0, 366.0, 205.0, 44.0, 9.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0660400390625, -0.06406116485595703, -0.06208229064941406, -0.060103416442871094, -0.058124542236328125, -0.056145668029785156, -0.05416679382324219, -0.05218791961669922, -0.05020904541015625, -0.04823017120361328, -0.04625129699707031, -0.044272422790527344, -0.042293548583984375, -0.040314674377441406, -0.03833580017089844, -0.03635692596435547, -0.0343780517578125, -0.03239917755126953, -0.030420303344726562, -0.028441429138183594, -0.026462554931640625, -0.024483680725097656, -0.022504806518554688, -0.02052593231201172, -0.01854705810546875, -0.01656818389892578, -0.014589309692382812, -0.012610435485839844, -0.010631561279296875, -0.008652687072753906, -0.0066738128662109375, -0.004694938659667969, -0.002716064453125, -0.0007371902465820312, 0.0012416839599609375, 0.0032205581665039062, 0.005199432373046875, 0.007178306579589844, 0.009157180786132812, 0.011136054992675781, 0.01311492919921875, 0.015093803405761719, 0.017072677612304688, 0.019051551818847656, 0.021030426025390625, 0.023009300231933594, 0.024988174438476562, 0.02696704864501953, 0.0289459228515625, 0.03092479705810547, 0.03290367126464844, 0.034882545471191406, 0.036861419677734375, 0.038840293884277344, 0.04081916809082031, 0.04279804229736328, 0.04477691650390625, 0.04675579071044922, 0.04873466491699219, 0.050713539123535156, 0.052692413330078125, 0.054671287536621094, 0.05665016174316406, 0.05862903594970703, 0.06060791015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 8.0, 12.0, 11.0, 16.0, 19.0, 25.0, 32.0, 28.0, 45.0, 60.0, 77.0, 84.0, 118.0, 191.0, 513.0, 2211.0, 30297.0, 689026.0, 312042.0, 11477.0, 1283.0, 319.0, 153.0, 79.0, 95.0, 63.0, 60.0, 39.0, 38.0, 39.0, 17.0, 20.0, 16.0, 11.0, 8.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04284381866455078, -0.04149818420410156, -0.040152549743652344, -0.038806915283203125, -0.037461280822753906, -0.03611564636230469, -0.03477001190185547, -0.03342437744140625, -0.03207874298095703, -0.030733108520507812, -0.029387474060058594, -0.028041839599609375, -0.026696205139160156, -0.025350570678710938, -0.02400493621826172, -0.0226593017578125, -0.02131366729736328, -0.019968032836914062, -0.018622398376464844, -0.017276763916015625, -0.015931129455566406, -0.014585494995117188, -0.013239860534667969, -0.01189422607421875, -0.010548591613769531, -0.009202957153320312, -0.007857322692871094, -0.006511688232421875, -0.005166053771972656, -0.0038204193115234375, -0.0024747848510742188, -0.001129150390625, 0.00021648406982421875, 0.0015621185302734375, 0.0029077529907226562, 0.004253387451171875, 0.005599021911621094, 0.0069446563720703125, 0.008290290832519531, 0.00963592529296875, 0.010981559753417969, 0.012327194213867188, 0.013672828674316406, 0.015018463134765625, 0.016364097595214844, 0.017709732055664062, 0.01905536651611328, 0.0204010009765625, 0.02174663543701172, 0.023092269897460938, 0.024437904357910156, 0.025783538818359375, 0.027129173278808594, 0.028474807739257812, 0.02982044219970703, 0.03116607666015625, 0.03251171112060547, 0.03385734558105469, 0.035202980041503906, 0.036548614501953125, 0.037894248962402344, 0.03923988342285156, 0.04058551788330078, 0.04193115234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 1.0, 8.0, 9.0, 11.0, 10.0, 9.0, 11.0, 21.0, 20.0, 27.0, 32.0, 32.0, 33.0, 36.0, 37.0, 34.0, 48.0, 53.0, 45.0, 55.0, 50.0, 47.0, 40.0, 55.0, 38.0, 44.0, 29.0, 26.0, 33.0, 22.0, 23.0, 9.0, 9.0, 11.0, 7.0, 9.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024993896484375, -0.024166107177734375, -0.02333831787109375, -0.022510528564453125, -0.0216827392578125, -0.020854949951171875, -0.02002716064453125, -0.019199371337890625, -0.01837158203125, -0.017543792724609375, -0.01671600341796875, -0.015888214111328125, -0.0150604248046875, -0.014232635498046875, -0.01340484619140625, -0.012577056884765625, -0.011749267578125, -0.010921478271484375, -0.01009368896484375, -0.009265899658203125, -0.0084381103515625, -0.007610321044921875, -0.00678253173828125, -0.005954742431640625, -0.005126953125, -0.004299163818359375, -0.00347137451171875, -0.002643585205078125, -0.0018157958984375, -0.000988006591796875, -0.00016021728515625, 0.000667572021484375, 0.001495361328125, 0.002323150634765625, 0.00315093994140625, 0.003978729248046875, 0.0048065185546875, 0.005634307861328125, 0.00646209716796875, 0.007289886474609375, 0.00811767578125, 0.008945465087890625, 0.00977325439453125, 0.010601043701171875, 0.0114288330078125, 0.012256622314453125, 0.01308441162109375, 0.013912200927734375, 0.014739990234375, 0.015567779541015625, 0.01639556884765625, 0.017223358154296875, 0.0180511474609375, 0.018878936767578125, 0.01970672607421875, 0.020534515380859375, 0.0213623046875, 0.022190093994140625, 0.02301788330078125, 0.023845672607421875, 0.0246734619140625, 0.025501251220703125, 0.02632904052734375, 0.027156829833984375, 0.027984619140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 7.0, 10.0, 12.0, 19.0, 40.0, 74.0, 126.0, 186.0, 342.0, 714.0, 1391.0, 2883.0, 5942.0, 14363.0, 37843.0, 114276.0, 374506.0, 337126.0, 100985.0, 33775.0, 12970.0, 5565.0, 2643.0, 1287.0, 646.0, 357.0, 190.0, 113.0, 55.0, 37.0, 22.0, 18.0, 9.0, 10.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0056304931640625, -0.00545424222946167, -0.00527799129486084, -0.00510174036026001, -0.00492548942565918, -0.00474923849105835, -0.0045729875564575195, -0.0043967366218566895, -0.004220485687255859, -0.004044234752655029, -0.0038679838180541992, -0.003691732883453369, -0.003515481948852539, -0.003339231014251709, -0.003162980079650879, -0.002986729145050049, -0.0028104782104492188, -0.0026342272758483887, -0.0024579763412475586, -0.0022817254066467285, -0.0021054744720458984, -0.0019292235374450684, -0.0017529726028442383, -0.0015767216682434082, -0.0014004707336425781, -0.001224219799041748, -0.001047968864440918, -0.0008717179298400879, -0.0006954669952392578, -0.0005192160606384277, -0.00034296512603759766, -0.00016671419143676758, 9.5367431640625e-06, 0.00018578767776489258, 0.00036203861236572266, 0.0005382895469665527, 0.0007145404815673828, 0.0008907914161682129, 0.001067042350769043, 0.001243293285369873, 0.0014195442199707031, 0.0015957951545715332, 0.0017720460891723633, 0.0019482970237731934, 0.0021245479583740234, 0.0023007988929748535, 0.0024770498275756836, 0.0026533007621765137, 0.0028295516967773438, 0.003005802631378174, 0.003182053565979004, 0.003358304500579834, 0.003534555435180664, 0.003710806369781494, 0.0038870573043823242, 0.004063308238983154, 0.004239559173583984, 0.0044158101081848145, 0.0045920610427856445, 0.004768311977386475, 0.004944562911987305, 0.005120813846588135, 0.005297064781188965, 0.005473315715789795, 0.005649566650390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 1.0, 8.0, 8.0, 10.0, 16.0, 41.0, 49.0, 58.0, 85.0, 94.0, 110.0, 122.0, 103.0, 70.0, 54.0, 44.0, 46.0, 27.0, 16.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.090624421834946e-05, -6.837956607341766e-05, -6.585288792848587e-05, -6.332620978355408e-05, -6.0799531638622284e-05, -5.827285349369049e-05, -5.57461753487587e-05, -5.3219497203826904e-05, -5.069281905889511e-05, -4.816614091396332e-05, -4.5639462769031525e-05, -4.311278462409973e-05, -4.058610647916794e-05, -3.8059428334236145e-05, -3.553275018930435e-05, -3.300607204437256e-05, -3.0479393899440765e-05, -2.7952715754508972e-05, -2.542603760957718e-05, -2.2899359464645386e-05, -2.0372681319713593e-05, -1.78460031747818e-05, -1.5319325029850006e-05, -1.2792646884918213e-05, -1.026596873998642e-05, -7.739290595054626e-06, -5.212612450122833e-06, -2.68593430519104e-06, -1.5925616025924683e-07, 2.3674219846725464e-06, 4.89410012960434e-06, 7.420778274536133e-06, 9.947456419467926e-06, 1.247413456439972e-05, 1.5000812709331512e-05, 1.7527490854263306e-05, 2.00541689991951e-05, 2.2580847144126892e-05, 2.5107525289058685e-05, 2.763420343399048e-05, 3.0160881578922272e-05, 3.2687559723854065e-05, 3.521423786878586e-05, 3.774091601371765e-05, 4.0267594158649445e-05, 4.279427230358124e-05, 4.532095044851303e-05, 4.7847628593444824e-05, 5.037430673837662e-05, 5.290098488330841e-05, 5.5427663028240204e-05, 5.7954341173172e-05, 6.048101931810379e-05, 6.300769746303558e-05, 6.553437560796738e-05, 6.806105375289917e-05, 7.058773189783096e-05, 7.311441004276276e-05, 7.564108818769455e-05, 7.816776633262634e-05, 8.069444447755814e-05, 8.322112262248993e-05, 8.574780076742172e-05, 8.827447891235352e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 5.0, 6.0, 10.0, 14.0, 21.0, 25.0, 48.0, 76.0, 166.0, 446.0, 1499.0, 7341.0, 66449.0, 772515.0, 181219.0, 15049.0, 2537.0, 630.0, 224.0, 105.0, 46.0, 36.0, 29.0, 10.0, 14.0, 13.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.018369674682617188, -0.017894744873046875, -0.017419815063476562, -0.01694488525390625, -0.016469955444335938, -0.015995025634765625, -0.015520095825195312, -0.015045166015625, -0.014570236206054688, -0.014095306396484375, -0.013620376586914062, -0.01314544677734375, -0.012670516967773438, -0.012195587158203125, -0.011720657348632812, -0.0112457275390625, -0.010770797729492188, -0.010295867919921875, -0.009820938110351562, -0.00934600830078125, -0.008871078491210938, -0.008396148681640625, -0.007921218872070312, -0.0074462890625, -0.0069713592529296875, -0.006496429443359375, -0.0060214996337890625, -0.00554656982421875, -0.0050716400146484375, -0.004596710205078125, -0.0041217803955078125, -0.0036468505859375, -0.0031719207763671875, -0.002696990966796875, -0.0022220611572265625, -0.00174713134765625, -0.0012722015380859375, -0.000797271728515625, -0.0003223419189453125, 0.000152587890625, 0.0006275177001953125, 0.001102447509765625, 0.0015773773193359375, 0.00205230712890625, 0.0025272369384765625, 0.003002166748046875, 0.0034770965576171875, 0.0039520263671875, 0.0044269561767578125, 0.004901885986328125, 0.0053768157958984375, 0.00585174560546875, 0.0063266754150390625, 0.006801605224609375, 0.0072765350341796875, 0.00775146484375, 0.008226394653320312, 0.008701324462890625, 0.009176254272460938, 0.00965118408203125, 0.010126113891601562, 0.010601043701171875, 0.011075973510742188, 0.0115509033203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 2.0, 4.0, 7.0, 13.0, 9.0, 19.0, 14.0, 29.0, 40.0, 63.0, 54.0, 91.0, 114.0, 104.0, 99.0, 73.0, 61.0, 45.0, 49.0, 26.0, 30.0, 13.0, 7.0, 14.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007579803466796875, -0.007292807102203369, -0.007005810737609863, -0.006718814373016357, -0.0064318180084228516, -0.006144821643829346, -0.00585782527923584, -0.005570828914642334, -0.005283832550048828, -0.004996836185455322, -0.004709839820861816, -0.0044228434562683105, -0.004135847091674805, -0.003848850727081299, -0.003561854362487793, -0.003274857997894287, -0.0029878616333007812, -0.0027008652687072754, -0.0024138689041137695, -0.0021268725395202637, -0.0018398761749267578, -0.001552879810333252, -0.001265883445739746, -0.0009788870811462402, -0.0006918907165527344, -0.0004048943519592285, -0.00011789798736572266, 0.0001690983772277832, 0.00045609474182128906, 0.0007430911064147949, 0.0010300874710083008, 0.0013170838356018066, 0.0016040802001953125, 0.0018910765647888184, 0.0021780729293823242, 0.00246506929397583, 0.002752065658569336, 0.003039062023162842, 0.0033260583877563477, 0.0036130547523498535, 0.0039000511169433594, 0.004187047481536865, 0.004474043846130371, 0.004761040210723877, 0.005048036575317383, 0.005335032939910889, 0.0056220293045043945, 0.0059090256690979, 0.006196022033691406, 0.006483018398284912, 0.006770014762878418, 0.007057011127471924, 0.00734400749206543, 0.0076310038566589355, 0.007918000221252441, 0.008204996585845947, 0.008491992950439453, 0.008778989315032959, 0.009065985679626465, 0.00935298204421997, 0.009639978408813477, 0.009926974773406982, 0.010213971138000488, 0.010500967502593994, 0.0107879638671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 32.0, 602.0, 358.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17137160897254944, -0.15407779812812805, -0.13678400218486786, -0.11949019879102707, -0.10219639539718628, -0.08490259200334549, -0.0676087886095047, -0.05031498521566391, -0.03302118182182312, -0.01572737842798233, 0.0015664249658584595, 0.01886022835969925, 0.03615403175354004, 0.05344783514738083, 0.07074163854122162, 0.08803544193506241, 0.1053292453289032, 0.12262304872274399, 0.13991685211658478, 0.15721064805984497, 0.17450445890426636, 0.19179826974868774, 0.20909206569194794, 0.22638586163520813, 0.24367967247962952, 0.2609734833240509, 0.2782672643661499, 0.2955610752105713, 0.3128548860549927, 0.33014869689941406, 0.34744250774383545, 0.36473628878593445, 0.3820301294326782, 0.3993239402770996, 0.416617751121521, 0.43391153216362, 0.4512053430080414, 0.46849915385246277, 0.48579293489456177, 0.5030867457389832, 0.5203805565834045, 0.5376743674278259, 0.5549681782722473, 0.5722619891166687, 0.5895557403564453, 0.6068495512008667, 0.6241433620452881, 0.6414371728897095, 0.6587309837341309, 0.6760247945785522, 0.6933186054229736, 0.710612416267395, 0.7279062271118164, 0.745199978351593, 0.7624937891960144, 0.7797876000404358, 0.7970814108848572, 0.8143752217292786, 0.8316690325737, 0.8489628434181213, 0.866256594657898, 0.8835504055023193, 0.9008442163467407, 0.9181380271911621, 0.9354318380355835]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 7.0, 1.0, 11.0, 13.0, 15.0, 16.0, 18.0, 15.0, 21.0, 15.0, 25.0, 28.0, 43.0, 37.0, 44.0, 29.0, 35.0, 40.0, 41.0, 36.0, 38.0, 45.0, 37.0, 32.0, 25.0, 30.0, 22.0, 29.0, 27.0, 33.0, 24.0, 24.0, 23.0, 23.0, 11.0, 16.0, 12.0, 9.0, 5.0, 4.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.06923782825469971, -0.06714363396167755, -0.0650494396686554, -0.06295523792505264, -0.06086104363203049, -0.05876684933900833, -0.05667265132069588, -0.05457845330238342, -0.05248425900936127, -0.05039006471633911, -0.04829586669802666, -0.0462016686797142, -0.04410747438669205, -0.04201328009366989, -0.03991908207535744, -0.03782488405704498, -0.03573068976402283, -0.03363649547100067, -0.03154229745268822, -0.029448101297020912, -0.027353905141353607, -0.025259708985686302, -0.023165512830018997, -0.021071316674351692, -0.018977120518684387, -0.016882924363017082, -0.014788728207349777, -0.012694532051682472, -0.010600335896015167, -0.008506139740347862, -0.006411943584680557, -0.004317747429013252, -0.0022235512733459473, -0.00012935511767864227, 0.0019648410379886627, 0.004059037193655968, 0.006153233349323273, 0.008247429504990578, 0.010341625660657883, 0.012435821816325188, 0.014530017971992493, 0.016624214127659798, 0.018718410283327103, 0.020812606438994408, 0.022906802594661713, 0.025000998750329018, 0.027095194905996323, 0.029189391061663628, 0.03128358721733093, 0.03337778151035309, 0.03547197952866554, 0.037566177546978, 0.03966037184000015, 0.04175456613302231, 0.04384876415133476, 0.04594296216964722, 0.04803715646266937, 0.05013135075569153, 0.05222554877400398, 0.05431974679231644, 0.05641394108533859, 0.05850813537836075, 0.0606023333966732, 0.06269653141498566, 0.06479072570800781]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 16.0, 30.0, 101.0, 573.0, 1992.0, 6032.0, 3841636.0, 338164.0, 4129.0, 957.0, 485.0, 89.0, 36.0, 17.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09118270874023438, -0.08849334716796875, -0.08580398559570312, -0.0831146240234375, -0.08042526245117188, -0.07773590087890625, -0.07504653930664062, -0.072357177734375, -0.06966781616210938, -0.06697845458984375, -0.06428909301757812, -0.0615997314453125, -0.058910369873046875, -0.05622100830078125, -0.053531646728515625, -0.05084228515625, -0.048152923583984375, -0.04546356201171875, -0.042774200439453125, -0.0400848388671875, -0.037395477294921875, -0.03470611572265625, -0.032016754150390625, -0.029327392578125, -0.026638031005859375, -0.02394866943359375, -0.021259307861328125, -0.0185699462890625, -0.015880584716796875, -0.01319122314453125, -0.010501861572265625, -0.0078125, -0.005123138427734375, -0.00243377685546875, 0.000255584716796875, 0.0029449462890625, 0.005634307861328125, 0.00832366943359375, 0.011013031005859375, 0.013702392578125, 0.016391754150390625, 0.01908111572265625, 0.021770477294921875, 0.0244598388671875, 0.027149200439453125, 0.02983856201171875, 0.032527923583984375, 0.03521728515625, 0.037906646728515625, 0.04059600830078125, 0.043285369873046875, 0.0459747314453125, 0.048664093017578125, 0.05135345458984375, 0.054042816162109375, 0.056732177734375, 0.059421539306640625, 0.06211090087890625, 0.06480026245117188, 0.0674896240234375, 0.07017898559570312, 0.07286834716796875, 0.07555770874023438, 0.0782470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 28.0, 107.0, 316.0, 372.0, 139.0, 32.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06591796875, -0.06392812728881836, -0.06193828582763672, -0.05994844436645508, -0.05795860290527344, -0.0559687614440918, -0.053978919982910156, -0.051989078521728516, -0.049999237060546875, -0.048009395599365234, -0.046019554138183594, -0.04402971267700195, -0.04203987121582031, -0.04005002975463867, -0.03806018829345703, -0.03607034683227539, -0.03408050537109375, -0.03209066390991211, -0.03010082244873047, -0.028110980987548828, -0.026121139526367188, -0.024131298065185547, -0.022141456604003906, -0.020151615142822266, -0.018161773681640625, -0.016171932220458984, -0.014182090759277344, -0.012192249298095703, -0.010202407836914062, -0.008212566375732422, -0.006222724914550781, -0.004232883453369141, -0.0022430419921875, -0.0002532005310058594, 0.0017366409301757812, 0.003726482391357422, 0.0057163238525390625, 0.007706165313720703, 0.009696006774902344, 0.011685848236083984, 0.013675689697265625, 0.015665531158447266, 0.017655372619628906, 0.019645214080810547, 0.021635055541992188, 0.023624897003173828, 0.02561473846435547, 0.02760457992553711, 0.02959442138671875, 0.03158426284790039, 0.03357410430908203, 0.03556394577026367, 0.03755378723144531, 0.03954362869262695, 0.041533470153808594, 0.043523311614990234, 0.045513153076171875, 0.047502994537353516, 0.049492835998535156, 0.0514826774597168, 0.05347251892089844, 0.05546236038208008, 0.05745220184326172, 0.05944204330444336, 0.061431884765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 8.0, 18.0, 43.0, 67.0, 128.0, 251.0, 610.0, 1496.0, 4288.0, 15905.0, 87024.0, 2808457.0, 1191198.0, 65855.0, 12940.0, 3708.0, 1245.0, 521.0, 234.0, 120.0, 70.0, 31.0, 22.0, 9.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01361846923828125, -0.013024449348449707, -0.012430429458618164, -0.011836409568786621, -0.011242389678955078, -0.010648369789123535, -0.010054349899291992, -0.00946033000946045, -0.008866310119628906, -0.008272290229797363, -0.00767827033996582, -0.007084250450134277, -0.006490230560302734, -0.005896210670471191, -0.0053021907806396484, -0.0047081708908081055, -0.0041141510009765625, -0.0035201311111450195, -0.0029261112213134766, -0.0023320913314819336, -0.0017380714416503906, -0.0011440515518188477, -0.0005500316619873047, 4.398822784423828e-05, 0.0006380081176757812, 0.0012320280075073242, 0.0018260478973388672, 0.00242006778717041, 0.003014087677001953, 0.003608107566833496, 0.004202127456665039, 0.004796147346496582, 0.005390167236328125, 0.005984187126159668, 0.006578207015991211, 0.007172226905822754, 0.007766246795654297, 0.00836026668548584, 0.008954286575317383, 0.009548306465148926, 0.010142326354980469, 0.010736346244812012, 0.011330366134643555, 0.011924386024475098, 0.01251840591430664, 0.013112425804138184, 0.013706445693969727, 0.01430046558380127, 0.014894485473632812, 0.015488505363464355, 0.0160825252532959, 0.01667654514312744, 0.017270565032958984, 0.017864584922790527, 0.01845860481262207, 0.019052624702453613, 0.019646644592285156, 0.0202406644821167, 0.020834684371948242, 0.021428704261779785, 0.022022724151611328, 0.02261674404144287, 0.023210763931274414, 0.023804783821105957, 0.0243988037109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 10.0, 10.0, 8.0, 23.0, 32.0, 33.0, 67.0, 78.0, 180.0, 243.0, 605.0, 1290.0, 654.0, 323.0, 146.0, 104.0, 86.0, 42.0, 32.0, 26.0, 18.0, 11.0, 7.0, 10.0, 9.0, 2.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010833740234375, -0.010520100593566895, -0.010206460952758789, -0.009892821311950684, -0.009579181671142578, -0.009265542030334473, -0.008951902389526367, -0.008638262748718262, -0.008324623107910156, -0.00801098346710205, -0.007697343826293945, -0.00738370418548584, -0.007070064544677734, -0.006756424903869629, -0.0064427852630615234, -0.006129145622253418, -0.0058155059814453125, -0.005501866340637207, -0.0051882266998291016, -0.004874587059020996, -0.004560947418212891, -0.004247307777404785, -0.00393366813659668, -0.0036200284957885742, -0.0033063888549804688, -0.0029927492141723633, -0.002679109573364258, -0.0023654699325561523, -0.002051830291748047, -0.0017381906509399414, -0.001424551010131836, -0.0011109113693237305, -0.000797271728515625, -0.00048363208770751953, -0.00016999244689941406, 0.0001436471939086914, 0.0004572868347167969, 0.0007709264755249023, 0.0010845661163330078, 0.0013982057571411133, 0.0017118453979492188, 0.0020254850387573242, 0.0023391246795654297, 0.002652764320373535, 0.0029664039611816406, 0.003280043601989746, 0.0035936832427978516, 0.003907322883605957, 0.0042209625244140625, 0.004534602165222168, 0.0048482418060302734, 0.005161881446838379, 0.005475521087646484, 0.00578916072845459, 0.006102800369262695, 0.006416440010070801, 0.006730079650878906, 0.007043719291687012, 0.007357358932495117, 0.007670998573303223, 0.007984638214111328, 0.008298277854919434, 0.008611917495727539, 0.008925557136535645, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 55.0, 228.0, 388.0, 246.0, 60.0, 12.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15272080898284912, -0.149119570851326, -0.14551831781864166, -0.14191707968711853, -0.1383158266544342, -0.13471458852291107, -0.13111333549022675, -0.1275120973587036, -0.12391085177659988, -0.12030960619449615, -0.11670836061239243, -0.1131071150302887, -0.10950587689876556, -0.10590462386608124, -0.1023033857345581, -0.09870214015245438, -0.09510089457035065, -0.09149964898824692, -0.08789840340614319, -0.08429715782403946, -0.08069591224193573, -0.0770946741104126, -0.07349342852830887, -0.06989218294620514, -0.06629093736410141, -0.06268969178199768, -0.05908844619989395, -0.05548720434308052, -0.05188595876097679, -0.04828471317887306, -0.04468347132205963, -0.0410822257399559, -0.037480972707271576, -0.03387972712516785, -0.030278483405709267, -0.026677239686250687, -0.023075994104146957, -0.019474748522043228, -0.015873504802584648, -0.012272261083126068, -0.008671015501022339, -0.005069770850241184, -0.0014685261994600296, 0.002132718451321125, 0.00573396310210228, 0.009335208684206009, 0.012936452403664589, 0.01653769612312317, 0.020138941705226898, 0.023740187287330627, 0.027341431006789207, 0.030942674726247787, 0.03454392030835152, 0.038145165890455246, 0.04174640774726868, 0.045347653329372406, 0.048948898911476135, 0.052550144493579865, 0.056151390075683594, 0.059752631932497025, 0.06335388123989105, 0.06695511937141418, 0.07055636495351791, 0.07415761053562164, 0.07775885611772537]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 9.0, 8.0, 8.0, 8.0, 13.0, 23.0, 20.0, 26.0, 25.0, 41.0, 30.0, 51.0, 43.0, 38.0, 58.0, 52.0, 54.0, 52.0, 56.0, 50.0, 43.0, 33.0, 54.0, 28.0, 29.0, 32.0, 19.0, 19.0, 16.0, 17.0, 12.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024567008018493652, -0.02381231263279915, -0.023057615384459496, -0.022302918136119843, -0.02154822275042534, -0.020793527364730835, -0.020038830116391182, -0.01928413286805153, -0.018529437482357025, -0.01777474209666252, -0.01702004484832287, -0.016265347599983215, -0.015510652214288712, -0.014755955897271633, -0.014001259580254555, -0.013246563263237476, -0.012491866946220398, -0.01173717062920332, -0.010982474312186241, -0.010227777995169163, -0.009473081678152084, -0.008718385361135006, -0.007963689044117928, -0.007208992727100849, -0.006454296410083771, -0.005699600093066692, -0.004944903776049614, -0.0041902074590325356, -0.003435511142015457, -0.0026808148249983788, -0.0019261185079813004, -0.001171422190964222, -0.00041672587394714355, 0.00033797044306993484, 0.0010926667600870132, 0.0018473630771040916, 0.00260205939412117, 0.0033567557111382484, 0.004111452028155327, 0.004866148345172405, 0.005620844662189484, 0.006375540979206562, 0.0071302372962236404, 0.007884933613240719, 0.008639629930257797, 0.009394326247274876, 0.010149022564291954, 0.010903718881309032, 0.01165841519832611, 0.01241311151534319, 0.013167807832360268, 0.013922504149377346, 0.014677200466394424, 0.015431896783411503, 0.01618659310042858, 0.016941290348768234, 0.017695985734462738, 0.018450681120157242, 0.019205378368496895, 0.019960075616836548, 0.02071477100253105, 0.021469466388225555, 0.02222416363656521, 0.02297886088490486, 0.023733556270599365]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 8.0, 8.0, 6.0, 11.0, 16.0, 24.0, 25.0, 40.0, 58.0, 68.0, 86.0, 135.0, 156.0, 249.0, 298.0, 450.0, 630.0, 1156.0, 3176.0, 26228.0, 577403.0, 413694.0, 18644.0, 2746.0, 1057.0, 609.0, 440.0, 286.0, 208.0, 164.0, 123.0, 93.0, 70.0, 58.0, 34.0, 24.0, 22.0, 11.0, 12.0, 2.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.03985595703125, -0.0386815071105957, -0.037507057189941406, -0.03633260726928711, -0.03515815734863281, -0.033983707427978516, -0.03280925750732422, -0.03163480758666992, -0.030460357666015625, -0.029285907745361328, -0.02811145782470703, -0.026937007904052734, -0.025762557983398438, -0.02458810806274414, -0.023413658142089844, -0.022239208221435547, -0.02106475830078125, -0.019890308380126953, -0.018715858459472656, -0.01754140853881836, -0.016366958618164062, -0.015192508697509766, -0.014018058776855469, -0.012843608856201172, -0.011669158935546875, -0.010494709014892578, -0.009320259094238281, -0.008145809173583984, -0.0069713592529296875, -0.005796909332275391, -0.004622459411621094, -0.003448009490966797, -0.0022735595703125, -0.0010991096496582031, 7.534027099609375e-05, 0.0012497901916503906, 0.0024242401123046875, 0.0035986900329589844, 0.004773139953613281, 0.005947589874267578, 0.007122039794921875, 0.008296489715576172, 0.009470939636230469, 0.010645389556884766, 0.011819839477539062, 0.01299428939819336, 0.014168739318847656, 0.015343189239501953, 0.01651763916015625, 0.017692089080810547, 0.018866539001464844, 0.02004098892211914, 0.021215438842773438, 0.022389888763427734, 0.02356433868408203, 0.024738788604736328, 0.025913238525390625, 0.027087688446044922, 0.02826213836669922, 0.029436588287353516, 0.030611038208007812, 0.03178548812866211, 0.032959938049316406, 0.0341343879699707, 0.035308837890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 23.0, 101.0, 315.0, 357.0, 155.0, 39.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.061387062072753906, -0.05941963195800781, -0.05745220184326172, -0.055484771728515625, -0.05351734161376953, -0.05154991149902344, -0.049582481384277344, -0.04761505126953125, -0.045647621154785156, -0.04368019104003906, -0.04171276092529297, -0.039745330810546875, -0.03777790069580078, -0.03581047058105469, -0.033843040466308594, -0.0318756103515625, -0.029908180236816406, -0.027940750122070312, -0.02597332000732422, -0.024005889892578125, -0.02203845977783203, -0.020071029663085938, -0.018103599548339844, -0.01613616943359375, -0.014168739318847656, -0.012201309204101562, -0.010233879089355469, -0.008266448974609375, -0.006299018859863281, -0.0043315887451171875, -0.0023641586303710938, -0.000396728515625, 0.0015707015991210938, 0.0035381317138671875, 0.005505561828613281, 0.007472991943359375, 0.009440422058105469, 0.011407852172851562, 0.013375282287597656, 0.01534271240234375, 0.017310142517089844, 0.019277572631835938, 0.02124500274658203, 0.023212432861328125, 0.02517986297607422, 0.027147293090820312, 0.029114723205566406, 0.0310821533203125, 0.033049583435058594, 0.03501701354980469, 0.03698444366455078, 0.038951873779296875, 0.04091930389404297, 0.04288673400878906, 0.044854164123535156, 0.04682159423828125, 0.048789024353027344, 0.05075645446777344, 0.05272388458251953, 0.054691314697265625, 0.05665874481201172, 0.05862617492675781, 0.060593605041503906, 0.06256103515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 10.0, 4.0, 8.0, 14.0, 13.0, 17.0, 21.0, 20.0, 30.0, 39.0, 42.0, 50.0, 48.0, 46.0, 58.0, 56.0, 86.0, 126.0, 238.0, 550.0, 2030.0, 14236.0, 212018.0, 727932.0, 81483.0, 6836.0, 1231.0, 419.0, 193.0, 112.0, 93.0, 76.0, 81.0, 48.0, 53.0, 31.0, 27.0, 21.0, 27.0, 25.0, 18.0, 14.0, 19.0, 8.0, 10.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0], "bins": [-0.033111572265625, -0.03214716911315918, -0.03118276596069336, -0.03021836280822754, -0.02925395965576172, -0.0282895565032959, -0.027325153350830078, -0.026360750198364258, -0.025396347045898438, -0.024431943893432617, -0.023467540740966797, -0.022503137588500977, -0.021538734436035156, -0.020574331283569336, -0.019609928131103516, -0.018645524978637695, -0.017681121826171875, -0.016716718673706055, -0.015752315521240234, -0.014787912368774414, -0.013823509216308594, -0.012859106063842773, -0.011894702911376953, -0.010930299758911133, -0.009965896606445312, -0.009001493453979492, -0.008037090301513672, -0.0070726871490478516, -0.006108283996582031, -0.005143880844116211, -0.004179477691650391, -0.0032150745391845703, -0.00225067138671875, -0.0012862682342529297, -0.0003218650817871094, 0.0006425380706787109, 0.0016069412231445312, 0.0025713443756103516, 0.003535747528076172, 0.004500150680541992, 0.0054645538330078125, 0.006428956985473633, 0.007393360137939453, 0.008357763290405273, 0.009322166442871094, 0.010286569595336914, 0.011250972747802734, 0.012215375900268555, 0.013179779052734375, 0.014144182205200195, 0.015108585357666016, 0.016072988510131836, 0.017037391662597656, 0.018001794815063477, 0.018966197967529297, 0.019930601119995117, 0.020895004272460938, 0.021859407424926758, 0.022823810577392578, 0.0237882137298584, 0.02475261688232422, 0.02571702003479004, 0.02668142318725586, 0.02764582633972168, 0.0286102294921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 11.0, 5.0, 13.0, 13.0, 9.0, 17.0, 15.0, 23.0, 33.0, 27.0, 34.0, 28.0, 30.0, 36.0, 33.0, 39.0, 48.0, 49.0, 49.0, 51.0, 42.0, 38.0, 29.0, 41.0, 30.0, 27.0, 26.0, 20.0, 30.0, 23.0, 25.0, 19.0, 16.0, 14.0, 13.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.02099609375, -0.020303726196289062, -0.019611358642578125, -0.018918991088867188, -0.01822662353515625, -0.017534255981445312, -0.016841888427734375, -0.016149520874023438, -0.0154571533203125, -0.014764785766601562, -0.014072418212890625, -0.013380050659179688, -0.01268768310546875, -0.011995315551757812, -0.011302947998046875, -0.010610580444335938, -0.009918212890625, -0.009225845336914062, -0.008533477783203125, -0.007841110229492188, -0.00714874267578125, -0.0064563751220703125, -0.005764007568359375, -0.0050716400146484375, -0.0043792724609375, -0.0036869049072265625, -0.002994537353515625, -0.0023021697998046875, -0.00160980224609375, -0.0009174346923828125, -0.000225067138671875, 0.0004673004150390625, 0.00115966796875, 0.0018520355224609375, 0.002544403076171875, 0.0032367706298828125, 0.00392913818359375, 0.0046215057373046875, 0.005313873291015625, 0.0060062408447265625, 0.0066986083984375, 0.0073909759521484375, 0.008083343505859375, 0.008775711059570312, 0.00946807861328125, 0.010160446166992188, 0.010852813720703125, 0.011545181274414062, 0.012237548828125, 0.012929916381835938, 0.013622283935546875, 0.014314651489257812, 0.01500701904296875, 0.015699386596679688, 0.016391754150390625, 0.017084121704101562, 0.0177764892578125, 0.018468856811523438, 0.019161224365234375, 0.019853591918945312, 0.02054595947265625, 0.021238327026367188, 0.021930694580078125, 0.022623062133789062, 0.0233154296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 9.0, 6.0, 24.0, 16.0, 38.0, 55.0, 96.0, 183.0, 318.0, 579.0, 1170.0, 2313.0, 4770.0, 10507.0, 26056.0, 77673.0, 308392.0, 439274.0, 115864.0, 35498.0, 13885.0, 5883.0, 2904.0, 1418.0, 714.0, 414.0, 206.0, 117.0, 70.0, 41.0, 15.0, 16.0, 13.0, 5.0, 5.0, 9.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005504608154296875, -0.005333423614501953, -0.005162239074707031, -0.004991054534912109, -0.0048198699951171875, -0.004648685455322266, -0.004477500915527344, -0.004306316375732422, -0.0041351318359375, -0.003963947296142578, -0.0037927627563476562, -0.0036215782165527344, -0.0034503936767578125, -0.0032792091369628906, -0.0031080245971679688, -0.002936840057373047, -0.002765655517578125, -0.002594470977783203, -0.0024232864379882812, -0.0022521018981933594, -0.0020809173583984375, -0.0019097328186035156, -0.0017385482788085938, -0.0015673637390136719, -0.00139617919921875, -0.0012249946594238281, -0.0010538101196289062, -0.0008826255798339844, -0.0007114410400390625, -0.0005402565002441406, -0.00036907196044921875, -0.00019788742065429688, -2.6702880859375e-05, 0.00014448165893554688, 0.00031566619873046875, 0.0004868507385253906, 0.0006580352783203125, 0.0008292198181152344, 0.0010004043579101562, 0.0011715888977050781, 0.0013427734375, 0.0015139579772949219, 0.0016851425170898438, 0.0018563270568847656, 0.0020275115966796875, 0.0021986961364746094, 0.0023698806762695312, 0.002541065216064453, 0.002712249755859375, 0.002883434295654297, 0.0030546188354492188, 0.0032258033752441406, 0.0033969879150390625, 0.0035681724548339844, 0.0037393569946289062, 0.003910541534423828, 0.00408172607421875, 0.004252910614013672, 0.004424095153808594, 0.004595279693603516, 0.0047664642333984375, 0.004937648773193359, 0.005108833312988281, 0.005280017852783203, 0.005451202392578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 2.0, 10.0, 20.0, 11.0, 14.0, 25.0, 36.0, 45.0, 49.0, 65.0, 98.0, 112.0, 89.0, 82.0, 80.0, 58.0, 52.0, 26.0, 21.0, 24.0, 16.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.316205978393555e-05, -9.043142199516296e-05, -8.770078420639038e-05, -8.49701464176178e-05, -8.223950862884521e-05, -7.950887084007263e-05, -7.677823305130005e-05, -7.404759526252747e-05, -7.131695747375488e-05, -6.85863196849823e-05, -6.585568189620972e-05, -6.312504410743713e-05, -6.039440631866455e-05, -5.766376852989197e-05, -5.4933130741119385e-05, -5.22024929523468e-05, -4.947185516357422e-05, -4.6741217374801636e-05, -4.401057958602905e-05, -4.127994179725647e-05, -3.854930400848389e-05, -3.5818666219711304e-05, -3.308802843093872e-05, -3.0357390642166138e-05, -2.7626752853393555e-05, -2.489611506462097e-05, -2.216547727584839e-05, -1.9434839487075806e-05, -1.6704201698303223e-05, -1.397356390953064e-05, -1.1242926120758057e-05, -8.512288331985474e-06, -5.781650543212891e-06, -3.0510127544403076e-06, -3.203749656677246e-07, 2.4102628231048584e-06, 5.140900611877441e-06, 7.871538400650024e-06, 1.0602176189422607e-05, 1.333281397819519e-05, 1.6063451766967773e-05, 1.8794089555740356e-05, 2.152472734451294e-05, 2.4255365133285522e-05, 2.6986002922058105e-05, 2.971664071083069e-05, 3.244727849960327e-05, 3.5177916288375854e-05, 3.790855407714844e-05, 4.063919186592102e-05, 4.3369829654693604e-05, 4.6100467443466187e-05, 4.883110523223877e-05, 5.156174302101135e-05, 5.4292380809783936e-05, 5.702301859855652e-05, 5.97536563873291e-05, 6.248429417610168e-05, 6.521493196487427e-05, 6.794556975364685e-05, 7.067620754241943e-05, 7.340684533119202e-05, 7.61374831199646e-05, 7.886812090873718e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 17.0, 28.0, 37.0, 48.0, 92.0, 180.0, 468.0, 1642.0, 10020.0, 124412.0, 837070.0, 66027.0, 6511.0, 1179.0, 365.0, 181.0, 94.0, 60.0, 40.0, 14.0, 21.0, 7.0, 11.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01219940185546875, -0.011677861213684082, -0.011156320571899414, -0.010634779930114746, -0.010113239288330078, -0.00959169864654541, -0.009070158004760742, -0.008548617362976074, -0.008027076721191406, -0.007505536079406738, -0.00698399543762207, -0.006462454795837402, -0.005940914154052734, -0.005419373512268066, -0.0048978328704833984, -0.0043762922286987305, -0.0038547515869140625, -0.0033332109451293945, -0.0028116703033447266, -0.0022901296615600586, -0.0017685890197753906, -0.0012470483779907227, -0.0007255077362060547, -0.00020396709442138672, 0.00031757354736328125, 0.0008391141891479492, 0.0013606548309326172, 0.0018821954727172852, 0.002403736114501953, 0.002925276756286621, 0.003446817398071289, 0.003968358039855957, 0.004489898681640625, 0.005011439323425293, 0.005532979965209961, 0.006054520606994629, 0.006576061248779297, 0.007097601890563965, 0.007619142532348633, 0.0081406831741333, 0.008662223815917969, 0.009183764457702637, 0.009705305099487305, 0.010226845741271973, 0.01074838638305664, 0.011269927024841309, 0.011791467666625977, 0.012313008308410645, 0.012834548950195312, 0.01335608959197998, 0.013877630233764648, 0.014399170875549316, 0.014920711517333984, 0.015442252159118652, 0.01596379280090332, 0.01648533344268799, 0.017006874084472656, 0.017528414726257324, 0.018049955368041992, 0.01857149600982666, 0.019093036651611328, 0.019614577293395996, 0.020136117935180664, 0.020657658576965332, 0.02117919921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 7.0, 15.0, 24.0, 37.0, 41.0, 81.0, 127.0, 148.0, 145.0, 119.0, 86.0, 59.0, 35.0, 10.0, 10.0, 10.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.01494908332824707, -0.01462411880493164, -0.014299154281616211, -0.013974189758300781, -0.013649225234985352, -0.013324260711669922, -0.012999296188354492, -0.012674331665039062, -0.012349367141723633, -0.012024402618408203, -0.011699438095092773, -0.011374473571777344, -0.011049509048461914, -0.010724544525146484, -0.010399580001831055, -0.010074615478515625, -0.009749650955200195, -0.009424686431884766, -0.009099721908569336, -0.008774757385253906, -0.008449792861938477, -0.008124828338623047, -0.007799863815307617, -0.0074748992919921875, -0.007149934768676758, -0.006824970245361328, -0.0065000057220458984, -0.006175041198730469, -0.005850076675415039, -0.005525112152099609, -0.00520014762878418, -0.00487518310546875, -0.00455021858215332, -0.004225254058837891, -0.003900289535522461, -0.0035753250122070312, -0.0032503604888916016, -0.002925395965576172, -0.002600431442260742, -0.0022754669189453125, -0.0019505023956298828, -0.0016255378723144531, -0.0013005733489990234, -0.0009756088256835938, -0.0006506443023681641, -0.0003256797790527344, -7.152557373046875e-07, 0.000324249267578125, 0.0006492137908935547, 0.0009741783142089844, 0.001299142837524414, 0.0016241073608398438, 0.0019490718841552734, 0.002274036407470703, 0.002599000930786133, 0.0029239654541015625, 0.003248929977416992, 0.003573894500732422, 0.0038988590240478516, 0.004223823547363281, 0.004548788070678711, 0.004873752593994141, 0.00519871711730957, 0.005523681640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 55.0, 874.0, 78.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18397590517997742, -0.16228285431861877, -0.14058981835842133, -0.11889676749706268, -0.09720372408628464, -0.07551068067550659, -0.05381762981414795, -0.0321245938539505, -0.010431542992591858, 0.011261502280831337, 0.03295454755425453, 0.054647594690322876, 0.07634063810110092, 0.09803368151187897, 0.11972673237323761, 0.14141976833343506, 0.1631128191947937, 0.18480587005615234, 0.2064989060163498, 0.22819195687770844, 0.24988499283790588, 0.2715780436992645, 0.29327109456062317, 0.3149641156196594, 0.33665716648101807, 0.3583502173423767, 0.38004326820373535, 0.401736319065094, 0.42342934012413025, 0.4451223909854889, 0.46681544184684753, 0.4885084629058838, 0.5102015137672424, 0.5318945646286011, 0.5535876154899597, 0.5752806663513184, 0.596973717212677, 0.6186667680740356, 0.6403597593307495, 0.6620528101921082, 0.6837458610534668, 0.7054389119148254, 0.7271319627761841, 0.7488250136375427, 0.7705180644989014, 0.7922110557556152, 0.8139041662216187, 0.8355971574783325, 0.8572902679443359, 0.8789833188056946, 0.9006763696670532, 0.9223694205284119, 0.9440624713897705, 0.9657554626464844, 0.9874485731124878, 1.0091415643692017, 1.0308345556259155, 1.0525275468826294, 1.0742206573486328, 1.0959136486053467, 1.11760675907135, 1.139299750328064, 1.1609928607940674, 1.1826858520507812, 1.2043789625167847]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 5.0, 6.0, 12.0, 18.0, 16.0, 9.0, 20.0, 20.0, 22.0, 24.0, 28.0, 40.0, 37.0, 31.0, 36.0, 40.0, 49.0, 37.0, 33.0, 47.0, 35.0, 38.0, 45.0, 43.0, 41.0, 25.0, 25.0, 35.0, 25.0, 18.0, 18.0, 14.0, 13.0, 12.0, 12.0, 4.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07189327478408813, -0.06971617043018341, -0.06753907352685928, -0.06536196917295456, -0.06318487226963043, -0.06100776791572571, -0.058830663561820984, -0.05665356293320656, -0.05447646230459213, -0.05229936167597771, -0.05012226104736328, -0.04794515669345856, -0.04576805606484413, -0.043590955436229706, -0.04141385108232498, -0.039236750453710556, -0.03705964982509613, -0.034882549196481705, -0.03270544856786728, -0.030528344213962555, -0.02835124358534813, -0.026174142956733704, -0.02399704046547413, -0.021819937974214554, -0.019642837345600128, -0.017465736716985703, -0.015288634225726128, -0.013111532665789127, -0.010934431105852127, -0.008757329545915127, -0.0065802279859781265, -0.004403126426041126, -0.002226024866104126, -4.89233061671257e-05, 0.0021281782537698746, 0.004305279813706875, 0.006482381373643875, 0.008659482933580875, 0.010836584493517876, 0.013013686053454876, 0.015190787613391876, 0.017367888242006302, 0.019544990733265877, 0.02172209322452545, 0.023899193853139877, 0.026076294481754303, 0.028253396973013878, 0.030430499464273453, 0.03260760009288788, 0.034784700721502304, 0.03696180135011673, 0.039138905704021454, 0.04131600633263588, 0.043493106961250305, 0.04567021131515503, 0.047847311943769455, 0.05002441257238388, 0.052201513200998306, 0.05437861382961273, 0.056555718183517456, 0.05873281881213188, 0.06090991944074631, 0.06308702379465103, 0.06526412069797516, 0.06744122505187988]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 19.0, 44.0, 137.0, 386.0, 987.0, 1618.0, 3577.0, 42712.0, 4114485.0, 25250.0, 2892.0, 1162.0, 445.0, 248.0, 174.0, 65.0, 25.0, 18.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050537109375, -0.048760414123535156, -0.04698371887207031, -0.04520702362060547, -0.043430328369140625, -0.04165363311767578, -0.03987693786621094, -0.038100242614746094, -0.03632354736328125, -0.034546852111816406, -0.03277015686035156, -0.03099346160888672, -0.029216766357421875, -0.02744007110595703, -0.025663375854492188, -0.023886680603027344, -0.0221099853515625, -0.020333290100097656, -0.018556594848632812, -0.01677989959716797, -0.015003204345703125, -0.013226509094238281, -0.011449813842773438, -0.009673118591308594, -0.00789642333984375, -0.006119728088378906, -0.0043430328369140625, -0.0025663375854492188, -0.000789642333984375, 0.0009870529174804688, 0.0027637481689453125, 0.004540443420410156, 0.006317138671875, 0.008093833923339844, 0.009870529174804688, 0.011647224426269531, 0.013423919677734375, 0.015200614929199219, 0.016977310180664062, 0.018754005432128906, 0.02053070068359375, 0.022307395935058594, 0.024084091186523438, 0.02586078643798828, 0.027637481689453125, 0.02941417694091797, 0.031190872192382812, 0.032967567443847656, 0.0347442626953125, 0.036520957946777344, 0.03829765319824219, 0.04007434844970703, 0.041851043701171875, 0.04362773895263672, 0.04540443420410156, 0.047181129455566406, 0.04895782470703125, 0.050734519958496094, 0.05251121520996094, 0.05428791046142578, 0.056064605712890625, 0.05784130096435547, 0.05961799621582031, 0.061394691467285156, 0.06317138671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 25.0, 144.0, 376.0, 324.0, 109.0, 18.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06634235382080078, -0.06426429748535156, -0.062186241149902344, -0.060108184814453125, -0.058030128479003906, -0.05595207214355469, -0.05387401580810547, -0.05179595947265625, -0.04971790313720703, -0.04763984680175781, -0.045561790466308594, -0.043483734130859375, -0.041405677795410156, -0.03932762145996094, -0.03724956512451172, -0.0351715087890625, -0.03309345245361328, -0.031015396118164062, -0.028937339782714844, -0.026859283447265625, -0.024781227111816406, -0.022703170776367188, -0.02062511444091797, -0.01854705810546875, -0.01646900177001953, -0.014390945434570312, -0.012312889099121094, -0.010234832763671875, -0.008156776428222656, -0.0060787200927734375, -0.004000663757324219, -0.001922607421875, 0.00015544891357421875, 0.0022335052490234375, 0.004311561584472656, 0.006389617919921875, 0.008467674255371094, 0.010545730590820312, 0.012623786926269531, 0.01470184326171875, 0.01677989959716797, 0.018857955932617188, 0.020936012268066406, 0.023014068603515625, 0.025092124938964844, 0.027170181274414062, 0.02924823760986328, 0.0313262939453125, 0.03340435028076172, 0.03548240661621094, 0.037560462951660156, 0.039638519287109375, 0.041716575622558594, 0.04379463195800781, 0.04587268829345703, 0.04795074462890625, 0.05002880096435547, 0.05210685729980469, 0.054184913635253906, 0.056262969970703125, 0.058341026306152344, 0.06041908264160156, 0.06249713897705078, 0.0645751953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 51.0, 101.0, 228.0, 1229.0, 11013.0, 841698.0, 3321404.0, 16425.0, 1638.0, 344.0, 98.0, 26.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.033504486083984375, -0.03221893310546875, -0.030933380126953125, -0.0296478271484375, -0.028362274169921875, -0.02707672119140625, -0.025791168212890625, -0.024505615234375, -0.023220062255859375, -0.02193450927734375, -0.020648956298828125, -0.0193634033203125, -0.018077850341796875, -0.01679229736328125, -0.015506744384765625, -0.01422119140625, -0.012935638427734375, -0.01165008544921875, -0.010364532470703125, -0.0090789794921875, -0.007793426513671875, -0.00650787353515625, -0.005222320556640625, -0.003936767578125, -0.002651214599609375, -0.00136566162109375, -8.0108642578125e-05, 0.0012054443359375, 0.002490997314453125, 0.00377655029296875, 0.005062103271484375, 0.00634765625, 0.007633209228515625, 0.00891876220703125, 0.010204315185546875, 0.0114898681640625, 0.012775421142578125, 0.01406097412109375, 0.015346527099609375, 0.016632080078125, 0.017917633056640625, 0.01920318603515625, 0.020488739013671875, 0.0217742919921875, 0.023059844970703125, 0.02434539794921875, 0.025630950927734375, 0.02691650390625, 0.028202056884765625, 0.02948760986328125, 0.030773162841796875, 0.0320587158203125, 0.033344268798828125, 0.03462982177734375, 0.035915374755859375, 0.037200927734375, 0.038486480712890625, 0.03977203369140625, 0.041057586669921875, 0.0423431396484375, 0.043628692626953125, 0.04491424560546875, 0.046199798583984375, 0.0474853515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 14.0, 30.0, 32.0, 128.0, 248.0, 1018.0, 1837.0, 442.0, 136.0, 73.0, 42.0, 19.0, 19.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020355224609375, -0.019821882247924805, -0.01928853988647461, -0.018755197525024414, -0.01822185516357422, -0.017688512802124023, -0.017155170440673828, -0.016621828079223633, -0.016088485717773438, -0.015555143356323242, -0.015021800994873047, -0.014488458633422852, -0.013955116271972656, -0.013421773910522461, -0.012888431549072266, -0.01235508918762207, -0.011821746826171875, -0.01128840446472168, -0.010755062103271484, -0.010221719741821289, -0.009688377380371094, -0.009155035018920898, -0.008621692657470703, -0.008088350296020508, -0.0075550079345703125, -0.007021665573120117, -0.006488323211669922, -0.0059549808502197266, -0.005421638488769531, -0.004888296127319336, -0.004354953765869141, -0.0038216114044189453, -0.00328826904296875, -0.0027549266815185547, -0.0022215843200683594, -0.001688241958618164, -0.0011548995971679688, -0.0006215572357177734, -8.821487426757812e-05, 0.0004451274871826172, 0.0009784698486328125, 0.0015118122100830078, 0.002045154571533203, 0.0025784969329833984, 0.0031118392944335938, 0.003645181655883789, 0.004178524017333984, 0.00471186637878418, 0.005245208740234375, 0.00577855110168457, 0.006311893463134766, 0.006845235824584961, 0.007378578186035156, 0.007911920547485352, 0.008445262908935547, 0.008978605270385742, 0.009511947631835938, 0.010045289993286133, 0.010578632354736328, 0.011111974716186523, 0.011645317077636719, 0.012178659439086914, 0.01271200180053711, 0.013245344161987305, 0.0137786865234375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 41.0, 215.0, 430.0, 237.0, 55.0, 19.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.2023770958185196, -0.1987934410572052, -0.19520977139472961, -0.19162611663341522, -0.18804244697093964, -0.18445879220962524, -0.18087512254714966, -0.17729146778583527, -0.17370781302452087, -0.17012415826320648, -0.1665404886007309, -0.1629568338394165, -0.15937316417694092, -0.15578950941562653, -0.15220585465431213, -0.14862218499183655, -0.14503851532936096, -0.14145486056804657, -0.13787119090557098, -0.1342875361442566, -0.130703866481781, -0.1271202117204666, -0.12353654950857162, -0.11995288729667664, -0.11636923253536224, -0.11278557032346725, -0.10920190811157227, -0.10561825335025787, -0.10203459113836288, -0.0984509289264679, -0.0948672667145729, -0.09128360450267792, -0.08769994229078293, -0.08411628007888794, -0.08053261786699295, -0.07694895565509796, -0.07336530089378357, -0.06978163868188858, -0.06619797646999359, -0.0626143142580986, -0.05903065204620361, -0.055446989834308624, -0.051863331347703934, -0.048279669135808945, -0.044696006923913956, -0.041112348437309265, -0.037528686225414276, -0.03394502401351929, -0.030361365526914597, -0.026777705177664757, -0.023194042965769768, -0.019610382616519928, -0.01602672040462494, -0.0124430600553751, -0.00885939970612526, -0.00527573749423027, -0.0016920771449804306, 0.0018915839027613401, 0.005475244950503111, 0.009058905765414238, 0.012642567045986652, 0.016226228326559067, 0.019809888675808907, 0.023393550887703896, 0.026977211236953735]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 30.0, 23.0, 27.0, 34.0, 46.0, 47.0, 70.0, 54.0, 71.0, 61.0, 55.0, 58.0, 57.0, 60.0, 57.0, 39.0, 45.0, 36.0, 27.0, 21.0, 23.0, 9.0, 9.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027879655361175537, -0.026923367753624916, -0.025967080146074295, -0.025010792538523674, -0.024054504930973053, -0.023098217323422432, -0.02214192971587181, -0.02118564210832119, -0.02022935450077057, -0.019273066893219948, -0.018316779285669327, -0.017360491678118706, -0.016404204070568085, -0.015447916463017464, -0.014491628855466843, -0.013535341247916222, -0.0125790536403656, -0.01162276603281498, -0.010666478425264359, -0.009710190817713737, -0.008753903210163116, -0.007797615602612495, -0.006841327995061874, -0.005885040387511253, -0.004928752779960632, -0.003972465172410011, -0.0030161775648593903, -0.0020598899573087692, -0.0011036023497581482, -0.00014731474220752716, 0.0008089728653430939, 0.001765260472893715, 0.002721548080444336, 0.003677835687994957, 0.004634123295545578, 0.005590410903096199, 0.00654669851064682, 0.007502986118197441, 0.008459273725748062, 0.009415561333298683, 0.010371848940849304, 0.011328136548399925, 0.012284424155950546, 0.013240711763501167, 0.014196999371051788, 0.01515328697860241, 0.01610957458615303, 0.01706586219370365, 0.018022149801254272, 0.018978437408804893, 0.019934725016355515, 0.020891012623906136, 0.021847300231456757, 0.022803587839007378, 0.023759875446558, 0.02471616305410862, 0.02567245066165924, 0.026628738269209862, 0.027585025876760483, 0.028541313484311104, 0.029497601091861725, 0.030453888699412346, 0.03141017630696297, 0.03236646205186844, 0.03332275152206421]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 13.0, 9.0, 16.0, 22.0, 41.0, 37.0, 48.0, 66.0, 92.0, 128.0, 171.0, 198.0, 286.0, 370.0, 592.0, 1075.0, 2677.0, 14169.0, 249612.0, 729522.0, 40471.0, 4963.0, 1469.0, 724.0, 444.0, 325.0, 247.0, 187.0, 138.0, 103.0, 78.0, 71.0, 48.0, 28.0, 21.0, 25.0, 17.0, 7.0, 11.0, 5.0, 6.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0379638671875, -0.03682088851928711, -0.03567790985107422, -0.03453493118286133, -0.03339195251464844, -0.03224897384643555, -0.031105995178222656, -0.029963016510009766, -0.028820037841796875, -0.027677059173583984, -0.026534080505371094, -0.025391101837158203, -0.024248123168945312, -0.023105144500732422, -0.02196216583251953, -0.02081918716430664, -0.01967620849609375, -0.01853322982788086, -0.01739025115966797, -0.016247272491455078, -0.015104293823242188, -0.013961315155029297, -0.012818336486816406, -0.011675357818603516, -0.010532379150390625, -0.009389400482177734, -0.008246421813964844, -0.007103443145751953, -0.0059604644775390625, -0.004817485809326172, -0.0036745071411132812, -0.0025315284729003906, -0.0013885498046875, -0.0002455711364746094, 0.0008974075317382812, 0.002040386199951172, 0.0031833648681640625, 0.004326343536376953, 0.005469322204589844, 0.006612300872802734, 0.007755279541015625, 0.008898258209228516, 0.010041236877441406, 0.011184215545654297, 0.012327194213867188, 0.013470172882080078, 0.014613151550292969, 0.01575613021850586, 0.01689910888671875, 0.01804208755493164, 0.01918506622314453, 0.020328044891357422, 0.021471023559570312, 0.022614002227783203, 0.023756980895996094, 0.024899959564208984, 0.026042938232421875, 0.027185916900634766, 0.028328895568847656, 0.029471874237060547, 0.030614852905273438, 0.03175783157348633, 0.03290081024169922, 0.03404378890991211, 0.035186767578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 24.0, 122.0, 338.0, 337.0, 147.0, 24.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.06380701065063477, -0.06181812286376953, -0.0598292350769043, -0.05784034729003906, -0.05585145950317383, -0.053862571716308594, -0.05187368392944336, -0.049884796142578125, -0.04789590835571289, -0.045907020568847656, -0.04391813278198242, -0.04192924499511719, -0.03994035720825195, -0.03795146942138672, -0.035962581634521484, -0.03397369384765625, -0.031984806060791016, -0.02999591827392578, -0.028007030487060547, -0.026018142700195312, -0.024029254913330078, -0.022040367126464844, -0.02005147933959961, -0.018062591552734375, -0.01607370376586914, -0.014084815979003906, -0.012095928192138672, -0.010107040405273438, -0.008118152618408203, -0.006129264831542969, -0.004140377044677734, -0.0021514892578125, -0.00016260147094726562, 0.0018262863159179688, 0.003815174102783203, 0.0058040618896484375, 0.007792949676513672, 0.009781837463378906, 0.01177072525024414, 0.013759613037109375, 0.01574850082397461, 0.017737388610839844, 0.019726276397705078, 0.021715164184570312, 0.023704051971435547, 0.02569293975830078, 0.027681827545166016, 0.02967071533203125, 0.031659603118896484, 0.03364849090576172, 0.03563737869262695, 0.03762626647949219, 0.03961515426635742, 0.041604042053222656, 0.04359292984008789, 0.045581817626953125, 0.04757070541381836, 0.049559593200683594, 0.05154848098754883, 0.05353736877441406, 0.0555262565612793, 0.05751514434814453, 0.059504032135009766, 0.061492919921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 10.0, 18.0, 18.0, 17.0, 39.0, 30.0, 52.0, 47.0, 83.0, 74.0, 113.0, 153.0, 297.0, 946.0, 4453.0, 50037.0, 730873.0, 245288.0, 12848.0, 1903.0, 510.0, 200.0, 133.0, 80.0, 52.0, 61.0, 48.0, 46.0, 26.0, 26.0, 14.0, 14.0, 13.0, 7.0, 5.0, 7.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028289794921875, -0.02727031707763672, -0.026250839233398438, -0.025231361389160156, -0.024211883544921875, -0.023192405700683594, -0.022172927856445312, -0.02115345001220703, -0.02013397216796875, -0.01911449432373047, -0.018095016479492188, -0.017075538635253906, -0.016056060791015625, -0.015036582946777344, -0.014017105102539062, -0.012997627258300781, -0.0119781494140625, -0.010958671569824219, -0.009939193725585938, -0.008919715881347656, -0.007900238037109375, -0.006880760192871094, -0.0058612823486328125, -0.004841804504394531, -0.00382232666015625, -0.0028028488159179688, -0.0017833709716796875, -0.0007638931274414062, 0.000255584716796875, 0.0012750625610351562, 0.0022945404052734375, 0.0033140182495117188, 0.00433349609375, 0.005352973937988281, 0.0063724517822265625, 0.007391929626464844, 0.008411407470703125, 0.009430885314941406, 0.010450363159179688, 0.011469841003417969, 0.01248931884765625, 0.013508796691894531, 0.014528274536132812, 0.015547752380371094, 0.016567230224609375, 0.017586708068847656, 0.018606185913085938, 0.01962566375732422, 0.0206451416015625, 0.02166461944580078, 0.022684097290039062, 0.023703575134277344, 0.024723052978515625, 0.025742530822753906, 0.026762008666992188, 0.02778148651123047, 0.02880096435546875, 0.02982044219970703, 0.030839920043945312, 0.031859397888183594, 0.032878875732421875, 0.033898353576660156, 0.03491783142089844, 0.03593730926513672, 0.036956787109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 9.0, 16.0, 21.0, 23.0, 31.0, 27.0, 40.0, 41.0, 44.0, 49.0, 49.0, 58.0, 64.0, 62.0, 62.0, 64.0, 43.0, 47.0, 39.0, 42.0, 27.0, 32.0, 28.0, 18.0, 16.0, 10.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032623291015625, -0.031708478927612305, -0.03079366683959961, -0.029878854751586914, -0.02896404266357422, -0.028049230575561523, -0.027134418487548828, -0.026219606399536133, -0.025304794311523438, -0.024389982223510742, -0.023475170135498047, -0.02256035804748535, -0.021645545959472656, -0.02073073387145996, -0.019815921783447266, -0.01890110969543457, -0.017986297607421875, -0.01707148551940918, -0.016156673431396484, -0.015241861343383789, -0.014327049255371094, -0.013412237167358398, -0.012497425079345703, -0.011582612991333008, -0.010667800903320312, -0.009752988815307617, -0.008838176727294922, -0.007923364639282227, -0.007008552551269531, -0.006093740463256836, -0.005178928375244141, -0.004264116287231445, -0.00334930419921875, -0.0024344921112060547, -0.0015196800231933594, -0.0006048679351806641, 0.00030994415283203125, 0.0012247562408447266, 0.002139568328857422, 0.003054380416870117, 0.0039691925048828125, 0.004884004592895508, 0.005798816680908203, 0.0067136287689208984, 0.007628440856933594, 0.008543252944946289, 0.009458065032958984, 0.01037287712097168, 0.011287689208984375, 0.01220250129699707, 0.013117313385009766, 0.014032125473022461, 0.014946937561035156, 0.01586174964904785, 0.016776561737060547, 0.017691373825073242, 0.018606185913085938, 0.019520998001098633, 0.020435810089111328, 0.021350622177124023, 0.02226543426513672, 0.023180246353149414, 0.02409505844116211, 0.025009870529174805, 0.0259246826171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 11.0, 3.0, 16.0, 13.0, 22.0, 38.0, 34.0, 54.0, 106.0, 133.0, 254.0, 377.0, 601.0, 1062.0, 1938.0, 3616.0, 7282.0, 16373.0, 44282.0, 173629.0, 535097.0, 184770.0, 45772.0, 17014.0, 7466.0, 3754.0, 1990.0, 1114.0, 654.0, 383.0, 234.0, 134.0, 112.0, 78.0, 48.0, 28.0, 10.0, 11.0, 10.0, 8.0, 11.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00585174560546875, -0.005659997463226318, -0.005468249320983887, -0.005276501178741455, -0.0050847530364990234, -0.004893004894256592, -0.00470125675201416, -0.0045095086097717285, -0.004317760467529297, -0.004126012325286865, -0.003934264183044434, -0.003742516040802002, -0.0035507678985595703, -0.0033590197563171387, -0.003167271614074707, -0.0029755234718322754, -0.0027837753295898438, -0.002592027187347412, -0.0024002790451049805, -0.002208530902862549, -0.002016782760620117, -0.0018250346183776855, -0.001633286476135254, -0.0014415383338928223, -0.0012497901916503906, -0.001058042049407959, -0.0008662939071655273, -0.0006745457649230957, -0.00048279762268066406, -0.0002910494804382324, -9.930133819580078e-05, 9.244680404663086e-05, 0.0002841949462890625, 0.00047594308853149414, 0.0006676912307739258, 0.0008594393730163574, 0.001051187515258789, 0.0012429356575012207, 0.0014346837997436523, 0.001626431941986084, 0.0018181800842285156, 0.0020099282264709473, 0.002201676368713379, 0.0023934245109558105, 0.002585172653198242, 0.002776920795440674, 0.0029686689376831055, 0.003160417079925537, 0.0033521652221679688, 0.0035439133644104004, 0.003735661506652832, 0.003927409648895264, 0.004119157791137695, 0.004310905933380127, 0.004502654075622559, 0.00469440221786499, 0.004886150360107422, 0.0050778985023498535, 0.005269646644592285, 0.005461394786834717, 0.0056531429290771484, 0.00584489107131958, 0.006036639213562012, 0.006228387355804443, 0.006420135498046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 7.0, 18.0, 27.0, 27.0, 58.0, 153.0, 220.0, 203.0, 118.0, 88.0, 34.0, 16.0, 13.0, 6.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.00021215900778770447, -0.0002064034342765808, -0.00020064786076545715, -0.0001948922872543335, -0.00018913671374320984, -0.00018338114023208618, -0.00017762556672096252, -0.00017186999320983887, -0.0001661144196987152, -0.00016035884618759155, -0.0001546032726764679, -0.00014884769916534424, -0.00014309212565422058, -0.00013733655214309692, -0.00013158097863197327, -0.0001258254051208496, -0.00012006983160972595, -0.0001143142580986023, -0.00010855868458747864, -0.00010280311107635498, -9.704753756523132e-05, -9.129196405410767e-05, -8.553639054298401e-05, -7.978081703186035e-05, -7.40252435207367e-05, -6.826967000961304e-05, -6.251409649848938e-05, -5.675852298736572e-05, -5.1002949476242065e-05, -4.524737596511841e-05, -3.949180245399475e-05, -3.3736228942871094e-05, -2.7980655431747437e-05, -2.222508192062378e-05, -1.6469508409500122e-05, -1.0713934898376465e-05, -4.958361387252808e-06, 7.972121238708496e-07, 6.552785634994507e-06, 1.2308359146118164e-05, 1.806393265724182e-05, 2.381950616836548e-05, 2.9575079679489136e-05, 3.533065319061279e-05, 4.108622670173645e-05, 4.684180021286011e-05, 5.2597373723983765e-05, 5.835294723510742e-05, 6.410852074623108e-05, 6.986409425735474e-05, 7.56196677684784e-05, 8.137524127960205e-05, 8.713081479072571e-05, 9.288638830184937e-05, 9.864196181297302e-05, 0.00010439753532409668, 0.00011015310883522034, 0.000115908682346344, 0.00012166425585746765, 0.0001274198293685913, 0.00013317540287971497, 0.00013893097639083862, 0.00014468654990196228, 0.00015044212341308594]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 14.0, 32.0, 37.0, 77.0, 126.0, 256.0, 540.0, 1222.0, 3426.0, 14051.0, 112413.0, 811934.0, 87091.0, 12046.0, 3112.0, 1101.0, 477.0, 238.0, 140.0, 99.0, 40.0, 30.0, 13.0, 11.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0166473388671875, -0.016177773475646973, -0.015708208084106445, -0.015238642692565918, -0.01476907730102539, -0.014299511909484863, -0.013829946517944336, -0.013360381126403809, -0.012890815734863281, -0.012421250343322754, -0.011951684951782227, -0.0114821195602417, -0.011012554168701172, -0.010542988777160645, -0.010073423385620117, -0.00960385799407959, -0.009134292602539062, -0.008664727210998535, -0.008195161819458008, -0.0077255964279174805, -0.007256031036376953, -0.006786465644836426, -0.0063169002532958984, -0.005847334861755371, -0.005377769470214844, -0.004908204078674316, -0.004438638687133789, -0.003969073295593262, -0.0034995079040527344, -0.003029942512512207, -0.0025603771209716797, -0.0020908117294311523, -0.001621246337890625, -0.0011516809463500977, -0.0006821155548095703, -0.00021255016326904297, 0.0002570152282714844, 0.0007265806198120117, 0.001196146011352539, 0.0016657114028930664, 0.0021352767944335938, 0.002604842185974121, 0.0030744075775146484, 0.0035439729690551758, 0.004013538360595703, 0.0044831037521362305, 0.004952669143676758, 0.005422234535217285, 0.0058917999267578125, 0.00636136531829834, 0.006830930709838867, 0.0073004961013793945, 0.007770061492919922, 0.00823962688446045, 0.008709192276000977, 0.009178757667541504, 0.009648323059082031, 0.010117888450622559, 0.010587453842163086, 0.011057019233703613, 0.01152658462524414, 0.011996150016784668, 0.012465715408325195, 0.012935280799865723, 0.01340484619140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 7.0, 8.0, 9.0, 12.0, 21.0, 25.0, 34.0, 70.0, 117.0, 114.0, 152.0, 135.0, 91.0, 66.0, 33.0, 21.0, 17.0, 15.0, 5.0, 13.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006931304931640625, -0.006607115268707275, -0.006282925605773926, -0.005958735942840576, -0.0056345462799072266, -0.005310356616973877, -0.004986166954040527, -0.004661977291107178, -0.004337787628173828, -0.0040135979652404785, -0.003689408302307129, -0.0033652186393737793, -0.0030410289764404297, -0.00271683931350708, -0.0023926496505737305, -0.002068459987640381, -0.0017442703247070312, -0.0014200806617736816, -0.001095890998840332, -0.0007717013359069824, -0.0004475116729736328, -0.0001233220100402832, 0.0002008676528930664, 0.000525057315826416, 0.0008492469787597656, 0.0011734366416931152, 0.0014976263046264648, 0.0018218159675598145, 0.002146005630493164, 0.0024701952934265137, 0.0027943849563598633, 0.003118574619293213, 0.0034427642822265625, 0.003766953945159912, 0.004091143608093262, 0.004415333271026611, 0.004739522933959961, 0.0050637125968933105, 0.00538790225982666, 0.00571209192276001, 0.006036281585693359, 0.006360471248626709, 0.006684660911560059, 0.007008850574493408, 0.007333040237426758, 0.007657229900360107, 0.007981419563293457, 0.008305609226226807, 0.008629798889160156, 0.008953988552093506, 0.009278178215026855, 0.009602367877960205, 0.009926557540893555, 0.010250747203826904, 0.010574936866760254, 0.010899126529693604, 0.011223316192626953, 0.011547505855560303, 0.011871695518493652, 0.012195885181427002, 0.012520074844360352, 0.012844264507293701, 0.01316845417022705, 0.0134926438331604, 0.01381683349609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 12.0, 112.0, 586.0, 247.0, 37.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15375575423240662, -0.14257372915744781, -0.131391704082489, -0.12020967155694962, -0.10902764648199081, -0.09784562140703201, -0.08666358888149261, -0.07548156380653381, -0.06429953873157501, -0.05311751365661621, -0.04193548485636711, -0.03075345605611801, -0.01957143098115921, -0.008389405906200409, 0.0027926266193389893, 0.01397465169429779, 0.025156676769256592, 0.03633870184421539, 0.04752073064446449, 0.05870275944471359, 0.0698847845196724, 0.0810668095946312, 0.0922488421201706, 0.1034308671951294, 0.1146128922700882, 0.125794917345047, 0.1369769424200058, 0.1481589674949646, 0.1593410074710846, 0.1705230176448822, 0.1817050576210022, 0.192887082695961, 0.2040690779685974, 0.2152511030435562, 0.22643312811851501, 0.237615168094635, 0.24879717826843262, 0.2599792182445526, 0.2711612582206726, 0.2823432683944702, 0.2935252785682678, 0.3047073185443878, 0.3158893287181854, 0.3270713686943054, 0.338253378868103, 0.349435418844223, 0.360617458820343, 0.3717994689941406, 0.3829815089702606, 0.3941635489463806, 0.4053455591201782, 0.4165275990962982, 0.4277096092700958, 0.4388916492462158, 0.4500736594200134, 0.4612556993961334, 0.4724377393722534, 0.4836197793483734, 0.494801789522171, 0.505983829498291, 0.5171658396720886, 0.5283478498458862, 0.5395299196243286, 0.5507119297981262, 0.5618939399719238]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 16.0, 17.0, 17.0, 19.0, 19.0, 32.0, 36.0, 36.0, 34.0, 41.0, 38.0, 40.0, 51.0, 48.0, 45.0, 53.0, 49.0, 36.0, 35.0, 37.0, 31.0, 33.0, 29.0, 31.0, 31.0, 31.0, 16.0, 15.0, 16.0, 11.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07513010501861572, -0.07288433611392975, -0.07063857465982437, -0.0683928057551384, -0.06614704430103302, -0.06390127539634705, -0.06165550649166107, -0.059409741312265396, -0.05716397613286972, -0.054918210953474045, -0.05267244577407837, -0.050426676869392395, -0.04818091168999672, -0.045935146510601044, -0.04368937760591507, -0.041443612426519394, -0.03919784724712372, -0.03695208206772804, -0.03470631688833237, -0.03246054798364639, -0.030214782804250717, -0.02796901762485504, -0.025723250582814217, -0.02347748354077339, -0.021231718361377716, -0.01898595318198204, -0.016740186139941216, -0.014494420029222965, -0.012248653918504715, -0.010002887807786465, -0.007757121697068214, -0.0055113546550273895, -0.003265589475631714, -0.0010198233649134636, 0.0012259427458047867, 0.003471708856523037, 0.005717474967241287, 0.007963241077959538, 0.010209007188677788, 0.012454774230718613, 0.014700539410114288, 0.016946304589509964, 0.01919207163155079, 0.021437838673591614, 0.02368360385298729, 0.025929369032382965, 0.02817513607442379, 0.030420903116464615, 0.03266666829586029, 0.034912433475255966, 0.03715819865465164, 0.039403967559337616, 0.04164973273873329, 0.04389549791812897, 0.04614126682281494, 0.04838703200221062, 0.05063279718160629, 0.05287856236100197, 0.055124327540397644, 0.05737009644508362, 0.059615861624479294, 0.06186162680387497, 0.06410739570856094, 0.06635315716266632, 0.0685989260673523]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 3.0, 8.0, 16.0, 25.0, 37.0, 93.0, 286.0, 658.0, 1166.0, 1485.0, 2422.0, 8542.0, 238502.0, 3910507.0, 23033.0, 3787.0, 1735.0, 819.0, 387.0, 291.0, 244.0, 99.0, 40.0, 25.0, 18.0, 12.0, 11.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.0379328727722168, -0.036589622497558594, -0.03524637222290039, -0.03390312194824219, -0.032559871673583984, -0.03121662139892578, -0.029873371124267578, -0.028530120849609375, -0.027186870574951172, -0.02584362030029297, -0.024500370025634766, -0.023157119750976562, -0.02181386947631836, -0.020470619201660156, -0.019127368927001953, -0.01778411865234375, -0.016440868377685547, -0.015097618103027344, -0.01375436782836914, -0.012411117553710938, -0.011067867279052734, -0.009724617004394531, -0.008381366729736328, -0.007038116455078125, -0.005694866180419922, -0.004351615905761719, -0.0030083656311035156, -0.0016651153564453125, -0.0003218650817871094, 0.0010213851928710938, 0.002364635467529297, 0.0037078857421875, 0.005051136016845703, 0.006394386291503906, 0.007737636566162109, 0.009080886840820312, 0.010424137115478516, 0.011767387390136719, 0.013110637664794922, 0.014453887939453125, 0.015797138214111328, 0.01714038848876953, 0.018483638763427734, 0.019826889038085938, 0.02117013931274414, 0.022513389587402344, 0.023856639862060547, 0.02519989013671875, 0.026543140411376953, 0.027886390686035156, 0.02922964096069336, 0.030572891235351562, 0.031916141510009766, 0.03325939178466797, 0.03460264205932617, 0.035945892333984375, 0.03728914260864258, 0.03863239288330078, 0.039975643157958984, 0.04131889343261719, 0.04266214370727539, 0.044005393981933594, 0.0453486442565918, 0.04669189453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 15.0, 88.0, 262.0, 372.0, 201.0, 53.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06346893310546875, -0.0615081787109375, -0.05954742431640625, -0.057586669921875, -0.05562591552734375, -0.0536651611328125, -0.05170440673828125, -0.04974365234375, -0.04778289794921875, -0.0458221435546875, -0.04386138916015625, -0.041900634765625, -0.03993988037109375, -0.0379791259765625, -0.03601837158203125, -0.0340576171875, -0.03209686279296875, -0.0301361083984375, -0.02817535400390625, -0.026214599609375, -0.02425384521484375, -0.0222930908203125, -0.02033233642578125, -0.01837158203125, -0.01641082763671875, -0.0144500732421875, -0.01248931884765625, -0.010528564453125, -0.00856781005859375, -0.0066070556640625, -0.00464630126953125, -0.002685546875, -0.00072479248046875, 0.0012359619140625, 0.00319671630859375, 0.005157470703125, 0.00711822509765625, 0.0090789794921875, 0.01103973388671875, 0.01300048828125, 0.01496124267578125, 0.0169219970703125, 0.01888275146484375, 0.020843505859375, 0.02280426025390625, 0.0247650146484375, 0.02672576904296875, 0.0286865234375, 0.03064727783203125, 0.0326080322265625, 0.03456878662109375, 0.036529541015625, 0.03849029541015625, 0.0404510498046875, 0.04241180419921875, 0.04437255859375, 0.04633331298828125, 0.0482940673828125, 0.05025482177734375, 0.052215576171875, 0.05417633056640625, 0.0561370849609375, 0.05809783935546875, 0.06005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 6.0, 12.0, 13.0, 16.0, 20.0, 28.0, 55.0, 90.0, 120.0, 193.0, 296.0, 603.0, 1236.0, 3080.0, 8707.0, 32822.0, 186715.0, 3540404.0, 351426.0, 48814.0, 12431.0, 3989.0, 1599.0, 696.0, 363.0, 187.0, 117.0, 76.0, 43.0, 30.0, 31.0, 13.0, 14.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0187835693359375, -0.018284320831298828, -0.017785072326660156, -0.017285823822021484, -0.016786575317382812, -0.01628732681274414, -0.01578807830810547, -0.015288829803466797, -0.014789581298828125, -0.014290332794189453, -0.013791084289550781, -0.01329183578491211, -0.012792587280273438, -0.012293338775634766, -0.011794090270996094, -0.011294841766357422, -0.01079559326171875, -0.010296344757080078, -0.009797096252441406, -0.009297847747802734, -0.008798599243164062, -0.00829935073852539, -0.007800102233886719, -0.007300853729248047, -0.006801605224609375, -0.006302356719970703, -0.005803108215332031, -0.005303859710693359, -0.0048046112060546875, -0.004305362701416016, -0.0038061141967773438, -0.003306865692138672, -0.0028076171875, -0.002308368682861328, -0.0018091201782226562, -0.0013098716735839844, -0.0008106231689453125, -0.0003113746643066406, 0.00018787384033203125, 0.0006871223449707031, 0.001186370849609375, 0.0016856193542480469, 0.0021848678588867188, 0.0026841163635253906, 0.0031833648681640625, 0.0036826133728027344, 0.004181861877441406, 0.004681110382080078, 0.00518035888671875, 0.005679607391357422, 0.006178855895996094, 0.006678104400634766, 0.0071773529052734375, 0.007676601409912109, 0.008175849914550781, 0.008675098419189453, 0.009174346923828125, 0.009673595428466797, 0.010172843933105469, 0.01067209243774414, 0.011171340942382812, 0.011670589447021484, 0.012169837951660156, 0.012669086456298828, 0.0131683349609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 2.0, 7.0, 15.0, 20.0, 20.0, 32.0, 45.0, 61.0, 112.0, 246.0, 593.0, 1277.0, 808.0, 327.0, 150.0, 95.0, 58.0, 59.0, 32.0, 27.0, 16.0, 8.0, 11.0, 9.0, 6.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01275634765625, -0.012376904487609863, -0.011997461318969727, -0.01161801815032959, -0.011238574981689453, -0.010859131813049316, -0.01047968864440918, -0.010100245475769043, -0.009720802307128906, -0.00934135913848877, -0.008961915969848633, -0.008582472801208496, -0.00820302963256836, -0.007823586463928223, -0.007444143295288086, -0.007064700126647949, -0.0066852569580078125, -0.006305813789367676, -0.005926370620727539, -0.005546927452087402, -0.005167484283447266, -0.004788041114807129, -0.004408597946166992, -0.0040291547775268555, -0.0036497116088867188, -0.003270268440246582, -0.0028908252716064453, -0.0025113821029663086, -0.002131938934326172, -0.0017524957656860352, -0.0013730525970458984, -0.0009936094284057617, -0.000614166259765625, -0.00023472309112548828, 0.00014472007751464844, 0.0005241632461547852, 0.0009036064147949219, 0.0012830495834350586, 0.0016624927520751953, 0.002041935920715332, 0.0024213790893554688, 0.0028008222579956055, 0.003180265426635742, 0.003559708595275879, 0.003939151763916016, 0.004318594932556152, 0.004698038101196289, 0.005077481269836426, 0.0054569244384765625, 0.005836367607116699, 0.006215810775756836, 0.006595253944396973, 0.006974697113037109, 0.007354140281677246, 0.007733583450317383, 0.00811302661895752, 0.008492469787597656, 0.008871912956237793, 0.00925135612487793, 0.009630799293518066, 0.010010242462158203, 0.01038968563079834, 0.010769128799438477, 0.011148571968078613, 0.01152801513671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 13.0, 46.0, 143.0, 360.0, 273.0, 121.0, 34.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17345602810382843, -0.16957254707813263, -0.16568908095359802, -0.16180559992790222, -0.15792211890220642, -0.15403863787651062, -0.150155171751976, -0.1462716907262802, -0.1423882246017456, -0.1385047435760498, -0.1346212774515152, -0.1307377964258194, -0.1268543154001236, -0.12297084182500839, -0.11908736824989319, -0.11520388722419739, -0.11132040619850159, -0.10743693262338638, -0.10355345159769058, -0.09966997802257538, -0.09578649699687958, -0.09190302342176437, -0.08801954984664917, -0.08413606882095337, -0.08025259524583817, -0.07636912167072296, -0.07248564064502716, -0.06860216706991196, -0.06471869349479675, -0.06083521246910095, -0.05695173889398575, -0.053068261593580246, -0.04918479174375534, -0.04530131444334984, -0.041417837142944336, -0.03753436356782913, -0.03365088626742363, -0.029767408967018127, -0.025883933529257774, -0.02200045809149742, -0.01811698079109192, -0.014233504422008991, -0.010350028052926064, -0.006466551683843136, -0.002583075314760208, 0.0013004019856452942, 0.005183877423405647, 0.009067352861166, 0.012950830161571503, 0.016834307461977005, 0.020717782899737358, 0.02460125833749771, 0.028484735637903214, 0.032368212938308716, 0.03625168651342392, 0.04013516381382942, 0.044018641114234924, 0.04790211841464043, 0.05178559571504593, 0.05566906929016113, 0.059552546590566635, 0.06343602389097214, 0.06731949746608734, 0.07120297849178314, 0.07508645206689835]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 5.0, 6.0, 15.0, 20.0, 17.0, 15.0, 19.0, 20.0, 30.0, 36.0, 26.0, 32.0, 40.0, 38.0, 34.0, 39.0, 50.0, 39.0, 44.0, 40.0, 40.0, 46.0, 38.0, 32.0, 33.0, 28.0, 32.0, 20.0, 19.0, 19.0, 14.0, 18.0, 16.0, 15.0, 7.0, 4.0, 6.0, 5.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02538299560546875, -0.024583134800195694, -0.023783275857567787, -0.02298341691493988, -0.022183556109666824, -0.02138369530439377, -0.02058383636176586, -0.019783977419137955, -0.0189841166138649, -0.018184255808591843, -0.017384396865963936, -0.01658453792333603, -0.015784677118062973, -0.014984817244112492, -0.01418495737016201, -0.013385097496211529, -0.012585237622261047, -0.011785377748310566, -0.010985517874360085, -0.010185658000409603, -0.009385798126459122, -0.00858593825250864, -0.007786078378558159, -0.0069862185046076775, -0.006186358630657196, -0.005386498756706715, -0.004586638882756233, -0.003786779008805752, -0.0029869191348552704, -0.002187059260904789, -0.0013871993869543076, -0.0005873395130038261, 0.00021252036094665527, 0.0010123802348971367, 0.001812240108847618, 0.0026120999827980995, 0.003411959856748581, 0.004211819730699062, 0.005011679604649544, 0.005811539478600025, 0.006611399352550507, 0.007411259226500988, 0.00821111910045147, 0.00901097897440195, 0.009810838848352432, 0.010610698722302914, 0.011410558596253395, 0.012210418470203876, 0.013010278344154358, 0.01381013821810484, 0.01460999809205532, 0.015409857966005802, 0.016209717839956284, 0.01700957864522934, 0.017809437587857246, 0.018609296530485153, 0.01940915733575821, 0.020209018141031265, 0.021008877083659172, 0.02180873602628708, 0.022608596831560135, 0.02340845763683319, 0.024208316579461098, 0.025008175522089005, 0.02580803632736206]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 12.0, 13.0, 19.0, 13.0, 25.0, 24.0, 30.0, 39.0, 69.0, 76.0, 121.0, 141.0, 195.0, 275.0, 367.0, 624.0, 1114.0, 3213.0, 22214.0, 548118.0, 447588.0, 18395.0, 2893.0, 969.0, 576.0, 392.0, 251.0, 193.0, 123.0, 97.0, 92.0, 59.0, 46.0, 46.0, 35.0, 16.0, 17.0, 12.0, 13.0, 7.0, 5.0, 3.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.043548583984375, -0.042095184326171875, -0.04064178466796875, -0.039188385009765625, -0.0377349853515625, -0.036281585693359375, -0.03482818603515625, -0.033374786376953125, -0.03192138671875, -0.030467987060546875, -0.02901458740234375, -0.027561187744140625, -0.0261077880859375, -0.024654388427734375, -0.02320098876953125, -0.021747589111328125, -0.020294189453125, -0.018840789794921875, -0.01738739013671875, -0.015933990478515625, -0.0144805908203125, -0.013027191162109375, -0.01157379150390625, -0.010120391845703125, -0.0086669921875, -0.007213592529296875, -0.00576019287109375, -0.004306793212890625, -0.0028533935546875, -0.001399993896484375, 5.340576171875e-05, 0.001506805419921875, 0.002960205078125, 0.004413604736328125, 0.00586700439453125, 0.007320404052734375, 0.0087738037109375, 0.010227203369140625, 0.01168060302734375, 0.013134002685546875, 0.01458740234375, 0.016040802001953125, 0.01749420166015625, 0.018947601318359375, 0.0204010009765625, 0.021854400634765625, 0.02330780029296875, 0.024761199951171875, 0.026214599609375, 0.027667999267578125, 0.02912139892578125, 0.030574798583984375, 0.0320281982421875, 0.033481597900390625, 0.03493499755859375, 0.036388397216796875, 0.037841796875, 0.039295196533203125, 0.04074859619140625, 0.042201995849609375, 0.0436553955078125, 0.045108795166015625, 0.04656219482421875, 0.048015594482421875, 0.049468994140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 25.0, 118.0, 319.0, 361.0, 145.0, 26.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06493473052978516, -0.06291389465332031, -0.06089305877685547, -0.058872222900390625, -0.05685138702392578, -0.05483055114746094, -0.052809715270996094, -0.05078887939453125, -0.048768043518066406, -0.04674720764160156, -0.04472637176513672, -0.042705535888671875, -0.04068470001220703, -0.03866386413574219, -0.036643028259277344, -0.0346221923828125, -0.032601356506347656, -0.030580520629882812, -0.02855968475341797, -0.026538848876953125, -0.02451801300048828, -0.022497177124023438, -0.020476341247558594, -0.01845550537109375, -0.016434669494628906, -0.014413833618164062, -0.012392997741699219, -0.010372161865234375, -0.008351325988769531, -0.0063304901123046875, -0.004309654235839844, -0.002288818359375, -0.00026798248291015625, 0.0017528533935546875, 0.0037736892700195312, 0.005794525146484375, 0.007815361022949219, 0.009836196899414062, 0.011857032775878906, 0.01387786865234375, 0.015898704528808594, 0.017919540405273438, 0.01994037628173828, 0.021961212158203125, 0.02398204803466797, 0.026002883911132812, 0.028023719787597656, 0.0300445556640625, 0.032065391540527344, 0.03408622741699219, 0.03610706329345703, 0.038127899169921875, 0.04014873504638672, 0.04216957092285156, 0.044190406799316406, 0.04621124267578125, 0.048232078552246094, 0.05025291442871094, 0.05227375030517578, 0.054294586181640625, 0.05631542205810547, 0.05833625793457031, 0.060357093811035156, 0.0623779296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 10.0, 11.0, 19.0, 14.0, 30.0, 57.0, 98.0, 150.0, 334.0, 1064.0, 4389.0, 45974.0, 811919.0, 172981.0, 8792.0, 1656.0, 540.0, 200.0, 104.0, 53.0, 44.0, 36.0, 19.0, 11.0, 10.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.056157588958740234, -0.05466747283935547, -0.0531773567199707, -0.05168724060058594, -0.05019712448120117, -0.048707008361816406, -0.04721689224243164, -0.045726776123046875, -0.04423666000366211, -0.042746543884277344, -0.04125642776489258, -0.03976631164550781, -0.03827619552612305, -0.03678607940673828, -0.035295963287353516, -0.03380584716796875, -0.032315731048583984, -0.03082561492919922, -0.029335498809814453, -0.027845382690429688, -0.026355266571044922, -0.024865150451660156, -0.02337503433227539, -0.021884918212890625, -0.02039480209350586, -0.018904685974121094, -0.017414569854736328, -0.015924453735351562, -0.014434337615966797, -0.012944221496582031, -0.011454105377197266, -0.0099639892578125, -0.008473873138427734, -0.006983757019042969, -0.005493640899658203, -0.0040035247802734375, -0.002513408660888672, -0.0010232925415039062, 0.0004668235778808594, 0.001956939697265625, 0.0034470558166503906, 0.004937171936035156, 0.006427288055419922, 0.007917404174804688, 0.009407520294189453, 0.010897636413574219, 0.012387752532958984, 0.01387786865234375, 0.015367984771728516, 0.01685810089111328, 0.018348217010498047, 0.019838333129882812, 0.021328449249267578, 0.022818565368652344, 0.02430868148803711, 0.025798797607421875, 0.02728891372680664, 0.028779029846191406, 0.030269145965576172, 0.03175926208496094, 0.0332493782043457, 0.03473949432373047, 0.036229610443115234, 0.0377197265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 5.0, 11.0, 16.0, 24.0, 24.0, 25.0, 28.0, 40.0, 51.0, 46.0, 53.0, 43.0, 57.0, 56.0, 58.0, 54.0, 43.0, 50.0, 59.0, 40.0, 44.0, 35.0, 17.0, 24.0, 24.0, 15.0, 10.0, 10.0, 4.0, 10.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024688720703125, -0.02373027801513672, -0.022771835327148438, -0.021813392639160156, -0.020854949951171875, -0.019896507263183594, -0.018938064575195312, -0.01797962188720703, -0.01702117919921875, -0.01606273651123047, -0.015104293823242188, -0.014145851135253906, -0.013187408447265625, -0.012228965759277344, -0.011270523071289062, -0.010312080383300781, -0.0093536376953125, -0.008395195007324219, -0.0074367523193359375, -0.006478309631347656, -0.005519866943359375, -0.004561424255371094, -0.0036029815673828125, -0.0026445388793945312, -0.00168609619140625, -0.0007276535034179688, 0.0002307891845703125, 0.0011892318725585938, 0.002147674560546875, 0.0031061172485351562, 0.0040645599365234375, 0.005023002624511719, 0.0059814453125, 0.006939888000488281, 0.007898330688476562, 0.008856773376464844, 0.009815216064453125, 0.010773658752441406, 0.011732101440429688, 0.012690544128417969, 0.01364898681640625, 0.014607429504394531, 0.015565872192382812, 0.016524314880371094, 0.017482757568359375, 0.018441200256347656, 0.019399642944335938, 0.02035808563232422, 0.0213165283203125, 0.02227497100830078, 0.023233413696289062, 0.024191856384277344, 0.025150299072265625, 0.026108741760253906, 0.027067184448242188, 0.02802562713623047, 0.02898406982421875, 0.02994251251220703, 0.030900955200195312, 0.031859397888183594, 0.032817840576171875, 0.033776283264160156, 0.03473472595214844, 0.03569316864013672, 0.036651611328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 9.0, 15.0, 29.0, 16.0, 25.0, 46.0, 55.0, 73.0, 86.0, 141.0, 174.0, 254.0, 357.0, 420.0, 629.0, 808.0, 1248.0, 1697.0, 2507.0, 3974.0, 7201.0, 19719.0, 92532.0, 713864.0, 153103.0, 26993.0, 8649.0, 4466.0, 2785.0, 1867.0, 1287.0, 917.0, 660.0, 494.0, 386.0, 271.0, 182.0, 157.0, 133.0, 86.0, 55.0, 37.0, 32.0, 16.0, 26.0, 17.0, 10.0, 8.0, 10.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0113067626953125, -0.010949134826660156, -0.010591506958007812, -0.010233879089355469, -0.009876251220703125, -0.009518623352050781, -0.009160995483398438, -0.008803367614746094, -0.00844573974609375, -0.008088111877441406, -0.0077304840087890625, -0.007372856140136719, -0.007015228271484375, -0.006657600402832031, -0.0062999725341796875, -0.005942344665527344, -0.005584716796875, -0.005227088928222656, -0.0048694610595703125, -0.004511833190917969, -0.004154205322265625, -0.0037965774536132812, -0.0034389495849609375, -0.0030813217163085938, -0.00272369384765625, -0.0023660659790039062, -0.0020084381103515625, -0.0016508102416992188, -0.001293182373046875, -0.0009355545043945312, -0.0005779266357421875, -0.00022029876708984375, 0.0001373291015625, 0.0004949569702148438, 0.0008525848388671875, 0.0012102127075195312, 0.001567840576171875, 0.0019254684448242188, 0.0022830963134765625, 0.0026407241821289062, 0.00299835205078125, 0.0033559799194335938, 0.0037136077880859375, 0.004071235656738281, 0.004428863525390625, 0.004786491394042969, 0.0051441192626953125, 0.005501747131347656, 0.005859375, 0.006217002868652344, 0.0065746307373046875, 0.006932258605957031, 0.007289886474609375, 0.007647514343261719, 0.008005142211914062, 0.008362770080566406, 0.00872039794921875, 0.009078025817871094, 0.009435653686523438, 0.009793281555175781, 0.010150909423828125, 0.010508537292480469, 0.010866165161132812, 0.011223793029785156, 0.0115814208984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 8.0, 19.0, 36.0, 50.0, 81.0, 121.0, 164.0, 140.0, 146.0, 90.0, 40.0, 34.0, 18.0, 13.0, 5.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.0001427382230758667, -0.00013813376426696777, -0.00013352930545806885, -0.00012892484664916992, -0.000124320387840271, -0.00011971592903137207, -0.00011511147022247314, -0.00011050701141357422, -0.00010590255260467529, -0.00010129809379577637, -9.669363498687744e-05, -9.208917617797852e-05, -8.748471736907959e-05, -8.288025856018066e-05, -7.827579975128174e-05, -7.367134094238281e-05, -6.906688213348389e-05, -6.446242332458496e-05, -5.9857964515686035e-05, -5.525350570678711e-05, -5.0649046897888184e-05, -4.604458808898926e-05, -4.144012928009033e-05, -3.6835670471191406e-05, -3.223121166229248e-05, -2.7626752853393555e-05, -2.302229404449463e-05, -1.8417835235595703e-05, -1.3813376426696777e-05, -9.208917617797852e-06, -4.604458808898926e-06, 0.0, 4.604458808898926e-06, 9.208917617797852e-06, 1.3813376426696777e-05, 1.8417835235595703e-05, 2.302229404449463e-05, 2.7626752853393555e-05, 3.223121166229248e-05, 3.6835670471191406e-05, 4.144012928009033e-05, 4.604458808898926e-05, 5.0649046897888184e-05, 5.525350570678711e-05, 5.9857964515686035e-05, 6.446242332458496e-05, 6.906688213348389e-05, 7.367134094238281e-05, 7.827579975128174e-05, 8.288025856018066e-05, 8.748471736907959e-05, 9.208917617797852e-05, 9.669363498687744e-05, 0.00010129809379577637, 0.00010590255260467529, 0.00011050701141357422, 0.00011511147022247314, 0.00011971592903137207, 0.000124320387840271, 0.00012892484664916992, 0.00013352930545806885, 0.00013813376426696777, 0.0001427382230758667, 0.00014734268188476562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 4.0, 5.0, 6.0, 11.0, 12.0, 12.0, 25.0, 31.0, 50.0, 75.0, 114.0, 215.0, 388.0, 775.0, 1459.0, 3297.0, 8730.0, 33974.0, 346728.0, 588613.0, 45977.0, 10629.0, 3685.0, 1802.0, 827.0, 452.0, 245.0, 146.0, 86.0, 59.0, 34.0, 26.0, 17.0, 11.0, 9.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.016937255859375, -0.016425371170043945, -0.01591348648071289, -0.015401601791381836, -0.014889717102050781, -0.014377832412719727, -0.013865947723388672, -0.013354063034057617, -0.012842178344726562, -0.012330293655395508, -0.011818408966064453, -0.011306524276733398, -0.010794639587402344, -0.010282754898071289, -0.009770870208740234, -0.00925898551940918, -0.008747100830078125, -0.00823521614074707, -0.007723331451416016, -0.007211446762084961, -0.006699562072753906, -0.0061876773834228516, -0.005675792694091797, -0.005163908004760742, -0.0046520233154296875, -0.004140138626098633, -0.003628253936767578, -0.0031163692474365234, -0.0026044845581054688, -0.002092599868774414, -0.0015807151794433594, -0.0010688304901123047, -0.00055694580078125, -4.506111145019531e-05, 0.0004668235778808594, 0.000978708267211914, 0.0014905929565429688, 0.0020024776458740234, 0.002514362335205078, 0.003026247024536133, 0.0035381317138671875, 0.004050016403198242, 0.004561901092529297, 0.0050737857818603516, 0.005585670471191406, 0.006097555160522461, 0.006609439849853516, 0.00712132453918457, 0.007633209228515625, 0.00814509391784668, 0.008656978607177734, 0.009168863296508789, 0.009680747985839844, 0.010192632675170898, 0.010704517364501953, 0.011216402053833008, 0.011728286743164062, 0.012240171432495117, 0.012752056121826172, 0.013263940811157227, 0.013775825500488281, 0.014287710189819336, 0.01479959487915039, 0.015311479568481445, 0.0158233642578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 2.0, 8.0, 11.0, 13.0, 39.0, 126.0, 256.0, 303.0, 131.0, 47.0, 27.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015960693359375, -0.015298604965209961, -0.014636516571044922, -0.013974428176879883, -0.013312339782714844, -0.012650251388549805, -0.011988162994384766, -0.011326074600219727, -0.010663986206054688, -0.010001897811889648, -0.00933980941772461, -0.00867772102355957, -0.008015632629394531, -0.007353544235229492, -0.006691455841064453, -0.006029367446899414, -0.005367279052734375, -0.004705190658569336, -0.004043102264404297, -0.003381013870239258, -0.0027189254760742188, -0.0020568370819091797, -0.0013947486877441406, -0.0007326602935791016, -7.05718994140625e-05, 0.0005915164947509766, 0.0012536048889160156, 0.0019156932830810547, 0.0025777816772460938, 0.003239870071411133, 0.003901958465576172, 0.004564046859741211, 0.00522613525390625, 0.005888223648071289, 0.006550312042236328, 0.007212400436401367, 0.007874488830566406, 0.008536577224731445, 0.009198665618896484, 0.009860754013061523, 0.010522842407226562, 0.011184930801391602, 0.01184701919555664, 0.01250910758972168, 0.013171195983886719, 0.013833284378051758, 0.014495372772216797, 0.015157461166381836, 0.015819549560546875, 0.016481637954711914, 0.017143726348876953, 0.017805814743041992, 0.01846790313720703, 0.01912999153137207, 0.01979207992553711, 0.02045416831970215, 0.021116256713867188, 0.021778345108032227, 0.022440433502197266, 0.023102521896362305, 0.023764610290527344, 0.024426698684692383, 0.025088787078857422, 0.02575087547302246, 0.0264129638671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 43.0, 535.0, 388.0, 35.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.201520323753357, -1.180418610572815, -1.1593170166015625, -1.1382153034210205, -1.1171135902404785, -1.096011996269226, -1.074910283088684, -1.0538086891174316, -1.0327069759368896, -1.0116052627563477, -0.9905036091804504, -0.9694019556045532, -0.948300302028656, -0.9271986484527588, -0.9060969352722168, -0.8849952816963196, -0.8638936281204224, -0.8427919745445251, -0.8216902613639832, -0.8005886077880859, -0.7794869542121887, -0.7583853006362915, -0.7372835874557495, -0.7161819338798523, -0.6950802206993103, -0.6739785671234131, -0.6528768539428711, -0.6317752003669739, -0.6106735467910767, -0.5895718932151794, -0.5684701800346375, -0.5473685264587402, -0.5262669324874878, -0.5051652789115906, -0.48406359553337097, -0.46296191215515137, -0.44186025857925415, -0.42075857520103455, -0.39965689182281494, -0.3785552382469177, -0.35745352506637573, -0.33635184168815613, -0.3152501881122589, -0.2941485047340393, -0.2730468511581421, -0.2519451677799225, -0.23084349930286407, -0.20974183082580566, -0.18864017724990845, -0.16753850877285004, -0.14643684029579163, -0.12533515691757202, -0.10423349589109421, -0.0831318274140358, -0.06203015148639679, -0.04092848300933838, -0.019826814532279968, 0.0012748558074235916, 0.02237652614712715, 0.04347819834947586, 0.06457986682653427, 0.08568153530359268, 0.10678321123123169, 0.1278848797082901, 0.1489865481853485]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 12.0, 11.0, 17.0, 12.0, 16.0, 14.0, 20.0, 20.0, 24.0, 24.0, 37.0, 17.0, 37.0, 34.0, 39.0, 38.0, 39.0, 32.0, 43.0, 27.0, 45.0, 35.0, 30.0, 36.0, 24.0, 33.0, 32.0, 36.0, 19.0, 41.0, 17.0, 16.0, 10.0, 12.0, 14.0, 7.0, 13.0, 11.0, 9.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.07135003805160522, -0.06931910663843155, -0.06728818267583847, -0.0652572512626648, -0.06322632730007172, -0.06119539588689804, -0.059164464473724365, -0.05713353678584099, -0.05510260909795761, -0.053071681410074234, -0.05104075372219086, -0.04900982230901718, -0.046978894621133804, -0.04494796693325043, -0.04291703552007675, -0.040886107832193375, -0.03885518014431, -0.03682425245642662, -0.03479332476854324, -0.03276239335536957, -0.03073146566748619, -0.028700537979602814, -0.026669608429074287, -0.02463867887854576, -0.022607751190662384, -0.020576823502779007, -0.01854589395225048, -0.016514964401721954, -0.014484036713838577, -0.012453108094632626, -0.010422179475426674, -0.008391250856220722, -0.0063603222370147705, -0.004329393617808819, -0.002298464998602867, -0.00026753637939691544, 0.0017633922398090363, 0.003794320859014988, 0.00582524947822094, 0.007856178097426891, 0.009887106716632843, 0.011918035335838795, 0.013948963955044746, 0.015979893505573273, 0.01801082119345665, 0.020041748881340027, 0.022072678431868553, 0.02410360798239708, 0.026134535670280457, 0.028165463358163834, 0.03019639290869236, 0.032227322459220886, 0.03425825014710426, 0.03628917783498764, 0.038320109248161316, 0.04035103693604469, 0.04238196462392807, 0.04441289231181145, 0.046443819999694824, 0.0484747514128685, 0.05050567910075188, 0.052536606788635254, 0.05456753820180893, 0.056598465889692307, 0.058629393577575684]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 15.0, 19.0, 40.0, 87.0, 284.0, 595.0, 1410.0, 2187.0, 5635.0, 70659.0, 4062273.0, 43490.0, 4330.0, 1736.0, 644.0, 374.0, 289.0, 93.0, 39.0, 26.0, 17.0, 13.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05462646484375, -0.0529932975769043, -0.051360130310058594, -0.04972696304321289, -0.04809379577636719, -0.046460628509521484, -0.04482746124267578, -0.04319429397583008, -0.041561126708984375, -0.03992795944213867, -0.03829479217529297, -0.036661624908447266, -0.03502845764160156, -0.03339529037475586, -0.031762123107910156, -0.030128955841064453, -0.02849578857421875, -0.026862621307373047, -0.025229454040527344, -0.02359628677368164, -0.021963119506835938, -0.020329952239990234, -0.01869678497314453, -0.017063617706298828, -0.015430450439453125, -0.013797283172607422, -0.012164115905761719, -0.010530948638916016, -0.008897781372070312, -0.007264614105224609, -0.005631446838378906, -0.003998279571533203, -0.0023651123046875, -0.0007319450378417969, 0.0009012222290039062, 0.0025343894958496094, 0.0041675567626953125, 0.005800724029541016, 0.007433891296386719, 0.009067058563232422, 0.010700225830078125, 0.012333393096923828, 0.013966560363769531, 0.015599727630615234, 0.017232894897460938, 0.01886606216430664, 0.020499229431152344, 0.022132396697998047, 0.02376556396484375, 0.025398731231689453, 0.027031898498535156, 0.02866506576538086, 0.030298233032226562, 0.031931400299072266, 0.03356456756591797, 0.03519773483276367, 0.036830902099609375, 0.03846406936645508, 0.04009723663330078, 0.041730403900146484, 0.04336357116699219, 0.04499673843383789, 0.046629905700683594, 0.0482630729675293, 0.049896240234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 11.0, 55.0, 218.0, 368.0, 258.0, 76.0, 12.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.06295013427734375, -0.0609588623046875, -0.05896759033203125, -0.056976318359375, -0.05498504638671875, -0.0529937744140625, -0.05100250244140625, -0.04901123046875, -0.04701995849609375, -0.0450286865234375, -0.04303741455078125, -0.041046142578125, -0.03905487060546875, -0.0370635986328125, -0.03507232666015625, -0.0330810546875, -0.03108978271484375, -0.0290985107421875, -0.02710723876953125, -0.025115966796875, -0.02312469482421875, -0.0211334228515625, -0.01914215087890625, -0.01715087890625, -0.01515960693359375, -0.0131683349609375, -0.01117706298828125, -0.009185791015625, -0.00719451904296875, -0.0052032470703125, -0.00321197509765625, -0.001220703125, 0.00077056884765625, 0.0027618408203125, 0.00475311279296875, 0.006744384765625, 0.00873565673828125, 0.0107269287109375, 0.01271820068359375, 0.01470947265625, 0.01670074462890625, 0.0186920166015625, 0.02068328857421875, 0.022674560546875, 0.02466583251953125, 0.0266571044921875, 0.02864837646484375, 0.0306396484375, 0.03263092041015625, 0.0346221923828125, 0.03661346435546875, 0.038604736328125, 0.04059600830078125, 0.0425872802734375, 0.04457855224609375, 0.04656982421875, 0.04856109619140625, 0.0505523681640625, 0.05254364013671875, 0.054534912109375, 0.05652618408203125, 0.0585174560546875, 0.06050872802734375, 0.0625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 16.0, 13.0, 23.0, 48.0, 86.0, 161.0, 273.0, 617.0, 1278.0, 4048.0, 23801.0, 505604.0, 3585456.0, 61730.0, 7612.0, 1983.0, 767.0, 384.0, 184.0, 94.0, 57.0, 23.0, 15.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0262451171875, -0.025279998779296875, -0.02431488037109375, -0.023349761962890625, -0.0223846435546875, -0.021419525146484375, -0.02045440673828125, -0.019489288330078125, -0.018524169921875, -0.017559051513671875, -0.01659393310546875, -0.015628814697265625, -0.0146636962890625, -0.013698577880859375, -0.01273345947265625, -0.011768341064453125, -0.01080322265625, -0.009838104248046875, -0.00887298583984375, -0.007907867431640625, -0.0069427490234375, -0.005977630615234375, -0.00501251220703125, -0.004047393798828125, -0.003082275390625, -0.002117156982421875, -0.00115203857421875, -0.000186920166015625, 0.0007781982421875, 0.001743316650390625, 0.00270843505859375, 0.003673553466796875, 0.004638671875, 0.005603790283203125, 0.00656890869140625, 0.007534027099609375, 0.0084991455078125, 0.009464263916015625, 0.01042938232421875, 0.011394500732421875, 0.012359619140625, 0.013324737548828125, 0.01428985595703125, 0.015254974365234375, 0.0162200927734375, 0.017185211181640625, 0.01815032958984375, 0.019115447998046875, 0.02008056640625, 0.021045684814453125, 0.02201080322265625, 0.022975921630859375, 0.0239410400390625, 0.024906158447265625, 0.02587127685546875, 0.026836395263671875, 0.027801513671875, 0.028766632080078125, 0.02973175048828125, 0.030696868896484375, 0.0316619873046875, 0.032627105712890625, 0.03359222412109375, 0.034557342529296875, 0.0355224609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 7.0, 9.0, 18.0, 32.0, 50.0, 99.0, 262.0, 852.0, 1666.0, 610.0, 192.0, 105.0, 56.0, 40.0, 24.0, 18.0, 16.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.02491903305053711, -0.02423381805419922, -0.023548603057861328, -0.022863388061523438, -0.022178173065185547, -0.021492958068847656, -0.020807743072509766, -0.020122528076171875, -0.019437313079833984, -0.018752098083496094, -0.018066883087158203, -0.017381668090820312, -0.016696453094482422, -0.01601123809814453, -0.01532602310180664, -0.01464080810546875, -0.01395559310913086, -0.013270378112792969, -0.012585163116455078, -0.011899948120117188, -0.011214733123779297, -0.010529518127441406, -0.009844303131103516, -0.009159088134765625, -0.008473873138427734, -0.007788658142089844, -0.007103443145751953, -0.0064182281494140625, -0.005733013153076172, -0.005047798156738281, -0.004362583160400391, -0.0036773681640625, -0.0029921531677246094, -0.0023069381713867188, -0.0016217231750488281, -0.0009365081787109375, -0.0002512931823730469, 0.00043392181396484375, 0.0011191368103027344, 0.001804351806640625, 0.0024895668029785156, 0.0031747817993164062, 0.003859996795654297, 0.0045452117919921875, 0.005230426788330078, 0.005915641784667969, 0.006600856781005859, 0.00728607177734375, 0.00797128677368164, 0.008656501770019531, 0.009341716766357422, 0.010026931762695312, 0.010712146759033203, 0.011397361755371094, 0.012082576751708984, 0.012767791748046875, 0.013453006744384766, 0.014138221740722656, 0.014823436737060547, 0.015508651733398438, 0.016193866729736328, 0.01687908172607422, 0.01756429672241211, 0.01824951171875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 33.0, 93.0, 287.0, 359.0, 169.0, 44.0, 10.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.27695393562316895, -0.27163928747177124, -0.2663246691226959, -0.2610100507736206, -0.2556954026222229, -0.2503807544708252, -0.24506613612174988, -0.23975150287151337, -0.23443686962127686, -0.22912223637104034, -0.22380760312080383, -0.21849296987056732, -0.2131783366203308, -0.2078637033700943, -0.2025490701198578, -0.19723443686962128, -0.19191980361938477, -0.18660517036914825, -0.18129053711891174, -0.17597590386867523, -0.17066127061843872, -0.1653466373682022, -0.1600320041179657, -0.1547173708677292, -0.14940273761749268, -0.14408810436725616, -0.13877347111701965, -0.13345883786678314, -0.12814420461654663, -0.12282957136631012, -0.11751493811607361, -0.1122003048658371, -0.10688565671443939, -0.10157102346420288, -0.09625639021396637, -0.09094175696372986, -0.08562712371349335, -0.08031249046325684, -0.07499785721302032, -0.06968322396278381, -0.0643685907125473, -0.05905395746231079, -0.05373932421207428, -0.04842469096183777, -0.04311005771160126, -0.037795424461364746, -0.032480791211128235, -0.027166157960891724, -0.021851524710655212, -0.0165368914604187, -0.01122225821018219, -0.005907624959945679, -0.0005929917097091675, 0.004721641540527344, 0.010036274790763855, 0.015350908041000366, 0.020665541291236877, 0.02598017454147339, 0.0312948077917099, 0.03660944104194641, 0.04192407429218292, 0.047238707542419434, 0.052553340792655945, 0.057867974042892456, 0.06318260729312897]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 12.0, 9.0, 17.0, 17.0, 17.0, 18.0, 28.0, 28.0, 35.0, 27.0, 43.0, 50.0, 53.0, 58.0, 48.0, 37.0, 51.0, 54.0, 50.0, 46.0, 31.0, 40.0, 32.0, 22.0, 23.0, 23.0, 18.0, 14.0, 13.0, 19.0, 16.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.039634883403778076, -0.0384724959731102, -0.03731011226773262, -0.03614772856235504, -0.034985341131687164, -0.03382295370101929, -0.03266056999564171, -0.03149818629026413, -0.030335798859596252, -0.029173413291573524, -0.028011027723550797, -0.02684864215552807, -0.02568625658750534, -0.024523871019482613, -0.023361485451459885, -0.022199099883437157, -0.02103671431541443, -0.0198743287473917, -0.018711943179368973, -0.017549557611346245, -0.016387172043323517, -0.015224786475300789, -0.014062400907278061, -0.012900015339255333, -0.011737629771232605, -0.010575244203209877, -0.009412858635187149, -0.008250473067164421, -0.007088087499141693, -0.005925701931118965, -0.004763316363096237, -0.003600930795073509, -0.0024385452270507812, -0.0012761596590280533, -0.00011377409100532532, 0.0010486114770174026, 0.0022109970450401306, 0.0033733826130628586, 0.0045357681810855865, 0.0056981537491083145, 0.0068605393171310425, 0.00802292488515377, 0.009185310453176498, 0.010347696021199226, 0.011510081589221954, 0.012672467157244682, 0.01383485272526741, 0.014997238293290138, 0.016159623861312866, 0.017322009429335594, 0.018484394997358322, 0.01964678056538105, 0.020809166133403778, 0.021971551701426506, 0.023133937269449234, 0.024296322837471962, 0.02545870840549469, 0.026621093973517418, 0.027783479541540146, 0.028945865109562874, 0.030108250677585602, 0.03127063810825348, 0.03243302181363106, 0.033595405519008636, 0.034757792949676514]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 9.0, 8.0, 11.0, 18.0, 23.0, 22.0, 41.0, 44.0, 68.0, 85.0, 119.0, 158.0, 211.0, 290.0, 467.0, 717.0, 1588.0, 5080.0, 38605.0, 755027.0, 226631.0, 13481.0, 2774.0, 1116.0, 598.0, 387.0, 242.0, 192.0, 143.0, 93.0, 76.0, 44.0, 40.0, 33.0, 21.0, 21.0, 11.0, 12.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.042882442474365234, -0.04139232635498047, -0.0399022102355957, -0.03841209411621094, -0.03692197799682617, -0.035431861877441406, -0.03394174575805664, -0.032451629638671875, -0.03096151351928711, -0.029471397399902344, -0.027981281280517578, -0.026491165161132812, -0.025001049041748047, -0.02351093292236328, -0.022020816802978516, -0.02053070068359375, -0.019040584564208984, -0.01755046844482422, -0.016060352325439453, -0.014570236206054688, -0.013080120086669922, -0.011590003967285156, -0.01009988784790039, -0.008609771728515625, -0.007119655609130859, -0.005629539489746094, -0.004139423370361328, -0.0026493072509765625, -0.0011591911315917969, 0.00033092498779296875, 0.0018210411071777344, 0.0033111572265625, 0.004801273345947266, 0.006291389465332031, 0.007781505584716797, 0.009271621704101562, 0.010761737823486328, 0.012251853942871094, 0.01374197006225586, 0.015232086181640625, 0.01672220230102539, 0.018212318420410156, 0.019702434539794922, 0.021192550659179688, 0.022682666778564453, 0.02417278289794922, 0.025662899017333984, 0.02715301513671875, 0.028643131256103516, 0.03013324737548828, 0.03162336349487305, 0.03311347961425781, 0.03460359573364258, 0.036093711853027344, 0.03758382797241211, 0.039073944091796875, 0.04056406021118164, 0.042054176330566406, 0.04354429244995117, 0.04503440856933594, 0.0465245246887207, 0.04801464080810547, 0.049504756927490234, 0.050994873046875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 52.0, 213.0, 384.0, 249.0, 84.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06561708450317383, -0.06360721588134766, -0.061597347259521484, -0.05958747863769531, -0.05757761001586914, -0.05556774139404297, -0.0535578727722168, -0.051548004150390625, -0.04953813552856445, -0.04752826690673828, -0.04551839828491211, -0.04350852966308594, -0.041498661041259766, -0.039488792419433594, -0.03747892379760742, -0.03546905517578125, -0.03345918655395508, -0.031449317932128906, -0.029439449310302734, -0.027429580688476562, -0.02541971206665039, -0.02340984344482422, -0.021399974822998047, -0.019390106201171875, -0.017380237579345703, -0.015370368957519531, -0.01336050033569336, -0.011350631713867188, -0.009340763092041016, -0.007330894470214844, -0.005321025848388672, -0.0033111572265625, -0.0013012886047363281, 0.0007085800170898438, 0.0027184486389160156, 0.0047283172607421875, 0.006738185882568359, 0.008748054504394531, 0.010757923126220703, 0.012767791748046875, 0.014777660369873047, 0.01678752899169922, 0.01879739761352539, 0.020807266235351562, 0.022817134857177734, 0.024827003479003906, 0.026836872100830078, 0.02884674072265625, 0.030856609344482422, 0.032866477966308594, 0.034876346588134766, 0.03688621520996094, 0.03889608383178711, 0.04090595245361328, 0.04291582107543945, 0.044925689697265625, 0.0469355583190918, 0.04894542694091797, 0.05095529556274414, 0.05296516418457031, 0.054975032806396484, 0.056984901428222656, 0.05899477005004883, 0.061004638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 23.0, 20.0, 35.0, 74.0, 115.0, 171.0, 438.0, 1156.0, 4178.0, 23721.0, 387281.0, 589031.0, 34480.0, 5393.0, 1431.0, 495.0, 220.0, 107.0, 49.0, 35.0, 27.0, 23.0, 7.0, 4.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.03630495071411133, -0.035012245178222656, -0.033719539642333984, -0.03242683410644531, -0.03113412857055664, -0.02984142303466797, -0.028548717498779297, -0.027256011962890625, -0.025963306427001953, -0.02467060089111328, -0.02337789535522461, -0.022085189819335938, -0.020792484283447266, -0.019499778747558594, -0.018207073211669922, -0.01691436767578125, -0.015621662139892578, -0.014328956604003906, -0.013036251068115234, -0.011743545532226562, -0.01045083999633789, -0.009158134460449219, -0.007865428924560547, -0.006572723388671875, -0.005280017852783203, -0.003987312316894531, -0.0026946067810058594, -0.0014019012451171875, -0.00010919570922851562, 0.0011835098266601562, 0.002476215362548828, 0.0037689208984375, 0.005061626434326172, 0.006354331970214844, 0.007647037506103516, 0.008939743041992188, 0.01023244857788086, 0.011525154113769531, 0.012817859649658203, 0.014110565185546875, 0.015403270721435547, 0.01669597625732422, 0.01798868179321289, 0.019281387329101562, 0.020574092864990234, 0.021866798400878906, 0.023159503936767578, 0.02445220947265625, 0.025744915008544922, 0.027037620544433594, 0.028330326080322266, 0.029623031616210938, 0.03091573715209961, 0.03220844268798828, 0.03350114822387695, 0.034793853759765625, 0.0360865592956543, 0.03737926483154297, 0.03867197036743164, 0.03996467590332031, 0.041257381439208984, 0.042550086975097656, 0.04384279251098633, 0.045135498046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 9.0, 20.0, 30.0, 42.0, 41.0, 61.0, 56.0, 80.0, 78.0, 105.0, 87.0, 75.0, 54.0, 47.0, 50.0, 43.0, 31.0, 23.0, 11.0, 15.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04168701171875, -0.04027509689331055, -0.038863182067871094, -0.03745126724243164, -0.03603935241699219, -0.034627437591552734, -0.03321552276611328, -0.03180360794067383, -0.030391693115234375, -0.028979778289794922, -0.02756786346435547, -0.026155948638916016, -0.024744033813476562, -0.02333211898803711, -0.021920204162597656, -0.020508289337158203, -0.01909637451171875, -0.017684459686279297, -0.016272544860839844, -0.01486063003540039, -0.013448715209960938, -0.012036800384521484, -0.010624885559082031, -0.009212970733642578, -0.007801055908203125, -0.006389141082763672, -0.004977226257324219, -0.0035653114318847656, -0.0021533966064453125, -0.0007414817810058594, 0.0006704330444335938, 0.002082347869873047, 0.0034942626953125, 0.004906177520751953, 0.006318092346191406, 0.007730007171630859, 0.009141921997070312, 0.010553836822509766, 0.011965751647949219, 0.013377666473388672, 0.014789581298828125, 0.016201496124267578, 0.01761341094970703, 0.019025325775146484, 0.020437240600585938, 0.02184915542602539, 0.023261070251464844, 0.024672985076904297, 0.02608489990234375, 0.027496814727783203, 0.028908729553222656, 0.03032064437866211, 0.03173255920410156, 0.033144474029541016, 0.03455638885498047, 0.03596830368041992, 0.037380218505859375, 0.03879213333129883, 0.04020404815673828, 0.041615962982177734, 0.04302787780761719, 0.04443979263305664, 0.045851707458496094, 0.04726362228393555, 0.048675537109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 14.0, 27.0, 38.0, 78.0, 138.0, 285.0, 554.0, 1130.0, 2306.0, 4782.0, 11319.0, 29560.0, 118379.0, 640462.0, 178037.0, 37075.0, 13539.0, 5732.0, 2522.0, 1236.0, 641.0, 304.0, 166.0, 93.0, 45.0, 38.0, 16.0, 16.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01053619384765625, -0.010202765464782715, -0.00986933708190918, -0.009535908699035645, -0.00920248031616211, -0.008869051933288574, -0.008535623550415039, -0.008202195167541504, -0.007868766784667969, -0.007535338401794434, -0.0072019100189208984, -0.006868481636047363, -0.006535053253173828, -0.006201624870300293, -0.005868196487426758, -0.005534768104553223, -0.0052013397216796875, -0.004867911338806152, -0.004534482955932617, -0.004201054573059082, -0.003867626190185547, -0.0035341978073120117, -0.0032007694244384766, -0.0028673410415649414, -0.0025339126586914062, -0.002200484275817871, -0.001867055892944336, -0.0015336275100708008, -0.0012001991271972656, -0.0008667707443237305, -0.0005333423614501953, -0.00019991397857666016, 0.000133514404296875, 0.00046694278717041016, 0.0008003711700439453, 0.0011337995529174805, 0.0014672279357910156, 0.0018006563186645508, 0.002134084701538086, 0.002467513084411621, 0.0028009414672851562, 0.0031343698501586914, 0.0034677982330322266, 0.0038012266159057617, 0.004134654998779297, 0.004468083381652832, 0.004801511764526367, 0.005134940147399902, 0.0054683685302734375, 0.005801796913146973, 0.006135225296020508, 0.006468653678894043, 0.006802082061767578, 0.007135510444641113, 0.0074689388275146484, 0.007802367210388184, 0.008135795593261719, 0.008469223976135254, 0.008802652359008789, 0.009136080741882324, 0.00946950912475586, 0.009802937507629395, 0.01013636589050293, 0.010469794273376465, 0.01080322265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 7.0, 7.0, 8.0, 9.0, 16.0, 23.0, 25.0, 28.0, 42.0, 57.0, 61.0, 92.0, 116.0, 101.0, 90.0, 82.0, 62.0, 41.0, 34.0, 22.0, 16.0, 17.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.00010138750076293945, -9.87071543931961e-05, -9.602680802345276e-05, -9.334646165370941e-05, -9.066611528396606e-05, -8.798576891422272e-05, -8.530542254447937e-05, -8.262507617473602e-05, -7.994472980499268e-05, -7.726438343524933e-05, -7.458403706550598e-05, -7.190369069576263e-05, -6.922334432601929e-05, -6.654299795627594e-05, -6.386265158653259e-05, -6.118230521678925e-05, -5.85019588470459e-05, -5.582161247730255e-05, -5.3141266107559204e-05, -5.046091973781586e-05, -4.778057336807251e-05, -4.510022699832916e-05, -4.2419880628585815e-05, -3.973953425884247e-05, -3.705918788909912e-05, -3.4378841519355774e-05, -3.169849514961243e-05, -2.901814877986908e-05, -2.6337802410125732e-05, -2.3657456040382385e-05, -2.0977109670639038e-05, -1.829676330089569e-05, -1.5616416931152344e-05, -1.2936070561408997e-05, -1.025572419166565e-05, -7.575377821922302e-06, -4.895031452178955e-06, -2.214685082435608e-06, 4.6566128730773926e-07, 3.1460076570510864e-06, 5.826354026794434e-06, 8.50670039653778e-06, 1.1187046766281128e-05, 1.3867393136024475e-05, 1.6547739505767822e-05, 1.922808587551117e-05, 2.1908432245254517e-05, 2.4588778614997864e-05, 2.726912498474121e-05, 2.9949471354484558e-05, 3.2629817724227905e-05, 3.531016409397125e-05, 3.79905104637146e-05, 4.067085683345795e-05, 4.3351203203201294e-05, 4.603154957294464e-05, 4.871189594268799e-05, 5.1392242312431335e-05, 5.407258868217468e-05, 5.675293505191803e-05, 5.943328142166138e-05, 6.211362779140472e-05, 6.479397416114807e-05, 6.747432053089142e-05, 7.015466690063477e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 10.0, 15.0, 29.0, 25.0, 35.0, 61.0, 102.0, 190.0, 316.0, 595.0, 1166.0, 2391.0, 5057.0, 11807.0, 32428.0, 130707.0, 632423.0, 168987.0, 37593.0, 13426.0, 5602.0, 2620.0, 1287.0, 713.0, 350.0, 236.0, 120.0, 76.0, 38.0, 31.0, 25.0, 17.0, 10.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01085662841796875, -0.010512709617614746, -0.010168790817260742, -0.009824872016906738, -0.009480953216552734, -0.00913703441619873, -0.008793115615844727, -0.008449196815490723, -0.008105278015136719, -0.007761359214782715, -0.007417440414428711, -0.007073521614074707, -0.006729602813720703, -0.006385684013366699, -0.006041765213012695, -0.005697846412658691, -0.0053539276123046875, -0.005010008811950684, -0.00466609001159668, -0.004322171211242676, -0.003978252410888672, -0.003634333610534668, -0.003290414810180664, -0.00294649600982666, -0.0026025772094726562, -0.0022586584091186523, -0.0019147396087646484, -0.0015708208084106445, -0.0012269020080566406, -0.0008829832077026367, -0.0005390644073486328, -0.0001951456069946289, 0.000148773193359375, 0.0004926919937133789, 0.0008366107940673828, 0.0011805295944213867, 0.0015244483947753906, 0.0018683671951293945, 0.0022122859954833984, 0.0025562047958374023, 0.0029001235961914062, 0.00324404239654541, 0.003587961196899414, 0.003931879997253418, 0.004275798797607422, 0.004619717597961426, 0.00496363639831543, 0.005307555198669434, 0.0056514739990234375, 0.005995392799377441, 0.006339311599731445, 0.006683230400085449, 0.007027149200439453, 0.007371068000793457, 0.007714986801147461, 0.008058905601501465, 0.008402824401855469, 0.008746743202209473, 0.009090662002563477, 0.00943458080291748, 0.009778499603271484, 0.010122418403625488, 0.010466337203979492, 0.010810256004333496, 0.0111541748046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 9.0, 1.0, 3.0, 11.0, 9.0, 6.0, 13.0, 23.0, 22.0, 40.0, 85.0, 110.0, 166.0, 171.0, 111.0, 82.0, 38.0, 16.0, 13.0, 10.0, 15.0, 11.0, 8.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01230621337890625, -0.011908650398254395, -0.011511087417602539, -0.011113524436950684, -0.010715961456298828, -0.010318398475646973, -0.009920835494995117, -0.009523272514343262, -0.009125709533691406, -0.00872814655303955, -0.008330583572387695, -0.00793302059173584, -0.007535457611083984, -0.007137894630432129, -0.0067403316497802734, -0.006342768669128418, -0.0059452056884765625, -0.005547642707824707, -0.0051500797271728516, -0.004752516746520996, -0.004354953765869141, -0.003957390785217285, -0.0035598278045654297, -0.0031622648239135742, -0.0027647018432617188, -0.0023671388626098633, -0.001969575881958008, -0.0015720129013061523, -0.0011744499206542969, -0.0007768869400024414, -0.00037932395935058594, 1.823902130126953e-05, 0.000415802001953125, 0.0008133649826049805, 0.001210927963256836, 0.0016084909439086914, 0.002006053924560547, 0.0024036169052124023, 0.002801179885864258, 0.0031987428665161133, 0.0035963058471679688, 0.003993868827819824, 0.00439143180847168, 0.004788994789123535, 0.005186557769775391, 0.005584120750427246, 0.0059816837310791016, 0.006379246711730957, 0.0067768096923828125, 0.007174372673034668, 0.0075719356536865234, 0.007969498634338379, 0.008367061614990234, 0.00876462459564209, 0.009162187576293945, 0.0095597505569458, 0.009957313537597656, 0.010354876518249512, 0.010752439498901367, 0.011150002479553223, 0.011547565460205078, 0.011945128440856934, 0.012342691421508789, 0.012740254402160645, 0.0131378173828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 42.0, 245.0, 544.0, 155.0, 13.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.746342658996582, -0.7326202392578125, -0.7188977599143982, -0.7051753401756287, -0.6914528608322144, -0.6777304410934448, -0.6640080213546753, -0.650285542011261, -0.6365631222724915, -0.6228407025337219, -0.6091182231903076, -0.5953958034515381, -0.5816733241081238, -0.5679509043693542, -0.5542284250259399, -0.5405060052871704, -0.5267835259437561, -0.5130611062049866, -0.49933862686157227, -0.48561620712280273, -0.4718937575817108, -0.4581713080406189, -0.444448858499527, -0.43072640895843506, -0.4170039892196655, -0.4032815396785736, -0.3895590901374817, -0.37583667039871216, -0.36211422085762024, -0.3483917713165283, -0.3346693217754364, -0.3209468722343445, -0.30722442269325256, -0.29350197315216064, -0.2797795236110687, -0.2660570740699768, -0.2523346543312073, -0.23861220479011536, -0.22488975524902344, -0.21116730570793152, -0.1974448561668396, -0.18372240662574768, -0.16999997198581696, -0.15627752244472504, -0.14255507290363312, -0.1288326382637024, -0.11511018872261047, -0.10138773918151855, -0.08766530454158783, -0.07394286245107651, -0.06022041290998459, -0.04649797081947327, -0.032775525003671646, -0.019053079187870026, -0.005330637097358704, 0.008391812443733215, 0.022114254534244537, 0.03583670035004616, 0.04955914616584778, 0.0632815882563591, 0.07700403034687042, 0.09072647988796234, 0.10444892197847366, 0.11817137151956558, 0.1318938136100769]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 6.0, 5.0, 7.0, 13.0, 13.0, 16.0, 14.0, 24.0, 28.0, 27.0, 39.0, 32.0, 36.0, 32.0, 42.0, 44.0, 35.0, 44.0, 47.0, 38.0, 40.0, 30.0, 39.0, 49.0, 38.0, 40.0, 34.0, 34.0, 30.0, 15.0, 21.0, 12.0, 14.0, 10.0, 13.0, 14.0, 4.0, 5.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07883483171463013, -0.07657977193593979, -0.07432471960783005, -0.07206965982913971, -0.06981460750102997, -0.06755954772233963, -0.06530448794364929, -0.06304943561553955, -0.06079437583684921, -0.05853931978344917, -0.05628426373004913, -0.054029203951358795, -0.051774147897958755, -0.049519091844558716, -0.04726403206586838, -0.04500897601246834, -0.0427539199590683, -0.04049886390566826, -0.03824380785226822, -0.03598874807357788, -0.03373369202017784, -0.0314786359667778, -0.029223578050732613, -0.026968520134687424, -0.024713464081287384, -0.022458408027887344, -0.020203350111842155, -0.017948292195796967, -0.015693236142396927, -0.013438179157674313, -0.011183122172951698, -0.00892806425690651, -0.00667300820350647, -0.0044179512187838554, -0.002162894234061241, 9.216275066137314e-05, 0.0023472197353839874, 0.004602276720106602, 0.006857333704829216, 0.009112391620874405, 0.011367447674274445, 0.013622504658997059, 0.015877561643719673, 0.018132619559764862, 0.0203876756131649, 0.02264273166656494, 0.02489778958261013, 0.02715284749865532, 0.02940790355205536, 0.0316629596054554, 0.03391801565885544, 0.036173075437545776, 0.038428131490945816, 0.040683187544345856, 0.042938247323036194, 0.045193303376436234, 0.04744835942983627, 0.04970341548323631, 0.05195847153663635, 0.05421353131532669, 0.05646858736872673, 0.05872364342212677, 0.06097870320081711, 0.06323376297950745, 0.06548881530761719]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 17.0, 129.0, 2586.0, 4123480.0, 66885.0, 1019.0, 115.0, 35.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.21615219116210938, -0.20977020263671875, -0.20338821411132812, -0.1970062255859375, -0.19062423706054688, -0.18424224853515625, -0.17786026000976562, -0.171478271484375, -0.16509628295898438, -0.15871429443359375, -0.15233230590820312, -0.1459503173828125, -0.13956832885742188, -0.13318634033203125, -0.12680435180664062, -0.12042236328125, -0.11404037475585938, -0.10765838623046875, -0.10127639770507812, -0.0948944091796875, -0.08851242065429688, -0.08213043212890625, -0.07574844360351562, -0.069366455078125, -0.06298446655273438, -0.05660247802734375, -0.050220489501953125, -0.0438385009765625, -0.037456512451171875, -0.03107452392578125, -0.024692535400390625, -0.018310546875, -0.011928558349609375, -0.00554656982421875, 0.000835418701171875, 0.0072174072265625, 0.013599395751953125, 0.01998138427734375, 0.026363372802734375, 0.032745361328125, 0.039127349853515625, 0.04550933837890625, 0.051891326904296875, 0.0582733154296875, 0.06465530395507812, 0.07103729248046875, 0.07741928100585938, 0.08380126953125, 0.09018325805664062, 0.09656524658203125, 0.10294723510742188, 0.1093292236328125, 0.11571121215820312, 0.12209320068359375, 0.12847518920898438, 0.134857177734375, 0.14123916625976562, 0.14762115478515625, 0.15400314331054688, 0.1603851318359375, 0.16676712036132812, 0.17314910888671875, 0.17953109741210938, 0.1859130859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 29.0, 141.0, 322.0, 331.0, 134.0, 38.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.06380558013916016, -0.06181526184082031, -0.05982494354248047, -0.057834625244140625, -0.05584430694580078, -0.05385398864746094, -0.051863670349121094, -0.04987335205078125, -0.047883033752441406, -0.04589271545410156, -0.04390239715576172, -0.041912078857421875, -0.03992176055908203, -0.03793144226074219, -0.035941123962402344, -0.0339508056640625, -0.031960487365722656, -0.029970169067382812, -0.02797985076904297, -0.025989532470703125, -0.02399921417236328, -0.022008895874023438, -0.020018577575683594, -0.01802825927734375, -0.016037940979003906, -0.014047622680664062, -0.012057304382324219, -0.010066986083984375, -0.008076667785644531, -0.0060863494873046875, -0.004096031188964844, -0.002105712890625, -0.00011539459228515625, 0.0018749237060546875, 0.0038652420043945312, 0.005855560302734375, 0.007845878601074219, 0.009836196899414062, 0.011826515197753906, 0.01381683349609375, 0.015807151794433594, 0.017797470092773438, 0.01978778839111328, 0.021778106689453125, 0.02376842498779297, 0.025758743286132812, 0.027749061584472656, 0.0297393798828125, 0.031729698181152344, 0.03372001647949219, 0.03571033477783203, 0.037700653076171875, 0.03969097137451172, 0.04168128967285156, 0.043671607971191406, 0.04566192626953125, 0.047652244567871094, 0.04964256286621094, 0.05163288116455078, 0.053623199462890625, 0.05561351776123047, 0.05760383605957031, 0.059594154357910156, 0.06158447265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 12.0, 26.0, 55.0, 118.0, 232.0, 491.0, 1233.0, 3629.0, 15419.0, 118325.0, 3696042.0, 321726.0, 28100.0, 5864.0, 1777.0, 675.0, 312.0, 123.0, 66.0, 28.0, 15.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218963623046875, -0.021008729934692383, -0.020121097564697266, -0.01923346519470215, -0.01834583282470703, -0.017458200454711914, -0.016570568084716797, -0.01568293571472168, -0.014795303344726562, -0.013907670974731445, -0.013020038604736328, -0.012132406234741211, -0.011244773864746094, -0.010357141494750977, -0.00946950912475586, -0.008581876754760742, -0.007694244384765625, -0.006806612014770508, -0.005918979644775391, -0.0050313472747802734, -0.004143714904785156, -0.003256082534790039, -0.002368450164794922, -0.0014808177947998047, -0.0005931854248046875, 0.0002944469451904297, 0.0011820793151855469, 0.002069711685180664, 0.0029573440551757812, 0.0038449764251708984, 0.004732608795166016, 0.005620241165161133, 0.00650787353515625, 0.007395505905151367, 0.008283138275146484, 0.009170770645141602, 0.010058403015136719, 0.010946035385131836, 0.011833667755126953, 0.01272130012512207, 0.013608932495117188, 0.014496564865112305, 0.015384197235107422, 0.01627182960510254, 0.017159461975097656, 0.018047094345092773, 0.01893472671508789, 0.019822359085083008, 0.020709991455078125, 0.021597623825073242, 0.02248525619506836, 0.023372888565063477, 0.024260520935058594, 0.02514815330505371, 0.026035785675048828, 0.026923418045043945, 0.027811050415039062, 0.02869868278503418, 0.029586315155029297, 0.030473947525024414, 0.03136157989501953, 0.03224921226501465, 0.033136844635009766, 0.03402447700500488, 0.034912109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 15.0, 28.0, 31.0, 60.0, 126.0, 231.0, 663.0, 1587.0, 763.0, 247.0, 116.0, 74.0, 42.0, 23.0, 22.0, 11.0, 10.0, 0.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.0220181941986084, -0.021361827850341797, -0.020705461502075195, -0.020049095153808594, -0.019392728805541992, -0.01873636245727539, -0.01807999610900879, -0.017423629760742188, -0.016767263412475586, -0.016110897064208984, -0.015454530715942383, -0.014798164367675781, -0.01414179801940918, -0.013485431671142578, -0.012829065322875977, -0.012172698974609375, -0.011516332626342773, -0.010859966278076172, -0.01020359992980957, -0.009547233581542969, -0.008890867233276367, -0.008234500885009766, -0.007578134536743164, -0.0069217681884765625, -0.006265401840209961, -0.005609035491943359, -0.004952669143676758, -0.004296302795410156, -0.0036399364471435547, -0.002983570098876953, -0.0023272037506103516, -0.00167083740234375, -0.0010144710540771484, -0.0003581047058105469, 0.0002982616424560547, 0.0009546279907226562, 0.0016109943389892578, 0.0022673606872558594, 0.002923727035522461, 0.0035800933837890625, 0.004236459732055664, 0.004892826080322266, 0.005549192428588867, 0.006205558776855469, 0.00686192512512207, 0.007518291473388672, 0.008174657821655273, 0.008831024169921875, 0.009487390518188477, 0.010143756866455078, 0.01080012321472168, 0.011456489562988281, 0.012112855911254883, 0.012769222259521484, 0.013425588607788086, 0.014081954956054688, 0.014738321304321289, 0.01539468765258789, 0.016051054000854492, 0.016707420349121094, 0.017363786697387695, 0.018020153045654297, 0.0186765193939209, 0.0193328857421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 32.0, 112.0, 236.0, 297.0, 196.0, 79.0, 23.0, 17.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.25808337330818176, -0.2533353567123413, -0.24858734011650085, -0.2438393384218216, -0.23909132182598114, -0.23434330523014069, -0.22959528863430023, -0.22484728693962097, -0.22009927034378052, -0.21535125374794006, -0.2106032371520996, -0.20585523545742035, -0.2011072188615799, -0.19635920226573944, -0.191611185669899, -0.18686318397521973, -0.18211516737937927, -0.17736715078353882, -0.17261913418769836, -0.1678711324930191, -0.16312311589717865, -0.1583750993013382, -0.15362708270549774, -0.14887908101081848, -0.14413104951381683, -0.13938303291797638, -0.13463501632213593, -0.12988701462745667, -0.1251389980316162, -0.12039098143577576, -0.1156429648399353, -0.11089495569467545, -0.10614694654941559, -0.10139892995357513, -0.09665092080831528, -0.09190290421247482, -0.08715489506721497, -0.08240687847137451, -0.07765886187553406, -0.0729108527302742, -0.06816283613443375, -0.06341481953859329, -0.058666810393333435, -0.05391879379749298, -0.049170784652233124, -0.04442276805639267, -0.039674755185842514, -0.03492674231529236, -0.030178729444742203, -0.025430716574192047, -0.02068270370364189, -0.015934688970446587, -0.011186676099896431, -0.006438663229346275, -0.0016906484961509705, 0.003057364374399185, 0.007805377244949341, 0.012553390115499496, 0.017301402986049652, 0.022049417719244957, 0.026797430589795113, 0.03154544532299042, 0.03629345819354057, 0.04104147106409073, 0.045789483934640884]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 2.0, 9.0, 16.0, 5.0, 12.0, 13.0, 23.0, 25.0, 29.0, 22.0, 41.0, 43.0, 37.0, 40.0, 40.0, 49.0, 35.0, 41.0, 51.0, 41.0, 43.0, 52.0, 34.0, 36.0, 37.0, 29.0, 23.0, 35.0, 21.0, 20.0, 15.0, 18.0, 8.0, 8.0, 10.0, 11.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.044088900089263916, -0.042980991303920746, -0.04187307879328728, -0.04076516628265381, -0.03965725749731064, -0.03854934871196747, -0.037441436201334, -0.03633352369070053, -0.03522561490535736, -0.03411770612001419, -0.03300979360938072, -0.03190188109874725, -0.030793972313404083, -0.029686061665415764, -0.028578151017427444, -0.027470240369439125, -0.026362329721450806, -0.025254419073462486, -0.024146508425474167, -0.023038597777485847, -0.021930687129497528, -0.02082277648150921, -0.01971486583352089, -0.01860695518553257, -0.01749904453754425, -0.01639113388955593, -0.015283223241567612, -0.014175312593579292, -0.013067401945590973, -0.011959491297602654, -0.010851580649614334, -0.009743670001626015, -0.008635759353637695, -0.007527848705649376, -0.0064199380576610565, -0.005312027409672737, -0.004204116761684418, -0.0030962061136960983, -0.001988295465707779, -0.0008803848177194595, 0.00022752583026885986, 0.0013354364782571793, 0.0024433471262454987, 0.003551257774233818, 0.0046591684222221375, 0.005767079070210457, 0.006874989718198776, 0.007982900366187096, 0.009090811014175415, 0.010198721662163734, 0.011306632310152054, 0.012414542958140373, 0.013522453606128693, 0.014630364254117012, 0.01573827490210533, 0.01684618555009365, 0.01795409619808197, 0.01906200684607029, 0.02016991749405861, 0.02127782814204693, 0.022385738790035248, 0.023493649438023567, 0.024601560086011887, 0.025709470734000206, 0.026817381381988525]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 17.0, 11.0, 18.0, 19.0, 25.0, 50.0, 64.0, 95.0, 139.0, 173.0, 269.0, 418.0, 706.0, 1516.0, 7021.0, 162296.0, 840550.0, 29468.0, 3141.0, 915.0, 516.0, 309.0, 254.0, 167.0, 115.0, 80.0, 64.0, 47.0, 25.0, 16.0, 15.0, 11.0, 5.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06062173843383789, -0.05874347686767578, -0.05686521530151367, -0.05498695373535156, -0.05310869216918945, -0.051230430603027344, -0.049352169036865234, -0.047473907470703125, -0.045595645904541016, -0.043717384338378906, -0.0418391227722168, -0.03996086120605469, -0.03808259963989258, -0.03620433807373047, -0.03432607650756836, -0.03244781494140625, -0.03056955337524414, -0.02869129180908203, -0.026813030242919922, -0.024934768676757812, -0.023056507110595703, -0.021178245544433594, -0.019299983978271484, -0.017421722412109375, -0.015543460845947266, -0.013665199279785156, -0.011786937713623047, -0.009908676147460938, -0.008030414581298828, -0.006152153015136719, -0.004273891448974609, -0.0023956298828125, -0.0005173683166503906, 0.0013608932495117188, 0.003239154815673828, 0.0051174163818359375, 0.006995677947998047, 0.008873939514160156, 0.010752201080322266, 0.012630462646484375, 0.014508724212646484, 0.016386985778808594, 0.018265247344970703, 0.020143508911132812, 0.022021770477294922, 0.02390003204345703, 0.02577829360961914, 0.02765655517578125, 0.02953481674194336, 0.03141307830810547, 0.03329133987426758, 0.03516960144042969, 0.0370478630065918, 0.038926124572753906, 0.040804386138916016, 0.042682647705078125, 0.044560909271240234, 0.046439170837402344, 0.04831743240356445, 0.05019569396972656, 0.05207395553588867, 0.05395221710205078, 0.05583047866821289, 0.057708740234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 28.0, 144.0, 334.0, 337.0, 127.0, 24.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06557750701904297, -0.06352806091308594, -0.061478614807128906, -0.059429168701171875, -0.057379722595214844, -0.05533027648925781, -0.05328083038330078, -0.05123138427734375, -0.04918193817138672, -0.04713249206542969, -0.045083045959472656, -0.043033599853515625, -0.040984153747558594, -0.03893470764160156, -0.03688526153564453, -0.0348358154296875, -0.03278636932373047, -0.030736923217773438, -0.028687477111816406, -0.026638031005859375, -0.024588584899902344, -0.022539138793945312, -0.02048969268798828, -0.01844024658203125, -0.01639080047607422, -0.014341354370117188, -0.012291908264160156, -0.010242462158203125, -0.008193016052246094, -0.0061435699462890625, -0.004094123840332031, -0.002044677734375, 4.76837158203125e-06, 0.0020542144775390625, 0.004103660583496094, 0.006153106689453125, 0.008202552795410156, 0.010251998901367188, 0.012301445007324219, 0.01435089111328125, 0.01640033721923828, 0.018449783325195312, 0.020499229431152344, 0.022548675537109375, 0.024598121643066406, 0.026647567749023438, 0.02869701385498047, 0.0307464599609375, 0.03279590606689453, 0.03484535217285156, 0.036894798278808594, 0.038944244384765625, 0.040993690490722656, 0.04304313659667969, 0.04509258270263672, 0.04714202880859375, 0.04919147491455078, 0.05124092102050781, 0.053290367126464844, 0.055339813232421875, 0.057389259338378906, 0.05943870544433594, 0.06148815155029297, 0.06353759765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 7.0, 15.0, 18.0, 23.0, 24.0, 29.0, 50.0, 46.0, 90.0, 154.0, 295.0, 735.0, 2027.0, 7146.0, 37344.0, 283719.0, 585225.0, 109198.0, 16288.0, 3813.0, 1209.0, 468.0, 213.0, 121.0, 68.0, 55.0, 34.0, 27.0, 26.0, 15.0, 18.0, 6.0, 4.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030242919921875, -0.029333829879760742, -0.028424739837646484, -0.027515649795532227, -0.02660655975341797, -0.02569746971130371, -0.024788379669189453, -0.023879289627075195, -0.022970199584960938, -0.02206110954284668, -0.021152019500732422, -0.020242929458618164, -0.019333839416503906, -0.01842474937438965, -0.01751565933227539, -0.016606569290161133, -0.015697479248046875, -0.014788389205932617, -0.01387929916381836, -0.012970209121704102, -0.012061119079589844, -0.011152029037475586, -0.010242938995361328, -0.00933384895324707, -0.008424758911132812, -0.007515668869018555, -0.006606578826904297, -0.005697488784790039, -0.004788398742675781, -0.0038793087005615234, -0.0029702186584472656, -0.002061128616333008, -0.00115203857421875, -0.0002429485321044922, 0.0006661415100097656, 0.0015752315521240234, 0.0024843215942382812, 0.003393411636352539, 0.004302501678466797, 0.005211591720581055, 0.0061206817626953125, 0.00702977180480957, 0.007938861846923828, 0.008847951889038086, 0.009757041931152344, 0.010666131973266602, 0.01157522201538086, 0.012484312057495117, 0.013393402099609375, 0.014302492141723633, 0.01521158218383789, 0.01612067222595215, 0.017029762268066406, 0.017938852310180664, 0.018847942352294922, 0.01975703239440918, 0.020666122436523438, 0.021575212478637695, 0.022484302520751953, 0.02339339256286621, 0.02430248260498047, 0.025211572647094727, 0.026120662689208984, 0.027029752731323242, 0.0279388427734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 11.0, 12.0, 9.0, 18.0, 20.0, 24.0, 29.0, 33.0, 39.0, 42.0, 47.0, 41.0, 47.0, 41.0, 29.0, 46.0, 54.0, 44.0, 43.0, 36.0, 44.0, 35.0, 38.0, 31.0, 19.0, 27.0, 27.0, 21.0, 17.0, 8.0, 12.0, 8.0, 9.0, 7.0, 2.0, 5.0, 4.0, 7.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0276947021484375, -0.0268709659576416, -0.026047229766845703, -0.025223493576049805, -0.024399757385253906, -0.023576021194458008, -0.02275228500366211, -0.02192854881286621, -0.021104812622070312, -0.020281076431274414, -0.019457340240478516, -0.018633604049682617, -0.01780986785888672, -0.01698613166809082, -0.016162395477294922, -0.015338659286499023, -0.014514923095703125, -0.013691186904907227, -0.012867450714111328, -0.01204371452331543, -0.011219978332519531, -0.010396242141723633, -0.009572505950927734, -0.008748769760131836, -0.007925033569335938, -0.007101297378540039, -0.006277561187744141, -0.005453824996948242, -0.004630088806152344, -0.0038063526153564453, -0.002982616424560547, -0.0021588802337646484, -0.00133514404296875, -0.0005114078521728516, 0.0003123283386230469, 0.0011360645294189453, 0.0019598007202148438, 0.002783536911010742, 0.0036072731018066406, 0.004431009292602539, 0.0052547454833984375, 0.006078481674194336, 0.006902217864990234, 0.007725954055786133, 0.008549690246582031, 0.00937342643737793, 0.010197162628173828, 0.011020898818969727, 0.011844635009765625, 0.012668371200561523, 0.013492107391357422, 0.01431584358215332, 0.015139579772949219, 0.015963315963745117, 0.016787052154541016, 0.017610788345336914, 0.018434524536132812, 0.01925826072692871, 0.02008199691772461, 0.020905733108520508, 0.021729469299316406, 0.022553205490112305, 0.023376941680908203, 0.0242006778717041, 0.0250244140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 24.0, 22.0, 33.0, 44.0, 79.0, 95.0, 162.0, 234.0, 380.0, 594.0, 1026.0, 1860.0, 3543.0, 7613.0, 20646.0, 77380.0, 409685.0, 410876.0, 78135.0, 20656.0, 7541.0, 3481.0, 1720.0, 997.0, 583.0, 416.0, 226.0, 167.0, 111.0, 52.0, 60.0, 39.0, 25.0, 14.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00881195068359375, -0.008518218994140625, -0.0082244873046875, -0.007930755615234375, -0.00763702392578125, -0.007343292236328125, -0.007049560546875, -0.006755828857421875, -0.00646209716796875, -0.006168365478515625, -0.0058746337890625, -0.005580902099609375, -0.00528717041015625, -0.004993438720703125, -0.00469970703125, -0.004405975341796875, -0.00411224365234375, -0.003818511962890625, -0.0035247802734375, -0.003231048583984375, -0.00293731689453125, -0.002643585205078125, -0.002349853515625, -0.002056121826171875, -0.00176239013671875, -0.001468658447265625, -0.0011749267578125, -0.000881195068359375, -0.00058746337890625, -0.000293731689453125, 0.0, 0.000293731689453125, 0.00058746337890625, 0.000881195068359375, 0.0011749267578125, 0.001468658447265625, 0.00176239013671875, 0.002056121826171875, 0.002349853515625, 0.002643585205078125, 0.00293731689453125, 0.003231048583984375, 0.0035247802734375, 0.003818511962890625, 0.00411224365234375, 0.004405975341796875, 0.00469970703125, 0.004993438720703125, 0.00528717041015625, 0.005580902099609375, 0.0058746337890625, 0.006168365478515625, 0.00646209716796875, 0.006755828857421875, 0.007049560546875, 0.007343292236328125, 0.00763702392578125, 0.007930755615234375, 0.0082244873046875, 0.008518218994140625, 0.00881195068359375, 0.009105682373046875, 0.0093994140625, 0.009693145751953125, 0.00998687744140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 15.0, 18.0, 34.0, 31.0, 51.0, 49.0, 66.0, 82.0, 118.0, 108.0, 87.0, 71.0, 53.0, 52.0, 26.0, 25.0, 26.0, 21.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011140108108520508, -0.00010846741497516632, -0.00010553374886512756, -0.0001026000827550888, -9.966641664505005e-05, -9.673275053501129e-05, -9.379908442497253e-05, -9.086541831493378e-05, -8.793175220489502e-05, -8.499808609485626e-05, -8.20644199848175e-05, -7.913075387477875e-05, -7.619708776473999e-05, -7.326342165470123e-05, -7.032975554466248e-05, -6.739608943462372e-05, -6.446242332458496e-05, -6.15287572145462e-05, -5.8595091104507446e-05, -5.566142499446869e-05, -5.272775888442993e-05, -4.9794092774391174e-05, -4.686042666435242e-05, -4.392676055431366e-05, -4.09930944442749e-05, -3.8059428334236145e-05, -3.512576222419739e-05, -3.219209611415863e-05, -2.9258430004119873e-05, -2.6324763894081116e-05, -2.339109778404236e-05, -2.04574316740036e-05, -1.7523765563964844e-05, -1.4590099453926086e-05, -1.1656433343887329e-05, -8.722767233848572e-06, -5.7891011238098145e-06, -2.855435013771057e-06, 7.82310962677002e-08, 3.0118972063064575e-06, 5.945563316345215e-06, 8.879229426383972e-06, 1.181289553642273e-05, 1.4746561646461487e-05, 1.7680227756500244e-05, 2.0613893866539e-05, 2.354755997657776e-05, 2.6481226086616516e-05, 2.9414892196655273e-05, 3.234855830669403e-05, 3.528222441673279e-05, 3.8215890526771545e-05, 4.11495566368103e-05, 4.408322274684906e-05, 4.701688885688782e-05, 4.9950554966926575e-05, 5.288422107696533e-05, 5.581788718700409e-05, 5.875155329704285e-05, 6.16852194070816e-05, 6.461888551712036e-05, 6.755255162715912e-05, 7.048621773719788e-05, 7.341988384723663e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 10.0, 14.0, 12.0, 19.0, 24.0, 63.0, 89.0, 129.0, 211.0, 364.0, 617.0, 1202.0, 2266.0, 4677.0, 10318.0, 23153.0, 64599.0, 230347.0, 457837.0, 167432.0, 49735.0, 18718.0, 8399.0, 3945.0, 1960.0, 1012.0, 545.0, 309.0, 192.0, 126.0, 78.0, 47.0, 36.0, 18.0, 17.0, 12.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0079803466796875, -0.00773388147354126, -0.0074874162673950195, -0.007240951061248779, -0.006994485855102539, -0.006748020648956299, -0.006501555442810059, -0.006255090236663818, -0.006008625030517578, -0.005762159824371338, -0.005515694618225098, -0.005269229412078857, -0.005022764205932617, -0.004776298999786377, -0.004529833793640137, -0.0042833685874938965, -0.004036903381347656, -0.003790438175201416, -0.0035439729690551758, -0.0032975077629089355, -0.0030510425567626953, -0.002804577350616455, -0.002558112144470215, -0.0023116469383239746, -0.0020651817321777344, -0.0018187165260314941, -0.001572251319885254, -0.0013257861137390137, -0.0010793209075927734, -0.0008328557014465332, -0.000586390495300293, -0.00033992528915405273, -9.34600830078125e-05, 0.00015300512313842773, 0.00039947032928466797, 0.0006459355354309082, 0.0008924007415771484, 0.0011388659477233887, 0.001385331153869629, 0.0016317963600158691, 0.0018782615661621094, 0.0021247267723083496, 0.00237119197845459, 0.00261765718460083, 0.0028641223907470703, 0.0031105875968933105, 0.0033570528030395508, 0.003603518009185791, 0.0038499832153320312, 0.0040964484214782715, 0.004342913627624512, 0.004589378833770752, 0.004835844039916992, 0.005082309246063232, 0.005328774452209473, 0.005575239658355713, 0.005821704864501953, 0.006068170070648193, 0.006314635276794434, 0.006561100482940674, 0.006807565689086914, 0.007054030895233154, 0.0073004961013793945, 0.007546961307525635, 0.007793426513671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 20.0, 17.0, 42.0, 50.0, 78.0, 91.0, 103.0, 132.0, 107.0, 99.0, 75.0, 47.0, 42.0, 24.0, 18.0, 11.0, 5.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010248303413391113, -0.009922266006469727, -0.00959622859954834, -0.009270191192626953, -0.008944153785705566, -0.00861811637878418, -0.008292078971862793, -0.007966041564941406, -0.0076400041580200195, -0.007313966751098633, -0.006987929344177246, -0.006661891937255859, -0.006335854530334473, -0.006009817123413086, -0.005683779716491699, -0.0053577423095703125, -0.005031704902648926, -0.004705667495727539, -0.004379630088806152, -0.004053592681884766, -0.003727555274963379, -0.003401517868041992, -0.0030754804611206055, -0.0027494430541992188, -0.002423405647277832, -0.0020973682403564453, -0.0017713308334350586, -0.0014452934265136719, -0.0011192560195922852, -0.0007932186126708984, -0.0004671812057495117, -0.000141143798828125, 0.00018489360809326172, 0.0005109310150146484, 0.0008369684219360352, 0.0011630058288574219, 0.0014890432357788086, 0.0018150806427001953, 0.002141118049621582, 0.0024671554565429688, 0.0027931928634643555, 0.003119230270385742, 0.003445267677307129, 0.0037713050842285156, 0.004097342491149902, 0.004423379898071289, 0.004749417304992676, 0.0050754547119140625, 0.005401492118835449, 0.005727529525756836, 0.006053566932678223, 0.006379604339599609, 0.006705641746520996, 0.007031679153442383, 0.0073577165603637695, 0.007683753967285156, 0.008009791374206543, 0.00833582878112793, 0.008661866188049316, 0.008987903594970703, 0.00931394100189209, 0.009639978408813477, 0.009966015815734863, 0.01029205322265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 20.0, 41.0, 91.0, 160.0, 235.0, 212.0, 119.0, 64.0, 24.0, 16.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.24155941605567932, -0.23699802160263062, -0.2324366271495819, -0.2278752326965332, -0.2233138382434845, -0.2187524437904358, -0.21419104933738708, -0.20962965488433838, -0.20506826043128967, -0.20050686597824097, -0.19594547152519226, -0.19138407707214355, -0.18682268261909485, -0.18226128816604614, -0.17769989371299744, -0.17313849925994873, -0.16857710480690002, -0.16401571035385132, -0.1594543159008026, -0.1548929214477539, -0.1503315269947052, -0.1457701325416565, -0.1412087380886078, -0.13664734363555908, -0.13208594918251038, -0.12752455472946167, -0.12296316027641296, -0.11840176582336426, -0.11384037137031555, -0.10927897691726685, -0.10471758246421814, -0.10015618801116943, -0.09559480845928192, -0.09103341400623322, -0.08647201955318451, -0.0819106251001358, -0.0773492306470871, -0.07278783619403839, -0.06822644174098969, -0.06366504728794098, -0.05910365283489227, -0.05454225838184357, -0.04998086392879486, -0.045419469475746155, -0.04085807502269745, -0.03629668056964874, -0.03173528611660004, -0.02717389166355133, -0.022612497210502625, -0.01805110275745392, -0.013489708304405212, -0.008928313851356506, -0.0043669193983078, 0.00019447505474090576, 0.004755869507789612, 0.009317263960838318, 0.013878658413887024, 0.01844005286693573, 0.023001447319984436, 0.027562841773033142, 0.03212423622608185, 0.036685630679130554, 0.04124702513217926, 0.045808419585227966, 0.05036981403827667]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 4.0, 5.0, 8.0, 7.0, 13.0, 13.0, 11.0, 27.0, 25.0, 22.0, 38.0, 29.0, 40.0, 40.0, 42.0, 47.0, 49.0, 54.0, 43.0, 46.0, 48.0, 50.0, 45.0, 42.0, 31.0, 48.0, 22.0, 22.0, 27.0, 21.0, 12.0, 11.0, 12.0, 15.0, 7.0, 9.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07508087158203125, -0.07260803878307343, -0.0701352134346962, -0.06766238063573837, -0.06518955528736115, -0.06271672248840332, -0.060243889689445496, -0.05777106061577797, -0.05529823154211044, -0.05282540246844292, -0.05035257339477539, -0.047879740595817566, -0.04540691152215004, -0.04293408244848251, -0.04046124964952469, -0.03798842057585716, -0.035515591502189636, -0.03304276242852211, -0.030569931492209435, -0.02809710055589676, -0.025624271482229233, -0.023151442408561707, -0.02067861147224903, -0.018205780535936356, -0.01573295146226883, -0.013260121457278728, -0.010787291452288628, -0.008314461447298527, -0.005841631442308426, -0.003368801437318325, -0.0008959714323282242, 0.0015768595039844513, 0.0040496885776519775, 0.006522518582642078, 0.00899534858763218, 0.01146817859262228, 0.013941008597612381, 0.016413837671279907, 0.018886668607592583, 0.021359499543905258, 0.023832328617572784, 0.02630515769124031, 0.028777988627552986, 0.03125081956386566, 0.03372364863753319, 0.036196477711200714, 0.03866931051015854, 0.041142139583826065, 0.04361496865749359, 0.04608779773116112, 0.048560626804828644, 0.05103345960378647, 0.053506288677453995, 0.05597911775112152, 0.058451950550079346, 0.06092477962374687, 0.0633976086974144, 0.06587044149637222, 0.06834326684474945, 0.07081609964370728, 0.0732889324426651, 0.07576175779104233, 0.07823459059000015, 0.08070741593837738, 0.0831802487373352]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 15.0, 42.0, 249.0, 3045.0, 4009048.0, 179992.0, 1583.0, 204.0, 53.0, 22.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.233154296875, -0.22628021240234375, -0.2194061279296875, -0.21253204345703125, -0.205657958984375, -0.19878387451171875, -0.1919097900390625, -0.18503570556640625, -0.17816162109375, -0.17128753662109375, -0.1644134521484375, -0.15753936767578125, -0.150665283203125, -0.14379119873046875, -0.1369171142578125, -0.13004302978515625, -0.1231689453125, -0.11629486083984375, -0.1094207763671875, -0.10254669189453125, -0.095672607421875, -0.08879852294921875, -0.0819244384765625, -0.07505035400390625, -0.06817626953125, -0.06130218505859375, -0.0544281005859375, -0.04755401611328125, -0.040679931640625, -0.03380584716796875, -0.0269317626953125, -0.02005767822265625, -0.01318359375, -0.00630950927734375, 0.0005645751953125, 0.00743865966796875, 0.014312744140625, 0.02118682861328125, 0.0280609130859375, 0.03493499755859375, 0.04180908203125, 0.04868316650390625, 0.0555572509765625, 0.06243133544921875, 0.069305419921875, 0.07617950439453125, 0.0830535888671875, 0.08992767333984375, 0.0968017578125, 0.10367584228515625, 0.1105499267578125, 0.11742401123046875, 0.124298095703125, 0.13117218017578125, 0.1380462646484375, 0.14492034912109375, 0.15179443359375, 0.15866851806640625, 0.1655426025390625, 0.17241668701171875, 0.179290771484375, 0.18616485595703125, 0.1930389404296875, 0.19991302490234375, 0.206787109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 22.0, 74.0, 235.0, 346.0, 236.0, 79.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.064453125, -0.0624699592590332, -0.060486793518066406, -0.05850362777709961, -0.05652046203613281, -0.054537296295166016, -0.05255413055419922, -0.05057096481323242, -0.048587799072265625, -0.04660463333129883, -0.04462146759033203, -0.042638301849365234, -0.04065513610839844, -0.03867197036743164, -0.036688804626464844, -0.03470563888549805, -0.03272247314453125, -0.030739307403564453, -0.028756141662597656, -0.02677297592163086, -0.024789810180664062, -0.022806644439697266, -0.02082347869873047, -0.018840312957763672, -0.016857147216796875, -0.014873981475830078, -0.012890815734863281, -0.010907649993896484, -0.008924484252929688, -0.006941318511962891, -0.004958152770996094, -0.002974987030029297, -0.0009918212890625, 0.0009913444519042969, 0.0029745101928710938, 0.004957675933837891, 0.0069408416748046875, 0.008924007415771484, 0.010907173156738281, 0.012890338897705078, 0.014873504638671875, 0.016856670379638672, 0.01883983612060547, 0.020823001861572266, 0.022806167602539062, 0.02478933334350586, 0.026772499084472656, 0.028755664825439453, 0.03073883056640625, 0.03272199630737305, 0.034705162048339844, 0.03668832778930664, 0.03867149353027344, 0.040654659271240234, 0.04263782501220703, 0.04462099075317383, 0.046604156494140625, 0.04858732223510742, 0.05057048797607422, 0.052553653717041016, 0.05453681945800781, 0.05651998519897461, 0.058503150939941406, 0.0604863166809082, 0.062469482421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 11.0, 24.0, 34.0, 44.0, 67.0, 83.0, 135.0, 273.0, 529.0, 1044.0, 2064.0, 5263.0, 16146.0, 68871.0, 762525.0, 3148759.0, 146795.0, 27562.0, 8121.0, 2946.0, 1345.0, 670.0, 373.0, 177.0, 140.0, 95.0, 60.0, 30.0, 28.0, 17.0, 16.0, 12.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.021364212036132812, -0.020679473876953125, -0.019994735717773438, -0.01930999755859375, -0.018625259399414062, -0.017940521240234375, -0.017255783081054688, -0.016571044921875, -0.015886306762695312, -0.015201568603515625, -0.014516830444335938, -0.01383209228515625, -0.013147354125976562, -0.012462615966796875, -0.011777877807617188, -0.0110931396484375, -0.010408401489257812, -0.009723663330078125, -0.009038925170898438, -0.00835418701171875, -0.0076694488525390625, -0.006984710693359375, -0.0062999725341796875, -0.005615234375, -0.0049304962158203125, -0.004245758056640625, -0.0035610198974609375, -0.00287628173828125, -0.0021915435791015625, -0.001506805419921875, -0.0008220672607421875, -0.0001373291015625, 0.0005474090576171875, 0.001232147216796875, 0.0019168853759765625, 0.00260162353515625, 0.0032863616943359375, 0.003971099853515625, 0.0046558380126953125, 0.005340576171875, 0.0060253143310546875, 0.006710052490234375, 0.0073947906494140625, 0.00807952880859375, 0.008764266967773438, 0.009449005126953125, 0.010133743286132812, 0.0108184814453125, 0.011503219604492188, 0.012187957763671875, 0.012872695922851562, 0.01355743408203125, 0.014242172241210938, 0.014926910400390625, 0.015611648559570312, 0.01629638671875, 0.016981124877929688, 0.017665863037109375, 0.018350601196289062, 0.01903533935546875, 0.019720077514648438, 0.020404815673828125, 0.021089553833007812, 0.0217742919921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 12.0, 21.0, 35.0, 56.0, 100.0, 249.0, 643.0, 1607.0, 789.0, 250.0, 109.0, 65.0, 38.0, 17.0, 26.0, 13.0, 14.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020477294921875, -0.019609451293945312, -0.018741607666015625, -0.017873764038085938, -0.01700592041015625, -0.016138076782226562, -0.015270233154296875, -0.014402389526367188, -0.0135345458984375, -0.012666702270507812, -0.011798858642578125, -0.010931015014648438, -0.01006317138671875, -0.009195327758789062, -0.008327484130859375, -0.0074596405029296875, -0.006591796875, -0.0057239532470703125, -0.004856109619140625, -0.0039882659912109375, -0.00312042236328125, -0.0022525787353515625, -0.001384735107421875, -0.0005168914794921875, 0.0003509521484375, 0.0012187957763671875, 0.002086639404296875, 0.0029544830322265625, 0.00382232666015625, 0.0046901702880859375, 0.005558013916015625, 0.0064258575439453125, 0.007293701171875, 0.008161544799804688, 0.009029388427734375, 0.009897232055664062, 0.01076507568359375, 0.011632919311523438, 0.012500762939453125, 0.013368606567382812, 0.0142364501953125, 0.015104293823242188, 0.015972137451171875, 0.016839981079101562, 0.01770782470703125, 0.018575668334960938, 0.019443511962890625, 0.020311355590820312, 0.02117919921875, 0.022047042846679688, 0.022914886474609375, 0.023782730102539062, 0.02465057373046875, 0.025518417358398438, 0.026386260986328125, 0.027254104614257812, 0.0281219482421875, 0.028989791870117188, 0.029857635498046875, 0.030725479125976562, 0.03159332275390625, 0.03246116638183594, 0.033329010009765625, 0.03419685363769531, 0.035064697265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 12.0, 22.0, 69.0, 186.0, 264.0, 230.0, 126.0, 50.0, 18.0, 9.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25066709518432617, -0.2449071854352951, -0.23914729058742523, -0.23338738083839417, -0.2276274859905243, -0.22186757624149323, -0.21610766649246216, -0.21034777164459229, -0.2045878767967224, -0.19882796704769135, -0.19306807219982147, -0.1873081624507904, -0.18154826760292053, -0.17578835785388947, -0.1700284481048584, -0.16426855325698853, -0.15850864350795746, -0.1527487337589264, -0.14698883891105652, -0.14122892916202545, -0.13546903431415558, -0.1297091245651245, -0.12394922226667404, -0.11818931996822357, -0.1124294176697731, -0.10666951537132263, -0.10090961307287216, -0.09514971077442169, -0.08938980102539062, -0.08362990617752075, -0.07786999642848969, -0.07211009413003922, -0.06635017693042755, -0.06059027463197708, -0.05483037233352661, -0.04907046630978584, -0.04331056401133537, -0.0375506617128849, -0.031790755689144135, -0.026030853390693665, -0.020270951092243195, -0.01451104786247015, -0.008751144632697105, -0.002991240471601486, 0.0027686618268489838, 0.008528564125299454, 0.014288470149040222, 0.020048372447490692, 0.025808274745941162, 0.03156817704439163, 0.0373280793428421, 0.04308798536658287, 0.04884788766503334, 0.05460778996348381, 0.06036769598722458, 0.06612759828567505, 0.07188750058412552, 0.07764740288257599, 0.08340730518102646, 0.08916720747947693, 0.094927117228508, 0.10068701207637787, 0.10644692182540894, 0.1122068241238594, 0.11796672642230988]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 7.0, 13.0, 21.0, 8.0, 22.0, 33.0, 21.0, 24.0, 30.0, 38.0, 39.0, 42.0, 56.0, 47.0, 51.0, 45.0, 44.0, 44.0, 46.0, 52.0, 41.0, 22.0, 36.0, 27.0, 26.0, 18.0, 15.0, 19.0, 14.0, 14.0, 11.0, 15.0, 15.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05937594175338745, -0.057429276406764984, -0.055482614785432816, -0.05353595316410065, -0.05158928781747818, -0.04964262247085571, -0.047695960849523544, -0.045749299228191376, -0.04380263388156891, -0.04185596853494644, -0.03990930691361427, -0.037962645292282104, -0.03601597994565964, -0.03406931459903717, -0.032122652977705, -0.030175989493727684, -0.028229326009750366, -0.02628266252577305, -0.02433599904179573, -0.022389335557818413, -0.020442672073841095, -0.018496008589863777, -0.01654934510588646, -0.014602681621909142, -0.012656018137931824, -0.010709354653954506, -0.008762691169977188, -0.00681602768599987, -0.0048693642020225525, -0.0029227007180452347, -0.0009760372340679169, 0.0009706262499094009, 0.0029172897338867188, 0.0048639532178640366, 0.006810616701841354, 0.008757280185818672, 0.01070394366979599, 0.012650607153773308, 0.014597270637750626, 0.016543934121727943, 0.01849059760570526, 0.02043726108968258, 0.022383924573659897, 0.024330588057637215, 0.026277251541614532, 0.02822391502559185, 0.030170578509569168, 0.03211724013090134, 0.034063905477523804, 0.03601057082414627, 0.03795723244547844, 0.03990389406681061, 0.041850559413433075, 0.04379722476005554, 0.04574388638138771, 0.04769054800271988, 0.049637213349342346, 0.05158387869596481, 0.05353054031729698, 0.05547720193862915, 0.05742386728525162, 0.059370532631874084, 0.06131719425320625, 0.06326385587453842, 0.06521052122116089]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 7.0, 11.0, 18.0, 22.0, 24.0, 27.0, 42.0, 55.0, 70.0, 93.0, 128.0, 184.0, 246.0, 349.0, 563.0, 979.0, 2755.0, 23760.0, 590485.0, 407264.0, 16471.0, 2323.0, 851.0, 485.0, 346.0, 248.0, 172.0, 142.0, 93.0, 75.0, 38.0, 51.0, 39.0, 33.0, 12.0, 16.0, 16.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0], "bins": [-0.07342529296875, -0.07126140594482422, -0.06909751892089844, -0.06693363189697266, -0.06476974487304688, -0.0626058578491211, -0.06044197082519531, -0.05827808380126953, -0.05611419677734375, -0.05395030975341797, -0.05178642272949219, -0.049622535705566406, -0.047458648681640625, -0.045294761657714844, -0.04313087463378906, -0.04096698760986328, -0.0388031005859375, -0.03663921356201172, -0.03447532653808594, -0.032311439514160156, -0.030147552490234375, -0.027983665466308594, -0.025819778442382812, -0.02365589141845703, -0.02149200439453125, -0.01932811737060547, -0.017164230346679688, -0.015000343322753906, -0.012836456298828125, -0.010672569274902344, -0.008508682250976562, -0.006344795227050781, -0.004180908203125, -0.0020170211791992188, 0.0001468658447265625, 0.0023107528686523438, 0.004474639892578125, 0.006638526916503906, 0.008802413940429688, 0.010966300964355469, 0.01313018798828125, 0.015294075012207031, 0.017457962036132812, 0.019621849060058594, 0.021785736083984375, 0.023949623107910156, 0.026113510131835938, 0.02827739715576172, 0.0304412841796875, 0.03260517120361328, 0.03476905822753906, 0.036932945251464844, 0.039096832275390625, 0.041260719299316406, 0.04342460632324219, 0.04558849334716797, 0.04775238037109375, 0.04991626739501953, 0.05208015441894531, 0.054244041442871094, 0.056407928466796875, 0.058571815490722656, 0.06073570251464844, 0.06289958953857422, 0.0650634765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 65.0, 191.0, 350.0, 248.0, 123.0, 13.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06451416015625, -0.06254434585571289, -0.06057453155517578, -0.05860471725463867, -0.05663490295410156, -0.05466508865356445, -0.052695274353027344, -0.050725460052490234, -0.048755645751953125, -0.046785831451416016, -0.044816017150878906, -0.0428462028503418, -0.04087638854980469, -0.03890657424926758, -0.03693675994873047, -0.03496694564819336, -0.03299713134765625, -0.03102731704711914, -0.02905750274658203, -0.027087688446044922, -0.025117874145507812, -0.023148059844970703, -0.021178245544433594, -0.019208431243896484, -0.017238616943359375, -0.015268802642822266, -0.013298988342285156, -0.011329174041748047, -0.009359359741210938, -0.007389545440673828, -0.005419731140136719, -0.0034499168395996094, -0.0014801025390625, 0.0004897117614746094, 0.0024595260620117188, 0.004429340362548828, 0.0063991546630859375, 0.008368968963623047, 0.010338783264160156, 0.012308597564697266, 0.014278411865234375, 0.016248226165771484, 0.018218040466308594, 0.020187854766845703, 0.022157669067382812, 0.024127483367919922, 0.02609729766845703, 0.02806711196899414, 0.03003692626953125, 0.03200674057006836, 0.03397655487060547, 0.03594636917114258, 0.03791618347167969, 0.0398859977722168, 0.041855812072753906, 0.043825626373291016, 0.045795440673828125, 0.047765254974365234, 0.049735069274902344, 0.05170488357543945, 0.05367469787597656, 0.05564451217651367, 0.05761432647705078, 0.05958414077758789, 0.061553955078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 16.0, 30.0, 29.0, 48.0, 82.0, 139.0, 248.0, 664.0, 2066.0, 11586.0, 123904.0, 765219.0, 129001.0, 12027.0, 2161.0, 651.0, 261.0, 129.0, 73.0, 41.0, 36.0, 19.0, 30.0, 12.0, 11.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.056640625, -0.05489826202392578, -0.05315589904785156, -0.051413536071777344, -0.049671173095703125, -0.047928810119628906, -0.04618644714355469, -0.04444408416748047, -0.04270172119140625, -0.04095935821533203, -0.03921699523925781, -0.037474632263183594, -0.035732269287109375, -0.033989906311035156, -0.03224754333496094, -0.03050518035888672, -0.0287628173828125, -0.02702045440673828, -0.025278091430664062, -0.023535728454589844, -0.021793365478515625, -0.020051002502441406, -0.018308639526367188, -0.01656627655029297, -0.01482391357421875, -0.013081550598144531, -0.011339187622070312, -0.009596824645996094, -0.007854461669921875, -0.006112098693847656, -0.0043697357177734375, -0.0026273727416992188, -0.000885009765625, 0.0008573532104492188, 0.0025997161865234375, 0.004342079162597656, 0.006084442138671875, 0.007826805114746094, 0.009569168090820312, 0.011311531066894531, 0.01305389404296875, 0.014796257019042969, 0.016538619995117188, 0.018280982971191406, 0.020023345947265625, 0.021765708923339844, 0.023508071899414062, 0.02525043487548828, 0.0269927978515625, 0.02873516082763672, 0.030477523803710938, 0.032219886779785156, 0.033962249755859375, 0.035704612731933594, 0.03744697570800781, 0.03918933868408203, 0.04093170166015625, 0.04267406463623047, 0.04441642761230469, 0.046158790588378906, 0.047901153564453125, 0.049643516540527344, 0.05138587951660156, 0.05312824249267578, 0.05487060546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 11.0, 17.0, 12.0, 20.0, 13.0, 16.0, 31.0, 33.0, 36.0, 38.0, 43.0, 43.0, 48.0, 40.0, 39.0, 41.0, 42.0, 48.0, 58.0, 45.0, 36.0, 40.0, 28.0, 39.0, 24.0, 23.0, 13.0, 21.0, 15.0, 21.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027740478515625, -0.026801586151123047, -0.025862693786621094, -0.02492380142211914, -0.023984909057617188, -0.023046016693115234, -0.02210712432861328, -0.021168231964111328, -0.020229339599609375, -0.019290447235107422, -0.01835155487060547, -0.017412662506103516, -0.016473770141601562, -0.01553487777709961, -0.014595985412597656, -0.013657093048095703, -0.01271820068359375, -0.011779308319091797, -0.010840415954589844, -0.00990152359008789, -0.008962631225585938, -0.008023738861083984, -0.007084846496582031, -0.006145954132080078, -0.005207061767578125, -0.004268169403076172, -0.0033292770385742188, -0.0023903846740722656, -0.0014514923095703125, -0.0005125999450683594, 0.00042629241943359375, 0.0013651847839355469, 0.0023040771484375, 0.003242969512939453, 0.004181861877441406, 0.005120754241943359, 0.0060596466064453125, 0.006998538970947266, 0.007937431335449219, 0.008876323699951172, 0.009815216064453125, 0.010754108428955078, 0.011693000793457031, 0.012631893157958984, 0.013570785522460938, 0.01450967788696289, 0.015448570251464844, 0.016387462615966797, 0.01732635498046875, 0.018265247344970703, 0.019204139709472656, 0.02014303207397461, 0.021081924438476562, 0.022020816802978516, 0.02295970916748047, 0.023898601531982422, 0.024837493896484375, 0.025776386260986328, 0.02671527862548828, 0.027654170989990234, 0.028593063354492188, 0.02953195571899414, 0.030470848083496094, 0.03140974044799805, 0.0323486328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 9.0, 9.0, 22.0, 33.0, 45.0, 62.0, 65.0, 119.0, 148.0, 233.0, 314.0, 506.0, 886.0, 1416.0, 2556.0, 4626.0, 9319.0, 20374.0, 48927.0, 136021.0, 357785.0, 290486.0, 102263.0, 38964.0, 16519.0, 7540.0, 3841.0, 2068.0, 1214.0, 723.0, 430.0, 331.0, 186.0, 146.0, 111.0, 58.0, 50.0, 34.0, 22.0, 15.0, 22.0, 7.0, 4.0, 8.0, 4.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00910186767578125, -0.00877523422241211, -0.008448600769042969, -0.008121967315673828, -0.0077953338623046875, -0.007468700408935547, -0.007142066955566406, -0.006815433502197266, -0.006488800048828125, -0.006162166595458984, -0.005835533142089844, -0.005508899688720703, -0.0051822662353515625, -0.004855632781982422, -0.004528999328613281, -0.004202365875244141, -0.003875732421875, -0.0035490989685058594, -0.0032224655151367188, -0.002895832061767578, -0.0025691986083984375, -0.002242565155029297, -0.0019159317016601562, -0.0015892982482910156, -0.001262664794921875, -0.0009360313415527344, -0.0006093978881835938, -0.0002827644348144531, 4.38690185546875e-05, 0.0003705024719238281, 0.0006971359252929688, 0.0010237693786621094, 0.00135040283203125, 0.0016770362854003906, 0.0020036697387695312, 0.002330303192138672, 0.0026569366455078125, 0.002983570098876953, 0.0033102035522460938, 0.0036368370056152344, 0.003963470458984375, 0.004290103912353516, 0.004616737365722656, 0.004943370819091797, 0.0052700042724609375, 0.005596637725830078, 0.005923271179199219, 0.006249904632568359, 0.0065765380859375, 0.006903171539306641, 0.007229804992675781, 0.007556438446044922, 0.007883071899414062, 0.008209705352783203, 0.008536338806152344, 0.008862972259521484, 0.009189605712890625, 0.009516239166259766, 0.009842872619628906, 0.010169506072998047, 0.010496139526367188, 0.010822772979736328, 0.011149406433105469, 0.01147603988647461, 0.01180267333984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 11.0, 6.0, 11.0, 20.0, 21.0, 33.0, 32.0, 48.0, 58.0, 75.0, 86.0, 83.0, 95.0, 64.0, 66.0, 63.0, 46.0, 30.0, 29.0, 19.0, 21.0, 13.0, 9.0, 7.0, 8.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.654594421386719e-05, -8.419528603553772e-05, -8.184462785720825e-05, -7.949396967887878e-05, -7.714331150054932e-05, -7.479265332221985e-05, -7.244199514389038e-05, -7.009133696556091e-05, -6.774067878723145e-05, -6.539002060890198e-05, -6.303936243057251e-05, -6.068870425224304e-05, -5.8338046073913574e-05, -5.5987387895584106e-05, -5.363672971725464e-05, -5.128607153892517e-05, -4.89354133605957e-05, -4.6584755182266235e-05, -4.423409700393677e-05, -4.18834388256073e-05, -3.953278064727783e-05, -3.7182122468948364e-05, -3.4831464290618896e-05, -3.248080611228943e-05, -3.013014793395996e-05, -2.7779489755630493e-05, -2.5428831577301025e-05, -2.3078173398971558e-05, -2.072751522064209e-05, -1.8376857042312622e-05, -1.6026198863983154e-05, -1.3675540685653687e-05, -1.1324882507324219e-05, -8.974224328994751e-06, -6.623566150665283e-06, -4.2729079723358154e-06, -1.9222497940063477e-06, 4.284083843231201e-07, 2.779066562652588e-06, 5.129724740982056e-06, 7.4803829193115234e-06, 9.831041097640991e-06, 1.2181699275970459e-05, 1.4532357454299927e-05, 1.6883015632629395e-05, 1.9233673810958862e-05, 2.158433198928833e-05, 2.3934990167617798e-05, 2.6285648345947266e-05, 2.8636306524276733e-05, 3.09869647026062e-05, 3.333762288093567e-05, 3.568828105926514e-05, 3.8038939237594604e-05, 4.038959741592407e-05, 4.274025559425354e-05, 4.509091377258301e-05, 4.7441571950912476e-05, 4.979223012924194e-05, 5.214288830757141e-05, 5.449354648590088e-05, 5.684420466423035e-05, 5.9194862842559814e-05, 6.154552102088928e-05, 6.389617919921875e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 6.0, 12.0, 15.0, 20.0, 33.0, 47.0, 73.0, 102.0, 189.0, 273.0, 405.0, 739.0, 1332.0, 2660.0, 5914.0, 13455.0, 33805.0, 99478.0, 346051.0, 372799.0, 108021.0, 36357.0, 14418.0, 6116.0, 2838.0, 1457.0, 697.0, 402.0, 266.0, 178.0, 121.0, 75.0, 48.0, 46.0, 25.0, 24.0, 17.0, 7.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.01499176025390625, -0.014575719833374023, -0.014159679412841797, -0.01374363899230957, -0.013327598571777344, -0.012911558151245117, -0.01249551773071289, -0.012079477310180664, -0.011663436889648438, -0.011247396469116211, -0.010831356048583984, -0.010415315628051758, -0.009999275207519531, -0.009583234786987305, -0.009167194366455078, -0.008751153945922852, -0.008335113525390625, -0.007919073104858398, -0.007503032684326172, -0.007086992263793945, -0.006670951843261719, -0.006254911422729492, -0.005838871002197266, -0.005422830581665039, -0.0050067901611328125, -0.004590749740600586, -0.004174709320068359, -0.003758668899536133, -0.0033426284790039062, -0.0029265880584716797, -0.002510547637939453, -0.0020945072174072266, -0.001678466796875, -0.0012624263763427734, -0.0008463859558105469, -0.0004303455352783203, -1.430511474609375e-05, 0.0004017353057861328, 0.0008177757263183594, 0.001233816146850586, 0.0016498565673828125, 0.002065896987915039, 0.0024819374084472656, 0.002897977828979492, 0.0033140182495117188, 0.0037300586700439453, 0.004146099090576172, 0.0045621395111083984, 0.004978179931640625, 0.0053942203521728516, 0.005810260772705078, 0.006226301193237305, 0.006642341613769531, 0.007058382034301758, 0.007474422454833984, 0.007890462875366211, 0.008306503295898438, 0.008722543716430664, 0.00913858413696289, 0.009554624557495117, 0.009970664978027344, 0.01038670539855957, 0.010802745819091797, 0.011218786239624023, 0.01163482666015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 13.0, 15.0, 13.0, 14.0, 18.0, 28.0, 33.0, 57.0, 68.0, 88.0, 90.0, 109.0, 101.0, 85.0, 53.0, 60.0, 31.0, 25.0, 20.0, 19.0, 14.0, 11.0, 4.0, 6.0, 5.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.013248682022094727, -0.012779712677001953, -0.01231074333190918, -0.011841773986816406, -0.011372804641723633, -0.01090383529663086, -0.010434865951538086, -0.009965896606445312, -0.009496927261352539, -0.009027957916259766, -0.008558988571166992, -0.008090019226074219, -0.007621049880981445, -0.007152080535888672, -0.0066831111907958984, -0.006214141845703125, -0.0057451725006103516, -0.005276203155517578, -0.004807233810424805, -0.004338264465332031, -0.003869295120239258, -0.0034003257751464844, -0.002931356430053711, -0.0024623870849609375, -0.001993417739868164, -0.0015244483947753906, -0.0010554790496826172, -0.0005865097045898438, -0.00011754035949707031, 0.0003514289855957031, 0.0008203983306884766, 0.00128936767578125, 0.0017583370208740234, 0.002227306365966797, 0.0026962757110595703, 0.0031652450561523438, 0.003634214401245117, 0.004103183746337891, 0.004572153091430664, 0.0050411224365234375, 0.005510091781616211, 0.005979061126708984, 0.006448030471801758, 0.006916999816894531, 0.007385969161987305, 0.007854938507080078, 0.008323907852172852, 0.008792877197265625, 0.009261846542358398, 0.009730815887451172, 0.010199785232543945, 0.010668754577636719, 0.011137723922729492, 0.011606693267822266, 0.012075662612915039, 0.012544631958007812, 0.013013601303100586, 0.01348257064819336, 0.013951539993286133, 0.014420509338378906, 0.01488947868347168, 0.015358448028564453, 0.015827417373657227, 0.01629638671875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 53.0, 207.0, 413.0, 265.0, 51.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58975750207901, -0.5752612948417664, -0.5607650279998779, -0.5462688207626343, -0.5317725539207458, -0.5172763466835022, -0.5027800798416138, -0.4882838726043701, -0.4737876057624817, -0.45929136872291565, -0.4447951316833496, -0.43029889464378357, -0.41580265760421753, -0.4013064205646515, -0.38681018352508545, -0.3723139762878418, -0.35781773924827576, -0.3433215022087097, -0.3288252651691437, -0.31432902812957764, -0.2998327910900116, -0.28533655405044556, -0.2708403468132019, -0.2563440799713135, -0.24184785783290863, -0.2273516207933426, -0.21285538375377655, -0.1983591616153717, -0.18386292457580566, -0.16936668753623962, -0.15487045049667358, -0.14037421345710754, -0.1258779764175415, -0.11138173937797546, -0.09688550233840942, -0.08238927274942398, -0.06789303570985794, -0.0533967986702919, -0.03890056908130646, -0.024404332041740417, -0.009908095002174377, 0.004588140174746513, 0.019084375351667404, 0.033580608665943146, 0.048076845705509186, 0.06257308274507523, 0.07706931233406067, 0.09156554937362671, 0.10606178641319275, 0.12055802345275879, 0.13505426049232483, 0.14955049753189087, 0.1640467345714569, 0.17854297161102295, 0.1930391937494278, 0.20753543078899384, 0.22203166782855988, 0.23652790486812592, 0.25102412700653076, 0.2655203640460968, 0.28001660108566284, 0.2945128381252289, 0.3090090751647949, 0.32350531220436096, 0.338001549243927]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 6.0, 15.0, 16.0, 16.0, 16.0, 20.0, 19.0, 32.0, 42.0, 33.0, 26.0, 33.0, 43.0, 37.0, 45.0, 32.0, 43.0, 41.0, 48.0, 29.0, 44.0, 37.0, 33.0, 28.0, 25.0, 31.0, 22.0, 34.0, 34.0, 14.0, 10.0, 14.0, 12.0, 15.0, 14.0, 3.0, 5.0, 5.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09329289197921753, -0.09056613594293594, -0.08783937245607376, -0.08511261641979218, -0.08238585293292999, -0.07965909689664841, -0.07693234086036682, -0.07420557737350464, -0.07147882133722305, -0.06875206530094147, -0.06602530181407928, -0.0632985457777977, -0.060571786016225815, -0.05784502625465393, -0.055118270218372345, -0.05239151045680046, -0.04966475069522858, -0.04693799093365669, -0.04421123117208481, -0.04148447513580322, -0.03875771537423134, -0.036030955612659454, -0.03330419957637787, -0.030577439814805984, -0.0278506800532341, -0.025123920291662216, -0.02239716239273548, -0.019670404493808746, -0.016943644732236862, -0.014216885901987553, -0.011490127071738243, -0.008763369172811508, -0.006036609411239624, -0.0033098505809903145, -0.0005830917507410049, 0.0021436670795083046, 0.004870425909757614, 0.007597184740006924, 0.010323943570256233, 0.013050701469182968, 0.015777461230754852, 0.018504220992326736, 0.02123097889125347, 0.023957736790180206, 0.02668449655175209, 0.029411256313323975, 0.03213801234960556, 0.034864772111177444, 0.03759153187274933, 0.04031829163432121, 0.0430450513958931, 0.04577180743217468, 0.04849856719374657, 0.05122532695531845, 0.05395208299160004, 0.05667884275317192, 0.059405602514743805, 0.06213236227631569, 0.06485912203788757, 0.06758587807416916, 0.07031263411045074, 0.07303939759731293, 0.07576615363359451, 0.0784929096698761, 0.08121967315673828]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 10.0, 8.0, 24.0, 155.0, 2021.0, 4125488.0, 65563.0, 864.0, 105.0, 31.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26702117919921875, -0.2588958740234375, -0.25077056884765625, -0.242645263671875, -0.23451995849609375, -0.2263946533203125, -0.21826934814453125, -0.21014404296875, -0.20201873779296875, -0.1938934326171875, -0.18576812744140625, -0.177642822265625, -0.16951751708984375, -0.1613922119140625, -0.15326690673828125, -0.1451416015625, -0.13701629638671875, -0.1288909912109375, -0.12076568603515625, -0.112640380859375, -0.10451507568359375, -0.0963897705078125, -0.08826446533203125, -0.08013916015625, -0.07201385498046875, -0.0638885498046875, -0.05576324462890625, -0.047637939453125, -0.03951263427734375, -0.0313873291015625, -0.02326202392578125, -0.01513671875, -0.00701141357421875, 0.0011138916015625, 0.00923919677734375, 0.017364501953125, 0.02548980712890625, 0.0336151123046875, 0.04174041748046875, 0.04986572265625, 0.05799102783203125, 0.0661163330078125, 0.07424163818359375, 0.082366943359375, 0.09049224853515625, 0.0986175537109375, 0.10674285888671875, 0.1148681640625, 0.12299346923828125, 0.1311187744140625, 0.13924407958984375, 0.147369384765625, 0.15549468994140625, 0.1636199951171875, 0.17174530029296875, 0.17987060546875, 0.18799591064453125, 0.1961212158203125, 0.20424652099609375, 0.212371826171875, 0.22049713134765625, 0.2286224365234375, 0.23674774169921875, 0.244873046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 112.0, 231.0, 312.0, 224.0, 88.0, 15.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06519222259521484, -0.06318473815917969, -0.06117725372314453, -0.059169769287109375, -0.05716228485107422, -0.05515480041503906, -0.053147315979003906, -0.05113983154296875, -0.049132347106933594, -0.04712486267089844, -0.04511737823486328, -0.043109893798828125, -0.04110240936279297, -0.03909492492675781, -0.037087440490722656, -0.0350799560546875, -0.033072471618652344, -0.031064987182617188, -0.02905750274658203, -0.027050018310546875, -0.02504253387451172, -0.023035049438476562, -0.021027565002441406, -0.01902008056640625, -0.017012596130371094, -0.015005111694335938, -0.012997627258300781, -0.010990142822265625, -0.008982658386230469, -0.0069751739501953125, -0.004967689514160156, -0.002960205078125, -0.0009527206420898438, 0.0010547637939453125, 0.0030622482299804688, 0.005069732666015625, 0.007077217102050781, 0.009084701538085938, 0.011092185974121094, 0.01309967041015625, 0.015107154846191406, 0.017114639282226562, 0.01912212371826172, 0.021129608154296875, 0.02313709259033203, 0.025144577026367188, 0.027152061462402344, 0.0291595458984375, 0.031167030334472656, 0.03317451477050781, 0.03518199920654297, 0.037189483642578125, 0.03919696807861328, 0.04120445251464844, 0.043211936950683594, 0.04521942138671875, 0.047226905822753906, 0.04923439025878906, 0.05124187469482422, 0.053249359130859375, 0.05525684356689453, 0.05726432800292969, 0.059271812438964844, 0.061279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 16.0, 10.0, 18.0, 35.0, 59.0, 91.0, 142.0, 199.0, 382.0, 753.0, 1605.0, 4455.0, 14077.0, 58432.0, 427589.0, 3336988.0, 285386.0, 45675.0, 11502.0, 3672.0, 1436.0, 671.0, 433.0, 234.0, 139.0, 81.0, 50.0, 40.0, 30.0, 20.0, 10.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023345947265625, -0.02257847785949707, -0.02181100845336914, -0.02104353904724121, -0.02027606964111328, -0.01950860023498535, -0.018741130828857422, -0.017973661422729492, -0.017206192016601562, -0.016438722610473633, -0.015671253204345703, -0.014903783798217773, -0.014136314392089844, -0.013368844985961914, -0.012601375579833984, -0.011833906173706055, -0.011066436767578125, -0.010298967361450195, -0.009531497955322266, -0.008764028549194336, -0.007996559143066406, -0.0072290897369384766, -0.006461620330810547, -0.005694150924682617, -0.0049266815185546875, -0.004159212112426758, -0.003391742706298828, -0.0026242733001708984, -0.0018568038940429688, -0.001089334487915039, -0.0003218650817871094, 0.0004456043243408203, 0.00121307373046875, 0.0019805431365966797, 0.0027480125427246094, 0.003515481948852539, 0.004282951354980469, 0.0050504207611083984, 0.005817890167236328, 0.006585359573364258, 0.0073528289794921875, 0.008120298385620117, 0.008887767791748047, 0.009655237197875977, 0.010422706604003906, 0.011190176010131836, 0.011957645416259766, 0.012725114822387695, 0.013492584228515625, 0.014260053634643555, 0.015027523040771484, 0.015794992446899414, 0.016562461853027344, 0.017329931259155273, 0.018097400665283203, 0.018864870071411133, 0.019632339477539062, 0.020399808883666992, 0.021167278289794922, 0.02193474769592285, 0.02270221710205078, 0.02346968650817871, 0.02423715591430664, 0.02500462532043457, 0.0257720947265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 13.0, 17.0, 33.0, 57.0, 80.0, 124.0, 245.0, 565.0, 1221.0, 888.0, 373.0, 187.0, 78.0, 64.0, 36.0, 33.0, 16.0, 13.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176849365234375, -0.016833066940307617, -0.015981197357177734, -0.015129327774047852, -0.014277458190917969, -0.013425588607788086, -0.012573719024658203, -0.01172184944152832, -0.010869979858398438, -0.010018110275268555, -0.009166240692138672, -0.008314371109008789, -0.007462501525878906, -0.0066106319427490234, -0.005758762359619141, -0.004906892776489258, -0.004055023193359375, -0.003203153610229492, -0.0023512840270996094, -0.0014994144439697266, -0.0006475448608398438, 0.00020432472229003906, 0.0010561943054199219, 0.0019080638885498047, 0.0027599334716796875, 0.0036118030548095703, 0.004463672637939453, 0.005315542221069336, 0.006167411804199219, 0.0070192813873291016, 0.007871150970458984, 0.008723020553588867, 0.00957489013671875, 0.010426759719848633, 0.011278629302978516, 0.012130498886108398, 0.012982368469238281, 0.013834238052368164, 0.014686107635498047, 0.01553797721862793, 0.016389846801757812, 0.017241716384887695, 0.018093585968017578, 0.01894545555114746, 0.019797325134277344, 0.020649194717407227, 0.02150106430053711, 0.022352933883666992, 0.023204803466796875, 0.024056673049926758, 0.02490854263305664, 0.025760412216186523, 0.026612281799316406, 0.02746415138244629, 0.028316020965576172, 0.029167890548706055, 0.030019760131835938, 0.03087162971496582, 0.0317234992980957, 0.032575368881225586, 0.03342723846435547, 0.03427910804748535, 0.035130977630615234, 0.03598284721374512, 0.036834716796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 21.0, 41.0, 84.0, 139.0, 186.0, 186.0, 151.0, 90.0, 43.0, 17.0, 13.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08364906907081604, -0.07913349568843842, -0.07461792975664139, -0.07010236382484436, -0.06558679044246674, -0.06107122078537941, -0.056555651128292084, -0.05204008147120476, -0.04752451181411743, -0.043008942157030106, -0.03849337249994278, -0.033977802842855453, -0.029462233185768127, -0.0249466635286808, -0.020431093871593475, -0.01591552421450615, -0.011399954557418823, -0.006884384900331497, -0.002368815243244171, 0.002146754413843155, 0.006662324070930481, 0.011177893728017807, 0.015693463385105133, 0.02020903304219246, 0.024724602699279785, 0.02924017235636711, 0.03375574201345444, 0.03827131167054176, 0.04278688132762909, 0.047302450984716415, 0.05181802064180374, 0.05633359029889107, 0.0608491450548172, 0.06536471843719482, 0.06988028436899185, 0.07439585030078888, 0.0789114236831665, 0.08342699706554413, 0.08794256299734116, 0.09245812892913818, 0.09697370231151581, 0.10148927569389343, 0.10600484162569046, 0.11052040755748749, 0.11503598093986511, 0.11955155432224274, 0.12406712025403976, 0.1285826861858368, 0.13309825956821442, 0.13761383295059204, 0.14212939143180847, 0.1466449648141861, 0.15116053819656372, 0.15567611157894135, 0.16019168496131897, 0.1647072434425354, 0.16922281682491302, 0.17373839020729065, 0.17825394868850708, 0.1827695220708847, 0.18728509545326233, 0.19180066883563995, 0.19631624221801758, 0.200831800699234, 0.20534737408161163]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 15.0, 15.0, 16.0, 11.0, 22.0, 18.0, 19.0, 24.0, 28.0, 24.0, 26.0, 35.0, 33.0, 47.0, 58.0, 51.0, 41.0, 49.0, 46.0, 45.0, 34.0, 39.0, 37.0, 53.0, 33.0, 28.0, 27.0, 23.0, 18.0, 20.0, 13.0, 12.0, 8.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.06870871782302856, -0.06682983785867691, -0.06495095789432526, -0.063072070479393, -0.06119319051504135, -0.0593143105506897, -0.057435426861047745, -0.05555654317140579, -0.05367766320705414, -0.051798783242702484, -0.04991989955306053, -0.04804101586341858, -0.046162135899066925, -0.04428325593471527, -0.04240437224507332, -0.040525488555431366, -0.03864660859107971, -0.03676772862672806, -0.034888844937086105, -0.03300996124744415, -0.0311310812830925, -0.029252199456095695, -0.027373317629098892, -0.02549443580210209, -0.023615553975105286, -0.021736672148108482, -0.01985779032111168, -0.017978908494114876, -0.016100026667118073, -0.01422114484012127, -0.012342263013124466, -0.010463381186127663, -0.00858449935913086, -0.006705617532134056, -0.004826735705137253, -0.0029478538781404495, -0.0010689720511436462, 0.000809909775853157, 0.0026887916028499603, 0.004567673429846764, 0.006446555256843567, 0.00832543708384037, 0.010204318910837173, 0.012083200737833977, 0.01396208256483078, 0.015840964391827583, 0.017719846218824387, 0.01959872804582119, 0.021477609872817993, 0.023356491699814796, 0.0252353735268116, 0.027114255353808403, 0.028993137180805206, 0.03087201900780201, 0.03275090083479881, 0.034629784524440765, 0.03650866448879242, 0.038387544453144073, 0.040266428142786026, 0.04214531183242798, 0.04402419179677963, 0.04590307176113129, 0.04778195545077324, 0.04966083914041519, 0.051539719104766846]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 2.0, 10.0, 14.0, 13.0, 29.0, 36.0, 48.0, 71.0, 99.0, 124.0, 196.0, 288.0, 437.0, 831.0, 2239.0, 14236.0, 343520.0, 656363.0, 24412.0, 3098.0, 940.0, 470.0, 330.0, 222.0, 157.0, 97.0, 64.0, 58.0, 43.0, 28.0, 18.0, 18.0, 12.0, 7.0, 6.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07373046875, -0.07101058959960938, -0.06829071044921875, -0.06557083129882812, -0.0628509521484375, -0.060131072998046875, -0.05741119384765625, -0.054691314697265625, -0.051971435546875, -0.049251556396484375, -0.04653167724609375, -0.043811798095703125, -0.0410919189453125, -0.038372039794921875, -0.03565216064453125, -0.032932281494140625, -0.03021240234375, -0.027492523193359375, -0.02477264404296875, -0.022052764892578125, -0.0193328857421875, -0.016613006591796875, -0.01389312744140625, -0.011173248291015625, -0.008453369140625, -0.005733489990234375, -0.00301361083984375, -0.000293731689453125, 0.0024261474609375, 0.005146026611328125, 0.00786590576171875, 0.010585784912109375, 0.0133056640625, 0.016025543212890625, 0.01874542236328125, 0.021465301513671875, 0.0241851806640625, 0.026905059814453125, 0.02962493896484375, 0.032344818115234375, 0.035064697265625, 0.037784576416015625, 0.04050445556640625, 0.043224334716796875, 0.0459442138671875, 0.048664093017578125, 0.05138397216796875, 0.054103851318359375, 0.05682373046875, 0.059543609619140625, 0.06226348876953125, 0.06498336791992188, 0.0677032470703125, 0.07042312622070312, 0.07314300537109375, 0.07586288452148438, 0.078582763671875, 0.08130264282226562, 0.08402252197265625, 0.08674240112304688, 0.0894622802734375, 0.09218215942382812, 0.09490203857421875, 0.09762191772460938, 0.100341796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 73.0, 205.0, 315.0, 252.0, 119.0, 23.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06360816955566406, -0.061603546142578125, -0.05959892272949219, -0.05759429931640625, -0.05558967590332031, -0.053585052490234375, -0.05158042907714844, -0.0495758056640625, -0.04757118225097656, -0.045566558837890625, -0.04356193542480469, -0.04155731201171875, -0.03955268859863281, -0.037548065185546875, -0.03554344177246094, -0.033538818359375, -0.03153419494628906, -0.029529571533203125, -0.027524948120117188, -0.02552032470703125, -0.023515701293945312, -0.021511077880859375, -0.019506454467773438, -0.0175018310546875, -0.015497207641601562, -0.013492584228515625, -0.011487960815429688, -0.00948333740234375, -0.0074787139892578125, -0.005474090576171875, -0.0034694671630859375, -0.00146484375, 0.0005397796630859375, 0.002544403076171875, 0.0045490264892578125, 0.00655364990234375, 0.008558273315429688, 0.010562896728515625, 0.012567520141601562, 0.0145721435546875, 0.016576766967773438, 0.018581390380859375, 0.020586013793945312, 0.02259063720703125, 0.024595260620117188, 0.026599884033203125, 0.028604507446289062, 0.030609130859375, 0.03261375427246094, 0.034618377685546875, 0.03662300109863281, 0.03862762451171875, 0.04063224792480469, 0.042636871337890625, 0.04464149475097656, 0.0466461181640625, 0.04865074157714844, 0.050655364990234375, 0.05265998840332031, 0.05466461181640625, 0.05666923522949219, 0.058673858642578125, 0.06067848205566406, 0.06268310546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 15.0, 11.0, 26.0, 50.0, 87.0, 142.0, 314.0, 812.0, 2184.0, 8872.0, 56849.0, 604162.0, 334731.0, 31644.0, 5819.0, 1635.0, 628.0, 265.0, 127.0, 65.0, 27.0, 20.0, 21.0, 12.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06085205078125, -0.058814048767089844, -0.05677604675292969, -0.05473804473876953, -0.052700042724609375, -0.05066204071044922, -0.04862403869628906, -0.046586036682128906, -0.04454803466796875, -0.042510032653808594, -0.04047203063964844, -0.03843402862548828, -0.036396026611328125, -0.03435802459716797, -0.03232002258300781, -0.030282020568847656, -0.0282440185546875, -0.026206016540527344, -0.024168014526367188, -0.02213001251220703, -0.020092010498046875, -0.01805400848388672, -0.016016006469726562, -0.013978004455566406, -0.01194000244140625, -0.009902000427246094, -0.007863998413085938, -0.005825996398925781, -0.003787994384765625, -0.0017499923706054688, 0.0002880096435546875, 0.0023260116577148438, 0.004364013671875, 0.006402015686035156, 0.008440017700195312, 0.010478019714355469, 0.012516021728515625, 0.014554023742675781, 0.016592025756835938, 0.018630027770996094, 0.02066802978515625, 0.022706031799316406, 0.024744033813476562, 0.02678203582763672, 0.028820037841796875, 0.03085803985595703, 0.03289604187011719, 0.034934043884277344, 0.0369720458984375, 0.039010047912597656, 0.04104804992675781, 0.04308605194091797, 0.045124053955078125, 0.04716205596923828, 0.04920005798339844, 0.051238059997558594, 0.05327606201171875, 0.055314064025878906, 0.05735206604003906, 0.05939006805419922, 0.061428070068359375, 0.06346607208251953, 0.06550407409667969, 0.06754207611083984, 0.069580078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 3.0, 5.0, 11.0, 15.0, 23.0, 23.0, 30.0, 38.0, 22.0, 40.0, 45.0, 64.0, 56.0, 64.0, 72.0, 60.0, 53.0, 42.0, 52.0, 47.0, 43.0, 37.0, 33.0, 21.0, 23.0, 17.0, 16.0, 10.0, 7.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056560516357421875, -0.05501556396484375, -0.053470611572265625, -0.0519256591796875, -0.050380706787109375, -0.04883575439453125, -0.047290802001953125, -0.045745849609375, -0.044200897216796875, -0.04265594482421875, -0.041110992431640625, -0.0395660400390625, -0.038021087646484375, -0.03647613525390625, -0.034931182861328125, -0.03338623046875, -0.031841278076171875, -0.03029632568359375, -0.028751373291015625, -0.0272064208984375, -0.025661468505859375, -0.02411651611328125, -0.022571563720703125, -0.021026611328125, -0.019481658935546875, -0.01793670654296875, -0.016391754150390625, -0.0148468017578125, -0.013301849365234375, -0.01175689697265625, -0.010211944580078125, -0.0086669921875, -0.007122039794921875, -0.00557708740234375, -0.004032135009765625, -0.0024871826171875, -0.000942230224609375, 0.00060272216796875, 0.002147674560546875, 0.003692626953125, 0.005237579345703125, 0.00678253173828125, 0.008327484130859375, 0.0098724365234375, 0.011417388916015625, 0.01296234130859375, 0.014507293701171875, 0.01605224609375, 0.017597198486328125, 0.01914215087890625, 0.020687103271484375, 0.0222320556640625, 0.023777008056640625, 0.02532196044921875, 0.026866912841796875, 0.028411865234375, 0.029956817626953125, 0.03150177001953125, 0.033046722412109375, 0.0345916748046875, 0.036136627197265625, 0.03768157958984375, 0.039226531982421875, 0.040771484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 13.0, 22.0, 52.0, 75.0, 121.0, 169.0, 305.0, 529.0, 848.0, 1532.0, 2950.0, 6221.0, 15693.0, 54707.0, 352222.0, 505340.0, 73350.0, 19354.0, 7335.0, 3462.0, 1776.0, 1017.0, 551.0, 348.0, 217.0, 126.0, 67.0, 48.0, 29.0, 15.0, 12.0, 16.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023673295974731445, -0.02288675308227539, -0.022100210189819336, -0.02131366729736328, -0.020527124404907227, -0.019740581512451172, -0.018954038619995117, -0.018167495727539062, -0.017380952835083008, -0.016594409942626953, -0.0158078670501709, -0.015021324157714844, -0.014234781265258789, -0.013448238372802734, -0.01266169548034668, -0.011875152587890625, -0.01108860969543457, -0.010302066802978516, -0.009515523910522461, -0.008728981018066406, -0.007942438125610352, -0.007155895233154297, -0.006369352340698242, -0.0055828094482421875, -0.004796266555786133, -0.004009723663330078, -0.0032231807708740234, -0.0024366378784179688, -0.001650094985961914, -0.0008635520935058594, -7.700920104980469e-05, 0.00070953369140625, 0.0014960765838623047, 0.0022826194763183594, 0.003069162368774414, 0.0038557052612304688, 0.0046422481536865234, 0.005428791046142578, 0.006215333938598633, 0.0070018768310546875, 0.007788419723510742, 0.008574962615966797, 0.009361505508422852, 0.010148048400878906, 0.010934591293334961, 0.011721134185791016, 0.01250767707824707, 0.013294219970703125, 0.01408076286315918, 0.014867305755615234, 0.01565384864807129, 0.016440391540527344, 0.0172269344329834, 0.018013477325439453, 0.018800020217895508, 0.019586563110351562, 0.020373106002807617, 0.021159648895263672, 0.021946191787719727, 0.02273273468017578, 0.023519277572631836, 0.02430582046508789, 0.025092363357543945, 0.02587890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 12.0, 6.0, 10.0, 16.0, 15.0, 10.0, 18.0, 32.0, 45.0, 49.0, 61.0, 70.0, 92.0, 89.0, 90.0, 63.0, 67.0, 54.0, 36.0, 40.0, 39.0, 18.0, 10.0, 16.0, 9.0, 7.0, 7.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.014108657836914e-05, -5.79003244638443e-05, -5.565956234931946e-05, -5.341880023479462e-05, -5.1178038120269775e-05, -4.8937276005744934e-05, -4.669651389122009e-05, -4.445575177669525e-05, -4.221498966217041e-05, -3.997422754764557e-05, -3.773346543312073e-05, -3.5492703318595886e-05, -3.3251941204071045e-05, -3.1011179089546204e-05, -2.8770416975021362e-05, -2.652965486049652e-05, -2.428889274597168e-05, -2.204813063144684e-05, -1.9807368516921997e-05, -1.7566606402397156e-05, -1.5325844287872314e-05, -1.3085082173347473e-05, -1.0844320058822632e-05, -8.60355794429779e-06, -6.362795829772949e-06, -4.122033715248108e-06, -1.8812716007232666e-06, 3.594905138015747e-07, 2.600252628326416e-06, 4.841014742851257e-06, 7.081776857376099e-06, 9.32253897190094e-06, 1.1563301086425781e-05, 1.3804063200950623e-05, 1.6044825315475464e-05, 1.8285587430000305e-05, 2.0526349544525146e-05, 2.2767111659049988e-05, 2.500787377357483e-05, 2.724863588809967e-05, 2.9489398002624512e-05, 3.173016011714935e-05, 3.3970922231674194e-05, 3.6211684346199036e-05, 3.845244646072388e-05, 4.069320857524872e-05, 4.293397068977356e-05, 4.51747328042984e-05, 4.741549491882324e-05, 4.9656257033348083e-05, 5.1897019147872925e-05, 5.4137781262397766e-05, 5.637854337692261e-05, 5.861930549144745e-05, 6.086006760597229e-05, 6.310082972049713e-05, 6.534159183502197e-05, 6.758235394954681e-05, 6.982311606407166e-05, 7.20638781785965e-05, 7.430464029312134e-05, 7.654540240764618e-05, 7.878616452217102e-05, 8.102692663669586e-05, 8.32676887512207e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 11.0, 8.0, 14.0, 12.0, 16.0, 31.0, 41.0, 58.0, 96.0, 181.0, 299.0, 491.0, 1025.0, 2258.0, 4911.0, 12290.0, 34506.0, 119699.0, 532422.0, 247637.0, 59665.0, 19322.0, 7224.0, 3189.0, 1458.0, 714.0, 380.0, 229.0, 128.0, 77.0, 57.0, 30.0, 22.0, 16.0, 11.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.02006840705871582, -0.01941537857055664, -0.01876235008239746, -0.01810932159423828, -0.0174562931060791, -0.016803264617919922, -0.016150236129760742, -0.015497207641601562, -0.014844179153442383, -0.014191150665283203, -0.013538122177124023, -0.012885093688964844, -0.012232065200805664, -0.011579036712646484, -0.010926008224487305, -0.010272979736328125, -0.009619951248168945, -0.008966922760009766, -0.008313894271850586, -0.007660865783691406, -0.0070078372955322266, -0.006354808807373047, -0.005701780319213867, -0.0050487518310546875, -0.004395723342895508, -0.003742694854736328, -0.0030896663665771484, -0.0024366378784179688, -0.001783609390258789, -0.0011305809020996094, -0.0004775524139404297, 0.00017547607421875, 0.0008285045623779297, 0.0014815330505371094, 0.002134561538696289, 0.0027875900268554688, 0.0034406185150146484, 0.004093647003173828, 0.004746675491333008, 0.0053997039794921875, 0.006052732467651367, 0.006705760955810547, 0.0073587894439697266, 0.008011817932128906, 0.008664846420288086, 0.009317874908447266, 0.009970903396606445, 0.010623931884765625, 0.011276960372924805, 0.011929988861083984, 0.012583017349243164, 0.013236045837402344, 0.013889074325561523, 0.014542102813720703, 0.015195131301879883, 0.015848159790039062, 0.016501188278198242, 0.017154216766357422, 0.0178072452545166, 0.01846027374267578, 0.01911330223083496, 0.01976633071899414, 0.02041935920715332, 0.0210723876953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 12.0, 14.0, 15.0, 33.0, 34.0, 36.0, 55.0, 83.0, 103.0, 117.0, 91.0, 79.0, 74.0, 41.0, 40.0, 34.0, 20.0, 28.0, 11.0, 9.0, 9.0, 5.0, 7.0, 4.0, 7.0, 3.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.014934778213500977, -0.014244556427001953, -0.01355433464050293, -0.012864112854003906, -0.012173891067504883, -0.01148366928100586, -0.010793447494506836, -0.010103225708007812, -0.009413003921508789, -0.008722782135009766, -0.008032560348510742, -0.007342338562011719, -0.006652116775512695, -0.005961894989013672, -0.0052716732025146484, -0.004581451416015625, -0.0038912296295166016, -0.003201007843017578, -0.0025107860565185547, -0.0018205642700195312, -0.0011303424835205078, -0.0004401206970214844, 0.00025010108947753906, 0.0009403228759765625, 0.001630544662475586, 0.0023207664489746094, 0.003010988235473633, 0.0037012100219726562, 0.00439143180847168, 0.005081653594970703, 0.0057718753814697266, 0.00646209716796875, 0.0071523189544677734, 0.007842540740966797, 0.00853276252746582, 0.009222984313964844, 0.009913206100463867, 0.01060342788696289, 0.011293649673461914, 0.011983871459960938, 0.012674093246459961, 0.013364315032958984, 0.014054536819458008, 0.014744758605957031, 0.015434980392456055, 0.016125202178955078, 0.0168154239654541, 0.017505645751953125, 0.01819586753845215, 0.018886089324951172, 0.019576311111450195, 0.02026653289794922, 0.020956754684448242, 0.021646976470947266, 0.02233719825744629, 0.023027420043945312, 0.023717641830444336, 0.02440786361694336, 0.025098085403442383, 0.025788307189941406, 0.02647852897644043, 0.027168750762939453, 0.027858972549438477, 0.0285491943359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 21.0, 47.0, 151.0, 278.0, 275.0, 145.0, 54.0, 17.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6444089412689209, -0.6295187473297119, -0.6146285533905029, -0.599738359451294, -0.584848165512085, -0.569957971572876, -0.555067777633667, -0.540177583694458, -0.5252873301506042, -0.5103971362113953, -0.4955069422721863, -0.4806167483329773, -0.4657265245914459, -0.45083633065223694, -0.43594613671302795, -0.42105594277381897, -0.4061657786369324, -0.3912755846977234, -0.3763853907585144, -0.3614951968193054, -0.34660497307777405, -0.33171477913856506, -0.3168245851993561, -0.3019343912601471, -0.2870441675186157, -0.27215397357940674, -0.25726377964019775, -0.24237357079982758, -0.2274833768606186, -0.2125931680202484, -0.19770297408103943, -0.18281278014183044, -0.16792258620262146, -0.15303239226341248, -0.1381421834230423, -0.12325198948383331, -0.10836179554462433, -0.09347159415483475, -0.07858139276504517, -0.06369119882583618, -0.0488009974360466, -0.03391079977154732, -0.019020600244402885, -0.004130400717258453, 0.01075979694724083, 0.025649994611740112, 0.040540196001529694, 0.05543038994073868, 0.07032059133052826, 0.08521079272031784, 0.10010098665952682, 0.1149911880493164, 0.1298813819885254, 0.14477157592773438, 0.15966178476810455, 0.17455197870731354, 0.18944218754768372, 0.2043323814868927, 0.21922259032726288, 0.23411278426647186, 0.24900297820568085, 0.263893187046051, 0.27878338098526, 0.293673574924469, 0.308563768863678]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 10.0, 10.0, 16.0, 14.0, 25.0, 21.0, 25.0, 33.0, 33.0, 50.0, 37.0, 45.0, 51.0, 62.0, 51.0, 43.0, 49.0, 56.0, 67.0, 42.0, 49.0, 38.0, 42.0, 25.0, 19.0, 24.0, 21.0, 19.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2123175859451294, -0.20689621567726135, -0.2014748454093933, -0.19605349004268646, -0.19063211977481842, -0.18521074950695038, -0.17978939414024353, -0.1743680238723755, -0.16894665360450745, -0.1635252833366394, -0.15810391306877136, -0.15268255770206451, -0.14726118743419647, -0.14183981716632843, -0.13641846179962158, -0.13099709153175354, -0.1255757212638855, -0.12015435099601746, -0.11473298817873001, -0.10931162536144257, -0.10389025509357452, -0.09846888482570648, -0.09304752200841904, -0.08762615919113159, -0.08220478892326355, -0.07678341865539551, -0.07136205583810806, -0.06594069302082062, -0.060519322752952576, -0.05509795621037483, -0.04967658966779709, -0.044255223125219345, -0.0388338565826416, -0.03341249004006386, -0.027991123497486115, -0.02256975695490837, -0.017148390412330627, -0.011727023869752884, -0.00630565732717514, -0.0008842907845973969, 0.004537075757980347, 0.00995844230055809, 0.015379808843135834, 0.020801175385713577, 0.02622254192829132, 0.031643908470869064, 0.03706527501344681, 0.04248664155602455, 0.047908008098602295, 0.05332937464118004, 0.05875074118375778, 0.06417210400104523, 0.06959347426891327, 0.07501484453678131, 0.08043620735406876, 0.0858575701713562, 0.09127894043922424, 0.09670031070709229, 0.10212167352437973, 0.10754303634166718, 0.11296440660953522, 0.11838577687740326, 0.1238071396946907, 0.12922850251197815, 0.1346498727798462]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 7.0, 16.0, 32.0, 162.0, 1028.0, 5436.0, 82677.0, 4078399.0, 23119.0, 2445.0, 719.0, 119.0, 47.0, 30.0, 14.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11102294921875, -0.10769462585449219, -0.10436630249023438, -0.10103797912597656, -0.09770965576171875, -0.09438133239746094, -0.09105300903320312, -0.08772468566894531, -0.0843963623046875, -0.08106803894042969, -0.07773971557617188, -0.07441139221191406, -0.07108306884765625, -0.06775474548339844, -0.06442642211914062, -0.06109809875488281, -0.057769775390625, -0.05444145202636719, -0.051113128662109375, -0.04778480529785156, -0.04445648193359375, -0.04112815856933594, -0.037799835205078125, -0.03447151184082031, -0.0311431884765625, -0.027814865112304688, -0.024486541748046875, -0.021158218383789062, -0.01782989501953125, -0.014501571655273438, -0.011173248291015625, -0.007844924926757812, -0.0045166015625, -0.0011882781982421875, 0.002140045166015625, 0.0054683685302734375, 0.00879669189453125, 0.012125015258789062, 0.015453338623046875, 0.018781661987304688, 0.0221099853515625, 0.025438308715820312, 0.028766632080078125, 0.03209495544433594, 0.03542327880859375, 0.03875160217285156, 0.042079925537109375, 0.04540824890136719, 0.048736572265625, 0.05206489562988281, 0.055393218994140625, 0.05872154235839844, 0.06204986572265625, 0.06537818908691406, 0.06870651245117188, 0.07203483581542969, 0.0753631591796875, 0.07869148254394531, 0.08201980590820312, 0.08534812927246094, 0.08867645263671875, 0.09200477600097656, 0.09533309936523438, 0.09866142272949219, 0.10198974609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 13.0, 62.0, 172.0, 269.0, 272.0, 149.0, 54.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.0664663314819336, -0.06445121765136719, -0.06243610382080078, -0.060420989990234375, -0.05840587615966797, -0.05639076232910156, -0.054375648498535156, -0.05236053466796875, -0.050345420837402344, -0.04833030700683594, -0.04631519317626953, -0.044300079345703125, -0.04228496551513672, -0.04026985168457031, -0.038254737854003906, -0.0362396240234375, -0.034224510192871094, -0.03220939636230469, -0.03019428253173828, -0.028179168701171875, -0.02616405487060547, -0.024148941040039062, -0.022133827209472656, -0.02011871337890625, -0.018103599548339844, -0.016088485717773438, -0.014073371887207031, -0.012058258056640625, -0.010043144226074219, -0.008028030395507812, -0.006012916564941406, -0.003997802734375, -0.0019826889038085938, 3.24249267578125e-05, 0.0020475387573242188, 0.004062652587890625, 0.006077766418457031, 0.008092880249023438, 0.010107994079589844, 0.01212310791015625, 0.014138221740722656, 0.016153335571289062, 0.01816844940185547, 0.020183563232421875, 0.02219867706298828, 0.024213790893554688, 0.026228904724121094, 0.0282440185546875, 0.030259132385253906, 0.03227424621582031, 0.03428936004638672, 0.036304473876953125, 0.03831958770751953, 0.04033470153808594, 0.042349815368652344, 0.04436492919921875, 0.046380043029785156, 0.04839515686035156, 0.05041027069091797, 0.052425384521484375, 0.05444049835205078, 0.05645561218261719, 0.058470726013183594, 0.06048583984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 19.0, 35.0, 45.0, 73.0, 117.0, 292.0, 733.0, 2148.0, 9092.0, 72680.0, 3216072.0, 847756.0, 36649.0, 5876.0, 1546.0, 578.0, 245.0, 125.0, 65.0, 40.0, 25.0, 16.0, 11.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040802001953125, -0.03909158706665039, -0.03738117218017578, -0.03567075729370117, -0.03396034240722656, -0.03224992752075195, -0.030539512634277344, -0.028829097747802734, -0.027118682861328125, -0.025408267974853516, -0.023697853088378906, -0.021987438201904297, -0.020277023315429688, -0.018566608428955078, -0.01685619354248047, -0.01514577865600586, -0.01343536376953125, -0.01172494888305664, -0.010014533996582031, -0.008304119110107422, -0.0065937042236328125, -0.004883289337158203, -0.0031728744506835938, -0.0014624595642089844, 0.000247955322265625, 0.0019583702087402344, 0.0036687850952148438, 0.005379199981689453, 0.0070896148681640625, 0.008800029754638672, 0.010510444641113281, 0.01222085952758789, 0.0139312744140625, 0.01564168930053711, 0.01735210418701172, 0.019062519073486328, 0.020772933959960938, 0.022483348846435547, 0.024193763732910156, 0.025904178619384766, 0.027614593505859375, 0.029325008392333984, 0.031035423278808594, 0.0327458381652832, 0.03445625305175781, 0.03616666793823242, 0.03787708282470703, 0.03958749771118164, 0.04129791259765625, 0.04300832748413086, 0.04471874237060547, 0.04642915725708008, 0.04813957214355469, 0.0498499870300293, 0.051560401916503906, 0.053270816802978516, 0.054981231689453125, 0.056691646575927734, 0.058402061462402344, 0.06011247634887695, 0.06182289123535156, 0.06353330612182617, 0.06524372100830078, 0.06695413589477539, 0.06866455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 7.0, 14.0, 16.0, 20.0, 38.0, 68.0, 109.0, 205.0, 442.0, 976.0, 1132.0, 481.0, 222.0, 133.0, 81.0, 53.0, 21.0, 20.0, 9.0, 12.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.01960277557373047, -0.018453598022460938, -0.017304420471191406, -0.016155242919921875, -0.015006065368652344, -0.013856887817382812, -0.012707710266113281, -0.01155853271484375, -0.010409355163574219, -0.009260177612304688, -0.008111000061035156, -0.006961822509765625, -0.005812644958496094, -0.0046634674072265625, -0.0035142898559570312, -0.0023651123046875, -0.0012159347534179688, -6.67572021484375e-05, 0.0010824203491210938, 0.002231597900390625, 0.0033807754516601562, 0.0045299530029296875, 0.005679130554199219, 0.00682830810546875, 0.007977485656738281, 0.009126663208007812, 0.010275840759277344, 0.011425018310546875, 0.012574195861816406, 0.013723373413085938, 0.014872550964355469, 0.016021728515625, 0.01717090606689453, 0.018320083618164062, 0.019469261169433594, 0.020618438720703125, 0.021767616271972656, 0.022916793823242188, 0.02406597137451172, 0.02521514892578125, 0.02636432647705078, 0.027513504028320312, 0.028662681579589844, 0.029811859130859375, 0.030961036682128906, 0.03211021423339844, 0.03325939178466797, 0.0344085693359375, 0.03555774688720703, 0.03670692443847656, 0.037856101989746094, 0.039005279541015625, 0.040154457092285156, 0.04130363464355469, 0.04245281219482422, 0.04360198974609375, 0.04475116729736328, 0.04590034484863281, 0.047049522399902344, 0.048198699951171875, 0.049347877502441406, 0.05049705505371094, 0.05164623260498047, 0.05279541015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 6.0, 23.0, 48.0, 102.0, 169.0, 220.0, 180.0, 108.0, 63.0, 42.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26920008659362793, -0.2613925039768219, -0.25358492136001587, -0.24577733874320984, -0.23796974122524261, -0.23016215860843658, -0.22235457599163055, -0.21454699337482452, -0.2067394107580185, -0.19893182814121246, -0.19112424552440643, -0.1833166480064392, -0.17550906538963318, -0.16770148277282715, -0.15989390015602112, -0.1520863175392151, -0.14427873492240906, -0.13647115230560303, -0.128663569688797, -0.12085597962141037, -0.11304839700460434, -0.10524080693721771, -0.09743322432041168, -0.08962564170360565, -0.08181804418563843, -0.0740104615688324, -0.06620287150144577, -0.05839528888463974, -0.05058770626783371, -0.04278011992573738, -0.03497253358364105, -0.027164950966835022, -0.01935736835002899, -0.011549783870577812, -0.003742198459804058, 0.004065386950969696, 0.011872971430420876, 0.019680555909872055, 0.027488142251968384, 0.035295724868774414, 0.04310331121087074, 0.05091089755296707, 0.0587184801697731, 0.06652607023715973, 0.07433365285396576, 0.08214123547077179, 0.08994881808757782, 0.09775640070438385, 0.10556399077177048, 0.11337157338857651, 0.12117916345596313, 0.12898674607276917, 0.1367943286895752, 0.14460191130638123, 0.15240949392318726, 0.1602170765399933, 0.1680246740579605, 0.17583225667476654, 0.18363983929157257, 0.1914474368095398, 0.19925501942634583, 0.20706260204315186, 0.21487018465995789, 0.22267776727676392, 0.23048534989356995]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 7.0, 12.0, 16.0, 10.0, 12.0, 10.0, 22.0, 22.0, 28.0, 27.0, 34.0, 32.0, 39.0, 41.0, 59.0, 38.0, 51.0, 50.0, 35.0, 36.0, 51.0, 36.0, 40.0, 37.0, 36.0, 22.0, 30.0, 25.0, 19.0, 19.0, 19.0, 16.0, 14.0, 8.0, 12.0, 2.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07784855365753174, -0.07550067454576492, -0.07315279543399811, -0.0708049088716507, -0.06845702975988388, -0.06610915064811707, -0.06376126408576965, -0.06141338497400284, -0.05906550586223602, -0.05671762675046921, -0.054369743913412094, -0.05202186107635498, -0.049673981964588165, -0.04732610285282135, -0.044978220015764236, -0.04263033717870712, -0.04028245806694031, -0.03793457895517349, -0.03558669611811638, -0.033238813281059265, -0.03089093416929245, -0.028543053194880486, -0.02619517222046852, -0.023847291246056557, -0.021499410271644592, -0.019151529297232628, -0.016803648322820663, -0.014455767348408699, -0.012107886373996735, -0.00976000539958477, -0.007412124425172806, -0.005064243450760841, -0.002716362476348877, -0.00036848150193691254, 0.001979399472475052, 0.004327280446887016, 0.006675161421298981, 0.009023042395710945, 0.01137092337012291, 0.013718804344534874, 0.01606668531894684, 0.018414566293358803, 0.020762447267770767, 0.02311032824218273, 0.025458209216594696, 0.02780609019100666, 0.030153971165418625, 0.03250185400247574, 0.034849733114242554, 0.03719761222600937, 0.03954549506306648, 0.041893377900123596, 0.04424125701189041, 0.04658913612365723, 0.04893701896071434, 0.051284901797771454, 0.05363278090953827, 0.055980660021305084, 0.0583285428583622, 0.06067642569541931, 0.06302430480718613, 0.06537218391895294, 0.06772007048130035, 0.07006794959306717, 0.07241582870483398]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 7.0, 5.0, 6.0, 12.0, 14.0, 13.0, 20.0, 19.0, 25.0, 46.0, 56.0, 63.0, 97.0, 118.0, 151.0, 255.0, 356.0, 624.0, 1271.0, 4342.0, 27039.0, 470384.0, 506842.0, 29136.0, 4422.0, 1331.0, 631.0, 331.0, 246.0, 176.0, 144.0, 95.0, 87.0, 48.0, 29.0, 26.0, 29.0, 17.0, 8.0, 8.0, 10.0, 7.0, 6.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.08741950988769531, -0.08450698852539062, -0.08159446716308594, -0.07868194580078125, -0.07576942443847656, -0.07285690307617188, -0.06994438171386719, -0.0670318603515625, -0.06411933898925781, -0.061206817626953125, -0.05829429626464844, -0.05538177490234375, -0.05246925354003906, -0.049556732177734375, -0.04664421081542969, -0.043731689453125, -0.04081916809082031, -0.037906646728515625, -0.03499412536621094, -0.03208160400390625, -0.029169082641601562, -0.026256561279296875, -0.023344039916992188, -0.0204315185546875, -0.017518997192382812, -0.014606475830078125, -0.011693954467773438, -0.00878143310546875, -0.0058689117431640625, -0.002956390380859375, -4.38690185546875e-05, 0.00286865234375, 0.0057811737060546875, 0.008693695068359375, 0.011606216430664062, 0.01451873779296875, 0.017431259155273438, 0.020343780517578125, 0.023256301879882812, 0.0261688232421875, 0.029081344604492188, 0.031993865966796875, 0.03490638732910156, 0.03781890869140625, 0.04073143005371094, 0.043643951416015625, 0.04655647277832031, 0.049468994140625, 0.05238151550292969, 0.055294036865234375, 0.05820655822753906, 0.06111907958984375, 0.06403160095214844, 0.06694412231445312, 0.06985664367675781, 0.0727691650390625, 0.07568168640136719, 0.07859420776367188, 0.08150672912597656, 0.08441925048828125, 0.08733177185058594, 0.09024429321289062, 0.09315681457519531, 0.0960693359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 36.0, 122.0, 257.0, 280.0, 199.0, 79.0, 18.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.0635833740234375, -0.061553955078125, -0.0595245361328125, -0.0574951171875, -0.0554656982421875, -0.053436279296875, -0.0514068603515625, -0.04937744140625, -0.0473480224609375, -0.045318603515625, -0.0432891845703125, -0.041259765625, -0.0392303466796875, -0.037200927734375, -0.0351715087890625, -0.03314208984375, -0.0311126708984375, -0.029083251953125, -0.0270538330078125, -0.0250244140625, -0.0229949951171875, -0.020965576171875, -0.0189361572265625, -0.01690673828125, -0.0148773193359375, -0.012847900390625, -0.0108184814453125, -0.0087890625, -0.0067596435546875, -0.004730224609375, -0.0027008056640625, -0.00067138671875, 0.0013580322265625, 0.003387451171875, 0.0054168701171875, 0.0074462890625, 0.0094757080078125, 0.011505126953125, 0.0135345458984375, 0.01556396484375, 0.0175933837890625, 0.019622802734375, 0.0216522216796875, 0.023681640625, 0.0257110595703125, 0.027740478515625, 0.0297698974609375, 0.03179931640625, 0.0338287353515625, 0.035858154296875, 0.0378875732421875, 0.0399169921875, 0.0419464111328125, 0.043975830078125, 0.0460052490234375, 0.04803466796875, 0.0500640869140625, 0.052093505859375, 0.0541229248046875, 0.05615234375, 0.0581817626953125, 0.060211181640625, 0.0622406005859375, 0.06427001953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 10.0, 11.0, 20.0, 27.0, 27.0, 36.0, 71.0, 80.0, 164.0, 258.0, 528.0, 1123.0, 2765.0, 7903.0, 29241.0, 180646.0, 660421.0, 130453.0, 23337.0, 6813.0, 2408.0, 1030.0, 509.0, 269.0, 125.0, 83.0, 50.0, 37.0, 33.0, 13.0, 21.0, 12.0, 5.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06275653839111328, -0.06069374084472656, -0.058630943298339844, -0.056568145751953125, -0.054505348205566406, -0.05244255065917969, -0.05037975311279297, -0.04831695556640625, -0.04625415802001953, -0.04419136047363281, -0.042128562927246094, -0.040065765380859375, -0.038002967834472656, -0.03594017028808594, -0.03387737274169922, -0.0318145751953125, -0.02975177764892578, -0.027688980102539062, -0.025626182556152344, -0.023563385009765625, -0.021500587463378906, -0.019437789916992188, -0.01737499237060547, -0.01531219482421875, -0.013249397277832031, -0.011186599731445312, -0.009123802185058594, -0.007061004638671875, -0.004998207092285156, -0.0029354095458984375, -0.0008726119995117188, 0.001190185546875, 0.0032529830932617188, 0.0053157806396484375, 0.007378578186035156, 0.009441375732421875, 0.011504173278808594, 0.013566970825195312, 0.01562976837158203, 0.01769256591796875, 0.01975536346435547, 0.021818161010742188, 0.023880958557128906, 0.025943756103515625, 0.028006553649902344, 0.030069351196289062, 0.03213214874267578, 0.0341949462890625, 0.03625774383544922, 0.03832054138183594, 0.040383338928222656, 0.042446136474609375, 0.044508934020996094, 0.04657173156738281, 0.04863452911376953, 0.05069732666015625, 0.05276012420654297, 0.05482292175292969, 0.056885719299316406, 0.058948516845703125, 0.061011314392089844, 0.06307411193847656, 0.06513690948486328, 0.06719970703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 8.0, 18.0, 17.0, 23.0, 23.0, 44.0, 45.0, 64.0, 56.0, 75.0, 85.0, 81.0, 74.0, 69.0, 53.0, 55.0, 36.0, 28.0, 33.0, 25.0, 22.0, 14.0, 6.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07574462890625, -0.0736093521118164, -0.07147407531738281, -0.06933879852294922, -0.06720352172851562, -0.06506824493408203, -0.06293296813964844, -0.060797691345214844, -0.05866241455078125, -0.056527137756347656, -0.05439186096191406, -0.05225658416748047, -0.050121307373046875, -0.04798603057861328, -0.04585075378417969, -0.043715476989746094, -0.0415802001953125, -0.039444923400878906, -0.03730964660644531, -0.03517436981201172, -0.033039093017578125, -0.03090381622314453, -0.028768539428710938, -0.026633262634277344, -0.02449798583984375, -0.022362709045410156, -0.020227432250976562, -0.01809215545654297, -0.015956878662109375, -0.013821601867675781, -0.011686325073242188, -0.009551048278808594, -0.007415771484375, -0.005280494689941406, -0.0031452178955078125, -0.0010099411010742188, 0.001125335693359375, 0.0032606124877929688, 0.0053958892822265625, 0.007531166076660156, 0.00966644287109375, 0.011801719665527344, 0.013936996459960938, 0.01607227325439453, 0.018207550048828125, 0.02034282684326172, 0.022478103637695312, 0.024613380432128906, 0.0267486572265625, 0.028883934020996094, 0.031019210815429688, 0.03315448760986328, 0.035289764404296875, 0.03742504119873047, 0.03956031799316406, 0.041695594787597656, 0.04383087158203125, 0.045966148376464844, 0.04810142517089844, 0.05023670196533203, 0.052371978759765625, 0.05450725555419922, 0.05664253234863281, 0.058777809143066406, 0.0609130859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 7.0, 12.0, 12.0, 11.0, 22.0, 23.0, 43.0, 47.0, 104.0, 123.0, 191.0, 307.0, 453.0, 764.0, 1214.0, 2145.0, 3689.0, 7085.0, 15204.0, 39846.0, 197014.0, 616290.0, 110158.0, 28067.0, 11822.0, 6001.0, 3150.0, 1837.0, 1046.0, 611.0, 439.0, 262.0, 157.0, 111.0, 78.0, 63.0, 41.0, 27.0, 12.0, 20.0, 11.0, 8.0, 12.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0338134765625, -0.03273487091064453, -0.03165626525878906, -0.030577659606933594, -0.029499053955078125, -0.028420448303222656, -0.027341842651367188, -0.02626323699951172, -0.02518463134765625, -0.02410602569580078, -0.023027420043945312, -0.021948814392089844, -0.020870208740234375, -0.019791603088378906, -0.018712997436523438, -0.01763439178466797, -0.0165557861328125, -0.015477180480957031, -0.014398574829101562, -0.013319969177246094, -0.012241363525390625, -0.011162757873535156, -0.010084152221679688, -0.009005546569824219, -0.00792694091796875, -0.006848335266113281, -0.0057697296142578125, -0.004691123962402344, -0.003612518310546875, -0.0025339126586914062, -0.0014553070068359375, -0.00037670135498046875, 0.000701904296875, 0.0017805099487304688, 0.0028591156005859375, 0.003937721252441406, 0.005016326904296875, 0.006094932556152344, 0.0071735382080078125, 0.008252143859863281, 0.00933074951171875, 0.010409355163574219, 0.011487960815429688, 0.012566566467285156, 0.013645172119140625, 0.014723777770996094, 0.015802383422851562, 0.01688098907470703, 0.0179595947265625, 0.01903820037841797, 0.020116806030273438, 0.021195411682128906, 0.022274017333984375, 0.023352622985839844, 0.024431228637695312, 0.02550983428955078, 0.02658843994140625, 0.02766704559326172, 0.028745651245117188, 0.029824256896972656, 0.030902862548828125, 0.031981468200683594, 0.03306007385253906, 0.03413867950439453, 0.03521728515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 10.0, 16.0, 15.0, 20.0, 27.0, 38.0, 53.0, 102.0, 133.0, 131.0, 124.0, 81.0, 59.0, 37.0, 35.0, 14.0, 17.0, 12.0, 5.0, 3.0, 2.0, 10.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0001157522201538086, -0.00011227652430534363, -0.00010880082845687866, -0.0001053251326084137, -0.00010184943675994873, -9.837374091148376e-05, -9.48980450630188e-05, -9.142234921455383e-05, -8.794665336608887e-05, -8.44709575176239e-05, -8.099526166915894e-05, -7.751956582069397e-05, -7.4043869972229e-05, -7.056817412376404e-05, -6.709247827529907e-05, -6.36167824268341e-05, -6.014108657836914e-05, -5.6665390729904175e-05, -5.318969488143921e-05, -4.971399903297424e-05, -4.623830318450928e-05, -4.276260733604431e-05, -3.9286911487579346e-05, -3.581121563911438e-05, -3.2335519790649414e-05, -2.8859823942184448e-05, -2.5384128093719482e-05, -2.1908432245254517e-05, -1.843273639678955e-05, -1.4957040548324585e-05, -1.1481344699859619e-05, -8.005648851394653e-06, -4.5299530029296875e-06, -1.0542571544647217e-06, 2.421438694000244e-06, 5.89713454246521e-06, 9.372830390930176e-06, 1.2848526239395142e-05, 1.6324222087860107e-05, 1.9799917936325073e-05, 2.327561378479004e-05, 2.6751309633255005e-05, 3.022700548171997e-05, 3.3702701330184937e-05, 3.71783971786499e-05, 4.065409302711487e-05, 4.4129788875579834e-05, 4.76054847240448e-05, 5.1081180572509766e-05, 5.455687642097473e-05, 5.80325722694397e-05, 6.150826811790466e-05, 6.498396396636963e-05, 6.84596598148346e-05, 7.193535566329956e-05, 7.541105151176453e-05, 7.888674736022949e-05, 8.236244320869446e-05, 8.583813905715942e-05, 8.931383490562439e-05, 9.278953075408936e-05, 9.626522660255432e-05, 9.974092245101929e-05, 0.00010321661829948425, 0.00010669231414794922]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 17.0, 9.0, 13.0, 19.0, 27.0, 46.0, 63.0, 110.0, 175.0, 292.0, 510.0, 896.0, 1631.0, 3054.0, 6403.0, 14139.0, 36953.0, 134264.0, 570816.0, 198034.0, 48151.0, 17447.0, 7570.0, 3589.0, 1922.0, 984.0, 558.0, 305.0, 209.0, 113.0, 63.0, 47.0, 27.0, 22.0, 14.0, 11.0, 14.0, 9.0, 3.0, 2.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.032318115234375, -0.031327247619628906, -0.030336380004882812, -0.02934551239013672, -0.028354644775390625, -0.02736377716064453, -0.026372909545898438, -0.025382041931152344, -0.02439117431640625, -0.023400306701660156, -0.022409439086914062, -0.02141857147216797, -0.020427703857421875, -0.01943683624267578, -0.018445968627929688, -0.017455101013183594, -0.0164642333984375, -0.015473365783691406, -0.014482498168945312, -0.013491630554199219, -0.012500762939453125, -0.011509895324707031, -0.010519027709960938, -0.009528160095214844, -0.00853729248046875, -0.007546424865722656, -0.0065555572509765625, -0.005564689636230469, -0.004573822021484375, -0.0035829544067382812, -0.0025920867919921875, -0.0016012191772460938, -0.0006103515625, 0.00038051605224609375, 0.0013713836669921875, 0.0023622512817382812, 0.003353118896484375, 0.004343986511230469, 0.0053348541259765625, 0.006325721740722656, 0.00731658935546875, 0.008307456970214844, 0.009298324584960938, 0.010289192199707031, 0.011280059814453125, 0.012270927429199219, 0.013261795043945312, 0.014252662658691406, 0.0152435302734375, 0.016234397888183594, 0.017225265502929688, 0.01821613311767578, 0.019207000732421875, 0.02019786834716797, 0.021188735961914062, 0.022179603576660156, 0.02317047119140625, 0.024161338806152344, 0.025152206420898438, 0.02614307403564453, 0.027133941650390625, 0.02812480926513672, 0.029115676879882812, 0.030106544494628906, 0.031097412109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 9.0, 11.0, 13.0, 27.0, 28.0, 62.0, 85.0, 124.0, 141.0, 144.0, 105.0, 71.0, 50.0, 31.0, 19.0, 16.0, 12.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265655517578125, -0.02535223960876465, -0.024138927459716797, -0.022925615310668945, -0.021712303161621094, -0.020498991012573242, -0.01928567886352539, -0.01807236671447754, -0.016859054565429688, -0.015645742416381836, -0.014432430267333984, -0.013219118118286133, -0.012005805969238281, -0.01079249382019043, -0.009579181671142578, -0.008365869522094727, -0.007152557373046875, -0.0059392452239990234, -0.004725933074951172, -0.0035126209259033203, -0.0022993087768554688, -0.0010859966278076172, 0.00012731552124023438, 0.001340627670288086, 0.0025539398193359375, 0.003767251968383789, 0.004980564117431641, 0.006193876266479492, 0.007407188415527344, 0.008620500564575195, 0.009833812713623047, 0.011047124862670898, 0.01226043701171875, 0.013473749160766602, 0.014687061309814453, 0.015900373458862305, 0.017113685607910156, 0.018326997756958008, 0.01954030990600586, 0.02075362205505371, 0.021966934204101562, 0.023180246353149414, 0.024393558502197266, 0.025606870651245117, 0.02682018280029297, 0.02803349494934082, 0.029246807098388672, 0.030460119247436523, 0.031673431396484375, 0.03288674354553223, 0.03410005569458008, 0.03531336784362793, 0.03652667999267578, 0.03773999214172363, 0.038953304290771484, 0.040166616439819336, 0.04137992858886719, 0.04259324073791504, 0.04380655288696289, 0.04501986503601074, 0.046233177185058594, 0.047446489334106445, 0.0486598014831543, 0.04987311363220215, 0.05108642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 57.0, 165.0, 240.0, 243.0, 140.0, 54.0, 22.0, 14.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6857501864433289, -0.6677188873291016, -0.6496875286102295, -0.6316562294960022, -0.6136248707771301, -0.5955935716629028, -0.5775622129440308, -0.5595309138298035, -0.5414996147155762, -0.5234683156013489, -0.5054369568824768, -0.4874056279659271, -0.46937429904937744, -0.45134299993515015, -0.43331167101860046, -0.4152803421020508, -0.3972489833831787, -0.37921765446662903, -0.36118632555007935, -0.34315499663352966, -0.32512366771698, -0.3070923686027527, -0.289061039686203, -0.2710297107696533, -0.25299838185310364, -0.23496705293655396, -0.21693572402000427, -0.19890441000461578, -0.1808730810880661, -0.16284175217151642, -0.14481043815612793, -0.12677910923957825, -0.10874775052070618, -0.0907164216041565, -0.07268510013818741, -0.054653774946928024, -0.03662244975566864, -0.018591120839118958, -0.0005597993731498718, 0.017471522092819214, 0.035502851009368896, 0.05353417620062828, 0.07156550139188766, 0.08959682285785675, 0.10762815177440643, 0.12565948069095612, 0.1436907947063446, 0.1617221236228943, 0.17975345253944397, 0.19778478145599365, 0.21581611037254333, 0.23384742438793182, 0.2518787384033203, 0.2699100971221924, 0.2879413962364197, 0.30597272515296936, 0.32400405406951904, 0.3420353829860687, 0.3600667119026184, 0.3780980408191681, 0.3961293697357178, 0.41416066884994507, 0.43219199776649475, 0.45022332668304443, 0.4682546555995941]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 10.0, 10.0, 8.0, 19.0, 16.0, 32.0, 38.0, 38.0, 35.0, 44.0, 42.0, 45.0, 49.0, 59.0, 44.0, 41.0, 47.0, 54.0, 47.0, 50.0, 40.0, 31.0, 27.0, 35.0, 24.0, 30.0, 15.0, 14.0, 21.0, 7.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2079530954360962, -0.2026481330394745, -0.19734317064285278, -0.19203820824623108, -0.18673324584960938, -0.18142828345298767, -0.17612332105636597, -0.17081835865974426, -0.16551339626312256, -0.16020843386650085, -0.15490347146987915, -0.14959850907325745, -0.14429354667663574, -0.13898858428001404, -0.13368362188339233, -0.12837865948677063, -0.12307369709014893, -0.11776873469352722, -0.11246377229690552, -0.10715880990028381, -0.10185384750366211, -0.0965488851070404, -0.0912439227104187, -0.085938960313797, -0.08063399791717529, -0.07532903552055359, -0.07002407312393188, -0.06471911072731018, -0.05941414833068848, -0.05410918593406677, -0.04880422353744507, -0.043499261140823364, -0.03819429874420166, -0.032889336347579956, -0.027584373950958252, -0.022279411554336548, -0.016974449157714844, -0.01166948676109314, -0.0063645243644714355, -0.0010595619678497314, 0.004245400428771973, 0.009550362825393677, 0.01485532522201538, 0.020160287618637085, 0.02546525001525879, 0.030770212411880493, 0.0360751748085022, 0.0413801372051239, 0.046685099601745605, 0.05199006199836731, 0.057295024394989014, 0.06259998679161072, 0.06790494918823242, 0.07320991158485413, 0.07851487398147583, 0.08381983637809753, 0.08912479877471924, 0.09442976117134094, 0.09973472356796265, 0.10503968596458435, 0.11034464836120605, 0.11564961075782776, 0.12095457315444946, 0.12625953555107117, 0.13156449794769287]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 12.0, 29.0, 56.0, 281.0, 6266.0, 3995236.0, 190022.0, 2030.0, 217.0, 60.0, 28.0, 15.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21142578125, -0.2049884796142578, -0.19855117797851562, -0.19211387634277344, -0.18567657470703125, -0.17923927307128906, -0.17280197143554688, -0.1663646697998047, -0.1599273681640625, -0.1534900665283203, -0.14705276489257812, -0.14061546325683594, -0.13417816162109375, -0.12774085998535156, -0.12130355834960938, -0.11486625671386719, -0.108428955078125, -0.10199165344238281, -0.09555435180664062, -0.08911705017089844, -0.08267974853515625, -0.07624244689941406, -0.06980514526367188, -0.06336784362792969, -0.0569305419921875, -0.05049324035644531, -0.044055938720703125, -0.03761863708496094, -0.03118133544921875, -0.024744033813476562, -0.018306732177734375, -0.011869430541992188, -0.00543212890625, 0.0010051727294921875, 0.007442474365234375, 0.013879776000976562, 0.02031707763671875, 0.026754379272460938, 0.033191680908203125, 0.03962898254394531, 0.0460662841796875, 0.05250358581542969, 0.058940887451171875, 0.06537818908691406, 0.07181549072265625, 0.07825279235839844, 0.08469009399414062, 0.09112739562988281, 0.097564697265625, 0.10400199890136719, 0.11043930053710938, 0.11687660217285156, 0.12331390380859375, 0.12975120544433594, 0.13618850708007812, 0.1426258087158203, 0.1490631103515625, 0.1555004119873047, 0.16193771362304688, 0.16837501525878906, 0.17481231689453125, 0.18124961853027344, 0.18768692016601562, 0.1941242218017578, 0.2005615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 28.0, 78.0, 145.0, 263.0, 222.0, 169.0, 69.0, 17.0, 12.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.06232309341430664, -0.06037616729736328, -0.05842924118041992, -0.05648231506347656, -0.0545353889465332, -0.052588462829589844, -0.050641536712646484, -0.048694610595703125, -0.046747684478759766, -0.044800758361816406, -0.04285383224487305, -0.04090690612792969, -0.03895998001098633, -0.03701305389404297, -0.03506612777709961, -0.03311920166015625, -0.03117227554321289, -0.02922534942626953, -0.027278423309326172, -0.025331497192382812, -0.023384571075439453, -0.021437644958496094, -0.019490718841552734, -0.017543792724609375, -0.015596866607666016, -0.013649940490722656, -0.011703014373779297, -0.009756088256835938, -0.007809162139892578, -0.005862236022949219, -0.003915309906005859, -0.0019683837890625, -2.1457672119140625e-05, 0.0019254684448242188, 0.003872394561767578, 0.0058193206787109375, 0.007766246795654297, 0.009713172912597656, 0.011660099029541016, 0.013607025146484375, 0.015553951263427734, 0.017500877380371094, 0.019447803497314453, 0.021394729614257812, 0.023341655731201172, 0.02528858184814453, 0.02723550796508789, 0.02918243408203125, 0.03112936019897461, 0.03307628631591797, 0.03502321243286133, 0.03697013854980469, 0.03891706466674805, 0.040863990783691406, 0.042810916900634766, 0.044757843017578125, 0.046704769134521484, 0.048651695251464844, 0.0505986213684082, 0.05254554748535156, 0.05449247360229492, 0.05643939971923828, 0.05838632583618164, 0.060333251953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 6.0, 6.0, 3.0, 11.0, 22.0, 32.0, 47.0, 58.0, 115.0, 207.0, 402.0, 723.0, 1529.0, 3472.0, 8619.0, 25737.0, 110515.0, 1891349.0, 1996565.0, 113306.0, 25977.0, 8797.0, 3489.0, 1542.0, 828.0, 375.0, 214.0, 127.0, 76.0, 45.0, 26.0, 22.0, 14.0, 13.0, 11.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0555419921875, -0.05399942398071289, -0.05245685577392578, -0.05091428756713867, -0.04937171936035156, -0.04782915115356445, -0.046286582946777344, -0.044744014739990234, -0.043201446533203125, -0.041658878326416016, -0.040116310119628906, -0.0385737419128418, -0.03703117370605469, -0.03548860549926758, -0.03394603729248047, -0.03240346908569336, -0.03086090087890625, -0.02931833267211914, -0.02777576446533203, -0.026233196258544922, -0.024690628051757812, -0.023148059844970703, -0.021605491638183594, -0.020062923431396484, -0.018520355224609375, -0.016977787017822266, -0.015435218811035156, -0.013892650604248047, -0.012350082397460938, -0.010807514190673828, -0.009264945983886719, -0.007722377777099609, -0.0061798095703125, -0.004637241363525391, -0.0030946731567382812, -0.0015521049499511719, -9.5367431640625e-06, 0.0015330314636230469, 0.0030755996704101562, 0.004618167877197266, 0.006160736083984375, 0.007703304290771484, 0.009245872497558594, 0.010788440704345703, 0.012331008911132812, 0.013873577117919922, 0.015416145324707031, 0.01695871353149414, 0.01850128173828125, 0.02004384994506836, 0.02158641815185547, 0.023128986358642578, 0.024671554565429688, 0.026214122772216797, 0.027756690979003906, 0.029299259185791016, 0.030841827392578125, 0.032384395599365234, 0.033926963806152344, 0.03546953201293945, 0.03701210021972656, 0.03855466842651367, 0.04009723663330078, 0.04163980484008789, 0.043182373046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 22.0, 28.0, 42.0, 59.0, 104.0, 143.0, 237.0, 475.0, 1034.0, 944.0, 353.0, 204.0, 113.0, 80.0, 42.0, 38.0, 32.0, 18.0, 19.0, 12.0, 9.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03314208984375, -0.03186225891113281, -0.030582427978515625, -0.029302597045898438, -0.02802276611328125, -0.026742935180664062, -0.025463104248046875, -0.024183273315429688, -0.0229034423828125, -0.021623611450195312, -0.020343780517578125, -0.019063949584960938, -0.01778411865234375, -0.016504287719726562, -0.015224456787109375, -0.013944625854492188, -0.012664794921875, -0.011384963989257812, -0.010105133056640625, -0.008825302124023438, -0.00754547119140625, -0.0062656402587890625, -0.004985809326171875, -0.0037059783935546875, -0.0024261474609375, -0.0011463165283203125, 0.000133514404296875, 0.0014133453369140625, 0.00269317626953125, 0.0039730072021484375, 0.005252838134765625, 0.0065326690673828125, 0.0078125, 0.009092330932617188, 0.010372161865234375, 0.011651992797851562, 0.01293182373046875, 0.014211654663085938, 0.015491485595703125, 0.016771316528320312, 0.0180511474609375, 0.019330978393554688, 0.020610809326171875, 0.021890640258789062, 0.02317047119140625, 0.024450302124023438, 0.025730133056640625, 0.027009963989257812, 0.028289794921875, 0.029569625854492188, 0.030849456787109375, 0.03212928771972656, 0.03340911865234375, 0.03468894958496094, 0.035968780517578125, 0.03724861145019531, 0.0385284423828125, 0.03980827331542969, 0.041088104248046875, 0.04236793518066406, 0.04364776611328125, 0.04492759704589844, 0.046207427978515625, 0.04748725891113281, 0.04876708984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 5.0, 16.0, 59.0, 122.0, 250.0, 277.0, 177.0, 59.0, 19.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40764015913009644, -0.39084571599960327, -0.3740512728691101, -0.35725682973861694, -0.3404623866081238, -0.3236679434776306, -0.30687350034713745, -0.2900790572166443, -0.2732846140861511, -0.25649017095565796, -0.2396957278251648, -0.22290128469467163, -0.20610684156417847, -0.1893123984336853, -0.17251795530319214, -0.15572351217269897, -0.1389290690422058, -0.12213462591171265, -0.10534018278121948, -0.08854573965072632, -0.07175129652023315, -0.05495685338973999, -0.038162410259246826, -0.021367967128753662, -0.004573523998260498, 0.012220919132232666, 0.02901536226272583, 0.045809805393218994, 0.06260424852371216, 0.07939869165420532, 0.09619313478469849, 0.11298757791519165, 0.1297820806503296, 0.14657652378082275, 0.16337096691131592, 0.18016541004180908, 0.19695985317230225, 0.2137542963027954, 0.23054873943328857, 0.24734318256378174, 0.2641376256942749, 0.28093206882476807, 0.29772651195526123, 0.3145209550857544, 0.33131539821624756, 0.3481098413467407, 0.3649042844772339, 0.38169872760772705, 0.3984931707382202, 0.4152876138687134, 0.43208205699920654, 0.4488765001296997, 0.46567094326019287, 0.48246538639068604, 0.4992598295211792, 0.5160542726516724, 0.5328487157821655, 0.5496431589126587, 0.5664376020431519, 0.583232045173645, 0.6000264883041382, 0.6168209314346313, 0.6336153745651245, 0.6504098176956177, 0.6672042608261108]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 11.0, 8.0, 11.0, 13.0, 15.0, 19.0, 29.0, 33.0, 38.0, 42.0, 47.0, 54.0, 56.0, 59.0, 43.0, 51.0, 51.0, 44.0, 52.0, 45.0, 54.0, 39.0, 46.0, 25.0, 25.0, 26.0, 17.0, 12.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13766473531723022, -0.13339976966381073, -0.12913478910923004, -0.12486982345581055, -0.12060485035181046, -0.11633987724781036, -0.11207491159439087, -0.10780993849039078, -0.10354496538639069, -0.0992799922823906, -0.0950150191783905, -0.09075005352497101, -0.08648508042097092, -0.08222010731697083, -0.07795514166355133, -0.07369016855955124, -0.06942519545555115, -0.06516022235155106, -0.06089525297284126, -0.05663028359413147, -0.05236531049013138, -0.04810033738613129, -0.043835368007421494, -0.0395703986287117, -0.03530542552471161, -0.031040454283356667, -0.026775483042001724, -0.022510511800646782, -0.01824554055929184, -0.013980569317936897, -0.009715598076581955, -0.005450626835227013, -0.0011856555938720703, 0.003079315647482872, 0.007344286888837814, 0.011609258130192757, 0.0158742293715477, 0.02013920061290264, 0.024404171854257584, 0.028669143095612526, 0.03293411433696747, 0.03719908744096756, 0.04146405681967735, 0.045729026198387146, 0.04999399930238724, 0.05425897240638733, 0.05852394178509712, 0.06278891116380692, 0.067053884267807, 0.0713188573718071, 0.07558383047580719, 0.07984879612922668, 0.08411376923322678, 0.08837874233722687, 0.09264370799064636, 0.09690868109464645, 0.10117365419864655, 0.10543862730264664, 0.10970360040664673, 0.11396856606006622, 0.11823353916406631, 0.1224985122680664, 0.1267634779214859, 0.1310284584760666, 0.13529342412948608]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 2.0, 8.0, 13.0, 13.0, 10.0, 14.0, 17.0, 32.0, 42.0, 64.0, 59.0, 75.0, 120.0, 176.0, 230.0, 304.0, 441.0, 729.0, 1792.0, 9417.0, 97134.0, 709832.0, 205619.0, 16990.0, 2637.0, 917.0, 524.0, 333.0, 258.0, 178.0, 122.0, 109.0, 78.0, 61.0, 39.0, 35.0, 21.0, 23.0, 21.0, 13.0, 13.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.117919921875, -0.11430740356445312, -0.11069488525390625, -0.10708236694335938, -0.1034698486328125, -0.09985733032226562, -0.09624481201171875, -0.09263229370117188, -0.089019775390625, -0.08540725708007812, -0.08179473876953125, -0.07818222045898438, -0.0745697021484375, -0.07095718383789062, -0.06734466552734375, -0.06373214721679688, -0.06011962890625, -0.056507110595703125, -0.05289459228515625, -0.049282073974609375, -0.0456695556640625, -0.042057037353515625, -0.03844451904296875, -0.034832000732421875, -0.031219482421875, -0.027606964111328125, -0.02399444580078125, -0.020381927490234375, -0.0167694091796875, -0.013156890869140625, -0.00954437255859375, -0.005931854248046875, -0.0023193359375, 0.001293182373046875, 0.00490570068359375, 0.008518218994140625, 0.0121307373046875, 0.015743255615234375, 0.01935577392578125, 0.022968292236328125, 0.026580810546875, 0.030193328857421875, 0.03380584716796875, 0.037418365478515625, 0.0410308837890625, 0.044643402099609375, 0.04825592041015625, 0.051868438720703125, 0.05548095703125, 0.059093475341796875, 0.06270599365234375, 0.06631851196289062, 0.0699310302734375, 0.07354354858398438, 0.07715606689453125, 0.08076858520507812, 0.084381103515625, 0.08799362182617188, 0.09160614013671875, 0.09521865844726562, 0.0988311767578125, 0.10244369506835938, 0.10605621337890625, 0.10966873168945312, 0.11328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 33.0, 82.0, 198.0, 251.0, 231.0, 134.0, 57.0, 7.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06656837463378906, -0.06447219848632812, -0.06237602233886719, -0.06027984619140625, -0.05818367004394531, -0.056087493896484375, -0.05399131774902344, -0.0518951416015625, -0.04979896545410156, -0.047702789306640625, -0.04560661315917969, -0.04351043701171875, -0.04141426086425781, -0.039318084716796875, -0.03722190856933594, -0.035125732421875, -0.03302955627441406, -0.030933380126953125, -0.028837203979492188, -0.02674102783203125, -0.024644851684570312, -0.022548675537109375, -0.020452499389648438, -0.0183563232421875, -0.016260147094726562, -0.014163970947265625, -0.012067794799804688, -0.00997161865234375, -0.007875442504882812, -0.005779266357421875, -0.0036830902099609375, -0.0015869140625, 0.0005092620849609375, 0.002605438232421875, 0.0047016143798828125, 0.00679779052734375, 0.008893966674804688, 0.010990142822265625, 0.013086318969726562, 0.0151824951171875, 0.017278671264648438, 0.019374847412109375, 0.021471023559570312, 0.02356719970703125, 0.025663375854492188, 0.027759552001953125, 0.029855728149414062, 0.031951904296875, 0.03404808044433594, 0.036144256591796875, 0.03824043273925781, 0.04033660888671875, 0.04243278503417969, 0.044528961181640625, 0.04662513732910156, 0.0487213134765625, 0.05081748962402344, 0.052913665771484375, 0.05500984191894531, 0.05710601806640625, 0.05920219421386719, 0.061298370361328125, 0.06339454650878906, 0.06549072265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 12.0, 12.0, 20.0, 31.0, 40.0, 61.0, 91.0, 154.0, 213.0, 401.0, 735.0, 1366.0, 2800.0, 5605.0, 13214.0, 32553.0, 90004.0, 256386.0, 379784.0, 167105.0, 58191.0, 21849.0, 9233.0, 4183.0, 2013.0, 1029.0, 570.0, 336.0, 217.0, 116.0, 70.0, 51.0, 31.0, 20.0, 11.0, 13.0, 5.0, 7.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.046234130859375, -0.0447077751159668, -0.043181419372558594, -0.04165506362915039, -0.04012870788574219, -0.038602352142333984, -0.03707599639892578, -0.03554964065551758, -0.034023284912109375, -0.03249692916870117, -0.03097057342529297, -0.029444217681884766, -0.027917861938476562, -0.02639150619506836, -0.024865150451660156, -0.023338794708251953, -0.02181243896484375, -0.020286083221435547, -0.018759727478027344, -0.01723337173461914, -0.015707015991210938, -0.014180660247802734, -0.012654304504394531, -0.011127948760986328, -0.009601593017578125, -0.008075237274169922, -0.006548881530761719, -0.005022525787353516, -0.0034961700439453125, -0.0019698143005371094, -0.00044345855712890625, 0.0010828971862792969, 0.0026092529296875, 0.004135608673095703, 0.005661964416503906, 0.007188320159912109, 0.008714675903320312, 0.010241031646728516, 0.011767387390136719, 0.013293743133544922, 0.014820098876953125, 0.016346454620361328, 0.01787281036376953, 0.019399166107177734, 0.020925521850585938, 0.02245187759399414, 0.023978233337402344, 0.025504589080810547, 0.02703094482421875, 0.028557300567626953, 0.030083656311035156, 0.03161001205444336, 0.03313636779785156, 0.034662723541259766, 0.03618907928466797, 0.03771543502807617, 0.039241790771484375, 0.04076814651489258, 0.04229450225830078, 0.043820858001708984, 0.04534721374511719, 0.04687356948852539, 0.048399925231933594, 0.0499262809753418, 0.05145263671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 5.0, 6.0, 2.0, 12.0, 15.0, 13.0, 13.0, 17.0, 30.0, 29.0, 19.0, 39.0, 43.0, 32.0, 46.0, 45.0, 45.0, 64.0, 47.0, 45.0, 44.0, 52.0, 45.0, 49.0, 41.0, 18.0, 20.0, 28.0, 21.0, 22.0, 9.0, 14.0, 12.0, 12.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.06365966796875, -0.061914920806884766, -0.06017017364501953, -0.0584254264831543, -0.05668067932128906, -0.05493593215942383, -0.053191184997558594, -0.05144643783569336, -0.049701690673828125, -0.04795694351196289, -0.046212196350097656, -0.04446744918823242, -0.04272270202636719, -0.04097795486450195, -0.03923320770263672, -0.037488460540771484, -0.03574371337890625, -0.033998966217041016, -0.03225421905517578, -0.030509471893310547, -0.028764724731445312, -0.027019977569580078, -0.025275230407714844, -0.02353048324584961, -0.021785736083984375, -0.02004098892211914, -0.018296241760253906, -0.016551494598388672, -0.014806747436523438, -0.013062000274658203, -0.011317253112792969, -0.009572505950927734, -0.0078277587890625, -0.006083011627197266, -0.004338264465332031, -0.002593517303466797, -0.0008487701416015625, 0.0008959770202636719, 0.0026407241821289062, 0.004385471343994141, 0.006130218505859375, 0.00787496566772461, 0.009619712829589844, 0.011364459991455078, 0.013109207153320312, 0.014853954315185547, 0.01659870147705078, 0.018343448638916016, 0.02008819580078125, 0.021832942962646484, 0.02357769012451172, 0.025322437286376953, 0.027067184448242188, 0.028811931610107422, 0.030556678771972656, 0.03230142593383789, 0.034046173095703125, 0.03579092025756836, 0.037535667419433594, 0.03928041458129883, 0.04102516174316406, 0.0427699089050293, 0.04451465606689453, 0.046259403228759766, 0.048004150390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 10.0, 10.0, 16.0, 38.0, 37.0, 38.0, 67.0, 127.0, 165.0, 278.0, 403.0, 660.0, 1092.0, 1791.0, 2958.0, 4959.0, 9104.0, 17958.0, 41065.0, 124373.0, 421920.0, 283575.0, 77785.0, 29042.0, 13567.0, 7134.0, 4019.0, 2372.0, 1466.0, 928.0, 564.0, 356.0, 217.0, 142.0, 116.0, 53.0, 49.0, 25.0, 18.0, 14.0, 12.0, 5.0, 10.0, 6.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0312042236328125, -0.03022313117980957, -0.02924203872680664, -0.02826094627380371, -0.02727985382080078, -0.02629876136779785, -0.025317668914794922, -0.024336576461791992, -0.023355484008789062, -0.022374391555786133, -0.021393299102783203, -0.020412206649780273, -0.019431114196777344, -0.018450021743774414, -0.017468929290771484, -0.016487836837768555, -0.015506744384765625, -0.014525651931762695, -0.013544559478759766, -0.012563467025756836, -0.011582374572753906, -0.010601282119750977, -0.009620189666748047, -0.008639097213745117, -0.0076580047607421875, -0.006676912307739258, -0.005695819854736328, -0.0047147274017333984, -0.0037336349487304688, -0.002752542495727539, -0.0017714500427246094, -0.0007903575897216797, 0.00019073486328125, 0.0011718273162841797, 0.0021529197692871094, 0.003134012222290039, 0.004115104675292969, 0.0050961971282958984, 0.006077289581298828, 0.007058382034301758, 0.008039474487304688, 0.009020566940307617, 0.010001659393310547, 0.010982751846313477, 0.011963844299316406, 0.012944936752319336, 0.013926029205322266, 0.014907121658325195, 0.015888214111328125, 0.016869306564331055, 0.017850399017333984, 0.018831491470336914, 0.019812583923339844, 0.020793676376342773, 0.021774768829345703, 0.022755861282348633, 0.023736953735351562, 0.024718046188354492, 0.025699138641357422, 0.02668023109436035, 0.02766132354736328, 0.02864241600036621, 0.02962350845336914, 0.03060460090637207, 0.031585693359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 15.0, 7.0, 10.0, 8.0, 25.0, 18.0, 30.0, 24.0, 28.0, 41.0, 64.0, 70.0, 75.0, 65.0, 69.0, 72.0, 60.0, 51.0, 38.0, 40.0, 26.0, 18.0, 21.0, 15.0, 23.0, 11.0, 9.0, 5.0, 5.0, 3.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.94044104218483e-05, -5.765445530414581e-05, -5.590450018644333e-05, -5.4154545068740845e-05, -5.240458995103836e-05, -5.0654634833335876e-05, -4.890467971563339e-05, -4.715472459793091e-05, -4.5404769480228424e-05, -4.365481436252594e-05, -4.1904859244823456e-05, -4.015490412712097e-05, -3.840494900941849e-05, -3.6654993891716003e-05, -3.490503877401352e-05, -3.3155083656311035e-05, -3.140512853860855e-05, -2.9655173420906067e-05, -2.7905218303203583e-05, -2.61552631855011e-05, -2.4405308067798615e-05, -2.265535295009613e-05, -2.0905397832393646e-05, -1.9155442714691162e-05, -1.7405487596988678e-05, -1.5655532479286194e-05, -1.390557736158371e-05, -1.2155622243881226e-05, -1.0405667126178741e-05, -8.655712008476257e-06, -6.905756890773773e-06, -5.155801773071289e-06, -3.405846655368805e-06, -1.6558915376663208e-06, 9.406358003616333e-08, 1.8440186977386475e-06, 3.5939738154411316e-06, 5.343928933143616e-06, 7.0938840508461e-06, 8.843839168548584e-06, 1.0593794286251068e-05, 1.2343749403953552e-05, 1.4093704521656036e-05, 1.584365963935852e-05, 1.7593614757061005e-05, 1.934356987476349e-05, 2.1093524992465973e-05, 2.2843480110168457e-05, 2.459343522787094e-05, 2.6343390345573425e-05, 2.809334546327591e-05, 2.9843300580978394e-05, 3.159325569868088e-05, 3.334321081638336e-05, 3.5093165934085846e-05, 3.684312105178833e-05, 3.8593076169490814e-05, 4.03430312871933e-05, 4.209298640489578e-05, 4.3842941522598267e-05, 4.559289664030075e-05, 4.7342851758003235e-05, 4.909280687570572e-05, 5.08427619934082e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 4.0, 4.0, 6.0, 12.0, 15.0, 12.0, 25.0, 35.0, 61.0, 92.0, 150.0, 251.0, 477.0, 890.0, 1598.0, 3085.0, 6175.0, 14714.0, 40575.0, 139522.0, 478903.0, 255429.0, 66606.0, 21999.0, 9042.0, 4178.0, 2073.0, 1138.0, 609.0, 356.0, 220.0, 99.0, 61.0, 42.0, 30.0, 25.0, 5.0, 7.0, 8.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0380859375, -0.03698873519897461, -0.03589153289794922, -0.03479433059692383, -0.03369712829589844, -0.03259992599487305, -0.031502723693847656, -0.030405521392822266, -0.029308319091796875, -0.028211116790771484, -0.027113914489746094, -0.026016712188720703, -0.024919509887695312, -0.023822307586669922, -0.02272510528564453, -0.02162790298461914, -0.02053070068359375, -0.01943349838256836, -0.01833629608154297, -0.017239093780517578, -0.016141891479492188, -0.015044689178466797, -0.013947486877441406, -0.012850284576416016, -0.011753082275390625, -0.010655879974365234, -0.009558677673339844, -0.008461475372314453, -0.0073642730712890625, -0.006267070770263672, -0.005169868469238281, -0.004072666168212891, -0.0029754638671875, -0.0018782615661621094, -0.0007810592651367188, 0.0003161430358886719, 0.0014133453369140625, 0.002510547637939453, 0.0036077499389648438, 0.004704952239990234, 0.005802154541015625, 0.006899356842041016, 0.007996559143066406, 0.009093761444091797, 0.010190963745117188, 0.011288166046142578, 0.012385368347167969, 0.01348257064819336, 0.01457977294921875, 0.01567697525024414, 0.01677417755126953, 0.017871379852294922, 0.018968582153320312, 0.020065784454345703, 0.021162986755371094, 0.022260189056396484, 0.023357391357421875, 0.024454593658447266, 0.025551795959472656, 0.026648998260498047, 0.027746200561523438, 0.028843402862548828, 0.02994060516357422, 0.03103780746459961, 0.032135009765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 3.0, 6.0, 13.0, 10.0, 10.0, 13.0, 18.0, 38.0, 21.0, 35.0, 32.0, 55.0, 72.0, 83.0, 92.0, 113.0, 73.0, 49.0, 51.0, 32.0, 25.0, 21.0, 21.0, 12.0, 10.0, 11.0, 11.0, 13.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0289764404296875, -0.02806711196899414, -0.02715778350830078, -0.026248455047607422, -0.025339126586914062, -0.024429798126220703, -0.023520469665527344, -0.022611141204833984, -0.021701812744140625, -0.020792484283447266, -0.019883155822753906, -0.018973827362060547, -0.018064498901367188, -0.017155170440673828, -0.01624584197998047, -0.01533651351928711, -0.01442718505859375, -0.01351785659790039, -0.012608528137207031, -0.011699199676513672, -0.010789871215820312, -0.009880542755126953, -0.008971214294433594, -0.008061885833740234, -0.007152557373046875, -0.006243228912353516, -0.005333900451660156, -0.004424571990966797, -0.0035152435302734375, -0.002605915069580078, -0.0016965866088867188, -0.0007872581481933594, 0.0001220703125, 0.0010313987731933594, 0.0019407272338867188, 0.002850055694580078, 0.0037593841552734375, 0.004668712615966797, 0.005578041076660156, 0.006487369537353516, 0.007396697998046875, 0.008306026458740234, 0.009215354919433594, 0.010124683380126953, 0.011034011840820312, 0.011943340301513672, 0.012852668762207031, 0.01376199722290039, 0.01467132568359375, 0.01558065414428711, 0.01648998260498047, 0.017399311065673828, 0.018308639526367188, 0.019217967987060547, 0.020127296447753906, 0.021036624908447266, 0.021945953369140625, 0.022855281829833984, 0.023764610290527344, 0.024673938751220703, 0.025583267211914062, 0.026492595672607422, 0.02740192413330078, 0.02831125259399414, 0.0292205810546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 9.0, 17.0, 39.0, 71.0, 122.0, 157.0, 205.0, 139.0, 120.0, 60.0, 27.0, 16.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5905942916870117, -0.5747577548027039, -0.5589211583137512, -0.5430846214294434, -0.5272480249404907, -0.5114114880561829, -0.4955749213695526, -0.47973835468292236, -0.4639017879962921, -0.44806522130966187, -0.4322286546230316, -0.41639208793640137, -0.4005555510520935, -0.38471895456314087, -0.368882417678833, -0.35304585099220276, -0.3372092843055725, -0.32137271761894226, -0.305536150932312, -0.28969958424568176, -0.2738630175590515, -0.25802648067474365, -0.2421899139881134, -0.22635334730148315, -0.2105167806148529, -0.19468021392822266, -0.1788436472415924, -0.16300709545612335, -0.1471705287694931, -0.13133396208286285, -0.1154974028468132, -0.09966084361076355, -0.08382433652877808, -0.06798776984214783, -0.052151210606098175, -0.036314647644758224, -0.020478084683418274, -0.004641517996788025, 0.011195041239261627, 0.02703160047531128, 0.04286816716194153, 0.05870473012328148, 0.07454129308462143, 0.09037785232067108, 0.10621441900730133, 0.12205098569393158, 0.13788753747940063, 0.15372410416603088, 0.16956067085266113, 0.18539723753929138, 0.20123380422592163, 0.21707035601139069, 0.23290692269802094, 0.24874348938465118, 0.26458004117012024, 0.2804166078567505, 0.29625317454338074, 0.312089741230011, 0.32792630791664124, 0.3437628746032715, 0.35959941148757935, 0.375436007976532, 0.39127254486083984, 0.4071091115474701, 0.42294567823410034]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 13.0, 8.0, 16.0, 12.0, 18.0, 23.0, 26.0, 44.0, 25.0, 46.0, 52.0, 51.0, 44.0, 50.0, 56.0, 46.0, 54.0, 42.0, 40.0, 49.0, 30.0, 32.0, 41.0, 37.0, 27.0, 20.0, 20.0, 13.0, 14.0, 10.0, 8.0, 2.0, 3.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.23809468746185303, -0.23166514933109283, -0.22523559629917145, -0.21880605816841125, -0.21237650513648987, -0.20594696700572968, -0.19951742887496948, -0.1930878758430481, -0.1866583377122879, -0.1802287995815277, -0.17379924654960632, -0.16736970841884613, -0.16094017028808594, -0.15451061725616455, -0.14808107912540436, -0.14165154099464417, -0.13522198796272278, -0.12879244983196259, -0.1223628968000412, -0.115933358669281, -0.10950381308794022, -0.10307426750659943, -0.09664472937583923, -0.09021518379449844, -0.08378563821315765, -0.07735609263181686, -0.07092654705047607, -0.06449700891971588, -0.05806746333837509, -0.0516379177570343, -0.04520837590098381, -0.03877883404493332, -0.03234928846359253, -0.02591974474489689, -0.019490201026201248, -0.013060657307505608, -0.006631113588809967, -0.00020156800746917725, 0.006227973848581314, 0.012657515704631805, 0.019087061285972595, 0.025516605004668236, 0.031946148723363876, 0.03837569057941437, 0.04480523616075516, 0.05123478174209595, 0.05766432359814644, 0.06409386545419693, 0.07052341103553772, 0.07695295661687851, 0.0833825021982193, 0.08981204032897949, 0.09624158591032028, 0.10267113149166107, 0.10910066962242126, 0.11553021520376205, 0.12195976078510284, 0.12838929891586304, 0.13481885194778442, 0.14124839007854462, 0.1476779282093048, 0.1541074812412262, 0.1605370193719864, 0.16696655750274658, 0.17339611053466797]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 13.0, 38.0, 118.0, 707.0, 12676.0, 3952871.0, 223890.0, 3506.0, 266.0, 104.0, 37.0, 17.0, 7.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187744140625, -0.1820220947265625, -0.176300048828125, -0.1705780029296875, -0.16485595703125, -0.1591339111328125, -0.153411865234375, -0.1476898193359375, -0.1419677734375, -0.1362457275390625, -0.130523681640625, -0.1248016357421875, -0.11907958984375, -0.1133575439453125, -0.107635498046875, -0.1019134521484375, -0.09619140625, -0.0904693603515625, -0.084747314453125, -0.0790252685546875, -0.07330322265625, -0.0675811767578125, -0.061859130859375, -0.0561370849609375, -0.0504150390625, -0.0446929931640625, -0.038970947265625, -0.0332489013671875, -0.02752685546875, -0.0218048095703125, -0.016082763671875, -0.0103607177734375, -0.004638671875, 0.0010833740234375, 0.006805419921875, 0.0125274658203125, 0.01824951171875, 0.0239715576171875, 0.029693603515625, 0.0354156494140625, 0.0411376953125, 0.0468597412109375, 0.052581787109375, 0.0583038330078125, 0.06402587890625, 0.0697479248046875, 0.075469970703125, 0.0811920166015625, 0.0869140625, 0.0926361083984375, 0.098358154296875, 0.1040802001953125, 0.10980224609375, 0.1155242919921875, 0.121246337890625, 0.1269683837890625, 0.1326904296875, 0.1384124755859375, 0.144134521484375, 0.1498565673828125, 0.15557861328125, 0.1613006591796875, 0.167022705078125, 0.1727447509765625, 0.178466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 24.0, 62.0, 99.0, 177.0, 209.0, 174.0, 148.0, 70.0, 25.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06283092498779297, -0.06078147888183594, -0.058732032775878906, -0.056682586669921875, -0.054633140563964844, -0.05258369445800781, -0.05053424835205078, -0.04848480224609375, -0.04643535614013672, -0.04438591003417969, -0.042336463928222656, -0.040287017822265625, -0.038237571716308594, -0.03618812561035156, -0.03413867950439453, -0.0320892333984375, -0.03003978729248047, -0.027990341186523438, -0.025940895080566406, -0.023891448974609375, -0.021842002868652344, -0.019792556762695312, -0.01774311065673828, -0.01569366455078125, -0.013644218444824219, -0.011594772338867188, -0.009545326232910156, -0.007495880126953125, -0.005446434020996094, -0.0033969879150390625, -0.0013475418090820312, 0.000701904296875, 0.0027513504028320312, 0.0048007965087890625, 0.006850242614746094, 0.008899688720703125, 0.010949134826660156, 0.012998580932617188, 0.015048027038574219, 0.01709747314453125, 0.01914691925048828, 0.021196365356445312, 0.023245811462402344, 0.025295257568359375, 0.027344703674316406, 0.029394149780273438, 0.03144359588623047, 0.0334930419921875, 0.03554248809814453, 0.03759193420410156, 0.039641380310058594, 0.041690826416015625, 0.043740272521972656, 0.04578971862792969, 0.04783916473388672, 0.04988861083984375, 0.05193805694580078, 0.05398750305175781, 0.056036949157714844, 0.058086395263671875, 0.060135841369628906, 0.06218528747558594, 0.06423473358154297, 0.0662841796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 15.0, 26.0, 27.0, 67.0, 121.0, 201.0, 420.0, 941.0, 2171.0, 6124.0, 22284.0, 133848.0, 3365117.0, 592344.0, 52362.0, 11719.0, 3760.0, 1450.0, 618.0, 301.0, 162.0, 73.0, 34.0, 39.0, 18.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0916748046875, -0.08953094482421875, -0.0873870849609375, -0.08524322509765625, -0.083099365234375, -0.08095550537109375, -0.0788116455078125, -0.07666778564453125, -0.07452392578125, -0.07238006591796875, -0.0702362060546875, -0.06809234619140625, -0.065948486328125, -0.06380462646484375, -0.0616607666015625, -0.05951690673828125, -0.057373046875, -0.05522918701171875, -0.0530853271484375, -0.05094146728515625, -0.048797607421875, -0.04665374755859375, -0.0445098876953125, -0.04236602783203125, -0.04022216796875, -0.03807830810546875, -0.0359344482421875, -0.03379058837890625, -0.031646728515625, -0.02950286865234375, -0.0273590087890625, -0.02521514892578125, -0.0230712890625, -0.02092742919921875, -0.0187835693359375, -0.01663970947265625, -0.014495849609375, -0.01235198974609375, -0.0102081298828125, -0.00806427001953125, -0.00592041015625, -0.00377655029296875, -0.0016326904296875, 0.00051116943359375, 0.002655029296875, 0.00479888916015625, 0.0069427490234375, 0.00908660888671875, 0.01123046875, 0.01337432861328125, 0.0155181884765625, 0.01766204833984375, 0.019805908203125, 0.02194976806640625, 0.0240936279296875, 0.02623748779296875, 0.02838134765625, 0.03052520751953125, 0.0326690673828125, 0.03481292724609375, 0.036956787109375, 0.03910064697265625, 0.0412445068359375, 0.04338836669921875, 0.0455322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 7.0, 14.0, 19.0, 15.0, 26.0, 30.0, 41.0, 69.0, 92.0, 135.0, 168.0, 328.0, 606.0, 919.0, 618.0, 309.0, 185.0, 116.0, 83.0, 60.0, 51.0, 36.0, 31.0, 19.0, 16.0, 9.0, 16.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028594970703125, -0.02755451202392578, -0.026514053344726562, -0.025473594665527344, -0.024433135986328125, -0.023392677307128906, -0.022352218627929688, -0.02131175994873047, -0.02027130126953125, -0.01923084259033203, -0.018190383911132812, -0.017149925231933594, -0.016109466552734375, -0.015069007873535156, -0.014028549194335938, -0.012988090515136719, -0.0119476318359375, -0.010907173156738281, -0.009866714477539062, -0.008826255798339844, -0.007785797119140625, -0.006745338439941406, -0.0057048797607421875, -0.004664421081542969, -0.00362396240234375, -0.0025835037231445312, -0.0015430450439453125, -0.0005025863647460938, 0.000537872314453125, 0.0015783309936523438, 0.0026187896728515625, 0.0036592483520507812, 0.00469970703125, 0.005740165710449219, 0.0067806243896484375, 0.007821083068847656, 0.008861541748046875, 0.009902000427246094, 0.010942459106445312, 0.011982917785644531, 0.01302337646484375, 0.014063835144042969, 0.015104293823242188, 0.016144752502441406, 0.017185211181640625, 0.018225669860839844, 0.019266128540039062, 0.02030658721923828, 0.0213470458984375, 0.02238750457763672, 0.023427963256835938, 0.024468421936035156, 0.025508880615234375, 0.026549339294433594, 0.027589797973632812, 0.02863025665283203, 0.02967071533203125, 0.03071117401123047, 0.03175163269042969, 0.032792091369628906, 0.033832550048828125, 0.034873008728027344, 0.03591346740722656, 0.03695392608642578, 0.037994384765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 21.0, 54.0, 136.0, 212.0, 249.0, 179.0, 80.0, 34.0, 13.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318085253238678, -0.30235299468040466, -0.28662076592445374, -0.2708885073661804, -0.2551562786102295, -0.23942402005195618, -0.22369176149368286, -0.20795951783657074, -0.19222727417945862, -0.1764950305223465, -0.16076278686523438, -0.14503052830696106, -0.12929828464984894, -0.11356604099273682, -0.0978337898850441, -0.08210153877735138, -0.06636929512023926, -0.05063704773783684, -0.03490480035543442, -0.019172552973031998, -0.0034403055906295776, 0.012291938066482544, 0.028024189174175262, 0.04375644028186798, 0.0594886839389801, 0.07522092759609222, 0.09095317870378494, 0.10668542981147766, 0.12241767346858978, 0.1381499171257019, 0.15388217568397522, 0.16961441934108734, 0.18534666299819946, 0.20107890665531158, 0.2168111503124237, 0.23254340887069702, 0.24827565252780914, 0.26400789618492126, 0.2797401547431946, 0.2954723834991455, 0.3112046420574188, 0.32693690061569214, 0.34266912937164307, 0.3584013879299164, 0.3741336464881897, 0.3898658752441406, 0.40559813380241394, 0.42133039236068726, 0.4370626211166382, 0.4527948796749115, 0.4685271084308624, 0.48425936698913574, 0.49999159574508667, 0.5157238245010376, 0.5314561128616333, 0.5471883416175842, 0.5629205703735352, 0.5786527991294861, 0.5943850874900818, 0.6101173162460327, 0.6258495450019836, 0.6415817737579346, 0.6573140621185303, 0.6730462908744812, 0.6887785792350769]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 13.0, 15.0, 16.0, 18.0, 24.0, 20.0, 29.0, 35.0, 32.0, 38.0, 48.0, 29.0, 47.0, 47.0, 46.0, 50.0, 50.0, 46.0, 38.0, 36.0, 41.0, 32.0, 28.0, 33.0, 24.0, 32.0, 13.0, 16.0, 17.0, 16.0, 17.0, 7.0, 10.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11295676231384277, -0.10939712077379227, -0.10583748668432236, -0.10227784514427185, -0.09871821105480194, -0.09515856951475143, -0.09159892797470093, -0.08803929388523102, -0.08447965234518051, -0.08092001080513, -0.0773603767156601, -0.07380073517560959, -0.07024109363555908, -0.06668145954608917, -0.06312181800603867, -0.05956218019127846, -0.05600254237651825, -0.05244290456175804, -0.04888326674699783, -0.04532362520694733, -0.04176398739218712, -0.03820434957742691, -0.034644708037376404, -0.031085070222616196, -0.027525432407855988, -0.02396579459309578, -0.020406154915690422, -0.016846515238285065, -0.013286877423524857, -0.009727239608764648, -0.006167599931359291, -0.0026079602539539337, 0.0009516775608062744, 0.004511316306889057, 0.00807095505297184, 0.011630593799054623, 0.015190232545137405, 0.018749870359897614, 0.02230951003730297, 0.025869149714708328, 0.029428787529468536, 0.032988425344228745, 0.03654806315898895, 0.04010770469903946, 0.04366734251379967, 0.047226980328559875, 0.05078662186861038, 0.05434625968337059, 0.0579058974981308, 0.061465535312891006, 0.06502517312765121, 0.06858481466770172, 0.07214444875717163, 0.07570409029722214, 0.07926373183727264, 0.08282336592674255, 0.08638300746679306, 0.08994264900684357, 0.09350228309631348, 0.09706192463636398, 0.10062156617641449, 0.1041812002658844, 0.1077408418059349, 0.11130048334598541, 0.11486011743545532]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 12.0, 9.0, 17.0, 33.0, 32.0, 55.0, 102.0, 127.0, 176.0, 316.0, 531.0, 1289.0, 4942.0, 36577.0, 429914.0, 518924.0, 46547.0, 5989.0, 1470.0, 581.0, 287.0, 199.0, 139.0, 84.0, 59.0, 41.0, 25.0, 17.0, 9.0, 12.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15074539184570312, -0.14572906494140625, -0.14071273803710938, -0.1356964111328125, -0.13068008422851562, -0.12566375732421875, -0.12064743041992188, -0.115631103515625, -0.11061477661132812, -0.10559844970703125, -0.10058212280273438, -0.0955657958984375, -0.09054946899414062, -0.08553314208984375, -0.08051681518554688, -0.07550048828125, -0.07048416137695312, -0.06546783447265625, -0.060451507568359375, -0.0554351806640625, -0.050418853759765625, -0.04540252685546875, -0.040386199951171875, -0.035369873046875, -0.030353546142578125, -0.02533721923828125, -0.020320892333984375, -0.0153045654296875, -0.010288238525390625, -0.00527191162109375, -0.000255584716796875, 0.0047607421875, 0.009777069091796875, 0.01479339599609375, 0.019809722900390625, 0.0248260498046875, 0.029842376708984375, 0.03485870361328125, 0.039875030517578125, 0.044891357421875, 0.049907684326171875, 0.05492401123046875, 0.059940338134765625, 0.0649566650390625, 0.06997299194335938, 0.07498931884765625, 0.08000564575195312, 0.08502197265625, 0.09003829956054688, 0.09505462646484375, 0.10007095336914062, 0.1050872802734375, 0.11010360717773438, 0.11511993408203125, 0.12013626098632812, 0.125152587890625, 0.13016891479492188, 0.13518524169921875, 0.14020156860351562, 0.1452178955078125, 0.15023422241210938, 0.15525054931640625, 0.16026687622070312, 0.165283203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 19.0, 61.0, 121.0, 175.0, 210.0, 177.0, 132.0, 65.0, 26.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06501293182373047, -0.06288719177246094, -0.060761451721191406, -0.058635711669921875, -0.056509971618652344, -0.05438423156738281, -0.05225849151611328, -0.05013275146484375, -0.04800701141357422, -0.04588127136230469, -0.043755531311035156, -0.041629791259765625, -0.039504051208496094, -0.03737831115722656, -0.03525257110595703, -0.0331268310546875, -0.03100109100341797, -0.028875350952148438, -0.026749610900878906, -0.024623870849609375, -0.022498130798339844, -0.020372390747070312, -0.01824665069580078, -0.01612091064453125, -0.013995170593261719, -0.011869430541992188, -0.009743690490722656, -0.007617950439453125, -0.005492210388183594, -0.0033664703369140625, -0.0012407302856445312, 0.000885009765625, 0.0030107498168945312, 0.0051364898681640625, 0.007262229919433594, 0.009387969970703125, 0.011513710021972656, 0.013639450073242188, 0.01576519012451172, 0.01789093017578125, 0.02001667022705078, 0.022142410278320312, 0.024268150329589844, 0.026393890380859375, 0.028519630432128906, 0.030645370483398438, 0.03277111053466797, 0.0348968505859375, 0.03702259063720703, 0.03914833068847656, 0.041274070739746094, 0.043399810791015625, 0.045525550842285156, 0.04765129089355469, 0.04977703094482422, 0.05190277099609375, 0.05402851104736328, 0.05615425109863281, 0.058279991149902344, 0.060405731201171875, 0.0625314712524414, 0.06465721130371094, 0.06678295135498047, 0.06890869140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 25.0, 39.0, 68.0, 92.0, 146.0, 278.0, 448.0, 733.0, 1327.0, 2709.0, 5755.0, 12298.0, 29794.0, 76892.0, 206185.0, 371099.0, 208605.0, 78028.0, 30032.0, 12503.0, 5513.0, 2668.0, 1444.0, 723.0, 460.0, 258.0, 148.0, 96.0, 46.0, 34.0, 29.0, 14.0, 14.0, 6.0, 11.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.055428504943847656, -0.05348396301269531, -0.05153942108154297, -0.049594879150390625, -0.04765033721923828, -0.04570579528808594, -0.043761253356933594, -0.04181671142578125, -0.039872169494628906, -0.03792762756347656, -0.03598308563232422, -0.034038543701171875, -0.03209400177001953, -0.030149459838867188, -0.028204917907714844, -0.0262603759765625, -0.024315834045410156, -0.022371292114257812, -0.02042675018310547, -0.018482208251953125, -0.01653766632080078, -0.014593124389648438, -0.012648582458496094, -0.01070404052734375, -0.008759498596191406, -0.0068149566650390625, -0.004870414733886719, -0.002925872802734375, -0.0009813308715820312, 0.0009632110595703125, 0.0029077529907226562, 0.004852294921875, 0.006796836853027344, 0.008741378784179688, 0.010685920715332031, 0.012630462646484375, 0.014575004577636719, 0.016519546508789062, 0.018464088439941406, 0.02040863037109375, 0.022353172302246094, 0.024297714233398438, 0.02624225616455078, 0.028186798095703125, 0.03013134002685547, 0.03207588195800781, 0.034020423889160156, 0.0359649658203125, 0.037909507751464844, 0.03985404968261719, 0.04179859161376953, 0.043743133544921875, 0.04568767547607422, 0.04763221740722656, 0.049576759338378906, 0.05152130126953125, 0.053465843200683594, 0.05541038513183594, 0.05735492706298828, 0.059299468994140625, 0.06124401092529297, 0.06318855285644531, 0.06513309478759766, 0.06707763671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 7.0, 7.0, 4.0, 9.0, 11.0, 14.0, 16.0, 12.0, 26.0, 29.0, 37.0, 31.0, 44.0, 47.0, 47.0, 56.0, 61.0, 49.0, 61.0, 51.0, 56.0, 51.0, 49.0, 42.0, 41.0, 29.0, 32.0, 24.0, 16.0, 8.0, 5.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07361507415771484, -0.07130241394042969, -0.06898975372314453, -0.06667709350585938, -0.06436443328857422, -0.06205177307128906, -0.059739112854003906, -0.05742645263671875, -0.055113792419433594, -0.05280113220214844, -0.05048847198486328, -0.048175811767578125, -0.04586315155029297, -0.04355049133300781, -0.041237831115722656, -0.0389251708984375, -0.036612510681152344, -0.03429985046386719, -0.03198719024658203, -0.029674530029296875, -0.02736186981201172, -0.025049209594726562, -0.022736549377441406, -0.02042388916015625, -0.018111228942871094, -0.015798568725585938, -0.013485908508300781, -0.011173248291015625, -0.008860588073730469, -0.0065479278564453125, -0.004235267639160156, -0.001922607421875, 0.00039005279541015625, 0.0027027130126953125, 0.005015373229980469, 0.007328033447265625, 0.009640693664550781, 0.011953353881835938, 0.014266014099121094, 0.01657867431640625, 0.018891334533691406, 0.021203994750976562, 0.02351665496826172, 0.025829315185546875, 0.02814197540283203, 0.030454635620117188, 0.032767295837402344, 0.0350799560546875, 0.037392616271972656, 0.03970527648925781, 0.04201793670654297, 0.044330596923828125, 0.04664325714111328, 0.04895591735839844, 0.051268577575683594, 0.05358123779296875, 0.055893898010253906, 0.05820655822753906, 0.06051921844482422, 0.06283187866210938, 0.06514453887939453, 0.06745719909667969, 0.06976985931396484, 0.07208251953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 2.0, 9.0, 7.0, 7.0, 3.0, 6.0, 13.0, 18.0, 29.0, 27.0, 42.0, 72.0, 86.0, 142.0, 187.0, 309.0, 408.0, 538.0, 788.0, 1224.0, 1730.0, 2882.0, 4990.0, 11957.0, 44965.0, 313607.0, 550845.0, 79754.0, 17562.0, 6541.0, 3310.0, 2008.0, 1294.0, 925.0, 659.0, 472.0, 329.0, 240.0, 159.0, 107.0, 89.0, 61.0, 38.0, 33.0, 26.0, 20.0, 13.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.08270263671875, -0.08013153076171875, -0.0775604248046875, -0.07498931884765625, -0.072418212890625, -0.06984710693359375, -0.0672760009765625, -0.06470489501953125, -0.0621337890625, -0.05956268310546875, -0.0569915771484375, -0.05442047119140625, -0.051849365234375, -0.04927825927734375, -0.0467071533203125, -0.04413604736328125, -0.04156494140625, -0.03899383544921875, -0.0364227294921875, -0.03385162353515625, -0.031280517578125, -0.02870941162109375, -0.0261383056640625, -0.02356719970703125, -0.02099609375, -0.01842498779296875, -0.0158538818359375, -0.01328277587890625, -0.010711669921875, -0.00814056396484375, -0.0055694580078125, -0.00299835205078125, -0.00042724609375, 0.00214385986328125, 0.0047149658203125, 0.00728607177734375, 0.009857177734375, 0.01242828369140625, 0.0149993896484375, 0.01757049560546875, 0.0201416015625, 0.02271270751953125, 0.0252838134765625, 0.02785491943359375, 0.030426025390625, 0.03299713134765625, 0.0355682373046875, 0.03813934326171875, 0.04071044921875, 0.04328155517578125, 0.0458526611328125, 0.04842376708984375, 0.050994873046875, 0.05356597900390625, 0.0561370849609375, 0.05870819091796875, 0.061279296875, 0.06385040283203125, 0.0664215087890625, 0.06899261474609375, 0.071563720703125, 0.07413482666015625, 0.0767059326171875, 0.07927703857421875, 0.08184814453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 12.0, 17.0, 19.0, 26.0, 30.0, 44.0, 53.0, 96.0, 120.0, 138.0, 104.0, 88.0, 48.0, 37.0, 40.0, 33.0, 17.0, 12.0, 14.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011986494064331055, -0.00011617504060268402, -0.0001124851405620575, -0.00010879524052143097, -0.00010510534048080444, -0.00010141544044017792, -9.772554039955139e-05, -9.403564035892487e-05, -9.034574031829834e-05, -8.665584027767181e-05, -8.296594023704529e-05, -7.927604019641876e-05, -7.558614015579224e-05, -7.189624011516571e-05, -6.820634007453918e-05, -6.451644003391266e-05, -6.082653999328613e-05, -5.713663995265961e-05, -5.344673991203308e-05, -4.9756839871406555e-05, -4.606693983078003e-05, -4.2377039790153503e-05, -3.868713974952698e-05, -3.499723970890045e-05, -3.1307339668273926e-05, -2.76174396276474e-05, -2.3927539587020874e-05, -2.0237639546394348e-05, -1.6547739505767822e-05, -1.2857839465141296e-05, -9.16793942451477e-06, -5.478039383888245e-06, -1.7881393432617188e-06, 1.9017606973648071e-06, 5.591660737991333e-06, 9.281560778617859e-06, 1.2971460819244385e-05, 1.666136085987091e-05, 2.0351260900497437e-05, 2.4041160941123962e-05, 2.7731060981750488e-05, 3.1420961022377014e-05, 3.511086106300354e-05, 3.8800761103630066e-05, 4.249066114425659e-05, 4.618056118488312e-05, 4.9870461225509644e-05, 5.356036126613617e-05, 5.7250261306762695e-05, 6.094016134738922e-05, 6.463006138801575e-05, 6.831996142864227e-05, 7.20098614692688e-05, 7.569976150989532e-05, 7.938966155052185e-05, 8.307956159114838e-05, 8.67694616317749e-05, 9.045936167240143e-05, 9.414926171302795e-05, 9.783916175365448e-05, 0.000101529061794281, 0.00010521896183490753, 0.00010890886187553406, 0.00011259876191616058, 0.00011628866195678711]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 12.0, 16.0, 33.0, 39.0, 73.0, 93.0, 112.0, 192.0, 257.0, 431.0, 670.0, 1194.0, 1980.0, 4070.0, 10047.0, 37383.0, 262210.0, 606419.0, 92273.0, 18075.0, 6130.0, 2881.0, 1570.0, 889.0, 524.0, 327.0, 202.0, 133.0, 95.0, 61.0, 37.0, 32.0, 16.0, 16.0, 17.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08015632629394531, -0.07767105102539062, -0.07518577575683594, -0.07270050048828125, -0.07021522521972656, -0.06772994995117188, -0.06524467468261719, -0.0627593994140625, -0.06027412414550781, -0.057788848876953125, -0.05530357360839844, -0.05281829833984375, -0.05033302307128906, -0.047847747802734375, -0.04536247253417969, -0.042877197265625, -0.04039192199707031, -0.037906646728515625, -0.03542137145996094, -0.03293609619140625, -0.030450820922851562, -0.027965545654296875, -0.025480270385742188, -0.0229949951171875, -0.020509719848632812, -0.018024444580078125, -0.015539169311523438, -0.01305389404296875, -0.010568618774414062, -0.008083343505859375, -0.0055980682373046875, -0.00311279296875, -0.0006275177001953125, 0.001857757568359375, 0.0043430328369140625, 0.00682830810546875, 0.009313583374023438, 0.011798858642578125, 0.014284133911132812, 0.0167694091796875, 0.019254684448242188, 0.021739959716796875, 0.024225234985351562, 0.02671051025390625, 0.029195785522460938, 0.031681060791015625, 0.03416633605957031, 0.036651611328125, 0.03913688659667969, 0.041622161865234375, 0.04410743713378906, 0.04659271240234375, 0.04907798767089844, 0.051563262939453125, 0.05404853820800781, 0.0565338134765625, 0.05901908874511719, 0.061504364013671875, 0.06398963928222656, 0.06647491455078125, 0.06896018981933594, 0.07144546508789062, 0.07393074035644531, 0.076416015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 11.0, 9.0, 11.0, 6.0, 19.0, 25.0, 44.0, 39.0, 73.0, 79.0, 113.0, 102.0, 116.0, 100.0, 65.0, 60.0, 38.0, 23.0, 14.0, 14.0, 11.0, 8.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0596923828125, -0.057801246643066406, -0.05591011047363281, -0.05401897430419922, -0.052127838134765625, -0.05023670196533203, -0.04834556579589844, -0.046454429626464844, -0.04456329345703125, -0.042672157287597656, -0.04078102111816406, -0.03888988494873047, -0.036998748779296875, -0.03510761260986328, -0.03321647644042969, -0.031325340270996094, -0.0294342041015625, -0.027543067932128906, -0.025651931762695312, -0.02376079559326172, -0.021869659423828125, -0.01997852325439453, -0.018087387084960938, -0.016196250915527344, -0.01430511474609375, -0.012413978576660156, -0.010522842407226562, -0.008631706237792969, -0.006740570068359375, -0.004849433898925781, -0.0029582977294921875, -0.0010671615600585938, 0.000823974609375, 0.0027151107788085938, 0.0046062469482421875, 0.006497383117675781, 0.008388519287109375, 0.010279655456542969, 0.012170791625976562, 0.014061927795410156, 0.01595306396484375, 0.017844200134277344, 0.019735336303710938, 0.02162647247314453, 0.023517608642578125, 0.02540874481201172, 0.027299880981445312, 0.029191017150878906, 0.0310821533203125, 0.032973289489746094, 0.03486442565917969, 0.03675556182861328, 0.038646697998046875, 0.04053783416748047, 0.04242897033691406, 0.044320106506347656, 0.04621124267578125, 0.048102378845214844, 0.04999351501464844, 0.05188465118408203, 0.053775787353515625, 0.05566692352294922, 0.05755805969238281, 0.059449195861816406, 0.06134033203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 20.0, 55.0, 119.0, 223.0, 268.0, 161.0, 76.0, 29.0, 14.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.948332667350769, -0.9133965969085693, -0.8784605264663696, -0.8435244560241699, -0.8085883855819702, -0.7736523151397705, -0.7387163043022156, -0.7037802338600159, -0.6688441634178162, -0.6339080929756165, -0.5989720225334167, -0.564035952091217, -0.5290999412536621, -0.49416384100914, -0.4592278003692627, -0.424291729927063, -0.3893556594848633, -0.3544195890426636, -0.31948351860046387, -0.28454747796058655, -0.24961140751838684, -0.21467533707618713, -0.17973928153514862, -0.1448032259941101, -0.1098671555519104, -0.07493109256029129, -0.03999502956867218, -0.00505896657705307, 0.02987709641456604, 0.06481316685676575, 0.09974922239780426, 0.13468527793884277, 0.16962134838104248, 0.2045574188232422, 0.2394934743642807, 0.2744295299053192, 0.3093656003475189, 0.34430167078971863, 0.37923771142959595, 0.41417378187179565, 0.44910985231399536, 0.48404592275619507, 0.5189819931983948, 0.5539180636405945, 0.5888540744781494, 0.6237901449203491, 0.6587262153625488, 0.6936622858047485, 0.7285983562469482, 0.763534426689148, 0.7984704971313477, 0.8334065675735474, 0.8683426380157471, 0.9032787084579468, 0.9382147192955017, 0.9731507897377014, 1.008086919784546, 1.0430229902267456, 1.0779590606689453, 1.112895131111145, 1.1478312015533447, 1.1827672719955444, 1.2177033424377441, 1.2526392936706543, 1.287575364112854]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 3.0, 8.0, 9.0, 10.0, 10.0, 15.0, 15.0, 23.0, 25.0, 37.0, 35.0, 29.0, 44.0, 33.0, 49.0, 39.0, 43.0, 44.0, 34.0, 47.0, 52.0, 53.0, 40.0, 39.0, 35.0, 26.0, 27.0, 28.0, 28.0, 26.0, 16.0, 22.0, 8.0, 12.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0], "bins": [-0.287497341632843, -0.28001266717910767, -0.2725279927253723, -0.26504331827163696, -0.2575586438179016, -0.25007396936416626, -0.2425892949104309, -0.23510462045669556, -0.2276199460029602, -0.22013527154922485, -0.2126505970954895, -0.20516592264175415, -0.1976812481880188, -0.19019657373428345, -0.1827118992805481, -0.17522722482681274, -0.1677425503730774, -0.16025787591934204, -0.1527732014656067, -0.14528852701187134, -0.137803852558136, -0.13031917810440063, -0.12283450365066528, -0.11534982919692993, -0.10786515474319458, -0.10038048028945923, -0.09289580583572388, -0.08541113138198853, -0.07792645692825317, -0.07044178247451782, -0.06295710802078247, -0.05547243356704712, -0.04798775911331177, -0.040503084659576416, -0.033018410205841064, -0.025533735752105713, -0.01804906129837036, -0.01056438684463501, -0.003079712390899658, 0.004404962062835693, 0.011889636516571045, 0.019374310970306396, 0.026858985424041748, 0.0343436598777771, 0.04182833433151245, 0.0493130087852478, 0.056797683238983154, 0.0642823576927185, 0.07176703214645386, 0.07925170660018921, 0.08673638105392456, 0.09422105550765991, 0.10170572996139526, 0.10919040441513062, 0.11667507886886597, 0.12415975332260132, 0.13164442777633667, 0.13912910223007202, 0.14661377668380737, 0.15409845113754272, 0.16158312559127808, 0.16906780004501343, 0.17655247449874878, 0.18403714895248413, 0.19152182340621948]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 17.0, 44.0, 161.0, 1124.0, 19784.0, 3951692.0, 216467.0, 4419.0, 413.0, 93.0, 37.0, 11.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.22522544860839844, -0.21790695190429688, -0.2105884552001953, -0.20326995849609375, -0.1959514617919922, -0.18863296508789062, -0.18131446838378906, -0.1739959716796875, -0.16667747497558594, -0.15935897827148438, -0.1520404815673828, -0.14472198486328125, -0.1374034881591797, -0.13008499145507812, -0.12276649475097656, -0.115447998046875, -0.10812950134277344, -0.10081100463867188, -0.09349250793457031, -0.08617401123046875, -0.07885551452636719, -0.07153701782226562, -0.06421852111816406, -0.0569000244140625, -0.04958152770996094, -0.042263031005859375, -0.03494453430175781, -0.02762603759765625, -0.020307540893554688, -0.012989044189453125, -0.0056705474853515625, 0.00164794921875, 0.008966445922851562, 0.016284942626953125, 0.023603439331054688, 0.03092193603515625, 0.03824043273925781, 0.045558929443359375, 0.05287742614746094, 0.0601959228515625, 0.06751441955566406, 0.07483291625976562, 0.08215141296386719, 0.08946990966796875, 0.09678840637207031, 0.10410690307617188, 0.11142539978027344, 0.118743896484375, 0.12606239318847656, 0.13338088989257812, 0.1406993865966797, 0.14801788330078125, 0.1553363800048828, 0.16265487670898438, 0.16997337341308594, 0.1772918701171875, 0.18461036682128906, 0.19192886352539062, 0.1992473602294922, 0.20656585693359375, 0.2138843536376953, 0.22120285034179688, 0.22852134704589844, 0.23583984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 18.0, 28.0, 59.0, 113.0, 134.0, 155.0, 165.0, 132.0, 89.0, 70.0, 22.0, 12.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.06089496612548828, -0.05886268615722656, -0.056830406188964844, -0.054798126220703125, -0.052765846252441406, -0.05073356628417969, -0.04870128631591797, -0.04666900634765625, -0.04463672637939453, -0.04260444641113281, -0.040572166442871094, -0.038539886474609375, -0.036507606506347656, -0.03447532653808594, -0.03244304656982422, -0.0304107666015625, -0.02837848663330078, -0.026346206665039062, -0.024313926696777344, -0.022281646728515625, -0.020249366760253906, -0.018217086791992188, -0.01618480682373047, -0.01415252685546875, -0.012120246887207031, -0.010087966918945312, -0.008055686950683594, -0.006023406982421875, -0.003991127014160156, -0.0019588470458984375, 7.343292236328125e-05, 0.002105712890625, 0.004137992858886719, 0.0061702728271484375, 0.008202552795410156, 0.010234832763671875, 0.012267112731933594, 0.014299392700195312, 0.01633167266845703, 0.01836395263671875, 0.02039623260498047, 0.022428512573242188, 0.024460792541503906, 0.026493072509765625, 0.028525352478027344, 0.030557632446289062, 0.03258991241455078, 0.0346221923828125, 0.03665447235107422, 0.03868675231933594, 0.040719032287597656, 0.042751312255859375, 0.044783592224121094, 0.04681587219238281, 0.04884815216064453, 0.05088043212890625, 0.05291271209716797, 0.05494499206542969, 0.056977272033691406, 0.059009552001953125, 0.061041831970214844, 0.06307411193847656, 0.06510639190673828, 0.067138671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 10.0, 25.0, 27.0, 49.0, 61.0, 103.0, 158.0, 217.0, 379.0, 670.0, 1064.0, 1917.0, 3576.0, 7529.0, 17953.0, 53296.0, 230219.0, 2826805.0, 878900.0, 115007.0, 32363.0, 12153.0, 5396.0, 2701.0, 1434.0, 907.0, 477.0, 337.0, 210.0, 101.0, 85.0, 54.0, 39.0, 14.0, 10.0, 10.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.05586385726928711, -0.05398845672607422, -0.05211305618286133, -0.05023765563964844, -0.04836225509643555, -0.046486854553222656, -0.044611454010009766, -0.042736053466796875, -0.040860652923583984, -0.038985252380371094, -0.0371098518371582, -0.03523445129394531, -0.03335905075073242, -0.03148365020751953, -0.02960824966430664, -0.02773284912109375, -0.02585744857788086, -0.02398204803466797, -0.022106647491455078, -0.020231246948242188, -0.018355846405029297, -0.016480445861816406, -0.014605045318603516, -0.012729644775390625, -0.010854244232177734, -0.008978843688964844, -0.007103443145751953, -0.0052280426025390625, -0.003352642059326172, -0.0014772415161132812, 0.0003981590270996094, 0.0022735595703125, 0.004148960113525391, 0.006024360656738281, 0.007899761199951172, 0.009775161743164062, 0.011650562286376953, 0.013525962829589844, 0.015401363372802734, 0.017276763916015625, 0.019152164459228516, 0.021027565002441406, 0.022902965545654297, 0.024778366088867188, 0.026653766632080078, 0.02852916717529297, 0.03040456771850586, 0.03227996826171875, 0.03415536880493164, 0.03603076934814453, 0.03790616989135742, 0.03978157043457031, 0.0416569709777832, 0.043532371520996094, 0.045407772064208984, 0.047283172607421875, 0.049158573150634766, 0.051033973693847656, 0.05290937423706055, 0.05478477478027344, 0.05666017532348633, 0.05853557586669922, 0.06041097640991211, 0.062286376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 12.0, 14.0, 13.0, 28.0, 33.0, 54.0, 55.0, 107.0, 137.0, 191.0, 352.0, 710.0, 1037.0, 532.0, 266.0, 170.0, 89.0, 67.0, 52.0, 35.0, 27.0, 19.0, 14.0, 9.0, 7.0, 5.0, 6.0, 9.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.05963134765625, -0.05798530578613281, -0.056339263916015625, -0.05469322204589844, -0.05304718017578125, -0.05140113830566406, -0.049755096435546875, -0.04810905456542969, -0.0464630126953125, -0.04481697082519531, -0.043170928955078125, -0.04152488708496094, -0.03987884521484375, -0.03823280334472656, -0.036586761474609375, -0.03494071960449219, -0.033294677734375, -0.03164863586425781, -0.030002593994140625, -0.028356552124023438, -0.02671051025390625, -0.025064468383789062, -0.023418426513671875, -0.021772384643554688, -0.0201263427734375, -0.018480300903320312, -0.016834259033203125, -0.015188217163085938, -0.01354217529296875, -0.011896133422851562, -0.010250091552734375, -0.008604049682617188, -0.0069580078125, -0.0053119659423828125, -0.003665924072265625, -0.0020198822021484375, -0.00037384033203125, 0.0012722015380859375, 0.002918243408203125, 0.0045642852783203125, 0.0062103271484375, 0.007856369018554688, 0.009502410888671875, 0.011148452758789062, 0.01279449462890625, 0.014440536499023438, 0.016086578369140625, 0.017732620239257812, 0.019378662109375, 0.021024703979492188, 0.022670745849609375, 0.024316787719726562, 0.02596282958984375, 0.027608871459960938, 0.029254913330078125, 0.030900955200195312, 0.0325469970703125, 0.03419303894042969, 0.035839080810546875, 0.03748512268066406, 0.03913116455078125, 0.04077720642089844, 0.042423248291015625, 0.04406929016113281, 0.04571533203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 20.0, 22.0, 40.0, 54.0, 112.0, 154.0, 179.0, 167.0, 100.0, 54.0, 41.0, 26.0, 13.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2858421802520752, -0.27044135332107544, -0.25504055619239807, -0.23963972926139832, -0.22423893213272095, -0.2088381052017212, -0.19343729317188263, -0.17803648114204407, -0.1626356691122055, -0.14723485708236694, -0.13183404505252838, -0.11643322557210922, -0.10103241354227066, -0.0856316015124321, -0.07023078203201294, -0.05482997000217438, -0.039429157972335815, -0.024028344079852104, -0.008627530187368393, 0.0067732855677604675, 0.02217409759759903, 0.03757490962743759, 0.05297572910785675, 0.06837654113769531, 0.08377735316753387, 0.09917816519737244, 0.114578977227211, 0.12997978925704956, 0.14538061618804932, 0.16078141331672668, 0.17618224024772644, 0.191583052277565, 0.20698386430740356, 0.22238467633724213, 0.2377854883670807, 0.25318631529808044, 0.2685871124267578, 0.28398793935775757, 0.2993887662887573, 0.3147895634174347, 0.33019036054611206, 0.3455911874771118, 0.3609919846057892, 0.37639281153678894, 0.3917936086654663, 0.40719443559646606, 0.4225952625274658, 0.4379960596561432, 0.45339688658714294, 0.4687977135181427, 0.48419851064682007, 0.4995993375778198, 0.5150001645088196, 0.5304009318351746, 0.5458017587661743, 0.5612025856971741, 0.5766034126281738, 0.5920042395591736, 0.6074050664901733, 0.6228058338165283, 0.6382066607475281, 0.6536074876785278, 0.6690083146095276, 0.6844091415405273, 0.6998099088668823]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 13.0, 7.0, 4.0, 12.0, 9.0, 8.0, 14.0, 13.0, 22.0, 23.0, 20.0, 30.0, 38.0, 37.0, 31.0, 24.0, 33.0, 43.0, 42.0, 52.0, 40.0, 42.0, 40.0, 44.0, 41.0, 44.0, 39.0, 29.0, 29.0, 29.0, 23.0, 27.0, 16.0, 17.0, 14.0, 8.0, 5.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.14816880226135254, -0.143440380692482, -0.13871195912361145, -0.1339835524559021, -0.12925513088703156, -0.12452670931816101, -0.11979828774929047, -0.11506986618041992, -0.11034145206212997, -0.10561303049325943, -0.10088461637496948, -0.09615619480609894, -0.0914277732372284, -0.08669935911893845, -0.0819709375500679, -0.07724252343177795, -0.07251410186290741, -0.06778568029403687, -0.06305726617574692, -0.05832884460687637, -0.05360042676329613, -0.04887200891971588, -0.04414358735084534, -0.03941516950726509, -0.034686751663684845, -0.0299583338201046, -0.025229914113879204, -0.02050149440765381, -0.015773076564073563, -0.011044658720493317, -0.0063162390142679214, -0.0015878193080425262, 0.0031405985355377197, 0.00786901731044054, 0.012597436085343361, 0.017325855791568756, 0.022054273635149002, 0.026782691478729248, 0.03151111304759979, 0.03623953089118004, 0.040967948734760284, 0.04569636657834053, 0.050424784421920776, 0.05515320599079132, 0.05988162383437157, 0.06461004167795181, 0.06933846324682236, 0.0740668773651123, 0.07879529893398285, 0.0835237205028534, 0.08825213462114334, 0.09298055619001389, 0.09770897030830383, 0.10243739187717438, 0.10716581344604492, 0.11189423501491547, 0.11662264913320541, 0.12135107070207596, 0.1260794848203659, 0.13080790638923645, 0.135536327958107, 0.14026474952697754, 0.1449931561946869, 0.14972157776355743, 0.15444999933242798]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 11.0, 15.0, 14.0, 24.0, 40.0, 53.0, 89.0, 120.0, 212.0, 347.0, 787.0, 1967.0, 7122.0, 33543.0, 178853.0, 545100.0, 225151.0, 42159.0, 8865.0, 2259.0, 797.0, 390.0, 214.0, 119.0, 92.0, 57.0, 52.0, 27.0, 23.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14381790161132812, -0.13895416259765625, -0.13409042358398438, -0.1292266845703125, -0.12436294555664062, -0.11949920654296875, -0.11463546752929688, -0.109771728515625, -0.10490798950195312, -0.10004425048828125, -0.09518051147460938, -0.0903167724609375, -0.08545303344726562, -0.08058929443359375, -0.07572555541992188, -0.07086181640625, -0.06599807739257812, -0.06113433837890625, -0.056270599365234375, -0.0514068603515625, -0.046543121337890625, -0.04167938232421875, -0.036815643310546875, -0.031951904296875, -0.027088165283203125, -0.02222442626953125, -0.017360687255859375, -0.0124969482421875, -0.007633209228515625, -0.00276947021484375, 0.002094268798828125, 0.0069580078125, 0.011821746826171875, 0.01668548583984375, 0.021549224853515625, 0.0264129638671875, 0.031276702880859375, 0.03614044189453125, 0.041004180908203125, 0.045867919921875, 0.050731658935546875, 0.05559539794921875, 0.060459136962890625, 0.0653228759765625, 0.07018661499023438, 0.07505035400390625, 0.07991409301757812, 0.08477783203125, 0.08964157104492188, 0.09450531005859375, 0.09936904907226562, 0.1042327880859375, 0.10909652709960938, 0.11396026611328125, 0.11882400512695312, 0.123687744140625, 0.12855148315429688, 0.13341522216796875, 0.13827896118164062, 0.1431427001953125, 0.14800643920898438, 0.15287017822265625, 0.15773391723632812, 0.16259765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 12.0, 24.0, 54.0, 72.0, 101.0, 164.0, 147.0, 150.0, 122.0, 70.0, 49.0, 21.0, 9.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06494808197021484, -0.06281852722167969, -0.06068897247314453, -0.058559417724609375, -0.05642986297607422, -0.05430030822753906, -0.052170753479003906, -0.05004119873046875, -0.047911643981933594, -0.04578208923339844, -0.04365253448486328, -0.041522979736328125, -0.03939342498779297, -0.03726387023925781, -0.035134315490722656, -0.0330047607421875, -0.030875205993652344, -0.028745651245117188, -0.02661609649658203, -0.024486541748046875, -0.02235698699951172, -0.020227432250976562, -0.018097877502441406, -0.01596832275390625, -0.013838768005371094, -0.011709213256835938, -0.009579658508300781, -0.007450103759765625, -0.005320549011230469, -0.0031909942626953125, -0.0010614395141601562, 0.001068115234375, 0.0031976699829101562, 0.0053272247314453125, 0.007456779479980469, 0.009586334228515625, 0.011715888977050781, 0.013845443725585938, 0.015974998474121094, 0.01810455322265625, 0.020234107971191406, 0.022363662719726562, 0.02449321746826172, 0.026622772216796875, 0.02875232696533203, 0.030881881713867188, 0.033011436462402344, 0.0351409912109375, 0.037270545959472656, 0.03940010070800781, 0.04152965545654297, 0.043659210205078125, 0.04578876495361328, 0.04791831970214844, 0.050047874450683594, 0.05217742919921875, 0.054306983947753906, 0.05643653869628906, 0.05856609344482422, 0.060695648193359375, 0.06282520294189453, 0.06495475769042969, 0.06708431243896484, 0.0692138671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 7.0, 11.0, 11.0, 22.0, 18.0, 26.0, 44.0, 80.0, 117.0, 192.0, 306.0, 572.0, 1165.0, 2445.0, 5255.0, 12223.0, 31256.0, 82182.0, 217071.0, 361491.0, 205557.0, 76972.0, 29877.0, 11834.0, 5066.0, 2228.0, 1120.0, 570.0, 326.0, 188.0, 100.0, 63.0, 30.0, 44.0, 26.0, 16.0, 8.0, 6.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07563400268554688, -0.07277679443359375, -0.06991958618164062, -0.0670623779296875, -0.06420516967773438, -0.06134796142578125, -0.058490753173828125, -0.055633544921875, -0.052776336669921875, -0.04991912841796875, -0.047061920166015625, -0.0442047119140625, -0.041347503662109375, -0.03849029541015625, -0.035633087158203125, -0.03277587890625, -0.029918670654296875, -0.02706146240234375, -0.024204254150390625, -0.0213470458984375, -0.018489837646484375, -0.01563262939453125, -0.012775421142578125, -0.009918212890625, -0.007061004638671875, -0.00420379638671875, -0.001346588134765625, 0.0015106201171875, 0.004367828369140625, 0.00722503662109375, 0.010082244873046875, 0.012939453125, 0.015796661376953125, 0.01865386962890625, 0.021511077880859375, 0.0243682861328125, 0.027225494384765625, 0.03008270263671875, 0.032939910888671875, 0.035797119140625, 0.038654327392578125, 0.04151153564453125, 0.044368743896484375, 0.0472259521484375, 0.050083160400390625, 0.05294036865234375, 0.055797576904296875, 0.05865478515625, 0.061511993408203125, 0.06436920166015625, 0.06722640991210938, 0.0700836181640625, 0.07294082641601562, 0.07579803466796875, 0.07865524291992188, 0.081512451171875, 0.08436965942382812, 0.08722686767578125, 0.09008407592773438, 0.0929412841796875, 0.09579849243164062, 0.09865570068359375, 0.10151290893554688, 0.1043701171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 6.0, 5.0, 9.0, 8.0, 12.0, 10.0, 16.0, 16.0, 30.0, 25.0, 26.0, 27.0, 41.0, 32.0, 46.0, 28.0, 36.0, 33.0, 42.0, 51.0, 46.0, 42.0, 40.0, 30.0, 36.0, 31.0, 36.0, 28.0, 24.0, 24.0, 24.0, 16.0, 15.0, 14.0, 15.0, 12.0, 11.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.08294677734375, -0.08051300048828125, -0.0780792236328125, -0.07564544677734375, -0.073211669921875, -0.07077789306640625, -0.0683441162109375, -0.06591033935546875, -0.0634765625, -0.06104278564453125, -0.0586090087890625, -0.05617523193359375, -0.053741455078125, -0.05130767822265625, -0.0488739013671875, -0.04644012451171875, -0.04400634765625, -0.04157257080078125, -0.0391387939453125, -0.03670501708984375, -0.034271240234375, -0.03183746337890625, -0.0294036865234375, -0.02696990966796875, -0.0245361328125, -0.02210235595703125, -0.0196685791015625, -0.01723480224609375, -0.014801025390625, -0.01236724853515625, -0.0099334716796875, -0.00749969482421875, -0.00506591796875, -0.00263214111328125, -0.0001983642578125, 0.00223541259765625, 0.004669189453125, 0.00710296630859375, 0.0095367431640625, 0.01197052001953125, 0.014404296875, 0.01683807373046875, 0.0192718505859375, 0.02170562744140625, 0.024139404296875, 0.02657318115234375, 0.0290069580078125, 0.03144073486328125, 0.03387451171875, 0.03630828857421875, 0.0387420654296875, 0.04117584228515625, 0.043609619140625, 0.04604339599609375, 0.0484771728515625, 0.05091094970703125, 0.0533447265625, 0.05577850341796875, 0.0582122802734375, 0.06064605712890625, 0.063079833984375, 0.06551361083984375, 0.0679473876953125, 0.07038116455078125, 0.07281494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 7.0, 8.0, 18.0, 21.0, 30.0, 41.0, 48.0, 84.0, 99.0, 150.0, 219.0, 320.0, 482.0, 740.0, 1316.0, 2404.0, 5063.0, 13187.0, 59825.0, 734139.0, 190998.0, 23908.0, 7589.0, 3276.0, 1717.0, 971.0, 630.0, 376.0, 259.0, 174.0, 121.0, 93.0, 81.0, 44.0, 33.0, 23.0, 19.0, 9.0, 4.0, 11.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.15937042236328125, -0.1538238525390625, -0.14827728271484375, -0.142730712890625, -0.13718414306640625, -0.1316375732421875, -0.12609100341796875, -0.12054443359375, -0.11499786376953125, -0.1094512939453125, -0.10390472412109375, -0.098358154296875, -0.09281158447265625, -0.0872650146484375, -0.08171844482421875, -0.076171875, -0.07062530517578125, -0.0650787353515625, -0.05953216552734375, -0.053985595703125, -0.04843902587890625, -0.0428924560546875, -0.03734588623046875, -0.03179931640625, -0.02625274658203125, -0.0207061767578125, -0.01515960693359375, -0.009613037109375, -0.00406646728515625, 0.0014801025390625, 0.00702667236328125, 0.0125732421875, 0.01811981201171875, 0.0236663818359375, 0.02921295166015625, 0.034759521484375, 0.04030609130859375, 0.0458526611328125, 0.05139923095703125, 0.05694580078125, 0.06249237060546875, 0.0680389404296875, 0.07358551025390625, 0.079132080078125, 0.08467864990234375, 0.0902252197265625, 0.09577178955078125, 0.101318359375, 0.10686492919921875, 0.1124114990234375, 0.11795806884765625, 0.123504638671875, 0.12905120849609375, 0.1345977783203125, 0.14014434814453125, 0.14569091796875, 0.15123748779296875, 0.1567840576171875, 0.16233062744140625, 0.167877197265625, 0.17342376708984375, 0.1789703369140625, 0.18451690673828125, 0.1900634765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 10.0, 8.0, 15.0, 13.0, 20.0, 21.0, 44.0, 51.0, 75.0, 101.0, 115.0, 112.0, 103.0, 86.0, 50.0, 57.0, 28.0, 21.0, 16.0, 17.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.790327072143555e-05, -7.561221718788147e-05, -7.332116365432739e-05, -7.103011012077332e-05, -6.873905658721924e-05, -6.644800305366516e-05, -6.415694952011108e-05, -6.186589598655701e-05, -5.957484245300293e-05, -5.728378891944885e-05, -5.4992735385894775e-05, -5.27016818523407e-05, -5.041062831878662e-05, -4.8119574785232544e-05, -4.582852125167847e-05, -4.353746771812439e-05, -4.124641418457031e-05, -3.8955360651016235e-05, -3.666430711746216e-05, -3.437325358390808e-05, -3.2082200050354004e-05, -2.9791146516799927e-05, -2.750009298324585e-05, -2.5209039449691772e-05, -2.2917985916137695e-05, -2.0626932382583618e-05, -1.833587884902954e-05, -1.6044825315475464e-05, -1.3753771781921387e-05, -1.146271824836731e-05, -9.171664714813232e-06, -6.880611181259155e-06, -4.589557647705078e-06, -2.298504114151001e-06, -7.450580596923828e-09, 2.2836029529571533e-06, 4.5746564865112305e-06, 6.865710020065308e-06, 9.156763553619385e-06, 1.1447817087173462e-05, 1.3738870620727539e-05, 1.6029924154281616e-05, 1.8320977687835693e-05, 2.061203122138977e-05, 2.2903084754943848e-05, 2.5194138288497925e-05, 2.7485191822052002e-05, 2.977624535560608e-05, 3.2067298889160156e-05, 3.4358352422714233e-05, 3.664940595626831e-05, 3.894045948982239e-05, 4.1231513023376465e-05, 4.352256655693054e-05, 4.581362009048462e-05, 4.8104673624038696e-05, 5.0395727157592773e-05, 5.268678069114685e-05, 5.497783422470093e-05, 5.7268887758255005e-05, 5.955994129180908e-05, 6.185099482536316e-05, 6.414204835891724e-05, 6.643310189247131e-05, 6.872415542602539e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 13.0, 13.0, 19.0, 31.0, 42.0, 59.0, 118.0, 156.0, 255.0, 451.0, 702.0, 1185.0, 2169.0, 3966.0, 8623.0, 34676.0, 698073.0, 262989.0, 20540.0, 6647.0, 3289.0, 1789.0, 1098.0, 628.0, 383.0, 230.0, 133.0, 107.0, 43.0, 36.0, 18.0, 16.0, 8.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.22036170959472656, -0.21403884887695312, -0.2077159881591797, -0.20139312744140625, -0.1950702667236328, -0.18874740600585938, -0.18242454528808594, -0.1761016845703125, -0.16977882385253906, -0.16345596313476562, -0.1571331024169922, -0.15081024169921875, -0.1444873809814453, -0.13816452026367188, -0.13184165954589844, -0.125518798828125, -0.11919593811035156, -0.11287307739257812, -0.10655021667480469, -0.10022735595703125, -0.09390449523925781, -0.08758163452148438, -0.08125877380371094, -0.0749359130859375, -0.06861305236816406, -0.062290191650390625, -0.05596733093261719, -0.04964447021484375, -0.04332160949707031, -0.036998748779296875, -0.030675888061523438, -0.02435302734375, -0.018030166625976562, -0.011707305908203125, -0.0053844451904296875, 0.00093841552734375, 0.0072612762451171875, 0.013584136962890625, 0.019906997680664062, 0.0262298583984375, 0.03255271911621094, 0.038875579833984375, 0.04519844055175781, 0.05152130126953125, 0.05784416198730469, 0.06416702270507812, 0.07048988342285156, 0.076812744140625, 0.08313560485839844, 0.08945846557617188, 0.09578132629394531, 0.10210418701171875, 0.10842704772949219, 0.11474990844726562, 0.12107276916503906, 0.1273956298828125, 0.13371849060058594, 0.14004135131835938, 0.1463642120361328, 0.15268707275390625, 0.1590099334716797, 0.16533279418945312, 0.17165565490722656, 0.177978515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 12.0, 17.0, 23.0, 29.0, 70.0, 113.0, 228.0, 200.0, 123.0, 61.0, 32.0, 17.0, 11.0, 11.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1905517578125, -0.18566226959228516, -0.1807727813720703, -0.17588329315185547, -0.17099380493164062, -0.16610431671142578, -0.16121482849121094, -0.1563253402709961, -0.15143585205078125, -0.1465463638305664, -0.14165687561035156, -0.13676738739013672, -0.13187789916992188, -0.12698841094970703, -0.12209892272949219, -0.11720943450927734, -0.1123199462890625, -0.10743045806884766, -0.10254096984863281, -0.09765148162841797, -0.09276199340820312, -0.08787250518798828, -0.08298301696777344, -0.0780935287475586, -0.07320404052734375, -0.0683145523071289, -0.06342506408691406, -0.05853557586669922, -0.053646087646484375, -0.04875659942626953, -0.04386711120605469, -0.038977622985839844, -0.034088134765625, -0.029198646545410156, -0.024309158325195312, -0.01941967010498047, -0.014530181884765625, -0.009640693664550781, -0.0047512054443359375, 0.00013828277587890625, 0.00502777099609375, 0.009917259216308594, 0.014806747436523438, 0.01969623565673828, 0.024585723876953125, 0.02947521209716797, 0.03436470031738281, 0.039254188537597656, 0.0441436767578125, 0.049033164978027344, 0.05392265319824219, 0.05881214141845703, 0.06370162963867188, 0.06859111785888672, 0.07348060607910156, 0.0783700942993164, 0.08325958251953125, 0.0881490707397461, 0.09303855895996094, 0.09792804718017578, 0.10281753540039062, 0.10770702362060547, 0.11259651184082031, 0.11748600006103516, 0.12237548828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 11.0, 17.0, 25.0, 29.0, 74.0, 134.0, 167.0, 168.0, 128.0, 86.0, 49.0, 26.0, 26.0, 18.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2190868854522705, -1.1799559593200684, -1.1408249139785767, -1.1016939878463745, -1.0625630617141724, -1.0234320163726807, -0.9843010902404785, -0.9451701045036316, -0.9060391187667847, -0.8669081330299377, -0.8277772068977356, -0.7886462211608887, -0.7495152354240417, -0.7103842496871948, -0.6712533235549927, -0.6321223378181458, -0.5929914116859436, -0.5538604259490967, -0.5147294998168945, -0.4755985140800476, -0.4364675283432007, -0.39733657240867615, -0.3582056164741516, -0.3190746307373047, -0.27994367480278015, -0.24081270396709442, -0.2016817331314087, -0.16255077719688416, -0.12341980636119843, -0.0842888355255127, -0.04515787959098816, -0.006026893854141235, 0.0331040620803833, 0.07223503291606903, 0.11136599630117416, 0.1504969596862793, 0.18962793052196503, 0.22875890135765076, 0.2678898572921753, 0.3070208430290222, 0.34615179896354675, 0.3852827548980713, 0.4244137406349182, 0.46354469656944275, 0.5026756525039673, 0.5418066382408142, 0.5809376239776611, 0.6200685501098633, 0.6591995358467102, 0.6983305215835571, 0.7374614477157593, 0.7765924334526062, 0.8157234191894531, 0.8548543453216553, 0.8939853310585022, 0.9331163167953491, 0.9722472429275513, 1.0113781690597534, 1.0505092144012451, 1.0896401405334473, 1.1287710666656494, 1.1679021120071411, 1.2070330381393433, 1.246164083480835, 1.285295009613037]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 17.0, 10.0, 16.0, 14.0, 29.0, 27.0, 25.0, 37.0, 37.0, 43.0, 38.0, 35.0, 53.0, 32.0, 57.0, 45.0, 53.0, 42.0, 52.0, 38.0, 48.0, 31.0, 44.0, 29.0, 35.0, 18.0, 15.0, 17.0, 9.0, 8.0, 6.0, 8.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4381658434867859, -0.42410337924957275, -0.41004088521003723, -0.3959784209728241, -0.38191595673561096, -0.36785346269607544, -0.3537909984588623, -0.33972853422164917, -0.32566606998443604, -0.3116036057472229, -0.2975411117076874, -0.28347864747047424, -0.2694161832332611, -0.2553536891937256, -0.24129122495651245, -0.22722876071929932, -0.213166281580925, -0.19910380244255066, -0.18504133820533752, -0.1709788590669632, -0.15691639482975006, -0.14285391569137573, -0.1287914514541626, -0.11472897231578827, -0.10066650062799454, -0.0866040289402008, -0.07254155725240707, -0.058479081839323044, -0.04441661015152931, -0.030354134738445282, -0.01629166305065155, -0.0022291913628578186, 0.011833280324935913, 0.025895752012729645, 0.039958223700523376, 0.05402069911360741, 0.06808316707611084, 0.08214564621448517, 0.0962081179022789, 0.11027058959007263, 0.12433306127786636, 0.1383955329656601, 0.15245801210403442, 0.16652047634124756, 0.1805829554796219, 0.19464543461799622, 0.20870789885520935, 0.22277036309242249, 0.23683284223079681, 0.25089532136917114, 0.2649577856063843, 0.2790202498435974, 0.29308274388313293, 0.30714520812034607, 0.3212076723575592, 0.3352701663970947, 0.34933263063430786, 0.363395094871521, 0.3774575889110565, 0.39152005314826965, 0.4055825173854828, 0.4196450114250183, 0.43370747566223145, 0.4477699398994446, 0.4618324041366577]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 10.0, 10.0, 13.0, 28.0, 30.0, 40.0, 78.0, 123.0, 222.0, 417.0, 703.0, 1236.0, 2474.0, 5489.0, 14510.0, 46171.0, 301789.0, 3350145.0, 392775.0, 50868.0, 15512.0, 5937.0, 2629.0, 1352.0, 706.0, 399.0, 223.0, 146.0, 83.0, 50.0, 25.0, 30.0, 15.0, 13.0, 9.0, 11.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12084770202636719, -0.11724472045898438, -0.11364173889160156, -0.11003875732421875, -0.10643577575683594, -0.10283279418945312, -0.09922981262207031, -0.0956268310546875, -0.09202384948730469, -0.08842086791992188, -0.08481788635253906, -0.08121490478515625, -0.07761192321777344, -0.07400894165039062, -0.07040596008300781, -0.066802978515625, -0.06319999694824219, -0.059597015380859375, -0.05599403381347656, -0.05239105224609375, -0.04878807067871094, -0.045185089111328125, -0.04158210754394531, -0.0379791259765625, -0.03437614440917969, -0.030773162841796875, -0.027170181274414062, -0.02356719970703125, -0.019964218139648438, -0.016361236572265625, -0.012758255004882812, -0.0091552734375, -0.0055522918701171875, -0.001949310302734375, 0.0016536712646484375, 0.00525665283203125, 0.008859634399414062, 0.012462615966796875, 0.016065597534179688, 0.0196685791015625, 0.023271560668945312, 0.026874542236328125, 0.030477523803710938, 0.03408050537109375, 0.03768348693847656, 0.041286468505859375, 0.04488945007324219, 0.048492431640625, 0.05209541320800781, 0.055698394775390625, 0.05930137634277344, 0.06290435791015625, 0.06650733947753906, 0.07011032104492188, 0.07371330261230469, 0.0773162841796875, 0.08091926574707031, 0.08452224731445312, 0.08812522888183594, 0.09172821044921875, 0.09533119201660156, 0.09893417358398438, 0.10253715515136719, 0.10614013671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 14.0, 23.0, 35.0, 58.0, 57.0, 100.0, 92.0, 101.0, 117.0, 104.0, 72.0, 92.0, 49.0, 33.0, 20.0, 13.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0626220703125, -0.060461997985839844, -0.05830192565917969, -0.05614185333251953, -0.053981781005859375, -0.05182170867919922, -0.04966163635253906, -0.047501564025878906, -0.04534149169921875, -0.043181419372558594, -0.04102134704589844, -0.03886127471923828, -0.036701202392578125, -0.03454113006591797, -0.03238105773925781, -0.030220985412597656, -0.0280609130859375, -0.025900840759277344, -0.023740768432617188, -0.02158069610595703, -0.019420623779296875, -0.01726055145263672, -0.015100479125976562, -0.012940406799316406, -0.01078033447265625, -0.008620262145996094, -0.0064601898193359375, -0.004300117492675781, -0.002140045166015625, 2.002716064453125e-05, 0.0021800994873046875, 0.004340171813964844, 0.006500244140625, 0.008660316467285156, 0.010820388793945312, 0.012980461120605469, 0.015140533447265625, 0.01730060577392578, 0.019460678100585938, 0.021620750427246094, 0.02378082275390625, 0.025940895080566406, 0.028100967407226562, 0.03026103973388672, 0.032421112060546875, 0.03458118438720703, 0.03674125671386719, 0.038901329040527344, 0.0410614013671875, 0.043221473693847656, 0.04538154602050781, 0.04754161834716797, 0.049701690673828125, 0.05186176300048828, 0.05402183532714844, 0.056181907653808594, 0.05834197998046875, 0.060502052307128906, 0.06266212463378906, 0.06482219696044922, 0.06698226928710938, 0.06914234161376953, 0.07130241394042969, 0.07346248626708984, 0.07562255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 12.0, 9.0, 22.0, 22.0, 39.0, 72.0, 76.0, 114.0, 208.0, 307.0, 531.0, 769.0, 1304.0, 2333.0, 4450.0, 8441.0, 18219.0, 44727.0, 137475.0, 749511.0, 2719995.0, 356378.0, 88681.0, 31928.0, 13739.0, 6590.0, 3472.0, 1905.0, 1090.0, 655.0, 405.0, 282.0, 170.0, 120.0, 70.0, 44.0, 42.0, 25.0, 16.0, 11.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.072998046875, -0.07066726684570312, -0.06833648681640625, -0.06600570678710938, -0.0636749267578125, -0.061344146728515625, -0.05901336669921875, -0.056682586669921875, -0.054351806640625, -0.052021026611328125, -0.04969024658203125, -0.047359466552734375, -0.0450286865234375, -0.042697906494140625, -0.04036712646484375, -0.038036346435546875, -0.03570556640625, -0.033374786376953125, -0.03104400634765625, -0.028713226318359375, -0.0263824462890625, -0.024051666259765625, -0.02172088623046875, -0.019390106201171875, -0.017059326171875, -0.014728546142578125, -0.01239776611328125, -0.010066986083984375, -0.0077362060546875, -0.005405426025390625, -0.00307464599609375, -0.000743865966796875, 0.0015869140625, 0.003917694091796875, 0.00624847412109375, 0.008579254150390625, 0.0109100341796875, 0.013240814208984375, 0.01557159423828125, 0.017902374267578125, 0.020233154296875, 0.022563934326171875, 0.02489471435546875, 0.027225494384765625, 0.0295562744140625, 0.031887054443359375, 0.03421783447265625, 0.036548614501953125, 0.03887939453125, 0.041210174560546875, 0.04354095458984375, 0.045871734619140625, 0.0482025146484375, 0.050533294677734375, 0.05286407470703125, 0.055194854736328125, 0.057525634765625, 0.059856414794921875, 0.06218719482421875, 0.06451797485351562, 0.0668487548828125, 0.06917953491210938, 0.07151031494140625, 0.07384109497070312, 0.076171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 16.0, 11.0, 31.0, 15.0, 28.0, 48.0, 71.0, 127.0, 170.0, 278.0, 500.0, 948.0, 762.0, 361.0, 209.0, 158.0, 85.0, 61.0, 49.0, 35.0, 19.0, 9.0, 16.0, 7.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08953857421875, -0.08687877655029297, -0.08421897888183594, -0.0815591812133789, -0.07889938354492188, -0.07623958587646484, -0.07357978820800781, -0.07091999053955078, -0.06826019287109375, -0.06560039520263672, -0.06294059753417969, -0.060280799865722656, -0.057621002197265625, -0.054961204528808594, -0.05230140686035156, -0.04964160919189453, -0.0469818115234375, -0.04432201385498047, -0.04166221618652344, -0.039002418518066406, -0.036342620849609375, -0.033682823181152344, -0.031023025512695312, -0.02836322784423828, -0.02570343017578125, -0.02304363250732422, -0.020383834838867188, -0.017724037170410156, -0.015064239501953125, -0.012404441833496094, -0.009744644165039062, -0.007084846496582031, -0.004425048828125, -0.0017652511596679688, 0.0008945465087890625, 0.0035543441772460938, 0.006214141845703125, 0.008873939514160156, 0.011533737182617188, 0.014193534851074219, 0.01685333251953125, 0.01951313018798828, 0.022172927856445312, 0.024832725524902344, 0.027492523193359375, 0.030152320861816406, 0.03281211853027344, 0.03547191619873047, 0.0381317138671875, 0.04079151153564453, 0.04345130920410156, 0.046111106872558594, 0.048770904541015625, 0.051430702209472656, 0.05409049987792969, 0.05675029754638672, 0.05941009521484375, 0.06206989288330078, 0.06472969055175781, 0.06738948822021484, 0.07004928588867188, 0.0727090835571289, 0.07536888122558594, 0.07802867889404297, 0.0806884765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 14.0, 16.0, 37.0, 50.0, 101.0, 139.0, 145.0, 141.0, 114.0, 96.0, 54.0, 45.0, 13.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3961721658706665, -0.3748897612094879, -0.3536073565483093, -0.33232492208480835, -0.31104251742362976, -0.28976011276245117, -0.2684776782989502, -0.2471952736377716, -0.22591286897659302, -0.20463046431541443, -0.18334804475307465, -0.16206562519073486, -0.14078322052955627, -0.11950080841779709, -0.0982183963060379, -0.07693597674369812, -0.05565357208251953, -0.034371159970760345, -0.01308874785900116, 0.008193664252758026, 0.029476076364517212, 0.0507584884762764, 0.07204090058803558, 0.09332332015037537, 0.11460572481155396, 0.13588812947273254, 0.15717054903507233, 0.1784529685974121, 0.1997353732585907, 0.2210177779197693, 0.24230019748210907, 0.26358261704444885, 0.28486502170562744, 0.30614742636680603, 0.3274298310279846, 0.3487122654914856, 0.3699946701526642, 0.3912770748138428, 0.41255950927734375, 0.43384191393852234, 0.4551243185997009, 0.4764067232608795, 0.4976891279220581, 0.5189715623855591, 0.5402539968490601, 0.5615363717079163, 0.5828188061714172, 0.6041011810302734, 0.6253836154937744, 0.6466660499572754, 0.6679484248161316, 0.6892308592796326, 0.7105132341384888, 0.7317956686019897, 0.7530781030654907, 0.7743605375289917, 0.7956429123878479, 0.8169253468513489, 0.8382077217102051, 0.859490156173706, 0.880772590637207, 0.9020549654960632, 0.9233373999595642, 0.9446197748184204, 0.9659022092819214]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 7.0, 6.0, 3.0, 9.0, 9.0, 12.0, 19.0, 16.0, 14.0, 19.0, 15.0, 26.0, 18.0, 30.0, 34.0, 32.0, 25.0, 37.0, 52.0, 35.0, 35.0, 35.0, 48.0, 34.0, 39.0, 39.0, 30.0, 30.0, 23.0, 41.0, 31.0, 17.0, 27.0, 23.0, 16.0, 14.0, 17.0, 10.0, 14.0, 15.0, 8.0, 14.0, 8.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2591901421546936, -0.2510605454444885, -0.24293096363544464, -0.23480138182640076, -0.22667178511619568, -0.2185421884059906, -0.21041260659694672, -0.20228302478790283, -0.19415342807769775, -0.18602383136749268, -0.1778942495584488, -0.1697646677494049, -0.16163507103919983, -0.15350547432899475, -0.14537589251995087, -0.13724631071090698, -0.1291167140007019, -0.12098712474107742, -0.11285753548145294, -0.10472794622182846, -0.09659835696220398, -0.0884687677025795, -0.08033917844295502, -0.07220958918333054, -0.06407999992370605, -0.055950410664081573, -0.04782082140445709, -0.03969123214483261, -0.03156164288520813, -0.02343205362558365, -0.015302464365959167, -0.007172875106334686, 0.0009567141532897949, 0.009086303412914276, 0.017215892672538757, 0.02534548193216324, 0.03347507119178772, 0.0416046604514122, 0.04973424971103668, 0.05786383897066116, 0.06599342823028564, 0.07412301748991013, 0.0822526067495346, 0.09038219600915909, 0.09851178526878357, 0.10664137452840805, 0.11477096378803253, 0.12290055304765701, 0.1310301423072815, 0.13915973901748657, 0.14728932082653046, 0.15541890263557434, 0.16354849934577942, 0.1716780960559845, 0.17980767786502838, 0.18793725967407227, 0.19606685638427734, 0.20419645309448242, 0.2123260349035263, 0.2204556167125702, 0.22858521342277527, 0.23671481013298035, 0.24484439194202423, 0.2529739737510681, 0.2611035704612732]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 11.0, 22.0, 24.0, 38.0, 57.0, 89.0, 109.0, 182.0, 296.0, 435.0, 721.0, 1312.0, 2334.0, 4275.0, 8317.0, 17161.0, 38034.0, 90467.0, 214113.0, 323316.0, 196723.0, 82490.0, 34922.0, 16001.0, 7782.0, 3937.0, 2209.0, 1300.0, 630.0, 426.0, 303.0, 165.0, 105.0, 83.0, 45.0, 35.0, 25.0, 18.0, 16.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09210205078125, -0.0891733169555664, -0.08624458312988281, -0.08331584930419922, -0.08038711547851562, -0.07745838165283203, -0.07452964782714844, -0.07160091400146484, -0.06867218017578125, -0.06574344635009766, -0.06281471252441406, -0.05988597869873047, -0.056957244873046875, -0.05402851104736328, -0.05109977722167969, -0.048171043395996094, -0.0452423095703125, -0.042313575744628906, -0.03938484191894531, -0.03645610809326172, -0.033527374267578125, -0.03059864044189453, -0.027669906616210938, -0.024741172790527344, -0.02181243896484375, -0.018883705139160156, -0.015954971313476562, -0.013026237487792969, -0.010097503662109375, -0.007168769836425781, -0.0042400360107421875, -0.0013113021850585938, 0.001617431640625, 0.004546165466308594, 0.0074748992919921875, 0.010403633117675781, 0.013332366943359375, 0.01626110076904297, 0.019189834594726562, 0.022118568420410156, 0.02504730224609375, 0.027976036071777344, 0.030904769897460938, 0.03383350372314453, 0.036762237548828125, 0.03969097137451172, 0.04261970520019531, 0.045548439025878906, 0.0484771728515625, 0.051405906677246094, 0.05433464050292969, 0.05726337432861328, 0.060192108154296875, 0.06312084197998047, 0.06604957580566406, 0.06897830963134766, 0.07190704345703125, 0.07483577728271484, 0.07776451110839844, 0.08069324493408203, 0.08362197875976562, 0.08655071258544922, 0.08947944641113281, 0.0924081802368164, 0.0953369140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 7.0, 14.0, 16.0, 18.0, 27.0, 44.0, 60.0, 62.0, 76.0, 91.0, 78.0, 98.0, 76.0, 82.0, 66.0, 58.0, 47.0, 33.0, 21.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06295585632324219, -0.060848236083984375, -0.05874061584472656, -0.05663299560546875, -0.05452537536621094, -0.052417755126953125, -0.05031013488769531, -0.0482025146484375, -0.04609489440917969, -0.043987274169921875, -0.04187965393066406, -0.03977203369140625, -0.03766441345214844, -0.035556793212890625, -0.03344917297363281, -0.031341552734375, -0.029233932495117188, -0.027126312255859375, -0.025018692016601562, -0.02291107177734375, -0.020803451538085938, -0.018695831298828125, -0.016588211059570312, -0.0144805908203125, -0.012372970581054688, -0.010265350341796875, -0.008157730102539062, -0.00605010986328125, -0.0039424896240234375, -0.001834869384765625, 0.0002727508544921875, 0.00238037109375, 0.0044879913330078125, 0.006595611572265625, 0.008703231811523438, 0.01081085205078125, 0.012918472290039062, 0.015026092529296875, 0.017133712768554688, 0.0192413330078125, 0.021348953247070312, 0.023456573486328125, 0.025564193725585938, 0.02767181396484375, 0.029779434204101562, 0.031887054443359375, 0.03399467468261719, 0.036102294921875, 0.03820991516113281, 0.040317535400390625, 0.04242515563964844, 0.04453277587890625, 0.04664039611816406, 0.048748016357421875, 0.05085563659667969, 0.0529632568359375, 0.05507087707519531, 0.057178497314453125, 0.05928611755371094, 0.06139373779296875, 0.06350135803222656, 0.06560897827148438, 0.06771659851074219, 0.06982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 3.0, 11.0, 16.0, 24.0, 35.0, 53.0, 81.0, 166.0, 278.0, 431.0, 882.0, 1529.0, 3039.0, 6012.0, 13174.0, 31323.0, 85516.0, 266210.0, 396849.0, 153110.0, 51491.0, 20064.0, 8897.0, 4358.0, 2250.0, 1150.0, 609.0, 391.0, 221.0, 130.0, 93.0, 50.0, 32.0, 23.0, 11.0, 8.0, 12.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10385513305664062, -0.10053253173828125, -0.09720993041992188, -0.0938873291015625, -0.09056472778320312, -0.08724212646484375, -0.08391952514648438, -0.080596923828125, -0.07727432250976562, -0.07395172119140625, -0.07062911987304688, -0.0673065185546875, -0.06398391723632812, -0.06066131591796875, -0.057338714599609375, -0.05401611328125, -0.050693511962890625, -0.04737091064453125, -0.044048309326171875, -0.0407257080078125, -0.037403106689453125, -0.03408050537109375, -0.030757904052734375, -0.027435302734375, -0.024112701416015625, -0.02079010009765625, -0.017467498779296875, -0.0141448974609375, -0.010822296142578125, -0.00749969482421875, -0.004177093505859375, -0.0008544921875, 0.002468109130859375, 0.00579071044921875, 0.009113311767578125, 0.0124359130859375, 0.015758514404296875, 0.01908111572265625, 0.022403717041015625, 0.025726318359375, 0.029048919677734375, 0.03237152099609375, 0.035694122314453125, 0.0390167236328125, 0.042339324951171875, 0.04566192626953125, 0.048984527587890625, 0.05230712890625, 0.055629730224609375, 0.05895233154296875, 0.062274932861328125, 0.0655975341796875, 0.06892013549804688, 0.07224273681640625, 0.07556533813476562, 0.078887939453125, 0.08221054077148438, 0.08553314208984375, 0.08885574340820312, 0.0921783447265625, 0.09550094604492188, 0.09882354736328125, 0.10214614868164062, 0.10546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 9.0, 9.0, 8.0, 14.0, 11.0, 18.0, 19.0, 27.0, 40.0, 44.0, 42.0, 58.0, 43.0, 71.0, 56.0, 60.0, 70.0, 52.0, 52.0, 52.0, 47.0, 35.0, 26.0, 16.0, 23.0, 19.0, 15.0, 11.0, 9.0, 9.0, 6.0, 2.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15755748748779297, -0.15312767028808594, -0.1486978530883789, -0.14426803588867188, -0.13983821868896484, -0.1354084014892578, -0.13097858428955078, -0.12654876708984375, -0.12211894989013672, -0.11768913269042969, -0.11325931549072266, -0.10882949829101562, -0.1043996810913086, -0.09996986389160156, -0.09554004669189453, -0.0911102294921875, -0.08668041229248047, -0.08225059509277344, -0.0778207778930664, -0.07339096069335938, -0.06896114349365234, -0.06453132629394531, -0.06010150909423828, -0.05567169189453125, -0.05124187469482422, -0.04681205749511719, -0.042382240295410156, -0.037952423095703125, -0.033522605895996094, -0.029092788696289062, -0.02466297149658203, -0.020233154296875, -0.01580333709716797, -0.011373519897460938, -0.006943702697753906, -0.002513885498046875, 0.0019159317016601562, 0.0063457489013671875, 0.010775566101074219, 0.01520538330078125, 0.01963520050048828, 0.024065017700195312, 0.028494834899902344, 0.032924652099609375, 0.037354469299316406, 0.04178428649902344, 0.04621410369873047, 0.0506439208984375, 0.05507373809814453, 0.05950355529785156, 0.0639333724975586, 0.06836318969726562, 0.07279300689697266, 0.07722282409667969, 0.08165264129638672, 0.08608245849609375, 0.09051227569580078, 0.09494209289550781, 0.09937191009521484, 0.10380172729492188, 0.1082315444946289, 0.11266136169433594, 0.11709117889404297, 0.12152099609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 7.0, 9.0, 12.0, 25.0, 29.0, 51.0, 52.0, 103.0, 131.0, 192.0, 286.0, 358.0, 560.0, 783.0, 1292.0, 1842.0, 2831.0, 4471.0, 7053.0, 12028.0, 20252.0, 39932.0, 92713.0, 243741.0, 337054.0, 153821.0, 59574.0, 28106.0, 15564.0, 9165.0, 5810.0, 3525.0, 2326.0, 1636.0, 1011.0, 727.0, 426.0, 329.0, 215.0, 150.0, 100.0, 71.0, 52.0, 44.0, 34.0, 17.0, 9.0, 13.0, 12.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030853271484375, -0.02986621856689453, -0.028879165649414062, -0.027892112731933594, -0.026905059814453125, -0.025918006896972656, -0.024930953979492188, -0.02394390106201172, -0.02295684814453125, -0.02196979522705078, -0.020982742309570312, -0.019995689392089844, -0.019008636474609375, -0.018021583557128906, -0.017034530639648438, -0.01604747772216797, -0.0150604248046875, -0.014073371887207031, -0.013086318969726562, -0.012099266052246094, -0.011112213134765625, -0.010125160217285156, -0.009138107299804688, -0.008151054382324219, -0.00716400146484375, -0.006176948547363281, -0.0051898956298828125, -0.004202842712402344, -0.003215789794921875, -0.0022287368774414062, -0.0012416839599609375, -0.00025463104248046875, 0.000732421875, 0.0017194747924804688, 0.0027065277099609375, 0.0036935806274414062, 0.004680633544921875, 0.005667686462402344, 0.0066547393798828125, 0.007641792297363281, 0.00862884521484375, 0.009615898132324219, 0.010602951049804688, 0.011590003967285156, 0.012577056884765625, 0.013564109802246094, 0.014551162719726562, 0.015538215637207031, 0.0165252685546875, 0.01751232147216797, 0.018499374389648438, 0.019486427307128906, 0.020473480224609375, 0.021460533142089844, 0.022447586059570312, 0.02343463897705078, 0.02442169189453125, 0.02540874481201172, 0.026395797729492188, 0.027382850646972656, 0.028369903564453125, 0.029356956481933594, 0.030344009399414062, 0.03133106231689453, 0.032318115234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 8.0, 9.0, 11.0, 16.0, 17.0, 22.0, 27.0, 34.0, 48.0, 45.0, 66.0, 66.0, 100.0, 94.0, 82.0, 74.0, 42.0, 38.0, 34.0, 32.0, 20.0, 17.0, 21.0, 12.0, 5.0, 7.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.2928924560546875e-05, -5.153939127922058e-05, -5.014985799789429e-05, -4.876032471656799e-05, -4.73707914352417e-05, -4.5981258153915405e-05, -4.459172487258911e-05, -4.320219159126282e-05, -4.1812658309936523e-05, -4.042312502861023e-05, -3.9033591747283936e-05, -3.764405846595764e-05, -3.625452518463135e-05, -3.4864991903305054e-05, -3.347545862197876e-05, -3.2085925340652466e-05, -3.069639205932617e-05, -2.9306858777999878e-05, -2.7917325496673584e-05, -2.652779221534729e-05, -2.5138258934020996e-05, -2.3748725652694702e-05, -2.2359192371368408e-05, -2.0969659090042114e-05, -1.958012580871582e-05, -1.8190592527389526e-05, -1.6801059246063232e-05, -1.541152596473694e-05, -1.4021992683410645e-05, -1.263245940208435e-05, -1.1242926120758057e-05, -9.853392839431763e-06, -8.463859558105469e-06, -7.074326276779175e-06, -5.684792995452881e-06, -4.295259714126587e-06, -2.905726432800293e-06, -1.516193151473999e-06, -1.2665987014770508e-07, 1.2628734111785889e-06, 2.652406692504883e-06, 4.041939973831177e-06, 5.431473255157471e-06, 6.821006536483765e-06, 8.210539817810059e-06, 9.600073099136353e-06, 1.0989606380462646e-05, 1.237913966178894e-05, 1.3768672943115234e-05, 1.5158206224441528e-05, 1.6547739505767822e-05, 1.7937272787094116e-05, 1.932680606842041e-05, 2.0716339349746704e-05, 2.2105872631072998e-05, 2.3495405912399292e-05, 2.4884939193725586e-05, 2.627447247505188e-05, 2.7664005756378174e-05, 2.9053539037704468e-05, 3.0443072319030762e-05, 3.1832605600357056e-05, 3.322213888168335e-05, 3.4611672163009644e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 12.0, 8.0, 4.0, 16.0, 16.0, 28.0, 27.0, 49.0, 85.0, 133.0, 223.0, 330.0, 645.0, 1133.0, 2201.0, 4570.0, 9957.0, 23924.0, 71214.0, 265664.0, 445240.0, 149517.0, 43261.0, 16154.0, 6938.0, 3312.0, 1638.0, 895.0, 523.0, 298.0, 193.0, 123.0, 83.0, 56.0, 24.0, 16.0, 15.0, 9.0, 8.0, 8.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04400634765625, -0.04259967803955078, -0.04119300842285156, -0.039786338806152344, -0.038379669189453125, -0.036972999572753906, -0.03556632995605469, -0.03415966033935547, -0.03275299072265625, -0.03134632110595703, -0.029939651489257812, -0.028532981872558594, -0.027126312255859375, -0.025719642639160156, -0.024312973022460938, -0.02290630340576172, -0.0214996337890625, -0.02009296417236328, -0.018686294555664062, -0.017279624938964844, -0.015872955322265625, -0.014466285705566406, -0.013059616088867188, -0.011652946472167969, -0.01024627685546875, -0.008839607238769531, -0.0074329376220703125, -0.006026268005371094, -0.004619598388671875, -0.0032129287719726562, -0.0018062591552734375, -0.00039958953857421875, 0.001007080078125, 0.0024137496948242188, 0.0038204193115234375, 0.005227088928222656, 0.006633758544921875, 0.008040428161621094, 0.009447097778320312, 0.010853767395019531, 0.01226043701171875, 0.013667106628417969, 0.015073776245117188, 0.016480445861816406, 0.017887115478515625, 0.019293785095214844, 0.020700454711914062, 0.02210712432861328, 0.0235137939453125, 0.02492046356201172, 0.026327133178710938, 0.027733802795410156, 0.029140472412109375, 0.030547142028808594, 0.03195381164550781, 0.03336048126220703, 0.03476715087890625, 0.03617382049560547, 0.03758049011230469, 0.038987159729003906, 0.040393829345703125, 0.041800498962402344, 0.04320716857910156, 0.04461383819580078, 0.0460205078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 15.0, 15.0, 21.0, 36.0, 42.0, 39.0, 79.0, 84.0, 85.0, 99.0, 94.0, 90.0, 72.0, 35.0, 37.0, 24.0, 28.0, 14.0, 12.0, 6.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054107666015625, -0.05243062973022461, -0.05075359344482422, -0.04907655715942383, -0.04739952087402344, -0.04572248458862305, -0.044045448303222656, -0.042368412017822266, -0.040691375732421875, -0.039014339447021484, -0.037337303161621094, -0.0356602668762207, -0.03398323059082031, -0.03230619430541992, -0.03062915802001953, -0.02895212173461914, -0.02727508544921875, -0.02559804916381836, -0.02392101287841797, -0.022243976593017578, -0.020566940307617188, -0.018889904022216797, -0.017212867736816406, -0.015535831451416016, -0.013858795166015625, -0.012181758880615234, -0.010504722595214844, -0.008827686309814453, -0.0071506500244140625, -0.005473613739013672, -0.0037965774536132812, -0.0021195411682128906, -0.0004425048828125, 0.0012345314025878906, 0.0029115676879882812, 0.004588603973388672, 0.0062656402587890625, 0.007942676544189453, 0.009619712829589844, 0.011296749114990234, 0.012973785400390625, 0.014650821685791016, 0.016327857971191406, 0.018004894256591797, 0.019681930541992188, 0.021358966827392578, 0.02303600311279297, 0.02471303939819336, 0.02639007568359375, 0.02806711196899414, 0.02974414825439453, 0.03142118453979492, 0.03309822082519531, 0.0347752571105957, 0.036452293395996094, 0.038129329681396484, 0.039806365966796875, 0.041483402252197266, 0.043160438537597656, 0.04483747482299805, 0.04651451110839844, 0.04819154739379883, 0.04986858367919922, 0.05154561996459961, 0.05322265625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 27.0, 40.0, 82.0, 145.0, 170.0, 164.0, 152.0, 92.0, 46.0, 25.0, 13.0, 11.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8332950472831726, -0.8010374903678894, -0.7687799334526062, -0.736522376537323, -0.7042648196220398, -0.6720072627067566, -0.6397497057914734, -0.6074921488761902, -0.575234591960907, -0.5429770350456238, -0.5107194781303406, -0.4784619212150574, -0.44620436429977417, -0.41394680738449097, -0.38168925046920776, -0.34943169355392456, -0.31717413663864136, -0.28491657972335815, -0.25265902280807495, -0.22040146589279175, -0.18814390897750854, -0.15588635206222534, -0.12362879514694214, -0.09137123823165894, -0.05911368131637573, -0.02685612440109253, 0.005401432514190674, 0.03765898942947388, 0.06991654634475708, 0.10217410326004028, 0.1344316601753235, 0.1666892170906067, 0.19894683361053467, 0.23120439052581787, 0.2634619474411011, 0.2957195043563843, 0.3279770612716675, 0.3602346181869507, 0.3924921751022339, 0.4247497320175171, 0.4570072889328003, 0.4892648458480835, 0.5215224027633667, 0.5537799596786499, 0.5860375165939331, 0.6182950735092163, 0.6505526304244995, 0.6828101873397827, 0.7150677442550659, 0.7473253011703491, 0.7795828580856323, 0.8118404150009155, 0.8440979719161987, 0.8763555288314819, 0.9086130857467651, 0.9408706426620483, 0.9731281995773315, 1.0053857564926147, 1.037643313407898, 1.0699008703231812, 1.1021584272384644, 1.1344159841537476, 1.1666735410690308, 1.198931097984314, 1.2311886548995972]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 4.0, 10.0, 17.0, 15.0, 7.0, 14.0, 21.0, 20.0, 30.0, 27.0, 27.0, 27.0, 35.0, 32.0, 38.0, 32.0, 45.0, 39.0, 42.0, 43.0, 42.0, 32.0, 47.0, 40.0, 35.0, 26.0, 19.0, 30.0, 19.0, 40.0, 20.0, 12.0, 19.0, 15.0, 10.0, 11.0, 10.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.33496761322021484, -0.32481276988983154, -0.31465792655944824, -0.30450308322906494, -0.29434823989868164, -0.28419339656829834, -0.27403855323791504, -0.26388370990753174, -0.25372886657714844, -0.24357402324676514, -0.23341917991638184, -0.22326433658599854, -0.21310949325561523, -0.20295464992523193, -0.19279980659484863, -0.18264496326446533, -0.17249010503292084, -0.16233526170253754, -0.15218041837215424, -0.14202557504177094, -0.13187073171138763, -0.12171588838100433, -0.11156103760004044, -0.10140619426965714, -0.09125135093927383, -0.08109650760889053, -0.07094166427850723, -0.06078681722283363, -0.05063197389245033, -0.04047713056206703, -0.030322283506393433, -0.020167440176010132, -0.010012596845626831, 0.00014224741607904434, 0.01029709167778492, 0.02045193687081337, 0.03060678020119667, 0.04076162353157997, 0.05091647058725357, 0.06107131391763687, 0.07122615724802017, 0.08138100057840347, 0.09153584390878677, 0.10169069468975067, 0.11184553802013397, 0.12200038135051727, 0.13215522468090057, 0.14231006801128387, 0.15246491134166718, 0.16261975467205048, 0.17277459800243378, 0.18292944133281708, 0.19308428466320038, 0.20323912799358368, 0.21339398622512817, 0.22354882955551147, 0.23370367288589478, 0.24385851621627808, 0.2540133595466614, 0.2641682028770447, 0.274323046207428, 0.2844778895378113, 0.2946327328681946, 0.3047875761985779, 0.3149424195289612]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 13.0, 16.0, 27.0, 48.0, 96.0, 166.0, 360.0, 717.0, 1584.0, 4048.0, 11620.0, 43989.0, 401609.0, 3360010.0, 314181.0, 38726.0, 10508.0, 3822.0, 1440.0, 600.0, 318.0, 138.0, 90.0, 38.0, 30.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12363338470458984, -0.11970329284667969, -0.11577320098876953, -0.11184310913085938, -0.10791301727294922, -0.10398292541503906, -0.1000528335571289, -0.09612274169921875, -0.0921926498413086, -0.08826255798339844, -0.08433246612548828, -0.08040237426757812, -0.07647228240966797, -0.07254219055175781, -0.06861209869384766, -0.0646820068359375, -0.060751914978027344, -0.05682182312011719, -0.05289173126220703, -0.048961639404296875, -0.04503154754638672, -0.04110145568847656, -0.037171363830566406, -0.03324127197265625, -0.029311180114746094, -0.025381088256835938, -0.02145099639892578, -0.017520904541015625, -0.013590812683105469, -0.009660720825195312, -0.005730628967285156, -0.001800537109375, 0.0021295547485351562, 0.0060596466064453125, 0.009989738464355469, 0.013919830322265625, 0.01784992218017578, 0.021780014038085938, 0.025710105895996094, 0.02964019775390625, 0.033570289611816406, 0.03750038146972656, 0.04143047332763672, 0.045360565185546875, 0.04929065704345703, 0.05322074890136719, 0.057150840759277344, 0.0610809326171875, 0.06501102447509766, 0.06894111633300781, 0.07287120819091797, 0.07680130004882812, 0.08073139190673828, 0.08466148376464844, 0.0885915756225586, 0.09252166748046875, 0.0964517593383789, 0.10038185119628906, 0.10431194305419922, 0.10824203491210938, 0.11217212677001953, 0.11610221862792969, 0.12003231048583984, 0.12396240234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 8.0, 8.0, 16.0, 35.0, 27.0, 46.0, 56.0, 62.0, 63.0, 83.0, 72.0, 84.0, 68.0, 92.0, 74.0, 53.0, 38.0, 39.0, 24.0, 23.0, 11.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0615234375, -0.05948066711425781, -0.057437896728515625, -0.05539512634277344, -0.05335235595703125, -0.05130958557128906, -0.049266815185546875, -0.04722404479980469, -0.0451812744140625, -0.04313850402832031, -0.041095733642578125, -0.03905296325683594, -0.03701019287109375, -0.03496742248535156, -0.032924652099609375, -0.030881881713867188, -0.028839111328125, -0.026796340942382812, -0.024753570556640625, -0.022710800170898438, -0.02066802978515625, -0.018625259399414062, -0.016582489013671875, -0.014539718627929688, -0.0124969482421875, -0.010454177856445312, -0.008411407470703125, -0.0063686370849609375, -0.00432586669921875, -0.0022830963134765625, -0.000240325927734375, 0.0018024444580078125, 0.00384521484375, 0.0058879852294921875, 0.007930755615234375, 0.009973526000976562, 0.01201629638671875, 0.014059066772460938, 0.016101837158203125, 0.018144607543945312, 0.0201873779296875, 0.022230148315429688, 0.024272918701171875, 0.026315689086914062, 0.02835845947265625, 0.030401229858398438, 0.032444000244140625, 0.03448677062988281, 0.036529541015625, 0.03857231140136719, 0.040615081787109375, 0.04265785217285156, 0.04470062255859375, 0.04674339294433594, 0.048786163330078125, 0.05082893371582031, 0.0528717041015625, 0.05491447448730469, 0.056957244873046875, 0.05900001525878906, 0.06104278564453125, 0.06308555603027344, 0.06512832641601562, 0.06717109680175781, 0.0692138671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 13.0, 16.0, 29.0, 42.0, 50.0, 78.0, 124.0, 189.0, 274.0, 405.0, 635.0, 1030.0, 1692.0, 2758.0, 4907.0, 8724.0, 17208.0, 36746.0, 94399.0, 376144.0, 2704730.0, 714921.0, 134848.0, 48000.0, 21556.0, 10740.0, 5696.0, 3212.0, 1825.0, 1202.0, 716.0, 439.0, 334.0, 200.0, 141.0, 81.0, 52.0, 36.0, 31.0, 13.0, 16.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07293701171875, -0.07070350646972656, -0.06847000122070312, -0.06623649597167969, -0.06400299072265625, -0.06176948547363281, -0.059535980224609375, -0.05730247497558594, -0.0550689697265625, -0.05283546447753906, -0.050601959228515625, -0.04836845397949219, -0.04613494873046875, -0.04390144348144531, -0.041667938232421875, -0.03943443298339844, -0.037200927734375, -0.03496742248535156, -0.032733917236328125, -0.030500411987304688, -0.02826690673828125, -0.026033401489257812, -0.023799896240234375, -0.021566390991210938, -0.0193328857421875, -0.017099380493164062, -0.014865875244140625, -0.012632369995117188, -0.01039886474609375, -0.008165359497070312, -0.005931854248046875, -0.0036983489990234375, -0.00146484375, 0.0007686614990234375, 0.003002166748046875, 0.0052356719970703125, 0.00746917724609375, 0.009702682495117188, 0.011936187744140625, 0.014169692993164062, 0.0164031982421875, 0.018636703491210938, 0.020870208740234375, 0.023103713989257812, 0.02533721923828125, 0.027570724487304688, 0.029804229736328125, 0.03203773498535156, 0.034271240234375, 0.03650474548339844, 0.038738250732421875, 0.04097175598144531, 0.04320526123046875, 0.04543876647949219, 0.047672271728515625, 0.04990577697753906, 0.0521392822265625, 0.05437278747558594, 0.056606292724609375, 0.05883979797363281, 0.06107330322265625, 0.06330680847167969, 0.06554031372070312, 0.06777381896972656, 0.07000732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 16.0, 19.0, 27.0, 41.0, 49.0, 68.0, 96.0, 174.0, 312.0, 624.0, 987.0, 691.0, 326.0, 178.0, 131.0, 85.0, 50.0, 42.0, 25.0, 31.0, 13.0, 12.0, 13.0, 11.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.106201171875, -0.10312652587890625, -0.1000518798828125, -0.09697723388671875, -0.093902587890625, -0.09082794189453125, -0.0877532958984375, -0.08467864990234375, -0.08160400390625, -0.07852935791015625, -0.0754547119140625, -0.07238006591796875, -0.069305419921875, -0.06623077392578125, -0.0631561279296875, -0.06008148193359375, -0.0570068359375, -0.05393218994140625, -0.0508575439453125, -0.04778289794921875, -0.044708251953125, -0.04163360595703125, -0.0385589599609375, -0.03548431396484375, -0.03240966796875, -0.02933502197265625, -0.0262603759765625, -0.02318572998046875, -0.020111083984375, -0.01703643798828125, -0.0139617919921875, -0.01088714599609375, -0.0078125, -0.00473785400390625, -0.0016632080078125, 0.00141143798828125, 0.004486083984375, 0.00756072998046875, 0.0106353759765625, 0.01371002197265625, 0.01678466796875, 0.01985931396484375, 0.0229339599609375, 0.02600860595703125, 0.029083251953125, 0.03215789794921875, 0.0352325439453125, 0.03830718994140625, 0.0413818359375, 0.04445648193359375, 0.0475311279296875, 0.05060577392578125, 0.053680419921875, 0.05675506591796875, 0.0598297119140625, 0.06290435791015625, 0.06597900390625, 0.06905364990234375, 0.0721282958984375, 0.07520294189453125, 0.078277587890625, 0.08135223388671875, 0.0844268798828125, 0.08750152587890625, 0.090576171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 15.0, 9.0, 22.0, 37.0, 53.0, 85.0, 136.0, 116.0, 117.0, 127.0, 93.0, 54.0, 35.0, 36.0, 11.0, 12.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43688398599624634, -0.4169860780239105, -0.3970881700515747, -0.3771902918815613, -0.35729238390922546, -0.33739447593688965, -0.3174965977668762, -0.2975986897945404, -0.2777007818222046, -0.2578028738498688, -0.23790498077869415, -0.21800708770751953, -0.19810917973518372, -0.1782112717628479, -0.15831337869167328, -0.13841548562049866, -0.11851757764816284, -0.09861967712640762, -0.0787217766046524, -0.058823876082897186, -0.03892597556114197, -0.01902807503938675, 0.0008698254823684692, 0.02076771855354309, 0.040665626525878906, 0.060563527047634125, 0.08046142756938934, 0.10035932809114456, 0.12025722861289978, 0.1401551365852356, 0.16005302965641022, 0.17995092272758484, 0.19984877109527588, 0.2197466790676117, 0.23964457213878632, 0.25954246520996094, 0.27944037318229675, 0.29933828115463257, 0.319236159324646, 0.3391340672969818, 0.3590319752693176, 0.37892988324165344, 0.39882779121398926, 0.4187256693840027, 0.4386235773563385, 0.4585214853286743, 0.47841936349868774, 0.49831727147102356, 0.5182151794433594, 0.5381130576133728, 0.558010995388031, 0.5779088735580444, 0.5978068113327026, 0.6177046895027161, 0.6376025676727295, 0.6575005054473877, 0.6773983836174011, 0.6972962617874146, 0.7171941995620728, 0.7370920777320862, 0.7569899559020996, 0.7768878936767578, 0.7967857718467712, 0.8166836500167847, 0.8365815877914429]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 14.0, 9.0, 17.0, 19.0, 20.0, 28.0, 29.0, 34.0, 37.0, 42.0, 43.0, 35.0, 47.0, 58.0, 46.0, 38.0, 32.0, 31.0, 43.0, 40.0, 37.0, 26.0, 28.0, 46.0, 28.0, 22.0, 23.0, 27.0, 23.0, 8.0, 19.0, 10.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28855353593826294, -0.2785467505455017, -0.2685399353504181, -0.25853314995765686, -0.24852633476257324, -0.23851953446865082, -0.2285127341747284, -0.21850594878196716, -0.20849913358688354, -0.19849233329296112, -0.1884855329990387, -0.17847873270511627, -0.16847193241119385, -0.15846513211727142, -0.148458331823349, -0.13845154643058777, -0.12844474613666534, -0.11843794584274292, -0.1084311455488205, -0.09842434525489807, -0.08841754496097565, -0.07841074466705322, -0.0684039518237114, -0.05839715152978897, -0.04839035123586655, -0.03838355094194412, -0.028376752510666847, -0.018369954079389572, -0.008363153785467148, 0.0016436465084552765, 0.011650443077087402, 0.021657243371009827, 0.03166404366493225, 0.041670843958854675, 0.0516776442527771, 0.061684440821409225, 0.07169124484062195, 0.08169804513454437, 0.0917048379778862, 0.10171163827180862, 0.11171843856573105, 0.12172523885965347, 0.1317320317029953, 0.14173883199691772, 0.15174563229084015, 0.16175243258476257, 0.171759232878685, 0.18176603317260742, 0.19177283346652985, 0.20177963376045227, 0.2117864340543747, 0.22179323434829712, 0.23180003464221954, 0.24180683493614197, 0.2518136203289032, 0.2618204355239868, 0.27182722091674805, 0.2818340063095093, 0.2918408215045929, 0.3018476068973541, 0.31185442209243774, 0.321861207485199, 0.3318680226802826, 0.3418748080730438, 0.35188162326812744]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 17.0, 18.0, 39.0, 50.0, 91.0, 112.0, 167.0, 266.0, 425.0, 723.0, 1211.0, 2164.0, 3935.0, 7215.0, 13647.0, 27155.0, 56742.0, 121500.0, 238082.0, 273867.0, 155789.0, 73413.0, 34714.0, 16966.0, 8868.0, 4922.0, 2665.0, 1494.0, 853.0, 519.0, 349.0, 187.0, 123.0, 73.0, 64.0, 27.0, 26.0, 17.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.06998825073242188, -0.06758880615234375, -0.06518936157226562, -0.0627899169921875, -0.060390472412109375, -0.05799102783203125, -0.055591583251953125, -0.053192138671875, -0.050792694091796875, -0.04839324951171875, -0.045993804931640625, -0.0435943603515625, -0.041194915771484375, -0.03879547119140625, -0.036396026611328125, -0.03399658203125, -0.031597137451171875, -0.02919769287109375, -0.026798248291015625, -0.0243988037109375, -0.021999359130859375, -0.01959991455078125, -0.017200469970703125, -0.014801025390625, -0.012401580810546875, -0.01000213623046875, -0.007602691650390625, -0.0052032470703125, -0.002803802490234375, -0.00040435791015625, 0.001995086669921875, 0.00439453125, 0.006793975830078125, 0.00919342041015625, 0.011592864990234375, 0.0139923095703125, 0.016391754150390625, 0.01879119873046875, 0.021190643310546875, 0.023590087890625, 0.025989532470703125, 0.02838897705078125, 0.030788421630859375, 0.0331878662109375, 0.035587310791015625, 0.03798675537109375, 0.040386199951171875, 0.04278564453125, 0.045185089111328125, 0.04758453369140625, 0.049983978271484375, 0.0523834228515625, 0.054782867431640625, 0.05718231201171875, 0.059581756591796875, 0.061981201171875, 0.06438064575195312, 0.06678009033203125, 0.06917953491210938, 0.0715789794921875, 0.07397842407226562, 0.07637786865234375, 0.07877731323242188, 0.0811767578125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 4.0, 11.0, 14.0, 20.0, 25.0, 41.0, 44.0, 53.0, 48.0, 54.0, 70.0, 58.0, 65.0, 68.0, 62.0, 63.0, 57.0, 47.0, 47.0, 28.0, 32.0, 19.0, 16.0, 15.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056610107421875, -0.054692745208740234, -0.05277538299560547, -0.0508580207824707, -0.04894065856933594, -0.04702329635620117, -0.045105934143066406, -0.04318857192993164, -0.041271209716796875, -0.03935384750366211, -0.037436485290527344, -0.03551912307739258, -0.03360176086425781, -0.03168439865112305, -0.02976703643798828, -0.027849674224853516, -0.02593231201171875, -0.024014949798583984, -0.02209758758544922, -0.020180225372314453, -0.018262863159179688, -0.016345500946044922, -0.014428138732910156, -0.01251077651977539, -0.010593414306640625, -0.00867605209350586, -0.006758689880371094, -0.004841327667236328, -0.0029239654541015625, -0.0010066032409667969, 0.0009107589721679688, 0.0028281211853027344, 0.0047454833984375, 0.006662845611572266, 0.008580207824707031, 0.010497570037841797, 0.012414932250976562, 0.014332294464111328, 0.016249656677246094, 0.01816701889038086, 0.020084381103515625, 0.02200174331665039, 0.023919105529785156, 0.025836467742919922, 0.027753829956054688, 0.029671192169189453, 0.03158855438232422, 0.033505916595458984, 0.03542327880859375, 0.037340641021728516, 0.03925800323486328, 0.04117536544799805, 0.04309272766113281, 0.04501008987426758, 0.046927452087402344, 0.04884481430053711, 0.050762176513671875, 0.05267953872680664, 0.054596900939941406, 0.05651426315307617, 0.05843162536621094, 0.0603489875793457, 0.06226634979248047, 0.06418371200561523, 0.06610107421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 14.0, 8.0, 20.0, 16.0, 29.0, 53.0, 52.0, 119.0, 168.0, 280.0, 436.0, 775.0, 1372.0, 2488.0, 4609.0, 9359.0, 20640.0, 51974.0, 154214.0, 429455.0, 241025.0, 76934.0, 28800.0, 12571.0, 5841.0, 3112.0, 1712.0, 992.0, 572.0, 310.0, 204.0, 111.0, 81.0, 55.0, 42.0, 25.0, 23.0, 17.0, 5.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10910606384277344, -0.10566329956054688, -0.10222053527832031, -0.09877777099609375, -0.09533500671386719, -0.09189224243164062, -0.08844947814941406, -0.0850067138671875, -0.08156394958496094, -0.07812118530273438, -0.07467842102050781, -0.07123565673828125, -0.06779289245605469, -0.06435012817382812, -0.06090736389160156, -0.057464599609375, -0.05402183532714844, -0.050579071044921875, -0.04713630676269531, -0.04369354248046875, -0.04025077819824219, -0.036808013916015625, -0.03336524963378906, -0.0299224853515625, -0.026479721069335938, -0.023036956787109375, -0.019594192504882812, -0.01615142822265625, -0.012708663940429688, -0.009265899658203125, -0.0058231353759765625, -0.00238037109375, 0.0010623931884765625, 0.004505157470703125, 0.007947921752929688, 0.01139068603515625, 0.014833450317382812, 0.018276214599609375, 0.021718978881835938, 0.0251617431640625, 0.028604507446289062, 0.032047271728515625, 0.03549003601074219, 0.03893280029296875, 0.04237556457519531, 0.045818328857421875, 0.04926109313964844, 0.052703857421875, 0.05614662170410156, 0.059589385986328125, 0.06303215026855469, 0.06647491455078125, 0.06991767883300781, 0.07336044311523438, 0.07680320739746094, 0.0802459716796875, 0.08368873596191406, 0.08713150024414062, 0.09057426452636719, 0.09401702880859375, 0.09745979309082031, 0.10090255737304688, 0.10434532165527344, 0.1077880859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 12.0, 15.0, 16.0, 19.0, 30.0, 29.0, 53.0, 49.0, 34.0, 46.0, 58.0, 67.0, 69.0, 60.0, 60.0, 48.0, 44.0, 46.0, 39.0, 35.0, 31.0, 18.0, 17.0, 17.0, 12.0, 8.0, 6.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1761474609375, -0.1710338592529297, -0.16592025756835938, -0.16080665588378906, -0.15569305419921875, -0.15057945251464844, -0.14546585083007812, -0.1403522491455078, -0.1352386474609375, -0.1301250457763672, -0.12501144409179688, -0.11989784240722656, -0.11478424072265625, -0.10967063903808594, -0.10455703735351562, -0.09944343566894531, -0.094329833984375, -0.08921623229980469, -0.08410263061523438, -0.07898902893066406, -0.07387542724609375, -0.06876182556152344, -0.06364822387695312, -0.05853462219238281, -0.0534210205078125, -0.04830741882324219, -0.043193817138671875, -0.03808021545410156, -0.03296661376953125, -0.027853012084960938, -0.022739410400390625, -0.017625808715820312, -0.01251220703125, -0.0073986053466796875, -0.002285003662109375, 0.0028285980224609375, 0.00794219970703125, 0.013055801391601562, 0.018169403076171875, 0.023283004760742188, 0.0283966064453125, 0.03351020812988281, 0.038623809814453125, 0.04373741149902344, 0.04885101318359375, 0.05396461486816406, 0.059078216552734375, 0.06419181823730469, 0.069305419921875, 0.07441902160644531, 0.07953262329101562, 0.08464622497558594, 0.08975982666015625, 0.09487342834472656, 0.09998703002929688, 0.10510063171386719, 0.1102142333984375, 0.11532783508300781, 0.12044143676757812, 0.12555503845214844, 0.13066864013671875, 0.13578224182128906, 0.14089584350585938, 0.1460094451904297, 0.151123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 10.0, 15.0, 26.0, 31.0, 54.0, 67.0, 108.0, 138.0, 220.0, 351.0, 561.0, 851.0, 1502.0, 2565.0, 4645.0, 9494.0, 21617.0, 60771.0, 219248.0, 480759.0, 162695.0, 47133.0, 17812.0, 8048.0, 4083.0, 2232.0, 1279.0, 780.0, 480.0, 308.0, 195.0, 138.0, 110.0, 85.0, 33.0, 27.0, 18.0, 17.0, 14.0, 7.0, 2.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.034844398498535156, -0.03361701965332031, -0.03238964080810547, -0.031162261962890625, -0.02993488311767578, -0.028707504272460938, -0.027480125427246094, -0.02625274658203125, -0.025025367736816406, -0.023797988891601562, -0.02257061004638672, -0.021343231201171875, -0.02011585235595703, -0.018888473510742188, -0.017661094665527344, -0.0164337158203125, -0.015206336975097656, -0.013978958129882812, -0.012751579284667969, -0.011524200439453125, -0.010296821594238281, -0.009069442749023438, -0.007842063903808594, -0.00661468505859375, -0.005387306213378906, -0.0041599273681640625, -0.0029325485229492188, -0.001705169677734375, -0.00047779083251953125, 0.0007495880126953125, 0.0019769668579101562, 0.003204345703125, 0.004431724548339844, 0.0056591033935546875, 0.006886482238769531, 0.008113861083984375, 0.009341239929199219, 0.010568618774414062, 0.011795997619628906, 0.01302337646484375, 0.014250755310058594, 0.015478134155273438, 0.01670551300048828, 0.017932891845703125, 0.01916027069091797, 0.020387649536132812, 0.021615028381347656, 0.0228424072265625, 0.024069786071777344, 0.025297164916992188, 0.02652454376220703, 0.027751922607421875, 0.02897930145263672, 0.030206680297851562, 0.031434059143066406, 0.03266143798828125, 0.033888816833496094, 0.03511619567871094, 0.03634357452392578, 0.037570953369140625, 0.03879833221435547, 0.04002571105957031, 0.041253089904785156, 0.04248046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 4.0, 8.0, 6.0, 7.0, 13.0, 8.0, 24.0, 21.0, 33.0, 24.0, 39.0, 35.0, 45.0, 51.0, 56.0, 78.0, 61.0, 76.0, 61.0, 58.0, 53.0, 50.0, 36.0, 22.0, 26.0, 22.0, 22.0, 13.0, 16.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.863032907247543e-05, -3.726594150066376e-05, -3.590155392885208e-05, -3.4537166357040405e-05, -3.317277878522873e-05, -3.180839121341705e-05, -3.0444003641605377e-05, -2.90796160697937e-05, -2.7715228497982025e-05, -2.635084092617035e-05, -2.4986453354358673e-05, -2.3622065782546997e-05, -2.225767821073532e-05, -2.0893290638923645e-05, -1.952890306711197e-05, -1.8164515495300293e-05, -1.6800127923488617e-05, -1.543574035167694e-05, -1.4071352779865265e-05, -1.2706965208053589e-05, -1.1342577636241913e-05, -9.978190064430237e-06, -8.61380249261856e-06, -7.249414920806885e-06, -5.885027348995209e-06, -4.520639777183533e-06, -3.1562522053718567e-06, -1.7918646335601807e-06, -4.2747706174850464e-07, 9.369105100631714e-07, 2.3012980818748474e-06, 3.6656856536865234e-06, 5.0300732254981995e-06, 6.3944607973098755e-06, 7.758848369121552e-06, 9.123235940933228e-06, 1.0487623512744904e-05, 1.185201108455658e-05, 1.3216398656368256e-05, 1.4580786228179932e-05, 1.5945173799991608e-05, 1.7309561371803284e-05, 1.867394894361496e-05, 2.0038336515426636e-05, 2.1402724087238312e-05, 2.2767111659049988e-05, 2.4131499230861664e-05, 2.549588680267334e-05, 2.6860274374485016e-05, 2.8224661946296692e-05, 2.9589049518108368e-05, 3.0953437089920044e-05, 3.231782466173172e-05, 3.3682212233543396e-05, 3.504659980535507e-05, 3.641098737716675e-05, 3.7775374948978424e-05, 3.91397625207901e-05, 4.0504150092601776e-05, 4.186853766441345e-05, 4.323292523622513e-05, 4.4597312808036804e-05, 4.596170037984848e-05, 4.7326087951660156e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 11.0, 14.0, 14.0, 19.0, 24.0, 54.0, 55.0, 84.0, 140.0, 262.0, 406.0, 803.0, 1381.0, 2511.0, 5144.0, 11549.0, 27556.0, 78636.0, 250657.0, 430372.0, 153850.0, 49937.0, 18845.0, 8065.0, 3829.0, 1905.0, 984.0, 564.0, 329.0, 211.0, 120.0, 83.0, 65.0, 26.0, 14.0, 14.0, 10.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.038726806640625, -0.037659645080566406, -0.03659248352050781, -0.03552532196044922, -0.034458160400390625, -0.03339099884033203, -0.03232383728027344, -0.031256675720214844, -0.03018951416015625, -0.029122352600097656, -0.028055191040039062, -0.02698802947998047, -0.025920867919921875, -0.02485370635986328, -0.023786544799804688, -0.022719383239746094, -0.0216522216796875, -0.020585060119628906, -0.019517898559570312, -0.01845073699951172, -0.017383575439453125, -0.01631641387939453, -0.015249252319335938, -0.014182090759277344, -0.01311492919921875, -0.012047767639160156, -0.010980606079101562, -0.009913444519042969, -0.008846282958984375, -0.007779121398925781, -0.0067119598388671875, -0.005644798278808594, -0.00457763671875, -0.0035104751586914062, -0.0024433135986328125, -0.0013761520385742188, -0.000308990478515625, 0.0007581710815429688, 0.0018253326416015625, 0.0028924942016601562, 0.00395965576171875, 0.005026817321777344, 0.0060939788818359375, 0.007161140441894531, 0.008228302001953125, 0.009295463562011719, 0.010362625122070312, 0.011429786682128906, 0.0124969482421875, 0.013564109802246094, 0.014631271362304688, 0.01569843292236328, 0.016765594482421875, 0.01783275604248047, 0.018899917602539062, 0.019967079162597656, 0.02103424072265625, 0.022101402282714844, 0.023168563842773438, 0.02423572540283203, 0.025302886962890625, 0.02637004852294922, 0.027437210083007812, 0.028504371643066406, 0.029571533203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 2.0, 14.0, 23.0, 23.0, 31.0, 46.0, 69.0, 107.0, 132.0, 100.0, 119.0, 91.0, 72.0, 43.0, 35.0, 22.0, 15.0, 12.0, 5.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0582275390625, -0.056382179260253906, -0.05453681945800781, -0.05269145965576172, -0.050846099853515625, -0.04900074005126953, -0.04715538024902344, -0.045310020446777344, -0.04346466064453125, -0.041619300842285156, -0.03977394104003906, -0.03792858123779297, -0.036083221435546875, -0.03423786163330078, -0.03239250183105469, -0.030547142028808594, -0.0287017822265625, -0.026856422424316406, -0.025011062622070312, -0.02316570281982422, -0.021320343017578125, -0.01947498321533203, -0.017629623413085938, -0.015784263610839844, -0.01393890380859375, -0.012093544006347656, -0.010248184204101562, -0.008402824401855469, -0.006557464599609375, -0.004712104797363281, -0.0028667449951171875, -0.0010213851928710938, 0.000823974609375, 0.0026693344116210938, 0.0045146942138671875, 0.006360054016113281, 0.008205413818359375, 0.010050773620605469, 0.011896133422851562, 0.013741493225097656, 0.01558685302734375, 0.017432212829589844, 0.019277572631835938, 0.02112293243408203, 0.022968292236328125, 0.02481365203857422, 0.026659011840820312, 0.028504371643066406, 0.0303497314453125, 0.032195091247558594, 0.03404045104980469, 0.03588581085205078, 0.037731170654296875, 0.03957653045654297, 0.04142189025878906, 0.043267250061035156, 0.04511260986328125, 0.046957969665527344, 0.04880332946777344, 0.05064868927001953, 0.052494049072265625, 0.05433940887451172, 0.05618476867675781, 0.058030128479003906, 0.05987548828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 7.0, 7.0, 20.0, 21.0, 50.0, 93.0, 147.0, 183.0, 181.0, 120.0, 76.0, 48.0, 19.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2651619911193848, -1.2298510074615479, -1.194540023803711, -1.1592289209365845, -1.1239179372787476, -1.0886069536209106, -1.0532959699630737, -1.0179849863052368, -0.9826739430427551, -0.9473629593849182, -0.9120519161224365, -0.8767409324645996, -0.8414299488067627, -0.806118905544281, -0.7708079218864441, -0.7354968786239624, -0.7001858949661255, -0.6648749113082886, -0.6295638680458069, -0.59425288438797, -0.5589418411254883, -0.5236308574676514, -0.48831987380981445, -0.45300886034965515, -0.41769784688949585, -0.38238683342933655, -0.34707581996917725, -0.31176483631134033, -0.27645382285118103, -0.24114280939102173, -0.20583181083202362, -0.1705208122730255, -0.13520967960357666, -0.09989867359399796, -0.06458766758441925, -0.029276661574840546, 0.006034344434738159, 0.04134535789489746, 0.07665635645389557, 0.11196735501289368, 0.14727836847305298, 0.18258938193321228, 0.2179003804922104, 0.2532113790512085, 0.2885223925113678, 0.3238334059715271, 0.359144389629364, 0.3944554030895233, 0.4297664165496826, 0.4650774300098419, 0.5003884434700012, 0.5356994271278381, 0.5710104703903198, 0.6063214540481567, 0.6416324377059937, 0.6769434213638306, 0.7122544646263123, 0.7475654482841492, 0.7828764915466309, 0.8181874752044678, 0.8534984588623047, 0.8888095021247864, 0.9241204857826233, 0.959431529045105, 0.9947425127029419]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 18.0, 16.0, 13.0, 21.0, 23.0, 17.0, 28.0, 34.0, 39.0, 28.0, 30.0, 42.0, 54.0, 49.0, 50.0, 51.0, 39.0, 44.0, 43.0, 46.0, 34.0, 33.0, 37.0, 26.0, 30.0, 31.0, 19.0, 12.0, 10.0, 5.0, 13.0, 6.0, 6.0, 3.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4245501756668091, -0.4117284119129181, -0.3989066481590271, -0.3860848844051361, -0.3732631206512451, -0.36044132709503174, -0.34761959314346313, -0.33479779958724976, -0.32197603583335876, -0.3091542720794678, -0.2963325083255768, -0.2835107445716858, -0.2706889808177948, -0.2578672170639038, -0.24504543840885162, -0.23222365975379944, -0.21940191090106964, -0.20658014714717865, -0.19375838339328766, -0.18093660473823547, -0.16811484098434448, -0.1552930772304535, -0.1424713134765625, -0.1296495497226715, -0.11682777851819992, -0.10400601476430893, -0.09118424355983734, -0.07836247980594635, -0.06554071605205536, -0.05271894484758377, -0.03989718109369278, -0.02707540988922119, -0.0142536461353302, -0.0014318795874714851, 0.01138988696038723, 0.02421165257692337, 0.03703342005610466, 0.04985518753528595, 0.06267695128917694, 0.07549872249364853, 0.08832048624753952, 0.10114225000143051, 0.1139640212059021, 0.1267857849597931, 0.13960754871368408, 0.15242931246757507, 0.16525107622146606, 0.17807285487651825, 0.19089461863040924, 0.20371638238430023, 0.21653814613819122, 0.2293599247932434, 0.2421816885471344, 0.2550034523010254, 0.2678252160549164, 0.2806469798088074, 0.29346874356269836, 0.30629050731658936, 0.31911227107048035, 0.33193403482437134, 0.34475579857826233, 0.3575775623321533, 0.3703993558883667, 0.3832211196422577, 0.3960428833961487]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 9.0, 8.0, 12.0, 18.0, 20.0, 35.0, 46.0, 82.0, 113.0, 201.0, 429.0, 769.0, 1888.0, 4982.0, 14796.0, 53477.0, 278045.0, 2130372.0, 1470252.0, 179908.0, 39383.0, 11815.0, 4182.0, 1618.0, 788.0, 377.0, 210.0, 158.0, 64.0, 38.0, 62.0, 29.0, 20.0, 19.0, 12.0, 6.0, 9.0, 6.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1522216796875, -0.1472930908203125, -0.142364501953125, -0.1374359130859375, -0.13250732421875, -0.1275787353515625, -0.122650146484375, -0.1177215576171875, -0.11279296875, -0.1078643798828125, -0.102935791015625, -0.0980072021484375, -0.09307861328125, -0.0881500244140625, -0.083221435546875, -0.0782928466796875, -0.0733642578125, -0.0684356689453125, -0.063507080078125, -0.0585784912109375, -0.05364990234375, -0.0487213134765625, -0.043792724609375, -0.0388641357421875, -0.033935546875, -0.0290069580078125, -0.024078369140625, -0.0191497802734375, -0.01422119140625, -0.0092926025390625, -0.004364013671875, 0.0005645751953125, 0.0054931640625, 0.0104217529296875, 0.015350341796875, 0.0202789306640625, 0.02520751953125, 0.0301361083984375, 0.035064697265625, 0.0399932861328125, 0.044921875, 0.0498504638671875, 0.054779052734375, 0.0597076416015625, 0.06463623046875, 0.0695648193359375, 0.074493408203125, 0.0794219970703125, 0.0843505859375, 0.0892791748046875, 0.094207763671875, 0.0991363525390625, 0.10406494140625, 0.1089935302734375, 0.113922119140625, 0.1188507080078125, 0.123779296875, 0.1287078857421875, 0.133636474609375, 0.1385650634765625, 0.14349365234375, 0.1484222412109375, 0.153350830078125, 0.1582794189453125, 0.1632080078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 12.0, 8.0, 15.0, 25.0, 26.0, 35.0, 46.0, 55.0, 49.0, 63.0, 73.0, 56.0, 76.0, 72.0, 76.0, 78.0, 64.0, 46.0, 31.0, 31.0, 23.0, 14.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.061908721923828125, -0.05985260009765625, -0.057796478271484375, -0.0557403564453125, -0.053684234619140625, -0.05162811279296875, -0.049571990966796875, -0.047515869140625, -0.045459747314453125, -0.04340362548828125, -0.041347503662109375, -0.0392913818359375, -0.037235260009765625, -0.03517913818359375, -0.033123016357421875, -0.03106689453125, -0.029010772705078125, -0.02695465087890625, -0.024898529052734375, -0.0228424072265625, -0.020786285400390625, -0.01873016357421875, -0.016674041748046875, -0.014617919921875, -0.012561798095703125, -0.01050567626953125, -0.008449554443359375, -0.0063934326171875, -0.004337310791015625, -0.00228118896484375, -0.000225067138671875, 0.0018310546875, 0.003887176513671875, 0.00594329833984375, 0.007999420166015625, 0.0100555419921875, 0.012111663818359375, 0.01416778564453125, 0.016223907470703125, 0.018280029296875, 0.020336151123046875, 0.02239227294921875, 0.024448394775390625, 0.0265045166015625, 0.028560638427734375, 0.03061676025390625, 0.032672882080078125, 0.03472900390625, 0.036785125732421875, 0.03884124755859375, 0.040897369384765625, 0.0429534912109375, 0.045009613037109375, 0.04706573486328125, 0.049121856689453125, 0.051177978515625, 0.053234100341796875, 0.05529022216796875, 0.057346343994140625, 0.0594024658203125, 0.061458587646484375, 0.06351470947265625, 0.06557083129882812, 0.067626953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 17.0, 33.0, 55.0, 101.0, 222.0, 439.0, 1011.0, 3162.0, 14009.0, 173742.0, 3778692.0, 202458.0, 14990.0, 3275.0, 1210.0, 422.0, 203.0, 101.0, 48.0, 29.0, 18.0, 12.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3075752258300781, -0.29679107666015625, -0.2860069274902344, -0.2752227783203125, -0.2644386291503906, -0.25365447998046875, -0.24287033081054688, -0.232086181640625, -0.22130203247070312, -0.21051788330078125, -0.19973373413085938, -0.1889495849609375, -0.17816543579101562, -0.16738128662109375, -0.15659713745117188, -0.14581298828125, -0.13502883911132812, -0.12424468994140625, -0.11346054077148438, -0.1026763916015625, -0.09189224243164062, -0.08110809326171875, -0.07032394409179688, -0.059539794921875, -0.048755645751953125, -0.03797149658203125, -0.027187347412109375, -0.0164031982421875, -0.005619049072265625, 0.00516510009765625, 0.015949249267578125, 0.0267333984375, 0.037517547607421875, 0.04830169677734375, 0.059085845947265625, 0.0698699951171875, 0.08065414428710938, 0.09143829345703125, 0.10222244262695312, 0.113006591796875, 0.12379074096679688, 0.13457489013671875, 0.14535903930664062, 0.1561431884765625, 0.16692733764648438, 0.17771148681640625, 0.18849563598632812, 0.19927978515625, 0.21006393432617188, 0.22084808349609375, 0.23163223266601562, 0.2424163818359375, 0.2532005310058594, 0.26398468017578125, 0.2747688293457031, 0.285552978515625, 0.2963371276855469, 0.30712127685546875, 0.3179054260253906, 0.3286895751953125, 0.3394737243652344, 0.35025787353515625, 0.3610420227050781, 0.371826171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 18.0, 24.0, 35.0, 38.0, 62.0, 137.0, 181.0, 311.0, 433.0, 599.0, 663.0, 546.0, 342.0, 231.0, 149.0, 91.0, 69.0, 37.0, 26.0, 20.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2386474609375, -0.23171043395996094, -0.22477340698242188, -0.2178363800048828, -0.21089935302734375, -0.2039623260498047, -0.19702529907226562, -0.19008827209472656, -0.1831512451171875, -0.17621421813964844, -0.16927719116210938, -0.1623401641845703, -0.15540313720703125, -0.1484661102294922, -0.14152908325195312, -0.13459205627441406, -0.127655029296875, -0.12071800231933594, -0.11378097534179688, -0.10684394836425781, -0.09990692138671875, -0.09296989440917969, -0.08603286743164062, -0.07909584045410156, -0.0721588134765625, -0.06522178649902344, -0.058284759521484375, -0.05134773254394531, -0.04441070556640625, -0.03747367858886719, -0.030536651611328125, -0.023599624633789062, -0.01666259765625, -0.009725570678710938, -0.002788543701171875, 0.0041484832763671875, 0.01108551025390625, 0.018022537231445312, 0.024959564208984375, 0.03189659118652344, 0.0388336181640625, 0.04577064514160156, 0.052707672119140625, 0.05964469909667969, 0.06658172607421875, 0.07351875305175781, 0.08045578002929688, 0.08739280700683594, 0.094329833984375, 0.10126686096191406, 0.10820388793945312, 0.11514091491699219, 0.12207794189453125, 0.1290149688720703, 0.13595199584960938, 0.14288902282714844, 0.1498260498046875, 0.15676307678222656, 0.16370010375976562, 0.1706371307373047, 0.17757415771484375, 0.1845111846923828, 0.19144821166992188, 0.19838523864746094, 0.205322265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 9.0, 28.0, 32.0, 133.0, 273.0, 301.0, 120.0, 49.0, 21.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44143009185791, -4.249141693115234, -4.056853294372559, -3.8645644187927246, -3.672276020050049, -3.479987621307373, -3.287698984146118, -3.0954103469848633, -2.9031219482421875, -2.7108335494995117, -2.518544912338257, -2.326256275177002, -2.133967876434326, -1.9416793584823608, -1.7493908405303955, -1.5571023225784302, -1.3648138046264648, -1.1725252866744995, -0.9802367687225342, -0.7879482507705688, -0.5956597328186035, -0.4033712148666382, -0.21108269691467285, -0.01879417896270752, 0.1734943389892578, 0.36578285694122314, 0.5580713748931885, 0.7503598928451538, 0.9426484107971191, 1.1349369287490845, 1.3272254467010498, 1.5195139646530151, 1.7118024826049805, 1.9040910005569458, 2.096379518508911, 2.288668155670166, 2.480956554412842, 2.6732449531555176, 2.8655335903167725, 3.0578222274780273, 3.250110626220703, 3.442399024963379, 3.634687662124634, 3.8269762992858887, 4.0192646980285645, 4.21155309677124, 4.403841972351074, 4.59613037109375, 4.788418769836426, 4.980707168579102, 5.172995567321777, 5.365284442901611, 5.557572841644287, 5.749861240386963, 5.942150115966797, 6.134438514709473, 6.326726913452148, 6.519015312194824, 6.7113037109375, 6.903592586517334, 7.09588098526001, 7.2881693840026855, 7.4804582595825195, 7.672746658325195, 7.865035057067871]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 14.0, 14.0, 22.0, 33.0, 31.0, 42.0, 52.0, 68.0, 70.0, 71.0, 74.0, 83.0, 70.0, 66.0, 55.0, 49.0, 44.0, 29.0, 27.0, 17.0, 17.0, 11.0, 6.0, 5.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6712656021118164, -1.6157715320587158, -1.5602774620056152, -1.5047833919525146, -1.449289321899414, -1.3937952518463135, -1.338301181793213, -1.2828071117401123, -1.2273130416870117, -1.1718189716339111, -1.1163249015808105, -1.06083083152771, -1.0053367614746094, -0.9498426914215088, -0.8943486213684082, -0.8388545513153076, -0.783360481262207, -0.7278664112091064, -0.6723723411560059, -0.6168782711029053, -0.5613842010498047, -0.5058901309967041, -0.4503960609436035, -0.39490199089050293, -0.33940792083740234, -0.28391385078430176, -0.22841978073120117, -0.17292571067810059, -0.117431640625, -0.061937570571899414, -0.006443500518798828, 0.04905056953430176, 0.10454463958740234, 0.16003870964050293, 0.21553277969360352, 0.2710268497467041, 0.3265209197998047, 0.3820149898529053, 0.43750905990600586, 0.49300312995910645, 0.548497200012207, 0.6039912700653076, 0.6594853401184082, 0.7149794101715088, 0.7704734802246094, 0.82596755027771, 0.8814616203308105, 0.9369556903839111, 0.9924497604370117, 1.0479438304901123, 1.103437900543213, 1.1589319705963135, 1.214426040649414, 1.2699201107025146, 1.3254141807556152, 1.3809082508087158, 1.4364023208618164, 1.491896390914917, 1.5473904609680176, 1.6028845310211182, 1.6583786010742188, 1.7138726711273193, 1.76936674118042, 1.8248608112335205, 1.880354881286621]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 11.0, 12.0, 17.0, 27.0, 30.0, 41.0, 67.0, 97.0, 167.0, 226.0, 394.0, 696.0, 1232.0, 2262.0, 5014.0, 11881.0, 32827.0, 116354.0, 413395.0, 332257.0, 87123.0, 25909.0, 9540.0, 4225.0, 2017.0, 1049.0, 584.0, 364.0, 237.0, 160.0, 96.0, 68.0, 41.0, 33.0, 20.0, 11.0, 12.0, 9.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.13869857788085938, -0.13420867919921875, -0.12971878051757812, -0.1252288818359375, -0.12073898315429688, -0.11624908447265625, -0.11175918579101562, -0.107269287109375, -0.10277938842773438, -0.09828948974609375, -0.09379959106445312, -0.0893096923828125, -0.08481979370117188, -0.08032989501953125, -0.07583999633789062, -0.07135009765625, -0.06686019897460938, -0.06237030029296875, -0.057880401611328125, -0.0533905029296875, -0.048900604248046875, -0.04441070556640625, -0.039920806884765625, -0.035430908203125, -0.030941009521484375, -0.02645111083984375, -0.021961212158203125, -0.0174713134765625, -0.012981414794921875, -0.00849151611328125, -0.004001617431640625, 0.00048828125, 0.004978179931640625, 0.00946807861328125, 0.013957977294921875, 0.0184478759765625, 0.022937774658203125, 0.02742767333984375, 0.031917572021484375, 0.036407470703125, 0.040897369384765625, 0.04538726806640625, 0.049877166748046875, 0.0543670654296875, 0.058856964111328125, 0.06334686279296875, 0.06783676147460938, 0.07232666015625, 0.07681655883789062, 0.08130645751953125, 0.08579635620117188, 0.0902862548828125, 0.09477615356445312, 0.09926605224609375, 0.10375595092773438, 0.108245849609375, 0.11273574829101562, 0.11722564697265625, 0.12171554565429688, 0.1262054443359375, 0.13069534301757812, 0.13518524169921875, 0.13967514038085938, 0.1441650390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 14.0, 20.0, 33.0, 30.0, 41.0, 61.0, 65.0, 76.0, 85.0, 91.0, 79.0, 85.0, 76.0, 51.0, 42.0, 29.0, 22.0, 22.0, 15.0, 12.0, 9.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13518524169921875, -0.1304779052734375, -0.12577056884765625, -0.121063232421875, -0.11635589599609375, -0.1116485595703125, -0.10694122314453125, -0.10223388671875, -0.09752655029296875, -0.0928192138671875, -0.08811187744140625, -0.083404541015625, -0.07869720458984375, -0.0739898681640625, -0.06928253173828125, -0.0645751953125, -0.05986785888671875, -0.0551605224609375, -0.05045318603515625, -0.045745849609375, -0.04103851318359375, -0.0363311767578125, -0.03162384033203125, -0.02691650390625, -0.02220916748046875, -0.0175018310546875, -0.01279449462890625, -0.008087158203125, -0.00337982177734375, 0.0013275146484375, 0.00603485107421875, 0.0107421875, 0.01544952392578125, 0.0201568603515625, 0.02486419677734375, 0.029571533203125, 0.03427886962890625, 0.0389862060546875, 0.04369354248046875, 0.04840087890625, 0.05310821533203125, 0.0578155517578125, 0.06252288818359375, 0.067230224609375, 0.07193756103515625, 0.0766448974609375, 0.08135223388671875, 0.0860595703125, 0.09076690673828125, 0.0954742431640625, 0.10018157958984375, 0.104888916015625, 0.10959625244140625, 0.1143035888671875, 0.11901092529296875, 0.12371826171875, 0.12842559814453125, 0.1331329345703125, 0.13784027099609375, 0.142547607421875, 0.14725494384765625, 0.1519622802734375, 0.15666961669921875, 0.161376953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 16.0, 13.0, 30.0, 42.0, 88.0, 162.0, 558.0, 1841.0, 9328.0, 121539.0, 870613.0, 37582.0, 4861.0, 1163.0, 370.0, 138.0, 82.0, 39.0, 26.0, 9.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.46343994140625, -0.4490966796875, -0.43475341796875, -0.42041015625, -0.40606689453125, -0.3917236328125, -0.37738037109375, -0.363037109375, -0.34869384765625, -0.3343505859375, -0.32000732421875, -0.3056640625, -0.29132080078125, -0.2769775390625, -0.26263427734375, -0.248291015625, -0.23394775390625, -0.2196044921875, -0.20526123046875, -0.19091796875, -0.17657470703125, -0.1622314453125, -0.14788818359375, -0.133544921875, -0.11920166015625, -0.1048583984375, -0.09051513671875, -0.076171875, -0.06182861328125, -0.0474853515625, -0.03314208984375, -0.018798828125, -0.00445556640625, 0.0098876953125, 0.02423095703125, 0.03857421875, 0.05291748046875, 0.0672607421875, 0.08160400390625, 0.095947265625, 0.11029052734375, 0.1246337890625, 0.13897705078125, 0.1533203125, 0.16766357421875, 0.1820068359375, 0.19635009765625, 0.210693359375, 0.22503662109375, 0.2393798828125, 0.25372314453125, 0.26806640625, 0.28240966796875, 0.2967529296875, 0.31109619140625, 0.325439453125, 0.33978271484375, 0.3541259765625, 0.36846923828125, 0.3828125, 0.39715576171875, 0.4114990234375, 0.42584228515625, 0.440185546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 10.0, 8.0, 9.0, 8.0, 16.0, 17.0, 28.0, 34.0, 67.0, 55.0, 74.0, 85.0, 108.0, 104.0, 82.0, 79.0, 61.0, 52.0, 33.0, 29.0, 16.0, 14.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6230010986328125, -0.600494384765625, -0.5779876708984375, -0.55548095703125, -0.5329742431640625, -0.510467529296875, -0.4879608154296875, -0.4654541015625, -0.4429473876953125, -0.420440673828125, -0.3979339599609375, -0.37542724609375, -0.3529205322265625, -0.330413818359375, -0.3079071044921875, -0.285400390625, -0.2628936767578125, -0.240386962890625, -0.2178802490234375, -0.19537353515625, -0.1728668212890625, -0.150360107421875, -0.1278533935546875, -0.1053466796875, -0.0828399658203125, -0.060333251953125, -0.0378265380859375, -0.01531982421875, 0.0071868896484375, 0.029693603515625, 0.0522003173828125, 0.07470703125, 0.0972137451171875, 0.119720458984375, 0.1422271728515625, 0.16473388671875, 0.1872406005859375, 0.209747314453125, 0.2322540283203125, 0.2547607421875, 0.2772674560546875, 0.299774169921875, 0.3222808837890625, 0.34478759765625, 0.3672943115234375, 0.389801025390625, 0.4123077392578125, 0.434814453125, 0.4573211669921875, 0.479827880859375, 0.5023345947265625, 0.52484130859375, 0.5473480224609375, 0.569854736328125, 0.5923614501953125, 0.6148681640625, 0.6373748779296875, 0.659881591796875, 0.6823883056640625, 0.70489501953125, 0.7274017333984375, 0.749908447265625, 0.7724151611328125, 0.794921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 20.0, 28.0, 46.0, 159.0, 1042.0, 96823.0, 948323.0, 1697.0, 243.0, 57.0, 40.0, 22.0, 15.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265625, -0.702423095703125, -0.67828369140625, -0.654144287109375, -0.6300048828125, -0.605865478515625, -0.58172607421875, -0.557586669921875, -0.533447265625, -0.509307861328125, -0.48516845703125, -0.461029052734375, -0.4368896484375, -0.412750244140625, -0.38861083984375, -0.364471435546875, -0.34033203125, -0.316192626953125, -0.29205322265625, -0.267913818359375, -0.2437744140625, -0.219635009765625, -0.19549560546875, -0.171356201171875, -0.147216796875, -0.123077392578125, -0.09893798828125, -0.074798583984375, -0.0506591796875, -0.026519775390625, -0.00238037109375, 0.021759033203125, 0.0458984375, 0.070037841796875, 0.09417724609375, 0.118316650390625, 0.1424560546875, 0.166595458984375, 0.19073486328125, 0.214874267578125, 0.239013671875, 0.263153076171875, 0.28729248046875, 0.311431884765625, 0.3355712890625, 0.359710693359375, 0.38385009765625, 0.407989501953125, 0.43212890625, 0.456268310546875, 0.48040771484375, 0.504547119140625, 0.5286865234375, 0.552825927734375, 0.57696533203125, 0.601104736328125, 0.625244140625, 0.649383544921875, 0.67352294921875, 0.697662353515625, 0.7218017578125, 0.745941162109375, 0.77008056640625, 0.794219970703125, 0.818359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 5.0, 2.0, 4.0, 9.0, 7.0, 11.0, 10.0, 15.0, 11.0, 14.0, 29.0, 32.0, 38.0, 54.0, 67.0, 105.0, 93.0, 102.0, 81.0, 62.0, 43.0, 23.0, 30.0, 20.0, 21.0, 13.0, 11.0, 11.0, 7.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7239322662353516e-05, -2.632010728120804e-05, -2.540089190006256e-05, -2.4481676518917084e-05, -2.3562461137771606e-05, -2.264324575662613e-05, -2.1724030375480652e-05, -2.0804814994335175e-05, -1.9885599613189697e-05, -1.896638423204422e-05, -1.8047168850898743e-05, -1.7127953469753265e-05, -1.6208738088607788e-05, -1.528952270746231e-05, -1.4370307326316833e-05, -1.3451091945171356e-05, -1.2531876564025879e-05, -1.1612661182880402e-05, -1.0693445801734924e-05, -9.774230420589447e-06, -8.85501503944397e-06, -7.935799658298492e-06, -7.016584277153015e-06, -6.097368896007538e-06, -5.1781535148620605e-06, -4.258938133716583e-06, -3.339722752571106e-06, -2.4205073714256287e-06, -1.5012919902801514e-06, -5.820766091346741e-07, 3.371387720108032e-07, 1.2563541531562805e-06, 2.175569534301758e-06, 3.094784915447235e-06, 4.014000296592712e-06, 4.93321567773819e-06, 5.852431058883667e-06, 6.771646440029144e-06, 7.690861821174622e-06, 8.610077202320099e-06, 9.529292583465576e-06, 1.0448507964611053e-05, 1.136772334575653e-05, 1.2286938726902008e-05, 1.3206154108047485e-05, 1.4125369489192963e-05, 1.504458487033844e-05, 1.5963800251483917e-05, 1.6883015632629395e-05, 1.7802231013774872e-05, 1.872144639492035e-05, 1.9640661776065826e-05, 2.0559877157211304e-05, 2.147909253835678e-05, 2.2398307919502258e-05, 2.3317523300647736e-05, 2.4236738681793213e-05, 2.515595406293869e-05, 2.6075169444084167e-05, 2.6994384825229645e-05, 2.7913600206375122e-05, 2.88328155875206e-05, 2.9752030968666077e-05, 3.0671246349811554e-05, 3.159046173095703e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 15.0, 22.0, 27.0, 35.0, 42.0, 57.0, 90.0, 144.0, 210.0, 401.0, 633.0, 1292.0, 3065.0, 11338.0, 85716.0, 833483.0, 93575.0, 12023.0, 3333.0, 1328.0, 685.0, 364.0, 223.0, 133.0, 82.0, 55.0, 40.0, 38.0, 19.0, 13.0, 11.0, 8.0, 11.0, 2.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12158203125, -0.11699676513671875, -0.1124114990234375, -0.10782623291015625, -0.103240966796875, -0.09865570068359375, -0.0940704345703125, -0.08948516845703125, -0.08489990234375, -0.08031463623046875, -0.0757293701171875, -0.07114410400390625, -0.066558837890625, -0.06197357177734375, -0.0573883056640625, -0.05280303955078125, -0.0482177734375, -0.04363250732421875, -0.0390472412109375, -0.03446197509765625, -0.029876708984375, -0.02529144287109375, -0.0207061767578125, -0.01612091064453125, -0.01153564453125, -0.00695037841796875, -0.0023651123046875, 0.00222015380859375, 0.006805419921875, 0.01139068603515625, 0.0159759521484375, 0.02056121826171875, 0.025146484375, 0.02973175048828125, 0.0343170166015625, 0.03890228271484375, 0.043487548828125, 0.04807281494140625, 0.0526580810546875, 0.05724334716796875, 0.06182861328125, 0.06641387939453125, 0.0709991455078125, 0.07558441162109375, 0.080169677734375, 0.08475494384765625, 0.0893402099609375, 0.09392547607421875, 0.0985107421875, 0.10309600830078125, 0.1076812744140625, 0.11226654052734375, 0.116851806640625, 0.12143707275390625, 0.1260223388671875, 0.13060760498046875, 0.13519287109375, 0.13977813720703125, 0.1443634033203125, 0.14894866943359375, 0.153533935546875, 0.15811920166015625, 0.1627044677734375, 0.16728973388671875, 0.171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 20.0, 38.0, 67.0, 90.0, 115.0, 164.0, 138.0, 101.0, 88.0, 56.0, 35.0, 18.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.2091503143310547, -0.20162582397460938, -0.19410133361816406, -0.18657684326171875, -0.17905235290527344, -0.17152786254882812, -0.1640033721923828, -0.1564788818359375, -0.1489543914794922, -0.14142990112304688, -0.13390541076660156, -0.12638092041015625, -0.11885643005371094, -0.11133193969726562, -0.10380744934082031, -0.096282958984375, -0.08875846862792969, -0.08123397827148438, -0.07370948791503906, -0.06618499755859375, -0.05866050720214844, -0.051136016845703125, -0.04361152648925781, -0.0360870361328125, -0.028562545776367188, -0.021038055419921875, -0.013513565063476562, -0.00598907470703125, 0.0015354156494140625, 0.009059906005859375, 0.016584396362304688, 0.02410888671875, 0.03163337707519531, 0.039157867431640625, 0.04668235778808594, 0.05420684814453125, 0.06173133850097656, 0.06925582885742188, 0.07678031921386719, 0.0843048095703125, 0.09182929992675781, 0.09935379028320312, 0.10687828063964844, 0.11440277099609375, 0.12192726135253906, 0.12945175170898438, 0.1369762420654297, 0.144500732421875, 0.1520252227783203, 0.15954971313476562, 0.16707420349121094, 0.17459869384765625, 0.18212318420410156, 0.18964767456054688, 0.1971721649169922, 0.2046966552734375, 0.2122211456298828, 0.21974563598632812, 0.22727012634277344, 0.23479461669921875, 0.24231910705566406, 0.24984359741210938, 0.2573680877685547, 0.264892578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 34.0, 72.0, 136.0, 246.0, 213.0, 116.0, 65.0, 27.0, 18.0, 8.0, 13.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.995100498199463, -4.8752851486206055, -4.75546932220459, -4.635653972625732, -4.515838146209717, -4.396022796630859, -4.276207447052002, -4.156391620635986, -4.036576271057129, -3.9167606830596924, -3.796945095062256, -3.6771297454833984, -3.557314157485962, -3.4374985694885254, -3.317682981491089, -3.1978673934936523, -3.078052043914795, -2.9582364559173584, -2.838420867919922, -2.7186055183410645, -2.598789930343628, -2.4789743423461914, -2.359158754348755, -2.2393431663513184, -2.119527578353882, -1.9997119903564453, -1.8798965215682983, -1.7600809335708618, -1.6402654647827148, -1.5204498767852783, -1.4006342887878418, -1.2808188199996948, -1.1610033512115479, -1.0411877632141113, -0.9213722944259644, -0.8015567064285278, -0.6817412376403809, -0.5619256496429443, -0.4421101212501526, -0.32229459285736084, -0.2024790644645691, -0.08266352862119675, 0.0371520072221756, 0.15696755051612854, 0.2767830789089203, 0.3965986371040344, 0.5164141654968262, 0.6362296938896179, 0.7560452222824097, 0.8758607506752014, 0.9956762790679932, 1.1154918670654297, 1.2353073358535767, 1.3551229238510132, 1.4749383926391602, 1.5947539806365967, 1.7145695686340332, 1.8343851566314697, 1.9542006254196167, 2.0740160942077637, 2.1938316822052, 2.3136472702026367, 2.4334628582000732, 2.5532784461975098, 2.673093795776367]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 9.0, 17.0, 26.0, 36.0, 52.0, 99.0, 121.0, 177.0, 149.0, 110.0, 74.0, 57.0, 23.0, 16.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.316988945007324, -6.176357746124268, -6.035726547241211, -5.895095348358154, -5.754464149475098, -5.613832473754883, -5.473201274871826, -5.3325700759887695, -5.191938877105713, -5.051307678222656, -4.9106764793396, -4.770045280456543, -4.629413604736328, -4.4887824058532715, -4.348151206970215, -4.207520008087158, -4.066888809204102, -3.926257610321045, -3.7856264114379883, -3.6449949741363525, -3.504363775253296, -3.3637325763702393, -3.2231011390686035, -3.082469940185547, -2.9418387413024902, -2.8012075424194336, -2.660576343536377, -2.519944906234741, -2.3793137073516846, -2.238682508468628, -2.098051071166992, -1.9574198722839355, -1.816789150238037, -1.6761579513549805, -1.5355266332626343, -1.394895315170288, -1.2542641162872314, -1.1136329174041748, -0.9730015993118286, -0.8323703408241272, -0.6917390823364258, -0.5511078238487244, -0.41047656536102295, -0.26984530687332153, -0.12921404838562012, 0.011417210102081299, 0.15204846858978271, 0.29267972707748413, 0.43331098556518555, 0.573942244052887, 0.7145735025405884, 0.8552047610282898, 0.9958360195159912, 1.1364672183990479, 1.277098536491394, 1.4177298545837402, 1.5583610534667969, 1.6989922523498535, 1.8396235704421997, 1.980254888534546, 2.1208860874176025, 2.261517286300659, 2.402148723602295, 2.5427799224853516, 2.683411121368408]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 10.0, 25.0, 28.0, 58.0, 180.0, 477.0, 86.0, 52.0, 38.0, 21.0, 10.0, 7.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.703125, -0.68853759765625, -0.6739501953125, -0.65936279296875, -0.644775390625, -0.63018798828125, -0.6156005859375, -0.60101318359375, -0.58642578125, -0.57183837890625, -0.5572509765625, -0.54266357421875, -0.528076171875, -0.51348876953125, -0.4989013671875, -0.48431396484375, -0.4697265625, -0.45513916015625, -0.4405517578125, -0.42596435546875, -0.411376953125, -0.39678955078125, -0.3822021484375, -0.36761474609375, -0.35302734375, -0.33843994140625, -0.3238525390625, -0.30926513671875, -0.294677734375, -0.28009033203125, -0.2655029296875, -0.25091552734375, -0.236328125, -0.22174072265625, -0.2071533203125, -0.19256591796875, -0.177978515625, -0.16339111328125, -0.1488037109375, -0.13421630859375, -0.11962890625, -0.10504150390625, -0.0904541015625, -0.07586669921875, -0.061279296875, -0.04669189453125, -0.0321044921875, -0.01751708984375, -0.0029296875, 0.01165771484375, 0.0262451171875, 0.04083251953125, 0.055419921875, 0.07000732421875, 0.0845947265625, 0.09918212890625, 0.11376953125, 0.12835693359375, 0.1429443359375, 0.15753173828125, 0.172119140625, 0.18670654296875, 0.2012939453125, 0.21588134765625, 0.23046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 4.0, 11.0, 6.0, 5.0, 14.0, 22.0, 11.0, 14.0, 28.0, 33.0, 50.0, 83.0, 132.0, 226.0, 408.0, 936.0, 2934.0, 17977.0, 8328513.0, 31257.0, 3892.0, 1133.0, 413.0, 178.0, 98.0, 46.0, 28.0, 21.0, 14.0, 15.0, 13.0, 11.0, 9.0, 11.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.0912374258041382, -1.0622166395187378, -1.0331958532333374, -1.004175066947937, -0.9751542210578918, -0.9461334347724915, -0.9171125888824463, -0.8880918025970459, -0.8590710163116455, -0.8300502300262451, -0.8010294437408447, -0.7720085978507996, -0.7429878115653992, -0.7139670252799988, -0.6849461793899536, -0.6559253931045532, -0.6269046068191528, -0.5978838205337524, -0.568863034248352, -0.5398421883583069, -0.5108214020729065, -0.4818006157875061, -0.4527797996997833, -0.42375898361206055, -0.39473819732666016, -0.36571741104125977, -0.336696594953537, -0.3076757788658142, -0.2786549925804138, -0.24963419139385223, -0.22061339020729065, -0.19159258902072906, -0.16257178783416748, -0.1335509866476059, -0.10453018546104431, -0.07550938427448273, -0.04648858308792114, -0.017467781901359558, 0.011553019285202026, 0.04057382047176361, 0.0695946216583252, 0.09861542284488678, 0.12763622403144836, 0.15665702521800995, 0.18567782640457153, 0.21469862759113312, 0.2437194287776947, 0.2727402448654175, 0.30176103115081787, 0.33078181743621826, 0.35980263352394104, 0.3888234496116638, 0.4178442358970642, 0.4468650221824646, 0.4758858382701874, 0.5049066543579102, 0.5339274406433105, 0.5629482269287109, 0.5919690132141113, 0.6209898591041565, 0.6500106453895569, 0.6790314316749573, 0.7080522775650024, 0.7370730638504028, 0.7660938501358032]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.9121706485748291, -0.8577847480773926, -0.803398847579956, -0.7490128874778748, -0.6946269869804382, -0.6402410864830017, -0.5858551263809204, -0.5314692258834839, -0.47708332538604736, -0.42269742488861084, -0.36831149458885193, -0.313925564289093, -0.2595396637916565, -0.20515376329421997, -0.15076783299446106, -0.09638190269470215, -0.041996002197265625, 0.012389913201332092, 0.06677582859992981, 0.12116174399852753, 0.17554765939712524, 0.22993355989456177, 0.2843194901943207, 0.3387054204940796, 0.3930913209915161, 0.44747722148895264, 0.5018631219863892, 0.5562490820884705, 0.610634982585907, 0.6650208830833435, 0.7194068431854248, 0.7737927436828613, 0.8281786441802979, 0.8825645446777344, 0.9369504451751709, 0.9913364052772522, 1.045722246170044, 1.1001081466674805, 1.1544941663742065, 1.208880066871643, 1.2632659673690796, 1.3176518678665161, 1.3720377683639526, 1.4264236688613892, 1.4808096885681152, 1.5351955890655518, 1.5895814895629883, 1.6439673900604248, 1.6983532905578613, 1.7527391910552979, 1.8071250915527344, 1.861510992050171, 1.9158968925476074, 1.970282793045044, 2.0246686935424805, 2.079054832458496, 2.1334404945373535, 2.18782639503479, 2.2422122955322266, 2.296598196029663, 2.3509840965270996, 2.405369997024536, 2.4597558975219727, 2.5141420364379883, 2.568527936935425]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 24.0, 29.0, 33.0, 58.0, 76.0, 87.0, 98.0, 119.0, 97.0, 91.0, 72.0, 53.0, 38.0, 29.0, 21.0, 12.0, 10.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.1303853988647461, -0.1272258758544922, -0.12406635284423828, -0.12090682983398438, -0.11774730682373047, -0.11458778381347656, -0.11142826080322266, -0.10826873779296875, -0.10510921478271484, -0.10194969177246094, -0.09879016876220703, -0.09563064575195312, -0.09247112274169922, -0.08931159973144531, -0.0861520767211914, -0.0829925537109375, -0.0798330307006836, -0.07667350769042969, -0.07351398468017578, -0.07035446166992188, -0.06719493865966797, -0.06403541564941406, -0.060875892639160156, -0.05771636962890625, -0.054556846618652344, -0.05139732360839844, -0.04823780059814453, -0.045078277587890625, -0.04191875457763672, -0.03875923156738281, -0.035599708557128906, -0.032440185546875, -0.029280662536621094, -0.026121139526367188, -0.02296161651611328, -0.019802093505859375, -0.01664257049560547, -0.013483047485351562, -0.010323524475097656, -0.00716400146484375, -0.004004478454589844, -0.0008449554443359375, 0.0023145675659179688, 0.005474090576171875, 0.008633613586425781, 0.011793136596679688, 0.014952659606933594, 0.0181121826171875, 0.021271705627441406, 0.024431228637695312, 0.02759075164794922, 0.030750274658203125, 0.03390979766845703, 0.03706932067871094, 0.040228843688964844, 0.04338836669921875, 0.046547889709472656, 0.04970741271972656, 0.05286693572998047, 0.056026458740234375, 0.05918598175048828, 0.06234550476074219, 0.0655050277709961, 0.06866455078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 11.0, 12.0, 12.0, 17.0, 24.0, 30.0, 43.0, 71.0, 91.0, 144.0, 191.0, 306.0, 481.0, 843.0, 1673.0, 3264.0, 7042.0, 17922.0, 53677.0, 199075.0, 167342.0, 44458.0, 15183.0, 5990.0, 2810.0, 1457.0, 780.0, 440.0, 302.0, 185.0, 105.0, 92.0, 49.0, 38.0, 35.0, 22.0, 11.0, 5.0, 11.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0186920166015625, -0.984649658203125, -0.9506072998046875, -0.91656494140625, -0.8825225830078125, -0.848480224609375, -0.8144378662109375, -0.7803955078125, -0.7463531494140625, -0.712310791015625, -0.6782684326171875, -0.64422607421875, -0.6101837158203125, -0.576141357421875, -0.5420989990234375, -0.508056640625, -0.4740142822265625, -0.439971923828125, -0.4059295654296875, -0.37188720703125, -0.3378448486328125, -0.303802490234375, -0.2697601318359375, -0.2357177734375, -0.2016754150390625, -0.167633056640625, -0.1335906982421875, -0.09954833984375, -0.0655059814453125, -0.031463623046875, 0.0025787353515625, 0.03662109375, 0.0706634521484375, 0.104705810546875, 0.1387481689453125, 0.17279052734375, 0.2068328857421875, 0.240875244140625, 0.2749176025390625, 0.3089599609375, 0.3430023193359375, 0.377044677734375, 0.4110870361328125, 0.44512939453125, 0.4791717529296875, 0.513214111328125, 0.5472564697265625, 0.581298828125, 0.6153411865234375, 0.649383544921875, 0.6834259033203125, 0.71746826171875, 0.7515106201171875, 0.785552978515625, 0.8195953369140625, 0.8536376953125, 0.8876800537109375, 0.921722412109375, 0.9557647705078125, 0.98980712890625, 1.0238494873046875, 1.057891845703125, 1.0919342041015625, 1.1259765625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 21.0, 21.0, 35.0, 42.0, 60.0, 57.0, 84.0, 105.0, 88.0, 95.0, 80.0, 66.0, 60.0, 35.0, 30.0, 18.0, 17.0, 16.0, 15.0, 5.0, 5.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1961669921875, -0.18860435485839844, -0.18104171752929688, -0.1734790802001953, -0.16591644287109375, -0.1583538055419922, -0.15079116821289062, -0.14322853088378906, -0.1356658935546875, -0.12810325622558594, -0.12054061889648438, -0.11297798156738281, -0.10541534423828125, -0.09785270690917969, -0.09029006958007812, -0.08272743225097656, -0.075164794921875, -0.06760215759277344, -0.060039520263671875, -0.05247688293457031, -0.04491424560546875, -0.03735160827636719, -0.029788970947265625, -0.022226333618164062, -0.0146636962890625, -0.0071010589599609375, 0.000461578369140625, 0.008024215698242188, 0.01558685302734375, 0.023149490356445312, 0.030712127685546875, 0.03827476501464844, 0.04583740234375, 0.05340003967285156, 0.060962677001953125, 0.06852531433105469, 0.07608795166015625, 0.08365058898925781, 0.09121322631835938, 0.09877586364746094, 0.1063385009765625, 0.11390113830566406, 0.12146377563476562, 0.1290264129638672, 0.13658905029296875, 0.1441516876220703, 0.15171432495117188, 0.15927696228027344, 0.166839599609375, 0.17440223693847656, 0.18196487426757812, 0.1895275115966797, 0.19709014892578125, 0.2046527862548828, 0.21221542358398438, 0.21977806091308594, 0.2273406982421875, 0.23490333557128906, 0.24246597290039062, 0.2500286102294922, 0.25759124755859375, 0.2651538848876953, 0.2727165222167969, 0.28027915954589844, 0.287841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 8.0, 11.0, 9.0, 23.0, 21.0, 31.0, 40.0, 45.0, 48.0, 44.0, 39.0, 37.0, 34.0, 23.0, 12.0, 19.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6611654758453369, -0.6370133757591248, -0.6128613352775574, -0.5887092351913452, -0.5645571947097778, -0.5404050946235657, -0.5162529945373535, -0.49210095405578613, -0.46794888377189636, -0.4437968134880066, -0.4196447432041168, -0.39549267292022705, -0.3713405728340149, -0.3471885323524475, -0.32303643226623535, -0.2988843619823456, -0.2747322916984558, -0.25058022141456604, -0.22642815113067627, -0.2022760659456253, -0.17812399566173553, -0.15397192537784576, -0.1298198401927948, -0.10566776990890503, -0.08151569962501526, -0.05736362561583519, -0.03321155160665512, -0.009059473872184753, 0.015092596411705017, 0.03924466669559479, 0.06339675188064575, 0.08754882216453552, 0.11170083284378052, 0.1358529031276703, 0.16000497341156006, 0.18415705859661102, 0.2083091288805008, 0.23246119916439056, 0.25661328434944153, 0.2807653546333313, 0.30491742491722107, 0.32906949520111084, 0.3532215654850006, 0.3773736357688904, 0.40152573585510254, 0.4256777763366699, 0.4498298764228821, 0.47398194670677185, 0.4981340169906616, 0.5222861170768738, 0.5464381575584412, 0.5705902576446533, 0.5947422981262207, 0.6188943982124329, 0.643046498298645, 0.6671985387802124, 0.6913505792617798, 0.7155026793479919, 0.7396547198295593, 0.7638068199157715, 0.7879588603973389, 0.812110960483551, 0.8362630605697632, 0.8604151010513306, 0.8845672011375427]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 6.0, 12.0, 16.0, 10.0, 23.0, 27.0, 38.0, 35.0, 43.0, 39.0, 39.0, 31.0, 33.0, 23.0, 23.0, 16.0, 10.0, 13.0, 4.0, 5.0, 9.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6281315088272095, -1.5818910598754883, -1.535650610923767, -1.489410161972046, -1.4431697130203247, -1.3969292640686035, -1.3506886959075928, -1.3044483661651611, -1.2582077980041504, -1.2119673490524292, -1.165726900100708, -1.1194864511489868, -1.0732460021972656, -1.0270055532455444, -0.9807650446891785, -0.9345245957374573, -0.8882842063903809, -0.8420437574386597, -0.7958033084869385, -0.7495628595352173, -0.7033224105834961, -0.6570819616317749, -0.6108414530754089, -0.5646010041236877, -0.5183605551719666, -0.47212010622024536, -0.42587965726852417, -0.3796391785144806, -0.3333987295627594, -0.2871582806110382, -0.24091780185699463, -0.19467735290527344, -0.1484370231628418, -0.10219656676054001, -0.05595611035823822, -0.009715646505355835, 0.036524802446365356, 0.08276525139808655, 0.12900573015213013, 0.17524617910385132, 0.2214866280555725, 0.2677270770072937, 0.3139675259590149, 0.36020800471305847, 0.40644845366477966, 0.45268890261650085, 0.49892938137054443, 0.5451698303222656, 0.5914102792739868, 0.637650728225708, 0.6838911771774292, 0.7301316261291504, 0.7763720750808716, 0.8226125240325928, 0.8688530325889587, 0.9150934815406799, 0.9613339304924011, 1.007574439048767, 1.0538148880004883, 1.1000553369522095, 1.1462957859039307, 1.1925362348556519, 1.238776683807373, 1.2850171327590942, 1.3312575817108154]}, "eval/loss": 4.170206069946289, "eval/bleu": 2.2622740788922234e-13, "eval/runtime": 2580.4115, "eval/samples_per_second": 5.72, "eval/steps_per_second": 0.715} \ No newline at end of file +{"train/loss": 3.6918, "train/learning_rate": 0.00015060403339576736, "train/epoch": 1.7, "train/global_step": 5500, "_runtime": 52364, "_timestamp": 1651726453, "_step": 5510, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 526.0, 488.0, 3.0, 1.0], "bins": [-104.2026138305664, -102.4944839477539, -100.78634643554688, -99.07821655273438, -97.37008666992188, -95.66195678710938, -93.95381927490234, -92.24568939208984, -90.53755950927734, -88.82942962646484, -87.12129211425781, -85.41316223144531, -83.70503234863281, -81.99690246582031, -80.28876495361328, -78.58063507080078, -76.87249755859375, -75.16436767578125, -73.45623016357422, -71.74810028076172, -70.03997039794922, -68.33183288574219, -66.62370300292969, -64.91557312011719, -63.20744323730469, -61.49930953979492, -59.79117965698242, -58.083045959472656, -56.374916076660156, -54.66678237915039, -52.958648681640625, -51.250518798828125, -49.54238510131836, -47.834251403808594, -46.126121520996094, -44.41798782348633, -42.70985794067383, -41.00172424316406, -39.29359436035156, -37.5854606628418, -35.87732696533203, -34.169193267822266, -32.461063385009766, -30.7529296875, -29.044797897338867, -27.336666107177734, -25.6285343170166, -23.92040252685547, -22.212268829345703, -20.50413703918457, -18.796005249023438, -17.087871551513672, -15.379739761352539, -13.671607971191406, -11.963476181030273, -10.255343437194824, -8.547212600708008, -6.839080333709717, -5.130948066711426, -3.422816276550293, -1.714684009552002, -0.0065517425537109375, 1.7015800476074219, 3.409712791442871, 5.117844581604004]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 8.0, 9.0, 13.0, 6.0, 9.0, 10.0, 11.0, 20.0, 23.0, 16.0, 20.0, 37.0, 31.0, 29.0, 44.0, 48.0, 43.0, 53.0, 43.0, 36.0, 46.0, 37.0, 49.0, 51.0, 53.0, 31.0, 39.0, 20.0, 27.0, 21.0, 22.0, 18.0, 14.0, 10.0, 14.0, 9.0, 8.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.933584690093994, -4.764078140258789, -4.594571590423584, -4.425065040588379, -4.255558013916016, -4.0860514640808105, -3.9165449142456055, -3.7470383644104004, -3.577531576156616, -3.408025026321411, -3.238518238067627, -3.069011688232422, -2.899505138397217, -2.7299983501434326, -2.5604918003082275, -2.3909850120544434, -2.2214784622192383, -2.051971912384033, -1.882465124130249, -1.712958574295044, -1.5434519052505493, -1.3739452362060547, -1.2044386863708496, -1.034932017326355, -0.8654253482818604, -0.6959186792373657, -0.5264120697975159, -0.356905460357666, -0.1873987913131714, -0.017892122268676758, 0.15161442756652832, 0.32112109661102295, 0.4906282424926758, 0.6601349115371704, 0.8296415209770203, 0.9991481304168701, 1.1686547994613647, 1.3381614685058594, 1.5076680183410645, 1.677174687385559, 1.8466813564300537, 2.016187906265259, 2.185694694519043, 2.355201244354248, 2.524707794189453, 2.6942145824432373, 2.8637211322784424, 3.0332279205322266, 3.2027344703674316, 3.3722410202026367, 3.541747808456421, 3.711254358291626, 3.88076114654541, 4.050267696380615, 4.21977424621582, 4.389280796051025, 4.5587873458862305, 4.7282938957214355, 4.897800445556641, 5.067307472229004, 5.236814022064209, 5.406320571899414, 5.575827121734619, 5.745333671569824, 5.9148406982421875]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 26.0, 40.0, 62.0, 104.0, 188.0, 342.0, 586.0, 1169.0, 2297.0, 4760.0, 9775.0, 21790.0, 48715.0, 112725.0, 480614.0, 3085890.0, 266726.0, 86423.0, 38511.0, 17593.0, 8080.0, 3790.0, 1867.0, 935.0, 543.0, 300.0, 171.0, 95.0, 57.0, 28.0, 21.0, 15.0, 13.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.154296875, -3.038970947265625, -2.92364501953125, -2.808319091796875, -2.6929931640625, -2.577667236328125, -2.46234130859375, -2.347015380859375, -2.231689453125, -2.116363525390625, -2.00103759765625, -1.885711669921875, -1.7703857421875, -1.655059814453125, -1.53973388671875, -1.424407958984375, -1.30908203125, -1.193756103515625, -1.07843017578125, -0.963104248046875, -0.8477783203125, -0.732452392578125, -0.61712646484375, -0.501800537109375, -0.386474609375, -0.271148681640625, -0.15582275390625, -0.040496826171875, 0.0748291015625, 0.190155029296875, 0.30548095703125, 0.420806884765625, 0.5361328125, 0.651458740234375, 0.76678466796875, 0.882110595703125, 0.9974365234375, 1.112762451171875, 1.22808837890625, 1.343414306640625, 1.458740234375, 1.574066162109375, 1.68939208984375, 1.804718017578125, 1.9200439453125, 2.035369873046875, 2.15069580078125, 2.266021728515625, 2.38134765625, 2.496673583984375, 2.61199951171875, 2.727325439453125, 2.8426513671875, 2.957977294921875, 3.07330322265625, 3.188629150390625, 3.303955078125, 3.419281005859375, 3.53460693359375, 3.649932861328125, 3.7652587890625, 3.880584716796875, 3.99591064453125, 4.111236572265625, 4.2265625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 5.0, 3.0, 8.0, 8.0, 6.0, 10.0, 16.0, 10.0, 14.0, 21.0, 22.0, 31.0, 19.0, 34.0, 43.0, 41.0, 53.0, 51.0, 53.0, 44.0, 54.0, 43.0, 44.0, 44.0, 44.0, 35.0, 40.0, 32.0, 29.0, 28.0, 19.0, 17.0, 10.0, 16.0, 15.0, 8.0, 11.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.07086181640625, -4.9073486328125, -4.74383544921875, -4.580322265625, -4.41680908203125, -4.2532958984375, -4.08978271484375, -3.92626953125, -3.76275634765625, -3.5992431640625, -3.43572998046875, -3.272216796875, -3.10870361328125, -2.9451904296875, -2.78167724609375, -2.6181640625, -2.45465087890625, -2.2911376953125, -2.12762451171875, -1.964111328125, -1.80059814453125, -1.6370849609375, -1.47357177734375, -1.31005859375, -1.14654541015625, -0.9830322265625, -0.81951904296875, -0.656005859375, -0.49249267578125, -0.3289794921875, -0.16546630859375, -0.001953125, 0.16156005859375, 0.3250732421875, 0.48858642578125, 0.652099609375, 0.81561279296875, 0.9791259765625, 1.14263916015625, 1.30615234375, 1.46966552734375, 1.6331787109375, 1.79669189453125, 1.960205078125, 2.12371826171875, 2.2872314453125, 2.45074462890625, 2.6142578125, 2.77777099609375, 2.9412841796875, 3.10479736328125, 3.268310546875, 3.43182373046875, 3.5953369140625, 3.75885009765625, 3.92236328125, 4.08587646484375, 4.2493896484375, 4.41290283203125, 4.576416015625, 4.73992919921875, 4.9034423828125, 5.06695556640625, 5.23046875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 18.0, 14.0, 24.0, 32.0, 29.0, 43.0, 65.0, 138.0, 648.0, 4191780.0, 1098.0, 148.0, 62.0, 50.0, 25.0, 23.0, 12.0, 14.0, 10.0, 11.0, 7.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.25, -160.298828125, -156.34765625, -152.396484375, -148.4453125, -144.494140625, -140.54296875, -136.591796875, -132.640625, -128.689453125, -124.73828125, -120.787109375, -116.8359375, -112.884765625, -108.93359375, -104.982421875, -101.03125, -97.080078125, -93.12890625, -89.177734375, -85.2265625, -81.275390625, -77.32421875, -73.373046875, -69.421875, -65.470703125, -61.51953125, -57.568359375, -53.6171875, -49.666015625, -45.71484375, -41.763671875, -37.8125, -33.861328125, -29.91015625, -25.958984375, -22.0078125, -18.056640625, -14.10546875, -10.154296875, -6.203125, -2.251953125, 1.69921875, 5.650390625, 9.6015625, 13.552734375, 17.50390625, 21.455078125, 25.40625, 29.357421875, 33.30859375, 37.259765625, 41.2109375, 45.162109375, 49.11328125, 53.064453125, 57.015625, 60.966796875, 64.91796875, 68.869140625, 72.8203125, 76.771484375, 80.72265625, 84.673828125, 88.625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 2.0, 6.0, 8.0, 11.0, 11.0, 18.0, 26.0, 30.0, 30.0, 49.0, 72.0, 129.0, 500.0, 2512.0, 350.0, 114.0, 57.0, 49.0, 22.0, 17.0, 13.0, 14.0, 12.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.47265625, -3.3907623291015625, -3.308868408203125, -3.2269744873046875, -3.14508056640625, -3.0631866455078125, -2.981292724609375, -2.8993988037109375, -2.8175048828125, -2.7356109619140625, -2.653717041015625, -2.5718231201171875, -2.48992919921875, -2.4080352783203125, -2.326141357421875, -2.2442474365234375, -2.162353515625, -2.0804595947265625, -1.998565673828125, -1.9166717529296875, -1.83477783203125, -1.7528839111328125, -1.670989990234375, -1.5890960693359375, -1.5072021484375, -1.4253082275390625, -1.343414306640625, -1.2615203857421875, -1.17962646484375, -1.0977325439453125, -1.015838623046875, -0.9339447021484375, -0.85205078125, -0.7701568603515625, -0.688262939453125, -0.6063690185546875, -0.52447509765625, -0.4425811767578125, -0.360687255859375, -0.2787933349609375, -0.1968994140625, -0.1150054931640625, -0.033111572265625, 0.0487823486328125, 0.13067626953125, 0.2125701904296875, 0.294464111328125, 0.3763580322265625, 0.458251953125, 0.5401458740234375, 0.622039794921875, 0.7039337158203125, 0.78582763671875, 0.8677215576171875, 0.949615478515625, 1.0315093994140625, 1.1134033203125, 1.1952972412109375, 1.277191162109375, 1.3590850830078125, 1.44097900390625, 1.5228729248046875, 1.604766845703125, 1.6866607666015625, 1.7685546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 19.0, 36.0, 52.0, 70.0, 126.0, 150.0, 158.0, 126.0, 87.0, 55.0, 34.0, 23.0, 16.0, 12.0, 9.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.129372596740723, -9.826116561889648, -9.522860527038574, -9.2196044921875, -8.916348457336426, -8.613092422485352, -8.309836387634277, -8.006580352783203, -7.703323841094971, -7.4000678062438965, -7.096811771392822, -6.793555736541748, -6.490299224853516, -6.187043190002441, -5.883787155151367, -5.580531120300293, -5.277275085449219, -4.9740190505981445, -4.67076301574707, -4.367506980895996, -4.064250946044922, -3.7609946727752686, -3.4577383995056152, -3.154482364654541, -2.851226329803467, -2.5479702949523926, -2.2447142601013184, -1.941457986831665, -1.6382019519805908, -1.3349459171295166, -1.0316897630691528, -0.7284336090087891, -0.42517757415771484, -0.12192147970199585, 0.18133461475372314, 0.48459070920944214, 0.7878468036651611, 1.0911028385162354, 1.3943589925765991, 1.697615146636963, 2.000871181488037, 2.3041272163391113, 2.6073832511901855, 2.910639524459839, 3.213895559310913, 3.5171515941619873, 3.8204078674316406, 4.123663902282715, 4.426919937133789, 4.730175971984863, 5.0334320068359375, 5.336688041687012, 5.639944076538086, 5.94320011138916, 6.246456623077393, 6.549712657928467, 6.852968692779541, 7.156224727630615, 7.4594807624816895, 7.762736797332764, 8.065993309020996, 8.36924934387207, 8.672505378723145, 8.975761413574219, 9.279017448425293]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 5.0, 6.0, 10.0, 12.0, 19.0, 16.0, 19.0, 22.0, 14.0, 26.0, 35.0, 27.0, 31.0, 47.0, 34.0, 38.0, 40.0, 43.0, 36.0, 48.0, 52.0, 40.0, 47.0, 34.0, 31.0, 41.0, 28.0, 38.0, 28.0, 14.0, 15.0, 17.0, 14.0, 8.0, 12.0, 12.0, 8.0, 5.0, 5.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.329255104064941, -4.189163684844971, -4.049072265625, -3.90898060798645, -3.7688889503479004, -3.6287975311279297, -3.488706111907959, -3.3486146926879883, -3.2085230350494385, -3.0684316158294678, -2.928339958190918, -2.7882485389709473, -2.6481571197509766, -2.5080654621124268, -2.367974042892456, -2.2278823852539062, -2.0877909660339355, -1.9476994276046753, -1.807607889175415, -1.6675164699554443, -1.527424931526184, -1.3873333930969238, -1.2472419738769531, -1.1071504354476929, -0.9670588970184326, -0.8269673585891724, -0.6868758797645569, -0.5467844009399414, -0.40669286251068115, -0.2666013240814209, -0.12650984525680542, 0.013581633567810059, 0.15367364883422852, 0.2937651574611664, 0.43385666608810425, 0.5739481449127197, 0.71403968334198, 0.8541312217712402, 0.9942227005958557, 1.1343141794204712, 1.2744057178497314, 1.4144972562789917, 1.554588794708252, 1.6946802139282227, 1.834771752357483, 1.9748632907867432, 2.114954710006714, 2.2550463676452637, 2.3951377868652344, 2.535229206085205, 2.675320863723755, 2.8154122829437256, 2.9555039405822754, 3.095595359802246, 3.235686779022217, 3.3757781982421875, 3.5158698558807373, 3.655961275100708, 3.796052932739258, 3.9361443519592285, 4.076235771179199, 4.216327667236328, 4.356419086456299, 4.4965105056762695, 4.63660192489624]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 15.0, 15.0, 24.0, 26.0, 38.0, 49.0, 61.0, 81.0, 122.0, 180.0, 289.0, 361.0, 668.0, 1103.0, 2150.0, 4879.0, 12203.0, 34668.0, 107039.0, 323899.0, 364586.0, 128916.0, 41460.0, 14383.0, 5594.0, 2492.0, 1219.0, 703.0, 415.0, 257.0, 169.0, 135.0, 81.0, 68.0, 43.0, 43.0, 28.0, 28.0, 15.0, 16.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8486328125, -0.82373046875, -0.798828125, -0.77392578125, -0.7490234375, -0.72412109375, -0.69921875, -0.67431640625, -0.6494140625, -0.62451171875, -0.599609375, -0.57470703125, -0.5498046875, -0.52490234375, -0.5, -0.47509765625, -0.4501953125, -0.42529296875, -0.400390625, -0.37548828125, -0.3505859375, -0.32568359375, -0.30078125, -0.27587890625, -0.2509765625, -0.22607421875, -0.201171875, -0.17626953125, -0.1513671875, -0.12646484375, -0.1015625, -0.07666015625, -0.0517578125, -0.02685546875, -0.001953125, 0.02294921875, 0.0478515625, 0.07275390625, 0.09765625, 0.12255859375, 0.1474609375, 0.17236328125, 0.197265625, 0.22216796875, 0.2470703125, 0.27197265625, 0.296875, 0.32177734375, 0.3466796875, 0.37158203125, 0.396484375, 0.42138671875, 0.4462890625, 0.47119140625, 0.49609375, 0.52099609375, 0.5458984375, 0.57080078125, 0.595703125, 0.62060546875, 0.6455078125, 0.67041015625, 0.6953125, 0.72021484375, 0.7451171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 0.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 3.0, 5.0, 7.0, 10.0, 10.0, 11.0, 12.0, 19.0, 16.0, 24.0, 19.0, 26.0, 24.0, 27.0, 30.0, 43.0, 44.0, 49.0, 33.0, 49.0, 32.0, 41.0, 59.0, 39.0, 38.0, 38.0, 42.0, 23.0, 34.0, 27.0, 18.0, 21.0, 20.0, 12.0, 11.0, 7.0, 13.0, 12.0, 7.0, 13.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.109375, -3.0074462890625, -2.905517578125, -2.8035888671875, -2.70166015625, -2.5997314453125, -2.497802734375, -2.3958740234375, -2.2939453125, -2.1920166015625, -2.090087890625, -1.9881591796875, -1.88623046875, -1.7843017578125, -1.682373046875, -1.5804443359375, -1.478515625, -1.3765869140625, -1.274658203125, -1.1727294921875, -1.07080078125, -0.9688720703125, -0.866943359375, -0.7650146484375, -0.6630859375, -0.5611572265625, -0.459228515625, -0.3572998046875, -0.25537109375, -0.1534423828125, -0.051513671875, 0.0504150390625, 0.15234375, 0.2542724609375, 0.356201171875, 0.4581298828125, 0.56005859375, 0.6619873046875, 0.763916015625, 0.8658447265625, 0.9677734375, 1.0697021484375, 1.171630859375, 1.2735595703125, 1.37548828125, 1.4774169921875, 1.579345703125, 1.6812744140625, 1.783203125, 1.8851318359375, 1.987060546875, 2.0889892578125, 2.19091796875, 2.2928466796875, 2.394775390625, 2.4967041015625, 2.5986328125, 2.7005615234375, 2.802490234375, 2.9044189453125, 3.00634765625, 3.1082763671875, 3.210205078125, 3.3121337890625, 3.4140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 16.0, 13.0, 21.0, 25.0, 28.0, 48.0, 57.0, 71.0, 83.0, 108.0, 150.0, 215.0, 288.0, 362.0, 498.0, 960.0, 3602.0, 33854.0, 519309.0, 453627.0, 29101.0, 3207.0, 950.0, 490.0, 326.0, 272.0, 216.0, 151.0, 111.0, 97.0, 82.0, 52.0, 29.0, 34.0, 20.0, 20.0, 10.0, 15.0, 6.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0662841796875, -1.033935546875, -1.0015869140625, -0.96923828125, -0.9368896484375, -0.904541015625, -0.8721923828125, -0.83984375, -0.8074951171875, -0.775146484375, -0.7427978515625, -0.71044921875, -0.6781005859375, -0.645751953125, -0.6134033203125, -0.5810546875, -0.5487060546875, -0.516357421875, -0.4840087890625, -0.45166015625, -0.4193115234375, -0.386962890625, -0.3546142578125, -0.322265625, -0.2899169921875, -0.257568359375, -0.2252197265625, -0.19287109375, -0.1605224609375, -0.128173828125, -0.0958251953125, -0.0634765625, -0.0311279296875, 0.001220703125, 0.0335693359375, 0.06591796875, 0.0982666015625, 0.130615234375, 0.1629638671875, 0.1953125, 0.2276611328125, 0.260009765625, 0.2923583984375, 0.32470703125, 0.3570556640625, 0.389404296875, 0.4217529296875, 0.4541015625, 0.4864501953125, 0.518798828125, 0.5511474609375, 0.58349609375, 0.6158447265625, 0.648193359375, 0.6805419921875, 0.712890625, 0.7452392578125, 0.777587890625, 0.8099365234375, 0.84228515625, 0.8746337890625, 0.906982421875, 0.9393310546875, 0.9716796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 6.0, 7.0, 11.0, 13.0, 15.0, 25.0, 20.0, 34.0, 31.0, 25.0, 30.0, 33.0, 40.0, 40.0, 31.0, 44.0, 46.0, 45.0, 41.0, 45.0, 50.0, 26.0, 43.0, 39.0, 23.0, 29.0, 26.0, 29.0, 26.0, 16.0, 14.0, 15.0, 17.0, 9.0, 8.0, 12.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.642822265625, -6.43017578125, -6.217529296875, -6.0048828125, -5.792236328125, -5.57958984375, -5.366943359375, -5.154296875, -4.941650390625, -4.72900390625, -4.516357421875, -4.3037109375, -4.091064453125, -3.87841796875, -3.665771484375, -3.453125, -3.240478515625, -3.02783203125, -2.815185546875, -2.6025390625, -2.389892578125, -2.17724609375, -1.964599609375, -1.751953125, -1.539306640625, -1.32666015625, -1.114013671875, -0.9013671875, -0.688720703125, -0.47607421875, -0.263427734375, -0.05078125, 0.161865234375, 0.37451171875, 0.587158203125, 0.7998046875, 1.012451171875, 1.22509765625, 1.437744140625, 1.650390625, 1.863037109375, 2.07568359375, 2.288330078125, 2.5009765625, 2.713623046875, 2.92626953125, 3.138916015625, 3.3515625, 3.564208984375, 3.77685546875, 3.989501953125, 4.2021484375, 4.414794921875, 4.62744140625, 4.840087890625, 5.052734375, 5.265380859375, 5.47802734375, 5.690673828125, 5.9033203125, 6.115966796875, 6.32861328125, 6.541259765625, 6.75390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 18.0, 23.0, 41.0, 48.0, 78.0, 151.0, 325.0, 1174.0, 15003.0, 1015068.0, 14835.0, 1032.0, 323.0, 145.0, 89.0, 50.0, 45.0, 24.0, 15.0, 13.0, 12.0, 8.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25341796875, -0.24348068237304688, -0.23354339599609375, -0.22360610961914062, -0.2136688232421875, -0.20373153686523438, -0.19379425048828125, -0.18385696411132812, -0.173919677734375, -0.16398239135742188, -0.15404510498046875, -0.14410781860351562, -0.1341705322265625, -0.12423324584960938, -0.11429595947265625, -0.10435867309570312, -0.09442138671875, -0.08448410034179688, -0.07454681396484375, -0.06460952758789062, -0.0546722412109375, -0.044734954833984375, -0.03479766845703125, -0.024860382080078125, -0.014923095703125, -0.004985809326171875, 0.00495147705078125, 0.014888763427734375, 0.0248260498046875, 0.034763336181640625, 0.04470062255859375, 0.054637908935546875, 0.0645751953125, 0.07451248168945312, 0.08444976806640625, 0.09438705444335938, 0.1043243408203125, 0.11426162719726562, 0.12419891357421875, 0.13413619995117188, 0.144073486328125, 0.15401077270507812, 0.16394805908203125, 0.17388534545898438, 0.1838226318359375, 0.19375991821289062, 0.20369720458984375, 0.21363449096679688, 0.22357177734375, 0.23350906372070312, 0.24344635009765625, 0.2533836364746094, 0.2633209228515625, 0.2732582092285156, 0.28319549560546875, 0.2931327819824219, 0.303070068359375, 0.3130073547363281, 0.32294464111328125, 0.3328819274902344, 0.3428192138671875, 0.3527565002441406, 0.36269378662109375, 0.3726310729980469, 0.382568359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 10.0, 10.0, 11.0, 16.0, 19.0, 28.0, 33.0, 45.0, 53.0, 78.0, 94.0, 117.0, 112.0, 94.0, 68.0, 50.0, 37.0, 31.0, 23.0, 16.0, 13.0, 3.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.726119995117188e-05, -8.459948003292084e-05, -8.19377601146698e-05, -7.927604019641876e-05, -7.661432027816772e-05, -7.395260035991669e-05, -7.129088044166565e-05, -6.862916052341461e-05, -6.596744060516357e-05, -6.330572068691254e-05, -6.06440007686615e-05, -5.798228085041046e-05, -5.5320560932159424e-05, -5.2658841013908386e-05, -4.999712109565735e-05, -4.733540117740631e-05, -4.4673681259155273e-05, -4.2011961340904236e-05, -3.93502414226532e-05, -3.668852150440216e-05, -3.402680158615112e-05, -3.1365081667900085e-05, -2.8703361749649048e-05, -2.604164183139801e-05, -2.3379921913146973e-05, -2.0718201994895935e-05, -1.8056482076644897e-05, -1.539476215839386e-05, -1.2733042240142822e-05, -1.0071322321891785e-05, -7.409602403640747e-06, -4.7478824853897095e-06, -2.086162567138672e-06, 5.755573511123657e-07, 3.2372772693634033e-06, 5.898997187614441e-06, 8.560717105865479e-06, 1.1222437024116516e-05, 1.3884156942367554e-05, 1.654587686061859e-05, 1.920759677886963e-05, 2.1869316697120667e-05, 2.4531036615371704e-05, 2.7192756533622742e-05, 2.985447645187378e-05, 3.251619637012482e-05, 3.5177916288375854e-05, 3.783963620662689e-05, 4.050135612487793e-05, 4.316307604312897e-05, 4.5824795961380005e-05, 4.848651587963104e-05, 5.114823579788208e-05, 5.380995571613312e-05, 5.6471675634384155e-05, 5.913339555263519e-05, 6.179511547088623e-05, 6.445683538913727e-05, 6.71185553073883e-05, 6.978027522563934e-05, 7.244199514389038e-05, 7.510371506214142e-05, 7.776543498039246e-05, 8.04271548986435e-05, 8.308887481689453e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 8.0, 7.0, 19.0, 23.0, 34.0, 40.0, 95.0, 194.0, 828.0, 15785.0, 1014337.0, 15840.0, 918.0, 181.0, 74.0, 45.0, 31.0, 29.0, 19.0, 17.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7683944702148438, -0.7467498779296875, -0.7251052856445312, -0.703460693359375, -0.6818161010742188, -0.6601715087890625, -0.6385269165039062, -0.61688232421875, -0.5952377319335938, -0.5735931396484375, -0.5519485473632812, -0.530303955078125, -0.5086593627929688, -0.4870147705078125, -0.46537017822265625, -0.4437255859375, -0.42208099365234375, -0.4004364013671875, -0.37879180908203125, -0.357147216796875, -0.33550262451171875, -0.3138580322265625, -0.29221343994140625, -0.27056884765625, -0.24892425537109375, -0.2272796630859375, -0.20563507080078125, -0.183990478515625, -0.16234588623046875, -0.1407012939453125, -0.11905670166015625, -0.097412109375, -0.07576751708984375, -0.0541229248046875, -0.03247833251953125, -0.010833740234375, 0.01081085205078125, 0.0324554443359375, 0.05410003662109375, 0.07574462890625, 0.09738922119140625, 0.1190338134765625, 0.14067840576171875, 0.162322998046875, 0.18396759033203125, 0.2056121826171875, 0.22725677490234375, 0.2489013671875, 0.27054595947265625, 0.2921905517578125, 0.31383514404296875, 0.335479736328125, 0.35712432861328125, 0.3787689208984375, 0.40041351318359375, 0.42205810546875, 0.44370269775390625, 0.4653472900390625, 0.48699188232421875, 0.508636474609375, 0.5302810668945312, 0.5519256591796875, 0.5735702514648438, 0.59521484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 12.0, 24.0, 22.0, 41.0, 73.0, 85.0, 127.0, 145.0, 143.0, 111.0, 67.0, 43.0, 32.0, 24.0, 14.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0655517578125, -0.06375694274902344, -0.061962127685546875, -0.06016731262207031, -0.05837249755859375, -0.05657768249511719, -0.054782867431640625, -0.05298805236816406, -0.0511932373046875, -0.04939842224121094, -0.047603607177734375, -0.04580879211425781, -0.04401397705078125, -0.04221916198730469, -0.040424346923828125, -0.03862953186035156, -0.036834716796875, -0.03503990173339844, -0.033245086669921875, -0.03145027160644531, -0.02965545654296875, -0.027860641479492188, -0.026065826416015625, -0.024271011352539062, -0.0224761962890625, -0.020681381225585938, -0.018886566162109375, -0.017091751098632812, -0.01529693603515625, -0.013502120971679688, -0.011707305908203125, -0.009912490844726562, -0.00811767578125, -0.0063228607177734375, -0.004528045654296875, -0.0027332305908203125, -0.00093841552734375, 0.0008563995361328125, 0.002651214599609375, 0.0044460296630859375, 0.0062408447265625, 0.008035659790039062, 0.009830474853515625, 0.011625289916992188, 0.01342010498046875, 0.015214920043945312, 0.017009735107421875, 0.018804550170898438, 0.020599365234375, 0.022394180297851562, 0.024188995361328125, 0.025983810424804688, 0.02777862548828125, 0.029573440551757812, 0.031368255615234375, 0.03316307067871094, 0.0349578857421875, 0.03675270080566406, 0.038547515869140625, 0.04034233093261719, 0.04213714599609375, 0.04393196105957031, 0.045726776123046875, 0.04752159118652344, 0.04931640625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 16.0, 22.0, 59.0, 153.0, 287.0, 246.0, 116.0, 47.0, 28.0, 11.0, 6.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.506767272949219, -11.064101219177246, -10.62143611907959, -10.178770065307617, -9.736104965209961, -9.293438911437988, -8.850772857666016, -8.40810775756836, -7.965441703796387, -7.522776126861572, -7.080110549926758, -6.637444496154785, -6.194778919219971, -5.752113342285156, -5.309447288513184, -4.866781711578369, -4.424116134643555, -3.9814505577087402, -3.5387847423553467, -3.096118927001953, -2.6534533500671387, -2.210787773132324, -1.7681219577789307, -1.325456142425537, -0.8827905654907227, -0.44012486934661865, 0.0025408267974853516, 0.44520652294158936, 0.8878722190856934, 1.3305377960205078, 1.7732036113739014, 2.215869426727295, 2.6585350036621094, 3.101200580596924, 3.5438663959503174, 3.986532211303711, 4.429197788238525, 4.87186336517334, 5.3145294189453125, 5.757194995880127, 6.199860572814941, 6.642526149749756, 7.08519172668457, 7.527857780456543, 7.970523357391357, 8.413188934326172, 8.855854988098145, 9.298521041870117, 9.741186141967773, 10.183852195739746, 10.626517295837402, 11.069183349609375, 11.511848449707031, 11.954514503479004, 12.397180557250977, 12.839845657348633, 13.282511711120605, 13.725177764892578, 14.167842864990234, 14.610508918762207, 15.05317497253418, 15.495840072631836, 15.938506126403809, 16.38117218017578, 16.823837280273438]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 7.0, 10.0, 12.0, 15.0, 11.0, 27.0, 19.0, 23.0, 21.0, 32.0, 30.0, 40.0, 40.0, 37.0, 42.0, 40.0, 49.0, 48.0, 44.0, 45.0, 45.0, 34.0, 34.0, 42.0, 38.0, 30.0, 26.0, 27.0, 22.0, 12.0, 14.0, 10.0, 11.0, 11.0, 7.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1854710578918457, -3.080415964126587, -2.975360870361328, -2.8703060150146484, -2.7652509212493896, -2.660195827484131, -2.555140733718872, -2.4500856399536133, -2.3450307846069336, -2.239975690841675, -2.134920597076416, -2.0298657417297363, -1.9248106479644775, -1.8197555541992188, -1.71470046043396, -1.6096453666687012, -1.5045902729034424, -1.3995351791381836, -1.2944802045822144, -1.1894251108169556, -1.0843701362609863, -0.9793150424957275, -0.8742599487304688, -0.7692049145698547, -0.6641498804092407, -0.5590948462486267, -0.4540397822856903, -0.3489847183227539, -0.2439296841621399, -0.13887465000152588, -0.03381955623626709, 0.07123547792434692, 0.17629051208496094, 0.28134554624557495, 0.38640061020851135, 0.49145567417144775, 0.5965107083320618, 0.7015657424926758, 0.8066208362579346, 0.9116758704185486, 1.0167309045791626, 1.1217859983444214, 1.2268409729003906, 1.3318960666656494, 1.4369511604309082, 1.5420061349868774, 1.6470612287521362, 1.7521162033081055, 1.8571712970733643, 1.962226390838623, 2.067281484603882, 2.1723365783691406, 2.2773914337158203, 2.382446527481079, 2.487501621246338, 2.5925567150115967, 2.6976118087768555, 2.8026669025421143, 2.907721996307373, 3.0127768516540527, 3.1178319454193115, 3.2228870391845703, 3.327942132949829, 3.432997226715088, 3.5380520820617676]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 8.0, 6.0, 15.0, 19.0, 31.0, 53.0, 69.0, 121.0, 193.0, 286.0, 516.0, 964.0, 1797.0, 3530.0, 7191.0, 15810.0, 38374.0, 112404.0, 434276.0, 301523.0, 78172.0, 28689.0, 12414.0, 5710.0, 2842.0, 1513.0, 820.0, 470.0, 254.0, 162.0, 109.0, 67.0, 35.0, 22.0, 29.0, 14.0, 11.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.380859375, -2.308380126953125, -2.23590087890625, -2.163421630859375, -2.0909423828125, -2.018463134765625, -1.94598388671875, -1.873504638671875, -1.801025390625, -1.728546142578125, -1.65606689453125, -1.583587646484375, -1.5111083984375, -1.438629150390625, -1.36614990234375, -1.293670654296875, -1.22119140625, -1.148712158203125, -1.07623291015625, -1.003753662109375, -0.9312744140625, -0.858795166015625, -0.78631591796875, -0.713836669921875, -0.641357421875, -0.568878173828125, -0.49639892578125, -0.423919677734375, -0.3514404296875, -0.278961181640625, -0.20648193359375, -0.134002685546875, -0.0615234375, 0.010955810546875, 0.08343505859375, 0.155914306640625, 0.2283935546875, 0.300872802734375, 0.37335205078125, 0.445831298828125, 0.518310546875, 0.590789794921875, 0.66326904296875, 0.735748291015625, 0.8082275390625, 0.880706787109375, 0.95318603515625, 1.025665283203125, 1.09814453125, 1.170623779296875, 1.24310302734375, 1.315582275390625, 1.3880615234375, 1.460540771484375, 1.53302001953125, 1.605499267578125, 1.677978515625, 1.750457763671875, 1.82293701171875, 1.895416259765625, 1.9678955078125, 2.040374755859375, 2.11285400390625, 2.185333251953125, 2.2578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 8.0, 6.0, 9.0, 9.0, 11.0, 18.0, 25.0, 23.0, 34.0, 34.0, 34.0, 57.0, 50.0, 52.0, 46.0, 54.0, 62.0, 46.0, 46.0, 46.0, 49.0, 49.0, 35.0, 26.0, 26.0, 21.0, 25.0, 16.0, 19.0, 9.0, 15.0, 2.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.953125, -11.6240234375, -11.294921875, -10.9658203125, -10.63671875, -10.3076171875, -9.978515625, -9.6494140625, -9.3203125, -8.9912109375, -8.662109375, -8.3330078125, -8.00390625, -7.6748046875, -7.345703125, -7.0166015625, -6.6875, -6.3583984375, -6.029296875, -5.7001953125, -5.37109375, -5.0419921875, -4.712890625, -4.3837890625, -4.0546875, -3.7255859375, -3.396484375, -3.0673828125, -2.73828125, -2.4091796875, -2.080078125, -1.7509765625, -1.421875, -1.0927734375, -0.763671875, -0.4345703125, -0.10546875, 0.2236328125, 0.552734375, 0.8818359375, 1.2109375, 1.5400390625, 1.869140625, 2.1982421875, 2.52734375, 2.8564453125, 3.185546875, 3.5146484375, 3.84375, 4.1728515625, 4.501953125, 4.8310546875, 5.16015625, 5.4892578125, 5.818359375, 6.1474609375, 6.4765625, 6.8056640625, 7.134765625, 7.4638671875, 7.79296875, 8.1220703125, 8.451171875, 8.7802734375, 9.109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 7.0, 9.0, 10.0, 16.0, 15.0, 12.0, 18.0, 26.0, 29.0, 45.0, 77.0, 125.0, 213.0, 509.0, 5236.0, 1013467.0, 27161.0, 888.0, 241.0, 133.0, 86.0, 41.0, 42.0, 31.0, 23.0, 14.0, 15.0, 12.0, 6.0, 7.0, 5.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.59375, -16.034423828125, -15.47509765625, -14.915771484375, -14.3564453125, -13.797119140625, -13.23779296875, -12.678466796875, -12.119140625, -11.559814453125, -11.00048828125, -10.441162109375, -9.8818359375, -9.322509765625, -8.76318359375, -8.203857421875, -7.64453125, -7.085205078125, -6.52587890625, -5.966552734375, -5.4072265625, -4.847900390625, -4.28857421875, -3.729248046875, -3.169921875, -2.610595703125, -2.05126953125, -1.491943359375, -0.9326171875, -0.373291015625, 0.18603515625, 0.745361328125, 1.3046875, 1.864013671875, 2.42333984375, 2.982666015625, 3.5419921875, 4.101318359375, 4.66064453125, 5.219970703125, 5.779296875, 6.338623046875, 6.89794921875, 7.457275390625, 8.0166015625, 8.575927734375, 9.13525390625, 9.694580078125, 10.25390625, 10.813232421875, 11.37255859375, 11.931884765625, 12.4912109375, 13.050537109375, 13.60986328125, 14.169189453125, 14.728515625, 15.287841796875, 15.84716796875, 16.406494140625, 16.9658203125, 17.525146484375, 18.08447265625, 18.643798828125, 19.203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 5.0, 7.0, 9.0, 12.0, 18.0, 23.0, 25.0, 27.0, 37.0, 34.0, 38.0, 58.0, 45.0, 54.0, 60.0, 49.0, 59.0, 52.0, 47.0, 44.0, 38.0, 44.0, 31.0, 36.0, 28.0, 22.0, 15.0, 14.0, 8.0, 9.0, 13.0, 11.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.984375, -11.6083984375, -11.232421875, -10.8564453125, -10.48046875, -10.1044921875, -9.728515625, -9.3525390625, -8.9765625, -8.6005859375, -8.224609375, -7.8486328125, -7.47265625, -7.0966796875, -6.720703125, -6.3447265625, -5.96875, -5.5927734375, -5.216796875, -4.8408203125, -4.46484375, -4.0888671875, -3.712890625, -3.3369140625, -2.9609375, -2.5849609375, -2.208984375, -1.8330078125, -1.45703125, -1.0810546875, -0.705078125, -0.3291015625, 0.046875, 0.4228515625, 0.798828125, 1.1748046875, 1.55078125, 1.9267578125, 2.302734375, 2.6787109375, 3.0546875, 3.4306640625, 3.806640625, 4.1826171875, 4.55859375, 4.9345703125, 5.310546875, 5.6865234375, 6.0625, 6.4384765625, 6.814453125, 7.1904296875, 7.56640625, 7.9423828125, 8.318359375, 8.6943359375, 9.0703125, 9.4462890625, 9.822265625, 10.1982421875, 10.57421875, 10.9501953125, 11.326171875, 11.7021484375, 12.078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 22.0, 36.0, 94.0, 522.0, 21710.0, 1022719.0, 3093.0, 235.0, 72.0, 19.0, 13.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.5350341796875, -5.382568359375, -5.2301025390625, -5.07763671875, -4.9251708984375, -4.772705078125, -4.6202392578125, -4.4677734375, -4.3153076171875, -4.162841796875, -4.0103759765625, -3.85791015625, -3.7054443359375, -3.552978515625, -3.4005126953125, -3.248046875, -3.0955810546875, -2.943115234375, -2.7906494140625, -2.63818359375, -2.4857177734375, -2.333251953125, -2.1807861328125, -2.0283203125, -1.8758544921875, -1.723388671875, -1.5709228515625, -1.41845703125, -1.2659912109375, -1.113525390625, -0.9610595703125, -0.80859375, -0.6561279296875, -0.503662109375, -0.3511962890625, -0.19873046875, -0.0462646484375, 0.106201171875, 0.2586669921875, 0.4111328125, 0.5635986328125, 0.716064453125, 0.8685302734375, 1.02099609375, 1.1734619140625, 1.325927734375, 1.4783935546875, 1.630859375, 1.7833251953125, 1.935791015625, 2.0882568359375, 2.24072265625, 2.3931884765625, 2.545654296875, 2.6981201171875, 2.8505859375, 3.0030517578125, 3.155517578125, 3.3079833984375, 3.46044921875, 3.6129150390625, 3.765380859375, 3.9178466796875, 4.0703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 11.0, 8.0, 15.0, 10.0, 23.0, 24.0, 27.0, 65.0, 80.0, 204.0, 227.0, 98.0, 64.0, 45.0, 26.0, 22.0, 16.0, 12.0, 13.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020873546600341797, -0.00020277313888072968, -0.00019681081175804138, -0.0001908484846353531, -0.0001848861575126648, -0.0001789238303899765, -0.0001729615032672882, -0.00016699917614459991, -0.00016103684902191162, -0.00015507452189922333, -0.00014911219477653503, -0.00014314986765384674, -0.00013718754053115845, -0.00013122521340847015, -0.00012526288628578186, -0.00011930055916309357, -0.00011333823204040527, -0.00010737590491771698, -0.00010141357779502869, -9.545125067234039e-05, -8.94889235496521e-05, -8.35265964269638e-05, -7.756426930427551e-05, -7.160194218158722e-05, -6.563961505889893e-05, -5.967728793621063e-05, -5.371496081352234e-05, -4.7752633690834045e-05, -4.179030656814575e-05, -3.582797944545746e-05, -2.9865652322769165e-05, -2.390332520008087e-05, -1.7940998077392578e-05, -1.1978670954704285e-05, -6.016343832015991e-06, -5.4016709327697754e-08, 5.908310413360596e-06, 1.187063753604889e-05, 1.7832964658737183e-05, 2.3795291781425476e-05, 2.975761890411377e-05, 3.571994602680206e-05, 4.1682273149490356e-05, 4.764460027217865e-05, 5.360692739486694e-05, 5.956925451755524e-05, 6.553158164024353e-05, 7.149390876293182e-05, 7.745623588562012e-05, 8.341856300830841e-05, 8.93808901309967e-05, 9.5343217253685e-05, 0.00010130554437637329, 0.00010726787149906158, 0.00011323019862174988, 0.00011919252574443817, 0.00012515485286712646, 0.00013111717998981476, 0.00013707950711250305, 0.00014304183423519135, 0.00014900416135787964, 0.00015496648848056793, 0.00016092881560325623, 0.00016689114272594452, 0.0001728534698486328]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 11.0, 22.0, 14.0, 58.0, 76.0, 338.0, 2908.0, 191046.0, 848906.0, 4513.0, 425.0, 103.0, 38.0, 21.0, 15.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -2.999847412109375, -2.90008544921875, -2.800323486328125, -2.7005615234375, -2.600799560546875, -2.50103759765625, -2.401275634765625, -2.301513671875, -2.201751708984375, -2.10198974609375, -2.002227783203125, -1.9024658203125, -1.802703857421875, -1.70294189453125, -1.603179931640625, -1.50341796875, -1.403656005859375, -1.30389404296875, -1.204132080078125, -1.1043701171875, -1.004608154296875, -0.90484619140625, -0.805084228515625, -0.705322265625, -0.605560302734375, -0.50579833984375, -0.406036376953125, -0.3062744140625, -0.206512451171875, -0.10675048828125, -0.006988525390625, 0.0927734375, 0.192535400390625, 0.29229736328125, 0.392059326171875, 0.4918212890625, 0.591583251953125, 0.69134521484375, 0.791107177734375, 0.890869140625, 0.990631103515625, 1.09039306640625, 1.190155029296875, 1.2899169921875, 1.389678955078125, 1.48944091796875, 1.589202880859375, 1.68896484375, 1.788726806640625, 1.88848876953125, 1.988250732421875, 2.0880126953125, 2.187774658203125, 2.28753662109375, 2.387298583984375, 2.487060546875, 2.586822509765625, 2.68658447265625, 2.786346435546875, 2.8861083984375, 2.985870361328125, 3.08563232421875, 3.185394287109375, 3.28515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 9.0, 15.0, 8.0, 15.0, 21.0, 23.0, 36.0, 51.0, 91.0, 400.0, 123.0, 62.0, 39.0, 29.0, 20.0, 13.0, 14.0, 6.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.49364471435546875, -0.4770355224609375, -0.46042633056640625, -0.443817138671875, -0.42720794677734375, -0.4105987548828125, -0.39398956298828125, -0.37738037109375, -0.36077117919921875, -0.3441619873046875, -0.32755279541015625, -0.310943603515625, -0.29433441162109375, -0.2777252197265625, -0.26111602783203125, -0.2445068359375, -0.22789764404296875, -0.2112884521484375, -0.19467926025390625, -0.178070068359375, -0.16146087646484375, -0.1448516845703125, -0.12824249267578125, -0.11163330078125, -0.09502410888671875, -0.0784149169921875, -0.06180572509765625, -0.045196533203125, -0.02858734130859375, -0.0119781494140625, 0.00463104248046875, 0.021240234375, 0.03784942626953125, 0.0544586181640625, 0.07106781005859375, 0.087677001953125, 0.10428619384765625, 0.1208953857421875, 0.13750457763671875, 0.15411376953125, 0.17072296142578125, 0.1873321533203125, 0.20394134521484375, 0.220550537109375, 0.23715972900390625, 0.2537689208984375, 0.27037811279296875, 0.2869873046875, 0.30359649658203125, 0.3202056884765625, 0.33681488037109375, 0.353424072265625, 0.37003326416015625, 0.3866424560546875, 0.40325164794921875, 0.41986083984375, 0.43647003173828125, 0.4530792236328125, 0.46968841552734375, 0.486297607421875, 0.5029067993164062, 0.5195159912109375, 0.5361251831054688, 0.552734375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 25.0, 874.0, 118.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.262463569641113, -11.119471549987793, -6.976479530334473, -2.8334875106811523, 1.309504508972168, 5.452496528625488, 9.595488548278809, 13.738480567932129, 17.881473541259766, 22.024465560913086, 26.167457580566406, 30.310449600219727, 34.45344161987305, 38.596435546875, 42.73942565917969, 46.882415771484375, 51.02540969848633, 55.16840362548828, 59.31139373779297, 63.454383850097656, 67.59738159179688, 71.74037170410156, 75.88336181640625, 80.02635192871094, 84.16934204101562, 88.31233215332031, 92.455322265625, 96.59832000732422, 100.7413101196289, 104.8843002319336, 109.02729797363281, 113.1702880859375, 117.31327819824219, 121.45626831054688, 125.59925842285156, 129.74224853515625, 133.88525390625, 138.0282440185547, 142.17123413085938, 146.31422424316406, 150.45721435546875, 154.60020446777344, 158.74319458007812, 162.8861846923828, 167.0291748046875, 171.17218017578125, 175.31517028808594, 179.45816040039062, 183.6011505126953, 187.744140625, 191.8871307373047, 196.03012084960938, 200.17312622070312, 204.3161163330078, 208.4591064453125, 212.6020965576172, 216.74508666992188, 220.88807678222656, 225.03106689453125, 229.17405700683594, 233.31704711914062, 237.46005249023438, 241.60304260253906, 245.74603271484375, 249.88902282714844]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 15.0, 7.0, 9.0, 15.0, 24.0, 10.0, 27.0, 37.0, 24.0, 37.0, 30.0, 37.0, 42.0, 28.0, 39.0, 29.0, 41.0, 40.0, 29.0, 37.0, 51.0, 30.0, 33.0, 28.0, 40.0, 40.0, 30.0, 31.0, 18.0, 20.0, 17.0, 23.0, 14.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.498571395874023, -14.053396224975586, -13.608222007751465, -13.163047790527344, -12.717872619628906, -12.272697448730469, -11.827523231506348, -11.382349014282227, -10.937173843383789, -10.491998672485352, -10.04682445526123, -9.60165023803711, -9.156475067138672, -8.711299896240234, -8.266125679016113, -7.820950984954834, -7.375776290893555, -6.930601596832275, -6.485426902770996, -6.040252208709717, -5.5950775146484375, -5.149902820587158, -4.704728126525879, -4.2595534324646, -3.8143787384033203, -3.369204044342041, -2.9240293502807617, -2.4788546562194824, -2.033679962158203, -1.5885052680969238, -1.1433305740356445, -0.6981558799743652, -0.25298213958740234, 0.19219255447387695, 0.6373672485351562, 1.0825419425964355, 1.5277166366577148, 1.9728913307189941, 2.4180660247802734, 2.8632407188415527, 3.308415412902832, 3.7535901069641113, 4.198764801025391, 4.64393949508667, 5.089114189147949, 5.5342888832092285, 5.979463577270508, 6.424638271331787, 6.869812965393066, 7.314987659454346, 7.760162353515625, 8.205337524414062, 8.650511741638184, 9.095685958862305, 9.540861129760742, 9.98603630065918, 10.4312105178833, 10.876384735107422, 11.32155990600586, 11.766735076904297, 12.211909294128418, 12.657083511352539, 13.102258682250977, 13.547433853149414, 13.992608070373535]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 3.0, 2.0, 5.0, 10.0, 6.0, 14.0, 24.0, 27.0, 46.0, 72.0, 72.0, 119.0, 256.0, 556.0, 1198.0, 3101.0, 9451.0, 38527.0, 259469.0, 3279838.0, 523369.0, 57709.0, 13499.0, 4046.0, 1460.0, 618.0, 301.0, 166.0, 81.0, 64.0, 44.0, 22.0, 22.0, 22.0, 13.0, 15.0, 6.0, 7.0, 3.0, 2.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.32232666015625, -5.1485595703125, -4.97479248046875, -4.801025390625, -4.62725830078125, -4.4534912109375, -4.27972412109375, -4.10595703125, -3.93218994140625, -3.7584228515625, -3.58465576171875, -3.410888671875, -3.23712158203125, -3.0633544921875, -2.88958740234375, -2.7158203125, -2.54205322265625, -2.3682861328125, -2.19451904296875, -2.020751953125, -1.84698486328125, -1.6732177734375, -1.49945068359375, -1.32568359375, -1.15191650390625, -0.9781494140625, -0.80438232421875, -0.630615234375, -0.45684814453125, -0.2830810546875, -0.10931396484375, 0.064453125, 0.23822021484375, 0.4119873046875, 0.58575439453125, 0.759521484375, 0.93328857421875, 1.1070556640625, 1.28082275390625, 1.45458984375, 1.62835693359375, 1.8021240234375, 1.97589111328125, 2.149658203125, 2.32342529296875, 2.4971923828125, 2.67095947265625, 2.8447265625, 3.01849365234375, 3.1922607421875, 3.36602783203125, 3.539794921875, 3.71356201171875, 3.8873291015625, 4.06109619140625, 4.23486328125, 4.40863037109375, 4.5823974609375, 4.75616455078125, 4.929931640625, 5.10369873046875, 5.2774658203125, 5.45123291015625, 5.625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 17.0, 15.0, 16.0, 14.0, 16.0, 32.0, 33.0, 33.0, 60.0, 44.0, 60.0, 58.0, 56.0, 64.0, 57.0, 54.0, 58.0, 51.0, 40.0, 31.0, 30.0, 38.0, 32.0, 20.0, 15.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.213714599609375, -4.08367919921875, -3.953643798828125, -3.8236083984375, -3.693572998046875, -3.56353759765625, -3.433502197265625, -3.303466796875, -3.173431396484375, -3.04339599609375, -2.913360595703125, -2.7833251953125, -2.653289794921875, -2.52325439453125, -2.393218994140625, -2.26318359375, -2.133148193359375, -2.00311279296875, -1.873077392578125, -1.7430419921875, -1.613006591796875, -1.48297119140625, -1.352935791015625, -1.222900390625, -1.092864990234375, -0.96282958984375, -0.832794189453125, -0.7027587890625, -0.572723388671875, -0.44268798828125, -0.312652587890625, -0.1826171875, -0.052581787109375, 0.07745361328125, 0.207489013671875, 0.3375244140625, 0.467559814453125, 0.59759521484375, 0.727630615234375, 0.857666015625, 0.987701416015625, 1.11773681640625, 1.247772216796875, 1.3778076171875, 1.507843017578125, 1.63787841796875, 1.767913818359375, 1.89794921875, 2.027984619140625, 2.15802001953125, 2.288055419921875, 2.4180908203125, 2.548126220703125, 2.67816162109375, 2.808197021484375, 2.938232421875, 3.068267822265625, 3.19830322265625, 3.328338623046875, 3.4583740234375, 3.588409423828125, 3.71844482421875, 3.848480224609375, 3.978515625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 18.0, 50.0, 492.0, 4193322.0, 342.0, 35.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.625, -119.73046875, -114.8359375, -109.94140625, -105.046875, -100.15234375, -95.2578125, -90.36328125, -85.46875, -80.57421875, -75.6796875, -70.78515625, -65.890625, -60.99609375, -56.1015625, -51.20703125, -46.3125, -41.41796875, -36.5234375, -31.62890625, -26.734375, -21.83984375, -16.9453125, -12.05078125, -7.15625, -2.26171875, 2.6328125, 7.52734375, 12.421875, 17.31640625, 22.2109375, 27.10546875, 32.0, 36.89453125, 41.7890625, 46.68359375, 51.578125, 56.47265625, 61.3671875, 66.26171875, 71.15625, 76.05078125, 80.9453125, 85.83984375, 90.734375, 95.62890625, 100.5234375, 105.41796875, 110.3125, 115.20703125, 120.1015625, 124.99609375, 129.890625, 134.78515625, 139.6796875, 144.57421875, 149.46875, 154.36328125, 159.2578125, 164.15234375, 169.046875, 173.94140625, 178.8359375, 183.73046875, 188.625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 14.0, 20.0, 15.0, 49.0, 85.0, 158.0, 305.0, 769.0, 1611.0, 575.0, 199.0, 118.0, 60.0, 29.0, 19.0, 14.0, 12.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.19140625, -3.1209716796875, -3.050537109375, -2.9801025390625, -2.90966796875, -2.8392333984375, -2.768798828125, -2.6983642578125, -2.6279296875, -2.5574951171875, -2.487060546875, -2.4166259765625, -2.34619140625, -2.2757568359375, -2.205322265625, -2.1348876953125, -2.064453125, -1.9940185546875, -1.923583984375, -1.8531494140625, -1.78271484375, -1.7122802734375, -1.641845703125, -1.5714111328125, -1.5009765625, -1.4305419921875, -1.360107421875, -1.2896728515625, -1.21923828125, -1.1488037109375, -1.078369140625, -1.0079345703125, -0.9375, -0.8670654296875, -0.796630859375, -0.7261962890625, -0.65576171875, -0.5853271484375, -0.514892578125, -0.4444580078125, -0.3740234375, -0.3035888671875, -0.233154296875, -0.1627197265625, -0.09228515625, -0.0218505859375, 0.048583984375, 0.1190185546875, 0.189453125, 0.2598876953125, 0.330322265625, 0.4007568359375, 0.47119140625, 0.5416259765625, 0.612060546875, 0.6824951171875, 0.7529296875, 0.8233642578125, 0.893798828125, 0.9642333984375, 1.03466796875, 1.1051025390625, 1.175537109375, 1.2459716796875, 1.31640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 17.0, 36.0, 72.0, 132.0, 197.0, 202.0, 149.0, 88.0, 34.0, 30.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.766993522644043, -9.421097755432129, -9.075201034545898, -8.729305267333984, -8.383408546447754, -8.03751277923584, -7.691616535186768, -7.345720291137695, -6.999824523925781, -6.653928279876709, -6.308032035827637, -5.962136268615723, -5.61624002456665, -5.270343780517578, -4.924447536468506, -4.578551292419434, -4.232655048370361, -3.886758804321289, -3.540862798690796, -3.1949665546417236, -2.8490705490112305, -2.503174304962158, -2.157278060913086, -1.8113820552825928, -1.4654858112335205, -1.1195896863937378, -0.7736935019493103, -0.4277973175048828, -0.0819011926651001, 0.2639949321746826, 0.6098911762237549, 0.955787181854248, 1.3016834259033203, 1.647579550743103, 1.9934756755828857, 2.339371919631958, 2.685267925262451, 3.0311641693115234, 3.3770604133605957, 3.722956418991089, 4.068852424621582, 4.414748668670654, 4.760644912719727, 5.106540679931641, 5.452436923980713, 5.798333168029785, 6.144229412078857, 6.49012565612793, 6.836021900177002, 7.181918144226074, 7.5278143882751465, 7.873710632324219, 8.219606399536133, 8.565502166748047, 8.911398887634277, 9.257294654846191, 9.603191375732422, 9.949087142944336, 10.294983863830566, 10.64087963104248, 10.986776351928711, 11.332672119140625, 11.678567886352539, 12.02446460723877, 12.370360374450684]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 3.0, 15.0, 13.0, 18.0, 16.0, 19.0, 30.0, 31.0, 36.0, 40.0, 42.0, 40.0, 48.0, 53.0, 54.0, 53.0, 55.0, 53.0, 45.0, 39.0, 39.0, 44.0, 30.0, 29.0, 28.0, 26.0, 17.0, 22.0, 10.0, 11.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.364370822906494, -3.2407140731811523, -3.1170573234558105, -2.9934005737304688, -2.869743824005127, -2.746087074279785, -2.6224303245544434, -2.4987733364105225, -2.3751165866851807, -2.251459836959839, -2.127803087234497, -2.0041463375091553, -1.880489468574524, -1.7568327188491821, -1.6331759691238403, -1.509519100189209, -1.3858624696731567, -1.262205719947815, -1.1385489702224731, -1.0148921012878418, -0.8912353515625, -0.7675786018371582, -0.6439218521118164, -0.5202650427818298, -0.39660829305648804, -0.27295151352882385, -0.14929474890232086, -0.02563798427581787, 0.09801879525184631, 0.2216755747795105, 0.3453323245048523, 0.46898913383483887, 0.5926458835601807, 0.7163026332855225, 0.839959442615509, 0.9636161923408508, 1.0872730016708374, 1.2109297513961792, 1.334586501121521, 1.4582433700561523, 1.5819001197814941, 1.705556869506836, 1.8292136192321777, 1.9528703689575195, 2.0765271186828613, 2.200183868408203, 2.323840618133545, 2.447497606277466, 2.5711541175842285, 2.6948108673095703, 2.818467617034912, 2.942124366760254, 3.0657811164855957, 3.1894378662109375, 3.3130946159362793, 3.4367516040802, 3.560408353805542, 3.684065103530884, 3.8077218532562256, 3.9313786029815674, 4.055035591125488, 4.17869234085083, 4.302349090576172, 4.426005840301514, 4.5496625900268555]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 8.0, 7.0, 11.0, 14.0, 18.0, 27.0, 33.0, 58.0, 82.0, 103.0, 160.0, 197.0, 352.0, 499.0, 853.0, 1540.0, 3093.0, 7817.0, 27015.0, 169650.0, 666331.0, 133886.0, 23345.0, 6887.0, 2859.0, 1396.0, 758.0, 505.0, 317.0, 208.0, 141.0, 120.0, 73.0, 45.0, 38.0, 29.0, 23.0, 18.0, 8.0, 8.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.7744140625, -0.749786376953125, -0.72515869140625, -0.700531005859375, -0.6759033203125, -0.651275634765625, -0.62664794921875, -0.602020263671875, -0.577392578125, -0.552764892578125, -0.52813720703125, -0.503509521484375, -0.4788818359375, -0.454254150390625, -0.42962646484375, -0.404998779296875, -0.38037109375, -0.355743408203125, -0.33111572265625, -0.306488037109375, -0.2818603515625, -0.257232666015625, -0.23260498046875, -0.207977294921875, -0.183349609375, -0.158721923828125, -0.13409423828125, -0.109466552734375, -0.0848388671875, -0.060211181640625, -0.03558349609375, -0.010955810546875, 0.013671875, 0.038299560546875, 0.06292724609375, 0.087554931640625, 0.1121826171875, 0.136810302734375, 0.16143798828125, 0.186065673828125, 0.210693359375, 0.235321044921875, 0.25994873046875, 0.284576416015625, 0.3092041015625, 0.333831787109375, 0.35845947265625, 0.383087158203125, 0.40771484375, 0.432342529296875, 0.45697021484375, 0.481597900390625, 0.5062255859375, 0.530853271484375, 0.55548095703125, 0.580108642578125, 0.604736328125, 0.629364013671875, 0.65399169921875, 0.678619384765625, 0.7032470703125, 0.727874755859375, 0.75250244140625, 0.777130126953125, 0.8017578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 1.0, 6.0, 4.0, 5.0, 11.0, 15.0, 16.0, 15.0, 18.0, 25.0, 29.0, 40.0, 31.0, 41.0, 51.0, 47.0, 52.0, 60.0, 53.0, 47.0, 53.0, 51.0, 51.0, 43.0, 28.0, 29.0, 30.0, 26.0, 21.0, 10.0, 14.0, 14.0, 10.0, 11.0, 6.0, 7.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.5, -2.414886474609375, -2.32977294921875, -2.244659423828125, -2.1595458984375, -2.074432373046875, -1.98931884765625, -1.904205322265625, -1.819091796875, -1.733978271484375, -1.64886474609375, -1.563751220703125, -1.4786376953125, -1.393524169921875, -1.30841064453125, -1.223297119140625, -1.13818359375, -1.053070068359375, -0.96795654296875, -0.882843017578125, -0.7977294921875, -0.712615966796875, -0.62750244140625, -0.542388916015625, -0.457275390625, -0.372161865234375, -0.28704833984375, -0.201934814453125, -0.1168212890625, -0.031707763671875, 0.05340576171875, 0.138519287109375, 0.2236328125, 0.308746337890625, 0.39385986328125, 0.478973388671875, 0.5640869140625, 0.649200439453125, 0.73431396484375, 0.819427490234375, 0.904541015625, 0.989654541015625, 1.07476806640625, 1.159881591796875, 1.2449951171875, 1.330108642578125, 1.41522216796875, 1.500335693359375, 1.58544921875, 1.670562744140625, 1.75567626953125, 1.840789794921875, 1.9259033203125, 2.011016845703125, 2.09613037109375, 2.181243896484375, 2.266357421875, 2.351470947265625, 2.43658447265625, 2.521697998046875, 2.6068115234375, 2.691925048828125, 2.77703857421875, 2.862152099609375, 2.947265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 11.0, 8.0, 16.0, 11.0, 23.0, 18.0, 41.0, 39.0, 52.0, 65.0, 110.0, 148.0, 203.0, 299.0, 485.0, 865.0, 2777.0, 35718.0, 806301.0, 190806.0, 7352.0, 1304.0, 605.0, 354.0, 258.0, 188.0, 142.0, 89.0, 58.0, 55.0, 33.0, 30.0, 19.0, 17.0, 7.0, 9.0, 4.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.91943359375, -0.8936996459960938, -0.8679656982421875, -0.8422317504882812, -0.816497802734375, -0.7907638549804688, -0.7650299072265625, -0.7392959594726562, -0.71356201171875, -0.6878280639648438, -0.6620941162109375, -0.6363601684570312, -0.610626220703125, -0.5848922729492188, -0.5591583251953125, -0.5334243774414062, -0.5076904296875, -0.48195648193359375, -0.4562225341796875, -0.43048858642578125, -0.404754638671875, -0.37902069091796875, -0.3532867431640625, -0.32755279541015625, -0.30181884765625, -0.27608489990234375, -0.2503509521484375, -0.22461700439453125, -0.198883056640625, -0.17314910888671875, -0.1474151611328125, -0.12168121337890625, -0.095947265625, -0.07021331787109375, -0.0444793701171875, -0.01874542236328125, 0.006988525390625, 0.03272247314453125, 0.0584564208984375, 0.08419036865234375, 0.10992431640625, 0.13565826416015625, 0.1613922119140625, 0.18712615966796875, 0.212860107421875, 0.23859405517578125, 0.2643280029296875, 0.29006195068359375, 0.3157958984375, 0.34152984619140625, 0.3672637939453125, 0.39299774169921875, 0.418731689453125, 0.44446563720703125, 0.4701995849609375, 0.49593353271484375, 0.52166748046875, 0.5474014282226562, 0.5731353759765625, 0.5988693237304688, 0.624603271484375, 0.6503372192382812, 0.6760711669921875, 0.7018051147460938, 0.7275390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 10.0, 4.0, 10.0, 16.0, 14.0, 20.0, 30.0, 25.0, 28.0, 26.0, 38.0, 39.0, 38.0, 35.0, 39.0, 39.0, 64.0, 42.0, 48.0, 50.0, 41.0, 31.0, 40.0, 48.0, 34.0, 28.0, 20.0, 23.0, 26.0, 15.0, 14.0, 17.0, 7.0, 10.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.57421875, -4.43536376953125, -4.2965087890625, -4.15765380859375, -4.018798828125, -3.87994384765625, -3.7410888671875, -3.60223388671875, -3.46337890625, -3.32452392578125, -3.1856689453125, -3.04681396484375, -2.907958984375, -2.76910400390625, -2.6302490234375, -2.49139404296875, -2.3525390625, -2.21368408203125, -2.0748291015625, -1.93597412109375, -1.797119140625, -1.65826416015625, -1.5194091796875, -1.38055419921875, -1.24169921875, -1.10284423828125, -0.9639892578125, -0.82513427734375, -0.686279296875, -0.54742431640625, -0.4085693359375, -0.26971435546875, -0.130859375, 0.00799560546875, 0.1468505859375, 0.28570556640625, 0.424560546875, 0.56341552734375, 0.7022705078125, 0.84112548828125, 0.97998046875, 1.11883544921875, 1.2576904296875, 1.39654541015625, 1.535400390625, 1.67425537109375, 1.8131103515625, 1.95196533203125, 2.0908203125, 2.22967529296875, 2.3685302734375, 2.50738525390625, 2.646240234375, 2.78509521484375, 2.9239501953125, 3.06280517578125, 3.20166015625, 3.34051513671875, 3.4793701171875, 3.61822509765625, 3.757080078125, 3.89593505859375, 4.0347900390625, 4.17364501953125, 4.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 4.0, 7.0, 14.0, 8.0, 18.0, 26.0, 28.0, 32.0, 89.0, 143.0, 347.0, 999.0, 9163.0, 1015782.0, 19607.0, 1388.0, 432.0, 183.0, 90.0, 49.0, 25.0, 21.0, 22.0, 11.0, 14.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2705078125, -0.2636756896972656, -0.25684356689453125, -0.2500114440917969, -0.2431793212890625, -0.23634719848632812, -0.22951507568359375, -0.22268295288085938, -0.215850830078125, -0.20901870727539062, -0.20218658447265625, -0.19535446166992188, -0.1885223388671875, -0.18169021606445312, -0.17485809326171875, -0.16802597045898438, -0.16119384765625, -0.15436172485351562, -0.14752960205078125, -0.14069747924804688, -0.1338653564453125, -0.12703323364257812, -0.12020111083984375, -0.11336898803710938, -0.106536865234375, -0.09970474243164062, -0.09287261962890625, -0.08604049682617188, -0.0792083740234375, -0.07237625122070312, -0.06554412841796875, -0.058712005615234375, -0.0518798828125, -0.045047760009765625, -0.03821563720703125, -0.031383514404296875, -0.0245513916015625, -0.017719268798828125, -0.01088714599609375, -0.004055023193359375, 0.002777099609375, 0.009609222412109375, 0.01644134521484375, 0.023273468017578125, 0.0301055908203125, 0.036937713623046875, 0.04376983642578125, 0.050601959228515625, 0.05743408203125, 0.06426620483398438, 0.07109832763671875, 0.07793045043945312, 0.0847625732421875, 0.09159469604492188, 0.09842681884765625, 0.10525894165039062, 0.112091064453125, 0.11892318725585938, 0.12575531005859375, 0.13258743286132812, 0.1394195556640625, 0.14625167846679688, 0.15308380126953125, 0.15991592407226562, 0.166748046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 18.0, 13.0, 48.0, 65.0, 120.0, 178.0, 179.0, 136.0, 81.0, 40.0, 25.0, 18.0, 20.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-05, -8.57347622513771e-05, -8.265860378742218e-05, -7.958244532346725e-05, -7.650628685951233e-05, -7.34301283955574e-05, -7.035396993160248e-05, -6.727781146764755e-05, -6.420165300369263e-05, -6.11254945397377e-05, -5.8049336075782776e-05, -5.497317761182785e-05, -5.1897019147872925e-05, -4.8820860683918e-05, -4.5744702219963074e-05, -4.266854375600815e-05, -3.959238529205322e-05, -3.65162268280983e-05, -3.344006836414337e-05, -3.0363909900188446e-05, -2.728775143623352e-05, -2.4211592972278595e-05, -2.113543450832367e-05, -1.8059276044368744e-05, -1.4983117580413818e-05, -1.1906959116458893e-05, -8.830800652503967e-06, -5.754642188549042e-06, -2.678483724594116e-06, 3.976747393608093e-07, 3.473833203315735e-06, 6.54999166727066e-06, 9.626150131225586e-06, 1.2702308595180511e-05, 1.5778467059135437e-05, 1.8854625523090363e-05, 2.1930783987045288e-05, 2.5006942451000214e-05, 2.808310091495514e-05, 3.1159259378910065e-05, 3.423541784286499e-05, 3.7311576306819916e-05, 4.038773477077484e-05, 4.346389323472977e-05, 4.654005169868469e-05, 4.961621016263962e-05, 5.2692368626594543e-05, 5.576852709054947e-05, 5.8844685554504395e-05, 6.192084401845932e-05, 6.499700248241425e-05, 6.807316094636917e-05, 7.11493194103241e-05, 7.422547787427902e-05, 7.730163633823395e-05, 8.037779480218887e-05, 8.34539532661438e-05, 8.653011173009872e-05, 8.960627019405365e-05, 9.268242865800858e-05, 9.57585871219635e-05, 9.883474558591843e-05, 0.00010191090404987335, 0.00010498706251382828, 0.0001080632209777832]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 11.0, 37.0, 1628.0, 1046088.0, 688.0, 38.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33160400390625, -2.2550048828125, -2.17840576171875, -2.101806640625, -2.02520751953125, -1.9486083984375, -1.87200927734375, -1.79541015625, -1.71881103515625, -1.6422119140625, -1.56561279296875, -1.489013671875, -1.41241455078125, -1.3358154296875, -1.25921630859375, -1.1826171875, -1.10601806640625, -1.0294189453125, -0.95281982421875, -0.876220703125, -0.79962158203125, -0.7230224609375, -0.64642333984375, -0.56982421875, -0.49322509765625, -0.4166259765625, -0.34002685546875, -0.263427734375, -0.18682861328125, -0.1102294921875, -0.03363037109375, 0.04296875, 0.11956787109375, 0.1961669921875, 0.27276611328125, 0.349365234375, 0.42596435546875, 0.5025634765625, 0.57916259765625, 0.65576171875, 0.73236083984375, 0.8089599609375, 0.88555908203125, 0.962158203125, 1.03875732421875, 1.1153564453125, 1.19195556640625, 1.2685546875, 1.34515380859375, 1.4217529296875, 1.49835205078125, 1.574951171875, 1.65155029296875, 1.7281494140625, 1.80474853515625, 1.88134765625, 1.95794677734375, 2.0345458984375, 2.11114501953125, 2.187744140625, 2.26434326171875, 2.3409423828125, 2.41754150390625, 2.494140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 5.0, 6.0, 8.0, 34.0, 176.0, 572.0, 115.0, 29.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.093505859375, -0.0905294418334961, -0.08755302429199219, -0.08457660675048828, -0.08160018920898438, -0.07862377166748047, -0.07564735412597656, -0.07267093658447266, -0.06969451904296875, -0.06671810150146484, -0.06374168395996094, -0.06076526641845703, -0.057788848876953125, -0.05481243133544922, -0.05183601379394531, -0.048859596252441406, -0.0458831787109375, -0.042906761169433594, -0.03993034362792969, -0.03695392608642578, -0.033977508544921875, -0.03100109100341797, -0.028024673461914062, -0.025048255920410156, -0.02207183837890625, -0.019095420837402344, -0.016119003295898438, -0.013142585754394531, -0.010166168212890625, -0.007189750671386719, -0.0042133331298828125, -0.0012369155883789062, 0.001739501953125, 0.004715919494628906, 0.0076923370361328125, 0.010668754577636719, 0.013645172119140625, 0.01662158966064453, 0.019598007202148438, 0.022574424743652344, 0.02555084228515625, 0.028527259826660156, 0.03150367736816406, 0.03448009490966797, 0.037456512451171875, 0.04043292999267578, 0.04340934753417969, 0.046385765075683594, 0.0493621826171875, 0.052338600158691406, 0.05531501770019531, 0.05829143524169922, 0.061267852783203125, 0.06424427032470703, 0.06722068786621094, 0.07019710540771484, 0.07317352294921875, 0.07614994049072266, 0.07912635803222656, 0.08210277557373047, 0.08507919311523438, 0.08805561065673828, 0.09103202819824219, 0.0940084457397461, 0.09698486328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 13.0, 33.0, 70.0, 151.0, 292.0, 235.0, 110.0, 48.0, 18.0, 11.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.63742208480835, -7.33046817779541, -7.0235137939453125, -6.716559886932373, -6.409605503082275, -6.102651596069336, -5.795697212219238, -5.488743305206299, -5.181789398193359, -4.87483549118042, -4.567881107330322, -4.260927200317383, -3.953972816467285, -3.6470189094543457, -3.340064764022827, -3.0331106185913086, -2.726156234741211, -2.4192020893096924, -2.112247943878174, -1.8052939176559448, -1.4983397722244263, -1.1913856267929077, -0.8844316005706787, -0.5774774551391602, -0.2705233097076416, 0.036430805921554565, 0.34338492155075073, 0.6503390073776245, 0.9572931528091431, 1.2642472982406616, 1.5712013244628906, 1.8781554698944092, 2.1851091384887695, 2.492063283920288, 2.7990174293518066, 3.105971336364746, 3.4129257202148438, 3.719879627227783, 4.026833534240723, 4.33378791809082, 4.640742301940918, 4.947696208953857, 5.254650592803955, 5.5616044998168945, 5.868558883666992, 6.175512790679932, 6.482466697692871, 6.789421081542969, 7.096374988555908, 7.403328895568848, 7.710283279418945, 8.017237663269043, 8.324191093444824, 8.631145477294922, 8.93809986114502, 9.245054244995117, 9.552007675170898, 9.858962059020996, 10.165915489196777, 10.472869873046875, 10.779824256896973, 11.08677864074707, 11.393732070922852, 11.70068645477295, 12.007640838623047]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 2.0, 14.0, 10.0, 18.0, 10.0, 24.0, 22.0, 30.0, 34.0, 39.0, 44.0, 44.0, 44.0, 51.0, 62.0, 72.0, 56.0, 49.0, 52.0, 47.0, 47.0, 36.0, 30.0, 23.0, 22.0, 23.0, 20.0, 19.0, 10.0, 6.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.516392469406128, -2.4287919998168945, -2.341191530227661, -2.2535910606384277, -2.1659905910491943, -2.078390121459961, -1.990789771080017, -1.9031893014907837, -1.8155888319015503, -1.727988362312317, -1.6403878927230835, -1.5527875423431396, -1.4651870727539062, -1.3775866031646729, -1.2899861335754395, -1.202385663986206, -1.1147851943969727, -1.0271847248077393, -0.9395842552185059, -0.8519838452339172, -0.7643833756446838, -0.6767829060554504, -0.5891824960708618, -0.5015820264816284, -0.413981556892395, -0.3263810873031616, -0.2387806475162506, -0.1511802077293396, -0.0635797381401062, 0.024020731449127197, 0.11162114143371582, 0.19922161102294922, 0.2868218421936035, 0.3744223117828369, 0.4620227515697479, 0.5496231913566589, 0.6372236609458923, 0.7248241305351257, 0.8124245405197144, 0.9000250101089478, 0.9876254796981812, 1.0752259492874146, 1.162826418876648, 1.2504267692565918, 1.3380272388458252, 1.4256277084350586, 1.513228178024292, 1.6008286476135254, 1.6884291172027588, 1.7760295867919922, 1.8636300563812256, 1.951230525970459, 2.0388309955596924, 2.126431465148926, 2.21403169631958, 2.3016324043273926, 2.389232635498047, 2.4768331050872803, 2.5644335746765137, 2.652034044265747, 2.7396345138549805, 2.827234983444214, 2.9148354530334473, 3.0024356842041016, 3.090036392211914]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 7.0, 12.0, 9.0, 22.0, 34.0, 50.0, 78.0, 98.0, 167.0, 274.0, 402.0, 679.0, 1081.0, 2003.0, 3382.0, 6032.0, 11946.0, 25280.0, 64717.0, 259796.0, 481897.0, 116629.0, 38000.0, 16808.0, 8321.0, 4489.0, 2536.0, 1491.0, 885.0, 486.0, 309.0, 215.0, 139.0, 86.0, 69.0, 42.0, 25.0, 15.0, 14.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.484375, -1.4336090087890625, -1.382843017578125, -1.3320770263671875, -1.28131103515625, -1.2305450439453125, -1.179779052734375, -1.1290130615234375, -1.0782470703125, -1.0274810791015625, -0.976715087890625, -0.9259490966796875, -0.87518310546875, -0.8244171142578125, -0.773651123046875, -0.7228851318359375, -0.672119140625, -0.6213531494140625, -0.570587158203125, -0.5198211669921875, -0.46905517578125, -0.4182891845703125, -0.367523193359375, -0.3167572021484375, -0.2659912109375, -0.2152252197265625, -0.164459228515625, -0.1136932373046875, -0.06292724609375, -0.0121612548828125, 0.038604736328125, 0.0893707275390625, 0.14013671875, 0.1909027099609375, 0.241668701171875, 0.2924346923828125, 0.34320068359375, 0.3939666748046875, 0.444732666015625, 0.4954986572265625, 0.5462646484375, 0.5970306396484375, 0.647796630859375, 0.6985626220703125, 0.74932861328125, 0.8000946044921875, 0.850860595703125, 0.9016265869140625, 0.952392578125, 1.0031585693359375, 1.053924560546875, 1.1046905517578125, 1.15545654296875, 1.2062225341796875, 1.256988525390625, 1.3077545166015625, 1.3585205078125, 1.4092864990234375, 1.460052490234375, 1.5108184814453125, 1.56158447265625, 1.6123504638671875, 1.663116455078125, 1.7138824462890625, 1.7646484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 9.0, 14.0, 15.0, 20.0, 25.0, 34.0, 29.0, 42.0, 38.0, 50.0, 59.0, 62.0, 53.0, 65.0, 59.0, 66.0, 56.0, 53.0, 55.0, 32.0, 31.0, 26.0, 28.0, 13.0, 20.0, 6.0, 11.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.33203125, -7.07305908203125, -6.8140869140625, -6.55511474609375, -6.296142578125, -6.03717041015625, -5.7781982421875, -5.51922607421875, -5.26025390625, -5.00128173828125, -4.7423095703125, -4.48333740234375, -4.224365234375, -3.96539306640625, -3.7064208984375, -3.44744873046875, -3.1884765625, -2.92950439453125, -2.6705322265625, -2.41156005859375, -2.152587890625, -1.89361572265625, -1.6346435546875, -1.37567138671875, -1.11669921875, -0.85772705078125, -0.5987548828125, -0.33978271484375, -0.080810546875, 0.17816162109375, 0.4371337890625, 0.69610595703125, 0.955078125, 1.21405029296875, 1.4730224609375, 1.73199462890625, 1.990966796875, 2.24993896484375, 2.5089111328125, 2.76788330078125, 3.02685546875, 3.28582763671875, 3.5447998046875, 3.80377197265625, 4.062744140625, 4.32171630859375, 4.5806884765625, 4.83966064453125, 5.0986328125, 5.35760498046875, 5.6165771484375, 5.87554931640625, 6.134521484375, 6.39349365234375, 6.6524658203125, 6.91143798828125, 7.17041015625, 7.42938232421875, 7.6883544921875, 7.94732666015625, 8.206298828125, 8.46527099609375, 8.7242431640625, 8.98321533203125, 9.2421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 10.0, 13.0, 4.0, 4.0, 10.0, 16.0, 9.0, 15.0, 23.0, 19.0, 33.0, 41.0, 30.0, 46.0, 38.0, 46.0, 93.0, 785.0, 1038977.0, 7744.0, 153.0, 68.0, 52.0, 38.0, 37.0, 33.0, 32.0, 34.0, 19.0, 15.0, 19.0, 18.0, 20.0, 9.0, 6.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.006103515625, -19.30908203125, -18.612060546875, -17.9150390625, -17.218017578125, -16.52099609375, -15.823974609375, -15.126953125, -14.429931640625, -13.73291015625, -13.035888671875, -12.3388671875, -11.641845703125, -10.94482421875, -10.247802734375, -9.55078125, -8.853759765625, -8.15673828125, -7.459716796875, -6.7626953125, -6.065673828125, -5.36865234375, -4.671630859375, -3.974609375, -3.277587890625, -2.58056640625, -1.883544921875, -1.1865234375, -0.489501953125, 0.20751953125, 0.904541015625, 1.6015625, 2.298583984375, 2.99560546875, 3.692626953125, 4.3896484375, 5.086669921875, 5.78369140625, 6.480712890625, 7.177734375, 7.874755859375, 8.57177734375, 9.268798828125, 9.9658203125, 10.662841796875, 11.35986328125, 12.056884765625, 12.75390625, 13.450927734375, 14.14794921875, 14.844970703125, 15.5419921875, 16.239013671875, 16.93603515625, 17.633056640625, 18.330078125, 19.027099609375, 19.72412109375, 20.421142578125, 21.1181640625, 21.815185546875, 22.51220703125, 23.209228515625, 23.90625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 6.0, 7.0, 15.0, 5.0, 6.0, 7.0, 18.0, 12.0, 17.0, 18.0, 18.0, 37.0, 35.0, 29.0, 43.0, 34.0, 39.0, 50.0, 52.0, 49.0, 45.0, 44.0, 47.0, 46.0, 36.0, 31.0, 33.0, 36.0, 34.0, 25.0, 19.0, 17.0, 18.0, 17.0, 9.0, 10.0, 5.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.11590576171875, -6.8685302734375, -6.62115478515625, -6.373779296875, -6.12640380859375, -5.8790283203125, -5.63165283203125, -5.38427734375, -5.13690185546875, -4.8895263671875, -4.64215087890625, -4.394775390625, -4.14739990234375, -3.9000244140625, -3.65264892578125, -3.4052734375, -3.15789794921875, -2.9105224609375, -2.66314697265625, -2.415771484375, -2.16839599609375, -1.9210205078125, -1.67364501953125, -1.42626953125, -1.17889404296875, -0.9315185546875, -0.68414306640625, -0.436767578125, -0.18939208984375, 0.0579833984375, 0.30535888671875, 0.552734375, 0.80010986328125, 1.0474853515625, 1.29486083984375, 1.542236328125, 1.78961181640625, 2.0369873046875, 2.28436279296875, 2.53173828125, 2.77911376953125, 3.0264892578125, 3.27386474609375, 3.521240234375, 3.76861572265625, 4.0159912109375, 4.26336669921875, 4.5107421875, 4.75811767578125, 5.0054931640625, 5.25286865234375, 5.500244140625, 5.74761962890625, 5.9949951171875, 6.24237060546875, 6.48974609375, 6.73712158203125, 6.9844970703125, 7.23187255859375, 7.479248046875, 7.72662353515625, 7.9739990234375, 8.22137451171875, 8.46875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 14.0, 20.0, 26.0, 50.0, 74.0, 162.0, 417.0, 1225.0, 5174.0, 42713.0, 898313.0, 89000.0, 8648.0, 1682.0, 539.0, 233.0, 95.0, 57.0, 32.0, 10.0, 11.0, 4.0, 9.0, 10.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.173828125, -1.1280364990234375, -1.082244873046875, -1.0364532470703125, -0.99066162109375, -0.9448699951171875, -0.899078369140625, -0.8532867431640625, -0.8074951171875, -0.7617034912109375, -0.715911865234375, -0.6701202392578125, -0.62432861328125, -0.5785369873046875, -0.532745361328125, -0.4869537353515625, -0.441162109375, -0.3953704833984375, -0.349578857421875, -0.3037872314453125, -0.25799560546875, -0.2122039794921875, -0.166412353515625, -0.1206207275390625, -0.0748291015625, -0.0290374755859375, 0.016754150390625, 0.0625457763671875, 0.10833740234375, 0.1541290283203125, 0.199920654296875, 0.2457122802734375, 0.29150390625, 0.3372955322265625, 0.383087158203125, 0.4288787841796875, 0.47467041015625, 0.5204620361328125, 0.566253662109375, 0.6120452880859375, 0.6578369140625, 0.7036285400390625, 0.749420166015625, 0.7952117919921875, 0.84100341796875, 0.8867950439453125, 0.932586669921875, 0.9783782958984375, 1.024169921875, 1.0699615478515625, 1.115753173828125, 1.1615447998046875, 1.20733642578125, 1.2531280517578125, 1.298919677734375, 1.3447113037109375, 1.3905029296875, 1.4362945556640625, 1.482086181640625, 1.5278778076171875, 1.57366943359375, 1.6194610595703125, 1.665252685546875, 1.7110443115234375, 1.7568359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 3.0, 4.0, 8.0, 6.0, 8.0, 19.0, 28.0, 24.0, 54.0, 92.0, 119.0, 212.0, 145.0, 79.0, 46.0, 37.0, 24.0, 18.0, 11.0, 8.0, 7.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015735626220703125, -0.00015265494585037231, -0.00014795362949371338, -0.00014325231313705444, -0.0001385509967803955, -0.00013384968042373657, -0.00012914836406707764, -0.0001244470477104187, -0.00011974573135375977, -0.00011504441499710083, -0.0001103430986404419, -0.00010564178228378296, -0.00010094046592712402, -9.623914957046509e-05, -9.153783321380615e-05, -8.683651685714722e-05, -8.213520050048828e-05, -7.743388414382935e-05, -7.273256778717041e-05, -6.803125143051147e-05, -6.332993507385254e-05, -5.8628618717193604e-05, -5.392730236053467e-05, -4.922598600387573e-05, -4.45246696472168e-05, -3.982335329055786e-05, -3.5122036933898926e-05, -3.042072057723999e-05, -2.5719404220581055e-05, -2.101808786392212e-05, -1.6316771507263184e-05, -1.1615455150604248e-05, -6.9141387939453125e-06, -2.212822437286377e-06, 2.4884939193725586e-06, 7.189810276031494e-06, 1.189112663269043e-05, 1.6592442989349365e-05, 2.12937593460083e-05, 2.5995075702667236e-05, 3.069639205932617e-05, 3.539770841598511e-05, 4.009902477264404e-05, 4.480034112930298e-05, 4.9501657485961914e-05, 5.420297384262085e-05, 5.8904290199279785e-05, 6.360560655593872e-05, 6.830692291259766e-05, 7.300823926925659e-05, 7.770955562591553e-05, 8.241087198257446e-05, 8.71121883392334e-05, 9.181350469589233e-05, 9.651482105255127e-05, 0.0001012161374092102, 0.00010591745376586914, 0.00011061877012252808, 0.00011532008647918701, 0.00012002140283584595, 0.00012472271919250488, 0.00012942403554916382, 0.00013412535190582275, 0.0001388266682624817, 0.00014352798461914062]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 31.0, 21.0, 46.0, 93.0, 164.0, 467.0, 1522.0, 8459.0, 117213.0, 887216.0, 28555.0, 3403.0, 836.0, 258.0, 105.0, 63.0, 31.0, 18.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689453125, -1.617218017578125, -1.56549072265625, -1.513763427734375, -1.4620361328125, -1.410308837890625, -1.35858154296875, -1.306854248046875, -1.255126953125, -1.203399658203125, -1.15167236328125, -1.099945068359375, -1.0482177734375, -0.996490478515625, -0.94476318359375, -0.893035888671875, -0.84130859375, -0.789581298828125, -0.73785400390625, -0.686126708984375, -0.6343994140625, -0.582672119140625, -0.53094482421875, -0.479217529296875, -0.427490234375, -0.375762939453125, -0.32403564453125, -0.272308349609375, -0.2205810546875, -0.168853759765625, -0.11712646484375, -0.065399169921875, -0.013671875, 0.038055419921875, 0.08978271484375, 0.141510009765625, 0.1932373046875, 0.244964599609375, 0.29669189453125, 0.348419189453125, 0.400146484375, 0.451873779296875, 0.50360107421875, 0.555328369140625, 0.6070556640625, 0.658782958984375, 0.71051025390625, 0.762237548828125, 0.81396484375, 0.865692138671875, 0.91741943359375, 0.969146728515625, 1.0208740234375, 1.072601318359375, 1.12432861328125, 1.176055908203125, 1.227783203125, 1.279510498046875, 1.33123779296875, 1.382965087890625, 1.4346923828125, 1.486419677734375, 1.53814697265625, 1.589874267578125, 1.6416015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 8.0, 9.0, 8.0, 15.0, 21.0, 25.0, 34.0, 38.0, 67.0, 168.0, 292.0, 99.0, 36.0, 33.0, 35.0, 20.0, 21.0, 11.0, 12.0, 13.0, 6.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.3382377624511719, -0.32808685302734375, -0.3179359436035156, -0.3077850341796875, -0.2976341247558594, -0.28748321533203125, -0.2773323059082031, -0.267181396484375, -0.2570304870605469, -0.24687957763671875, -0.23672866821289062, -0.2265777587890625, -0.21642684936523438, -0.20627593994140625, -0.19612503051757812, -0.18597412109375, -0.17582321166992188, -0.16567230224609375, -0.15552139282226562, -0.1453704833984375, -0.13521957397460938, -0.12506866455078125, -0.11491775512695312, -0.104766845703125, -0.09461593627929688, -0.08446502685546875, -0.07431411743164062, -0.0641632080078125, -0.054012298583984375, -0.04386138916015625, -0.033710479736328125, -0.0235595703125, -0.013408660888671875, -0.00325775146484375, 0.006893157958984375, 0.0170440673828125, 0.027194976806640625, 0.03734588623046875, 0.047496795654296875, 0.057647705078125, 0.06779861450195312, 0.07794952392578125, 0.08810043334960938, 0.0982513427734375, 0.10840225219726562, 0.11855316162109375, 0.12870407104492188, 0.13885498046875, 0.14900588989257812, 0.15915679931640625, 0.16930770874023438, 0.1794586181640625, 0.18960952758789062, 0.19976043701171875, 0.20991134643554688, 0.220062255859375, 0.23021316528320312, 0.24036407470703125, 0.2505149841308594, 0.2606658935546875, 0.2708168029785156, 0.28096771240234375, 0.2911186218261719, 0.30126953125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 7.0, 5.0, 15.0, 33.0, 62.0, 156.0, 224.0, 226.0, 148.0, 64.0, 25.0, 15.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.979602813720703, -9.483386039733887, -8.987170219421387, -8.49095344543457, -7.994737148284912, -7.498520851135254, -7.002304553985596, -6.5060882568359375, -6.009871482849121, -5.513655185699463, -5.017438888549805, -4.521222114562988, -4.02500581741333, -3.528789520263672, -3.0325732231140137, -2.5363566875457764, -2.0401406288146973, -1.5439242124557495, -1.0477077960968018, -0.5514914989471436, -0.0552750825881958, 0.44094133377075195, 0.9371576309204102, 1.4333741664886475, 1.9295904636383057, 2.425806760787964, 2.922023296356201, 3.4182395935058594, 3.9144558906555176, 4.410672187805176, 4.906888961791992, 5.40310525894165, 5.899321556091309, 6.395537853240967, 6.891754150390625, 7.387970924377441, 7.8841872215271, 8.380403518676758, 8.876619338989258, 9.372836112976074, 9.86905288696289, 10.365269660949707, 10.861485481262207, 11.357702255249023, 11.853918075561523, 12.35013484954834, 12.846351623535156, 13.342567443847656, 13.838783264160156, 14.335000038146973, 14.831215858459473, 15.327432632446289, 15.823648452758789, 16.319866180419922, 16.816082000732422, 17.312297821044922, 17.808515548706055, 18.304731369018555, 18.800949096679688, 19.297164916992188, 19.793380737304688, 20.289596557617188, 20.78581428527832, 21.28203010559082, 21.77824592590332]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 8.0, 13.0, 13.0, 14.0, 19.0, 16.0, 16.0, 29.0, 26.0, 35.0, 37.0, 34.0, 41.0, 38.0, 46.0, 57.0, 36.0, 42.0, 46.0, 37.0, 39.0, 25.0, 34.0, 45.0, 31.0, 33.0, 17.0, 20.0, 29.0, 17.0, 22.0, 8.0, 15.0, 11.0, 7.0, 8.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.61107063293457, -11.232358932495117, -10.85364818572998, -10.474936485290527, -10.096224784851074, -9.717514038085938, -9.338802337646484, -8.960090637207031, -8.581379890441895, -8.202668190002441, -7.8239569664001465, -7.445245742797852, -7.066534519195557, -6.687823295593262, -6.309111595153809, -5.930400371551514, -5.5516886711120605, -5.172977447509766, -4.7942657470703125, -4.415554523468018, -4.036843299865723, -3.6581318378448486, -3.2794203758239746, -2.9007091522216797, -2.5219976902008057, -2.1432862281799316, -1.7645750045776367, -1.3858635425567627, -1.0071521997451782, -0.6284408569335938, -0.24972939491271973, 0.1289818286895752, 0.5076932907104492, 0.8864046335220337, 1.2651159763336182, 1.6438274383544922, 2.022538661956787, 2.401250123977661, 2.779961585998535, 3.15867280960083, 3.537384271621704, 3.916095733642578, 4.294806957244873, 4.673518180847168, 5.052229881286621, 5.430941104888916, 5.809652328491211, 6.188364028930664, 6.567075252532959, 6.945786476135254, 7.324498176574707, 7.703209400177002, 8.081920623779297, 8.46063232421875, 8.839344024658203, 9.21805477142334, 9.596766471862793, 9.975478172302246, 10.354188919067383, 10.732900619506836, 11.111612319946289, 11.490323066711426, 11.869034767150879, 12.247745513916016, 12.626457214355469]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 8.0, 10.0, 15.0, 20.0, 31.0, 23.0, 44.0, 41.0, 72.0, 114.0, 271.0, 745.0, 2862.0, 15365.0, 191906.0, 3812124.0, 153112.0, 13495.0, 2645.0, 707.0, 257.0, 103.0, 84.0, 50.0, 35.0, 24.0, 27.0, 15.0, 13.0, 16.0, 4.0, 4.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7578125, -8.4703369140625, -8.182861328125, -7.8953857421875, -7.60791015625, -7.3204345703125, -7.032958984375, -6.7454833984375, -6.4580078125, -6.1705322265625, -5.883056640625, -5.5955810546875, -5.30810546875, -5.0206298828125, -4.733154296875, -4.4456787109375, -4.158203125, -3.8707275390625, -3.583251953125, -3.2957763671875, -3.00830078125, -2.7208251953125, -2.433349609375, -2.1458740234375, -1.8583984375, -1.5709228515625, -1.283447265625, -0.9959716796875, -0.70849609375, -0.4210205078125, -0.133544921875, 0.1539306640625, 0.44140625, 0.7288818359375, 1.016357421875, 1.3038330078125, 1.59130859375, 1.8787841796875, 2.166259765625, 2.4537353515625, 2.7412109375, 3.0286865234375, 3.316162109375, 3.6036376953125, 3.89111328125, 4.1785888671875, 4.466064453125, 4.7535400390625, 5.041015625, 5.3284912109375, 5.615966796875, 5.9034423828125, 6.19091796875, 6.4783935546875, 6.765869140625, 7.0533447265625, 7.3408203125, 7.6282958984375, 7.915771484375, 8.2032470703125, 8.49072265625, 8.7781982421875, 9.065673828125, 9.3531494140625, 9.640625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 24.0, 11.0, 23.0, 23.0, 47.0, 41.0, 50.0, 60.0, 55.0, 75.0, 80.0, 74.0, 74.0, 65.0, 69.0, 44.0, 39.0, 31.0, 24.0, 22.0, 14.0, 11.0, 13.0, 6.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.546722412109375, -3.42352294921875, -3.300323486328125, -3.1771240234375, -3.053924560546875, -2.93072509765625, -2.807525634765625, -2.684326171875, -2.561126708984375, -2.43792724609375, -2.314727783203125, -2.1915283203125, -2.068328857421875, -1.94512939453125, -1.821929931640625, -1.69873046875, -1.575531005859375, -1.45233154296875, -1.329132080078125, -1.2059326171875, -1.082733154296875, -0.95953369140625, -0.836334228515625, -0.713134765625, -0.589935302734375, -0.46673583984375, -0.343536376953125, -0.2203369140625, -0.097137451171875, 0.02606201171875, 0.149261474609375, 0.2724609375, 0.395660400390625, 0.51885986328125, 0.642059326171875, 0.7652587890625, 0.888458251953125, 1.01165771484375, 1.134857177734375, 1.258056640625, 1.381256103515625, 1.50445556640625, 1.627655029296875, 1.7508544921875, 1.874053955078125, 1.99725341796875, 2.120452880859375, 2.24365234375, 2.366851806640625, 2.49005126953125, 2.613250732421875, 2.7364501953125, 2.859649658203125, 2.98284912109375, 3.106048583984375, 3.229248046875, 3.352447509765625, 3.47564697265625, 3.598846435546875, 3.7220458984375, 3.845245361328125, 3.96844482421875, 4.091644287109375, 4.21484375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 31.0, 162.0, 37008.0, 4156717.0, 290.0, 45.0, 14.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-39.0, -37.0625, -35.125, -33.1875, -31.25, -29.3125, -27.375, -25.4375, -23.5, -21.5625, -19.625, -17.6875, -15.75, -13.8125, -11.875, -9.9375, -8.0, -6.0625, -4.125, -2.1875, -0.25, 1.6875, 3.625, 5.5625, 7.5, 9.4375, 11.375, 13.3125, 15.25, 17.1875, 19.125, 21.0625, 23.0, 24.9375, 26.875, 28.8125, 30.75, 32.6875, 34.625, 36.5625, 38.5, 40.4375, 42.375, 44.3125, 46.25, 48.1875, 50.125, 52.0625, 54.0, 55.9375, 57.875, 59.8125, 61.75, 63.6875, 65.625, 67.5625, 69.5, 71.4375, 73.375, 75.3125, 77.25, 79.1875, 81.125, 83.0625, 85.0]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 7.0, 3.0, 12.0, 13.0, 26.0, 29.0, 31.0, 42.0, 56.0, 92.0, 133.0, 212.0, 320.0, 642.0, 1093.0, 538.0, 273.0, 170.0, 96.0, 90.0, 52.0, 30.0, 27.0, 25.0, 14.0, 15.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5322265625, -1.4932861328125, -1.454345703125, -1.4154052734375, -1.37646484375, -1.3375244140625, -1.298583984375, -1.2596435546875, -1.220703125, -1.1817626953125, -1.142822265625, -1.1038818359375, -1.06494140625, -1.0260009765625, -0.987060546875, -0.9481201171875, -0.9091796875, -0.8702392578125, -0.831298828125, -0.7923583984375, -0.75341796875, -0.7144775390625, -0.675537109375, -0.6365966796875, -0.59765625, -0.5587158203125, -0.519775390625, -0.4808349609375, -0.44189453125, -0.4029541015625, -0.364013671875, -0.3250732421875, -0.2861328125, -0.2471923828125, -0.208251953125, -0.1693115234375, -0.13037109375, -0.0914306640625, -0.052490234375, -0.0135498046875, 0.025390625, 0.0643310546875, 0.103271484375, 0.1422119140625, 0.18115234375, 0.2200927734375, 0.259033203125, 0.2979736328125, 0.3369140625, 0.3758544921875, 0.414794921875, 0.4537353515625, 0.49267578125, 0.5316162109375, 0.570556640625, 0.6094970703125, 0.6484375, 0.6873779296875, 0.726318359375, 0.7652587890625, 0.80419921875, 0.8431396484375, 0.882080078125, 0.9210205078125, 0.9599609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 15.0, 23.0, 19.0, 45.0, 65.0, 144.0, 187.0, 200.0, 131.0, 73.0, 35.0, 18.0, 13.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.594799518585205, -7.32333517074585, -7.051871299743652, -6.780406951904297, -6.508942604064941, -6.237478733062744, -5.966014385223389, -5.694550514221191, -5.423086166381836, -5.1516218185424805, -4.880157947540283, -4.608693599700928, -4.3372297286987305, -4.065765380859375, -3.7943010330200195, -3.522836923599243, -3.251372814178467, -2.9799087047576904, -2.708444595336914, -2.4369802474975586, -2.1655161380767822, -1.8940520286560059, -1.62258780002594, -1.351123571395874, -1.0796594619750977, -0.8081952929496765, -0.5367311239242554, -0.26526695489883423, 0.006197214126586914, 0.2776613235473633, 0.5491255521774292, 0.8205897808074951, 1.0920543670654297, 1.363518476486206, 1.634982705116272, 1.906446933746338, 2.1779110431671143, 2.4493751525878906, 2.720839500427246, 2.9923036098480225, 3.263767719268799, 3.535231828689575, 3.8066959381103516, 4.078160285949707, 4.3496246337890625, 4.62108850479126, 4.892552852630615, 5.1640167236328125, 5.435481071472168, 5.706945419311523, 5.978409290313721, 6.249873638153076, 6.521337509155273, 6.792801856994629, 7.064266204833984, 7.33573055267334, 7.607194423675537, 7.878658771514893, 8.15012264251709, 8.421586990356445, 8.6930513381958, 8.964515686035156, 9.235979080200195, 9.50744342803955, 9.778907775878906]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 10.0, 6.0, 10.0, 10.0, 22.0, 24.0, 28.0, 31.0, 32.0, 43.0, 50.0, 56.0, 48.0, 58.0, 57.0, 54.0, 41.0, 63.0, 53.0, 52.0, 32.0, 33.0, 28.0, 32.0, 26.0, 24.0, 19.0, 12.0, 9.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1172287464141846, -2.9991238117218018, -2.881018877029419, -2.7629141807556152, -2.6448092460632324, -2.5267043113708496, -2.408599376678467, -2.290494441986084, -2.172389507293701, -2.0542845726013184, -1.936179757118225, -1.8180748224258423, -1.699970006942749, -1.5818650722503662, -1.4637601375579834, -1.3456552028656006, -1.2275505065917969, -1.109445571899414, -0.9913407564163208, -0.873235821723938, -0.7551309466362, -0.6370260715484619, -0.5189211368560791, -0.40081626176834106, -0.282711386680603, -0.1646064966917038, -0.046501606702804565, 0.07160329818725586, 0.1897081732749939, 0.30781304836273193, 0.42591798305511475, 0.5440228581428528, 0.6621274948120117, 0.7802323698997498, 0.8983372449874878, 1.0164421796798706, 1.1345469951629639, 1.2526519298553467, 1.3707568645477295, 1.4888617992401123, 1.6069666147232056, 1.7250715494155884, 1.8431763648986816, 1.9612812995910645, 2.0793862342834473, 2.19749116897583, 2.315596103668213, 2.4337007999420166, 2.5518057346343994, 2.6699106693267822, 2.788015604019165, 2.9061203002929688, 3.0242252349853516, 3.1423301696777344, 3.260435104370117, 3.3785400390625, 3.496644973754883, 3.6147499084472656, 3.7328548431396484, 3.8509597778320312, 3.969064474105835, 4.087169647216797, 4.20527458190918, 4.323379039764404, 4.441483974456787]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 12.0, 15.0, 25.0, 52.0, 86.0, 175.0, 445.0, 1516.0, 8770.0, 927640.0, 104583.0, 3748.0, 901.0, 297.0, 114.0, 53.0, 35.0, 28.0, 20.0, 7.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.439453125, -2.3849945068359375, -2.330535888671875, -2.2760772705078125, -2.22161865234375, -2.1671600341796875, -2.112701416015625, -2.0582427978515625, -2.0037841796875, -1.9493255615234375, -1.894866943359375, -1.8404083251953125, -1.78594970703125, -1.7314910888671875, -1.677032470703125, -1.6225738525390625, -1.568115234375, -1.5136566162109375, -1.459197998046875, -1.4047393798828125, -1.35028076171875, -1.2958221435546875, -1.241363525390625, -1.1869049072265625, -1.1324462890625, -1.0779876708984375, -1.023529052734375, -0.9690704345703125, -0.91461181640625, -0.8601531982421875, -0.805694580078125, -0.7512359619140625, -0.69677734375, -0.6423187255859375, -0.587860107421875, -0.5334014892578125, -0.47894287109375, -0.4244842529296875, -0.370025634765625, -0.3155670166015625, -0.2611083984375, -0.2066497802734375, -0.152191162109375, -0.0977325439453125, -0.04327392578125, 0.0111846923828125, 0.065643310546875, 0.1201019287109375, 0.174560546875, 0.2290191650390625, 0.283477783203125, 0.3379364013671875, 0.39239501953125, 0.4468536376953125, 0.501312255859375, 0.5557708740234375, 0.6102294921875, 0.6646881103515625, 0.719146728515625, 0.7736053466796875, 0.82806396484375, 0.8825225830078125, 0.936981201171875, 0.9914398193359375, 1.0458984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 6.0, 18.0, 24.0, 20.0, 25.0, 55.0, 79.0, 85.0, 108.0, 105.0, 96.0, 92.0, 73.0, 66.0, 53.0, 36.0, 22.0, 14.0, 9.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.41473388671875, -2.2708740234375, -2.12701416015625, -1.983154296875, -1.83929443359375, -1.6954345703125, -1.55157470703125, -1.40771484375, -1.26385498046875, -1.1199951171875, -0.97613525390625, -0.832275390625, -0.68841552734375, -0.5445556640625, -0.40069580078125, -0.2568359375, -0.11297607421875, 0.0308837890625, 0.17474365234375, 0.318603515625, 0.46246337890625, 0.6063232421875, 0.75018310546875, 0.89404296875, 1.03790283203125, 1.1817626953125, 1.32562255859375, 1.469482421875, 1.61334228515625, 1.7572021484375, 1.90106201171875, 2.044921875, 2.18878173828125, 2.3326416015625, 2.47650146484375, 2.620361328125, 2.76422119140625, 2.9080810546875, 3.05194091796875, 3.19580078125, 3.33966064453125, 3.4835205078125, 3.62738037109375, 3.771240234375, 3.91510009765625, 4.0589599609375, 4.20281982421875, 4.3466796875, 4.49053955078125, 4.6343994140625, 4.77825927734375, 4.922119140625, 5.06597900390625, 5.2098388671875, 5.35369873046875, 5.49755859375, 5.64141845703125, 5.7852783203125, 5.92913818359375, 6.072998046875, 6.21685791015625, 6.3607177734375, 6.50457763671875, 6.6484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 18.0, 17.0, 21.0, 27.0, 31.0, 57.0, 62.0, 72.0, 96.0, 147.0, 171.0, 287.0, 404.0, 846.0, 3011.0, 23559.0, 395629.0, 582816.0, 35063.0, 3739.0, 969.0, 406.0, 285.0, 197.0, 145.0, 117.0, 83.0, 64.0, 39.0, 29.0, 35.0, 19.0, 23.0, 8.0, 9.0, 3.0, 2.0, 6.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.448974609375, -0.4361763000488281, -0.42337799072265625, -0.4105796813964844, -0.3977813720703125, -0.3849830627441406, -0.37218475341796875, -0.3593864440917969, -0.346588134765625, -0.3337898254394531, -0.32099151611328125, -0.3081932067871094, -0.2953948974609375, -0.2825965881347656, -0.26979827880859375, -0.2569999694824219, -0.24420166015625, -0.23140335083007812, -0.21860504150390625, -0.20580673217773438, -0.1930084228515625, -0.18021011352539062, -0.16741180419921875, -0.15461349487304688, -0.141815185546875, -0.12901687622070312, -0.11621856689453125, -0.10342025756835938, -0.0906219482421875, -0.07782363891601562, -0.06502532958984375, -0.052227020263671875, -0.0394287109375, -0.026630401611328125, -0.01383209228515625, -0.001033782958984375, 0.0117645263671875, 0.024562835693359375, 0.03736114501953125, 0.050159454345703125, 0.062957763671875, 0.07575607299804688, 0.08855438232421875, 0.10135269165039062, 0.1141510009765625, 0.12694931030273438, 0.13974761962890625, 0.15254592895507812, 0.16534423828125, 0.17814254760742188, 0.19094085693359375, 0.20373916625976562, 0.2165374755859375, 0.22933578491210938, 0.24213409423828125, 0.2549324035644531, 0.267730712890625, 0.2805290222167969, 0.29332733154296875, 0.3061256408691406, 0.3189239501953125, 0.3317222595214844, 0.34452056884765625, 0.3573188781738281, 0.3701171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 12.0, 13.0, 19.0, 20.0, 26.0, 25.0, 31.0, 42.0, 36.0, 40.0, 50.0, 59.0, 59.0, 54.0, 58.0, 39.0, 49.0, 52.0, 49.0, 27.0, 28.0, 31.0, 37.0, 24.0, 16.0, 14.0, 10.0, 7.0, 9.0, 8.0, 9.0, 2.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.671875, -4.547119140625, -4.42236328125, -4.297607421875, -4.1728515625, -4.048095703125, -3.92333984375, -3.798583984375, -3.673828125, -3.549072265625, -3.42431640625, -3.299560546875, -3.1748046875, -3.050048828125, -2.92529296875, -2.800537109375, -2.67578125, -2.551025390625, -2.42626953125, -2.301513671875, -2.1767578125, -2.052001953125, -1.92724609375, -1.802490234375, -1.677734375, -1.552978515625, -1.42822265625, -1.303466796875, -1.1787109375, -1.053955078125, -0.92919921875, -0.804443359375, -0.6796875, -0.554931640625, -0.43017578125, -0.305419921875, -0.1806640625, -0.055908203125, 0.06884765625, 0.193603515625, 0.318359375, 0.443115234375, 0.56787109375, 0.692626953125, 0.8173828125, 0.942138671875, 1.06689453125, 1.191650390625, 1.31640625, 1.441162109375, 1.56591796875, 1.690673828125, 1.8154296875, 1.940185546875, 2.06494140625, 2.189697265625, 2.314453125, 2.439208984375, 2.56396484375, 2.688720703125, 2.8134765625, 2.938232421875, 3.06298828125, 3.187744140625, 3.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 25.0, 25.0, 31.0, 52.0, 77.0, 100.0, 206.0, 391.0, 1143.0, 9857.0, 1000508.0, 33053.0, 1872.0, 534.0, 230.0, 143.0, 94.0, 56.0, 27.0, 25.0, 19.0, 14.0, 11.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.277099609375, -0.2699298858642578, -0.2627601623535156, -0.25559043884277344, -0.24842071533203125, -0.24125099182128906, -0.23408126831054688, -0.2269115447998047, -0.2197418212890625, -0.2125720977783203, -0.20540237426757812, -0.19823265075683594, -0.19106292724609375, -0.18389320373535156, -0.17672348022460938, -0.1695537567138672, -0.162384033203125, -0.1552143096923828, -0.14804458618164062, -0.14087486267089844, -0.13370513916015625, -0.12653541564941406, -0.11936569213867188, -0.11219596862792969, -0.1050262451171875, -0.09785652160644531, -0.09068679809570312, -0.08351707458496094, -0.07634735107421875, -0.06917762756347656, -0.062007904052734375, -0.05483818054199219, -0.04766845703125, -0.04049873352050781, -0.033329010009765625, -0.026159286499023438, -0.01898956298828125, -0.011819839477539062, -0.004650115966796875, 0.0025196075439453125, 0.0096893310546875, 0.016859054565429688, 0.024028778076171875, 0.031198501586914062, 0.03836822509765625, 0.04553794860839844, 0.052707672119140625, 0.05987739562988281, 0.067047119140625, 0.07421684265136719, 0.08138656616210938, 0.08855628967285156, 0.09572601318359375, 0.10289573669433594, 0.11006546020507812, 0.11723518371582031, 0.1244049072265625, 0.1315746307373047, 0.13874435424804688, 0.14591407775878906, 0.15308380126953125, 0.16025352478027344, 0.16742324829101562, 0.1745929718017578, 0.1817626953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 5.0, 9.0, 15.0, 35.0, 38.0, 50.0, 88.0, 144.0, 186.0, 145.0, 89.0, 55.0, 56.0, 16.0, 18.0, 9.0, 9.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.094310760498047e-05, -7.810443639755249e-05, -7.526576519012451e-05, -7.242709398269653e-05, -6.958842277526855e-05, -6.674975156784058e-05, -6.39110803604126e-05, -6.107240915298462e-05, -5.823373794555664e-05, -5.539506673812866e-05, -5.2556395530700684e-05, -4.9717724323272705e-05, -4.6879053115844727e-05, -4.404038190841675e-05, -4.120171070098877e-05, -3.836303949356079e-05, -3.552436828613281e-05, -3.2685697078704834e-05, -2.9847025871276855e-05, -2.7008354663848877e-05, -2.41696834564209e-05, -2.133101224899292e-05, -1.849234104156494e-05, -1.5653669834136963e-05, -1.2814998626708984e-05, -9.976327419281006e-06, -7.137656211853027e-06, -4.298985004425049e-06, -1.4603137969970703e-06, 1.3783574104309082e-06, 4.217028617858887e-06, 7.055699825286865e-06, 9.894371032714844e-06, 1.2733042240142822e-05, 1.55717134475708e-05, 1.841038465499878e-05, 2.1249055862426758e-05, 2.4087727069854736e-05, 2.6926398277282715e-05, 2.9765069484710693e-05, 3.260374069213867e-05, 3.544241189956665e-05, 3.828108310699463e-05, 4.111975431442261e-05, 4.3958425521850586e-05, 4.6797096729278564e-05, 4.963576793670654e-05, 5.247443914413452e-05, 5.53131103515625e-05, 5.815178155899048e-05, 6.099045276641846e-05, 6.382912397384644e-05, 6.666779518127441e-05, 6.950646638870239e-05, 7.234513759613037e-05, 7.518380880355835e-05, 7.802248001098633e-05, 8.08611512184143e-05, 8.369982242584229e-05, 8.653849363327026e-05, 8.937716484069824e-05, 9.221583604812622e-05, 9.50545072555542e-05, 9.789317846298218e-05, 0.00010073184967041016]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 6.0, 22.0, 20.0, 76.0, 217.0, 796.0, 6014.0, 934239.0, 103415.0, 2904.0, 532.0, 163.0, 66.0, 30.0, 17.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31640625, -0.3046226501464844, -0.29283905029296875, -0.2810554504394531, -0.2692718505859375, -0.2574882507324219, -0.24570465087890625, -0.23392105102539062, -0.222137451171875, -0.21035385131835938, -0.19857025146484375, -0.18678665161132812, -0.1750030517578125, -0.16321945190429688, -0.15143585205078125, -0.13965225219726562, -0.12786865234375, -0.11608505249023438, -0.10430145263671875, -0.09251785278320312, -0.0807342529296875, -0.06895065307617188, -0.05716705322265625, -0.045383453369140625, -0.033599853515625, -0.021816253662109375, -0.01003265380859375, 0.001750946044921875, 0.0135345458984375, 0.025318145751953125, 0.03710174560546875, 0.048885345458984375, 0.0606689453125, 0.07245254516601562, 0.08423614501953125, 0.09601974487304688, 0.1078033447265625, 0.11958694458007812, 0.13137054443359375, 0.14315414428710938, 0.154937744140625, 0.16672134399414062, 0.17850494384765625, 0.19028854370117188, 0.2020721435546875, 0.21385574340820312, 0.22563934326171875, 0.23742294311523438, 0.24920654296875, 0.2609901428222656, 0.27277374267578125, 0.2845573425292969, 0.2963409423828125, 0.3081245422363281, 0.31990814208984375, 0.3316917419433594, 0.343475341796875, 0.3552589416503906, 0.36704254150390625, 0.3788261413574219, 0.3906097412109375, 0.4023933410644531, 0.41417694091796875, 0.4259605407714844, 0.437744140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 5.0, 7.0, 10.0, 10.0, 26.0, 73.0, 139.0, 230.0, 212.0, 111.0, 52.0, 35.0, 24.0, 12.0, 10.0, 7.0, 5.0, 4.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033721923828125, -0.03242349624633789, -0.03112506866455078, -0.029826641082763672, -0.028528213500976562, -0.027229785919189453, -0.025931358337402344, -0.024632930755615234, -0.023334503173828125, -0.022036075592041016, -0.020737648010253906, -0.019439220428466797, -0.018140792846679688, -0.016842365264892578, -0.015543937683105469, -0.01424551010131836, -0.01294708251953125, -0.01164865493774414, -0.010350227355957031, -0.009051799774169922, -0.0077533721923828125, -0.006454944610595703, -0.005156517028808594, -0.0038580894470214844, -0.002559661865234375, -0.0012612342834472656, 3.719329833984375e-05, 0.0013356208801269531, 0.0026340484619140625, 0.003932476043701172, 0.005230903625488281, 0.006529331207275391, 0.0078277587890625, 0.00912618637084961, 0.010424613952636719, 0.011723041534423828, 0.013021469116210938, 0.014319896697998047, 0.015618324279785156, 0.016916751861572266, 0.018215179443359375, 0.019513607025146484, 0.020812034606933594, 0.022110462188720703, 0.023408889770507812, 0.024707317352294922, 0.02600574493408203, 0.02730417251586914, 0.02860260009765625, 0.02990102767944336, 0.03119945526123047, 0.03249788284301758, 0.03379631042480469, 0.0350947380065918, 0.036393165588378906, 0.037691593170166016, 0.038990020751953125, 0.040288448333740234, 0.041586875915527344, 0.04288530349731445, 0.04418373107910156, 0.04548215866088867, 0.04678058624267578, 0.04807901382446289, 0.04937744140625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 20.0, 24.0, 48.0, 99.0, 226.0, 280.0, 165.0, 76.0, 20.0, 13.0, 6.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.267423152923584, -5.03119421005249, -4.7949652671813965, -4.558736324310303, -4.322507858276367, -4.086278915405273, -3.8500499725341797, -3.613821029663086, -3.377592086791992, -3.1413631439208984, -2.9051342010498047, -2.66890549659729, -2.4326765537261963, -2.1964476108551025, -1.9602187871932983, -1.7239899635314941, -1.4877610206604004, -1.2515320777893066, -1.0153032541275024, -0.7790743708610535, -0.5428454875946045, -0.30661654472351074, -0.07038772106170654, 0.16584110260009766, 0.4020700454711914, 0.6382989287376404, 0.8745278120040894, 1.1107566356658936, 1.3469855785369873, 1.583214521408081, 1.8194433450698853, 2.0556721687316895, 2.2919015884399414, 2.528130531311035, 2.764359474182129, 3.0005881786346436, 3.2368171215057373, 3.473046064376831, 3.7092747688293457, 3.9455037117004395, 4.181732654571533, 4.417961597442627, 4.654190540313721, 4.8904194831848145, 5.12664794921875, 5.362876892089844, 5.5991058349609375, 5.835334777832031, 6.071563720703125, 6.307792663574219, 6.5440216064453125, 6.780250549316406, 7.0164794921875, 7.252708435058594, 7.488936901092529, 7.725165843963623, 7.961394786834717, 8.197623252868652, 8.433852195739746, 8.67008113861084, 8.906310081481934, 9.142539024353027, 9.378767967224121, 9.614996910095215, 9.851225852966309]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 12.0, 17.0, 23.0, 31.0, 56.0, 55.0, 89.0, 78.0, 93.0, 96.0, 84.0, 86.0, 64.0, 39.0, 50.0, 37.0, 28.0, 19.0, 10.0, 4.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2476322650909424, -2.131808280944824, -2.015984535217285, -1.900160551071167, -1.784336805343628, -1.6685128211975098, -1.5526889562606812, -1.4368650913238525, -1.321041226387024, -1.2052173614501953, -1.0893934965133667, -0.9735695719718933, -0.8577457070350647, -0.7419218420982361, -0.6260979175567627, -0.5102740526199341, -0.39445018768310547, -0.27862632274627686, -0.16280242800712585, -0.046978533267974854, 0.06884533166885376, 0.18466919660568237, 0.30049312114715576, 0.4163169860839844, 0.532140851020813, 0.6479647159576416, 0.7637885808944702, 0.8796125054359436, 0.9954363703727722, 1.111260175704956, 1.2270841598510742, 1.3429080247879028, 1.4587321281433105, 1.5745559930801392, 1.6903798580169678, 1.806203842163086, 1.922027587890625, 2.037851572036743, 2.1536755561828613, 2.2694993019104004, 2.3853230476379395, 2.5011470317840576, 2.6169707775115967, 2.732794761657715, 2.848618507385254, 2.964442491531372, 3.0802664756774902, 3.1960902214050293, 3.3119142055511475, 3.4277381896972656, 3.5435619354248047, 3.659385919570923, 3.775209665298462, 3.89103364944458, 4.006857395172119, 4.122681617736816, 4.2385053634643555, 4.3543291091918945, 4.470153331756592, 4.585977077484131, 4.70180082321167, 4.817624568939209, 4.933448791503906, 5.049272537231445, 5.165096282958984]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 7.0, 16.0, 30.0, 44.0, 89.0, 149.0, 341.0, 812.0, 2304.0, 8178.0, 39751.0, 381789.0, 547606.0, 52731.0, 10195.0, 2796.0, 950.0, 390.0, 167.0, 96.0, 39.0, 29.0, 16.0, 13.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-5.96484375, -5.83538818359375, -5.7059326171875, -5.57647705078125, -5.447021484375, -5.31756591796875, -5.1881103515625, -5.05865478515625, -4.92919921875, -4.79974365234375, -4.6702880859375, -4.54083251953125, -4.411376953125, -4.28192138671875, -4.1524658203125, -4.02301025390625, -3.8935546875, -3.76409912109375, -3.6346435546875, -3.50518798828125, -3.375732421875, -3.24627685546875, -3.1168212890625, -2.98736572265625, -2.85791015625, -2.72845458984375, -2.5989990234375, -2.46954345703125, -2.340087890625, -2.21063232421875, -2.0811767578125, -1.95172119140625, -1.822265625, -1.69281005859375, -1.5633544921875, -1.43389892578125, -1.304443359375, -1.17498779296875, -1.0455322265625, -0.91607666015625, -0.78662109375, -0.65716552734375, -0.5277099609375, -0.39825439453125, -0.268798828125, -0.13934326171875, -0.0098876953125, 0.11956787109375, 0.2490234375, 0.37847900390625, 0.5079345703125, 0.63739013671875, 0.766845703125, 0.89630126953125, 1.0257568359375, 1.15521240234375, 1.28466796875, 1.41412353515625, 1.5435791015625, 1.67303466796875, 1.802490234375, 1.93194580078125, 2.0614013671875, 2.19085693359375, 2.3203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 1.0, 3.0, 7.0, 3.0, 12.0, 9.0, 10.0, 25.0, 25.0, 43.0, 52.0, 76.0, 92.0, 102.0, 102.0, 83.0, 88.0, 69.0, 53.0, 57.0, 30.0, 13.0, 12.0, 8.0, 10.0, 4.0, 10.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7222900390625, -9.382080078125, -9.0418701171875, -8.70166015625, -8.3614501953125, -8.021240234375, -7.6810302734375, -7.3408203125, -7.0006103515625, -6.660400390625, -6.3201904296875, -5.97998046875, -5.6397705078125, -5.299560546875, -4.9593505859375, -4.619140625, -4.2789306640625, -3.938720703125, -3.5985107421875, -3.25830078125, -2.9180908203125, -2.577880859375, -2.2376708984375, -1.8974609375, -1.5572509765625, -1.217041015625, -0.8768310546875, -0.53662109375, -0.1964111328125, 0.143798828125, 0.4840087890625, 0.82421875, 1.1644287109375, 1.504638671875, 1.8448486328125, 2.18505859375, 2.5252685546875, 2.865478515625, 3.2056884765625, 3.5458984375, 3.8861083984375, 4.226318359375, 4.5665283203125, 4.90673828125, 5.2469482421875, 5.587158203125, 5.9273681640625, 6.267578125, 6.6077880859375, 6.947998046875, 7.2882080078125, 7.62841796875, 7.9686279296875, 8.308837890625, 8.6490478515625, 8.9892578125, 9.3294677734375, 9.669677734375, 10.0098876953125, 10.35009765625, 10.6903076171875, 11.030517578125, 11.3707275390625, 11.7109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 11.0, 11.0, 17.0, 14.0, 26.0, 33.0, 53.0, 57.0, 69.0, 83.0, 1025.0, 1046622.0, 162.0, 81.0, 76.0, 52.0, 41.0, 31.0, 31.0, 15.0, 11.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.6005859375, -37.076171875, -35.5517578125, -34.02734375, -32.5029296875, -30.978515625, -29.4541015625, -27.9296875, -26.4052734375, -24.880859375, -23.3564453125, -21.83203125, -20.3076171875, -18.783203125, -17.2587890625, -15.734375, -14.2099609375, -12.685546875, -11.1611328125, -9.63671875, -8.1123046875, -6.587890625, -5.0634765625, -3.5390625, -2.0146484375, -0.490234375, 1.0341796875, 2.55859375, 4.0830078125, 5.607421875, 7.1318359375, 8.65625, 10.1806640625, 11.705078125, 13.2294921875, 14.75390625, 16.2783203125, 17.802734375, 19.3271484375, 20.8515625, 22.3759765625, 23.900390625, 25.4248046875, 26.94921875, 28.4736328125, 29.998046875, 31.5224609375, 33.046875, 34.5712890625, 36.095703125, 37.6201171875, 39.14453125, 40.6689453125, 42.193359375, 43.7177734375, 45.2421875, 46.7666015625, 48.291015625, 49.8154296875, 51.33984375, 52.8642578125, 54.388671875, 55.9130859375, 57.4375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 12.0, 15.0, 16.0, 21.0, 26.0, 39.0, 49.0, 62.0, 69.0, 81.0, 75.0, 95.0, 86.0, 78.0, 66.0, 55.0, 40.0, 29.0, 25.0, 18.0, 11.0, 7.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.51708984375, -12.0185546875, -11.52001953125, -11.021484375, -10.52294921875, -10.0244140625, -9.52587890625, -9.02734375, -8.52880859375, -8.0302734375, -7.53173828125, -7.033203125, -6.53466796875, -6.0361328125, -5.53759765625, -5.0390625, -4.54052734375, -4.0419921875, -3.54345703125, -3.044921875, -2.54638671875, -2.0478515625, -1.54931640625, -1.05078125, -0.55224609375, -0.0537109375, 0.44482421875, 0.943359375, 1.44189453125, 1.9404296875, 2.43896484375, 2.9375, 3.43603515625, 3.9345703125, 4.43310546875, 4.931640625, 5.43017578125, 5.9287109375, 6.42724609375, 6.92578125, 7.42431640625, 7.9228515625, 8.42138671875, 8.919921875, 9.41845703125, 9.9169921875, 10.41552734375, 10.9140625, 11.41259765625, 11.9111328125, 12.40966796875, 12.908203125, 13.40673828125, 13.9052734375, 14.40380859375, 14.90234375, 15.40087890625, 15.8994140625, 16.39794921875, 16.896484375, 17.39501953125, 17.8935546875, 18.39208984375, 18.890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 13.0, 20.0, 27.0, 45.0, 67.0, 115.0, 238.0, 410.0, 841.0, 1913.0, 5195.0, 19647.0, 183552.0, 758571.0, 61296.0, 10586.0, 3301.0, 1320.0, 625.0, 328.0, 189.0, 85.0, 61.0, 31.0, 19.0, 20.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4267578125, -1.38116455078125, -1.3355712890625, -1.28997802734375, -1.244384765625, -1.19879150390625, -1.1531982421875, -1.10760498046875, -1.06201171875, -1.01641845703125, -0.9708251953125, -0.92523193359375, -0.879638671875, -0.83404541015625, -0.7884521484375, -0.74285888671875, -0.697265625, -0.65167236328125, -0.6060791015625, -0.56048583984375, -0.514892578125, -0.46929931640625, -0.4237060546875, -0.37811279296875, -0.33251953125, -0.28692626953125, -0.2413330078125, -0.19573974609375, -0.150146484375, -0.10455322265625, -0.0589599609375, -0.01336669921875, 0.0322265625, 0.07781982421875, 0.1234130859375, 0.16900634765625, 0.214599609375, 0.26019287109375, 0.3057861328125, 0.35137939453125, 0.39697265625, 0.44256591796875, 0.4881591796875, 0.53375244140625, 0.579345703125, 0.62493896484375, 0.6705322265625, 0.71612548828125, 0.76171875, 0.80731201171875, 0.8529052734375, 0.89849853515625, 0.944091796875, 0.98968505859375, 1.0352783203125, 1.08087158203125, 1.12646484375, 1.17205810546875, 1.2176513671875, 1.26324462890625, 1.308837890625, 1.35443115234375, 1.4000244140625, 1.44561767578125, 1.4912109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 12.0, 27.0, 37.0, 53.0, 75.0, 128.0, 174.0, 174.0, 108.0, 63.0, 36.0, 22.0, 20.0, 11.0, 12.0, 10.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003333091735839844, -0.00032399967312812805, -0.00031469017267227173, -0.0003053806722164154, -0.0002960711717605591, -0.00028676167130470276, -0.00027745217084884644, -0.0002681426703929901, -0.0002588331699371338, -0.00024952366948127747, -0.00024021416902542114, -0.00023090466856956482, -0.0002215951681137085, -0.00021228566765785217, -0.00020297616720199585, -0.00019366666674613953, -0.0001843571662902832, -0.00017504766583442688, -0.00016573816537857056, -0.00015642866492271423, -0.0001471191644668579, -0.0001378096640110016, -0.00012850016355514526, -0.00011919066309928894, -0.00010988116264343262, -0.0001005716621875763, -9.126216173171997e-05, -8.195266127586365e-05, -7.264316082000732e-05, -6.3333660364151e-05, -5.402415990829468e-05, -4.4714659452438354e-05, -3.540515899658203e-05, -2.6095658540725708e-05, -1.6786158084869385e-05, -7.4766576290130615e-06, 1.8328428268432617e-06, 1.1142343282699585e-05, 2.0451843738555908e-05, 2.976134419441223e-05, 3.9070844650268555e-05, 4.838034510612488e-05, 5.76898455619812e-05, 6.699934601783752e-05, 7.630884647369385e-05, 8.561834692955017e-05, 9.49278473854065e-05, 0.00010423734784126282, 0.00011354684829711914, 0.00012285634875297546, 0.0001321658492088318, 0.0001414753496646881, 0.00015078485012054443, 0.00016009435057640076, 0.00016940385103225708, 0.0001787133514881134, 0.00018802285194396973, 0.00019733235239982605, 0.00020664185285568237, 0.0002159513533115387, 0.00022526085376739502, 0.00023457035422325134, 0.00024387985467910767, 0.000253189355134964, 0.0002624988555908203]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 1.0, 3.0, 10.0, 8.0, 11.0, 16.0, 26.0, 38.0, 54.0, 86.0, 89.0, 132.0, 195.0, 420.0, 579.0, 1091.0, 2178.0, 4688.0, 11970.0, 40970.0, 268702.0, 600865.0, 83214.0, 19709.0, 6912.0, 2862.0, 1458.0, 820.0, 493.0, 325.0, 191.0, 127.0, 83.0, 76.0, 37.0, 38.0, 21.0, 14.0, 8.0, 16.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87451171875, -0.8445816040039062, -0.8146514892578125, -0.7847213745117188, -0.754791259765625, -0.7248611450195312, -0.6949310302734375, -0.6650009155273438, -0.63507080078125, -0.6051406860351562, -0.5752105712890625, -0.5452804565429688, -0.515350341796875, -0.48542022705078125, -0.4554901123046875, -0.42555999755859375, -0.3956298828125, -0.36569976806640625, -0.3357696533203125, -0.30583953857421875, -0.275909423828125, -0.24597930908203125, -0.2160491943359375, -0.18611907958984375, -0.15618896484375, -0.12625885009765625, -0.0963287353515625, -0.06639862060546875, -0.036468505859375, -0.00653839111328125, 0.0233917236328125, 0.05332183837890625, 0.083251953125, 0.11318206787109375, 0.1431121826171875, 0.17304229736328125, 0.202972412109375, 0.23290252685546875, 0.2628326416015625, 0.29276275634765625, 0.32269287109375, 0.35262298583984375, 0.3825531005859375, 0.41248321533203125, 0.442413330078125, 0.47234344482421875, 0.5022735595703125, 0.5322036743164062, 0.5621337890625, 0.5920639038085938, 0.6219940185546875, 0.6519241333007812, 0.681854248046875, 0.7117843627929688, 0.7417144775390625, 0.7716445922851562, 0.80157470703125, 0.8315048217773438, 0.8614349365234375, 0.8913650512695312, 0.921295166015625, 0.9512252807617188, 0.9811553955078125, 1.0110855102539062, 1.041015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 10.0, 10.0, 13.0, 12.0, 10.0, 32.0, 42.0, 55.0, 95.0, 138.0, 155.0, 122.0, 89.0, 62.0, 40.0, 30.0, 15.0, 15.0, 5.0, 7.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.48095703125, -0.46407318115234375, -0.4471893310546875, -0.43030548095703125, -0.413421630859375, -0.39653778076171875, -0.3796539306640625, -0.36277008056640625, -0.34588623046875, -0.32900238037109375, -0.3121185302734375, -0.29523468017578125, -0.278350830078125, -0.26146697998046875, -0.2445831298828125, -0.22769927978515625, -0.2108154296875, -0.19393157958984375, -0.1770477294921875, -0.16016387939453125, -0.143280029296875, -0.12639617919921875, -0.1095123291015625, -0.09262847900390625, -0.07574462890625, -0.05886077880859375, -0.0419769287109375, -0.02509307861328125, -0.008209228515625, 0.00867462158203125, 0.0255584716796875, 0.04244232177734375, 0.059326171875, 0.07621002197265625, 0.0930938720703125, 0.10997772216796875, 0.126861572265625, 0.14374542236328125, 0.1606292724609375, 0.17751312255859375, 0.19439697265625, 0.21128082275390625, 0.2281646728515625, 0.24504852294921875, 0.261932373046875, 0.27881622314453125, 0.2957000732421875, 0.31258392333984375, 0.3294677734375, 0.34635162353515625, 0.3632354736328125, 0.38011932373046875, 0.397003173828125, 0.41388702392578125, 0.4307708740234375, 0.44765472412109375, 0.46453857421875, 0.48142242431640625, 0.4983062744140625, 0.5151901245117188, 0.532073974609375, 0.5489578247070312, 0.5658416748046875, 0.5827255249023438, 0.599609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 2.0, 13.0, 62.0, 550.0, 346.0, 25.0, 12.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.294604301452637, -5.796622276306152, -4.298640251159668, -2.800658702850342, -1.3026766777038574, 0.19530534744262695, 1.6932868957519531, 3.1912689208984375, 4.689250946044922, 6.187232971191406, 7.685214996337891, 9.183197021484375, 10.68117904663086, 12.179161071777344, 13.677142143249512, 15.175124168395996, 16.673107147216797, 18.17108917236328, 19.669071197509766, 21.16705322265625, 22.665035247802734, 24.16301727294922, 25.660999298095703, 27.158981323242188, 28.65696144104004, 30.154943466186523, 31.652925491333008, 33.15090560913086, 34.648887634277344, 36.14686965942383, 37.64485168457031, 39.1428337097168, 40.64081954956055, 42.13880157470703, 43.636783599853516, 45.134765625, 46.632747650146484, 48.13072967529297, 49.62871170043945, 51.12669372558594, 52.62467575073242, 54.122657775878906, 55.62063980102539, 57.118621826171875, 58.61660385131836, 60.114585876464844, 61.61256790161133, 63.11054992675781, 64.60852813720703, 66.10650634765625, 67.6044921875, 69.10247039794922, 70.60045623779297, 72.09843444824219, 73.59642028808594, 75.09439849853516, 76.5923843383789, 78.09036254882812, 79.58834838867188, 81.0863265991211, 82.58431243896484, 84.08229064941406, 85.58027648925781, 87.07825469970703, 88.57624053955078]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 6.0, 10.0, 15.0, 12.0, 13.0, 15.0, 25.0, 29.0, 29.0, 44.0, 45.0, 42.0, 53.0, 53.0, 48.0, 63.0, 52.0, 60.0, 50.0, 49.0, 54.0, 30.0, 29.0, 25.0, 25.0, 29.0, 20.0, 15.0, 13.0, 9.0, 11.0, 8.0, 6.0, 7.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.368558883666992, -14.87496280670166, -14.381367683410645, -13.887771606445312, -13.39417552947998, -12.900579452514648, -12.406984329223633, -11.9133882522583, -11.419792175292969, -10.926196098327637, -10.432600975036621, -9.939004898071289, -9.445408821105957, -8.951812744140625, -8.45821762084961, -7.964621543884277, -7.471026420593262, -6.977430820465088, -6.483834743499756, -5.990239143371582, -5.49664306640625, -5.003047466278076, -4.509451866149902, -4.01585578918457, -3.5222601890563965, -3.0286643505096436, -2.5350685119628906, -2.041472911834717, -1.5478770732879639, -1.054281234741211, -0.5606856346130371, -0.06708979606628418, 0.42650604248046875, 0.9201018214225769, 1.413697600364685, 1.9072933197021484, 2.4008891582489014, 2.8944849967956543, 3.388080596923828, 3.881676435470581, 4.375272274017334, 4.868867874145508, 5.36246395111084, 5.856059551239014, 6.3496551513671875, 6.8432512283325195, 7.336846828460693, 7.830442428588867, 8.3240385055542, 8.817634582519531, 9.311229705810547, 9.804825782775879, 10.298421859741211, 10.792016983032227, 11.285613059997559, 11.77920913696289, 12.272804260253906, 12.766400337219238, 13.259995460510254, 13.753591537475586, 14.247187614440918, 14.74078369140625, 15.234378814697266, 15.727974891662598, 16.22157096862793]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 10.0, 9.0, 12.0, 10.0, 20.0, 14.0, 28.0, 29.0, 51.0, 65.0, 94.0, 211.0, 557.0, 1965.0, 9098.0, 74803.0, 3130707.0, 929834.0, 38558.0, 5811.0, 1410.0, 467.0, 189.0, 91.0, 49.0, 28.0, 30.0, 27.0, 16.0, 21.0, 21.0, 4.0, 9.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.43359375, -7.214111328125, -6.99462890625, -6.775146484375, -6.5556640625, -6.336181640625, -6.11669921875, -5.897216796875, -5.677734375, -5.458251953125, -5.23876953125, -5.019287109375, -4.7998046875, -4.580322265625, -4.36083984375, -4.141357421875, -3.921875, -3.702392578125, -3.48291015625, -3.263427734375, -3.0439453125, -2.824462890625, -2.60498046875, -2.385498046875, -2.166015625, -1.946533203125, -1.72705078125, -1.507568359375, -1.2880859375, -1.068603515625, -0.84912109375, -0.629638671875, -0.41015625, -0.190673828125, 0.02880859375, 0.248291015625, 0.4677734375, 0.687255859375, 0.90673828125, 1.126220703125, 1.345703125, 1.565185546875, 1.78466796875, 2.004150390625, 2.2236328125, 2.443115234375, 2.66259765625, 2.882080078125, 3.1015625, 3.321044921875, 3.54052734375, 3.760009765625, 3.9794921875, 4.198974609375, 4.41845703125, 4.637939453125, 4.857421875, 5.076904296875, 5.29638671875, 5.515869140625, 5.7353515625, 5.954833984375, 6.17431640625, 6.393798828125, 6.61328125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 5.0, 10.0, 10.0, 19.0, 26.0, 32.0, 42.0, 38.0, 62.0, 66.0, 76.0, 87.0, 87.0, 77.0, 72.0, 58.0, 36.0, 39.0, 37.0, 25.0, 23.0, 17.0, 18.0, 2.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.23651123046875, -3.1214599609375, -3.00640869140625, -2.891357421875, -2.77630615234375, -2.6612548828125, -2.54620361328125, -2.43115234375, -2.31610107421875, -2.2010498046875, -2.08599853515625, -1.970947265625, -1.85589599609375, -1.7408447265625, -1.62579345703125, -1.5107421875, -1.39569091796875, -1.2806396484375, -1.16558837890625, -1.050537109375, -0.93548583984375, -0.8204345703125, -0.70538330078125, -0.59033203125, -0.47528076171875, -0.3602294921875, -0.24517822265625, -0.130126953125, -0.01507568359375, 0.0999755859375, 0.21502685546875, 0.330078125, 0.44512939453125, 0.5601806640625, 0.67523193359375, 0.790283203125, 0.90533447265625, 1.0203857421875, 1.13543701171875, 1.25048828125, 1.36553955078125, 1.4805908203125, 1.59564208984375, 1.710693359375, 1.82574462890625, 1.9407958984375, 2.05584716796875, 2.1708984375, 2.28594970703125, 2.4010009765625, 2.51605224609375, 2.631103515625, 2.74615478515625, 2.8612060546875, 2.97625732421875, 3.09130859375, 3.20635986328125, 3.3214111328125, 3.43646240234375, 3.551513671875, 3.66656494140625, 3.7816162109375, 3.89666748046875, 4.01171875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 12.0, 15.0, 14.0, 38.0, 56.0, 134.0, 371.0, 2247.0, 138354.0, 4043426.0, 8529.0, 726.0, 198.0, 87.0, 35.0, 20.0, 11.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -11.8704833984375, -11.311279296875, -10.7520751953125, -10.19287109375, -9.6336669921875, -9.074462890625, -8.5152587890625, -7.9560546875, -7.3968505859375, -6.837646484375, -6.2784423828125, -5.71923828125, -5.1600341796875, -4.600830078125, -4.0416259765625, -3.482421875, -2.9232177734375, -2.364013671875, -1.8048095703125, -1.24560546875, -0.6864013671875, -0.127197265625, 0.4320068359375, 0.9912109375, 1.5504150390625, 2.109619140625, 2.6688232421875, 3.22802734375, 3.7872314453125, 4.346435546875, 4.9056396484375, 5.46484375, 6.0240478515625, 6.583251953125, 7.1424560546875, 7.70166015625, 8.2608642578125, 8.820068359375, 9.3792724609375, 9.9384765625, 10.4976806640625, 11.056884765625, 11.6160888671875, 12.17529296875, 12.7344970703125, 13.293701171875, 13.8529052734375, 14.412109375, 14.9713134765625, 15.530517578125, 16.0897216796875, 16.64892578125, 17.2081298828125, 17.767333984375, 18.3265380859375, 18.8857421875, 19.4449462890625, 20.004150390625, 20.5633544921875, 21.12255859375, 21.6817626953125, 22.240966796875, 22.8001708984375, 23.359375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 7.0, 11.0, 7.0, 7.0, 10.0, 20.0, 23.0, 30.0, 43.0, 63.0, 79.0, 94.0, 119.0, 199.0, 249.0, 477.0, 869.0, 562.0, 339.0, 241.0, 139.0, 113.0, 96.0, 49.0, 56.0, 38.0, 25.0, 20.0, 12.0, 22.0, 8.0, 8.0, 6.0, 6.0, 9.0, 4.0, 1.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.947265625, -0.9182586669921875, -0.889251708984375, -0.8602447509765625, -0.83123779296875, -0.8022308349609375, -0.773223876953125, -0.7442169189453125, -0.7152099609375, -0.6862030029296875, -0.657196044921875, -0.6281890869140625, -0.59918212890625, -0.5701751708984375, -0.541168212890625, -0.5121612548828125, -0.483154296875, -0.4541473388671875, -0.425140380859375, -0.3961334228515625, -0.36712646484375, -0.3381195068359375, -0.309112548828125, -0.2801055908203125, -0.2510986328125, -0.2220916748046875, -0.193084716796875, -0.1640777587890625, -0.13507080078125, -0.1060638427734375, -0.077056884765625, -0.0480499267578125, -0.01904296875, 0.0099639892578125, 0.038970947265625, 0.0679779052734375, 0.09698486328125, 0.1259918212890625, 0.154998779296875, 0.1840057373046875, 0.2130126953125, 0.2420196533203125, 0.271026611328125, 0.3000335693359375, 0.32904052734375, 0.3580474853515625, 0.387054443359375, 0.4160614013671875, 0.445068359375, 0.4740753173828125, 0.503082275390625, 0.5320892333984375, 0.56109619140625, 0.5901031494140625, 0.619110107421875, 0.6481170654296875, 0.6771240234375, 0.7061309814453125, 0.735137939453125, 0.7641448974609375, 0.79315185546875, 0.8221588134765625, 0.851165771484375, 0.8801727294921875, 0.9091796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 20.0, 32.0, 38.0, 65.0, 121.0, 167.0, 169.0, 143.0, 83.0, 46.0, 29.0, 17.0, 10.0, 8.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3941330909729, -6.1747026443481445, -5.955272197723389, -5.735841751098633, -5.516411781311035, -5.296980857849121, -5.077550888061523, -4.858120441436768, -4.638689994812012, -4.419259548187256, -4.1998291015625, -3.9803988933563232, -3.7609684467315674, -3.5415380001068115, -3.3221077919006348, -3.102677345275879, -2.883246898651123, -2.663816452026367, -2.4443860054016113, -2.2249557971954346, -2.0055253505706787, -1.7860949039459229, -1.5666645765304565, -1.3472342491149902, -1.1278038024902344, -0.9083734154701233, -0.6889430284500122, -0.4695126414299011, -0.25008225440979004, -0.03065180778503418, 0.18877851963043213, 0.40820884704589844, 0.6276388168334961, 0.8470692038536072, 1.0664995908737183, 1.2859299182891846, 1.5053603649139404, 1.7247908115386963, 1.9442211389541626, 2.163651466369629, 2.3830819129943848, 2.6025123596191406, 2.8219428062438965, 3.0413730144500732, 3.260803461074829, 3.480233907699585, 3.6996641159057617, 3.9190945625305176, 4.138525009155273, 4.357955455780029, 4.577385902404785, 4.796816349029541, 5.016246795654297, 5.2356767654418945, 5.45510721206665, 5.674537658691406, 5.893968105316162, 6.113398551940918, 6.332828998565674, 6.55225944519043, 6.771689414978027, 6.991120338439941, 7.210550308227539, 7.429980754852295, 7.649411201477051]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 10.0, 11.0, 21.0, 13.0, 16.0, 28.0, 37.0, 43.0, 40.0, 47.0, 63.0, 62.0, 75.0, 58.0, 59.0, 81.0, 45.0, 44.0, 45.0, 37.0, 26.0, 19.0, 31.0, 18.0, 17.0, 5.0, 13.0, 6.0, 8.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603375196456909, -3.491175413131714, -3.3789753913879395, -3.266775608062744, -3.154575824737549, -3.0423760414123535, -2.930176019668579, -2.817976236343384, -2.7057762145996094, -2.593576431274414, -2.4813764095306396, -2.3691766262054443, -2.256976842880249, -2.1447768211364746, -2.0325770378112793, -1.920377254486084, -1.8081774711608887, -1.6959775686264038, -1.5837777853012085, -1.4715778827667236, -1.3593780994415283, -1.2471781969070435, -1.1349782943725586, -1.0227785110473633, -0.9105786085128784, -0.7983787655830383, -0.6861789226531982, -0.5739790201187134, -0.4617791771888733, -0.3495793342590332, -0.23737943172454834, -0.12517958879470825, -0.012979984283447266, 0.09921987354755402, 0.2114197313785553, 0.3236196041107178, 0.43581944704055786, 0.548019289970398, 0.6602191925048828, 0.7724190354347229, 0.884618878364563, 0.9968187212944031, 1.1090185642242432, 1.221218466758728, 1.333418369293213, 1.4456181526184082, 1.557818055152893, 1.670017957687378, 1.7822177410125732, 1.894417643547058, 2.006617546081543, 2.1188173294067383, 2.2310171127319336, 2.343216896057129, 2.4554169178009033, 2.5676167011260986, 2.679816722869873, 2.7920165061950684, 2.9042165279388428, 3.016416311264038, 3.1286160945892334, 3.240816116333008, 3.353015899658203, 3.4652156829833984, 3.5774154663085938]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 11.0, 8.0, 15.0, 27.0, 33.0, 38.0, 80.0, 101.0, 213.0, 403.0, 1007.0, 3744.0, 31973.0, 891246.0, 110145.0, 6745.0, 1528.0, 584.0, 240.0, 133.0, 97.0, 54.0, 26.0, 32.0, 16.0, 8.0, 10.0, 10.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.880859375, -0.8554534912109375, -0.830047607421875, -0.8046417236328125, -0.77923583984375, -0.7538299560546875, -0.728424072265625, -0.7030181884765625, -0.6776123046875, -0.6522064208984375, -0.626800537109375, -0.6013946533203125, -0.57598876953125, -0.5505828857421875, -0.525177001953125, -0.4997711181640625, -0.474365234375, -0.4489593505859375, -0.423553466796875, -0.3981475830078125, -0.37274169921875, -0.3473358154296875, -0.321929931640625, -0.2965240478515625, -0.2711181640625, -0.2457122802734375, -0.220306396484375, -0.1949005126953125, -0.16949462890625, -0.1440887451171875, -0.118682861328125, -0.0932769775390625, -0.06787109375, -0.0424652099609375, -0.017059326171875, 0.0083465576171875, 0.03375244140625, 0.0591583251953125, 0.084564208984375, 0.1099700927734375, 0.1353759765625, 0.1607818603515625, 0.186187744140625, 0.2115936279296875, 0.23699951171875, 0.2624053955078125, 0.287811279296875, 0.3132171630859375, 0.338623046875, 0.3640289306640625, 0.389434814453125, 0.4148406982421875, 0.44024658203125, 0.4656524658203125, 0.491058349609375, 0.5164642333984375, 0.5418701171875, 0.5672760009765625, 0.592681884765625, 0.6180877685546875, 0.64349365234375, 0.6688995361328125, 0.694305419921875, 0.7197113037109375, 0.7451171875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 1.0, 9.0, 6.0, 10.0, 11.0, 13.0, 20.0, 18.0, 35.0, 45.0, 49.0, 64.0, 61.0, 71.0, 84.0, 74.0, 83.0, 70.0, 58.0, 40.0, 31.0, 36.0, 16.0, 19.0, 17.0, 15.0, 5.0, 9.0, 11.0, 9.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.943359375, -2.859344482421875, -2.77532958984375, -2.691314697265625, -2.6072998046875, -2.523284912109375, -2.43927001953125, -2.355255126953125, -2.271240234375, -2.187225341796875, -2.10321044921875, -2.019195556640625, -1.9351806640625, -1.851165771484375, -1.76715087890625, -1.683135986328125, -1.59912109375, -1.515106201171875, -1.43109130859375, -1.347076416015625, -1.2630615234375, -1.179046630859375, -1.09503173828125, -1.011016845703125, -0.927001953125, -0.842987060546875, -0.75897216796875, -0.674957275390625, -0.5909423828125, -0.506927490234375, -0.42291259765625, -0.338897705078125, -0.2548828125, -0.170867919921875, -0.08685302734375, -0.002838134765625, 0.0811767578125, 0.165191650390625, 0.24920654296875, 0.333221435546875, 0.417236328125, 0.501251220703125, 0.58526611328125, 0.669281005859375, 0.7532958984375, 0.837310791015625, 0.92132568359375, 1.005340576171875, 1.08935546875, 1.173370361328125, 1.25738525390625, 1.341400146484375, 1.4254150390625, 1.509429931640625, 1.59344482421875, 1.677459716796875, 1.761474609375, 1.845489501953125, 1.92950439453125, 2.013519287109375, 2.0975341796875, 2.181549072265625, 2.26556396484375, 2.349578857421875, 2.43359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 8.0, 3.0, 19.0, 13.0, 20.0, 20.0, 21.0, 42.0, 36.0, 67.0, 70.0, 117.0, 134.0, 206.0, 303.0, 474.0, 1051.0, 4249.0, 50528.0, 670979.0, 299079.0, 17123.0, 2071.0, 679.0, 412.0, 212.0, 155.0, 140.0, 80.0, 57.0, 42.0, 40.0, 36.0, 19.0, 13.0, 14.0, 7.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3560905456542969, -0.34523773193359375, -0.3343849182128906, -0.3235321044921875, -0.3126792907714844, -0.30182647705078125, -0.2909736633300781, -0.280120849609375, -0.2692680358886719, -0.25841522216796875, -0.24756240844726562, -0.2367095947265625, -0.22585678100585938, -0.21500396728515625, -0.20415115356445312, -0.19329833984375, -0.18244552612304688, -0.17159271240234375, -0.16073989868164062, -0.1498870849609375, -0.13903427124023438, -0.12818145751953125, -0.11732864379882812, -0.106475830078125, -0.09562301635742188, -0.08477020263671875, -0.07391738891601562, -0.0630645751953125, -0.052211761474609375, -0.04135894775390625, -0.030506134033203125, -0.0196533203125, -0.008800506591796875, 0.00205230712890625, 0.012905120849609375, 0.0237579345703125, 0.034610748291015625, 0.04546356201171875, 0.056316375732421875, 0.067169189453125, 0.07802200317382812, 0.08887481689453125, 0.09972763061523438, 0.1105804443359375, 0.12143325805664062, 0.13228607177734375, 0.14313888549804688, 0.15399169921875, 0.16484451293945312, 0.17569732666015625, 0.18655014038085938, 0.1974029541015625, 0.20825576782226562, 0.21910858154296875, 0.22996139526367188, 0.240814208984375, 0.2516670227050781, 0.26251983642578125, 0.2733726501464844, 0.2842254638671875, 0.2950782775878906, 0.30593109130859375, 0.3167839050292969, 0.32763671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 9.0, 8.0, 13.0, 12.0, 20.0, 19.0, 17.0, 14.0, 29.0, 38.0, 27.0, 46.0, 52.0, 41.0, 38.0, 56.0, 54.0, 48.0, 42.0, 50.0, 51.0, 41.0, 34.0, 35.0, 23.0, 36.0, 15.0, 22.0, 17.0, 10.0, 16.0, 12.0, 9.0, 10.0, 6.0, 9.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.829620361328125, -2.72955322265625, -2.629486083984375, -2.5294189453125, -2.429351806640625, -2.32928466796875, -2.229217529296875, -2.129150390625, -2.029083251953125, -1.92901611328125, -1.828948974609375, -1.7288818359375, -1.628814697265625, -1.52874755859375, -1.428680419921875, -1.32861328125, -1.228546142578125, -1.12847900390625, -1.028411865234375, -0.9283447265625, -0.828277587890625, -0.72821044921875, -0.628143310546875, -0.528076171875, -0.428009033203125, -0.32794189453125, -0.227874755859375, -0.1278076171875, -0.027740478515625, 0.07232666015625, 0.172393798828125, 0.2724609375, 0.372528076171875, 0.47259521484375, 0.572662353515625, 0.6727294921875, 0.772796630859375, 0.87286376953125, 0.972930908203125, 1.072998046875, 1.173065185546875, 1.27313232421875, 1.373199462890625, 1.4732666015625, 1.573333740234375, 1.67340087890625, 1.773468017578125, 1.87353515625, 1.973602294921875, 2.07366943359375, 2.173736572265625, 2.2738037109375, 2.373870849609375, 2.47393798828125, 2.574005126953125, 2.674072265625, 2.774139404296875, 2.87420654296875, 2.974273681640625, 3.0743408203125, 3.174407958984375, 3.27447509765625, 3.374542236328125, 3.474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 4.0, 4.0, 8.0, 13.0, 14.0, 26.0, 32.0, 42.0, 61.0, 76.0, 112.0, 200.0, 296.0, 403.0, 748.0, 2201.0, 22135.0, 919001.0, 96223.0, 4395.0, 1047.0, 489.0, 313.0, 222.0, 137.0, 85.0, 73.0, 42.0, 41.0, 14.0, 19.0, 17.0, 11.0, 9.0, 5.0, 9.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1029052734375, -0.09985065460205078, -0.09679603576660156, -0.09374141693115234, -0.09068679809570312, -0.0876321792602539, -0.08457756042480469, -0.08152294158935547, -0.07846832275390625, -0.07541370391845703, -0.07235908508300781, -0.0693044662475586, -0.06624984741210938, -0.06319522857666016, -0.06014060974121094, -0.05708599090576172, -0.0540313720703125, -0.05097675323486328, -0.04792213439941406, -0.044867515563964844, -0.041812896728515625, -0.038758277893066406, -0.03570365905761719, -0.03264904022216797, -0.02959442138671875, -0.02653980255126953, -0.023485183715820312, -0.020430564880371094, -0.017375946044921875, -0.014321327209472656, -0.011266708374023438, -0.008212089538574219, -0.005157470703125, -0.0021028518676757812, 0.0009517669677734375, 0.004006385803222656, 0.007061004638671875, 0.010115623474121094, 0.013170242309570312, 0.01622486114501953, 0.01927947998046875, 0.02233409881591797, 0.025388717651367188, 0.028443336486816406, 0.031497955322265625, 0.034552574157714844, 0.03760719299316406, 0.04066181182861328, 0.0437164306640625, 0.04677104949951172, 0.04982566833496094, 0.052880287170410156, 0.055934906005859375, 0.058989524841308594, 0.06204414367675781, 0.06509876251220703, 0.06815338134765625, 0.07120800018310547, 0.07426261901855469, 0.0773172378540039, 0.08037185668945312, 0.08342647552490234, 0.08648109436035156, 0.08953571319580078, 0.09259033203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 6.0, 8.0, 9.0, 19.0, 18.0, 22.0, 24.0, 45.0, 51.0, 48.0, 55.0, 72.0, 51.0, 81.0, 72.0, 82.0, 67.0, 49.0, 39.0, 36.0, 28.0, 25.0, 14.0, 15.0, 10.0, 10.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.0100345611572266e-05, -2.91457399725914e-05, -2.8191134333610535e-05, -2.723652869462967e-05, -2.6281923055648804e-05, -2.5327317416667938e-05, -2.4372711777687073e-05, -2.3418106138706207e-05, -2.2463500499725342e-05, -2.1508894860744476e-05, -2.055428922176361e-05, -1.9599683582782745e-05, -1.864507794380188e-05, -1.7690472304821014e-05, -1.673586666584015e-05, -1.5781261026859283e-05, -1.4826655387878418e-05, -1.3872049748897552e-05, -1.2917444109916687e-05, -1.1962838470935822e-05, -1.1008232831954956e-05, -1.005362719297409e-05, -9.099021553993225e-06, -8.14441591501236e-06, -7.189810276031494e-06, -6.235204637050629e-06, -5.280598998069763e-06, -4.325993359088898e-06, -3.3713877201080322e-06, -2.4167820811271667e-06, -1.4621764421463013e-06, -5.075708031654358e-07, 4.470348358154297e-07, 1.4016404747962952e-06, 2.3562461137771606e-06, 3.310851752758026e-06, 4.265457391738892e-06, 5.220063030719757e-06, 6.1746686697006226e-06, 7.129274308681488e-06, 8.083879947662354e-06, 9.038485586643219e-06, 9.993091225624084e-06, 1.094769686460495e-05, 1.1902302503585815e-05, 1.2856908142566681e-05, 1.3811513781547546e-05, 1.4766119420528412e-05, 1.5720725059509277e-05, 1.6675330698490143e-05, 1.7629936337471008e-05, 1.8584541976451874e-05, 1.953914761543274e-05, 2.0493753254413605e-05, 2.144835889339447e-05, 2.2402964532375336e-05, 2.33575701713562e-05, 2.4312175810337067e-05, 2.5266781449317932e-05, 2.6221387088298798e-05, 2.7175992727279663e-05, 2.813059836626053e-05, 2.9085204005241394e-05, 3.003980964422226e-05, 3.0994415283203125e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 10.0, 14.0, 26.0, 29.0, 51.0, 66.0, 105.0, 211.0, 356.0, 689.0, 1360.0, 2991.0, 6733.0, 20230.0, 94340.0, 735109.0, 144824.0, 26425.0, 8222.0, 3361.0, 1622.0, 772.0, 401.0, 241.0, 127.0, 85.0, 54.0, 30.0, 24.0, 12.0, 8.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07470703125, -0.0723428726196289, -0.06997871398925781, -0.06761455535888672, -0.06525039672851562, -0.06288623809814453, -0.06052207946777344, -0.058157920837402344, -0.05579376220703125, -0.053429603576660156, -0.05106544494628906, -0.04870128631591797, -0.046337127685546875, -0.04397296905517578, -0.04160881042480469, -0.039244651794433594, -0.0368804931640625, -0.034516334533691406, -0.03215217590332031, -0.02978801727294922, -0.027423858642578125, -0.02505970001220703, -0.022695541381835938, -0.020331382751464844, -0.01796722412109375, -0.015603065490722656, -0.013238906860351562, -0.010874748229980469, -0.008510589599609375, -0.006146430969238281, -0.0037822723388671875, -0.0014181137084960938, 0.000946044921875, 0.0033102035522460938, 0.0056743621826171875, 0.008038520812988281, 0.010402679443359375, 0.012766838073730469, 0.015130996704101562, 0.017495155334472656, 0.01985931396484375, 0.022223472595214844, 0.024587631225585938, 0.02695178985595703, 0.029315948486328125, 0.03168010711669922, 0.03404426574707031, 0.036408424377441406, 0.0387725830078125, 0.041136741638183594, 0.04350090026855469, 0.04586505889892578, 0.048229217529296875, 0.05059337615966797, 0.05295753479003906, 0.055321693420410156, 0.05768585205078125, 0.060050010681152344, 0.06241416931152344, 0.06477832794189453, 0.06714248657226562, 0.06950664520263672, 0.07187080383300781, 0.0742349624633789, 0.07659912109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 9.0, 7.0, 14.0, 25.0, 34.0, 63.0, 55.0, 122.0, 131.0, 161.0, 120.0, 92.0, 42.0, 35.0, 18.0, 17.0, 14.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0170440673828125, -0.01657402515411377, -0.01610398292541504, -0.01563394069671631, -0.015163898468017578, -0.014693856239318848, -0.014223814010620117, -0.013753771781921387, -0.013283729553222656, -0.012813687324523926, -0.012343645095825195, -0.011873602867126465, -0.011403560638427734, -0.010933518409729004, -0.010463476181030273, -0.009993433952331543, -0.009523391723632812, -0.009053349494934082, -0.008583307266235352, -0.008113265037536621, -0.007643222808837891, -0.00717318058013916, -0.00670313835144043, -0.006233096122741699, -0.005763053894042969, -0.005293011665344238, -0.004822969436645508, -0.004352927207946777, -0.003882884979248047, -0.0034128427505493164, -0.002942800521850586, -0.0024727582931518555, -0.002002716064453125, -0.0015326738357543945, -0.001062631607055664, -0.0005925893783569336, -0.00012254714965820312, 0.00034749507904052734, 0.0008175373077392578, 0.0012875795364379883, 0.0017576217651367188, 0.0022276639938354492, 0.0026977062225341797, 0.00316774845123291, 0.0036377906799316406, 0.004107832908630371, 0.0045778751373291016, 0.005047917366027832, 0.0055179595947265625, 0.005988001823425293, 0.0064580440521240234, 0.006928086280822754, 0.007398128509521484, 0.007868170738220215, 0.008338212966918945, 0.008808255195617676, 0.009278297424316406, 0.009748339653015137, 0.010218381881713867, 0.010688424110412598, 0.011158466339111328, 0.011628508567810059, 0.012098550796508789, 0.01256859302520752, 0.01303863525390625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 17.0, 11.0, 27.0, 46.0, 82.0, 155.0, 204.0, 188.0, 119.0, 56.0, 30.0, 14.0, 16.0, 5.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.912944793701172, -4.7478413581848145, -4.582737922668457, -4.4176344871521, -4.252531051635742, -4.087428092956543, -3.9223246574401855, -3.757221221923828, -3.5921177864074707, -3.4270143508911133, -3.261910915374756, -3.0968077182769775, -2.93170428276062, -2.7666008472442627, -2.6014976501464844, -2.436394214630127, -2.2712907791137695, -2.106187343597412, -1.9410840272903442, -1.7759807109832764, -1.610877275466919, -1.4457738399505615, -1.2806705236434937, -1.1155672073364258, -0.9504637718200684, -0.7853603959083557, -0.6202570199966431, -0.4551536440849304, -0.2900502681732178, -0.12494689226150513, 0.04015648365020752, 0.2052597999572754, 0.3703627586364746, 0.5354661345481873, 0.7005695104598999, 0.8656728863716125, 1.0307762622833252, 1.1958796977996826, 1.3609830141067505, 1.5260863304138184, 1.6911897659301758, 1.8562932014465332, 2.0213966369628906, 2.186499834060669, 2.3516032695770264, 2.516706705093384, 2.681809902191162, 2.8469133377075195, 3.012016773223877, 3.1771202087402344, 3.342223644256592, 3.50732684135437, 3.6724302768707275, 3.837533712387085, 4.002636909484863, 4.167740345001221, 4.332843780517578, 4.4979472160339355, 4.663050651550293, 4.82815408706665, 4.993257522583008, 5.158360481262207, 5.3234639167785645, 5.488567352294922, 5.653670787811279]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 9.0, 8.0, 14.0, 13.0, 15.0, 19.0, 27.0, 40.0, 44.0, 47.0, 66.0, 58.0, 83.0, 81.0, 77.0, 76.0, 60.0, 33.0, 49.0, 38.0, 24.0, 21.0, 23.0, 12.0, 14.0, 12.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.5324127674102783, -2.454846143722534, -2.377279281616211, -2.299712657928467, -2.2221457958221436, -2.1445791721343994, -2.067012310028076, -1.989445686340332, -1.9118789434432983, -1.8343122005462646, -1.756745457649231, -1.6791787147521973, -1.6016120910644531, -1.5240452289581299, -1.4464786052703857, -1.368911862373352, -1.2913451194763184, -1.2137783765792847, -1.136211633682251, -1.0586448907852173, -0.9810782074928284, -0.9035114645957947, -0.8259447813034058, -0.7483780384063721, -0.6708112955093384, -0.5932445526123047, -0.515677809715271, -0.4381111264228821, -0.3605443835258484, -0.2829776406288147, -0.2054109275341034, -0.1278442144393921, -0.0502774715423584, 0.0272892564535141, 0.1048559844493866, 0.1824227124452591, 0.2599894404411316, 0.3375561833381653, 0.4151228964328766, 0.4926896095275879, 0.5702563524246216, 0.6478230953216553, 0.725389838218689, 0.8029565215110779, 0.8805232644081116, 0.9580900073051453, 1.0356566905975342, 1.1132234334945679, 1.1907901763916016, 1.2683569192886353, 1.345923662185669, 1.4234904050827026, 1.5010571479797363, 1.5786237716674805, 1.6561905145645142, 1.7337572574615479, 1.8113240003585815, 1.8888907432556152, 1.966457486152649, 2.0440242290496826, 2.1215908527374268, 2.19915771484375, 2.276724338531494, 2.3542909622192383, 2.4318578243255615]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 8.0, 1.0, 3.0, 9.0, 9.0, 11.0, 24.0, 42.0, 56.0, 93.0, 148.0, 267.0, 469.0, 903.0, 1915.0, 4088.0, 9547.0, 27540.0, 101042.0, 486097.0, 317883.0, 65245.0, 19444.0, 7305.0, 3114.0, 1459.0, 799.0, 413.0, 240.0, 152.0, 93.0, 35.0, 33.0, 27.0, 9.0, 8.0, 3.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.087890625, -2.98779296875, -2.8876953125, -2.78759765625, -2.6875, -2.58740234375, -2.4873046875, -2.38720703125, -2.287109375, -2.18701171875, -2.0869140625, -1.98681640625, -1.88671875, -1.78662109375, -1.6865234375, -1.58642578125, -1.486328125, -1.38623046875, -1.2861328125, -1.18603515625, -1.0859375, -0.98583984375, -0.8857421875, -0.78564453125, -0.685546875, -0.58544921875, -0.4853515625, -0.38525390625, -0.28515625, -0.18505859375, -0.0849609375, 0.01513671875, 0.115234375, 0.21533203125, 0.3154296875, 0.41552734375, 0.515625, 0.61572265625, 0.7158203125, 0.81591796875, 0.916015625, 1.01611328125, 1.1162109375, 1.21630859375, 1.31640625, 1.41650390625, 1.5166015625, 1.61669921875, 1.716796875, 1.81689453125, 1.9169921875, 2.01708984375, 2.1171875, 2.21728515625, 2.3173828125, 2.41748046875, 2.517578125, 2.61767578125, 2.7177734375, 2.81787109375, 2.91796875, 3.01806640625, 3.1181640625, 3.21826171875, 3.318359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 3.0, 9.0, 14.0, 8.0, 14.0, 20.0, 31.0, 40.0, 46.0, 47.0, 45.0, 78.0, 76.0, 74.0, 87.0, 79.0, 48.0, 52.0, 38.0, 44.0, 24.0, 22.0, 25.0, 18.0, 12.0, 6.0, 4.0, 5.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.01171875, -5.83868408203125, -5.6656494140625, -5.49261474609375, -5.319580078125, -5.14654541015625, -4.9735107421875, -4.80047607421875, -4.62744140625, -4.45440673828125, -4.2813720703125, -4.10833740234375, -3.935302734375, -3.76226806640625, -3.5892333984375, -3.41619873046875, -3.2431640625, -3.07012939453125, -2.8970947265625, -2.72406005859375, -2.551025390625, -2.37799072265625, -2.2049560546875, -2.03192138671875, -1.85888671875, -1.68585205078125, -1.5128173828125, -1.33978271484375, -1.166748046875, -0.99371337890625, -0.8206787109375, -0.64764404296875, -0.474609375, -0.30157470703125, -0.1285400390625, 0.04449462890625, 0.217529296875, 0.39056396484375, 0.5635986328125, 0.73663330078125, 0.90966796875, 1.08270263671875, 1.2557373046875, 1.42877197265625, 1.601806640625, 1.77484130859375, 1.9478759765625, 2.12091064453125, 2.2939453125, 2.46697998046875, 2.6400146484375, 2.81304931640625, 2.986083984375, 3.15911865234375, 3.3321533203125, 3.50518798828125, 3.67822265625, 3.85125732421875, 4.0242919921875, 4.19732666015625, 4.370361328125, 4.54339599609375, 4.7164306640625, 4.88946533203125, 5.0625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 7.0, 10.0, 7.0, 16.0, 18.0, 21.0, 14.0, 25.0, 21.0, 28.0, 35.0, 26.0, 45.0, 65.0, 85.0, 175.0, 919.0, 15456.0, 996711.0, 32897.0, 1309.0, 210.0, 87.0, 57.0, 35.0, 37.0, 34.0, 32.0, 22.0, 18.0, 17.0, 15.0, 8.0, 9.0, 14.0, 10.0, 7.0, 3.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.421875, -12.028564453125, -11.63525390625, -11.241943359375, -10.8486328125, -10.455322265625, -10.06201171875, -9.668701171875, -9.275390625, -8.882080078125, -8.48876953125, -8.095458984375, -7.7021484375, -7.308837890625, -6.91552734375, -6.522216796875, -6.12890625, -5.735595703125, -5.34228515625, -4.948974609375, -4.5556640625, -4.162353515625, -3.76904296875, -3.375732421875, -2.982421875, -2.589111328125, -2.19580078125, -1.802490234375, -1.4091796875, -1.015869140625, -0.62255859375, -0.229248046875, 0.1640625, 0.557373046875, 0.95068359375, 1.343994140625, 1.7373046875, 2.130615234375, 2.52392578125, 2.917236328125, 3.310546875, 3.703857421875, 4.09716796875, 4.490478515625, 4.8837890625, 5.277099609375, 5.67041015625, 6.063720703125, 6.45703125, 6.850341796875, 7.24365234375, 7.636962890625, 8.0302734375, 8.423583984375, 8.81689453125, 9.210205078125, 9.603515625, 9.996826171875, 10.39013671875, 10.783447265625, 11.1767578125, 11.570068359375, 11.96337890625, 12.356689453125, 12.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 11.0, 13.0, 5.0, 9.0, 7.0, 16.0, 9.0, 19.0, 17.0, 14.0, 25.0, 23.0, 22.0, 26.0, 32.0, 34.0, 43.0, 37.0, 31.0, 51.0, 29.0, 34.0, 41.0, 43.0, 42.0, 40.0, 28.0, 36.0, 24.0, 25.0, 17.0, 36.0, 19.0, 17.0, 23.0, 10.0, 11.0, 16.0, 14.0, 6.0, 9.0, 4.0, 5.0, 6.0, 1.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.916015625, -3.79376220703125, -3.6715087890625, -3.54925537109375, -3.427001953125, -3.30474853515625, -3.1824951171875, -3.06024169921875, -2.93798828125, -2.81573486328125, -2.6934814453125, -2.57122802734375, -2.448974609375, -2.32672119140625, -2.2044677734375, -2.08221435546875, -1.9599609375, -1.83770751953125, -1.7154541015625, -1.59320068359375, -1.470947265625, -1.34869384765625, -1.2264404296875, -1.10418701171875, -0.98193359375, -0.85968017578125, -0.7374267578125, -0.61517333984375, -0.492919921875, -0.37066650390625, -0.2484130859375, -0.12615966796875, -0.00390625, 0.11834716796875, 0.2406005859375, 0.36285400390625, 0.485107421875, 0.60736083984375, 0.7296142578125, 0.85186767578125, 0.97412109375, 1.09637451171875, 1.2186279296875, 1.34088134765625, 1.463134765625, 1.58538818359375, 1.7076416015625, 1.82989501953125, 1.9521484375, 2.07440185546875, 2.1966552734375, 2.31890869140625, 2.441162109375, 2.56341552734375, 2.6856689453125, 2.80792236328125, 2.93017578125, 3.05242919921875, 3.1746826171875, 3.29693603515625, 3.419189453125, 3.54144287109375, 3.6636962890625, 3.78594970703125, 3.908203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 10.0, 11.0, 17.0, 26.0, 33.0, 66.0, 125.0, 232.0, 473.0, 1103.0, 3198.0, 11605.0, 69769.0, 613342.0, 305127.0, 32904.0, 7015.0, 2010.0, 768.0, 334.0, 147.0, 86.0, 45.0, 34.0, 25.0, 13.0, 7.0, 6.0, 2.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0614471435546875, -1.023284912109375, -0.9851226806640625, -0.94696044921875, -0.9087982177734375, -0.870635986328125, -0.8324737548828125, -0.7943115234375, -0.7561492919921875, -0.717987060546875, -0.6798248291015625, -0.64166259765625, -0.6035003662109375, -0.565338134765625, -0.5271759033203125, -0.489013671875, -0.4508514404296875, -0.412689208984375, -0.3745269775390625, -0.33636474609375, -0.2982025146484375, -0.260040283203125, -0.2218780517578125, -0.1837158203125, -0.1455535888671875, -0.107391357421875, -0.0692291259765625, -0.03106689453125, 0.0070953369140625, 0.045257568359375, 0.0834197998046875, 0.12158203125, 0.1597442626953125, 0.197906494140625, 0.2360687255859375, 0.27423095703125, 0.3123931884765625, 0.350555419921875, 0.3887176513671875, 0.4268798828125, 0.4650421142578125, 0.503204345703125, 0.5413665771484375, 0.57952880859375, 0.6176910400390625, 0.655853271484375, 0.6940155029296875, 0.732177734375, 0.7703399658203125, 0.808502197265625, 0.8466644287109375, 0.88482666015625, 0.9229888916015625, 0.961151123046875, 0.9993133544921875, 1.0374755859375, 1.0756378173828125, 1.113800048828125, 1.1519622802734375, 1.19012451171875, 1.2282867431640625, 1.266448974609375, 1.3046112060546875, 1.3427734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 10.0, 6.0, 17.0, 12.0, 16.0, 22.0, 22.0, 32.0, 45.0, 55.0, 55.0, 77.0, 77.0, 92.0, 81.0, 86.0, 48.0, 60.0, 40.0, 27.0, 24.0, 19.0, 13.0, 13.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013196468353271484, -0.0001279003918170929, -0.00012383610010147095, -0.000119771808385849, -0.00011570751667022705, -0.0001116432249546051, -0.00010757893323898315, -0.0001035146415233612, -9.945034980773926e-05, -9.538605809211731e-05, -9.132176637649536e-05, -8.725747466087341e-05, -8.319318294525146e-05, -7.912889122962952e-05, -7.506459951400757e-05, -7.100030779838562e-05, -6.693601608276367e-05, -6.287172436714172e-05, -5.8807432651519775e-05, -5.474314093589783e-05, -5.067884922027588e-05, -4.661455750465393e-05, -4.255026578903198e-05, -3.8485974073410034e-05, -3.4421682357788086e-05, -3.0357390642166138e-05, -2.629309892654419e-05, -2.222880721092224e-05, -1.8164515495300293e-05, -1.4100223779678345e-05, -1.0035932064056396e-05, -5.971640348434448e-06, -1.9073486328125e-06, 2.1569430828094482e-06, 6.2212347984313965e-06, 1.0285526514053345e-05, 1.4349818229675293e-05, 1.841410994529724e-05, 2.247840166091919e-05, 2.6542693376541138e-05, 3.0606985092163086e-05, 3.4671276807785034e-05, 3.873556852340698e-05, 4.279986023902893e-05, 4.686415195465088e-05, 5.092844367027283e-05, 5.4992735385894775e-05, 5.9057027101516724e-05, 6.312131881713867e-05, 6.718561053276062e-05, 7.124990224838257e-05, 7.531419396400452e-05, 7.937848567962646e-05, 8.344277739524841e-05, 8.750706911087036e-05, 9.157136082649231e-05, 9.563565254211426e-05, 9.96999442577362e-05, 0.00010376423597335815, 0.0001078285276889801, 0.00011189281940460205, 0.000115957111120224, 0.00012002140283584595, 0.0001240856945514679, 0.00012814998626708984]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 9.0, 9.0, 23.0, 55.0, 66.0, 128.0, 278.0, 697.0, 2014.0, 7040.0, 36535.0, 403647.0, 537942.0, 47907.0, 8483.0, 2303.0, 790.0, 302.0, 154.0, 60.0, 45.0, 19.0, 19.0, 4.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.421173095703125, -1.37945556640625, -1.337738037109375, -1.2960205078125, -1.254302978515625, -1.21258544921875, -1.170867919921875, -1.129150390625, -1.087432861328125, -1.04571533203125, -1.003997802734375, -0.9622802734375, -0.920562744140625, -0.87884521484375, -0.837127685546875, -0.79541015625, -0.753692626953125, -0.71197509765625, -0.670257568359375, -0.6285400390625, -0.586822509765625, -0.54510498046875, -0.503387451171875, -0.461669921875, -0.419952392578125, -0.37823486328125, -0.336517333984375, -0.2947998046875, -0.253082275390625, -0.21136474609375, -0.169647216796875, -0.1279296875, -0.086212158203125, -0.04449462890625, -0.002777099609375, 0.0389404296875, 0.080657958984375, 0.12237548828125, 0.164093017578125, 0.205810546875, 0.247528076171875, 0.28924560546875, 0.330963134765625, 0.3726806640625, 0.414398193359375, 0.45611572265625, 0.497833251953125, 0.53955078125, 0.581268310546875, 0.62298583984375, 0.664703369140625, 0.7064208984375, 0.748138427734375, 0.78985595703125, 0.831573486328125, 0.873291015625, 0.915008544921875, 0.95672607421875, 0.998443603515625, 1.0401611328125, 1.081878662109375, 1.12359619140625, 1.165313720703125, 1.20703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 5.0, 13.0, 8.0, 17.0, 22.0, 26.0, 24.0, 40.0, 54.0, 74.0, 80.0, 93.0, 85.0, 92.0, 65.0, 73.0, 50.0, 30.0, 34.0, 24.0, 14.0, 14.0, 11.0, 12.0, 6.0, 11.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416259765625, -0.4010505676269531, -0.38584136962890625, -0.3706321716308594, -0.3554229736328125, -0.3402137756347656, -0.32500457763671875, -0.3097953796386719, -0.294586181640625, -0.2793769836425781, -0.26416778564453125, -0.24895858764648438, -0.2337493896484375, -0.21854019165039062, -0.20333099365234375, -0.18812179565429688, -0.17291259765625, -0.15770339965820312, -0.14249420166015625, -0.12728500366210938, -0.1120758056640625, -0.09686660766601562, -0.08165740966796875, -0.06644821166992188, -0.051239013671875, -0.036029815673828125, -0.02082061767578125, -0.005611419677734375, 0.0095977783203125, 0.024806976318359375, 0.04001617431640625, 0.055225372314453125, 0.0704345703125, 0.08564376831054688, 0.10085296630859375, 0.11606216430664062, 0.1312713623046875, 0.14648056030273438, 0.16168975830078125, 0.17689895629882812, 0.192108154296875, 0.20731735229492188, 0.22252655029296875, 0.23773574829101562, 0.2529449462890625, 0.2681541442871094, 0.28336334228515625, 0.2985725402832031, 0.31378173828125, 0.3289909362792969, 0.34420013427734375, 0.3594093322753906, 0.3746185302734375, 0.3898277282714844, 0.40503692626953125, 0.4202461242675781, 0.435455322265625, 0.4506645202636719, 0.46587371826171875, 0.4810829162597656, 0.4962921142578125, 0.5115013122558594, 0.5267105102539062, 0.5419197082519531, 0.55712890625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 31.0, 261.0, 612.0, 74.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.790647506713867, -29.464717864990234, -28.138790130615234, -26.8128604888916, -25.48693084716797, -24.16100311279297, -22.835073471069336, -21.509143829345703, -20.183216094970703, -18.85728645324707, -17.53135871887207, -16.205429077148438, -14.879499435424805, -13.553570747375488, -12.227642059326172, -10.901712417602539, -9.575782775878906, -8.24985408782959, -6.923924446105957, -5.597995758056641, -4.272066593170166, -2.9461374282836914, -1.620208740234375, -0.2942790985107422, 1.0316495895385742, 2.357578754425049, 3.6835076808929443, 5.00943660736084, 6.3353657722473145, 7.661294937133789, 8.987223625183105, 10.313153266906738, 11.639080047607422, 12.965008735656738, 14.290938377380371, 15.616867065429688, 16.94279670715332, 18.268726348876953, 19.594654083251953, 20.920583724975586, 22.24651336669922, 23.57244300842285, 24.89837074279785, 26.224300384521484, 27.550230026245117, 28.87615966796875, 30.20208740234375, 31.528017044067383, 32.85394287109375, 34.17987060546875, 35.505802154541016, 36.831729888916016, 38.157657623291016, 39.48358917236328, 40.80951690673828, 42.13544464111328, 43.46137619018555, 44.78730392456055, 46.11323547363281, 47.43916320800781, 48.76509094238281, 50.09102249145508, 51.41695022583008, 52.742881774902344, 54.068809509277344]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 14.0, 8.0, 22.0, 23.0, 18.0, 26.0, 36.0, 42.0, 30.0, 42.0, 38.0, 50.0, 56.0, 45.0, 48.0, 43.0, 64.0, 47.0, 48.0, 44.0, 34.0, 31.0, 27.0, 21.0, 18.0, 13.0, 12.0, 17.0, 13.0, 8.0, 11.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.167393684387207, -9.875500679016113, -9.583608627319336, -9.291715621948242, -8.999823570251465, -8.707930564880371, -8.416038513183594, -8.1241455078125, -7.832253456115723, -7.540360927581787, -7.248468399047852, -6.956575870513916, -6.6646833419799805, -6.372790813446045, -6.080898284912109, -5.789005279541016, -5.49711275100708, -5.2052202224731445, -4.913327693939209, -4.621435165405273, -4.329542636871338, -4.037650108337402, -3.7457573413848877, -3.453864812850952, -3.1619722843170166, -2.870079755783081, -2.5781872272491455, -2.286294460296631, -1.9944020509719849, -1.7025095224380493, -1.4106168746948242, -1.1187243461608887, -0.8268318176269531, -0.5349392890930176, -0.24304670095443726, 0.048845887184143066, 0.3407384157180786, 0.6326309442520142, 0.9245235919952393, 1.2164161205291748, 1.5083086490631104, 1.800201177597046, 2.0920937061309814, 2.383986473083496, 2.6758790016174316, 2.967771530151367, 3.2596640586853027, 3.5515565872192383, 3.843449115753174, 4.135341644287109, 4.427234172821045, 4.7191267013549805, 5.011019229888916, 5.302911758422852, 5.594804763793945, 5.886696815490723, 6.178589820861816, 6.470482349395752, 6.7623748779296875, 7.054267406463623, 7.346159934997559, 7.638052463531494, 7.92994499206543, 8.221837997436523, 8.5137300491333]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 12.0, 11.0, 11.0, 25.0, 34.0, 48.0, 84.0, 124.0, 214.0, 344.0, 532.0, 951.0, 1982.0, 3906.0, 9684.0, 27889.0, 111611.0, 1067910.0, 2723984.0, 182265.0, 39392.0, 12895.0, 5121.0, 2370.0, 1232.0, 660.0, 376.0, 202.0, 126.0, 95.0, 62.0, 54.0, 30.0, 14.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.75390625, -3.6500244140625, -3.546142578125, -3.4422607421875, -3.33837890625, -3.2344970703125, -3.130615234375, -3.0267333984375, -2.9228515625, -2.8189697265625, -2.715087890625, -2.6112060546875, -2.50732421875, -2.4034423828125, -2.299560546875, -2.1956787109375, -2.091796875, -1.9879150390625, -1.884033203125, -1.7801513671875, -1.67626953125, -1.5723876953125, -1.468505859375, -1.3646240234375, -1.2607421875, -1.1568603515625, -1.052978515625, -0.9490966796875, -0.84521484375, -0.7413330078125, -0.637451171875, -0.5335693359375, -0.4296875, -0.3258056640625, -0.221923828125, -0.1180419921875, -0.01416015625, 0.0897216796875, 0.193603515625, 0.2974853515625, 0.4013671875, 0.5052490234375, 0.609130859375, 0.7130126953125, 0.81689453125, 0.9207763671875, 1.024658203125, 1.1285400390625, 1.232421875, 1.3363037109375, 1.440185546875, 1.5440673828125, 1.64794921875, 1.7518310546875, 1.855712890625, 1.9595947265625, 2.0634765625, 2.1673583984375, 2.271240234375, 2.3751220703125, 2.47900390625, 2.5828857421875, 2.686767578125, 2.7906494140625, 2.89453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 5.0, 10.0, 9.0, 12.0, 23.0, 25.0, 31.0, 37.0, 44.0, 58.0, 66.0, 66.0, 79.0, 84.0, 65.0, 71.0, 66.0, 48.0, 37.0, 29.0, 28.0, 19.0, 13.0, 16.0, 11.0, 7.0, 9.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.295257568359375, -3.19012451171875, -3.084991455078125, -2.9798583984375, -2.874725341796875, -2.76959228515625, -2.664459228515625, -2.559326171875, -2.454193115234375, -2.34906005859375, -2.243927001953125, -2.1387939453125, -2.033660888671875, -1.92852783203125, -1.823394775390625, -1.71826171875, -1.613128662109375, -1.50799560546875, -1.402862548828125, -1.2977294921875, -1.192596435546875, -1.08746337890625, -0.982330322265625, -0.877197265625, -0.772064208984375, -0.66693115234375, -0.561798095703125, -0.4566650390625, -0.351531982421875, -0.24639892578125, -0.141265869140625, -0.0361328125, 0.069000244140625, 0.17413330078125, 0.279266357421875, 0.3843994140625, 0.489532470703125, 0.59466552734375, 0.699798583984375, 0.804931640625, 0.910064697265625, 1.01519775390625, 1.120330810546875, 1.2254638671875, 1.330596923828125, 1.43572998046875, 1.540863037109375, 1.64599609375, 1.751129150390625, 1.85626220703125, 1.961395263671875, 2.0665283203125, 2.171661376953125, 2.27679443359375, 2.381927490234375, 2.487060546875, 2.592193603515625, 2.69732666015625, 2.802459716796875, 2.9075927734375, 3.012725830078125, 3.11785888671875, 3.222991943359375, 3.328125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 15.0, 20.0, 32.0, 52.0, 146.0, 558.0, 19240.0, 4169365.0, 4229.0, 393.0, 116.0, 42.0, 34.0, 15.0, 8.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.921875, -20.128173828125, -19.33447265625, -18.540771484375, -17.7470703125, -16.953369140625, -16.15966796875, -15.365966796875, -14.572265625, -13.778564453125, -12.98486328125, -12.191162109375, -11.3974609375, -10.603759765625, -9.81005859375, -9.016357421875, -8.22265625, -7.428955078125, -6.63525390625, -5.841552734375, -5.0478515625, -4.254150390625, -3.46044921875, -2.666748046875, -1.873046875, -1.079345703125, -0.28564453125, 0.508056640625, 1.3017578125, 2.095458984375, 2.88916015625, 3.682861328125, 4.4765625, 5.270263671875, 6.06396484375, 6.857666015625, 7.6513671875, 8.445068359375, 9.23876953125, 10.032470703125, 10.826171875, 11.619873046875, 12.41357421875, 13.207275390625, 14.0009765625, 14.794677734375, 15.58837890625, 16.382080078125, 17.17578125, 17.969482421875, 18.76318359375, 19.556884765625, 20.3505859375, 21.144287109375, 21.93798828125, 22.731689453125, 23.525390625, 24.319091796875, 25.11279296875, 25.906494140625, 26.7001953125, 27.493896484375, 28.28759765625, 29.081298828125, 29.875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 9.0, 9.0, 13.0, 9.0, 22.0, 22.0, 39.0, 66.0, 71.0, 101.0, 156.0, 200.0, 421.0, 972.0, 808.0, 393.0, 223.0, 145.0, 101.0, 71.0, 59.0, 32.0, 31.0, 20.0, 15.0, 8.0, 7.0, 9.0, 11.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7374649047851562, -0.7078399658203125, -0.6782150268554688, -0.648590087890625, -0.6189651489257812, -0.5893402099609375, -0.5597152709960938, -0.53009033203125, -0.5004653930664062, -0.4708404541015625, -0.44121551513671875, -0.411590576171875, -0.38196563720703125, -0.3523406982421875, -0.32271575927734375, -0.2930908203125, -0.26346588134765625, -0.2338409423828125, -0.20421600341796875, -0.174591064453125, -0.14496612548828125, -0.1153411865234375, -0.08571624755859375, -0.05609130859375, -0.02646636962890625, 0.0031585693359375, 0.03278350830078125, 0.062408447265625, 0.09203338623046875, 0.1216583251953125, 0.15128326416015625, 0.180908203125, 0.21053314208984375, 0.2401580810546875, 0.26978302001953125, 0.299407958984375, 0.32903289794921875, 0.3586578369140625, 0.38828277587890625, 0.41790771484375, 0.44753265380859375, 0.4771575927734375, 0.5067825317382812, 0.536407470703125, 0.5660324096679688, 0.5956573486328125, 0.6252822875976562, 0.6549072265625, 0.6845321655273438, 0.7141571044921875, 0.7437820434570312, 0.773406982421875, 0.8030319213867188, 0.8326568603515625, 0.8622817993164062, 0.89190673828125, 0.9215316772460938, 0.9511566162109375, 0.9807815551757812, 1.010406494140625, 1.0400314331054688, 1.0696563720703125, 1.0992813110351562, 1.12890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 8.0, 12.0, 12.0, 22.0, 32.0, 49.0, 83.0, 146.0, 166.0, 148.0, 126.0, 60.0, 33.0, 27.0, 15.0, 10.0, 4.0, 8.0, 7.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.317467212677002, -6.13067626953125, -5.943885803222656, -5.757094860076904, -5.570303916931152, -5.3835129737854, -5.196722030639648, -5.009931564331055, -4.823140621185303, -4.636349678039551, -4.449559211730957, -4.262768268585205, -4.075977325439453, -3.889186382293701, -3.7023956775665283, -3.5156049728393555, -3.3288140296936035, -3.1420230865478516, -2.9552323818206787, -2.768441677093506, -2.581650733947754, -2.394859790802002, -2.208069086074829, -2.0212783813476562, -1.8344874382019043, -1.647696614265442, -1.4609057903289795, -1.274114966392517, -1.0873241424560547, -0.9005333185195923, -0.7137424945831299, -0.5269516706466675, -0.3401608467102051, -0.15337002277374268, 0.03342080116271973, 0.22021162509918213, 0.40700244903564453, 0.5937932729721069, 0.7805840969085693, 0.9673749208450317, 1.1541657447814941, 1.3409565687179565, 1.527747392654419, 1.7145382165908813, 1.9013290405273438, 2.0881199836730957, 2.2749106884002686, 2.4617013931274414, 2.6484923362731934, 2.8352832794189453, 3.022073984146118, 3.208864688873291, 3.395655632019043, 3.582446575164795, 3.7692372798919678, 3.9560279846191406, 4.142818927764893, 4.3296098709106445, 4.516400337219238, 4.70319128036499, 4.889982223510742, 5.076773166656494, 5.263564109802246, 5.45035457611084, 5.637145519256592]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 5.0, 5.0, 13.0, 11.0, 14.0, 18.0, 23.0, 32.0, 37.0, 30.0, 51.0, 59.0, 55.0, 64.0, 65.0, 61.0, 55.0, 54.0, 59.0, 43.0, 40.0, 42.0, 31.0, 22.0, 17.0, 18.0, 13.0, 16.0, 8.0, 9.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51434063911438, -3.407276153564453, -3.3002114295959473, -3.1931467056274414, -3.0860822200775146, -2.979017734527588, -2.871953010559082, -2.764888286590576, -2.6578238010406494, -2.5507593154907227, -2.443694591522217, -2.336629867553711, -2.229565382003784, -2.1225008964538574, -2.0154361724853516, -1.9083715677261353, -1.801306962966919, -1.6942423582077026, -1.5871777534484863, -1.48011314868927, -1.3730485439300537, -1.2659839391708374, -1.158919334411621, -1.0518547296524048, -0.9447901248931885, -0.8377255201339722, -0.7306609153747559, -0.6235963106155396, -0.5165317058563232, -0.40946710109710693, -0.3024024963378906, -0.19533789157867432, -0.0882730484008789, 0.018791556358337402, 0.1258561611175537, 0.23292076587677002, 0.33998537063598633, 0.44704997539520264, 0.554114580154419, 0.6611791849136353, 0.7682437896728516, 0.8753083944320679, 0.9823729991912842, 1.0894376039505005, 1.1965022087097168, 1.303566813468933, 1.4106314182281494, 1.5176960229873657, 1.624760627746582, 1.7318252325057983, 1.8388898372650146, 1.945954442024231, 2.0530190467834473, 2.160083770751953, 2.26714825630188, 2.3742127418518066, 2.4812774658203125, 2.5883421897888184, 2.695406675338745, 2.802471160888672, 2.9095358848571777, 3.0166006088256836, 3.1236650943756104, 3.230729579925537, 3.337794303894043]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 6.0, 16.0, 23.0, 28.0, 44.0, 43.0, 62.0, 78.0, 130.0, 209.0, 324.0, 543.0, 1005.0, 2094.0, 5252.0, 15933.0, 72335.0, 524026.0, 356908.0, 49173.0, 11953.0, 4216.0, 1884.0, 859.0, 482.0, 297.0, 175.0, 126.0, 79.0, 58.0, 54.0, 41.0, 21.0, 16.0, 11.0, 8.0, 7.0, 4.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26513671875, -0.2556304931640625, -0.246124267578125, -0.2366180419921875, -0.22711181640625, -0.2176055908203125, -0.208099365234375, -0.1985931396484375, -0.1890869140625, -0.1795806884765625, -0.170074462890625, -0.1605682373046875, -0.15106201171875, -0.1415557861328125, -0.132049560546875, -0.1225433349609375, -0.113037109375, -0.1035308837890625, -0.094024658203125, -0.0845184326171875, -0.07501220703125, -0.0655059814453125, -0.055999755859375, -0.0464935302734375, -0.0369873046875, -0.0274810791015625, -0.017974853515625, -0.0084686279296875, 0.00103759765625, 0.0105438232421875, 0.020050048828125, 0.0295562744140625, 0.0390625, 0.0485687255859375, 0.058074951171875, 0.0675811767578125, 0.07708740234375, 0.0865936279296875, 0.096099853515625, 0.1056060791015625, 0.1151123046875, 0.1246185302734375, 0.134124755859375, 0.1436309814453125, 0.15313720703125, 0.1626434326171875, 0.172149658203125, 0.1816558837890625, 0.191162109375, 0.2006683349609375, 0.210174560546875, 0.2196807861328125, 0.22918701171875, 0.2386932373046875, 0.248199462890625, 0.2577056884765625, 0.2672119140625, 0.2767181396484375, 0.286224365234375, 0.2957305908203125, 0.30523681640625, 0.3147430419921875, 0.324249267578125, 0.3337554931640625, 0.34326171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 6.0, 15.0, 16.0, 16.0, 22.0, 35.0, 40.0, 61.0, 62.0, 64.0, 73.0, 83.0, 61.0, 67.0, 55.0, 55.0, 50.0, 43.0, 24.0, 25.0, 21.0, 14.0, 12.0, 10.0, 10.0, 10.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6484375, -2.56866455078125, -2.4888916015625, -2.40911865234375, -2.329345703125, -2.24957275390625, -2.1697998046875, -2.09002685546875, -2.01025390625, -1.93048095703125, -1.8507080078125, -1.77093505859375, -1.691162109375, -1.61138916015625, -1.5316162109375, -1.45184326171875, -1.3720703125, -1.29229736328125, -1.2125244140625, -1.13275146484375, -1.052978515625, -0.97320556640625, -0.8934326171875, -0.81365966796875, -0.73388671875, -0.65411376953125, -0.5743408203125, -0.49456787109375, -0.414794921875, -0.33502197265625, -0.2552490234375, -0.17547607421875, -0.095703125, -0.01593017578125, 0.0638427734375, 0.14361572265625, 0.223388671875, 0.30316162109375, 0.3829345703125, 0.46270751953125, 0.54248046875, 0.62225341796875, 0.7020263671875, 0.78179931640625, 0.861572265625, 0.94134521484375, 1.0211181640625, 1.10089111328125, 1.1806640625, 1.26043701171875, 1.3402099609375, 1.41998291015625, 1.499755859375, 1.57952880859375, 1.6593017578125, 1.73907470703125, 1.81884765625, 1.89862060546875, 1.9783935546875, 2.05816650390625, 2.137939453125, 2.21771240234375, 2.2974853515625, 2.37725830078125, 2.45703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 7.0, 11.0, 10.0, 21.0, 22.0, 35.0, 37.0, 54.0, 91.0, 93.0, 151.0, 226.0, 392.0, 796.0, 2869.0, 26111.0, 438495.0, 541616.0, 32243.0, 3286.0, 784.0, 398.0, 238.0, 136.0, 118.0, 77.0, 65.0, 36.0, 36.0, 24.0, 14.0, 14.0, 15.0, 3.0, 2.0, 5.0, 6.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.413818359375, -0.4029426574707031, -0.39206695556640625, -0.3811912536621094, -0.3703155517578125, -0.3594398498535156, -0.34856414794921875, -0.3376884460449219, -0.326812744140625, -0.3159370422363281, -0.30506134033203125, -0.2941856384277344, -0.2833099365234375, -0.2724342346191406, -0.26155853271484375, -0.2506828308105469, -0.23980712890625, -0.22893142700195312, -0.21805572509765625, -0.20718002319335938, -0.1963043212890625, -0.18542861938476562, -0.17455291748046875, -0.16367721557617188, -0.152801513671875, -0.14192581176757812, -0.13105010986328125, -0.12017440795898438, -0.1092987060546875, -0.09842300415039062, -0.08754730224609375, -0.07667160034179688, -0.0657958984375, -0.054920196533203125, -0.04404449462890625, -0.033168792724609375, -0.0222930908203125, -0.011417388916015625, -0.00054168701171875, 0.010334014892578125, 0.021209716796875, 0.032085418701171875, 0.04296112060546875, 0.053836822509765625, 0.0647125244140625, 0.07558822631835938, 0.08646392822265625, 0.09733963012695312, 0.10821533203125, 0.11909103393554688, 0.12996673583984375, 0.14084243774414062, 0.1517181396484375, 0.16259384155273438, 0.17346954345703125, 0.18434524536132812, 0.195220947265625, 0.20609664916992188, 0.21697235107421875, 0.22784805297851562, 0.2387237548828125, 0.24959945678710938, 0.26047515869140625, 0.2713508605957031, 0.2822265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 4.0, 9.0, 15.0, 11.0, 18.0, 25.0, 28.0, 28.0, 38.0, 35.0, 41.0, 40.0, 44.0, 48.0, 53.0, 38.0, 40.0, 52.0, 52.0, 44.0, 41.0, 35.0, 40.0, 39.0, 21.0, 33.0, 21.0, 17.0, 18.0, 13.0, 6.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.701171875, -3.58953857421875, -3.4779052734375, -3.36627197265625, -3.254638671875, -3.14300537109375, -3.0313720703125, -2.91973876953125, -2.80810546875, -2.69647216796875, -2.5848388671875, -2.47320556640625, -2.361572265625, -2.24993896484375, -2.1383056640625, -2.02667236328125, -1.9150390625, -1.80340576171875, -1.6917724609375, -1.58013916015625, -1.468505859375, -1.35687255859375, -1.2452392578125, -1.13360595703125, -1.02197265625, -0.91033935546875, -0.7987060546875, -0.68707275390625, -0.575439453125, -0.46380615234375, -0.3521728515625, -0.24053955078125, -0.12890625, -0.01727294921875, 0.0943603515625, 0.20599365234375, 0.317626953125, 0.42926025390625, 0.5408935546875, 0.65252685546875, 0.76416015625, 0.87579345703125, 0.9874267578125, 1.09906005859375, 1.210693359375, 1.32232666015625, 1.4339599609375, 1.54559326171875, 1.6572265625, 1.76885986328125, 1.8804931640625, 1.99212646484375, 2.103759765625, 2.21539306640625, 2.3270263671875, 2.43865966796875, 2.55029296875, 2.66192626953125, 2.7735595703125, 2.88519287109375, 2.996826171875, 3.10845947265625, 3.2200927734375, 3.33172607421875, 3.443359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 4.0, 15.0, 5.0, 8.0, 9.0, 16.0, 20.0, 33.0, 34.0, 64.0, 149.0, 260.0, 956.0, 10237.0, 1016060.0, 18659.0, 1281.0, 343.0, 134.0, 74.0, 35.0, 30.0, 23.0, 14.0, 11.0, 14.0, 16.0, 6.0, 5.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.206298828125, -0.1993255615234375, -0.192352294921875, -0.1853790283203125, -0.17840576171875, -0.1714324951171875, -0.164459228515625, -0.1574859619140625, -0.1505126953125, -0.1435394287109375, -0.136566162109375, -0.1295928955078125, -0.12261962890625, -0.1156463623046875, -0.108673095703125, -0.1016998291015625, -0.0947265625, -0.0877532958984375, -0.080780029296875, -0.0738067626953125, -0.06683349609375, -0.0598602294921875, -0.052886962890625, -0.0459136962890625, -0.0389404296875, -0.0319671630859375, -0.024993896484375, -0.0180206298828125, -0.01104736328125, -0.0040740966796875, 0.002899169921875, 0.0098724365234375, 0.016845703125, 0.0238189697265625, 0.030792236328125, 0.0377655029296875, 0.04473876953125, 0.0517120361328125, 0.058685302734375, 0.0656585693359375, 0.0726318359375, 0.0796051025390625, 0.086578369140625, 0.0935516357421875, 0.10052490234375, 0.1074981689453125, 0.114471435546875, 0.1214447021484375, 0.12841796875, 0.1353912353515625, 0.142364501953125, 0.1493377685546875, 0.15631103515625, 0.1632843017578125, 0.170257568359375, 0.1772308349609375, 0.1842041015625, 0.1911773681640625, 0.198150634765625, 0.2051239013671875, 0.21209716796875, 0.2190704345703125, 0.226043701171875, 0.2330169677734375, 0.239990234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 22.0, 51.0, 120.0, 245.0, 275.0, 149.0, 57.0, 29.0, 15.0, 10.0, 7.0, 8.0, 2.0, 1.0, 3.0], "bins": [-0.0001926422119140625, -0.0001890202984213829, -0.0001853983849287033, -0.0001817764714360237, -0.00017815455794334412, -0.00017453264445066452, -0.00017091073095798492, -0.00016728881746530533, -0.00016366690397262573, -0.00016004499047994614, -0.00015642307698726654, -0.00015280116349458694, -0.00014917925000190735, -0.00014555733650922775, -0.00014193542301654816, -0.00013831350952386856, -0.00013469159603118896, -0.00013106968253850937, -0.00012744776904582977, -0.00012382585555315018, -0.00012020394206047058, -0.00011658202856779099, -0.00011296011507511139, -0.00010933820158243179, -0.0001057162880897522, -0.0001020943745970726, -9.8472461104393e-05, -9.485054761171341e-05, -9.122863411903381e-05, -8.760672062635422e-05, -8.398480713367462e-05, -8.036289364099503e-05, -7.674098014831543e-05, -7.311906665563583e-05, -6.949715316295624e-05, -6.587523967027664e-05, -6.225332617759705e-05, -5.863141268491745e-05, -5.5009499192237854e-05, -5.138758569955826e-05, -4.776567220687866e-05, -4.4143758714199066e-05, -4.052184522151947e-05, -3.6899931728839874e-05, -3.327801823616028e-05, -2.9656104743480682e-05, -2.6034191250801086e-05, -2.241227775812149e-05, -1.8790364265441895e-05, -1.5168450772762299e-05, -1.1546537280082703e-05, -7.924623787403107e-06, -4.302710294723511e-06, -6.807968020439148e-07, 2.941116690635681e-06, 6.563030183315277e-06, 1.0184943675994873e-05, 1.3806857168674469e-05, 1.7428770661354065e-05, 2.105068415403366e-05, 2.4672597646713257e-05, 2.8294511139392853e-05, 3.191642463207245e-05, 3.5538338124752045e-05, 3.916025161743164e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 9.0, 12.0, 20.0, 18.0, 41.0, 61.0, 120.0, 171.0, 396.0, 861.0, 2872.0, 25834.0, 997452.0, 16674.0, 2435.0, 790.0, 333.0, 170.0, 102.0, 58.0, 43.0, 24.0, 16.0, 13.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2454833984375, -0.23619651794433594, -0.22690963745117188, -0.2176227569580078, -0.20833587646484375, -0.1990489959716797, -0.18976211547851562, -0.18047523498535156, -0.1711883544921875, -0.16190147399902344, -0.15261459350585938, -0.1433277130126953, -0.13404083251953125, -0.12475395202636719, -0.11546707153320312, -0.10618019104003906, -0.096893310546875, -0.08760643005371094, -0.07831954956054688, -0.06903266906738281, -0.05974578857421875, -0.05045890808105469, -0.041172027587890625, -0.03188514709472656, -0.0225982666015625, -0.013311386108398438, -0.004024505615234375, 0.0052623748779296875, 0.01454925537109375, 0.023836135864257812, 0.033123016357421875, 0.04240989685058594, 0.05169677734375, 0.06098365783691406, 0.07027053833007812, 0.07955741882324219, 0.08884429931640625, 0.09813117980957031, 0.10741806030273438, 0.11670494079589844, 0.1259918212890625, 0.13527870178222656, 0.14456558227539062, 0.1538524627685547, 0.16313934326171875, 0.1724262237548828, 0.18171310424804688, 0.19099998474121094, 0.200286865234375, 0.20957374572753906, 0.21886062622070312, 0.2281475067138672, 0.23743438720703125, 0.2467212677001953, 0.2560081481933594, 0.26529502868652344, 0.2745819091796875, 0.28386878967285156, 0.2931556701660156, 0.3024425506591797, 0.31172943115234375, 0.3210163116455078, 0.3303031921386719, 0.33959007263183594, 0.348876953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 15.0, 25.0, 122.0, 578.0, 166.0, 44.0, 18.0, 5.0, 8.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06329345703125, -0.06161308288574219, -0.059932708740234375, -0.05825233459472656, -0.05657196044921875, -0.05489158630371094, -0.053211212158203125, -0.05153083801269531, -0.0498504638671875, -0.04817008972167969, -0.046489715576171875, -0.04480934143066406, -0.04312896728515625, -0.04144859313964844, -0.039768218994140625, -0.03808784484863281, -0.036407470703125, -0.03472709655761719, -0.033046722412109375, -0.03136634826660156, -0.02968597412109375, -0.028005599975585938, -0.026325225830078125, -0.024644851684570312, -0.0229644775390625, -0.021284103393554688, -0.019603729248046875, -0.017923355102539062, -0.01624298095703125, -0.014562606811523438, -0.012882232666015625, -0.011201858520507812, -0.009521484375, -0.007841110229492188, -0.006160736083984375, -0.0044803619384765625, -0.00279998779296875, -0.0011196136474609375, 0.000560760498046875, 0.0022411346435546875, 0.0039215087890625, 0.0056018829345703125, 0.007282257080078125, 0.008962631225585938, 0.01064300537109375, 0.012323379516601562, 0.014003753662109375, 0.015684127807617188, 0.017364501953125, 0.019044876098632812, 0.020725250244140625, 0.022405624389648438, 0.02408599853515625, 0.025766372680664062, 0.027446746826171875, 0.029127120971679688, 0.0308074951171875, 0.03248786926269531, 0.034168243408203125, 0.03584861755371094, 0.03752899169921875, 0.03920936584472656, 0.040889739990234375, 0.04257011413574219, 0.04425048828125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 14.0, 13.0, 31.0, 49.0, 108.0, 217.0, 209.0, 166.0, 62.0, 34.0, 19.0, 17.0, 9.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.561765193939209, -5.399576187133789, -5.237387180328369, -5.075197696685791, -4.913008689880371, -4.750819683074951, -4.588630676269531, -4.426441669464111, -4.264252662658691, -4.1020636558532715, -3.9398744106292725, -3.7776854038238525, -3.6154961585998535, -3.4533071517944336, -3.2911181449890137, -3.1289291381835938, -2.9667396545410156, -2.8045506477355957, -2.6423614025115967, -2.4801723957061768, -2.3179831504821777, -2.155794143676758, -1.993605136871338, -1.8314160108566284, -1.669226884841919, -1.5070377588272095, -1.3448486328125, -1.18265962600708, -1.0204704999923706, -0.8582813739776611, -0.6960923075675964, -0.5339032411575317, -0.37171411514282227, -0.20952501893043518, -0.047335922718048096, 0.11485317349433899, 0.2770422697067261, 0.43923139572143555, 0.6014204621315002, 0.7636095285415649, 0.9257986545562744, 1.0879877805709839, 1.2501769065856934, 1.4123659133911133, 1.5745550394058228, 1.7367441654205322, 1.8989331722259521, 2.061122417449951, 2.223311424255371, 2.385500431060791, 2.54768967628479, 2.70987868309021, 2.872067928314209, 3.034256935119629, 3.196445941925049, 3.3586349487304688, 3.5208241939544678, 3.6830132007598877, 3.8452024459838867, 4.007391452789307, 4.169580459594727, 4.331769943237305, 4.493958950042725, 4.6561479568481445, 4.8183369636535645]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 13.0, 20.0, 24.0, 23.0, 45.0, 45.0, 45.0, 71.0, 67.0, 77.0, 73.0, 62.0, 60.0, 63.0, 46.0, 39.0, 39.0, 27.0, 28.0, 16.0, 11.0, 10.0, 10.0, 12.0, 8.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.44415283203125, -2.3693840503692627, -2.2946152687072754, -2.219846487045288, -2.145077705383301, -2.0703091621398926, -1.9955402612686157, -1.920771598815918, -1.8460028171539307, -1.7712340354919434, -1.696465253829956, -1.6216964721679688, -1.546927809715271, -1.4721590280532837, -1.3973902463912964, -1.3226215839385986, -1.2478526830673218, -1.1730839014053345, -1.0983151197433472, -1.0235464572906494, -0.9487776756286621, -0.8740088939666748, -0.7992401123046875, -0.724471390247345, -0.6497026085853577, -0.5749338269233704, -0.5001651048660278, -0.4253963232040405, -0.3506275713443756, -0.2758588194847107, -0.2010900378227234, -0.12632131576538086, -0.051552534103393555, 0.02321622520685196, 0.09798498451709747, 0.17275375127792358, 0.2475225031375885, 0.3222912549972534, 0.3970600366592407, 0.47182875871658325, 0.5465975403785706, 0.6213663220405579, 0.6961350440979004, 0.7709038257598877, 0.845672607421875, 0.9204413294792175, 0.9952101111412048, 1.0699788331985474, 1.1447476148605347, 1.219516396522522, 1.2942851781845093, 1.369053840637207, 1.4438226222991943, 1.5185914039611816, 1.593360185623169, 1.6681289672851562, 1.7428977489471436, 1.8176665306091309, 1.8924353122711182, 1.9672040939331055, 2.0419728755950928, 2.11674165725708, 2.1915102005004883, 2.2662789821624756, 2.341047763824463]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 14.0, 23.0, 35.0, 68.0, 206.0, 497.0, 1986.0, 17792.0, 782172.0, 236103.0, 7843.0, 1192.0, 331.0, 158.0, 54.0, 27.0, 15.0, 6.0, 3.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.21649169921875, -5.9759521484375, -5.73541259765625, -5.494873046875, -5.25433349609375, -5.0137939453125, -4.77325439453125, -4.53271484375, -4.29217529296875, -4.0516357421875, -3.81109619140625, -3.570556640625, -3.33001708984375, -3.0894775390625, -2.84893798828125, -2.6083984375, -2.36785888671875, -2.1273193359375, -1.88677978515625, -1.646240234375, -1.40570068359375, -1.1651611328125, -0.92462158203125, -0.68408203125, -0.44354248046875, -0.2030029296875, 0.03753662109375, 0.278076171875, 0.51861572265625, 0.7591552734375, 0.99969482421875, 1.240234375, 1.48077392578125, 1.7213134765625, 1.96185302734375, 2.202392578125, 2.44293212890625, 2.6834716796875, 2.92401123046875, 3.16455078125, 3.40509033203125, 3.6456298828125, 3.88616943359375, 4.126708984375, 4.36724853515625, 4.6077880859375, 4.84832763671875, 5.0888671875, 5.32940673828125, 5.5699462890625, 5.81048583984375, 6.051025390625, 6.29156494140625, 6.5321044921875, 6.77264404296875, 7.01318359375, 7.25372314453125, 7.4942626953125, 7.73480224609375, 7.975341796875, 8.21588134765625, 8.4564208984375, 8.69696044921875, 8.9375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 10.0, 16.0, 14.0, 21.0, 37.0, 66.0, 100.0, 118.0, 140.0, 113.0, 116.0, 73.0, 60.0, 35.0, 26.0, 19.0, 11.0, 7.0, 11.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.72467041015625, -5.4063720703125, -5.08807373046875, -4.769775390625, -4.45147705078125, -4.1331787109375, -3.81488037109375, -3.49658203125, -3.17828369140625, -2.8599853515625, -2.54168701171875, -2.223388671875, -1.90509033203125, -1.5867919921875, -1.26849365234375, -0.9501953125, -0.63189697265625, -0.3135986328125, 0.00469970703125, 0.322998046875, 0.64129638671875, 0.9595947265625, 1.27789306640625, 1.59619140625, 1.91448974609375, 2.2327880859375, 2.55108642578125, 2.869384765625, 3.18768310546875, 3.5059814453125, 3.82427978515625, 4.142578125, 4.46087646484375, 4.7791748046875, 5.09747314453125, 5.415771484375, 5.73406982421875, 6.0523681640625, 6.37066650390625, 6.68896484375, 7.00726318359375, 7.3255615234375, 7.64385986328125, 7.962158203125, 8.28045654296875, 8.5987548828125, 8.91705322265625, 9.2353515625, 9.55364990234375, 9.8719482421875, 10.19024658203125, 10.508544921875, 10.82684326171875, 11.1451416015625, 11.46343994140625, 11.78173828125, 12.10003662109375, 12.4183349609375, 12.73663330078125, 13.054931640625, 13.37322998046875, 13.6915283203125, 14.00982666015625, 14.328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 10.0, 11.0, 17.0, 20.0, 35.0, 29.0, 32.0, 48.0, 44.0, 58.0, 84.0, 135.0, 252.0, 605.0, 4116.0, 138303.0, 886421.0, 15962.0, 1376.0, 352.0, 131.0, 91.0, 90.0, 58.0, 37.0, 40.0, 23.0, 19.0, 18.0, 25.0, 19.0, 15.0, 13.0, 9.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.96484375, -6.74188232421875, -6.5189208984375, -6.29595947265625, -6.072998046875, -5.85003662109375, -5.6270751953125, -5.40411376953125, -5.18115234375, -4.95819091796875, -4.7352294921875, -4.51226806640625, -4.289306640625, -4.06634521484375, -3.8433837890625, -3.62042236328125, -3.3974609375, -3.17449951171875, -2.9515380859375, -2.72857666015625, -2.505615234375, -2.28265380859375, -2.0596923828125, -1.83673095703125, -1.61376953125, -1.39080810546875, -1.1678466796875, -0.94488525390625, -0.721923828125, -0.49896240234375, -0.2760009765625, -0.05303955078125, 0.169921875, 0.39288330078125, 0.6158447265625, 0.83880615234375, 1.061767578125, 1.28472900390625, 1.5076904296875, 1.73065185546875, 1.95361328125, 2.17657470703125, 2.3995361328125, 2.62249755859375, 2.845458984375, 3.06842041015625, 3.2913818359375, 3.51434326171875, 3.7373046875, 3.96026611328125, 4.1832275390625, 4.40618896484375, 4.629150390625, 4.85211181640625, 5.0750732421875, 5.29803466796875, 5.52099609375, 5.74395751953125, 5.9669189453125, 6.18988037109375, 6.412841796875, 6.63580322265625, 6.8587646484375, 7.08172607421875, 7.3046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 4.0, 5.0, 3.0, 4.0, 16.0, 7.0, 3.0, 22.0, 11.0, 20.0, 29.0, 22.0, 22.0, 39.0, 26.0, 34.0, 36.0, 32.0, 46.0, 38.0, 37.0, 46.0, 42.0, 30.0, 43.0, 30.0, 36.0, 35.0, 40.0, 24.0, 26.0, 23.0, 21.0, 23.0, 12.0, 20.0, 17.0, 15.0, 17.0, 13.0, 5.0, 12.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.74609375, -4.59906005859375, -4.4520263671875, -4.30499267578125, -4.157958984375, -4.01092529296875, -3.8638916015625, -3.71685791015625, -3.56982421875, -3.42279052734375, -3.2757568359375, -3.12872314453125, -2.981689453125, -2.83465576171875, -2.6876220703125, -2.54058837890625, -2.3935546875, -2.24652099609375, -2.0994873046875, -1.95245361328125, -1.805419921875, -1.65838623046875, -1.5113525390625, -1.36431884765625, -1.21728515625, -1.07025146484375, -0.9232177734375, -0.77618408203125, -0.629150390625, -0.48211669921875, -0.3350830078125, -0.18804931640625, -0.041015625, 0.10601806640625, 0.2530517578125, 0.40008544921875, 0.547119140625, 0.69415283203125, 0.8411865234375, 0.98822021484375, 1.13525390625, 1.28228759765625, 1.4293212890625, 1.57635498046875, 1.723388671875, 1.87042236328125, 2.0174560546875, 2.16448974609375, 2.3115234375, 2.45855712890625, 2.6055908203125, 2.75262451171875, 2.899658203125, 3.04669189453125, 3.1937255859375, 3.34075927734375, 3.48779296875, 3.63482666015625, 3.7818603515625, 3.92889404296875, 4.075927734375, 4.22296142578125, 4.3699951171875, 4.51702880859375, 4.6640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 7.0, 10.0, 8.0, 22.0, 29.0, 51.0, 58.0, 107.0, 200.0, 312.0, 610.0, 1230.0, 2975.0, 7961.0, 25849.0, 110804.0, 509167.0, 302586.0, 61074.0, 16032.0, 5297.0, 2099.0, 947.0, 476.0, 232.0, 150.0, 95.0, 55.0, 41.0, 24.0, 11.0, 14.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69921875, -0.6785354614257812, -0.6578521728515625, -0.6371688842773438, -0.616485595703125, -0.5958023071289062, -0.5751190185546875, -0.5544357299804688, -0.53375244140625, -0.5130691528320312, -0.4923858642578125, -0.47170257568359375, -0.451019287109375, -0.43033599853515625, -0.4096527099609375, -0.38896942138671875, -0.3682861328125, -0.34760284423828125, -0.3269195556640625, -0.30623626708984375, -0.285552978515625, -0.26486968994140625, -0.2441864013671875, -0.22350311279296875, -0.20281982421875, -0.18213653564453125, -0.1614532470703125, -0.14076995849609375, -0.120086669921875, -0.09940338134765625, -0.0787200927734375, -0.05803680419921875, -0.037353515625, -0.01667022705078125, 0.0040130615234375, 0.02469635009765625, 0.045379638671875, 0.06606292724609375, 0.0867462158203125, 0.10742950439453125, 0.12811279296875, 0.14879608154296875, 0.1694793701171875, 0.19016265869140625, 0.210845947265625, 0.23152923583984375, 0.2522125244140625, 0.27289581298828125, 0.2935791015625, 0.31426239013671875, 0.3349456787109375, 0.35562896728515625, 0.376312255859375, 0.39699554443359375, 0.4176788330078125, 0.43836212158203125, 0.45904541015625, 0.47972869873046875, 0.5004119873046875, 0.5210952758789062, 0.541778564453125, 0.5624618530273438, 0.5831451416015625, 0.6038284301757812, 0.62451171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 10.0, 12.0, 22.0, 21.0, 30.0, 18.0, 31.0, 32.0, 50.0, 59.0, 73.0, 64.0, 91.0, 77.0, 56.0, 49.0, 53.0, 43.0, 36.0, 34.0, 18.0, 28.0, 16.0, 10.0, 8.0, 10.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00010955333709716797, -0.00010618753731250763, -0.00010282173752784729, -9.945593774318695e-05, -9.609013795852661e-05, -9.272433817386627e-05, -8.935853838920593e-05, -8.59927386045456e-05, -8.262693881988525e-05, -7.926113903522491e-05, -7.589533925056458e-05, -7.252953946590424e-05, -6.91637396812439e-05, -6.579793989658356e-05, -6.243214011192322e-05, -5.906634032726288e-05, -5.570054054260254e-05, -5.23347407579422e-05, -4.896894097328186e-05, -4.560314118862152e-05, -4.223734140396118e-05, -3.887154161930084e-05, -3.55057418346405e-05, -3.2139942049980164e-05, -2.8774142265319824e-05, -2.5408342480659485e-05, -2.2042542695999146e-05, -1.8676742911338806e-05, -1.5310943126678467e-05, -1.1945143342018127e-05, -8.579343557357788e-06, -5.213543772697449e-06, -1.8477439880371094e-06, 1.51805579662323e-06, 4.883855581283569e-06, 8.249655365943909e-06, 1.1615455150604248e-05, 1.4981254935264587e-05, 1.8347054719924927e-05, 2.1712854504585266e-05, 2.5078654289245605e-05, 2.8444454073905945e-05, 3.1810253858566284e-05, 3.5176053643226624e-05, 3.854185342788696e-05, 4.19076532125473e-05, 4.527345299720764e-05, 4.863925278186798e-05, 5.200505256652832e-05, 5.537085235118866e-05, 5.8736652135849e-05, 6.210245192050934e-05, 6.546825170516968e-05, 6.883405148983002e-05, 7.219985127449036e-05, 7.55656510591507e-05, 7.893145084381104e-05, 8.229725062847137e-05, 8.566305041313171e-05, 8.902885019779205e-05, 9.239464998245239e-05, 9.576044976711273e-05, 9.912624955177307e-05, 0.00010249204933643341, 0.00010585784912109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 12.0, 11.0, 23.0, 27.0, 38.0, 66.0, 101.0, 198.0, 469.0, 868.0, 2195.0, 6202.0, 23060.0, 125368.0, 641037.0, 202753.0, 33088.0, 8077.0, 2746.0, 1093.0, 473.0, 289.0, 141.0, 76.0, 52.0, 29.0, 22.0, 6.0, 9.0, 5.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.93701171875, -0.91070556640625, -0.8843994140625, -0.85809326171875, -0.831787109375, -0.80548095703125, -0.7791748046875, -0.75286865234375, -0.7265625, -0.70025634765625, -0.6739501953125, -0.64764404296875, -0.621337890625, -0.59503173828125, -0.5687255859375, -0.54241943359375, -0.51611328125, -0.48980712890625, -0.4635009765625, -0.43719482421875, -0.410888671875, -0.38458251953125, -0.3582763671875, -0.33197021484375, -0.3056640625, -0.27935791015625, -0.2530517578125, -0.22674560546875, -0.200439453125, -0.17413330078125, -0.1478271484375, -0.12152099609375, -0.09521484375, -0.06890869140625, -0.0426025390625, -0.01629638671875, 0.010009765625, 0.03631591796875, 0.0626220703125, 0.08892822265625, 0.115234375, 0.14154052734375, 0.1678466796875, 0.19415283203125, 0.220458984375, 0.24676513671875, 0.2730712890625, 0.29937744140625, 0.32568359375, 0.35198974609375, 0.3782958984375, 0.40460205078125, 0.430908203125, 0.45721435546875, 0.4835205078125, 0.50982666015625, 0.5361328125, 0.56243896484375, 0.5887451171875, 0.61505126953125, 0.641357421875, 0.66766357421875, 0.6939697265625, 0.72027587890625, 0.74658203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 6.0, 8.0, 17.0, 21.0, 16.0, 20.0, 30.0, 31.0, 39.0, 41.0, 62.0, 69.0, 73.0, 90.0, 72.0, 84.0, 51.0, 45.0, 29.0, 33.0, 25.0, 24.0, 21.0, 14.0, 13.0, 11.0, 7.0, 10.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2736167907714844, -0.26427459716796875, -0.2549324035644531, -0.2455902099609375, -0.23624801635742188, -0.22690582275390625, -0.21756362915039062, -0.208221435546875, -0.19887924194335938, -0.18953704833984375, -0.18019485473632812, -0.1708526611328125, -0.16151046752929688, -0.15216827392578125, -0.14282608032226562, -0.13348388671875, -0.12414169311523438, -0.11479949951171875, -0.10545730590820312, -0.0961151123046875, -0.08677291870117188, -0.07743072509765625, -0.06808853149414062, -0.058746337890625, -0.049404144287109375, -0.04006195068359375, -0.030719757080078125, -0.0213775634765625, -0.012035369873046875, -0.00269317626953125, 0.006649017333984375, 0.0159912109375, 0.025333404541015625, 0.03467559814453125, 0.044017791748046875, 0.0533599853515625, 0.06270217895507812, 0.07204437255859375, 0.08138656616210938, 0.090728759765625, 0.10007095336914062, 0.10941314697265625, 0.11875534057617188, 0.1280975341796875, 0.13743972778320312, 0.14678192138671875, 0.15612411499023438, 0.16546630859375, 0.17480850219726562, 0.18415069580078125, 0.19349288940429688, 0.2028350830078125, 0.21217727661132812, 0.22151947021484375, 0.23086166381835938, 0.240203857421875, 0.24954605102539062, 0.25888824462890625, 0.2682304382324219, 0.2775726318359375, 0.2869148254394531, 0.29625701904296875, 0.3055992126464844, 0.31494140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 9.0, 11.0, 13.0, 32.0, 89.0, 228.0, 323.0, 152.0, 65.0, 26.0, 18.0, 16.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-21.855234146118164, -21.383920669555664, -20.912607192993164, -20.441293716430664, -19.969980239868164, -19.498666763305664, -19.027353286743164, -18.556041717529297, -18.084728240966797, -17.613414764404297, -17.142101287841797, -16.670787811279297, -16.199474334716797, -15.728160858154297, -15.256848335266113, -14.785534858703613, -14.314220428466797, -13.842906951904297, -13.371593475341797, -12.900279998779297, -12.428966522216797, -11.957653045654297, -11.486340522766113, -11.015027046203613, -10.543713569641113, -10.072400093078613, -9.601086616516113, -9.129773139953613, -8.65846061706543, -8.18714714050293, -7.71583366394043, -7.24452018737793, -6.77320671081543, -6.30189323425293, -5.83057975769043, -5.359266757965088, -4.887953281402588, -4.416639804840088, -3.945326566696167, -3.474013328552246, -3.002699851989746, -2.531386375427246, -2.060073137283325, -1.5887597799301147, -1.1174464225769043, -0.6461329460144043, -0.1748197078704834, 0.2964935302734375, 0.7678070068359375, 1.239120364189148, 1.7104337215423584, 2.1817469596862793, 2.6530604362487793, 3.1243739128112793, 3.5956871509552, 4.067000389099121, 4.538313865661621, 5.009627342224121, 5.480940818786621, 5.952253818511963, 6.423567295074463, 6.894880771636963, 7.366193771362305, 7.837507247924805, 8.308820724487305]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 13.0, 9.0, 8.0, 7.0, 18.0, 16.0, 15.0, 27.0, 33.0, 29.0, 41.0, 56.0, 53.0, 58.0, 59.0, 52.0, 54.0, 72.0, 50.0, 46.0, 43.0, 35.0, 52.0, 36.0, 19.0, 20.0, 16.0, 9.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.608564376831055, -9.237091064453125, -8.865617752075195, -8.494144439697266, -8.122671127319336, -7.751197814941406, -7.379724502563477, -7.008251190185547, -6.636777877807617, -6.2653045654296875, -5.893831253051758, -5.522357940673828, -5.150884628295898, -4.779411315917969, -4.407938003540039, -4.036464691162109, -3.664991855621338, -3.293518543243408, -2.9220452308654785, -2.550571918487549, -2.179098606109619, -1.807625412940979, -1.4361522197723389, -1.0646789073944092, -0.6932055950164795, -0.3217323124408722, 0.04974097013473511, 0.42121422290802, 0.7926875352859497, 1.1641608476638794, 1.5356340408325195, 1.9071073532104492, 2.278580665588379, 2.6500539779663086, 3.0215272903442383, 3.393000602722168, 3.7644739151000977, 4.135947227478027, 4.507420539855957, 4.878893852233887, 5.250367164611816, 5.621840476989746, 5.993313789367676, 6.3647871017456055, 6.736260414123535, 7.107733726501465, 7.4792070388793945, 7.850680351257324, 8.222152709960938, 8.593626022338867, 8.965099334716797, 9.336572647094727, 9.708045959472656, 10.079519271850586, 10.450992584228516, 10.822465896606445, 11.193939208984375, 11.565412521362305, 11.936885833740234, 12.308359146118164, 12.679832458496094, 13.051305770874023, 13.422779083251953, 13.794252395629883, 14.165725708007812]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 0.0, 13.0, 13.0, 11.0, 14.0, 24.0, 27.0, 37.0, 54.0, 72.0, 92.0, 121.0, 194.0, 284.0, 465.0, 790.0, 1464.0, 2821.0, 6058.0, 15701.0, 50843.0, 256292.0, 3226167.0, 518333.0, 76170.0, 21994.0, 8209.0, 3632.0, 1829.0, 937.0, 545.0, 339.0, 204.0, 138.0, 93.0, 86.0, 47.0, 42.0, 31.0, 32.0, 15.0, 13.0, 3.0, 7.0, 6.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 5.0], "bins": [-3.142578125, -3.0491943359375, -2.955810546875, -2.8624267578125, -2.76904296875, -2.6756591796875, -2.582275390625, -2.4888916015625, -2.3955078125, -2.3021240234375, -2.208740234375, -2.1153564453125, -2.02197265625, -1.9285888671875, -1.835205078125, -1.7418212890625, -1.6484375, -1.5550537109375, -1.461669921875, -1.3682861328125, -1.27490234375, -1.1815185546875, -1.088134765625, -0.9947509765625, -0.9013671875, -0.8079833984375, -0.714599609375, -0.6212158203125, -0.52783203125, -0.4344482421875, -0.341064453125, -0.2476806640625, -0.154296875, -0.0609130859375, 0.032470703125, 0.1258544921875, 0.21923828125, 0.3126220703125, 0.406005859375, 0.4993896484375, 0.5927734375, 0.6861572265625, 0.779541015625, 0.8729248046875, 0.96630859375, 1.0596923828125, 1.153076171875, 1.2464599609375, 1.33984375, 1.4332275390625, 1.526611328125, 1.6199951171875, 1.71337890625, 1.8067626953125, 1.900146484375, 1.9935302734375, 2.0869140625, 2.1802978515625, 2.273681640625, 2.3670654296875, 2.46044921875, 2.5538330078125, 2.647216796875, 2.7406005859375, 2.833984375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 6.0, 3.0, 6.0, 7.0, 8.0, 13.0, 18.0, 23.0, 23.0, 29.0, 34.0, 48.0, 51.0, 70.0, 70.0, 90.0, 66.0, 79.0, 72.0, 64.0, 42.0, 34.0, 23.0, 21.0, 17.0, 14.0, 11.0, 7.0, 15.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.22650146484375, -3.1287841796875, -3.03106689453125, -2.933349609375, -2.83563232421875, -2.7379150390625, -2.64019775390625, -2.54248046875, -2.44476318359375, -2.3470458984375, -2.24932861328125, -2.151611328125, -2.05389404296875, -1.9561767578125, -1.85845947265625, -1.7607421875, -1.66302490234375, -1.5653076171875, -1.46759033203125, -1.369873046875, -1.27215576171875, -1.1744384765625, -1.07672119140625, -0.97900390625, -0.88128662109375, -0.7835693359375, -0.68585205078125, -0.588134765625, -0.49041748046875, -0.3927001953125, -0.29498291015625, -0.197265625, -0.09954833984375, -0.0018310546875, 0.09588623046875, 0.193603515625, 0.29132080078125, 0.3890380859375, 0.48675537109375, 0.58447265625, 0.68218994140625, 0.7799072265625, 0.87762451171875, 0.975341796875, 1.07305908203125, 1.1707763671875, 1.26849365234375, 1.3662109375, 1.46392822265625, 1.5616455078125, 1.65936279296875, 1.757080078125, 1.85479736328125, 1.9525146484375, 2.05023193359375, 2.14794921875, 2.24566650390625, 2.3433837890625, 2.44110107421875, 2.538818359375, 2.63653564453125, 2.7342529296875, 2.83197021484375, 2.9296875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 14.0, 16.0, 16.0, 28.0, 44.0, 46.0, 71.0, 151.0, 419.0, 2683.0, 112885.0, 4062988.0, 13376.0, 1015.0, 237.0, 96.0, 49.0, 38.0, 20.0, 19.0, 16.0, 10.0, 12.0, 9.0, 0.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.140625, -15.7188720703125, -15.297119140625, -14.8753662109375, -14.45361328125, -14.0318603515625, -13.610107421875, -13.1883544921875, -12.7666015625, -12.3448486328125, -11.923095703125, -11.5013427734375, -11.07958984375, -10.6578369140625, -10.236083984375, -9.8143310546875, -9.392578125, -8.9708251953125, -8.549072265625, -8.1273193359375, -7.70556640625, -7.2838134765625, -6.862060546875, -6.4403076171875, -6.0185546875, -5.5968017578125, -5.175048828125, -4.7532958984375, -4.33154296875, -3.9097900390625, -3.488037109375, -3.0662841796875, -2.64453125, -2.2227783203125, -1.801025390625, -1.3792724609375, -0.95751953125, -0.5357666015625, -0.114013671875, 0.3077392578125, 0.7294921875, 1.1512451171875, 1.572998046875, 1.9947509765625, 2.41650390625, 2.8382568359375, 3.260009765625, 3.6817626953125, 4.103515625, 4.5252685546875, 4.947021484375, 5.3687744140625, 5.79052734375, 6.2122802734375, 6.634033203125, 7.0557861328125, 7.4775390625, 7.8992919921875, 8.321044921875, 8.7427978515625, 9.16455078125, 9.5863037109375, 10.008056640625, 10.4298095703125, 10.8515625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 10.0, 19.0, 16.0, 26.0, 26.0, 29.0, 42.0, 54.0, 83.0, 145.0, 221.0, 388.0, 1033.0, 960.0, 357.0, 166.0, 120.0, 88.0, 56.0, 51.0, 42.0, 35.0, 26.0, 16.0, 10.0, 11.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.7766876220703125, -0.746734619140625, -0.7167816162109375, -0.68682861328125, -0.6568756103515625, -0.626922607421875, -0.5969696044921875, -0.5670166015625, -0.5370635986328125, -0.507110595703125, -0.4771575927734375, -0.44720458984375, -0.4172515869140625, -0.387298583984375, -0.3573455810546875, -0.327392578125, -0.2974395751953125, -0.267486572265625, -0.2375335693359375, -0.20758056640625, -0.1776275634765625, -0.147674560546875, -0.1177215576171875, -0.0877685546875, -0.0578155517578125, -0.027862548828125, 0.0020904541015625, 0.03204345703125, 0.0619964599609375, 0.091949462890625, 0.1219024658203125, 0.15185546875, 0.1818084716796875, 0.211761474609375, 0.2417144775390625, 0.27166748046875, 0.3016204833984375, 0.331573486328125, 0.3615264892578125, 0.3914794921875, 0.4214324951171875, 0.451385498046875, 0.4813385009765625, 0.51129150390625, 0.5412445068359375, 0.571197509765625, 0.6011505126953125, 0.631103515625, 0.6610565185546875, 0.691009521484375, 0.7209625244140625, 0.75091552734375, 0.7808685302734375, 0.810821533203125, 0.8407745361328125, 0.8707275390625, 0.9006805419921875, 0.930633544921875, 0.9605865478515625, 0.99053955078125, 1.0204925537109375, 1.050445556640625, 1.0803985595703125, 1.1103515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 8.0, 3.0, 13.0, 18.0, 22.0, 42.0, 69.0, 109.0, 169.0, 189.0, 129.0, 77.0, 38.0, 29.0, 13.0, 14.0, 16.0, 5.0, 5.0, 2.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7632222175598145, -6.576618671417236, -6.390015602111816, -6.203412055969238, -6.016808986663818, -5.83020544052124, -5.64360237121582, -5.456998825073242, -5.270395278930664, -5.083791732788086, -4.897188663482666, -4.710585117340088, -4.523982048034668, -4.33737850189209, -4.150774955749512, -3.964171886444092, -3.777568817138672, -3.590965509414673, -3.404362201690674, -3.2177586555480957, -3.031155586242676, -2.8445520401000977, -2.6579487323760986, -2.4713454246520996, -2.2847421169281006, -2.0981388092041016, -1.9115355014801025, -1.724932074546814, -1.538328766822815, -1.351725459098816, -1.1651220321655273, -0.9785187244415283, -0.7919149398803711, -0.6053116321563721, -0.41870826482772827, -0.23210489749908447, -0.04550158977508545, 0.14110171794891357, 0.32770514488220215, 0.5143084526062012, 0.7009117603302002, 0.8875150680541992, 1.0741183757781982, 1.2607218027114868, 1.4473251104354858, 1.6339284181594849, 1.8205318450927734, 2.0071351528167725, 2.1937384605407715, 2.3803417682647705, 2.5669450759887695, 2.7535486221313477, 2.9401516914367676, 3.1267552375793457, 3.3133585453033447, 3.4999618530273438, 3.6865651607513428, 3.873168468475342, 4.05977201461792, 4.24637508392334, 4.432978630065918, 4.619581699371338, 4.806185245513916, 4.992788314819336, 5.179391860961914]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 6.0, 8.0, 9.0, 13.0, 18.0, 13.0, 22.0, 27.0, 43.0, 49.0, 39.0, 72.0, 81.0, 71.0, 77.0, 58.0, 49.0, 49.0, 48.0, 41.0, 36.0, 30.0, 31.0, 23.0, 10.0, 10.0, 18.0, 9.0, 11.0, 7.0, 7.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3075475692749023, -3.2033259868621826, -3.099104404449463, -2.994882583618164, -2.8906610012054443, -2.7864394187927246, -2.682217597961426, -2.577996015548706, -2.4737744331359863, -2.3695528507232666, -2.265331268310547, -2.161109447479248, -2.0568878650665283, -1.9526662826538086, -1.8484445810317993, -1.74422287940979, -1.6400012969970703, -1.5357797145843506, -1.4315580129623413, -1.327336311340332, -1.2231147289276123, -1.1188931465148926, -1.0146714448928833, -0.9104498028755188, -0.8062281608581543, -0.7020065188407898, -0.5977848768234253, -0.4935632348060608, -0.3893415927886963, -0.2851199507713318, -0.18089830875396729, -0.07667666673660278, 0.02754497528076172, 0.13176661729812622, 0.23598825931549072, 0.3402099013328552, 0.4444315433502197, 0.5486531853675842, 0.6528748273849487, 0.7570964694023132, 0.8613181114196777, 0.9655397534370422, 1.0697613954544067, 1.173983097076416, 1.2782046794891357, 1.3824262619018555, 1.4866479635238647, 1.590869665145874, 1.6950912475585938, 1.7993128299713135, 1.9035345315933228, 2.007756233215332, 2.1119778156280518, 2.2161993980407715, 2.3204212188720703, 2.42464280128479, 2.5288643836975098, 2.6330859661102295, 2.737307548522949, 2.841529369354248, 2.9457509517669678, 3.0499725341796875, 3.1541943550109863, 3.258415937423706, 3.362637519836426]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 10.0, 5.0, 12.0, 22.0, 30.0, 67.0, 72.0, 119.0, 224.0, 344.0, 599.0, 1027.0, 1916.0, 3609.0, 7745.0, 18994.0, 56204.0, 223316.0, 512242.0, 152209.0, 41749.0, 14936.0, 6325.0, 3022.0, 1560.0, 807.0, 497.0, 338.0, 183.0, 118.0, 74.0, 55.0, 39.0, 28.0, 12.0, 11.0, 12.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2264404296875, -0.22021484375, -0.2139892578125, -0.207763671875, -0.2015380859375, -0.1953125, -0.1890869140625, -0.182861328125, -0.1766357421875, -0.17041015625, -0.1641845703125, -0.157958984375, -0.1517333984375, -0.1455078125, -0.1392822265625, -0.133056640625, -0.1268310546875, -0.12060546875, -0.1143798828125, -0.108154296875, -0.1019287109375, -0.095703125, -0.0894775390625, -0.083251953125, -0.0770263671875, -0.07080078125, -0.0645751953125, -0.058349609375, -0.0521240234375, -0.0458984375, -0.0396728515625, -0.033447265625, -0.0272216796875, -0.02099609375, -0.0147705078125, -0.008544921875, -0.0023193359375, 0.00390625, 0.0101318359375, 0.016357421875, 0.0225830078125, 0.02880859375, 0.0350341796875, 0.041259765625, 0.0474853515625, 0.0537109375, 0.0599365234375, 0.066162109375, 0.0723876953125, 0.07861328125, 0.0848388671875, 0.091064453125, 0.0972900390625, 0.103515625, 0.1097412109375, 0.115966796875, 0.1221923828125, 0.12841796875, 0.1346435546875, 0.140869140625, 0.1470947265625, 0.1533203125, 0.1595458984375, 0.165771484375, 0.1719970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 7.0, 14.0, 20.0, 18.0, 27.0, 36.0, 53.0, 56.0, 78.0, 97.0, 91.0, 83.0, 86.0, 43.0, 62.0, 34.0, 43.0, 30.0, 22.0, 17.0, 12.0, 10.0, 12.0, 5.0, 10.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.970703125, -2.88323974609375, -2.7957763671875, -2.70831298828125, -2.620849609375, -2.53338623046875, -2.4459228515625, -2.35845947265625, -2.27099609375, -2.18353271484375, -2.0960693359375, -2.00860595703125, -1.921142578125, -1.83367919921875, -1.7462158203125, -1.65875244140625, -1.5712890625, -1.48382568359375, -1.3963623046875, -1.30889892578125, -1.221435546875, -1.13397216796875, -1.0465087890625, -0.95904541015625, -0.87158203125, -0.78411865234375, -0.6966552734375, -0.60919189453125, -0.521728515625, -0.43426513671875, -0.3468017578125, -0.25933837890625, -0.171875, -0.08441162109375, 0.0030517578125, 0.09051513671875, 0.177978515625, 0.26544189453125, 0.3529052734375, 0.44036865234375, 0.52783203125, 0.61529541015625, 0.7027587890625, 0.79022216796875, 0.877685546875, 0.96514892578125, 1.0526123046875, 1.14007568359375, 1.2275390625, 1.31500244140625, 1.4024658203125, 1.48992919921875, 1.577392578125, 1.66485595703125, 1.7523193359375, 1.83978271484375, 1.92724609375, 2.01470947265625, 2.1021728515625, 2.18963623046875, 2.277099609375, 2.36456298828125, 2.4520263671875, 2.53948974609375, 2.626953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 13.0, 10.0, 12.0, 14.0, 18.0, 19.0, 32.0, 46.0, 50.0, 69.0, 100.0, 149.0, 214.0, 319.0, 646.0, 1819.0, 12152.0, 148535.0, 749114.0, 120842.0, 10925.0, 1777.0, 578.0, 345.0, 239.0, 136.0, 99.0, 78.0, 43.0, 36.0, 24.0, 17.0, 13.0, 8.0, 15.0, 12.0, 13.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.372802734375, -0.362579345703125, -0.35235595703125, -0.342132568359375, -0.3319091796875, -0.321685791015625, -0.31146240234375, -0.301239013671875, -0.291015625, -0.280792236328125, -0.27056884765625, -0.260345458984375, -0.2501220703125, -0.239898681640625, -0.22967529296875, -0.219451904296875, -0.209228515625, -0.199005126953125, -0.18878173828125, -0.178558349609375, -0.1683349609375, -0.158111572265625, -0.14788818359375, -0.137664794921875, -0.12744140625, -0.117218017578125, -0.10699462890625, -0.096771240234375, -0.0865478515625, -0.076324462890625, -0.06610107421875, -0.055877685546875, -0.045654296875, -0.035430908203125, -0.02520751953125, -0.014984130859375, -0.0047607421875, 0.005462646484375, 0.01568603515625, 0.025909423828125, 0.0361328125, 0.046356201171875, 0.05657958984375, 0.066802978515625, 0.0770263671875, 0.087249755859375, 0.09747314453125, 0.107696533203125, 0.117919921875, 0.128143310546875, 0.13836669921875, 0.148590087890625, 0.1588134765625, 0.169036865234375, 0.17926025390625, 0.189483642578125, 0.19970703125, 0.209930419921875, 0.22015380859375, 0.230377197265625, 0.2406005859375, 0.250823974609375, 0.26104736328125, 0.271270751953125, 0.281494140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 12.0, 9.0, 12.0, 15.0, 19.0, 31.0, 12.0, 33.0, 28.0, 31.0, 40.0, 52.0, 36.0, 54.0, 48.0, 47.0, 53.0, 43.0, 58.0, 55.0, 42.0, 29.0, 39.0, 21.0, 26.0, 19.0, 15.0, 14.0, 16.0, 6.0, 11.0, 6.0, 6.0, 10.0, 7.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.642578125, -3.528839111328125, -3.41510009765625, -3.301361083984375, -3.1876220703125, -3.073883056640625, -2.96014404296875, -2.846405029296875, -2.732666015625, -2.618927001953125, -2.50518798828125, -2.391448974609375, -2.2777099609375, -2.163970947265625, -2.05023193359375, -1.936492919921875, -1.82275390625, -1.709014892578125, -1.59527587890625, -1.481536865234375, -1.3677978515625, -1.254058837890625, -1.14031982421875, -1.026580810546875, -0.912841796875, -0.799102783203125, -0.68536376953125, -0.571624755859375, -0.4578857421875, -0.344146728515625, -0.23040771484375, -0.116668701171875, -0.0029296875, 0.110809326171875, 0.22454833984375, 0.338287353515625, 0.4520263671875, 0.565765380859375, 0.67950439453125, 0.793243408203125, 0.906982421875, 1.020721435546875, 1.13446044921875, 1.248199462890625, 1.3619384765625, 1.475677490234375, 1.58941650390625, 1.703155517578125, 1.81689453125, 1.930633544921875, 2.04437255859375, 2.158111572265625, 2.2718505859375, 2.385589599609375, 2.49932861328125, 2.613067626953125, 2.726806640625, 2.840545654296875, 2.95428466796875, 3.068023681640625, 3.1817626953125, 3.295501708984375, 3.40924072265625, 3.522979736328125, 3.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 8.0, 16.0, 14.0, 20.0, 28.0, 38.0, 53.0, 65.0, 127.0, 181.0, 295.0, 561.0, 2550.0, 150593.0, 886650.0, 5545.0, 780.0, 355.0, 220.0, 125.0, 91.0, 73.0, 46.0, 30.0, 26.0, 14.0, 13.0, 4.0, 4.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.14575576782226562, -0.14148712158203125, -0.13721847534179688, -0.1329498291015625, -0.12868118286132812, -0.12441253662109375, -0.12014389038085938, -0.115875244140625, -0.11160659790039062, -0.10733795166015625, -0.10306930541992188, -0.0988006591796875, -0.09453201293945312, -0.09026336669921875, -0.08599472045898438, -0.08172607421875, -0.07745742797851562, -0.07318878173828125, -0.06892013549804688, -0.0646514892578125, -0.060382843017578125, -0.05611419677734375, -0.051845550537109375, -0.047576904296875, -0.043308258056640625, -0.03903961181640625, -0.034770965576171875, -0.0305023193359375, -0.026233673095703125, -0.02196502685546875, -0.017696380615234375, -0.013427734375, -0.009159088134765625, -0.00489044189453125, -0.000621795654296875, 0.0036468505859375, 0.007915496826171875, 0.01218414306640625, 0.016452789306640625, 0.020721435546875, 0.024990081787109375, 0.02925872802734375, 0.033527374267578125, 0.0377960205078125, 0.042064666748046875, 0.04633331298828125, 0.050601959228515625, 0.05487060546875, 0.059139251708984375, 0.06340789794921875, 0.06767654418945312, 0.0719451904296875, 0.07621383666992188, 0.08048248291015625, 0.08475112915039062, 0.089019775390625, 0.09328842163085938, 0.09755706787109375, 0.10182571411132812, 0.1060943603515625, 0.11036300659179688, 0.11463165283203125, 0.11890029907226562, 0.1231689453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 23.0, 45.0, 72.0, 136.0, 230.0, 221.0, 128.0, 63.0, 33.0, 14.0, 8.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.51750373840332e-05, -8.223205804824829e-05, -7.928907871246338e-05, -7.634609937667847e-05, -7.340312004089355e-05, -7.046014070510864e-05, -6.751716136932373e-05, -6.457418203353882e-05, -6.16312026977539e-05, -5.8688223361968994e-05, -5.574524402618408e-05, -5.280226469039917e-05, -4.985928535461426e-05, -4.6916306018829346e-05, -4.3973326683044434e-05, -4.103034734725952e-05, -3.808736801147461e-05, -3.51443886756897e-05, -3.2201409339904785e-05, -2.9258430004119873e-05, -2.631545066833496e-05, -2.337247133255005e-05, -2.0429491996765137e-05, -1.7486512660980225e-05, -1.4543533325195312e-05, -1.16005539894104e-05, -8.657574653625488e-06, -5.714595317840576e-06, -2.771615982055664e-06, 1.7136335372924805e-07, 3.11434268951416e-06, 6.057322025299072e-06, 9.000301361083984e-06, 1.1943280696868896e-05, 1.4886260032653809e-05, 1.782923936843872e-05, 2.0772218704223633e-05, 2.3715198040008545e-05, 2.6658177375793457e-05, 2.960115671157837e-05, 3.254413604736328e-05, 3.548711538314819e-05, 3.8430094718933105e-05, 4.137307405471802e-05, 4.431605339050293e-05, 4.725903272628784e-05, 5.0202012062072754e-05, 5.3144991397857666e-05, 5.608797073364258e-05, 5.903095006942749e-05, 6.19739294052124e-05, 6.491690874099731e-05, 6.785988807678223e-05, 7.080286741256714e-05, 7.374584674835205e-05, 7.668882608413696e-05, 7.963180541992188e-05, 8.257478475570679e-05, 8.55177640914917e-05, 8.846074342727661e-05, 9.140372276306152e-05, 9.434670209884644e-05, 9.728968143463135e-05, 0.00010023266077041626, 0.00010317564010620117]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 23.0, 22.0, 36.0, 56.0, 62.0, 117.0, 216.0, 413.0, 862.0, 2233.0, 7144.0, 37701.0, 810989.0, 165968.0, 15919.0, 3981.0, 1431.0, 589.0, 300.0, 158.0, 81.0, 65.0, 41.0, 29.0, 19.0, 14.0, 11.0, 6.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1207275390625, -0.11715221405029297, -0.11357688903808594, -0.1100015640258789, -0.10642623901367188, -0.10285091400146484, -0.09927558898925781, -0.09570026397705078, -0.09212493896484375, -0.08854961395263672, -0.08497428894042969, -0.08139896392822266, -0.07782363891601562, -0.0742483139038086, -0.07067298889160156, -0.06709766387939453, -0.0635223388671875, -0.05994701385498047, -0.05637168884277344, -0.052796363830566406, -0.049221038818359375, -0.045645713806152344, -0.04207038879394531, -0.03849506378173828, -0.03491973876953125, -0.03134441375732422, -0.027769088745117188, -0.024193763732910156, -0.020618438720703125, -0.017043113708496094, -0.013467788696289062, -0.009892463684082031, -0.006317138671875, -0.0027418136596679688, 0.0008335113525390625, 0.004408836364746094, 0.007984161376953125, 0.011559486389160156, 0.015134811401367188, 0.01871013641357422, 0.02228546142578125, 0.02586078643798828, 0.029436111450195312, 0.033011436462402344, 0.036586761474609375, 0.040162086486816406, 0.04373741149902344, 0.04731273651123047, 0.0508880615234375, 0.05446338653564453, 0.05803871154785156, 0.061614036560058594, 0.06518936157226562, 0.06876468658447266, 0.07234001159667969, 0.07591533660888672, 0.07949066162109375, 0.08306598663330078, 0.08664131164550781, 0.09021663665771484, 0.09379196166992188, 0.0973672866821289, 0.10094261169433594, 0.10451793670654297, 0.10809326171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 19.0, 7.0, 19.0, 20.0, 35.0, 49.0, 52.0, 105.0, 208.0, 145.0, 94.0, 44.0, 46.0, 20.0, 16.0, 9.0, 11.0, 12.0, 10.0, 10.0, 6.0, 3.0, 2.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01378631591796875, -0.013352632522583008, -0.012918949127197266, -0.012485265731811523, -0.012051582336425781, -0.011617898941040039, -0.011184215545654297, -0.010750532150268555, -0.010316848754882812, -0.00988316535949707, -0.009449481964111328, -0.009015798568725586, -0.008582115173339844, -0.008148431777954102, -0.007714748382568359, -0.007281064987182617, -0.006847381591796875, -0.006413698196411133, -0.005980014801025391, -0.0055463314056396484, -0.005112648010253906, -0.004678964614868164, -0.004245281219482422, -0.0038115978240966797, -0.0033779144287109375, -0.0029442310333251953, -0.002510547637939453, -0.002076864242553711, -0.0016431808471679688, -0.0012094974517822266, -0.0007758140563964844, -0.0003421306610107422, 9.1552734375e-05, 0.0005252361297607422, 0.0009589195251464844, 0.0013926029205322266, 0.0018262863159179688, 0.002259969711303711, 0.002693653106689453, 0.0031273365020751953, 0.0035610198974609375, 0.00399470329284668, 0.004428386688232422, 0.004862070083618164, 0.005295753479003906, 0.0057294368743896484, 0.006163120269775391, 0.006596803665161133, 0.007030487060546875, 0.007464170455932617, 0.00789785385131836, 0.008331537246704102, 0.008765220642089844, 0.009198904037475586, 0.009632587432861328, 0.01006627082824707, 0.010499954223632812, 0.010933637619018555, 0.011367321014404297, 0.011801004409790039, 0.012234687805175781, 0.012668371200561523, 0.013102054595947266, 0.013535737991333008, 0.01396942138671875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 1.0, 10.0, 12.0, 9.0, 23.0, 43.0, 91.0, 176.0, 277.0, 176.0, 74.0, 31.0, 19.0, 16.0, 14.0, 4.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6137871742248535, -6.432416915893555, -6.251047134399414, -6.069676876068115, -5.888306617736816, -5.706936836242676, -5.525566577911377, -5.344196319580078, -5.1628265380859375, -4.981456279754639, -4.800086498260498, -4.618716239929199, -4.437346458435059, -4.25597620010376, -4.074605941772461, -3.893235921859741, -3.7118659019470215, -3.5304958820343018, -3.349125862121582, -3.167755603790283, -2.9863855838775635, -2.8050155639648438, -2.623645305633545, -2.442275285720825, -2.2609052658081055, -2.0795352458953857, -1.8981651067733765, -1.7167949676513672, -1.5354249477386475, -1.3540549278259277, -1.1726847887039185, -0.9913146495819092, -0.8099441528320312, -0.6285740733146667, -0.44720399379730225, -0.26583391427993774, -0.08446383476257324, 0.09690624475479126, 0.27827632427215576, 0.45964646339416504, 0.6410164833068848, 0.8223865628242493, 1.0037566423416138, 1.185126781463623, 1.3664968013763428, 1.5478668212890625, 1.7292369604110718, 1.910607099533081, 2.091977119445801, 2.2733471393585205, 2.4547171592712402, 2.636087417602539, 2.817457437515259, 2.9988274574279785, 3.1801977157592773, 3.361567735671997, 3.542937755584717, 3.7243077754974365, 3.9056777954101562, 4.087048053741455, 4.268418312072754, 4.4497880935668945, 4.631158351898193, 4.812528610229492, 4.993898391723633]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 20.0, 21.0, 37.0, 42.0, 59.0, 64.0, 95.0, 79.0, 94.0, 60.0, 58.0, 59.0, 43.0, 41.0, 32.0, 34.0, 16.0, 12.0, 10.0, 13.0, 13.0, 8.0, 7.0, 8.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4626808166503906, -2.384437322616577, -2.3061938285827637, -2.22795033454895, -2.1497068405151367, -2.0714633464813232, -1.9932199716567993, -1.9149764776229858, -1.8367329835891724, -1.7584894895553589, -1.6802459955215454, -1.602002501487732, -1.523759126663208, -1.4455156326293945, -1.367272138595581, -1.2890286445617676, -1.210785150527954, -1.1325416564941406, -1.0542981624603271, -0.9760547280311584, -0.897811233997345, -0.8195677399635315, -0.7413243055343628, -0.6630808115005493, -0.5848373174667358, -0.5065938234329224, -0.4283503592014313, -0.3501068949699402, -0.2718634009361267, -0.19361990690231323, -0.11537644267082214, -0.037132978439331055, 0.04111051559448242, 0.1193539947271347, 0.197597473859787, 0.2758409380912781, 0.35408443212509155, 0.43232792615890503, 0.5105713605880737, 0.5888148546218872, 0.6670583486557007, 0.7453018426895142, 0.8235453367233276, 0.9017887711524963, 0.9800322651863098, 1.0582756996154785, 1.136519193649292, 1.2147626876831055, 1.293006181716919, 1.3712496757507324, 1.449493169784546, 1.5277366638183594, 1.6059801578521729, 1.6842236518859863, 1.7624670267105103, 1.8407105207443237, 1.9189540147781372, 1.9971975088119507, 2.0754408836364746, 2.153684377670288, 2.2319278717041016, 2.310171365737915, 2.3884148597717285, 2.466658353805542, 2.5449018478393555]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 12.0, 18.0, 37.0, 70.0, 144.0, 459.0, 1854.0, 13151.0, 307757.0, 697930.0, 23524.0, 2573.0, 584.0, 209.0, 89.0, 49.0, 33.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.479736328125, -5.29150390625, -5.103271484375, -4.9150390625, -4.726806640625, -4.53857421875, -4.350341796875, -4.162109375, -3.973876953125, -3.78564453125, -3.597412109375, -3.4091796875, -3.220947265625, -3.03271484375, -2.844482421875, -2.65625, -2.468017578125, -2.27978515625, -2.091552734375, -1.9033203125, -1.715087890625, -1.52685546875, -1.338623046875, -1.150390625, -0.962158203125, -0.77392578125, -0.585693359375, -0.3974609375, -0.209228515625, -0.02099609375, 0.167236328125, 0.35546875, 0.543701171875, 0.73193359375, 0.920166015625, 1.1083984375, 1.296630859375, 1.48486328125, 1.673095703125, 1.861328125, 2.049560546875, 2.23779296875, 2.426025390625, 2.6142578125, 2.802490234375, 2.99072265625, 3.178955078125, 3.3671875, 3.555419921875, 3.74365234375, 3.931884765625, 4.1201171875, 4.308349609375, 4.49658203125, 4.684814453125, 4.873046875, 5.061279296875, 5.24951171875, 5.437744140625, 5.6259765625, 5.814208984375, 6.00244140625, 6.190673828125, 6.37890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 6.0, 21.0, 21.0, 49.0, 77.0, 105.0, 145.0, 165.0, 119.0, 92.0, 64.0, 39.0, 33.0, 16.0, 17.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.23089599609375, -6.8953857421875, -6.55987548828125, -6.224365234375, -5.88885498046875, -5.5533447265625, -5.21783447265625, -4.88232421875, -4.54681396484375, -4.2113037109375, -3.87579345703125, -3.540283203125, -3.20477294921875, -2.8692626953125, -2.53375244140625, -2.1982421875, -1.86273193359375, -1.5272216796875, -1.19171142578125, -0.856201171875, -0.52069091796875, -0.1851806640625, 0.15032958984375, 0.48583984375, 0.82135009765625, 1.1568603515625, 1.49237060546875, 1.827880859375, 2.16339111328125, 2.4989013671875, 2.83441162109375, 3.169921875, 3.50543212890625, 3.8409423828125, 4.17645263671875, 4.511962890625, 4.84747314453125, 5.1829833984375, 5.51849365234375, 5.85400390625, 6.18951416015625, 6.5250244140625, 6.86053466796875, 7.196044921875, 7.53155517578125, 7.8670654296875, 8.20257568359375, 8.5380859375, 8.87359619140625, 9.2091064453125, 9.54461669921875, 9.880126953125, 10.21563720703125, 10.5511474609375, 10.88665771484375, 11.22216796875, 11.55767822265625, 11.8931884765625, 12.22869873046875, 12.564208984375, 12.89971923828125, 13.2352294921875, 13.57073974609375, 13.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 6.0, 6.0, 10.0, 19.0, 23.0, 25.0, 38.0, 60.0, 118.0, 160.0, 224.0, 427.0, 963.0, 2551.0, 9907.0, 84799.0, 812387.0, 119545.0, 12075.0, 2880.0, 1104.0, 483.0, 267.0, 135.0, 105.0, 65.0, 45.0, 44.0, 21.0, 15.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.11865234375, -3.0166015625, -2.91455078125, -2.8125, -2.71044921875, -2.6083984375, -2.50634765625, -2.404296875, -2.30224609375, -2.2001953125, -2.09814453125, -1.99609375, -1.89404296875, -1.7919921875, -1.68994140625, -1.587890625, -1.48583984375, -1.3837890625, -1.28173828125, -1.1796875, -1.07763671875, -0.9755859375, -0.87353515625, -0.771484375, -0.66943359375, -0.5673828125, -0.46533203125, -0.36328125, -0.26123046875, -0.1591796875, -0.05712890625, 0.044921875, 0.14697265625, 0.2490234375, 0.35107421875, 0.453125, 0.55517578125, 0.6572265625, 0.75927734375, 0.861328125, 0.96337890625, 1.0654296875, 1.16748046875, 1.26953125, 1.37158203125, 1.4736328125, 1.57568359375, 1.677734375, 1.77978515625, 1.8818359375, 1.98388671875, 2.0859375, 2.18798828125, 2.2900390625, 2.39208984375, 2.494140625, 2.59619140625, 2.6982421875, 2.80029296875, 2.90234375, 3.00439453125, 3.1064453125, 3.20849609375, 3.310546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 7.0, 10.0, 8.0, 15.0, 16.0, 23.0, 34.0, 27.0, 27.0, 40.0, 37.0, 44.0, 48.0, 41.0, 51.0, 53.0, 58.0, 45.0, 61.0, 43.0, 54.0, 33.0, 43.0, 26.0, 30.0, 26.0, 17.0, 16.0, 12.0, 21.0, 8.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.015625, -5.82794189453125, -5.6402587890625, -5.45257568359375, -5.264892578125, -5.07720947265625, -4.8895263671875, -4.70184326171875, -4.51416015625, -4.32647705078125, -4.1387939453125, -3.95111083984375, -3.763427734375, -3.57574462890625, -3.3880615234375, -3.20037841796875, -3.0126953125, -2.82501220703125, -2.6373291015625, -2.44964599609375, -2.261962890625, -2.07427978515625, -1.8865966796875, -1.69891357421875, -1.51123046875, -1.32354736328125, -1.1358642578125, -0.94818115234375, -0.760498046875, -0.57281494140625, -0.3851318359375, -0.19744873046875, -0.009765625, 0.17791748046875, 0.3656005859375, 0.55328369140625, 0.740966796875, 0.92864990234375, 1.1163330078125, 1.30401611328125, 1.49169921875, 1.67938232421875, 1.8670654296875, 2.05474853515625, 2.242431640625, 2.43011474609375, 2.6177978515625, 2.80548095703125, 2.9931640625, 3.18084716796875, 3.3685302734375, 3.55621337890625, 3.743896484375, 3.93157958984375, 4.1192626953125, 4.30694580078125, 4.49462890625, 4.68231201171875, 4.8699951171875, 5.05767822265625, 5.245361328125, 5.43304443359375, 5.6207275390625, 5.80841064453125, 5.99609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 16.0, 14.0, 30.0, 64.0, 92.0, 191.0, 361.0, 777.0, 1759.0, 4841.0, 17652.0, 128954.0, 753866.0, 115458.0, 16646.0, 4544.0, 1756.0, 714.0, 361.0, 217.0, 92.0, 59.0, 34.0, 17.0, 10.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.1641845703125, -1.127197265625, -1.0902099609375, -1.05322265625, -1.0162353515625, -0.979248046875, -0.9422607421875, -0.9052734375, -0.8682861328125, -0.831298828125, -0.7943115234375, -0.75732421875, -0.7203369140625, -0.683349609375, -0.6463623046875, -0.609375, -0.5723876953125, -0.535400390625, -0.4984130859375, -0.46142578125, -0.4244384765625, -0.387451171875, -0.3504638671875, -0.3134765625, -0.2764892578125, -0.239501953125, -0.2025146484375, -0.16552734375, -0.1285400390625, -0.091552734375, -0.0545654296875, -0.017578125, 0.0194091796875, 0.056396484375, 0.0933837890625, 0.13037109375, 0.1673583984375, 0.204345703125, 0.2413330078125, 0.2783203125, 0.3153076171875, 0.352294921875, 0.3892822265625, 0.42626953125, 0.4632568359375, 0.500244140625, 0.5372314453125, 0.57421875, 0.6112060546875, 0.648193359375, 0.6851806640625, 0.72216796875, 0.7591552734375, 0.796142578125, 0.8331298828125, 0.8701171875, 0.9071044921875, 0.944091796875, 0.9810791015625, 1.01806640625, 1.0550537109375, 1.092041015625, 1.1290283203125, 1.166015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 12.0, 20.0, 29.0, 20.0, 45.0, 43.0, 56.0, 74.0, 103.0, 124.0, 99.0, 74.0, 56.0, 51.0, 30.0, 34.0, 15.0, 23.0, 14.0, 7.0, 4.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018739700317382812, -0.0001826537773013115, -0.00017791055142879486, -0.00017316732555627823, -0.0001684240996837616, -0.00016368087381124496, -0.00015893764793872833, -0.0001541944220662117, -0.00014945119619369507, -0.00014470797032117844, -0.0001399647444486618, -0.00013522151857614517, -0.00013047829270362854, -0.0001257350668311119, -0.00012099184095859528, -0.00011624861508607864, -0.00011150538921356201, -0.00010676216334104538, -0.00010201893746852875, -9.727571159601212e-05, -9.253248572349548e-05, -8.778925985097885e-05, -8.304603397846222e-05, -7.830280810594559e-05, -7.355958223342896e-05, -6.881635636091232e-05, -6.407313048839569e-05, -5.932990461587906e-05, -5.458667874336243e-05, -4.9843452870845795e-05, -4.510022699832916e-05, -4.035700112581253e-05, -3.56137752532959e-05, -3.0870549380779266e-05, -2.6127323508262634e-05, -2.1384097635746002e-05, -1.664087176322937e-05, -1.1897645890712738e-05, -7.154420018196106e-06, -2.411194145679474e-06, 2.332031726837158e-06, 7.07525759935379e-06, 1.1818483471870422e-05, 1.6561709344387054e-05, 2.1304935216903687e-05, 2.604816108942032e-05, 3.079138696193695e-05, 3.553461283445358e-05, 4.0277838706970215e-05, 4.502106457948685e-05, 4.976429045200348e-05, 5.450751632452011e-05, 5.925074219703674e-05, 6.399396806955338e-05, 6.873719394207001e-05, 7.348041981458664e-05, 7.822364568710327e-05, 8.29668715596199e-05, 8.771009743213654e-05, 9.245332330465317e-05, 9.71965491771698e-05, 0.00010193977504968643, 0.00010668300092220306, 0.0001114262267947197, 0.00011616945266723633]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 10.0, 9.0, 7.0, 7.0, 13.0, 21.0, 28.0, 59.0, 100.0, 167.0, 290.0, 712.0, 1613.0, 4913.0, 21231.0, 207415.0, 739337.0, 58323.0, 9584.0, 2694.0, 1007.0, 448.0, 226.0, 134.0, 87.0, 42.0, 21.0, 19.0, 6.0, 8.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0755767822265625, -1.032989501953125, -0.9904022216796875, -0.94781494140625, -0.9052276611328125, -0.862640380859375, -0.8200531005859375, -0.7774658203125, -0.7348785400390625, -0.692291259765625, -0.6497039794921875, -0.60711669921875, -0.5645294189453125, -0.521942138671875, -0.4793548583984375, -0.436767578125, -0.3941802978515625, -0.351593017578125, -0.3090057373046875, -0.26641845703125, -0.2238311767578125, -0.181243896484375, -0.1386566162109375, -0.0960693359375, -0.0534820556640625, -0.010894775390625, 0.0316925048828125, 0.07427978515625, 0.1168670654296875, 0.159454345703125, 0.2020416259765625, 0.24462890625, 0.2872161865234375, 0.329803466796875, 0.3723907470703125, 0.41497802734375, 0.4575653076171875, 0.500152587890625, 0.5427398681640625, 0.5853271484375, 0.6279144287109375, 0.670501708984375, 0.7130889892578125, 0.75567626953125, 0.7982635498046875, 0.840850830078125, 0.8834381103515625, 0.926025390625, 0.9686126708984375, 1.011199951171875, 1.0537872314453125, 1.09637451171875, 1.1389617919921875, 1.181549072265625, 1.2241363525390625, 1.2667236328125, 1.3093109130859375, 1.351898193359375, 1.3944854736328125, 1.43707275390625, 1.4796600341796875, 1.522247314453125, 1.5648345947265625, 1.607421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 8.0, 11.0, 10.0, 11.0, 21.0, 33.0, 59.0, 82.0, 119.0, 209.0, 151.0, 84.0, 68.0, 44.0, 30.0, 18.0, 15.0, 6.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9174652099609375, -0.892547607421875, -0.8676300048828125, -0.84271240234375, -0.8177947998046875, -0.792877197265625, -0.7679595947265625, -0.7430419921875, -0.7181243896484375, -0.693206787109375, -0.6682891845703125, -0.64337158203125, -0.6184539794921875, -0.593536376953125, -0.5686187744140625, -0.543701171875, -0.5187835693359375, -0.493865966796875, -0.4689483642578125, -0.44403076171875, -0.4191131591796875, -0.394195556640625, -0.3692779541015625, -0.3443603515625, -0.3194427490234375, -0.294525146484375, -0.2696075439453125, -0.24468994140625, -0.2197723388671875, -0.194854736328125, -0.1699371337890625, -0.14501953125, -0.1201019287109375, -0.095184326171875, -0.0702667236328125, -0.04534912109375, -0.0204315185546875, 0.004486083984375, 0.0294036865234375, 0.0543212890625, 0.0792388916015625, 0.104156494140625, 0.1290740966796875, 0.15399169921875, 0.1789093017578125, 0.203826904296875, 0.2287445068359375, 0.253662109375, 0.2785797119140625, 0.303497314453125, 0.3284149169921875, 0.35333251953125, 0.3782501220703125, 0.403167724609375, 0.4280853271484375, 0.4530029296875, 0.4779205322265625, 0.502838134765625, 0.5277557373046875, 0.55267333984375, 0.5775909423828125, 0.602508544921875, 0.6274261474609375, 0.65234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 30.0, 107.0, 549.0, 230.0, 54.0, 10.0, 10.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.293861389160156, -33.2762336730957, -32.258602142333984, -31.24097442626953, -30.223346710205078, -29.205717086791992, -28.188087463378906, -27.170459747314453, -26.152830123901367, -25.13520050048828, -24.117572784423828, -23.099943161010742, -22.082313537597656, -21.064685821533203, -20.047056198120117, -19.02942657470703, -18.011798858642578, -16.994169235229492, -15.976541519165039, -14.958911895751953, -13.941283226013184, -12.923654556274414, -11.906024932861328, -10.888396263122559, -9.870767593383789, -8.85313892364502, -7.835509777069092, -6.817880630493164, -5.8002519607543945, -4.782623291015625, -3.7649941444396973, -2.7473649978637695, -1.7297325134277344, -0.7121036052703857, 0.3055253028869629, 1.3231542110443115, 2.34078311920166, 3.3584117889404297, 4.376040935516357, 5.393670082092285, 6.411298751831055, 7.428927421569824, 8.446556091308594, 9.46418571472168, 10.48181438446045, 11.499443054199219, 12.517072677612305, 13.534701347351074, 14.552330017089844, 15.569958686828613, 16.587587356567383, 17.60521697998047, 18.622844696044922, 19.640474319458008, 20.658103942871094, 21.675731658935547, 22.693361282348633, 23.71099090576172, 24.728618621826172, 25.746248245239258, 26.763877868652344, 27.781505584716797, 28.799135208129883, 29.81676483154297, 30.834392547607422]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 3.0, 15.0, 11.0, 6.0, 11.0, 16.0, 18.0, 18.0, 25.0, 35.0, 32.0, 41.0, 33.0, 51.0, 52.0, 49.0, 50.0, 59.0, 59.0, 48.0, 39.0, 38.0, 44.0, 44.0, 44.0, 31.0, 30.0, 22.0, 13.0, 17.0, 11.0, 7.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.323591232299805, -9.95914077758789, -9.594691276550293, -9.230240821838379, -8.865791320800781, -8.501340866088867, -8.136890411376953, -7.772440433502197, -7.407990455627441, -7.0435404777526855, -6.67909049987793, -6.314640045166016, -5.95019006729126, -5.585740089416504, -5.22128963470459, -4.856839656829834, -4.492389678955078, -4.127939701080322, -3.7634894847869873, -3.3990392684936523, -3.0345892906188965, -2.6701393127441406, -2.3056890964508057, -1.9412388801574707, -1.5767889022827148, -1.2123388051986694, -0.847888708114624, -0.4834386110305786, -0.1189885139465332, 0.2454615831375122, 0.6099116802215576, 0.9743618965148926, 1.338810920715332, 1.7032610177993774, 2.067711114883423, 2.432161331176758, 2.7966113090515137, 3.1610612869262695, 3.5255115032196045, 3.8899617195129395, 4.254411697387695, 4.618861675262451, 4.983311653137207, 5.347762107849121, 5.712212085723877, 6.076662063598633, 6.441112518310547, 6.805562496185303, 7.170012474060059, 7.5344624519348145, 7.89891242980957, 8.263362884521484, 8.627813339233398, 8.992262840270996, 9.35671329498291, 9.721162796020508, 10.085613250732422, 10.450063705444336, 10.814513206481934, 11.178963661193848, 11.543413162231445, 11.90786361694336, 12.272314071655273, 12.636764526367188, 13.001214027404785]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 12.0, 10.0, 8.0, 16.0, 17.0, 21.0, 23.0, 42.0, 45.0, 66.0, 103.0, 114.0, 194.0, 244.0, 399.0, 547.0, 915.0, 1478.0, 2654.0, 5221.0, 11230.0, 29163.0, 103390.0, 735645.0, 2985130.0, 231783.0, 51781.0, 17607.0, 7352.0, 3735.0, 1941.0, 1192.0, 664.0, 478.0, 307.0, 214.0, 133.0, 85.0, 96.0, 69.0, 40.0, 26.0, 18.0, 19.0, 15.0, 7.0, 7.0, 3.0, 7.0, 9.0, 2.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.87890625, -2.792327880859375, -2.70574951171875, -2.619171142578125, -2.5325927734375, -2.446014404296875, -2.35943603515625, -2.272857666015625, -2.186279296875, -2.099700927734375, -2.01312255859375, -1.926544189453125, -1.8399658203125, -1.753387451171875, -1.66680908203125, -1.580230712890625, -1.49365234375, -1.407073974609375, -1.32049560546875, -1.233917236328125, -1.1473388671875, -1.060760498046875, -0.97418212890625, -0.887603759765625, -0.801025390625, -0.714447021484375, -0.62786865234375, -0.541290283203125, -0.4547119140625, -0.368133544921875, -0.28155517578125, -0.194976806640625, -0.1083984375, -0.021820068359375, 0.06475830078125, 0.151336669921875, 0.2379150390625, 0.324493408203125, 0.41107177734375, 0.497650146484375, 0.584228515625, 0.670806884765625, 0.75738525390625, 0.843963623046875, 0.9305419921875, 1.017120361328125, 1.10369873046875, 1.190277099609375, 1.27685546875, 1.363433837890625, 1.45001220703125, 1.536590576171875, 1.6231689453125, 1.709747314453125, 1.79632568359375, 1.882904052734375, 1.969482421875, 2.056060791015625, 2.14263916015625, 2.229217529296875, 2.3157958984375, 2.402374267578125, 2.48895263671875, 2.575531005859375, 2.662109375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 14.0, 15.0, 23.0, 30.0, 36.0, 46.0, 68.0, 88.0, 68.0, 101.0, 76.0, 78.0, 58.0, 48.0, 52.0, 34.0, 21.0, 23.0, 25.0, 11.0, 9.0, 13.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.22894287109375, -3.1278076171875, -3.02667236328125, -2.925537109375, -2.82440185546875, -2.7232666015625, -2.62213134765625, -2.52099609375, -2.41986083984375, -2.3187255859375, -2.21759033203125, -2.116455078125, -2.01531982421875, -1.9141845703125, -1.81304931640625, -1.7119140625, -1.61077880859375, -1.5096435546875, -1.40850830078125, -1.307373046875, -1.20623779296875, -1.1051025390625, -1.00396728515625, -0.90283203125, -0.80169677734375, -0.7005615234375, -0.59942626953125, -0.498291015625, -0.39715576171875, -0.2960205078125, -0.19488525390625, -0.09375, 0.00738525390625, 0.1085205078125, 0.20965576171875, 0.310791015625, 0.41192626953125, 0.5130615234375, 0.61419677734375, 0.71533203125, 0.81646728515625, 0.9176025390625, 1.01873779296875, 1.119873046875, 1.22100830078125, 1.3221435546875, 1.42327880859375, 1.5244140625, 1.62554931640625, 1.7266845703125, 1.82781982421875, 1.928955078125, 2.03009033203125, 2.1312255859375, 2.23236083984375, 2.33349609375, 2.43463134765625, 2.5357666015625, 2.63690185546875, 2.738037109375, 2.83917236328125, 2.9403076171875, 3.04144287109375, 3.142578125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 4.0, 11.0, 15.0, 25.0, 31.0, 64.0, 96.0, 156.0, 256.0, 475.0, 1058.0, 2878.0, 11035.0, 73345.0, 3560204.0, 504258.0, 30568.0, 6167.0, 1925.0, 780.0, 378.0, 200.0, 106.0, 67.0, 39.0, 30.0, 29.0, 19.0, 10.0, 10.0, 6.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.16290283203125, -5.0054931640625, -4.84808349609375, -4.690673828125, -4.53326416015625, -4.3758544921875, -4.21844482421875, -4.06103515625, -3.90362548828125, -3.7462158203125, -3.58880615234375, -3.431396484375, -3.27398681640625, -3.1165771484375, -2.95916748046875, -2.8017578125, -2.64434814453125, -2.4869384765625, -2.32952880859375, -2.172119140625, -2.01470947265625, -1.8572998046875, -1.69989013671875, -1.54248046875, -1.38507080078125, -1.2276611328125, -1.07025146484375, -0.912841796875, -0.75543212890625, -0.5980224609375, -0.44061279296875, -0.283203125, -0.12579345703125, 0.0316162109375, 0.18902587890625, 0.346435546875, 0.50384521484375, 0.6612548828125, 0.81866455078125, 0.97607421875, 1.13348388671875, 1.2908935546875, 1.44830322265625, 1.605712890625, 1.76312255859375, 1.9205322265625, 2.07794189453125, 2.2353515625, 2.39276123046875, 2.5501708984375, 2.70758056640625, 2.864990234375, 3.02239990234375, 3.1798095703125, 3.33721923828125, 3.49462890625, 3.65203857421875, 3.8094482421875, 3.96685791015625, 4.124267578125, 4.28167724609375, 4.4390869140625, 4.59649658203125, 4.75390625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 10.0, 5.0, 9.0, 16.0, 15.0, 17.0, 28.0, 32.0, 44.0, 84.0, 117.0, 198.0, 312.0, 617.0, 1181.0, 548.0, 263.0, 159.0, 119.0, 79.0, 65.0, 31.0, 26.0, 27.0, 12.0, 12.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.7357025146484375, -0.706756591796875, -0.6778106689453125, -0.64886474609375, -0.6199188232421875, -0.590972900390625, -0.5620269775390625, -0.5330810546875, -0.5041351318359375, -0.475189208984375, -0.4462432861328125, -0.41729736328125, -0.3883514404296875, -0.359405517578125, -0.3304595947265625, -0.301513671875, -0.2725677490234375, -0.243621826171875, -0.2146759033203125, -0.18572998046875, -0.1567840576171875, -0.127838134765625, -0.0988922119140625, -0.0699462890625, -0.0410003662109375, -0.012054443359375, 0.0168914794921875, 0.04583740234375, 0.0747833251953125, 0.103729248046875, 0.1326751708984375, 0.16162109375, 0.1905670166015625, 0.219512939453125, 0.2484588623046875, 0.27740478515625, 0.3063507080078125, 0.335296630859375, 0.3642425537109375, 0.3931884765625, 0.4221343994140625, 0.451080322265625, 0.4800262451171875, 0.50897216796875, 0.5379180908203125, 0.566864013671875, 0.5958099365234375, 0.624755859375, 0.6537017822265625, 0.682647705078125, 0.7115936279296875, 0.74053955078125, 0.7694854736328125, 0.798431396484375, 0.8273773193359375, 0.8563232421875, 0.8852691650390625, 0.914215087890625, 0.9431610107421875, 0.97210693359375, 1.0010528564453125, 1.029998779296875, 1.0589447021484375, 1.087890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 12.0, 12.0, 14.0, 21.0, 44.0, 56.0, 142.0, 186.0, 199.0, 133.0, 62.0, 40.0, 17.0, 14.0, 13.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.484271049499512, -7.270178318023682, -7.056085586547852, -6.8419928550720215, -6.627900123596191, -6.413807392120361, -6.199714660644531, -5.985622406005859, -5.771529197692871, -5.557436466217041, -5.343343734741211, -5.129251003265381, -4.915158271789551, -4.701065540313721, -4.486972808837891, -4.272880554199219, -4.058787822723389, -3.8446950912475586, -3.6306023597717285, -3.4165096282958984, -3.2024168968200684, -2.9883241653442383, -2.7742316722869873, -2.5601389408111572, -2.346046209335327, -2.131953477859497, -1.917860746383667, -1.7037681341171265, -1.4896754026412964, -1.2755826711654663, -1.0614900588989258, -0.8473973274230957, -0.6333041191101074, -0.41921141743659973, -0.20511871576309204, 0.008973956108093262, 0.22306668758392334, 0.4371594190597534, 0.651252031326294, 0.865344762802124, 1.079437494277954, 1.2935302257537842, 1.5076229572296143, 1.7217155694961548, 1.9358083009719849, 2.1499009132385254, 2.3639936447143555, 2.5780863761901855, 2.7921791076660156, 3.0062718391418457, 3.220364570617676, 3.434457302093506, 3.648550033569336, 3.862642765045166, 4.076735496520996, 4.290827751159668, 4.504920959472656, 4.719013690948486, 4.933106422424316, 5.1471991539001465, 5.361291885375977, 5.575384616851807, 5.789477348327637, 6.003569602966309, 6.217662334442139]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 8.0, 6.0, 3.0, 10.0, 5.0, 8.0, 18.0, 16.0, 18.0, 29.0, 37.0, 52.0, 53.0, 57.0, 56.0, 65.0, 55.0, 55.0, 64.0, 53.0, 54.0, 40.0, 38.0, 39.0, 32.0, 29.0, 19.0, 21.0, 8.0, 13.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.8989529609680176, -2.805762767791748, -2.7125728130340576, -2.619382619857788, -2.5261926651000977, -2.433002471923828, -2.3398122787475586, -2.246622323989868, -2.1534323692321777, -2.060242176055908, -1.9670522212982178, -1.8738620281219482, -1.7806720733642578, -1.6874818801879883, -1.5942918062210083, -1.5011017322540283, -1.4079115390777588, -1.3147214651107788, -1.2215313911437988, -1.1283411979675293, -1.0351512432098389, -0.9419611096382141, -0.8487709760665894, -0.7555809020996094, -0.6623908281326294, -0.5692007541656494, -0.47601065039634705, -0.3828205466270447, -0.2896304726600647, -0.19644039869308472, -0.10325026512145996, -0.01006019115447998, 0.0831298828125, 0.17631997168064117, 0.26951006054878235, 0.3627001643180847, 0.4558902382850647, 0.5490803122520447, 0.6422704458236694, 0.7354605197906494, 0.8286505937576294, 0.9218406677246094, 1.0150307416915894, 1.1082208156585693, 1.2014110088348389, 1.2946009635925293, 1.3877911567687988, 1.4809812307357788, 1.5741713047027588, 1.6673613786697388, 1.7605514526367188, 1.8537416458129883, 1.9469316005706787, 2.0401217937469482, 2.1333117485046387, 2.226501941680908, 2.3196921348571777, 2.4128823280334473, 2.5060722827911377, 2.5992624759674072, 2.6924524307250977, 2.785642623901367, 2.8788328170776367, 2.972022771835327, 3.0652127265930176]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 9.0, 11.0, 6.0, 12.0, 17.0, 31.0, 44.0, 102.0, 161.0, 353.0, 875.0, 2413.0, 9329.0, 61747.0, 722566.0, 222563.0, 21441.0, 4416.0, 1375.0, 545.0, 236.0, 114.0, 57.0, 48.0, 26.0, 17.0, 9.0, 6.0, 10.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.409423828125, -0.39691925048828125, -0.3844146728515625, -0.37191009521484375, -0.359405517578125, -0.34690093994140625, -0.3343963623046875, -0.32189178466796875, -0.30938720703125, -0.29688262939453125, -0.2843780517578125, -0.27187347412109375, -0.259368896484375, -0.24686431884765625, -0.2343597412109375, -0.22185516357421875, -0.2093505859375, -0.19684600830078125, -0.1843414306640625, -0.17183685302734375, -0.159332275390625, -0.14682769775390625, -0.1343231201171875, -0.12181854248046875, -0.10931396484375, -0.09680938720703125, -0.0843048095703125, -0.07180023193359375, -0.059295654296875, -0.04679107666015625, -0.0342864990234375, -0.02178192138671875, -0.00927734375, 0.00322723388671875, 0.0157318115234375, 0.02823638916015625, 0.040740966796875, 0.05324554443359375, 0.0657501220703125, 0.07825469970703125, 0.09075927734375, 0.10326385498046875, 0.1157684326171875, 0.12827301025390625, 0.140777587890625, 0.15328216552734375, 0.1657867431640625, 0.17829132080078125, 0.1907958984375, 0.20330047607421875, 0.2158050537109375, 0.22830963134765625, 0.240814208984375, 0.25331878662109375, 0.2658233642578125, 0.27832794189453125, 0.29083251953125, 0.30333709716796875, 0.3158416748046875, 0.32834625244140625, 0.340850830078125, 0.35335540771484375, 0.3658599853515625, 0.37836456298828125, 0.390869140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 3.0, 9.0, 19.0, 14.0, 20.0, 29.0, 42.0, 61.0, 67.0, 90.0, 88.0, 95.0, 77.0, 75.0, 64.0, 53.0, 41.0, 31.0, 21.0, 20.0, 24.0, 9.0, 5.0, 10.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.4959716796875, -2.411865234375, -2.3277587890625, -2.24365234375, -2.1595458984375, -2.075439453125, -1.9913330078125, -1.9072265625, -1.8231201171875, -1.739013671875, -1.6549072265625, -1.57080078125, -1.4866943359375, -1.402587890625, -1.3184814453125, -1.234375, -1.1502685546875, -1.066162109375, -0.9820556640625, -0.89794921875, -0.8138427734375, -0.729736328125, -0.6456298828125, -0.5615234375, -0.4774169921875, -0.393310546875, -0.3092041015625, -0.22509765625, -0.1409912109375, -0.056884765625, 0.0272216796875, 0.111328125, 0.1954345703125, 0.279541015625, 0.3636474609375, 0.44775390625, 0.5318603515625, 0.615966796875, 0.7000732421875, 0.7841796875, 0.8682861328125, 0.952392578125, 1.0364990234375, 1.12060546875, 1.2047119140625, 1.288818359375, 1.3729248046875, 1.45703125, 1.5411376953125, 1.625244140625, 1.7093505859375, 1.79345703125, 1.8775634765625, 1.961669921875, 2.0457763671875, 2.1298828125, 2.2139892578125, 2.298095703125, 2.3822021484375, 2.46630859375, 2.5504150390625, 2.634521484375, 2.7186279296875, 2.802734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 4.0, 13.0, 13.0, 18.0, 30.0, 46.0, 50.0, 68.0, 84.0, 123.0, 175.0, 268.0, 433.0, 820.0, 2979.0, 28680.0, 493380.0, 489092.0, 27503.0, 2632.0, 779.0, 434.0, 299.0, 177.0, 123.0, 82.0, 59.0, 44.0, 40.0, 22.0, 12.0, 18.0, 7.0, 11.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3696479797363281, -0.35965728759765625, -0.3496665954589844, -0.3396759033203125, -0.3296852111816406, -0.31969451904296875, -0.3097038269042969, -0.299713134765625, -0.2897224426269531, -0.27973175048828125, -0.2697410583496094, -0.2597503662109375, -0.24975967407226562, -0.23976898193359375, -0.22977828979492188, -0.21978759765625, -0.20979690551757812, -0.19980621337890625, -0.18981552124023438, -0.1798248291015625, -0.16983413696289062, -0.15984344482421875, -0.14985275268554688, -0.139862060546875, -0.12987136840820312, -0.11988067626953125, -0.10988998413085938, -0.0998992919921875, -0.08990859985351562, -0.07991790771484375, -0.06992721557617188, -0.0599365234375, -0.049945831298828125, -0.03995513916015625, -0.029964447021484375, -0.0199737548828125, -0.009983062744140625, 7.62939453125e-06, 0.009998321533203125, 0.019989013671875, 0.029979705810546875, 0.03997039794921875, 0.049961090087890625, 0.0599517822265625, 0.06994247436523438, 0.07993316650390625, 0.08992385864257812, 0.09991455078125, 0.10990524291992188, 0.11989593505859375, 0.12988662719726562, 0.1398773193359375, 0.14986801147460938, 0.15985870361328125, 0.16984939575195312, 0.179840087890625, 0.18983078002929688, 0.19982147216796875, 0.20981216430664062, 0.2198028564453125, 0.22979354858398438, 0.23978424072265625, 0.24977493286132812, 0.259765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 9.0, 8.0, 9.0, 13.0, 23.0, 19.0, 24.0, 20.0, 24.0, 40.0, 52.0, 46.0, 41.0, 46.0, 51.0, 59.0, 61.0, 54.0, 49.0, 47.0, 45.0, 39.0, 37.0, 29.0, 24.0, 22.0, 28.0, 19.0, 11.0, 13.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.06640625, -3.959747314453125, -3.85308837890625, -3.746429443359375, -3.6397705078125, -3.533111572265625, -3.42645263671875, -3.319793701171875, -3.213134765625, -3.106475830078125, -2.99981689453125, -2.893157958984375, -2.7864990234375, -2.679840087890625, -2.57318115234375, -2.466522216796875, -2.35986328125, -2.253204345703125, -2.14654541015625, -2.039886474609375, -1.9332275390625, -1.826568603515625, -1.71990966796875, -1.613250732421875, -1.506591796875, -1.399932861328125, -1.29327392578125, -1.186614990234375, -1.0799560546875, -0.973297119140625, -0.86663818359375, -0.759979248046875, -0.6533203125, -0.546661376953125, -0.44000244140625, -0.333343505859375, -0.2266845703125, -0.120025634765625, -0.01336669921875, 0.093292236328125, 0.199951171875, 0.306610107421875, 0.41326904296875, 0.519927978515625, 0.6265869140625, 0.733245849609375, 0.83990478515625, 0.946563720703125, 1.05322265625, 1.159881591796875, 1.26654052734375, 1.373199462890625, 1.4798583984375, 1.586517333984375, 1.69317626953125, 1.799835205078125, 1.906494140625, 2.013153076171875, 2.11981201171875, 2.226470947265625, 2.3331298828125, 2.439788818359375, 2.54644775390625, 2.653106689453125, 2.759765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 5.0, 8.0, 18.0, 35.0, 37.0, 52.0, 87.0, 142.0, 247.0, 516.0, 1689.0, 87179.0, 953177.0, 3814.0, 687.0, 326.0, 183.0, 123.0, 67.0, 47.0, 42.0, 20.0, 16.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.150390625, -0.14599037170410156, -0.14159011840820312, -0.1371898651123047, -0.13278961181640625, -0.1283893585205078, -0.12398910522460938, -0.11958885192871094, -0.1151885986328125, -0.11078834533691406, -0.10638809204101562, -0.10198783874511719, -0.09758758544921875, -0.09318733215332031, -0.08878707885742188, -0.08438682556152344, -0.079986572265625, -0.07558631896972656, -0.07118606567382812, -0.06678581237792969, -0.06238555908203125, -0.05798530578613281, -0.053585052490234375, -0.04918479919433594, -0.0447845458984375, -0.04038429260253906, -0.035984039306640625, -0.03158378601074219, -0.02718353271484375, -0.022783279418945312, -0.018383026123046875, -0.013982772827148438, -0.00958251953125, -0.0051822662353515625, -0.000782012939453125, 0.0036182403564453125, 0.00801849365234375, 0.012418746948242188, 0.016819000244140625, 0.021219253540039062, 0.0256195068359375, 0.030019760131835938, 0.034420013427734375, 0.03882026672363281, 0.04322052001953125, 0.04762077331542969, 0.052021026611328125, 0.05642127990722656, 0.060821533203125, 0.06522178649902344, 0.06962203979492188, 0.07402229309082031, 0.07842254638671875, 0.08282279968261719, 0.08722305297851562, 0.09162330627441406, 0.0960235595703125, 0.10042381286621094, 0.10482406616210938, 0.10922431945800781, 0.11362457275390625, 0.11802482604980469, 0.12242507934570312, 0.12682533264160156, 0.1312255859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 16.0, 14.0, 28.0, 34.0, 67.0, 70.0, 117.0, 136.0, 141.0, 118.0, 72.0, 42.0, 28.0, 31.0, 16.0, 15.0, 14.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.678964614868164e-05, -4.569999873638153e-05, -4.461035132408142e-05, -4.352070391178131e-05, -4.24310564994812e-05, -4.134140908718109e-05, -4.025176167488098e-05, -3.916211426258087e-05, -3.807246685028076e-05, -3.698281943798065e-05, -3.589317202568054e-05, -3.480352461338043e-05, -3.371387720108032e-05, -3.262422978878021e-05, -3.15345823764801e-05, -3.0444934964179993e-05, -2.9355287551879883e-05, -2.8265640139579773e-05, -2.7175992727279663e-05, -2.6086345314979553e-05, -2.4996697902679443e-05, -2.3907050490379333e-05, -2.2817403078079224e-05, -2.1727755665779114e-05, -2.0638108253479004e-05, -1.9548460841178894e-05, -1.8458813428878784e-05, -1.7369166016578674e-05, -1.6279518604278564e-05, -1.5189871191978455e-05, -1.4100223779678345e-05, -1.3010576367378235e-05, -1.1920928955078125e-05, -1.0831281542778015e-05, -9.741634130477905e-06, -8.651986718177795e-06, -7.5623393058776855e-06, -6.472691893577576e-06, -5.383044481277466e-06, -4.293397068977356e-06, -3.203749656677246e-06, -2.1141022443771362e-06, -1.0244548320770264e-06, 6.51925802230835e-08, 1.1548399925231934e-06, 2.2444874048233032e-06, 3.334134817123413e-06, 4.423782229423523e-06, 5.513429641723633e-06, 6.603077054023743e-06, 7.692724466323853e-06, 8.782371878623962e-06, 9.872019290924072e-06, 1.0961666703224182e-05, 1.2051314115524292e-05, 1.3140961527824402e-05, 1.4230608940124512e-05, 1.532025635242462e-05, 1.640990376472473e-05, 1.749955117702484e-05, 1.858919858932495e-05, 1.967884600162506e-05, 2.076849341392517e-05, 2.185814082622528e-05, 2.294778823852539e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 14.0, 17.0, 35.0, 48.0, 66.0, 77.0, 169.0, 277.0, 490.0, 1014.0, 2282.0, 7613.0, 46165.0, 850298.0, 121122.0, 12801.0, 3313.0, 1271.0, 607.0, 322.0, 185.0, 131.0, 79.0, 43.0, 31.0, 22.0, 12.0, 5.0, 7.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0859375, -0.08245468139648438, -0.07897186279296875, -0.07548904418945312, -0.0720062255859375, -0.06852340698242188, -0.06504058837890625, -0.061557769775390625, -0.058074951171875, -0.054592132568359375, -0.05110931396484375, -0.047626495361328125, -0.0441436767578125, -0.040660858154296875, -0.03717803955078125, -0.033695220947265625, -0.03021240234375, -0.026729583740234375, -0.02324676513671875, -0.019763946533203125, -0.0162811279296875, -0.012798309326171875, -0.00931549072265625, -0.005832672119140625, -0.002349853515625, 0.001132965087890625, 0.00461578369140625, 0.008098602294921875, 0.0115814208984375, 0.015064239501953125, 0.01854705810546875, 0.022029876708984375, 0.0255126953125, 0.028995513916015625, 0.03247833251953125, 0.035961151123046875, 0.0394439697265625, 0.042926788330078125, 0.04640960693359375, 0.049892425537109375, 0.053375244140625, 0.056858062744140625, 0.06034088134765625, 0.06382369995117188, 0.0673065185546875, 0.07078933715820312, 0.07427215576171875, 0.07775497436523438, 0.08123779296875, 0.08472061157226562, 0.08820343017578125, 0.09168624877929688, 0.0951690673828125, 0.09865188598632812, 0.10213470458984375, 0.10561752319335938, 0.109100341796875, 0.11258316040039062, 0.11606597900390625, 0.11954879760742188, 0.1230316162109375, 0.12651443481445312, 0.12999725341796875, 0.13348007202148438, 0.136962890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 13.0, 20.0, 19.0, 49.0, 110.0, 286.0, 276.0, 90.0, 53.0, 19.0, 20.0, 7.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.029449462890625, -0.028630495071411133, -0.027811527252197266, -0.0269925594329834, -0.02617359161376953, -0.025354623794555664, -0.024535655975341797, -0.02371668815612793, -0.022897720336914062, -0.022078752517700195, -0.021259784698486328, -0.02044081687927246, -0.019621849060058594, -0.018802881240844727, -0.01798391342163086, -0.017164945602416992, -0.016345977783203125, -0.015527009963989258, -0.01470804214477539, -0.013889074325561523, -0.013070106506347656, -0.012251138687133789, -0.011432170867919922, -0.010613203048706055, -0.009794235229492188, -0.00897526741027832, -0.008156299591064453, -0.007337331771850586, -0.006518363952636719, -0.0056993961334228516, -0.004880428314208984, -0.004061460494995117, -0.00324249267578125, -0.002423524856567383, -0.0016045570373535156, -0.0007855892181396484, 3.337860107421875e-05, 0.0008523464202880859, 0.0016713142395019531, 0.0024902820587158203, 0.0033092498779296875, 0.004128217697143555, 0.004947185516357422, 0.005766153335571289, 0.006585121154785156, 0.0074040889739990234, 0.00822305679321289, 0.009042024612426758, 0.009860992431640625, 0.010679960250854492, 0.01149892807006836, 0.012317895889282227, 0.013136863708496094, 0.013955831527709961, 0.014774799346923828, 0.015593767166137695, 0.016412734985351562, 0.01723170280456543, 0.018050670623779297, 0.018869638442993164, 0.01968860626220703, 0.0205075740814209, 0.021326541900634766, 0.022145509719848633, 0.0229644775390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 11.0, 23.0, 30.0, 66.0, 228.0, 373.0, 157.0, 48.0, 24.0, 15.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.047561645507812, -7.79892110824585, -7.5502800941467285, -7.301639556884766, -7.052999019622803, -6.804358005523682, -6.555717468261719, -6.307076454162598, -6.058435916900635, -5.809795379638672, -5.561154365539551, -5.312513828277588, -5.063873291015625, -4.815232276916504, -4.566591739654541, -4.317951202392578, -4.069310188293457, -3.820669412612915, -3.572028875350952, -3.32338809967041, -3.074747323989868, -2.826106548309326, -2.5774660110473633, -2.3288252353668213, -2.0801849365234375, -1.831544280052185, -1.582903504371643, -1.3342628479003906, -1.0856220722198486, -0.8369814157485962, -0.5883407592773438, -0.33969998359680176, -0.09105920791625977, 0.15758149325847626, 0.4062221944332123, 0.6548628807067871, 0.9035035967826843, 1.1521443128585815, 1.400784969329834, 1.649425745010376, 1.8980664014816284, 2.146707057952881, 2.395347833633423, 2.643988609313965, 2.8926291465759277, 3.1412699222564697, 3.3899106979370117, 3.6385512351989746, 3.8871920108795166, 4.135832786560059, 4.3844733238220215, 4.633113861083984, 4.8817548751831055, 5.130395412445068, 5.379035949707031, 5.627676963806152, 5.876317501068115, 6.124958038330078, 6.373599052429199, 6.622239589691162, 6.870880126953125, 7.119521141052246, 7.368161678314209, 7.616802215576172, 7.865443229675293]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 5.0, 0.0, 4.0, 12.0, 9.0, 3.0, 12.0, 18.0, 18.0, 26.0, 39.0, 53.0, 71.0, 69.0, 67.0, 80.0, 76.0, 73.0, 62.0, 69.0, 45.0, 32.0, 34.0, 27.0, 24.0, 21.0, 10.0, 10.0, 8.0, 5.0, 3.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.060120105743408, -1.9872314929962158, -1.9143428802490234, -1.8414543867111206, -1.7685657739639282, -1.6956771612167358, -1.622788667678833, -1.5499000549316406, -1.4770114421844482, -1.4041228294372559, -1.3312342166900635, -1.2583457231521606, -1.1854571104049683, -1.1125684976577759, -1.039680004119873, -0.9667913913726807, -0.8939027786254883, -0.8210141658782959, -0.7481256127357483, -0.6752370595932007, -0.6023484468460083, -0.5294598340988159, -0.4565712809562683, -0.3836827278137207, -0.3107941150665283, -0.23790553212165833, -0.16501694917678833, -0.09212836623191833, -0.01923978328704834, 0.053648799657821655, 0.12653738260269165, 0.19942593574523926, 0.27231478691101074, 0.34520336985588074, 0.41809195280075073, 0.4909805357456207, 0.5638691186904907, 0.6367577314376831, 0.7096462845802307, 0.7825348377227783, 0.8554234504699707, 0.9283120632171631, 1.0012006759643555, 1.0740891695022583, 1.1469777822494507, 1.219866394996643, 1.292754888534546, 1.3656435012817383, 1.4385321140289307, 1.511420726776123, 1.5843093395233154, 1.6571978330612183, 1.7300864458084106, 1.802975058555603, 1.8758635520935059, 1.9487521648406982, 2.0216407775878906, 2.094529390335083, 2.1674180030822754, 2.2403066158294678, 2.31319522857666, 2.3860836029052734, 2.458972215652466, 2.531860828399658, 2.6047494411468506]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 1.0, 6.0, 11.0, 27.0, 31.0, 55.0, 71.0, 134.0, 215.0, 399.0, 709.0, 1383.0, 2722.0, 6023.0, 13690.0, 36389.0, 118872.0, 425953.0, 312318.0, 82178.0, 26874.0, 10984.0, 4731.0, 2283.0, 1138.0, 569.0, 302.0, 185.0, 114.0, 71.0, 51.0, 19.0, 13.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3037109375, -1.2585296630859375, -1.213348388671875, -1.1681671142578125, -1.12298583984375, -1.0778045654296875, -1.032623291015625, -0.9874420166015625, -0.9422607421875, -0.8970794677734375, -0.851898193359375, -0.8067169189453125, -0.76153564453125, -0.7163543701171875, -0.671173095703125, -0.6259918212890625, -0.580810546875, -0.5356292724609375, -0.490447998046875, -0.4452667236328125, -0.40008544921875, -0.3549041748046875, -0.309722900390625, -0.2645416259765625, -0.2193603515625, -0.1741790771484375, -0.128997802734375, -0.0838165283203125, -0.03863525390625, 0.0065460205078125, 0.051727294921875, 0.0969085693359375, 0.14208984375, 0.1872711181640625, 0.232452392578125, 0.2776336669921875, 0.32281494140625, 0.3679962158203125, 0.413177490234375, 0.4583587646484375, 0.5035400390625, 0.5487213134765625, 0.593902587890625, 0.6390838623046875, 0.68426513671875, 0.7294464111328125, 0.774627685546875, 0.8198089599609375, 0.864990234375, 0.9101715087890625, 0.955352783203125, 1.0005340576171875, 1.04571533203125, 1.0908966064453125, 1.136077880859375, 1.1812591552734375, 1.2264404296875, 1.2716217041015625, 1.316802978515625, 1.3619842529296875, 1.40716552734375, 1.4523468017578125, 1.497528076171875, 1.5427093505859375, 1.587890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 10.0, 10.0, 13.0, 16.0, 18.0, 29.0, 34.0, 58.0, 58.0, 66.0, 85.0, 75.0, 80.0, 67.0, 84.0, 58.0, 38.0, 33.0, 31.0, 27.0, 17.0, 14.0, 9.0, 13.0, 10.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71875, -5.53564453125, -5.3525390625, -5.16943359375, -4.986328125, -4.80322265625, -4.6201171875, -4.43701171875, -4.25390625, -4.07080078125, -3.8876953125, -3.70458984375, -3.521484375, -3.33837890625, -3.1552734375, -2.97216796875, -2.7890625, -2.60595703125, -2.4228515625, -2.23974609375, -2.056640625, -1.87353515625, -1.6904296875, -1.50732421875, -1.32421875, -1.14111328125, -0.9580078125, -0.77490234375, -0.591796875, -0.40869140625, -0.2255859375, -0.04248046875, 0.140625, 0.32373046875, 0.5068359375, 0.68994140625, 0.873046875, 1.05615234375, 1.2392578125, 1.42236328125, 1.60546875, 1.78857421875, 1.9716796875, 2.15478515625, 2.337890625, 2.52099609375, 2.7041015625, 2.88720703125, 3.0703125, 3.25341796875, 3.4365234375, 3.61962890625, 3.802734375, 3.98583984375, 4.1689453125, 4.35205078125, 4.53515625, 4.71826171875, 4.9013671875, 5.08447265625, 5.267578125, 5.45068359375, 5.6337890625, 5.81689453125, 6.0]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 11.0, 12.0, 20.0, 21.0, 28.0, 37.0, 47.0, 55.0, 78.0, 82.0, 154.0, 208.0, 308.0, 502.0, 1030.0, 2068.0, 5735.0, 20496.0, 113124.0, 603311.0, 249694.0, 36644.0, 8915.0, 3003.0, 1226.0, 564.0, 357.0, 226.0, 155.0, 98.0, 92.0, 48.0, 53.0, 30.0, 18.0, 22.0, 18.0, 17.0, 5.0, 5.0, 7.0, 1.0, 7.0, 0.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5909881591796875, -1.542327880859375, -1.4936676025390625, -1.44500732421875, -1.3963470458984375, -1.347686767578125, -1.2990264892578125, -1.2503662109375, -1.2017059326171875, -1.153045654296875, -1.1043853759765625, -1.05572509765625, -1.0070648193359375, -0.958404541015625, -0.9097442626953125, -0.861083984375, -0.8124237060546875, -0.763763427734375, -0.7151031494140625, -0.66644287109375, -0.6177825927734375, -0.569122314453125, -0.5204620361328125, -0.4718017578125, -0.4231414794921875, -0.374481201171875, -0.3258209228515625, -0.27716064453125, -0.2285003662109375, -0.179840087890625, -0.1311798095703125, -0.08251953125, -0.0338592529296875, 0.014801025390625, 0.0634613037109375, 0.11212158203125, 0.1607818603515625, 0.209442138671875, 0.2581024169921875, 0.3067626953125, 0.3554229736328125, 0.404083251953125, 0.4527435302734375, 0.50140380859375, 0.5500640869140625, 0.598724365234375, 0.6473846435546875, 0.696044921875, 0.7447052001953125, 0.793365478515625, 0.8420257568359375, 0.89068603515625, 0.9393463134765625, 0.988006591796875, 1.0366668701171875, 1.0853271484375, 1.1339874267578125, 1.182647705078125, 1.2313079833984375, 1.27996826171875, 1.3286285400390625, 1.377288818359375, 1.4259490966796875, 1.474609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 9.0, 7.0, 15.0, 9.0, 18.0, 16.0, 25.0, 31.0, 23.0, 29.0, 42.0, 43.0, 49.0, 52.0, 48.0, 45.0, 40.0, 49.0, 33.0, 56.0, 47.0, 42.0, 46.0, 34.0, 33.0, 28.0, 23.0, 23.0, 15.0, 12.0, 15.0, 13.0, 6.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.11456298828125, -4.9361572265625, -4.75775146484375, -4.579345703125, -4.40093994140625, -4.2225341796875, -4.04412841796875, -3.86572265625, -3.68731689453125, -3.5089111328125, -3.33050537109375, -3.152099609375, -2.97369384765625, -2.7952880859375, -2.61688232421875, -2.4384765625, -2.26007080078125, -2.0816650390625, -1.90325927734375, -1.724853515625, -1.54644775390625, -1.3680419921875, -1.18963623046875, -1.01123046875, -0.83282470703125, -0.6544189453125, -0.47601318359375, -0.297607421875, -0.11920166015625, 0.0592041015625, 0.23760986328125, 0.416015625, 0.59442138671875, 0.7728271484375, 0.95123291015625, 1.129638671875, 1.30804443359375, 1.4864501953125, 1.66485595703125, 1.84326171875, 2.02166748046875, 2.2000732421875, 2.37847900390625, 2.556884765625, 2.73529052734375, 2.9136962890625, 3.09210205078125, 3.2705078125, 3.44891357421875, 3.6273193359375, 3.80572509765625, 3.984130859375, 4.16253662109375, 4.3409423828125, 4.51934814453125, 4.69775390625, 4.87615966796875, 5.0545654296875, 5.23297119140625, 5.411376953125, 5.58978271484375, 5.7681884765625, 5.94659423828125, 6.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 6.0, 17.0, 17.0, 28.0, 48.0, 41.0, 71.0, 107.0, 164.0, 269.0, 505.0, 919.0, 2264.0, 6247.0, 24826.0, 180762.0, 696967.0, 109501.0, 17383.0, 4706.0, 1777.0, 822.0, 412.0, 255.0, 141.0, 83.0, 65.0, 46.0, 29.0, 18.0, 15.0, 7.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8056640625, -0.7815322875976562, -0.7574005126953125, -0.7332687377929688, -0.709136962890625, -0.6850051879882812, -0.6608734130859375, -0.6367416381835938, -0.61260986328125, -0.5884780883789062, -0.5643463134765625, -0.5402145385742188, -0.516082763671875, -0.49195098876953125, -0.4678192138671875, -0.44368743896484375, -0.4195556640625, -0.39542388916015625, -0.3712921142578125, -0.34716033935546875, -0.323028564453125, -0.29889678955078125, -0.2747650146484375, -0.25063323974609375, -0.22650146484375, -0.20236968994140625, -0.1782379150390625, -0.15410614013671875, -0.129974365234375, -0.10584259033203125, -0.0817108154296875, -0.05757904052734375, -0.033447265625, -0.00931549072265625, 0.0148162841796875, 0.03894805908203125, 0.063079833984375, 0.08721160888671875, 0.1113433837890625, 0.13547515869140625, 0.15960693359375, 0.18373870849609375, 0.2078704833984375, 0.23200225830078125, 0.256134033203125, 0.28026580810546875, 0.3043975830078125, 0.32852935791015625, 0.3526611328125, 0.37679290771484375, 0.4009246826171875, 0.42505645751953125, 0.449188232421875, 0.47332000732421875, 0.4974517822265625, 0.5215835571289062, 0.54571533203125, 0.5698471069335938, 0.5939788818359375, 0.6181106567382812, 0.642242431640625, 0.6663742065429688, 0.6905059814453125, 0.7146377563476562, 0.73876953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 8.0, 5.0, 13.0, 19.0, 15.0, 27.0, 43.0, 54.0, 67.0, 96.0, 102.0, 131.0, 124.0, 74.0, 57.0, 53.0, 30.0, 27.0, 17.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014638900756835938, -0.00014213472604751587, -0.00013788044452667236, -0.00013362616300582886, -0.00012937188148498535, -0.00012511759996414185, -0.00012086331844329834, -0.00011660903692245483, -0.00011235475540161133, -0.00010810047388076782, -0.00010384619235992432, -9.959191083908081e-05, -9.53376293182373e-05, -9.10833477973938e-05, -8.682906627655029e-05, -8.257478475570679e-05, -7.832050323486328e-05, -7.406622171401978e-05, -6.981194019317627e-05, -6.555765867233276e-05, -6.130337715148926e-05, -5.704909563064575e-05, -5.2794814109802246e-05, -4.854053258895874e-05, -4.4286251068115234e-05, -4.003196954727173e-05, -3.577768802642822e-05, -3.152340650558472e-05, -2.726912498474121e-05, -2.3014843463897705e-05, -1.87605619430542e-05, -1.4506280422210693e-05, -1.0251998901367188e-05, -5.997717380523682e-06, -1.7434358596801758e-06, 2.51084566116333e-06, 6.765127182006836e-06, 1.1019408702850342e-05, 1.5273690223693848e-05, 1.9527971744537354e-05, 2.378225326538086e-05, 2.8036534786224365e-05, 3.229081630706787e-05, 3.654509782791138e-05, 4.079937934875488e-05, 4.505366086959839e-05, 4.9307942390441895e-05, 5.35622239112854e-05, 5.7816505432128906e-05, 6.207078695297241e-05, 6.632506847381592e-05, 7.057934999465942e-05, 7.483363151550293e-05, 7.908791303634644e-05, 8.334219455718994e-05, 8.759647607803345e-05, 9.185075759887695e-05, 9.610503911972046e-05, 0.00010035932064056396, 0.00010461360216140747, 0.00010886788368225098, 0.00011312216520309448, 0.00011737644672393799, 0.0001216307282447815, 0.000125885009765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 9.0, 12.0, 19.0, 26.0, 44.0, 75.0, 129.0, 255.0, 455.0, 943.0, 2384.0, 7767.0, 35658.0, 320097.0, 605472.0, 58612.0, 11029.0, 3162.0, 1203.0, 506.0, 298.0, 161.0, 91.0, 44.0, 34.0, 21.0, 16.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9142990112304688, -0.8867034912109375, -0.8591079711914062, -0.831512451171875, -0.8039169311523438, -0.7763214111328125, -0.7487258911132812, -0.72113037109375, -0.6935348510742188, -0.6659393310546875, -0.6383438110351562, -0.610748291015625, -0.5831527709960938, -0.5555572509765625, -0.5279617309570312, -0.5003662109375, -0.47277069091796875, -0.4451751708984375, -0.41757965087890625, -0.389984130859375, -0.36238861083984375, -0.3347930908203125, -0.30719757080078125, -0.27960205078125, -0.25200653076171875, -0.2244110107421875, -0.19681549072265625, -0.169219970703125, -0.14162445068359375, -0.1140289306640625, -0.08643341064453125, -0.058837890625, -0.03124237060546875, -0.0036468505859375, 0.02394866943359375, 0.051544189453125, 0.07913970947265625, 0.1067352294921875, 0.13433074951171875, 0.16192626953125, 0.18952178955078125, 0.2171173095703125, 0.24471282958984375, 0.272308349609375, 0.29990386962890625, 0.3274993896484375, 0.35509490966796875, 0.3826904296875, 0.41028594970703125, 0.4378814697265625, 0.46547698974609375, 0.493072509765625, 0.5206680297851562, 0.5482635498046875, 0.5758590698242188, 0.60345458984375, 0.6310501098632812, 0.6586456298828125, 0.6862411499023438, 0.713836669921875, 0.7414321899414062, 0.7690277099609375, 0.7966232299804688, 0.82421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 9.0, 9.0, 12.0, 14.0, 14.0, 28.0, 39.0, 46.0, 54.0, 74.0, 101.0, 105.0, 99.0, 94.0, 66.0, 52.0, 47.0, 31.0, 23.0, 15.0, 14.0, 11.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3350410461425781, -0.32340240478515625, -0.3117637634277344, -0.3001251220703125, -0.2884864807128906, -0.27684783935546875, -0.2652091979980469, -0.253570556640625, -0.24193191528320312, -0.23029327392578125, -0.21865463256835938, -0.2070159912109375, -0.19537734985351562, -0.18373870849609375, -0.17210006713867188, -0.16046142578125, -0.14882278442382812, -0.13718414306640625, -0.12554550170898438, -0.1139068603515625, -0.10226821899414062, -0.09062957763671875, -0.07899093627929688, -0.067352294921875, -0.055713653564453125, -0.04407501220703125, -0.032436370849609375, -0.0207977294921875, -0.009159088134765625, 0.00247955322265625, 0.014118194580078125, 0.0257568359375, 0.037395477294921875, 0.04903411865234375, 0.060672760009765625, 0.0723114013671875, 0.08395004272460938, 0.09558868408203125, 0.10722732543945312, 0.118865966796875, 0.13050460815429688, 0.14214324951171875, 0.15378189086914062, 0.1654205322265625, 0.17705917358398438, 0.18869781494140625, 0.20033645629882812, 0.21197509765625, 0.22361373901367188, 0.23525238037109375, 0.24689102172851562, 0.2585296630859375, 0.2701683044433594, 0.28180694580078125, 0.2934455871582031, 0.305084228515625, 0.3167228698730469, 0.32836151123046875, 0.3400001525878906, 0.3516387939453125, 0.3632774353027344, 0.37491607666015625, 0.3865547180175781, 0.398193359375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 15.0, 29.0, 46.0, 104.0, 204.0, 237.0, 159.0, 76.0, 40.0, 24.0, 10.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.236562728881836, -11.890440940856934, -11.544319152832031, -11.198196411132812, -10.85207462310791, -10.505952835083008, -10.159831047058105, -9.813709259033203, -9.467586517333984, -9.121464729309082, -8.77534294128418, -8.429220199584961, -8.083098411560059, -7.736976623535156, -7.390854835510254, -7.044733047485352, -6.698611259460449, -6.352489471435547, -6.006367206573486, -5.660245418548584, -5.314123153686523, -4.968001365661621, -4.621879577636719, -4.275757789611816, -3.929635524749756, -3.5835134983062744, -3.237391471862793, -2.8912696838378906, -2.545147657394409, -2.1990256309509277, -1.8529038429260254, -1.506781816482544, -1.160660743713379, -0.8145387768745422, -0.46841681003570557, -0.12229490280151367, 0.22382712364196777, 0.5699491500854492, 0.9160709381103516, 1.262192964553833, 1.6083149909973145, 1.954437017440796, 2.3005590438842773, 2.6466808319091797, 2.992802858352661, 3.3389248847961426, 3.685046672821045, 4.0311689376831055, 4.377290725708008, 4.72341251373291, 5.069534778594971, 5.415656566619873, 5.761778831481934, 6.107900619506836, 6.454022407531738, 6.800144195556641, 7.146266460418701, 7.4923882484436035, 7.838510513305664, 8.184632301330566, 8.530754089355469, 8.876876831054688, 9.222997665405273, 9.569120407104492, 9.915242195129395]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 4.0, 10.0, 8.0, 11.0, 9.0, 17.0, 22.0, 21.0, 37.0, 25.0, 28.0, 31.0, 38.0, 30.0, 34.0, 34.0, 37.0, 32.0, 38.0, 38.0, 39.0, 33.0, 47.0, 38.0, 27.0, 37.0, 31.0, 27.0, 22.0, 19.0, 22.0, 17.0, 17.0, 14.0, 9.0, 10.0, 11.0, 12.0, 9.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.085018157958984, -8.795896530151367, -8.50677490234375, -8.217653274536133, -7.928531646728516, -7.639410018920898, -7.350288391113281, -7.061166763305664, -6.772045135498047, -6.48292350769043, -6.1938018798828125, -5.904680252075195, -5.615558624267578, -5.326436996459961, -5.037315368652344, -4.748193740844727, -4.459072113037109, -4.169950485229492, -3.880828857421875, -3.591707229614258, -3.3025856018066406, -3.0134639739990234, -2.7243423461914062, -2.435220718383789, -2.146099090576172, -1.8569774627685547, -1.5678558349609375, -1.2787342071533203, -0.9896125793457031, -0.7004909515380859, -0.41136932373046875, -0.12224769592285156, 0.16687488555908203, 0.4559965133666992, 0.7451181411743164, 1.0342397689819336, 1.3233613967895508, 1.612483024597168, 1.9016046524047852, 2.1907262802124023, 2.4798479080200195, 2.7689695358276367, 3.058091163635254, 3.347212791442871, 3.6363344192504883, 3.9254560470581055, 4.214577674865723, 4.50369930267334, 4.792820930480957, 5.081942558288574, 5.371064186096191, 5.660185813903809, 5.949307441711426, 6.238429069519043, 6.52755069732666, 6.816672325134277, 7.1057939529418945, 7.394915580749512, 7.684037208557129, 7.973158836364746, 8.262280464172363, 8.55140209197998, 8.840523719787598, 9.129645347595215, 9.418766975402832]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 7.0, 4.0, 9.0, 15.0, 25.0, 19.0, 32.0, 44.0, 66.0, 100.0, 117.0, 208.0, 279.0, 485.0, 669.0, 1143.0, 1890.0, 3601.0, 7974.0, 19633.0, 64691.0, 368964.0, 3281529.0, 348297.0, 59796.0, 18762.0, 7448.0, 3517.0, 1829.0, 1030.0, 673.0, 419.0, 283.0, 193.0, 137.0, 112.0, 88.0, 53.0, 40.0, 24.0, 14.0, 10.0, 19.0, 10.0, 8.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.717498779296875, -2.62835693359375, -2.539215087890625, -2.4500732421875, -2.360931396484375, -2.27178955078125, -2.182647705078125, -2.093505859375, -2.004364013671875, -1.91522216796875, -1.826080322265625, -1.7369384765625, -1.647796630859375, -1.55865478515625, -1.469512939453125, -1.38037109375, -1.291229248046875, -1.20208740234375, -1.112945556640625, -1.0238037109375, -0.934661865234375, -0.84552001953125, -0.756378173828125, -0.667236328125, -0.578094482421875, -0.48895263671875, -0.399810791015625, -0.3106689453125, -0.221527099609375, -0.13238525390625, -0.043243408203125, 0.0458984375, 0.135040283203125, 0.22418212890625, 0.313323974609375, 0.4024658203125, 0.491607666015625, 0.58074951171875, 0.669891357421875, 0.759033203125, 0.848175048828125, 0.93731689453125, 1.026458740234375, 1.1156005859375, 1.204742431640625, 1.29388427734375, 1.383026123046875, 1.47216796875, 1.561309814453125, 1.65045166015625, 1.739593505859375, 1.8287353515625, 1.917877197265625, 2.00701904296875, 2.096160888671875, 2.185302734375, 2.274444580078125, 2.36358642578125, 2.452728271484375, 2.5418701171875, 2.631011962890625, 2.72015380859375, 2.809295654296875, 2.8984375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 11.0, 20.0, 19.0, 27.0, 37.0, 45.0, 56.0, 78.0, 73.0, 101.0, 79.0, 88.0, 90.0, 45.0, 44.0, 28.0, 27.0, 22.0, 21.0, 15.0, 10.0, 8.0, 4.0, 6.0, 5.0, 9.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73046875, -2.637359619140625, -2.54425048828125, -2.451141357421875, -2.3580322265625, -2.264923095703125, -2.17181396484375, -2.078704833984375, -1.985595703125, -1.892486572265625, -1.79937744140625, -1.706268310546875, -1.6131591796875, -1.520050048828125, -1.42694091796875, -1.333831787109375, -1.24072265625, -1.147613525390625, -1.05450439453125, -0.961395263671875, -0.8682861328125, -0.775177001953125, -0.68206787109375, -0.588958740234375, -0.495849609375, -0.402740478515625, -0.30963134765625, -0.216522216796875, -0.1234130859375, -0.030303955078125, 0.06280517578125, 0.155914306640625, 0.2490234375, 0.342132568359375, 0.43524169921875, 0.528350830078125, 0.6214599609375, 0.714569091796875, 0.80767822265625, 0.900787353515625, 0.993896484375, 1.087005615234375, 1.18011474609375, 1.273223876953125, 1.3663330078125, 1.459442138671875, 1.55255126953125, 1.645660400390625, 1.73876953125, 1.831878662109375, 1.92498779296875, 2.018096923828125, 2.1112060546875, 2.204315185546875, 2.29742431640625, 2.390533447265625, 2.483642578125, 2.576751708984375, 2.66986083984375, 2.762969970703125, 2.8560791015625, 2.949188232421875, 3.04229736328125, 3.135406494140625, 3.228515625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 8.0, 12.0, 6.0, 19.0, 28.0, 43.0, 64.0, 125.0, 182.0, 343.0, 709.0, 1767.0, 5115.0, 21415.0, 200072.0, 3776429.0, 160852.0, 19082.0, 4808.0, 1650.0, 695.0, 324.0, 215.0, 108.0, 72.0, 45.0, 24.0, 17.0, 14.0, 13.0, 10.0, 12.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.107879638671875, -2.95599365234375, -2.804107666015625, -2.6522216796875, -2.500335693359375, -2.34844970703125, -2.196563720703125, -2.044677734375, -1.892791748046875, -1.74090576171875, -1.589019775390625, -1.4371337890625, -1.285247802734375, -1.13336181640625, -0.981475830078125, -0.82958984375, -0.677703857421875, -0.52581787109375, -0.373931884765625, -0.2220458984375, -0.070159912109375, 0.08172607421875, 0.233612060546875, 0.385498046875, 0.537384033203125, 0.68927001953125, 0.841156005859375, 0.9930419921875, 1.144927978515625, 1.29681396484375, 1.448699951171875, 1.6005859375, 1.752471923828125, 1.90435791015625, 2.056243896484375, 2.2081298828125, 2.360015869140625, 2.51190185546875, 2.663787841796875, 2.815673828125, 2.967559814453125, 3.11944580078125, 3.271331787109375, 3.4232177734375, 3.575103759765625, 3.72698974609375, 3.878875732421875, 4.03076171875, 4.182647705078125, 4.33453369140625, 4.486419677734375, 4.6383056640625, 4.790191650390625, 4.94207763671875, 5.093963623046875, 5.245849609375, 5.397735595703125, 5.54962158203125, 5.701507568359375, 5.8533935546875, 6.005279541015625, 6.15716552734375, 6.309051513671875, 6.4609375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 5.0, 8.0, 7.0, 13.0, 9.0, 15.0, 25.0, 22.0, 34.0, 47.0, 68.0, 97.0, 137.0, 243.0, 432.0, 1206.0, 740.0, 360.0, 185.0, 104.0, 88.0, 61.0, 35.0, 40.0, 21.0, 20.0, 10.0, 14.0, 4.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.1962890625, -1.1662368774414062, -1.1361846923828125, -1.1061325073242188, -1.076080322265625, -1.0460281372070312, -1.0159759521484375, -0.9859237670898438, -0.95587158203125, -0.9258193969726562, -0.8957672119140625, -0.8657150268554688, -0.835662841796875, -0.8056106567382812, -0.7755584716796875, -0.7455062866210938, -0.7154541015625, -0.6854019165039062, -0.6553497314453125, -0.6252975463867188, -0.595245361328125, -0.5651931762695312, -0.5351409912109375, -0.5050888061523438, -0.47503662109375, -0.44498443603515625, -0.4149322509765625, -0.38488006591796875, -0.354827880859375, -0.32477569580078125, -0.2947235107421875, -0.26467132568359375, -0.234619140625, -0.20456695556640625, -0.1745147705078125, -0.14446258544921875, -0.114410400390625, -0.08435821533203125, -0.0543060302734375, -0.02425384521484375, 0.00579833984375, 0.03585052490234375, 0.0659027099609375, 0.09595489501953125, 0.126007080078125, 0.15605926513671875, 0.1861114501953125, 0.21616363525390625, 0.2462158203125, 0.27626800537109375, 0.3063201904296875, 0.33637237548828125, 0.366424560546875, 0.39647674560546875, 0.4265289306640625, 0.45658111572265625, 0.48663330078125, 0.5166854858398438, 0.5467376708984375, 0.5767898559570312, 0.606842041015625, 0.6368942260742188, 0.6669464111328125, 0.6969985961914062, 0.72705078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 5.0, 9.0, 13.0, 15.0, 24.0, 70.0, 111.0, 169.0, 207.0, 145.0, 96.0, 44.0, 28.0, 16.0, 8.0, 7.0, 8.0, 8.0, 7.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4522809982299805, -6.239776134490967, -6.027270793914795, -5.814765930175781, -5.602260589599609, -5.389755725860596, -5.177250862121582, -4.96474552154541, -4.7522406578063965, -4.539735794067383, -4.327230453491211, -4.114725589752197, -3.9022204875946045, -3.6897153854370117, -3.477210521697998, -3.2647054195404053, -3.0522003173828125, -2.8396952152252197, -2.627190113067627, -2.4146852493286133, -2.2021801471710205, -1.9896750450134277, -1.7771700620651245, -1.5646650791168213, -1.3521599769592285, -1.1396548748016357, -0.9271498918533325, -0.7146448493003845, -0.5021398067474365, -0.28963470458984375, -0.07712972164154053, 0.1353752613067627, 0.34787988662719727, 0.5603849291801453, 0.7728899717330933, 0.9853950142860413, 1.1979000568389893, 1.410405158996582, 1.6229101419448853, 1.8354151248931885, 2.0479202270507812, 2.260425329208374, 2.472930431365967, 2.6854352951049805, 2.8979403972625732, 3.110445499420166, 3.3229503631591797, 3.5354554653167725, 3.7479605674743652, 3.960465669631958, 4.172970771789551, 4.3854756355285645, 4.597980499267578, 4.81048583984375, 5.022990703582764, 5.235495567321777, 5.448000907897949, 5.660505771636963, 5.873011112213135, 6.085515975952148, 6.29802131652832, 6.510526180267334, 6.723031044006348, 6.9355363845825195, 7.148041248321533]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 4.0, 6.0, 15.0, 11.0, 14.0, 29.0, 38.0, 30.0, 49.0, 52.0, 61.0, 46.0, 57.0, 66.0, 66.0, 63.0, 60.0, 57.0, 36.0, 41.0, 28.0, 29.0, 35.0, 16.0, 17.0, 9.0, 17.0, 14.0, 4.0, 2.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.0965628623962402, -3.003164529800415, -2.9097659587860107, -2.8163676261901855, -2.7229690551757812, -2.629570722579956, -2.536172389984131, -2.4427738189697266, -2.3493752479553223, -2.255976915359497, -2.1625783443450928, -2.0691800117492676, -1.9757814407348633, -1.882383108139038, -1.7889846563339233, -1.6955862045288086, -1.6021878719329834, -1.5087894201278687, -1.415390968322754, -1.3219926357269287, -1.2285940647125244, -1.1351957321166992, -1.0417972803115845, -0.9483988285064697, -0.855000376701355, -0.7616019248962402, -0.6682034730911255, -0.5748050808906555, -0.48140662908554077, -0.388008177280426, -0.29460978507995605, -0.2012113332748413, -0.10781311988830566, -0.014414682984352112, 0.07898375391960144, 0.1723821759223938, 0.26578062772750854, 0.3591790795326233, 0.45257747173309326, 0.545975923538208, 0.6393743753433228, 0.7327728271484375, 0.8261712789535522, 0.9195696711540222, 1.0129680633544922, 1.1063666343688965, 1.1997649669647217, 1.2931634187698364, 1.3865618705749512, 1.479960322380066, 1.5733587741851807, 1.6667571067810059, 1.7601556777954102, 1.8535540103912354, 1.94695246219635, 2.040350914001465, 2.133749485015869, 2.2271478176116943, 2.3205463886260986, 2.413944721221924, 2.507343292236328, 2.6007416248321533, 2.6941399574279785, 2.787538528442383, 2.880936861038208]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 5.0, 6.0, 19.0, 24.0, 39.0, 74.0, 119.0, 280.0, 1034.0, 5556.0, 73505.0, 895080.0, 66107.0, 5185.0, 937.0, 276.0, 97.0, 62.0, 37.0, 26.0, 14.0, 18.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63330078125, -0.6125259399414062, -0.5917510986328125, -0.5709762573242188, -0.550201416015625, -0.5294265747070312, -0.5086517333984375, -0.48787689208984375, -0.46710205078125, -0.44632720947265625, -0.4255523681640625, -0.40477752685546875, -0.384002685546875, -0.36322784423828125, -0.3424530029296875, -0.32167816162109375, -0.3009033203125, -0.28012847900390625, -0.2593536376953125, -0.23857879638671875, -0.217803955078125, -0.19702911376953125, -0.1762542724609375, -0.15547943115234375, -0.13470458984375, -0.11392974853515625, -0.0931549072265625, -0.07238006591796875, -0.051605224609375, -0.03083038330078125, -0.0100555419921875, 0.01071929931640625, 0.031494140625, 0.05226898193359375, 0.0730438232421875, 0.09381866455078125, 0.114593505859375, 0.13536834716796875, 0.1561431884765625, 0.17691802978515625, 0.19769287109375, 0.21846771240234375, 0.2392425537109375, 0.26001739501953125, 0.280792236328125, 0.30156707763671875, 0.3223419189453125, 0.34311676025390625, 0.3638916015625, 0.38466644287109375, 0.4054412841796875, 0.42621612548828125, 0.446990966796875, 0.46776580810546875, 0.4885406494140625, 0.5093154907226562, 0.53009033203125, 0.5508651733398438, 0.5716400146484375, 0.5924148559570312, 0.613189697265625, 0.6339645385742188, 0.6547393798828125, 0.6755142211914062, 0.6962890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 8.0, 5.0, 8.0, 12.0, 17.0, 33.0, 31.0, 48.0, 62.0, 86.0, 71.0, 90.0, 99.0, 94.0, 77.0, 57.0, 47.0, 38.0, 28.0, 25.0, 17.0, 14.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.7366943359375, -2.643310546875, -2.5499267578125, -2.45654296875, -2.3631591796875, -2.269775390625, -2.1763916015625, -2.0830078125, -1.9896240234375, -1.896240234375, -1.8028564453125, -1.70947265625, -1.6160888671875, -1.522705078125, -1.4293212890625, -1.3359375, -1.2425537109375, -1.149169921875, -1.0557861328125, -0.96240234375, -0.8690185546875, -0.775634765625, -0.6822509765625, -0.5888671875, -0.4954833984375, -0.402099609375, -0.3087158203125, -0.21533203125, -0.1219482421875, -0.028564453125, 0.0648193359375, 0.158203125, 0.2515869140625, 0.344970703125, 0.4383544921875, 0.53173828125, 0.6251220703125, 0.718505859375, 0.8118896484375, 0.9052734375, 0.9986572265625, 1.092041015625, 1.1854248046875, 1.27880859375, 1.3721923828125, 1.465576171875, 1.5589599609375, 1.65234375, 1.7457275390625, 1.839111328125, 1.9324951171875, 2.02587890625, 2.1192626953125, 2.212646484375, 2.3060302734375, 2.3994140625, 2.4927978515625, 2.586181640625, 2.6795654296875, 2.77294921875, 2.8663330078125, 2.959716796875, 3.0531005859375, 3.146484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 8.0, 7.0, 11.0, 12.0, 16.0, 20.0, 31.0, 33.0, 55.0, 63.0, 86.0, 141.0, 179.0, 295.0, 534.0, 1207.0, 6583.0, 74618.0, 724284.0, 219654.0, 16429.0, 2288.0, 749.0, 422.0, 222.0, 172.0, 118.0, 80.0, 50.0, 41.0, 31.0, 23.0, 19.0, 16.0, 15.0, 13.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.32275390625, -0.3128814697265625, -0.303009033203125, -0.2931365966796875, -0.28326416015625, -0.2733917236328125, -0.263519287109375, -0.2536468505859375, -0.2437744140625, -0.2339019775390625, -0.224029541015625, -0.2141571044921875, -0.20428466796875, -0.1944122314453125, -0.184539794921875, -0.1746673583984375, -0.164794921875, -0.1549224853515625, -0.145050048828125, -0.1351776123046875, -0.12530517578125, -0.1154327392578125, -0.105560302734375, -0.0956878662109375, -0.0858154296875, -0.0759429931640625, -0.066070556640625, -0.0561981201171875, -0.04632568359375, -0.0364532470703125, -0.026580810546875, -0.0167083740234375, -0.0068359375, 0.0030364990234375, 0.012908935546875, 0.0227813720703125, 0.03265380859375, 0.0425262451171875, 0.052398681640625, 0.0622711181640625, 0.0721435546875, 0.0820159912109375, 0.091888427734375, 0.1017608642578125, 0.11163330078125, 0.1215057373046875, 0.131378173828125, 0.1412506103515625, 0.151123046875, 0.1609954833984375, 0.170867919921875, 0.1807403564453125, 0.19061279296875, 0.2004852294921875, 0.210357666015625, 0.2202301025390625, 0.2301025390625, 0.2399749755859375, 0.249847412109375, 0.2597198486328125, 0.26959228515625, 0.2794647216796875, 0.289337158203125, 0.2992095947265625, 0.30908203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 9.0, 3.0, 2.0, 6.0, 8.0, 3.0, 6.0, 10.0, 13.0, 13.0, 17.0, 14.0, 23.0, 21.0, 27.0, 29.0, 34.0, 36.0, 32.0, 47.0, 38.0, 36.0, 49.0, 41.0, 37.0, 48.0, 46.0, 36.0, 30.0, 43.0, 32.0, 19.0, 26.0, 20.0, 25.0, 18.0, 15.0, 9.0, 16.0, 13.0, 10.0, 9.0, 12.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.767578125, -2.674285888671875, -2.58099365234375, -2.487701416015625, -2.3944091796875, -2.301116943359375, -2.20782470703125, -2.114532470703125, -2.021240234375, -1.927947998046875, -1.83465576171875, -1.741363525390625, -1.6480712890625, -1.554779052734375, -1.46148681640625, -1.368194580078125, -1.27490234375, -1.181610107421875, -1.08831787109375, -0.995025634765625, -0.9017333984375, -0.808441162109375, -0.71514892578125, -0.621856689453125, -0.528564453125, -0.435272216796875, -0.34197998046875, -0.248687744140625, -0.1553955078125, -0.062103271484375, 0.03118896484375, 0.124481201171875, 0.2177734375, 0.311065673828125, 0.40435791015625, 0.497650146484375, 0.5909423828125, 0.684234619140625, 0.77752685546875, 0.870819091796875, 0.964111328125, 1.057403564453125, 1.15069580078125, 1.243988037109375, 1.3372802734375, 1.430572509765625, 1.52386474609375, 1.617156982421875, 1.71044921875, 1.803741455078125, 1.89703369140625, 1.990325927734375, 2.0836181640625, 2.176910400390625, 2.27020263671875, 2.363494873046875, 2.456787109375, 2.550079345703125, 2.64337158203125, 2.736663818359375, 2.8299560546875, 2.923248291015625, 3.01654052734375, 3.109832763671875, 3.203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 6.0, 14.0, 11.0, 20.0, 17.0, 45.0, 82.0, 196.0, 613.0, 5486.0, 1028579.0, 12169.0, 851.0, 220.0, 91.0, 36.0, 36.0, 18.0, 13.0, 8.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15153884887695312, -0.14511871337890625, -0.13869857788085938, -0.1322784423828125, -0.12585830688476562, -0.11943817138671875, -0.11301803588867188, -0.106597900390625, -0.10017776489257812, -0.09375762939453125, -0.08733749389648438, -0.0809173583984375, -0.07449722290039062, -0.06807708740234375, -0.061656951904296875, -0.05523681640625, -0.048816680908203125, -0.04239654541015625, -0.035976409912109375, -0.0295562744140625, -0.023136138916015625, -0.01671600341796875, -0.010295867919921875, -0.003875732421875, 0.002544403076171875, 0.00896453857421875, 0.015384674072265625, 0.0218048095703125, 0.028224945068359375, 0.03464508056640625, 0.041065216064453125, 0.0474853515625, 0.053905487060546875, 0.06032562255859375, 0.06674575805664062, 0.0731658935546875, 0.07958602905273438, 0.08600616455078125, 0.09242630004882812, 0.098846435546875, 0.10526657104492188, 0.11168670654296875, 0.11810684204101562, 0.1245269775390625, 0.13094711303710938, 0.13736724853515625, 0.14378738403320312, 0.15020751953125, 0.15662765502929688, 0.16304779052734375, 0.16946792602539062, 0.1758880615234375, 0.18230819702148438, 0.18872833251953125, 0.19514846801757812, 0.201568603515625, 0.20798873901367188, 0.21440887451171875, 0.22082901000976562, 0.2272491455078125, 0.23366928100585938, 0.24008941650390625, 0.24650955200195312, 0.2529296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 1.0, 12.0, 15.0, 24.0, 42.0, 76.0, 83.0, 135.0, 160.0, 148.0, 101.0, 65.0, 48.0, 20.0, 20.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.131959915161133e-05, -5.0049275159835815e-05, -4.87789511680603e-05, -4.750862717628479e-05, -4.623830318450928e-05, -4.4967979192733765e-05, -4.369765520095825e-05, -4.242733120918274e-05, -4.1157007217407227e-05, -3.9886683225631714e-05, -3.86163592338562e-05, -3.734603524208069e-05, -3.6075711250305176e-05, -3.480538725852966e-05, -3.353506326675415e-05, -3.226473927497864e-05, -3.0994415283203125e-05, -2.9724091291427612e-05, -2.84537672996521e-05, -2.7183443307876587e-05, -2.5913119316101074e-05, -2.464279532432556e-05, -2.337247133255005e-05, -2.2102147340774536e-05, -2.0831823348999023e-05, -1.956149935722351e-05, -1.8291175365447998e-05, -1.7020851373672485e-05, -1.5750527381896973e-05, -1.448020339012146e-05, -1.3209879398345947e-05, -1.1939555406570435e-05, -1.0669231414794922e-05, -9.39890742301941e-06, -8.128583431243896e-06, -6.858259439468384e-06, -5.587935447692871e-06, -4.317611455917358e-06, -3.0472874641418457e-06, -1.776963472366333e-06, -5.066394805908203e-07, 7.636845111846924e-07, 2.034008502960205e-06, 3.3043324947357178e-06, 4.5746564865112305e-06, 5.844980478286743e-06, 7.115304470062256e-06, 8.385628461837769e-06, 9.655952453613281e-06, 1.0926276445388794e-05, 1.2196600437164307e-05, 1.346692442893982e-05, 1.4737248420715332e-05, 1.6007572412490845e-05, 1.7277896404266357e-05, 1.854822039604187e-05, 1.9818544387817383e-05, 2.1088868379592896e-05, 2.2359192371368408e-05, 2.362951636314392e-05, 2.4899840354919434e-05, 2.6170164346694946e-05, 2.744048833847046e-05, 2.871081233024597e-05, 2.9981136322021484e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 13.0, 16.0, 26.0, 38.0, 53.0, 98.0, 162.0, 347.0, 700.0, 2003.0, 11332.0, 921049.0, 104849.0, 5444.0, 1269.0, 471.0, 242.0, 146.0, 88.0, 67.0, 29.0, 30.0, 17.0, 14.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1361083984375, -0.13083648681640625, -0.1255645751953125, -0.12029266357421875, -0.115020751953125, -0.10974884033203125, -0.1044769287109375, -0.09920501708984375, -0.09393310546875, -0.08866119384765625, -0.0833892822265625, -0.07811737060546875, -0.072845458984375, -0.06757354736328125, -0.0623016357421875, -0.05702972412109375, -0.0517578125, -0.04648590087890625, -0.0412139892578125, -0.03594207763671875, -0.030670166015625, -0.02539825439453125, -0.0201263427734375, -0.01485443115234375, -0.00958251953125, -0.00431060791015625, 0.0009613037109375, 0.00623321533203125, 0.011505126953125, 0.01677703857421875, 0.0220489501953125, 0.02732086181640625, 0.0325927734375, 0.03786468505859375, 0.0431365966796875, 0.04840850830078125, 0.053680419921875, 0.05895233154296875, 0.0642242431640625, 0.06949615478515625, 0.07476806640625, 0.08003997802734375, 0.0853118896484375, 0.09058380126953125, 0.095855712890625, 0.10112762451171875, 0.1063995361328125, 0.11167144775390625, 0.116943359375, 0.12221527099609375, 0.1274871826171875, 0.13275909423828125, 0.138031005859375, 0.14330291748046875, 0.1485748291015625, 0.15384674072265625, 0.15911865234375, 0.16439056396484375, 0.1696624755859375, 0.17493438720703125, 0.180206298828125, 0.18547821044921875, 0.1907501220703125, 0.19602203369140625, 0.2012939453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 10.0, 10.0, 22.0, 63.0, 253.0, 450.0, 89.0, 26.0, 19.0, 16.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02838134765625, -0.027708888053894043, -0.027036428451538086, -0.02636396884918213, -0.025691509246826172, -0.025019049644470215, -0.024346590042114258, -0.0236741304397583, -0.023001670837402344, -0.022329211235046387, -0.02165675163269043, -0.020984292030334473, -0.020311832427978516, -0.01963937282562256, -0.0189669132232666, -0.018294453620910645, -0.017621994018554688, -0.01694953441619873, -0.016277074813842773, -0.015604615211486816, -0.01493215560913086, -0.014259696006774902, -0.013587236404418945, -0.012914776802062988, -0.012242317199707031, -0.011569857597351074, -0.010897397994995117, -0.01022493839263916, -0.009552478790283203, -0.008880019187927246, -0.008207559585571289, -0.007535099983215332, -0.006862640380859375, -0.006190180778503418, -0.005517721176147461, -0.004845261573791504, -0.004172801971435547, -0.00350034236907959, -0.002827882766723633, -0.0021554231643676758, -0.0014829635620117188, -0.0008105039596557617, -0.0001380443572998047, 0.0005344152450561523, 0.0012068748474121094, 0.0018793344497680664, 0.0025517940521240234, 0.0032242536544799805, 0.0038967132568359375, 0.0045691728591918945, 0.0052416324615478516, 0.005914092063903809, 0.006586551666259766, 0.007259011268615723, 0.00793147087097168, 0.008603930473327637, 0.009276390075683594, 0.00994884967803955, 0.010621309280395508, 0.011293768882751465, 0.011966228485107422, 0.012638688087463379, 0.013311147689819336, 0.013983607292175293, 0.01465606689453125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 11.0, 16.0, 26.0, 59.0, 221.0, 371.0, 179.0, 54.0, 26.0, 14.0, 10.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.41562557220459, -8.156509399414062, -7.897392272949219, -7.638276100158691, -7.379159450531006, -7.12004280090332, -6.860926628112793, -6.601809978485107, -6.342693328857422, -6.083576679229736, -5.824460029602051, -5.565343856811523, -5.306227207183838, -5.047110557556152, -4.787994384765625, -4.5288777351379395, -4.269761085510254, -4.010644435882568, -3.751528024673462, -3.4924116134643555, -3.23329496383667, -2.9741783142089844, -2.715061902999878, -2.4559454917907715, -2.196828842163086, -1.93771231174469, -1.678595781326294, -1.419479250907898, -1.160362720489502, -0.901246190071106, -0.64212965965271, -0.38301312923431396, -0.12389755249023438, 0.13521897792816162, 0.3943355083465576, 0.6534520387649536, 0.9125685691833496, 1.1716850996017456, 1.4308016300201416, 1.6899181604385376, 1.9490346908569336, 2.208151340484619, 2.4672677516937256, 2.726384162902832, 2.9855008125305176, 3.244617462158203, 3.5037338733673096, 3.762850284576416, 4.021966934204102, 4.281083583831787, 4.540200233459473, 4.79931640625, 5.0584330558776855, 5.317549705505371, 5.576665878295898, 5.835782527923584, 6.0948991775512695, 6.354015827178955, 6.613132476806641, 6.872248649597168, 7.1313652992248535, 7.390481948852539, 7.649598121643066, 7.908714771270752, 8.167831420898438]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 6.0, 15.0, 19.0, 22.0, 32.0, 41.0, 46.0, 79.0, 56.0, 65.0, 76.0, 82.0, 76.0, 68.0, 57.0, 42.0, 35.0, 35.0, 31.0, 19.0, 14.0, 13.0, 17.0, 6.0, 7.0, 2.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2592005729675293, -2.184823751449585, -2.1104469299316406, -2.0360703468322754, -1.961693525314331, -1.8873167037963867, -1.8129398822784424, -1.738563060760498, -1.6641863584518433, -1.589809536933899, -1.5154328346252441, -1.4410560131072998, -1.3666791915893555, -1.2923024892807007, -1.2179256677627563, -1.1435489654541016, -1.0691721439361572, -0.9947953820228577, -0.9204186201095581, -0.8460417985916138, -0.7716650366783142, -0.6972882747650146, -0.6229114532470703, -0.5485346913337708, -0.4741579294204712, -0.39978116750717163, -0.3254043757915497, -0.25102758407592773, -0.17665082216262817, -0.10227406024932861, -0.027897268533706665, 0.04647952318191528, 0.12085628509521484, 0.1952330619096756, 0.26960983872413635, 0.3439866304397583, 0.41836339235305786, 0.4927401542663574, 0.5671169757843018, 0.6414937376976013, 0.7158704996109009, 0.7902472615242004, 0.8646240234375, 0.9390008449554443, 1.0133776664733887, 1.0877543687820435, 1.1621311902999878, 1.2365078926086426, 1.310884714126587, 1.3852615356445312, 1.459638237953186, 1.5340150594711304, 1.6083917617797852, 1.6827685832977295, 1.7571454048156738, 1.8315222263336182, 1.905898928642273, 1.9802757501602173, 2.054652452468872, 2.1290292739868164, 2.2034060955047607, 2.277782917022705, 2.3521595001220703, 2.4265363216400146, 2.500913143157959]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 23.0, 15.0, 44.0, 53.0, 94.0, 158.0, 224.0, 381.0, 605.0, 1191.0, 2097.0, 4129.0, 9036.0, 22108.0, 70115.0, 452945.0, 384075.0, 63129.0, 20756.0, 8719.0, 4066.0, 2018.0, 1018.0, 584.0, 383.0, 216.0, 122.0, 94.0, 50.0, 25.0, 13.0, 14.0, 10.0, 8.0, 6.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5009765625, -1.4508819580078125, -1.400787353515625, -1.3506927490234375, -1.30059814453125, -1.2505035400390625, -1.200408935546875, -1.1503143310546875, -1.1002197265625, -1.0501251220703125, -1.000030517578125, -0.9499359130859375, -0.89984130859375, -0.8497467041015625, -0.799652099609375, -0.7495574951171875, -0.699462890625, -0.6493682861328125, -0.599273681640625, -0.5491790771484375, -0.49908447265625, -0.4489898681640625, -0.398895263671875, -0.3488006591796875, -0.2987060546875, -0.2486114501953125, -0.198516845703125, -0.1484222412109375, -0.09832763671875, -0.0482330322265625, 0.001861572265625, 0.0519561767578125, 0.10205078125, 0.1521453857421875, 0.202239990234375, 0.2523345947265625, 0.30242919921875, 0.3525238037109375, 0.402618408203125, 0.4527130126953125, 0.5028076171875, 0.5529022216796875, 0.602996826171875, 0.6530914306640625, 0.70318603515625, 0.7532806396484375, 0.803375244140625, 0.8534698486328125, 0.903564453125, 0.9536590576171875, 1.003753662109375, 1.0538482666015625, 1.10394287109375, 1.1540374755859375, 1.204132080078125, 1.2542266845703125, 1.3043212890625, 1.3544158935546875, 1.404510498046875, 1.4546051025390625, 1.50469970703125, 1.5547943115234375, 1.604888916015625, 1.6549835205078125, 1.705078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 11.0, 9.0, 14.0, 13.0, 19.0, 30.0, 38.0, 41.0, 72.0, 76.0, 86.0, 92.0, 88.0, 65.0, 76.0, 52.0, 48.0, 35.0, 29.0, 21.0, 21.0, 10.0, 9.0, 7.0, 10.0, 4.0, 5.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.61328125, -5.43353271484375, -5.2537841796875, -5.07403564453125, -4.894287109375, -4.71453857421875, -4.5347900390625, -4.35504150390625, -4.17529296875, -3.99554443359375, -3.8157958984375, -3.63604736328125, -3.456298828125, -3.27655029296875, -3.0968017578125, -2.91705322265625, -2.7373046875, -2.55755615234375, -2.3778076171875, -2.19805908203125, -2.018310546875, -1.83856201171875, -1.6588134765625, -1.47906494140625, -1.29931640625, -1.11956787109375, -0.9398193359375, -0.76007080078125, -0.580322265625, -0.40057373046875, -0.2208251953125, -0.04107666015625, 0.138671875, 0.31842041015625, 0.4981689453125, 0.67791748046875, 0.857666015625, 1.03741455078125, 1.2171630859375, 1.39691162109375, 1.57666015625, 1.75640869140625, 1.9361572265625, 2.11590576171875, 2.295654296875, 2.47540283203125, 2.6551513671875, 2.83489990234375, 3.0146484375, 3.19439697265625, 3.3741455078125, 3.55389404296875, 3.733642578125, 3.91339111328125, 4.0931396484375, 4.27288818359375, 4.45263671875, 4.63238525390625, 4.8121337890625, 4.99188232421875, 5.171630859375, 5.35137939453125, 5.5311279296875, 5.71087646484375, 5.890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 8.0, 11.0, 16.0, 16.0, 30.0, 32.0, 57.0, 90.0, 148.0, 252.0, 432.0, 921.0, 2426.0, 7836.0, 39210.0, 592947.0, 363033.0, 30697.0, 6627.0, 1978.0, 769.0, 378.0, 216.0, 135.0, 88.0, 48.0, 37.0, 22.0, 13.0, 22.0, 14.0, 2.0, 10.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8857421875, -1.8182220458984375, -1.750701904296875, -1.6831817626953125, -1.61566162109375, -1.5481414794921875, -1.480621337890625, -1.4131011962890625, -1.3455810546875, -1.2780609130859375, -1.210540771484375, -1.1430206298828125, -1.07550048828125, -1.0079803466796875, -0.940460205078125, -0.8729400634765625, -0.805419921875, -0.7378997802734375, -0.670379638671875, -0.6028594970703125, -0.53533935546875, -0.4678192138671875, -0.400299072265625, -0.3327789306640625, -0.2652587890625, -0.1977386474609375, -0.130218505859375, -0.0626983642578125, 0.00482177734375, 0.0723419189453125, 0.139862060546875, 0.2073822021484375, 0.27490234375, 0.3424224853515625, 0.409942626953125, 0.4774627685546875, 0.54498291015625, 0.6125030517578125, 0.680023193359375, 0.7475433349609375, 0.8150634765625, 0.8825836181640625, 0.950103759765625, 1.0176239013671875, 1.08514404296875, 1.1526641845703125, 1.220184326171875, 1.2877044677734375, 1.355224609375, 1.4227447509765625, 1.490264892578125, 1.5577850341796875, 1.62530517578125, 1.6928253173828125, 1.760345458984375, 1.8278656005859375, 1.8953857421875, 1.9629058837890625, 2.030426025390625, 2.0979461669921875, 2.16546630859375, 2.2329864501953125, 2.300506591796875, 2.3680267333984375, 2.435546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 7.0, 9.0, 9.0, 10.0, 10.0, 15.0, 12.0, 22.0, 28.0, 24.0, 22.0, 32.0, 26.0, 22.0, 32.0, 34.0, 29.0, 34.0, 31.0, 34.0, 38.0, 40.0, 38.0, 44.0, 36.0, 35.0, 34.0, 38.0, 40.0, 29.0, 28.0, 25.0, 18.0, 24.0, 13.0, 13.0, 12.0, 6.0, 6.0, 13.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.9296875, -3.7943115234375, -3.658935546875, -3.5235595703125, -3.38818359375, -3.2528076171875, -3.117431640625, -2.9820556640625, -2.8466796875, -2.7113037109375, -2.575927734375, -2.4405517578125, -2.30517578125, -2.1697998046875, -2.034423828125, -1.8990478515625, -1.763671875, -1.6282958984375, -1.492919921875, -1.3575439453125, -1.22216796875, -1.0867919921875, -0.951416015625, -0.8160400390625, -0.6806640625, -0.5452880859375, -0.409912109375, -0.2745361328125, -0.13916015625, -0.0037841796875, 0.131591796875, 0.2669677734375, 0.40234375, 0.5377197265625, 0.673095703125, 0.8084716796875, 0.94384765625, 1.0792236328125, 1.214599609375, 1.3499755859375, 1.4853515625, 1.6207275390625, 1.756103515625, 1.8914794921875, 2.02685546875, 2.1622314453125, 2.297607421875, 2.4329833984375, 2.568359375, 2.7037353515625, 2.839111328125, 2.9744873046875, 3.10986328125, 3.2452392578125, 3.380615234375, 3.5159912109375, 3.6513671875, 3.7867431640625, 3.922119140625, 4.0574951171875, 4.19287109375, 4.3282470703125, 4.463623046875, 4.5989990234375, 4.734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 10.0, 17.0, 35.0, 45.0, 100.0, 184.0, 389.0, 1212.0, 5644.0, 62817.0, 906259.0, 63945.0, 5876.0, 1215.0, 396.0, 200.0, 71.0, 44.0, 33.0, 10.0, 10.0, 9.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4794921875, -1.435333251953125, -1.39117431640625, -1.347015380859375, -1.3028564453125, -1.258697509765625, -1.21453857421875, -1.170379638671875, -1.126220703125, -1.082061767578125, -1.03790283203125, -0.993743896484375, -0.9495849609375, -0.905426025390625, -0.86126708984375, -0.817108154296875, -0.77294921875, -0.728790283203125, -0.68463134765625, -0.640472412109375, -0.5963134765625, -0.552154541015625, -0.50799560546875, -0.463836669921875, -0.419677734375, -0.375518798828125, -0.33135986328125, -0.287200927734375, -0.2430419921875, -0.198883056640625, -0.15472412109375, -0.110565185546875, -0.06640625, -0.022247314453125, 0.02191162109375, 0.066070556640625, 0.1102294921875, 0.154388427734375, 0.19854736328125, 0.242706298828125, 0.286865234375, 0.331024169921875, 0.37518310546875, 0.419342041015625, 0.4635009765625, 0.507659912109375, 0.55181884765625, 0.595977783203125, 0.64013671875, 0.684295654296875, 0.72845458984375, 0.772613525390625, 0.8167724609375, 0.860931396484375, 0.90509033203125, 0.949249267578125, 0.993408203125, 1.037567138671875, 1.08172607421875, 1.125885009765625, 1.1700439453125, 1.214202880859375, 1.25836181640625, 1.302520751953125, 1.3466796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 16.0, 22.0, 32.0, 78.0, 130.0, 358.0, 175.0, 92.0, 36.0, 25.0, 15.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002384185791015625, -0.00023008882999420166, -0.00022175908088684082, -0.00021342933177947998, -0.00020509958267211914, -0.0001967698335647583, -0.00018844008445739746, -0.00018011033535003662, -0.00017178058624267578, -0.00016345083713531494, -0.0001551210880279541, -0.00014679133892059326, -0.00013846158981323242, -0.00013013184070587158, -0.00012180209159851074, -0.0001134723424911499, -0.00010514259338378906, -9.681284427642822e-05, -8.848309516906738e-05, -8.015334606170654e-05, -7.18235969543457e-05, -6.349384784698486e-05, -5.5164098739624023e-05, -4.6834349632263184e-05, -3.8504600524902344e-05, -3.0174851417541504e-05, -2.1845102310180664e-05, -1.3515353202819824e-05, -5.185604095458984e-06, 3.1441450119018555e-06, 1.1473894119262695e-05, 1.9803643226623535e-05, 2.8133392333984375e-05, 3.6463141441345215e-05, 4.4792890548706055e-05, 5.3122639656066895e-05, 6.145238876342773e-05, 6.978213787078857e-05, 7.811188697814941e-05, 8.644163608551025e-05, 9.47713851928711e-05, 0.00010310113430023193, 0.00011143088340759277, 0.00011976063251495361, 0.00012809038162231445, 0.0001364201307296753, 0.00014474987983703613, 0.00015307962894439697, 0.0001614093780517578, 0.00016973912715911865, 0.0001780688762664795, 0.00018639862537384033, 0.00019472837448120117, 0.000203058123588562, 0.00021138787269592285, 0.0002197176218032837, 0.00022804737091064453, 0.00023637712001800537, 0.0002447068691253662, 0.00025303661823272705, 0.0002613663673400879, 0.00026969611644744873, 0.00027802586555480957, 0.0002863556146621704, 0.00029468536376953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 16.0, 21.0, 32.0, 38.0, 65.0, 94.0, 163.0, 263.0, 476.0, 985.0, 2187.0, 5908.0, 19404.0, 90477.0, 734239.0, 152785.0, 28089.0, 7878.0, 2891.0, 1184.0, 548.0, 297.0, 154.0, 100.0, 81.0, 57.0, 32.0, 20.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.857421875, -0.8333587646484375, -0.809295654296875, -0.7852325439453125, -0.76116943359375, -0.7371063232421875, -0.713043212890625, -0.6889801025390625, -0.6649169921875, -0.6408538818359375, -0.616790771484375, -0.5927276611328125, -0.56866455078125, -0.5446014404296875, -0.520538330078125, -0.4964752197265625, -0.472412109375, -0.4483489990234375, -0.424285888671875, -0.4002227783203125, -0.37615966796875, -0.3520965576171875, -0.328033447265625, -0.3039703369140625, -0.2799072265625, -0.2558441162109375, -0.231781005859375, -0.2077178955078125, -0.18365478515625, -0.1595916748046875, -0.135528564453125, -0.1114654541015625, -0.08740234375, -0.0633392333984375, -0.039276123046875, -0.0152130126953125, 0.00885009765625, 0.0329132080078125, 0.056976318359375, 0.0810394287109375, 0.1051025390625, 0.1291656494140625, 0.153228759765625, 0.1772918701171875, 0.20135498046875, 0.2254180908203125, 0.249481201171875, 0.2735443115234375, 0.297607421875, 0.3216705322265625, 0.345733642578125, 0.3697967529296875, 0.39385986328125, 0.4179229736328125, 0.441986083984375, 0.4660491943359375, 0.4901123046875, 0.5141754150390625, 0.538238525390625, 0.5623016357421875, 0.58636474609375, 0.6104278564453125, 0.634490966796875, 0.6585540771484375, 0.6826171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 11.0, 11.0, 29.0, 20.0, 35.0, 32.0, 60.0, 70.0, 106.0, 233.0, 96.0, 72.0, 54.0, 42.0, 17.0, 24.0, 18.0, 19.0, 13.0, 5.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.3524169921875, -0.341552734375, -0.3306884765625, -0.31982421875, -0.3089599609375, -0.298095703125, -0.2872314453125, -0.2763671875, -0.2655029296875, -0.254638671875, -0.2437744140625, -0.23291015625, -0.2220458984375, -0.211181640625, -0.2003173828125, -0.189453125, -0.1785888671875, -0.167724609375, -0.1568603515625, -0.14599609375, -0.1351318359375, -0.124267578125, -0.1134033203125, -0.1025390625, -0.0916748046875, -0.080810546875, -0.0699462890625, -0.05908203125, -0.0482177734375, -0.037353515625, -0.0264892578125, -0.015625, -0.0047607421875, 0.006103515625, 0.0169677734375, 0.02783203125, 0.0386962890625, 0.049560546875, 0.0604248046875, 0.0712890625, 0.0821533203125, 0.093017578125, 0.1038818359375, 0.11474609375, 0.1256103515625, 0.136474609375, 0.1473388671875, 0.158203125, 0.1690673828125, 0.179931640625, 0.1907958984375, 0.20166015625, 0.2125244140625, 0.223388671875, 0.2342529296875, 0.2451171875, 0.2559814453125, 0.266845703125, 0.2777099609375, 0.28857421875, 0.2994384765625, 0.310302734375, 0.3211669921875, 0.33203125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 5.0, 6.0, 10.0, 23.0, 31.0, 58.0, 136.0, 232.0, 228.0, 122.0, 58.0, 31.0, 18.0, 14.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.230271339416504, -11.88103199005127, -11.531791687011719, -11.182552337646484, -10.83331298828125, -10.484073638916016, -10.134833335876465, -9.78559398651123, -9.43635368347168, -9.087114334106445, -8.737874031066895, -8.38863468170166, -8.039395332336426, -7.690155506134033, -7.340915679931641, -6.991676330566406, -6.642436981201172, -6.293197154998779, -5.943957805633545, -5.594717979431152, -5.245478630065918, -4.896238803863525, -4.546998977661133, -4.197759628295898, -3.848519802093506, -3.4992802143096924, -3.150040626525879, -2.8008008003234863, -2.451561212539673, -2.1023216247558594, -1.7530817985534668, -1.4038422107696533, -1.0546035766601562, -0.705363929271698, -0.35612428188323975, -0.006884574890136719, 0.34235501289367676, 0.6915946006774902, 1.0408344268798828, 1.3900740146636963, 1.7393136024475098, 2.0885531902313232, 2.4377927780151367, 2.7870326042175293, 3.1362721920013428, 3.4855117797851562, 3.834751605987549, 4.183991432189941, 4.533230781555176, 4.882470607757568, 5.231709957122803, 5.580949783325195, 5.93018913269043, 6.279428958892822, 6.628668785095215, 6.977908134460449, 7.327147960662842, 7.676387786865234, 8.025627136230469, 8.374866485595703, 8.724106788635254, 9.073346138000488, 9.422586441040039, 9.771825790405273, 10.121065139770508]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 1.0, 11.0, 6.0, 12.0, 7.0, 15.0, 16.0, 20.0, 29.0, 21.0, 27.0, 33.0, 32.0, 26.0, 37.0, 36.0, 41.0, 45.0, 41.0, 43.0, 39.0, 47.0, 36.0, 45.0, 35.0, 44.0, 27.0, 30.0, 37.0, 28.0, 17.0, 17.0, 12.0, 16.0, 8.0, 16.0, 12.0, 5.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.703096389770508, -8.445080757141113, -8.187065124511719, -7.929049491882324, -7.67103385925293, -7.413018226623535, -7.155002593994141, -6.896986961364746, -6.638971328735352, -6.380955696105957, -6.1229400634765625, -5.864924430847168, -5.606908798217773, -5.348893165588379, -5.090877532958984, -4.83286190032959, -4.5748467445373535, -4.316831111907959, -4.0588154792785645, -3.80079984664917, -3.5427842140197754, -3.284768581390381, -3.0267531871795654, -2.768737554550171, -2.5107219219207764, -2.252706289291382, -1.9946906566619873, -1.7366751432418823, -1.4786595106124878, -1.2206438779830933, -0.9626283645629883, -0.7046127319335938, -0.446596622467041, -0.18858101963996887, 0.06943458318710327, 0.327450156211853, 0.5854657888412476, 0.8434814214706421, 1.101496934890747, 1.3595125675201416, 1.6175282001495361, 1.8755438327789307, 2.133559465408325, 2.3915748596191406, 2.649590492248535, 2.9076061248779297, 3.165621757507324, 3.4236373901367188, 3.6816530227661133, 3.939668655395508, 4.197684288024902, 4.455699920654297, 4.713715553283691, 4.971731185913086, 5.2297468185424805, 5.487762451171875, 5.7457780838012695, 6.003793716430664, 6.261809349060059, 6.519824981689453, 6.777840614318848, 7.035856246948242, 7.293871879577637, 7.551887512207031, 7.809902667999268]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 4.0, 12.0, 9.0, 14.0, 17.0, 26.0, 34.0, 48.0, 82.0, 130.0, 169.0, 264.0, 485.0, 874.0, 1753.0, 4349.0, 13475.0, 63395.0, 1274544.0, 2731073.0, 78833.0, 15543.0, 4855.0, 1915.0, 947.0, 521.0, 283.0, 178.0, 121.0, 76.0, 63.0, 42.0, 36.0, 27.0, 23.0, 15.0, 11.0, 5.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.95703125, -3.82086181640625, -3.6846923828125, -3.54852294921875, -3.412353515625, -3.27618408203125, -3.1400146484375, -3.00384521484375, -2.86767578125, -2.73150634765625, -2.5953369140625, -2.45916748046875, -2.322998046875, -2.18682861328125, -2.0506591796875, -1.91448974609375, -1.7783203125, -1.64215087890625, -1.5059814453125, -1.36981201171875, -1.233642578125, -1.09747314453125, -0.9613037109375, -0.82513427734375, -0.68896484375, -0.55279541015625, -0.4166259765625, -0.28045654296875, -0.144287109375, -0.00811767578125, 0.1280517578125, 0.26422119140625, 0.400390625, 0.53656005859375, 0.6727294921875, 0.80889892578125, 0.945068359375, 1.08123779296875, 1.2174072265625, 1.35357666015625, 1.48974609375, 1.62591552734375, 1.7620849609375, 1.89825439453125, 2.034423828125, 2.17059326171875, 2.3067626953125, 2.44293212890625, 2.5791015625, 2.71527099609375, 2.8514404296875, 2.98760986328125, 3.123779296875, 3.25994873046875, 3.3961181640625, 3.53228759765625, 3.66845703125, 3.80462646484375, 3.9407958984375, 4.07696533203125, 4.213134765625, 4.34930419921875, 4.4854736328125, 4.62164306640625, 4.7578125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 9.0, 11.0, 12.0, 16.0, 15.0, 27.0, 42.0, 58.0, 65.0, 69.0, 101.0, 95.0, 94.0, 82.0, 64.0, 49.0, 41.0, 33.0, 24.0, 20.0, 10.0, 17.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1484375, -3.055206298828125, -2.96197509765625, -2.868743896484375, -2.7755126953125, -2.682281494140625, -2.58905029296875, -2.495819091796875, -2.402587890625, -2.309356689453125, -2.21612548828125, -2.122894287109375, -2.0296630859375, -1.936431884765625, -1.84320068359375, -1.749969482421875, -1.65673828125, -1.563507080078125, -1.47027587890625, -1.377044677734375, -1.2838134765625, -1.190582275390625, -1.09735107421875, -1.004119873046875, -0.910888671875, -0.817657470703125, -0.72442626953125, -0.631195068359375, -0.5379638671875, -0.444732666015625, -0.35150146484375, -0.258270263671875, -0.1650390625, -0.071807861328125, 0.02142333984375, 0.114654541015625, 0.2078857421875, 0.301116943359375, 0.39434814453125, 0.487579345703125, 0.580810546875, 0.674041748046875, 0.76727294921875, 0.860504150390625, 0.9537353515625, 1.046966552734375, 1.14019775390625, 1.233428955078125, 1.32666015625, 1.419891357421875, 1.51312255859375, 1.606353759765625, 1.6995849609375, 1.792816162109375, 1.88604736328125, 1.979278564453125, 2.072509765625, 2.165740966796875, 2.25897216796875, 2.352203369140625, 2.4454345703125, 2.538665771484375, 2.63189697265625, 2.725128173828125, 2.818359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 11.0, 18.0, 29.0, 54.0, 71.0, 117.0, 267.0, 606.0, 1671.0, 7176.0, 60779.0, 3771057.0, 329468.0, 18073.0, 3171.0, 964.0, 350.0, 158.0, 88.0, 50.0, 24.0, 19.0, 12.0, 7.0, 12.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.37469482421875, -6.1673583984375, -5.96002197265625, -5.752685546875, -5.54534912109375, -5.3380126953125, -5.13067626953125, -4.92333984375, -4.71600341796875, -4.5086669921875, -4.30133056640625, -4.093994140625, -3.88665771484375, -3.6793212890625, -3.47198486328125, -3.2646484375, -3.05731201171875, -2.8499755859375, -2.64263916015625, -2.435302734375, -2.22796630859375, -2.0206298828125, -1.81329345703125, -1.60595703125, -1.39862060546875, -1.1912841796875, -0.98394775390625, -0.776611328125, -0.56927490234375, -0.3619384765625, -0.15460205078125, 0.052734375, 0.26007080078125, 0.4674072265625, 0.67474365234375, 0.882080078125, 1.08941650390625, 1.2967529296875, 1.50408935546875, 1.71142578125, 1.91876220703125, 2.1260986328125, 2.33343505859375, 2.540771484375, 2.74810791015625, 2.9554443359375, 3.16278076171875, 3.3701171875, 3.57745361328125, 3.7847900390625, 3.99212646484375, 4.199462890625, 4.40679931640625, 4.6141357421875, 4.82147216796875, 5.02880859375, 5.23614501953125, 5.4434814453125, 5.65081787109375, 5.858154296875, 6.06549072265625, 6.2728271484375, 6.48016357421875, 6.6875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 1.0, 8.0, 12.0, 17.0, 14.0, 22.0, 33.0, 50.0, 61.0, 83.0, 145.0, 268.0, 492.0, 1291.0, 667.0, 308.0, 198.0, 111.0, 85.0, 59.0, 39.0, 24.0, 27.0, 15.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.0697021484375, -1.035888671875, -1.0020751953125, -0.96826171875, -0.9344482421875, -0.900634765625, -0.8668212890625, -0.8330078125, -0.7991943359375, -0.765380859375, -0.7315673828125, -0.69775390625, -0.6639404296875, -0.630126953125, -0.5963134765625, -0.5625, -0.5286865234375, -0.494873046875, -0.4610595703125, -0.42724609375, -0.3934326171875, -0.359619140625, -0.3258056640625, -0.2919921875, -0.2581787109375, -0.224365234375, -0.1905517578125, -0.15673828125, -0.1229248046875, -0.089111328125, -0.0552978515625, -0.021484375, 0.0123291015625, 0.046142578125, 0.0799560546875, 0.11376953125, 0.1475830078125, 0.181396484375, 0.2152099609375, 0.2490234375, 0.2828369140625, 0.316650390625, 0.3504638671875, 0.38427734375, 0.4180908203125, 0.451904296875, 0.4857177734375, 0.51953125, 0.5533447265625, 0.587158203125, 0.6209716796875, 0.65478515625, 0.6885986328125, 0.722412109375, 0.7562255859375, 0.7900390625, 0.8238525390625, 0.857666015625, 0.8914794921875, 0.92529296875, 0.9591064453125, 0.992919921875, 1.0267333984375, 1.060546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 15.0, 17.0, 29.0, 41.0, 70.0, 104.0, 141.0, 138.0, 136.0, 98.0, 75.0, 40.0, 22.0, 13.0, 8.0, 5.0, 5.0, 5.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.389087200164795, -6.222047805786133, -6.055008411407471, -5.887969017028809, -5.7209296226501465, -5.553890228271484, -5.3868513107299805, -5.219811916351318, -5.052772521972656, -4.885733127593994, -4.718693733215332, -4.55165433883667, -4.384614944458008, -4.217576026916504, -4.050536155700684, -3.8834972381591797, -3.7164576053619385, -3.5494182109832764, -3.3823788166046143, -3.2153396606445312, -3.048300266265869, -2.881260871887207, -2.714221477508545, -2.547182083129883, -2.3801426887512207, -2.2131032943725586, -2.0460638999938965, -1.879024624824524, -1.7119853496551514, -1.5449459552764893, -1.3779065608978271, -1.2108672857284546, -1.043828010559082, -0.8767886757850647, -0.7097493410110474, -0.5427099466323853, -0.3756706118583679, -0.20863127708435059, -0.04159188270568848, 0.12544739246368408, 0.2924867868423462, 0.4595261216163635, 0.6265654563903809, 0.793604850769043, 0.9606441855430603, 1.1276835203170776, 1.2947229146957397, 1.4617621898651123, 1.6288015842437744, 1.7958409786224365, 1.962880253791809, 2.1299195289611816, 2.2969589233398438, 2.463998317718506, 2.631037712097168, 2.79807710647583, 2.965116500854492, 3.1321558952331543, 3.2991952896118164, 3.4662346839904785, 3.6332738399505615, 3.8003132343292236, 3.9673526287078857, 4.134391784667969, 4.301431179046631]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 8.0, 15.0, 16.0, 17.0, 21.0, 31.0, 35.0, 44.0, 40.0, 49.0, 58.0, 57.0, 76.0, 58.0, 71.0, 61.0, 50.0, 45.0, 44.0, 28.0, 34.0, 20.0, 22.0, 17.0, 14.0, 15.0, 5.0, 11.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.356705904006958, -3.266069173812866, -3.1754324436187744, -3.0847959518432617, -2.99415922164917, -2.903522491455078, -2.8128857612609863, -2.7222490310668945, -2.6316123008728027, -2.540975570678711, -2.450338840484619, -2.3597021102905273, -2.2690656185150146, -2.178428888320923, -2.087792158126831, -1.9971554279327393, -1.9065189361572266, -1.8158822059631348, -1.7252455949783325, -1.6346088647842407, -1.5439722537994385, -1.4533355236053467, -1.3626987934112549, -1.272062063217163, -1.1814254522323608, -1.090788722038269, -1.0001521110534668, -0.909515380859375, -0.818878710269928, -0.728242039680481, -0.6376053094863892, -0.5469686388969421, -0.4563322067260742, -0.3656955361366272, -0.2750588357448578, -0.18442213535308838, -0.09378546476364136, -0.003148794174194336, 0.08748793601989746, 0.17812460660934448, 0.2687612771987915, 0.3593979477882385, 0.45003464818000793, 0.5406713485717773, 0.6313080191612244, 0.7219446897506714, 0.8125814199447632, 0.9032180905342102, 0.9938547611236572, 1.084491491317749, 1.1751281023025513, 1.265764832496643, 1.3564014434814453, 1.447038173675537, 1.537674903869629, 1.6283116340637207, 1.718948245048523, 1.8095849752426147, 1.900221586227417, 1.9908583164215088, 2.0814950466156006, 2.1721315383911133, 2.262768268585205, 2.353404998779297, 2.4440417289733887]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 3.0, 7.0, 15.0, 16.0, 19.0, 33.0, 47.0, 81.0, 105.0, 154.0, 296.0, 517.0, 937.0, 2075.0, 5522.0, 19253.0, 121160.0, 722681.0, 143855.0, 21248.0, 5830.0, 2309.0, 1059.0, 534.0, 287.0, 186.0, 115.0, 64.0, 40.0, 27.0, 16.0, 18.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.334228515625, -0.3245506286621094, -0.31487274169921875, -0.3051948547363281, -0.2955169677734375, -0.2858390808105469, -0.27616119384765625, -0.2664833068847656, -0.256805419921875, -0.24712753295898438, -0.23744964599609375, -0.22777175903320312, -0.2180938720703125, -0.20841598510742188, -0.19873809814453125, -0.18906021118164062, -0.17938232421875, -0.16970443725585938, -0.16002655029296875, -0.15034866333007812, -0.1406707763671875, -0.13099288940429688, -0.12131500244140625, -0.11163711547851562, -0.101959228515625, -0.09228134155273438, -0.08260345458984375, -0.07292556762695312, -0.0632476806640625, -0.053569793701171875, -0.04389190673828125, -0.034214019775390625, -0.0245361328125, -0.014858245849609375, -0.00518035888671875, 0.004497528076171875, 0.0141754150390625, 0.023853302001953125, 0.03353118896484375, 0.043209075927734375, 0.052886962890625, 0.06256484985351562, 0.07224273681640625, 0.08192062377929688, 0.0915985107421875, 0.10127639770507812, 0.11095428466796875, 0.12063217163085938, 0.13031005859375, 0.13998794555664062, 0.14966583251953125, 0.15934371948242188, 0.1690216064453125, 0.17869949340820312, 0.18837738037109375, 0.19805526733398438, 0.207733154296875, 0.21741104125976562, 0.22708892822265625, 0.23676681518554688, 0.2464447021484375, 0.2561225891113281, 0.26580047607421875, 0.2754783630371094, 0.28515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 11.0, 16.0, 19.0, 25.0, 29.0, 41.0, 51.0, 65.0, 66.0, 68.0, 82.0, 84.0, 92.0, 65.0, 70.0, 40.0, 37.0, 32.0, 19.0, 15.0, 16.0, 12.0, 11.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.30816650390625, -2.2257080078125, -2.14324951171875, -2.060791015625, -1.97833251953125, -1.8958740234375, -1.81341552734375, -1.73095703125, -1.64849853515625, -1.5660400390625, -1.48358154296875, -1.401123046875, -1.31866455078125, -1.2362060546875, -1.15374755859375, -1.0712890625, -0.98883056640625, -0.9063720703125, -0.82391357421875, -0.741455078125, -0.65899658203125, -0.5765380859375, -0.49407958984375, -0.41162109375, -0.32916259765625, -0.2467041015625, -0.16424560546875, -0.081787109375, 0.00067138671875, 0.0831298828125, 0.16558837890625, 0.248046875, 0.33050537109375, 0.4129638671875, 0.49542236328125, 0.577880859375, 0.66033935546875, 0.7427978515625, 0.82525634765625, 0.90771484375, 0.99017333984375, 1.0726318359375, 1.15509033203125, 1.237548828125, 1.32000732421875, 1.4024658203125, 1.48492431640625, 1.5673828125, 1.64984130859375, 1.7322998046875, 1.81475830078125, 1.897216796875, 1.97967529296875, 2.0621337890625, 2.14459228515625, 2.22705078125, 2.30950927734375, 2.3919677734375, 2.47442626953125, 2.556884765625, 2.63934326171875, 2.7218017578125, 2.80426025390625, 2.88671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 19.0, 19.0, 31.0, 31.0, 48.0, 63.0, 82.0, 97.0, 161.0, 218.0, 391.0, 802.0, 2929.0, 26067.0, 421851.0, 553057.0, 36860.0, 3647.0, 883.0, 418.0, 236.0, 164.0, 103.0, 75.0, 66.0, 48.0, 36.0, 23.0, 22.0, 19.0, 16.0, 7.0, 10.0, 4.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.245574951171875, -0.23577880859375, -0.225982666015625, -0.2161865234375, -0.206390380859375, -0.19659423828125, -0.186798095703125, -0.177001953125, -0.167205810546875, -0.15740966796875, -0.147613525390625, -0.1378173828125, -0.128021240234375, -0.11822509765625, -0.108428955078125, -0.0986328125, -0.088836669921875, -0.07904052734375, -0.069244384765625, -0.0594482421875, -0.049652099609375, -0.03985595703125, -0.030059814453125, -0.020263671875, -0.010467529296875, -0.00067138671875, 0.009124755859375, 0.0189208984375, 0.028717041015625, 0.03851318359375, 0.048309326171875, 0.05810546875, 0.067901611328125, 0.07769775390625, 0.087493896484375, 0.0972900390625, 0.107086181640625, 0.11688232421875, 0.126678466796875, 0.136474609375, 0.146270751953125, 0.15606689453125, 0.165863037109375, 0.1756591796875, 0.185455322265625, 0.19525146484375, 0.205047607421875, 0.21484375, 0.224639892578125, 0.23443603515625, 0.244232177734375, 0.2540283203125, 0.263824462890625, 0.27362060546875, 0.283416748046875, 0.293212890625, 0.303009033203125, 0.31280517578125, 0.322601318359375, 0.3323974609375, 0.342193603515625, 0.35198974609375, 0.361785888671875, 0.37158203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 4.0, 8.0, 12.0, 11.0, 15.0, 27.0, 30.0, 29.0, 42.0, 41.0, 33.0, 39.0, 46.0, 46.0, 44.0, 48.0, 49.0, 51.0, 50.0, 51.0, 46.0, 31.0, 29.0, 35.0, 27.0, 28.0, 22.0, 23.0, 13.0, 11.0, 14.0, 9.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.228607177734375, -3.12127685546875, -3.013946533203125, -2.9066162109375, -2.799285888671875, -2.69195556640625, -2.584625244140625, -2.477294921875, -2.369964599609375, -2.26263427734375, -2.155303955078125, -2.0479736328125, -1.940643310546875, -1.83331298828125, -1.725982666015625, -1.61865234375, -1.511322021484375, -1.40399169921875, -1.296661376953125, -1.1893310546875, -1.082000732421875, -0.97467041015625, -0.867340087890625, -0.760009765625, -0.652679443359375, -0.54534912109375, -0.438018798828125, -0.3306884765625, -0.223358154296875, -0.11602783203125, -0.008697509765625, 0.0986328125, 0.205963134765625, 0.31329345703125, 0.420623779296875, 0.5279541015625, 0.635284423828125, 0.74261474609375, 0.849945068359375, 0.957275390625, 1.064605712890625, 1.17193603515625, 1.279266357421875, 1.3865966796875, 1.493927001953125, 1.60125732421875, 1.708587646484375, 1.81591796875, 1.923248291015625, 2.03057861328125, 2.137908935546875, 2.2452392578125, 2.352569580078125, 2.45989990234375, 2.567230224609375, 2.674560546875, 2.781890869140625, 2.88922119140625, 2.996551513671875, 3.1038818359375, 3.211212158203125, 3.31854248046875, 3.425872802734375, 3.533203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 18.0, 14.0, 35.0, 33.0, 65.0, 124.0, 266.0, 862.0, 7420.0, 1019671.0, 18106.0, 1238.0, 325.0, 122.0, 84.0, 41.0, 31.0, 19.0, 14.0, 3.0, 15.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.182373046875, -0.17776870727539062, -0.17316436767578125, -0.16856002807617188, -0.1639556884765625, -0.15935134887695312, -0.15474700927734375, -0.15014266967773438, -0.145538330078125, -0.14093399047851562, -0.13632965087890625, -0.13172531127929688, -0.1271209716796875, -0.12251663208007812, -0.11791229248046875, -0.11330795288085938, -0.10870361328125, -0.10409927368164062, -0.09949493408203125, -0.09489059448242188, -0.0902862548828125, -0.08568191528320312, -0.08107757568359375, -0.07647323608398438, -0.071868896484375, -0.06726455688476562, -0.06266021728515625, -0.058055877685546875, -0.0534515380859375, -0.048847198486328125, -0.04424285888671875, -0.039638519287109375, -0.0350341796875, -0.030429840087890625, -0.02582550048828125, -0.021221160888671875, -0.0166168212890625, -0.012012481689453125, -0.00740814208984375, -0.002803802490234375, 0.001800537109375, 0.006404876708984375, 0.01100921630859375, 0.015613555908203125, 0.0202178955078125, 0.024822235107421875, 0.02942657470703125, 0.034030914306640625, 0.03863525390625, 0.043239593505859375, 0.04784393310546875, 0.052448272705078125, 0.0570526123046875, 0.061656951904296875, 0.06626129150390625, 0.07086563110351562, 0.075469970703125, 0.08007431030273438, 0.08467864990234375, 0.08928298950195312, 0.0938873291015625, 0.09849166870117188, 0.10309600830078125, 0.10770034790039062, 0.1123046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 9.0, 15.0, 22.0, 27.0, 63.0, 66.0, 109.0, 127.0, 135.0, 118.0, 94.0, 53.0, 40.0, 30.0, 16.0, 9.0, 11.0, 4.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4809112548828125e-05, -3.365427255630493e-05, -3.249943256378174e-05, -3.1344592571258545e-05, -3.018975257873535e-05, -2.9034912586212158e-05, -2.7880072593688965e-05, -2.672523260116577e-05, -2.5570392608642578e-05, -2.4415552616119385e-05, -2.326071262359619e-05, -2.2105872631072998e-05, -2.0951032638549805e-05, -1.979619264602661e-05, -1.8641352653503418e-05, -1.7486512660980225e-05, -1.633167266845703e-05, -1.5176832675933838e-05, -1.4021992683410645e-05, -1.2867152690887451e-05, -1.1712312698364258e-05, -1.0557472705841064e-05, -9.402632713317871e-06, -8.247792720794678e-06, -7.092952728271484e-06, -5.938112735748291e-06, -4.783272743225098e-06, -3.6284327507019043e-06, -2.473592758178711e-06, -1.3187527656555176e-06, -1.6391277313232422e-07, 9.909272193908691e-07, 2.1457672119140625e-06, 3.300607204437256e-06, 4.455447196960449e-06, 5.610287189483643e-06, 6.765127182006836e-06, 7.91996717453003e-06, 9.074807167053223e-06, 1.0229647159576416e-05, 1.138448715209961e-05, 1.2539327144622803e-05, 1.3694167137145996e-05, 1.484900712966919e-05, 1.6003847122192383e-05, 1.7158687114715576e-05, 1.831352710723877e-05, 1.9468367099761963e-05, 2.0623207092285156e-05, 2.177804708480835e-05, 2.2932887077331543e-05, 2.4087727069854736e-05, 2.524256706237793e-05, 2.6397407054901123e-05, 2.7552247047424316e-05, 2.870708703994751e-05, 2.9861927032470703e-05, 3.1016767024993896e-05, 3.217160701751709e-05, 3.332644701004028e-05, 3.4481287002563477e-05, 3.563612699508667e-05, 3.679096698760986e-05, 3.794580698013306e-05, 3.910064697265625e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 12.0, 14.0, 15.0, 29.0, 30.0, 36.0, 50.0, 63.0, 108.0, 158.0, 236.0, 316.0, 647.0, 1343.0, 4006.0, 19454.0, 848642.0, 156872.0, 11145.0, 2769.0, 1038.0, 531.0, 320.0, 212.0, 127.0, 94.0, 68.0, 52.0, 29.0, 30.0, 21.0, 12.0, 10.0, 12.0, 6.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1300048828125, -0.12616443634033203, -0.12232398986816406, -0.1184835433959961, -0.11464309692382812, -0.11080265045166016, -0.10696220397949219, -0.10312175750732422, -0.09928131103515625, -0.09544086456298828, -0.09160041809082031, -0.08775997161865234, -0.08391952514648438, -0.0800790786743164, -0.07623863220214844, -0.07239818572998047, -0.0685577392578125, -0.06471729278564453, -0.06087684631347656, -0.057036399841308594, -0.053195953369140625, -0.049355506896972656, -0.04551506042480469, -0.04167461395263672, -0.03783416748046875, -0.03399372100830078, -0.030153274536132812, -0.026312828063964844, -0.022472381591796875, -0.018631935119628906, -0.014791488647460938, -0.010951042175292969, -0.007110595703125, -0.0032701492309570312, 0.0005702972412109375, 0.004410743713378906, 0.008251190185546875, 0.012091636657714844, 0.015932083129882812, 0.01977252960205078, 0.02361297607421875, 0.02745342254638672, 0.03129386901855469, 0.035134315490722656, 0.038974761962890625, 0.042815208435058594, 0.04665565490722656, 0.05049610137939453, 0.0543365478515625, 0.05817699432373047, 0.06201744079589844, 0.0658578872680664, 0.06969833374023438, 0.07353878021240234, 0.07737922668457031, 0.08121967315673828, 0.08506011962890625, 0.08890056610107422, 0.09274101257324219, 0.09658145904541016, 0.10042190551757812, 0.1042623519897461, 0.10810279846191406, 0.11194324493408203, 0.11578369140625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 21.0, 36.0, 82.0, 216.0, 326.0, 162.0, 61.0, 32.0, 14.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01226043701171875, -0.011794447898864746, -0.011328458786010742, -0.010862469673156738, -0.010396480560302734, -0.00993049144744873, -0.009464502334594727, -0.008998513221740723, -0.008532524108886719, -0.008066534996032715, -0.007600545883178711, -0.007134556770324707, -0.006668567657470703, -0.006202578544616699, -0.005736589431762695, -0.005270600318908691, -0.0048046112060546875, -0.004338622093200684, -0.0038726329803466797, -0.0034066438674926758, -0.002940654754638672, -0.002474665641784668, -0.002008676528930664, -0.0015426874160766602, -0.0010766983032226562, -0.0006107091903686523, -0.00014472007751464844, 0.00032126903533935547, 0.0007872581481933594, 0.0012532472610473633, 0.0017192363739013672, 0.002185225486755371, 0.002651214599609375, 0.003117203712463379, 0.003583192825317383, 0.004049181938171387, 0.004515171051025391, 0.0049811601638793945, 0.0054471492767333984, 0.005913138389587402, 0.006379127502441406, 0.00684511661529541, 0.007311105728149414, 0.007777094841003418, 0.008243083953857422, 0.008709073066711426, 0.00917506217956543, 0.009641051292419434, 0.010107040405273438, 0.010573029518127441, 0.011039018630981445, 0.01150500774383545, 0.011970996856689453, 0.012436985969543457, 0.012902975082397461, 0.013368964195251465, 0.013834953308105469, 0.014300942420959473, 0.014766931533813477, 0.01523292064666748, 0.015698909759521484, 0.01616489887237549, 0.016630887985229492, 0.017096877098083496, 0.0175628662109375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 16.0, 35.0, 89.0, 206.0, 294.0, 201.0, 85.0, 23.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.291729927062988, -9.067230224609375, -8.842730522155762, -8.618230819702148, -8.393731117248535, -8.169231414794922, -7.944731712341309, -7.720232009887695, -7.495732307434082, -7.271232604980469, -7.0467329025268555, -6.822233200073242, -6.597733497619629, -6.373233795166016, -6.148734092712402, -5.924234390258789, -5.699734687805176, -5.4752349853515625, -5.250735282897949, -5.026235580444336, -4.801735877990723, -4.577236175537109, -4.352736473083496, -4.128236770629883, -3.9037365913391113, -3.679236888885498, -3.4547371864318848, -3.2302374839782715, -3.005737781524658, -2.781238079071045, -2.5567383766174316, -2.3322386741638184, -2.107738971710205, -1.8832392692565918, -1.6587395668029785, -1.4342398643493652, -1.209740161895752, -0.9852403402328491, -0.7607406377792358, -0.5362409353256226, -0.3117412328720093, -0.0872415155172348, 0.13725820183753967, 0.36175793409347534, 0.5862576365470886, 0.8107573986053467, 1.03525710105896, 1.2597568035125732, 1.4842565059661865, 1.7087562084197998, 1.933255910873413, 2.1577556133270264, 2.3822553157806396, 2.606755256652832, 2.8312549591064453, 3.0557546615600586, 3.280254364013672, 3.504754066467285, 3.7292537689208984, 3.9537534713745117, 4.178253173828125, 4.402752876281738, 4.627252578735352, 4.851752281188965, 5.076251983642578]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 7.0, 19.0, 18.0, 13.0, 28.0, 33.0, 40.0, 53.0, 50.0, 58.0, 81.0, 79.0, 82.0, 67.0, 55.0, 59.0, 57.0, 29.0, 35.0, 23.0, 20.0, 20.0, 10.0, 11.0, 9.0, 11.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3290717601776123, -2.260688066482544, -2.1923046112060547, -2.1239209175109863, -2.055537223815918, -1.9871535301208496, -1.9187699556350708, -1.850386381149292, -1.7820026874542236, -1.7136189937591553, -1.6452354192733765, -1.5768518447875977, -1.5084681510925293, -1.440084457397461, -1.3717008829116821, -1.3033173084259033, -1.234933614730835, -1.1665499210357666, -1.0981663465499878, -1.029782772064209, -0.9613990783691406, -0.893015444278717, -0.8246318101882935, -0.7562481760978699, -0.6878645420074463, -0.6194809079170227, -0.5510972738265991, -0.48271363973617554, -0.41433000564575195, -0.34594637155532837, -0.2775627374649048, -0.2091791033744812, -0.14079523086547852, -0.07241159677505493, -0.004027962684631348, 0.06435567140579224, 0.13273930549621582, 0.2011229395866394, 0.269506573677063, 0.3378902077674866, 0.40627384185791016, 0.47465747594833374, 0.5430411100387573, 0.6114247441291809, 0.6798083782196045, 0.7481920123100281, 0.8165756464004517, 0.8849592804908752, 0.9533429145812988, 1.0217266082763672, 1.090110182762146, 1.1584937572479248, 1.2268774509429932, 1.2952611446380615, 1.3636447191238403, 1.4320282936096191, 1.5004119873046875, 1.5687956809997559, 1.6371792554855347, 1.7055628299713135, 1.7739465236663818, 1.8423302173614502, 1.910713791847229, 1.9790973663330078, 2.047481060028076]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 18.0, 21.0, 31.0, 44.0, 63.0, 122.0, 226.0, 392.0, 786.0, 1788.0, 4319.0, 12476.0, 46969.0, 291928.0, 577025.0, 82349.0, 19323.0, 6089.0, 2418.0, 1030.0, 487.0, 282.0, 128.0, 73.0, 50.0, 33.0, 21.0, 13.0, 16.0, 13.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7958984375, -1.7321624755859375, -1.668426513671875, -1.6046905517578125, -1.54095458984375, -1.4772186279296875, -1.413482666015625, -1.3497467041015625, -1.2860107421875, -1.2222747802734375, -1.158538818359375, -1.0948028564453125, -1.03106689453125, -0.9673309326171875, -0.903594970703125, -0.8398590087890625, -0.776123046875, -0.7123870849609375, -0.648651123046875, -0.5849151611328125, -0.52117919921875, -0.4574432373046875, -0.393707275390625, -0.3299713134765625, -0.2662353515625, -0.2024993896484375, -0.138763427734375, -0.0750274658203125, -0.01129150390625, 0.0524444580078125, 0.116180419921875, 0.1799163818359375, 0.24365234375, 0.3073883056640625, 0.371124267578125, 0.4348602294921875, 0.49859619140625, 0.5623321533203125, 0.626068115234375, 0.6898040771484375, 0.7535400390625, 0.8172760009765625, 0.881011962890625, 0.9447479248046875, 1.00848388671875, 1.0722198486328125, 1.135955810546875, 1.1996917724609375, 1.263427734375, 1.3271636962890625, 1.390899658203125, 1.4546356201171875, 1.51837158203125, 1.5821075439453125, 1.645843505859375, 1.7095794677734375, 1.7733154296875, 1.8370513916015625, 1.900787353515625, 1.9645233154296875, 2.02825927734375, 2.0919952392578125, 2.155731201171875, 2.2194671630859375, 2.283203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 6.0, 8.0, 11.0, 8.0, 22.0, 15.0, 24.0, 31.0, 47.0, 66.0, 62.0, 80.0, 86.0, 79.0, 72.0, 70.0, 59.0, 53.0, 35.0, 29.0, 28.0, 19.0, 23.0, 9.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.11328125, -4.96484375, -4.81640625, -4.66796875, -4.51953125, -4.37109375, -4.22265625, -4.07421875, -3.92578125, -3.77734375, -3.62890625, -3.48046875, -3.33203125, -3.18359375, -3.03515625, -2.88671875, -2.73828125, -2.58984375, -2.44140625, -2.29296875, -2.14453125, -1.99609375, -1.84765625, -1.69921875, -1.55078125, -1.40234375, -1.25390625, -1.10546875, -0.95703125, -0.80859375, -0.66015625, -0.51171875, -0.36328125, -0.21484375, -0.06640625, 0.08203125, 0.23046875, 0.37890625, 0.52734375, 0.67578125, 0.82421875, 0.97265625, 1.12109375, 1.26953125, 1.41796875, 1.56640625, 1.71484375, 1.86328125, 2.01171875, 2.16015625, 2.30859375, 2.45703125, 2.60546875, 2.75390625, 2.90234375, 3.05078125, 3.19921875, 3.34765625, 3.49609375, 3.64453125, 3.79296875, 3.94140625, 4.08984375, 4.23828125, 4.38671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 13.0, 19.0, 21.0, 33.0, 21.0, 29.0, 39.0, 51.0, 59.0, 89.0, 97.0, 114.0, 130.0, 168.0, 218.0, 327.0, 574.0, 1744.0, 11777.0, 266638.0, 737990.0, 23360.0, 2618.0, 770.0, 407.0, 253.0, 186.0, 148.0, 109.0, 99.0, 78.0, 72.0, 64.0, 44.0, 33.0, 26.0, 24.0, 30.0, 16.0, 9.0, 7.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.126953125, -3.023193359375, -2.91943359375, -2.815673828125, -2.7119140625, -2.608154296875, -2.50439453125, -2.400634765625, -2.296875, -2.193115234375, -2.08935546875, -1.985595703125, -1.8818359375, -1.778076171875, -1.67431640625, -1.570556640625, -1.466796875, -1.363037109375, -1.25927734375, -1.155517578125, -1.0517578125, -0.947998046875, -0.84423828125, -0.740478515625, -0.63671875, -0.532958984375, -0.42919921875, -0.325439453125, -0.2216796875, -0.117919921875, -0.01416015625, 0.089599609375, 0.193359375, 0.297119140625, 0.40087890625, 0.504638671875, 0.6083984375, 0.712158203125, 0.81591796875, 0.919677734375, 1.0234375, 1.127197265625, 1.23095703125, 1.334716796875, 1.4384765625, 1.542236328125, 1.64599609375, 1.749755859375, 1.853515625, 1.957275390625, 2.06103515625, 2.164794921875, 2.2685546875, 2.372314453125, 2.47607421875, 2.579833984375, 2.68359375, 2.787353515625, 2.89111328125, 2.994873046875, 3.0986328125, 3.202392578125, 3.30615234375, 3.409912109375, 3.513671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 9.0, 9.0, 10.0, 17.0, 28.0, 20.0, 19.0, 22.0, 38.0, 30.0, 33.0, 37.0, 57.0, 61.0, 49.0, 51.0, 45.0, 42.0, 50.0, 50.0, 49.0, 48.0, 40.0, 29.0, 20.0, 19.0, 21.0, 24.0, 14.0, 12.0, 10.0, 4.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.3487548828125, -4.197509765625, -4.0462646484375, -3.89501953125, -3.7437744140625, -3.592529296875, -3.4412841796875, -3.2900390625, -3.1387939453125, -2.987548828125, -2.8363037109375, -2.68505859375, -2.5338134765625, -2.382568359375, -2.2313232421875, -2.080078125, -1.9288330078125, -1.777587890625, -1.6263427734375, -1.47509765625, -1.3238525390625, -1.172607421875, -1.0213623046875, -0.8701171875, -0.7188720703125, -0.567626953125, -0.4163818359375, -0.26513671875, -0.1138916015625, 0.037353515625, 0.1885986328125, 0.33984375, 0.4910888671875, 0.642333984375, 0.7935791015625, 0.94482421875, 1.0960693359375, 1.247314453125, 1.3985595703125, 1.5498046875, 1.7010498046875, 1.852294921875, 2.0035400390625, 2.15478515625, 2.3060302734375, 2.457275390625, 2.6085205078125, 2.759765625, 2.9110107421875, 3.062255859375, 3.2135009765625, 3.36474609375, 3.5159912109375, 3.667236328125, 3.8184814453125, 3.9697265625, 4.1209716796875, 4.272216796875, 4.4234619140625, 4.57470703125, 4.7259521484375, 4.877197265625, 5.0284423828125, 5.1796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 2.0, 3.0, 7.0, 9.0, 9.0, 10.0, 25.0, 26.0, 44.0, 62.0, 119.0, 224.0, 421.0, 886.0, 2210.0, 6826.0, 36758.0, 759403.0, 214012.0, 19765.0, 4541.0, 1566.0, 707.0, 395.0, 215.0, 103.0, 61.0, 37.0, 27.0, 13.0, 14.0, 9.0, 2.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.2661285400390625, -1.227569580078125, -1.1890106201171875, -1.15045166015625, -1.1118927001953125, -1.073333740234375, -1.0347747802734375, -0.9962158203125, -0.9576568603515625, -0.919097900390625, -0.8805389404296875, -0.84197998046875, -0.8034210205078125, -0.764862060546875, -0.7263031005859375, -0.687744140625, -0.6491851806640625, -0.610626220703125, -0.5720672607421875, -0.53350830078125, -0.4949493408203125, -0.456390380859375, -0.4178314208984375, -0.3792724609375, -0.3407135009765625, -0.302154541015625, -0.2635955810546875, -0.22503662109375, -0.1864776611328125, -0.147918701171875, -0.1093597412109375, -0.07080078125, -0.0322418212890625, 0.006317138671875, 0.0448760986328125, 0.08343505859375, 0.1219940185546875, 0.160552978515625, 0.1991119384765625, 0.2376708984375, 0.2762298583984375, 0.314788818359375, 0.3533477783203125, 0.39190673828125, 0.4304656982421875, 0.469024658203125, 0.5075836181640625, 0.546142578125, 0.5847015380859375, 0.623260498046875, 0.6618194580078125, 0.70037841796875, 0.7389373779296875, 0.777496337890625, 0.8160552978515625, 0.8546142578125, 0.8931732177734375, 0.931732177734375, 0.9702911376953125, 1.00885009765625, 1.0474090576171875, 1.085968017578125, 1.1245269775390625, 1.1630859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 3.0, 10.0, 10.0, 16.0, 26.0, 41.0, 52.0, 89.0, 185.0, 257.0, 109.0, 58.0, 36.0, 29.0, 15.0, 10.0, 12.0, 9.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00017118453979492188, -0.0001660361886024475, -0.00016088783740997314, -0.00015573948621749878, -0.00015059113502502441, -0.00014544278383255005, -0.00014029443264007568, -0.00013514608144760132, -0.00012999773025512695, -0.0001248493790626526, -0.00011970102787017822, -0.00011455267667770386, -0.00010940432548522949, -0.00010425597429275513, -9.910762310028076e-05, -9.39592719078064e-05, -8.881092071533203e-05, -8.366256952285767e-05, -7.85142183303833e-05, -7.336586713790894e-05, -6.821751594543457e-05, -6.30691647529602e-05, -5.792081356048584e-05, -5.2772462368011475e-05, -4.762411117553711e-05, -4.2475759983062744e-05, -3.732740879058838e-05, -3.2179057598114014e-05, -2.703070640563965e-05, -2.1882355213165283e-05, -1.6734004020690918e-05, -1.1585652828216553e-05, -6.4373016357421875e-06, -1.2889504432678223e-06, 3.859400749206543e-06, 9.007751941680908e-06, 1.4156103134155273e-05, 1.930445432662964e-05, 2.4452805519104004e-05, 2.960115671157837e-05, 3.4749507904052734e-05, 3.98978590965271e-05, 4.5046210289001465e-05, 5.019456148147583e-05, 5.5342912673950195e-05, 6.049126386642456e-05, 6.563961505889893e-05, 7.078796625137329e-05, 7.593631744384766e-05, 8.108466863632202e-05, 8.623301982879639e-05, 9.138137102127075e-05, 9.652972221374512e-05, 0.00010167807340621948, 0.00010682642459869385, 0.00011197477579116821, 0.00011712312698364258, 0.00012227147817611694, 0.0001274198293685913, 0.00013256818056106567, 0.00013771653175354004, 0.0001428648829460144, 0.00014801323413848877, 0.00015316158533096313, 0.0001583099365234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 4.0, 9.0, 21.0, 33.0, 27.0, 34.0, 55.0, 73.0, 96.0, 188.0, 247.0, 418.0, 690.0, 1300.0, 2501.0, 5832.0, 16258.0, 58073.0, 628747.0, 270793.0, 41324.0, 12334.0, 4660.0, 2054.0, 1016.0, 604.0, 416.0, 210.0, 169.0, 95.0, 68.0, 47.0, 34.0, 31.0, 23.0, 11.0, 23.0, 8.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6478195190429688, -0.6227874755859375, -0.5977554321289062, -0.572723388671875, -0.5476913452148438, -0.5226593017578125, -0.49762725830078125, -0.47259521484375, -0.44756317138671875, -0.4225311279296875, -0.39749908447265625, -0.372467041015625, -0.34743499755859375, -0.3224029541015625, -0.29737091064453125, -0.2723388671875, -0.24730682373046875, -0.2222747802734375, -0.19724273681640625, -0.172210693359375, -0.14717864990234375, -0.1221466064453125, -0.09711456298828125, -0.07208251953125, -0.04705047607421875, -0.0220184326171875, 0.00301361083984375, 0.028045654296875, 0.05307769775390625, 0.0781097412109375, 0.10314178466796875, 0.128173828125, 0.15320587158203125, 0.1782379150390625, 0.20326995849609375, 0.228302001953125, 0.25333404541015625, 0.2783660888671875, 0.30339813232421875, 0.32843017578125, 0.35346221923828125, 0.3784942626953125, 0.40352630615234375, 0.428558349609375, 0.45359039306640625, 0.4786224365234375, 0.5036544799804688, 0.5286865234375, 0.5537185668945312, 0.5787506103515625, 0.6037826538085938, 0.628814697265625, 0.6538467407226562, 0.6788787841796875, 0.7039108276367188, 0.72894287109375, 0.7539749145507812, 0.7790069580078125, 0.8040390014648438, 0.829071044921875, 0.8541030883789062, 0.8791351318359375, 0.9041671752929688, 0.92919921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 11.0, 17.0, 14.0, 25.0, 20.0, 28.0, 43.0, 79.0, 148.0, 268.0, 110.0, 56.0, 30.0, 31.0, 23.0, 15.0, 6.0, 13.0, 14.0, 8.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5324821472167969, -0.5185775756835938, -0.5046730041503906, -0.4907684326171875, -0.4768638610839844, -0.46295928955078125, -0.4490547180175781, -0.435150146484375, -0.4212455749511719, -0.40734100341796875, -0.3934364318847656, -0.3795318603515625, -0.3656272888183594, -0.35172271728515625, -0.3378181457519531, -0.32391357421875, -0.3100090026855469, -0.29610443115234375, -0.2821998596191406, -0.2682952880859375, -0.2543907165527344, -0.24048614501953125, -0.22658157348632812, -0.212677001953125, -0.19877243041992188, -0.18486785888671875, -0.17096328735351562, -0.1570587158203125, -0.14315414428710938, -0.12924957275390625, -0.11534500122070312, -0.1014404296875, -0.08753585815429688, -0.07363128662109375, -0.059726715087890625, -0.0458221435546875, -0.031917572021484375, -0.01801300048828125, -0.004108428955078125, 0.009796142578125, 0.023700714111328125, 0.03760528564453125, 0.051509857177734375, 0.0654144287109375, 0.07931900024414062, 0.09322357177734375, 0.10712814331054688, 0.12103271484375, 0.13493728637695312, 0.14884185791015625, 0.16274642944335938, 0.1766510009765625, 0.19055557250976562, 0.20446014404296875, 0.21836471557617188, 0.232269287109375, 0.24617385864257812, 0.26007843017578125, 0.2739830017089844, 0.2878875732421875, 0.3017921447753906, 0.31569671630859375, 0.3296012878417969, 0.343505859375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 18.0, 40.0, 59.0, 119.0, 171.0, 201.0, 152.0, 99.0, 57.0, 18.0, 12.0, 11.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.252156257629395, -11.931120872497559, -11.610086441040039, -11.289051055908203, -10.968015670776367, -10.646981239318848, -10.325945854187012, -10.004911422729492, -9.683876037597656, -9.36284065246582, -9.0418062210083, -8.720770835876465, -8.399736404418945, -8.07870101928711, -7.757665634155273, -7.436630725860596, -7.115595817565918, -6.79456090927124, -6.4735260009765625, -6.152490615844727, -5.831455707550049, -5.510420799255371, -5.189385414123535, -4.868350505828857, -4.54731559753418, -4.226280689239502, -3.905245542526245, -3.5842103958129883, -3.2631754875183105, -2.942140579223633, -2.621105432510376, -2.300070285797119, -1.979034423828125, -1.6579993963241577, -1.3369643688201904, -1.0159293413162231, -0.6948943138122559, -0.3738592863082886, -0.05282425880432129, 0.26821088790893555, 0.5892457962036133, 0.9102808237075806, 1.2313158512115479, 1.5523508787155151, 1.8733859062194824, 2.19442081451416, 2.515455961227417, 2.836491107940674, 3.1575260162353516, 3.4785609245300293, 3.799596071243286, 4.120631217956543, 4.441666126251221, 4.762701034545898, 5.083736419677734, 5.404771327972412, 5.72580623626709, 6.046841144561768, 6.367876052856445, 6.688911437988281, 7.009946346282959, 7.330981254577637, 7.652016639709473, 7.97305154800415, 8.294086456298828]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 9.0, 6.0, 8.0, 9.0, 7.0, 12.0, 19.0, 14.0, 24.0, 23.0, 16.0, 33.0, 33.0, 30.0, 51.0, 32.0, 39.0, 39.0, 33.0, 42.0, 40.0, 42.0, 39.0, 47.0, 31.0, 34.0, 30.0, 32.0, 28.0, 24.0, 27.0, 20.0, 18.0, 20.0, 16.0, 10.0, 8.0, 10.0, 11.0, 3.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.865767955780029, -6.648454189300537, -6.431140899658203, -6.213827133178711, -5.996513366699219, -5.779199600219727, -5.561886310577393, -5.3445725440979, -5.127259254455566, -4.909945487976074, -4.69263219833374, -4.475318431854248, -4.258004665374756, -4.040691375732422, -3.8233776092529297, -3.6060638427734375, -3.3887500762939453, -3.1714365482330322, -2.95412278175354, -2.736809253692627, -2.5194954872131348, -2.3021819591522217, -2.0848684310913086, -1.867554783821106, -1.6502411365509033, -1.4329274892807007, -1.215613842010498, -0.998300313949585, -0.7809866666793823, -0.5636730194091797, -0.3463594913482666, -0.12904584407806396, 0.08826780319213867, 0.3055814206600189, 0.5228950381278992, 0.740208625793457, 0.9575222730636597, 1.1748359203338623, 1.3921494483947754, 1.609463095664978, 1.8267767429351807, 2.0440902709960938, 2.261404037475586, 2.478717565536499, 2.696031093597412, 2.9133448600769043, 3.1306583881378174, 3.3479719161987305, 3.5652856826782227, 3.7825992107391357, 3.999912977218628, 4.217226505279541, 4.434540271759033, 4.651853561401367, 4.869167327880859, 5.086481094360352, 5.303794860839844, 5.521108627319336, 5.73842191696167, 5.955735683441162, 6.173049449920654, 6.390362739562988, 6.6076765060424805, 6.824990272521973, 7.042303562164307]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 4.0, 6.0, 7.0, 13.0, 8.0, 10.0, 18.0, 14.0, 19.0, 29.0, 31.0, 28.0, 36.0, 65.0, 63.0, 146.0, 381.0, 1291.0, 8039.0, 420991.0, 3742443.0, 17454.0, 2084.0, 512.0, 181.0, 95.0, 60.0, 32.0, 29.0, 25.0, 22.0, 25.0, 15.0, 19.0, 14.0, 12.0, 8.0, 10.0, 10.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.234375, -9.90576171875, -9.5771484375, -9.24853515625, -8.919921875, -8.59130859375, -8.2626953125, -7.93408203125, -7.60546875, -7.27685546875, -6.9482421875, -6.61962890625, -6.291015625, -5.96240234375, -5.6337890625, -5.30517578125, -4.9765625, -4.64794921875, -4.3193359375, -3.99072265625, -3.662109375, -3.33349609375, -3.0048828125, -2.67626953125, -2.34765625, -2.01904296875, -1.6904296875, -1.36181640625, -1.033203125, -0.70458984375, -0.3759765625, -0.04736328125, 0.28125, 0.60986328125, 0.9384765625, 1.26708984375, 1.595703125, 1.92431640625, 2.2529296875, 2.58154296875, 2.91015625, 3.23876953125, 3.5673828125, 3.89599609375, 4.224609375, 4.55322265625, 4.8818359375, 5.21044921875, 5.5390625, 5.86767578125, 6.1962890625, 6.52490234375, 6.853515625, 7.18212890625, 7.5107421875, 7.83935546875, 8.16796875, 8.49658203125, 8.8251953125, 9.15380859375, 9.482421875, 9.81103515625, 10.1396484375, 10.46826171875, 10.796875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 4.0, 5.0, 10.0, 16.0, 25.0, 30.0, 39.0, 48.0, 59.0, 74.0, 79.0, 79.0, 100.0, 67.0, 65.0, 42.0, 55.0, 45.0, 33.0, 24.0, 21.0, 14.0, 11.0, 7.0, 5.0, 12.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6484375, -2.56622314453125, -2.4840087890625, -2.40179443359375, -2.319580078125, -2.23736572265625, -2.1551513671875, -2.07293701171875, -1.99072265625, -1.90850830078125, -1.8262939453125, -1.74407958984375, -1.661865234375, -1.57965087890625, -1.4974365234375, -1.41522216796875, -1.3330078125, -1.25079345703125, -1.1685791015625, -1.08636474609375, -1.004150390625, -0.92193603515625, -0.8397216796875, -0.75750732421875, -0.67529296875, -0.59307861328125, -0.5108642578125, -0.42864990234375, -0.346435546875, -0.26422119140625, -0.1820068359375, -0.09979248046875, -0.017578125, 0.06463623046875, 0.1468505859375, 0.22906494140625, 0.311279296875, 0.39349365234375, 0.4757080078125, 0.55792236328125, 0.64013671875, 0.72235107421875, 0.8045654296875, 0.88677978515625, 0.968994140625, 1.05120849609375, 1.1334228515625, 1.21563720703125, 1.2978515625, 1.38006591796875, 1.4622802734375, 1.54449462890625, 1.626708984375, 1.70892333984375, 1.7911376953125, 1.87335205078125, 1.95556640625, 2.03778076171875, 2.1199951171875, 2.20220947265625, 2.284423828125, 2.36663818359375, 2.4488525390625, 2.53106689453125, 2.61328125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 6.0, 12.0, 16.0, 21.0, 23.0, 39.0, 45.0, 76.0, 111.0, 169.0, 299.0, 537.0, 1162.0, 2935.0, 8986.0, 41242.0, 446868.0, 3515388.0, 145228.0, 21435.0, 5792.0, 1982.0, 859.0, 420.0, 225.0, 134.0, 85.0, 53.0, 31.0, 25.0, 13.0, 25.0, 8.0, 6.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5859375, -4.43463134765625, -4.2833251953125, -4.13201904296875, -3.980712890625, -3.82940673828125, -3.6781005859375, -3.52679443359375, -3.37548828125, -3.22418212890625, -3.0728759765625, -2.92156982421875, -2.770263671875, -2.61895751953125, -2.4676513671875, -2.31634521484375, -2.1650390625, -2.01373291015625, -1.8624267578125, -1.71112060546875, -1.559814453125, -1.40850830078125, -1.2572021484375, -1.10589599609375, -0.95458984375, -0.80328369140625, -0.6519775390625, -0.50067138671875, -0.349365234375, -0.19805908203125, -0.0467529296875, 0.10455322265625, 0.255859375, 0.40716552734375, 0.5584716796875, 0.70977783203125, 0.861083984375, 1.01239013671875, 1.1636962890625, 1.31500244140625, 1.46630859375, 1.61761474609375, 1.7689208984375, 1.92022705078125, 2.071533203125, 2.22283935546875, 2.3741455078125, 2.52545166015625, 2.6767578125, 2.82806396484375, 2.9793701171875, 3.13067626953125, 3.281982421875, 3.43328857421875, 3.5845947265625, 3.73590087890625, 3.88720703125, 4.03851318359375, 4.1898193359375, 4.34112548828125, 4.492431640625, 4.64373779296875, 4.7950439453125, 4.94635009765625, 5.09765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 1.0, 6.0, 7.0, 11.0, 11.0, 8.0, 14.0, 24.0, 23.0, 26.0, 48.0, 57.0, 90.0, 122.0, 173.0, 355.0, 551.0, 960.0, 554.0, 342.0, 177.0, 133.0, 73.0, 68.0, 49.0, 44.0, 29.0, 17.0, 23.0, 15.0, 9.0, 8.0, 9.0, 5.0, 8.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8125, -0.7829437255859375, -0.753387451171875, -0.7238311767578125, -0.69427490234375, -0.6647186279296875, -0.635162353515625, -0.6056060791015625, -0.5760498046875, -0.5464935302734375, -0.516937255859375, -0.4873809814453125, -0.45782470703125, -0.4282684326171875, -0.398712158203125, -0.3691558837890625, -0.339599609375, -0.3100433349609375, -0.280487060546875, -0.2509307861328125, -0.22137451171875, -0.1918182373046875, -0.162261962890625, -0.1327056884765625, -0.1031494140625, -0.0735931396484375, -0.044036865234375, -0.0144805908203125, 0.01507568359375, 0.0446319580078125, 0.074188232421875, 0.1037445068359375, 0.13330078125, 0.1628570556640625, 0.192413330078125, 0.2219696044921875, 0.25152587890625, 0.2810821533203125, 0.310638427734375, 0.3401947021484375, 0.3697509765625, 0.3993072509765625, 0.428863525390625, 0.4584197998046875, 0.48797607421875, 0.5175323486328125, 0.547088623046875, 0.5766448974609375, 0.606201171875, 0.6357574462890625, 0.665313720703125, 0.6948699951171875, 0.72442626953125, 0.7539825439453125, 0.783538818359375, 0.8130950927734375, 0.8426513671875, 0.8722076416015625, 0.901763916015625, 0.9313201904296875, 0.96087646484375, 0.9904327392578125, 1.019989013671875, 1.0495452880859375, 1.0791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 17.0, 30.0, 35.0, 57.0, 92.0, 98.0, 138.0, 141.0, 114.0, 84.0, 57.0, 45.0, 32.0, 20.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7026777267456055, -5.529074192047119, -5.355470657348633, -5.181866645812988, -5.008263111114502, -4.834659576416016, -4.661056041717529, -4.487452507019043, -4.313848495483398, -4.140244960784912, -3.9666411876678467, -3.7930376529693604, -3.619433879852295, -3.4458303451538086, -3.2722268104553223, -3.098623037338257, -2.9250195026397705, -2.751415967941284, -2.5778121948242188, -2.4042086601257324, -2.230604887008667, -2.0570013523101807, -1.8833976984024048, -1.709794044494629, -1.536190390586853, -1.3625867366790771, -1.1889830827713013, -1.0153794288635254, -0.8417758345603943, -0.6681721806526184, -0.4945685863494873, -0.3209649324417114, -0.14736127853393555, 0.026242360472679138, 0.19984599947929382, 0.3734496235847473, 0.5470532774925232, 0.7206569314002991, 0.8942605257034302, 1.067864179611206, 1.241467833518982, 1.4150714874267578, 1.5886751413345337, 1.7622787952423096, 1.935882329940796, 2.1094861030578613, 2.2830896377563477, 2.456693172454834, 2.6302969455718994, 2.8039004802703857, 2.977504253387451, 3.1511077880859375, 3.324711561203003, 3.4983150959014893, 3.6719188690185547, 3.845522403717041, 4.019125938415527, 4.192729473114014, 4.3663330078125, 4.5399370193481445, 4.713540554046631, 4.887144088745117, 5.0607476234436035, 5.23435115814209, 5.407955169677734]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 1.0, 3.0, 9.0, 5.0, 6.0, 17.0, 18.0, 22.0, 21.0, 19.0, 18.0, 27.0, 25.0, 41.0, 47.0, 38.0, 40.0, 60.0, 36.0, 49.0, 53.0, 59.0, 40.0, 40.0, 30.0, 42.0, 43.0, 32.0, 30.0, 20.0, 17.0, 14.0, 12.0, 17.0, 5.0, 8.0, 9.0, 6.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.693044662475586, -2.616018772125244, -2.5389928817749023, -2.4619669914245605, -2.3849408626556396, -2.307914972305298, -2.230889081954956, -2.1538631916046143, -2.0768373012542725, -1.9998114109039307, -1.9227854013442993, -1.8457595109939575, -1.7687336206436157, -1.6917076110839844, -1.6146817207336426, -1.5376558303833008, -1.4606298208236694, -1.3836039304733276, -1.3065779209136963, -1.2295520305633545, -1.1525261402130127, -1.075500249862671, -0.9984742403030396, -0.9214483499526978, -0.8444223999977112, -0.7673964500427246, -0.6903705596923828, -0.6133446097373962, -0.5363186597824097, -0.45929276943206787, -0.3822668194770813, -0.3052409291267395, -0.22821497917175293, -0.15118905901908875, -0.07416312396526337, 0.0028628110885620117, 0.0798887312412262, 0.15691465139389038, 0.23394060134887695, 0.31096649169921875, 0.3879924416542053, 0.4650183618068695, 0.5420442819595337, 0.6190702319145203, 0.6960961818695068, 0.7731220722198486, 0.8501480221748352, 0.927173912525177, 1.0041998624801636, 1.0812257528305054, 1.1582517623901367, 1.2352776527404785, 1.3123035430908203, 1.389329433441162, 1.4663554430007935, 1.5433813333511353, 1.6204073429107666, 1.6974332332611084, 1.7744592428207397, 1.8514851331710815, 1.9285110235214233, 2.0055370330810547, 2.0825629234313965, 2.1595888137817383, 2.23661470413208]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 6.0, 5.0, 5.0, 8.0, 3.0, 13.0, 11.0, 15.0, 18.0, 29.0, 45.0, 32.0, 53.0, 59.0, 94.0, 122.0, 169.0, 230.0, 281.0, 457.0, 706.0, 1228.0, 2942.0, 9294.0, 45664.0, 395215.0, 513280.0, 59956.0, 11229.0, 3442.0, 1423.0, 745.0, 494.0, 313.0, 233.0, 174.0, 136.0, 87.0, 71.0, 52.0, 49.0, 42.0, 27.0, 25.0, 11.0, 10.0, 9.0, 9.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.386474609375, -0.3744239807128906, -0.36237335205078125, -0.3503227233886719, -0.3382720947265625, -0.3262214660644531, -0.31417083740234375, -0.3021202087402344, -0.290069580078125, -0.2780189514160156, -0.26596832275390625, -0.2539176940917969, -0.2418670654296875, -0.22981643676757812, -0.21776580810546875, -0.20571517944335938, -0.19366455078125, -0.18161392211914062, -0.16956329345703125, -0.15751266479492188, -0.1454620361328125, -0.13341140747070312, -0.12136077880859375, -0.10931015014648438, -0.097259521484375, -0.08520889282226562, -0.07315826416015625, -0.061107635498046875, -0.0490570068359375, -0.037006378173828125, -0.02495574951171875, -0.012905120849609375, -0.0008544921875, 0.011196136474609375, 0.02324676513671875, 0.035297393798828125, 0.0473480224609375, 0.059398651123046875, 0.07144927978515625, 0.08349990844726562, 0.095550537109375, 0.10760116577148438, 0.11965179443359375, 0.13170242309570312, 0.1437530517578125, 0.15580368041992188, 0.16785430908203125, 0.17990493774414062, 0.19195556640625, 0.20400619506835938, 0.21605682373046875, 0.22810745239257812, 0.2401580810546875, 0.2522087097167969, 0.26425933837890625, 0.2763099670410156, 0.288360595703125, 0.3004112243652344, 0.31246185302734375, 0.3245124816894531, 0.3365631103515625, 0.3486137390136719, 0.36066436767578125, 0.3727149963378906, 0.384765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 3.0, 8.0, 7.0, 7.0, 10.0, 23.0, 16.0, 26.0, 24.0, 30.0, 27.0, 43.0, 32.0, 45.0, 49.0, 41.0, 50.0, 54.0, 55.0, 48.0, 54.0, 38.0, 38.0, 36.0, 33.0, 31.0, 23.0, 30.0, 16.0, 21.0, 14.0, 7.0, 9.0, 12.0, 7.0, 6.0, 7.0, 0.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9794921875, -1.919189453125, -1.85888671875, -1.798583984375, -1.73828125, -1.677978515625, -1.61767578125, -1.557373046875, -1.4970703125, -1.436767578125, -1.37646484375, -1.316162109375, -1.255859375, -1.195556640625, -1.13525390625, -1.074951171875, -1.0146484375, -0.954345703125, -0.89404296875, -0.833740234375, -0.7734375, -0.713134765625, -0.65283203125, -0.592529296875, -0.5322265625, -0.471923828125, -0.41162109375, -0.351318359375, -0.291015625, -0.230712890625, -0.17041015625, -0.110107421875, -0.0498046875, 0.010498046875, 0.07080078125, 0.131103515625, 0.19140625, 0.251708984375, 0.31201171875, 0.372314453125, 0.4326171875, 0.492919921875, 0.55322265625, 0.613525390625, 0.673828125, 0.734130859375, 0.79443359375, 0.854736328125, 0.9150390625, 0.975341796875, 1.03564453125, 1.095947265625, 1.15625, 1.216552734375, 1.27685546875, 1.337158203125, 1.3974609375, 1.457763671875, 1.51806640625, 1.578369140625, 1.638671875, 1.698974609375, 1.75927734375, 1.819580078125, 1.8798828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 7.0, 3.0, 5.0, 6.0, 12.0, 18.0, 29.0, 36.0, 23.0, 37.0, 50.0, 81.0, 85.0, 139.0, 156.0, 265.0, 427.0, 688.0, 1883.0, 11682.0, 139734.0, 743926.0, 134243.0, 11061.0, 1851.0, 656.0, 409.0, 299.0, 185.0, 140.0, 115.0, 78.0, 46.0, 33.0, 34.0, 24.0, 28.0, 15.0, 11.0, 7.0, 11.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349365234375, -0.3379058837890625, -0.326446533203125, -0.3149871826171875, -0.30352783203125, -0.2920684814453125, -0.280609130859375, -0.2691497802734375, -0.2576904296875, -0.2462310791015625, -0.234771728515625, -0.2233123779296875, -0.21185302734375, -0.2003936767578125, -0.188934326171875, -0.1774749755859375, -0.166015625, -0.1545562744140625, -0.143096923828125, -0.1316375732421875, -0.12017822265625, -0.1087188720703125, -0.097259521484375, -0.0858001708984375, -0.0743408203125, -0.0628814697265625, -0.051422119140625, -0.0399627685546875, -0.02850341796875, -0.0170440673828125, -0.005584716796875, 0.0058746337890625, 0.017333984375, 0.0287933349609375, 0.040252685546875, 0.0517120361328125, 0.06317138671875, 0.0746307373046875, 0.086090087890625, 0.0975494384765625, 0.1090087890625, 0.1204681396484375, 0.131927490234375, 0.1433868408203125, 0.15484619140625, 0.1663055419921875, 0.177764892578125, 0.1892242431640625, 0.20068359375, 0.2121429443359375, 0.223602294921875, 0.2350616455078125, 0.24652099609375, 0.2579803466796875, 0.269439697265625, 0.2808990478515625, 0.2923583984375, 0.3038177490234375, 0.315277099609375, 0.3267364501953125, 0.33819580078125, 0.3496551513671875, 0.361114501953125, 0.3725738525390625, 0.384033203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 9.0, 10.0, 11.0, 13.0, 15.0, 9.0, 21.0, 18.0, 27.0, 25.0, 25.0, 34.0, 51.0, 37.0, 45.0, 43.0, 43.0, 48.0, 57.0, 46.0, 55.0, 50.0, 35.0, 25.0, 27.0, 32.0, 27.0, 20.0, 24.0, 23.0, 15.0, 14.0, 6.0, 11.0, 13.0, 9.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.94140625, -3.824005126953125, -3.70660400390625, -3.589202880859375, -3.4718017578125, -3.354400634765625, -3.23699951171875, -3.119598388671875, -3.002197265625, -2.884796142578125, -2.76739501953125, -2.649993896484375, -2.5325927734375, -2.415191650390625, -2.29779052734375, -2.180389404296875, -2.06298828125, -1.945587158203125, -1.82818603515625, -1.710784912109375, -1.5933837890625, -1.475982666015625, -1.35858154296875, -1.241180419921875, -1.123779296875, -1.006378173828125, -0.88897705078125, -0.771575927734375, -0.6541748046875, -0.536773681640625, -0.41937255859375, -0.301971435546875, -0.1845703125, -0.067169189453125, 0.05023193359375, 0.167633056640625, 0.2850341796875, 0.402435302734375, 0.51983642578125, 0.637237548828125, 0.754638671875, 0.872039794921875, 0.98944091796875, 1.106842041015625, 1.2242431640625, 1.341644287109375, 1.45904541015625, 1.576446533203125, 1.69384765625, 1.811248779296875, 1.92864990234375, 2.046051025390625, 2.1634521484375, 2.280853271484375, 2.39825439453125, 2.515655517578125, 2.633056640625, 2.750457763671875, 2.86785888671875, 2.985260009765625, 3.1026611328125, 3.220062255859375, 3.33746337890625, 3.454864501953125, 3.572265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 13.0, 8.0, 20.0, 22.0, 33.0, 37.0, 63.0, 98.0, 132.0, 243.0, 463.0, 1396.0, 11687.0, 986151.0, 44240.0, 2437.0, 659.0, 312.0, 159.0, 112.0, 74.0, 47.0, 30.0, 14.0, 17.0, 9.0, 10.0, 10.0, 10.0, 2.0, 3.0, 11.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1300373077392578, -0.12579727172851562, -0.12155723571777344, -0.11731719970703125, -0.11307716369628906, -0.10883712768554688, -0.10459709167480469, -0.1003570556640625, -0.09611701965332031, -0.09187698364257812, -0.08763694763183594, -0.08339691162109375, -0.07915687561035156, -0.07491683959960938, -0.07067680358886719, -0.066436767578125, -0.06219673156738281, -0.057956695556640625, -0.05371665954589844, -0.04947662353515625, -0.04523658752441406, -0.040996551513671875, -0.03675651550292969, -0.0325164794921875, -0.028276443481445312, -0.024036407470703125, -0.019796371459960938, -0.01555633544921875, -0.011316299438476562, -0.007076263427734375, -0.0028362274169921875, 0.00140380859375, 0.0056438446044921875, 0.009883880615234375, 0.014123916625976562, 0.01836395263671875, 0.022603988647460938, 0.026844024658203125, 0.031084060668945312, 0.0353240966796875, 0.03956413269042969, 0.043804168701171875, 0.04804420471191406, 0.05228424072265625, 0.05652427673339844, 0.060764312744140625, 0.06500434875488281, 0.069244384765625, 0.07348442077636719, 0.07772445678710938, 0.08196449279785156, 0.08620452880859375, 0.09044456481933594, 0.09468460083007812, 0.09892463684082031, 0.1031646728515625, 0.10740470886230469, 0.11164474487304688, 0.11588478088378906, 0.12012481689453125, 0.12436485290527344, 0.12860488891601562, 0.1328449249267578, 0.1370849609375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 6.0, 18.0, 24.0, 24.0, 32.0, 44.0, 64.0, 70.0, 96.0, 89.0, 105.0, 80.0, 87.0, 68.0, 49.0, 28.0, 23.0, 19.0, 18.0, 11.0, 6.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.081560134887695e-05, -2.9820017516613007e-05, -2.882443368434906e-05, -2.7828849852085114e-05, -2.6833266019821167e-05, -2.583768218755722e-05, -2.4842098355293274e-05, -2.3846514523029327e-05, -2.285093069076538e-05, -2.1855346858501434e-05, -2.0859763026237488e-05, -1.986417919397354e-05, -1.8868595361709595e-05, -1.7873011529445648e-05, -1.68774276971817e-05, -1.5881843864917755e-05, -1.4886260032653809e-05, -1.3890676200389862e-05, -1.2895092368125916e-05, -1.1899508535861969e-05, -1.0903924703598022e-05, -9.908340871334076e-06, -8.91275703907013e-06, -7.917173206806183e-06, -6.921589374542236e-06, -5.92600554227829e-06, -4.930421710014343e-06, -3.934837877750397e-06, -2.93925404548645e-06, -1.9436702132225037e-06, -9.480863809585571e-07, 4.7497451305389404e-08, 1.043081283569336e-06, 2.0386651158332825e-06, 3.034248948097229e-06, 4.0298327803611755e-06, 5.025416612625122e-06, 6.021000444889069e-06, 7.016584277153015e-06, 8.012168109416962e-06, 9.007751941680908e-06, 1.0003335773944855e-05, 1.0998919606208801e-05, 1.1994503438472748e-05, 1.2990087270736694e-05, 1.3985671103000641e-05, 1.4981254935264587e-05, 1.5976838767528534e-05, 1.697242259979248e-05, 1.7968006432056427e-05, 1.8963590264320374e-05, 1.995917409658432e-05, 2.0954757928848267e-05, 2.1950341761112213e-05, 2.294592559337616e-05, 2.3941509425640106e-05, 2.4937093257904053e-05, 2.5932677090168e-05, 2.6928260922431946e-05, 2.7923844754695892e-05, 2.891942858695984e-05, 2.9915012419223785e-05, 3.091059625148773e-05, 3.190618008375168e-05, 3.2901763916015625e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 9.0, 11.0, 30.0, 29.0, 27.0, 76.0, 72.0, 94.0, 170.0, 246.0, 412.0, 692.0, 1265.0, 2439.0, 5321.0, 15654.0, 108819.0, 838859.0, 54273.0, 11197.0, 4139.0, 1953.0, 1079.0, 589.0, 354.0, 217.0, 144.0, 109.0, 67.0, 49.0, 35.0, 22.0, 21.0, 17.0, 4.0, 7.0, 9.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09735107421875, -0.0939188003540039, -0.09048652648925781, -0.08705425262451172, -0.08362197875976562, -0.08018970489501953, -0.07675743103027344, -0.07332515716552734, -0.06989288330078125, -0.06646060943603516, -0.06302833557128906, -0.05959606170654297, -0.056163787841796875, -0.05273151397705078, -0.04929924011230469, -0.045866966247558594, -0.0424346923828125, -0.039002418518066406, -0.03557014465332031, -0.03213787078857422, -0.028705596923828125, -0.02527332305908203, -0.021841049194335938, -0.018408775329589844, -0.01497650146484375, -0.011544227600097656, -0.008111953735351562, -0.004679679870605469, -0.001247406005859375, 0.0021848678588867188, 0.0056171417236328125, 0.009049415588378906, 0.012481689453125, 0.015913963317871094, 0.019346237182617188, 0.02277851104736328, 0.026210784912109375, 0.02964305877685547, 0.03307533264160156, 0.036507606506347656, 0.03993988037109375, 0.043372154235839844, 0.04680442810058594, 0.05023670196533203, 0.053668975830078125, 0.05710124969482422, 0.06053352355957031, 0.0639657974243164, 0.0673980712890625, 0.0708303451538086, 0.07426261901855469, 0.07769489288330078, 0.08112716674804688, 0.08455944061279297, 0.08799171447753906, 0.09142398834228516, 0.09485626220703125, 0.09828853607177734, 0.10172080993652344, 0.10515308380126953, 0.10858535766601562, 0.11201763153076172, 0.11544990539550781, 0.1188821792602539, 0.122314453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 11.0, 12.0, 15.0, 35.0, 62.0, 122.0, 315.0, 193.0, 84.0, 36.0, 23.0, 16.0, 15.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.031201839447021484, -0.03011608123779297, -0.029030323028564453, -0.027944564819335938, -0.026858806610107422, -0.025773048400878906, -0.02468729019165039, -0.023601531982421875, -0.02251577377319336, -0.021430015563964844, -0.020344257354736328, -0.019258499145507812, -0.018172740936279297, -0.01708698272705078, -0.016001224517822266, -0.01491546630859375, -0.013829708099365234, -0.012743949890136719, -0.011658191680908203, -0.010572433471679688, -0.009486675262451172, -0.008400917053222656, -0.007315158843994141, -0.006229400634765625, -0.005143642425537109, -0.004057884216308594, -0.002972126007080078, -0.0018863677978515625, -0.0008006095886230469, 0.00028514862060546875, 0.0013709068298339844, 0.0024566650390625, 0.0035424232482910156, 0.004628181457519531, 0.005713939666748047, 0.0067996978759765625, 0.007885456085205078, 0.008971214294433594, 0.01005697250366211, 0.011142730712890625, 0.01222848892211914, 0.013314247131347656, 0.014400005340576172, 0.015485763549804688, 0.016571521759033203, 0.01765727996826172, 0.018743038177490234, 0.01982879638671875, 0.020914554595947266, 0.02200031280517578, 0.023086071014404297, 0.024171829223632812, 0.025257587432861328, 0.026343345642089844, 0.02742910385131836, 0.028514862060546875, 0.02960062026977539, 0.030686378479003906, 0.03177213668823242, 0.03285789489746094, 0.03394365310668945, 0.03502941131591797, 0.036115169525146484, 0.037200927734375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 25.0, 52.0, 115.0, 198.0, 226.0, 163.0, 115.0, 47.0, 28.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.30893611907959, -9.089130401611328, -8.869325637817383, -8.649519920349121, -8.42971420288086, -8.209908485412598, -7.990103244781494, -7.770298004150391, -7.550492286682129, -7.330686569213867, -7.110881328582764, -6.89107608795166, -6.671270370483398, -6.451464653015137, -6.231659412384033, -6.01185417175293, -5.792048454284668, -5.572242736816406, -5.352437496185303, -5.132632255554199, -4.9128265380859375, -4.693020820617676, -4.473215579986572, -4.253410339355469, -4.033604621887207, -3.8137991428375244, -3.593993663787842, -3.374188184738159, -3.1543827056884766, -2.934577226638794, -2.7147717475891113, -2.4949662685394287, -2.2751612663269043, -2.0553557872772217, -1.835550308227539, -1.6157448291778564, -1.3959393501281738, -1.1761338710784912, -0.9563283920288086, -0.736522912979126, -0.5167174339294434, -0.29691195487976074, -0.07710647583007812, 0.1426990032196045, 0.3625044822692871, 0.5823099613189697, 0.8021154403686523, 1.021920919418335, 1.2417263984680176, 1.4615318775177002, 1.6813373565673828, 1.9011428356170654, 2.120948314666748, 2.3407537937164307, 2.5605592727661133, 2.780364751815796, 3.0001702308654785, 3.219975709915161, 3.4397811889648438, 3.6595866680145264, 3.879392147064209, 4.0991973876953125, 4.319003105163574, 4.538808822631836, 4.7586140632629395]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 10.0, 6.0, 15.0, 25.0, 22.0, 26.0, 25.0, 26.0, 36.0, 49.0, 47.0, 41.0, 65.0, 43.0, 70.0, 48.0, 59.0, 51.0, 47.0, 51.0, 36.0, 32.0, 32.0, 24.0, 17.0, 18.0, 12.0, 9.0, 8.0, 8.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1779773235321045, -2.1129143238067627, -2.0478515625, -1.9827885627746582, -1.917725682258606, -1.8526628017425537, -1.787599802017212, -1.7225369215011597, -1.6574740409851074, -1.5924111604690552, -1.527348279953003, -1.4622852802276611, -1.3972223997116089, -1.3321595191955566, -1.2670965194702148, -1.2020336389541626, -1.1369707584381104, -1.071907877922058, -1.0068449974060059, -0.9417819976806641, -0.8767191171646118, -0.8116562366485596, -0.7465932965278625, -0.6815303564071655, -0.6164674758911133, -0.551404595375061, -0.486341655254364, -0.4212787449359894, -0.35621583461761475, -0.2911529242992401, -0.22609001398086548, -0.16102710366249084, -0.09596407413482666, -0.030901163816452026, 0.03416174650192261, 0.09922465682029724, 0.16428756713867188, 0.2293504774570465, 0.29441338777542114, 0.3594762980937958, 0.4245392084121704, 0.48960211873054504, 0.5546650290489197, 0.6197279691696167, 0.684790849685669, 0.7498537302017212, 0.8149166703224182, 0.8799796104431152, 0.9450424909591675, 1.0101053714752197, 1.0751683712005615, 1.1402312517166138, 1.205294132232666, 1.2703570127487183, 1.3354198932647705, 1.4004828929901123, 1.4655457735061646, 1.5306086540222168, 1.5956716537475586, 1.6607345342636108, 1.725797414779663, 1.7908602952957153, 1.8559231758117676, 1.9209861755371094, 1.9860490560531616]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 9.0, 11.0, 6.0, 14.0, 21.0, 33.0, 43.0, 65.0, 85.0, 163.0, 270.0, 515.0, 836.0, 1559.0, 3286.0, 6956.0, 16265.0, 44190.0, 148082.0, 612129.0, 141703.0, 42980.0, 15842.0, 6833.0, 3151.0, 1482.0, 833.0, 451.0, 271.0, 157.0, 108.0, 63.0, 43.0, 33.0, 21.0, 9.0, 9.0, 7.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.214813232421875, -2.14447021484375, -2.074127197265625, -2.0037841796875, -1.933441162109375, -1.86309814453125, -1.792755126953125, -1.722412109375, -1.652069091796875, -1.58172607421875, -1.511383056640625, -1.4410400390625, -1.370697021484375, -1.30035400390625, -1.230010986328125, -1.15966796875, -1.089324951171875, -1.01898193359375, -0.948638916015625, -0.8782958984375, -0.807952880859375, -0.73760986328125, -0.667266845703125, -0.596923828125, -0.526580810546875, -0.45623779296875, -0.385894775390625, -0.3155517578125, -0.245208740234375, -0.17486572265625, -0.104522705078125, -0.0341796875, 0.036163330078125, 0.10650634765625, 0.176849365234375, 0.2471923828125, 0.317535400390625, 0.38787841796875, 0.458221435546875, 0.528564453125, 0.598907470703125, 0.66925048828125, 0.739593505859375, 0.8099365234375, 0.880279541015625, 0.95062255859375, 1.020965576171875, 1.09130859375, 1.161651611328125, 1.23199462890625, 1.302337646484375, 1.3726806640625, 1.443023681640625, 1.51336669921875, 1.583709716796875, 1.654052734375, 1.724395751953125, 1.79473876953125, 1.865081787109375, 1.9354248046875, 2.005767822265625, 2.07611083984375, 2.146453857421875, 2.216796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 8.0, 6.0, 10.0, 15.0, 20.0, 19.0, 30.0, 43.0, 39.0, 50.0, 42.0, 56.0, 64.0, 67.0, 75.0, 78.0, 57.0, 50.0, 44.0, 42.0, 39.0, 30.0, 17.0, 17.0, 15.0, 18.0, 3.0, 6.0, 9.0, 1.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.191650390625, -4.04736328125, -3.903076171875, -3.7587890625, -3.614501953125, -3.47021484375, -3.325927734375, -3.181640625, -3.037353515625, -2.89306640625, -2.748779296875, -2.6044921875, -2.460205078125, -2.31591796875, -2.171630859375, -2.02734375, -1.883056640625, -1.73876953125, -1.594482421875, -1.4501953125, -1.305908203125, -1.16162109375, -1.017333984375, -0.873046875, -0.728759765625, -0.58447265625, -0.440185546875, -0.2958984375, -0.151611328125, -0.00732421875, 0.136962890625, 0.28125, 0.425537109375, 0.56982421875, 0.714111328125, 0.8583984375, 1.002685546875, 1.14697265625, 1.291259765625, 1.435546875, 1.579833984375, 1.72412109375, 1.868408203125, 2.0126953125, 2.156982421875, 2.30126953125, 2.445556640625, 2.58984375, 2.734130859375, 2.87841796875, 3.022705078125, 3.1669921875, 3.311279296875, 3.45556640625, 3.599853515625, 3.744140625, 3.888427734375, 4.03271484375, 4.177001953125, 4.3212890625, 4.465576171875, 4.60986328125, 4.754150390625, 4.8984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 15.0, 20.0, 14.0, 27.0, 25.0, 41.0, 51.0, 82.0, 110.0, 179.0, 315.0, 661.0, 2015.0, 10806.0, 144601.0, 840849.0, 41535.0, 4831.0, 1157.0, 461.0, 240.0, 138.0, 91.0, 79.0, 49.0, 27.0, 24.0, 19.0, 14.0, 8.0, 11.0, 6.0, 4.0, 4.0, 3.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-6.546875, -6.37127685546875, -6.1956787109375, -6.02008056640625, -5.844482421875, -5.66888427734375, -5.4932861328125, -5.31768798828125, -5.14208984375, -4.96649169921875, -4.7908935546875, -4.61529541015625, -4.439697265625, -4.26409912109375, -4.0885009765625, -3.91290283203125, -3.7373046875, -3.56170654296875, -3.3861083984375, -3.21051025390625, -3.034912109375, -2.85931396484375, -2.6837158203125, -2.50811767578125, -2.33251953125, -2.15692138671875, -1.9813232421875, -1.80572509765625, -1.630126953125, -1.45452880859375, -1.2789306640625, -1.10333251953125, -0.927734375, -0.75213623046875, -0.5765380859375, -0.40093994140625, -0.225341796875, -0.04974365234375, 0.1258544921875, 0.30145263671875, 0.47705078125, 0.65264892578125, 0.8282470703125, 1.00384521484375, 1.179443359375, 1.35504150390625, 1.5306396484375, 1.70623779296875, 1.8818359375, 2.05743408203125, 2.2330322265625, 2.40863037109375, 2.584228515625, 2.75982666015625, 2.9354248046875, 3.11102294921875, 3.28662109375, 3.46221923828125, 3.6378173828125, 3.81341552734375, 3.989013671875, 4.16461181640625, 4.3402099609375, 4.51580810546875, 4.69140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 4.0, 2.0, 7.0, 7.0, 8.0, 9.0, 8.0, 9.0, 17.0, 18.0, 20.0, 28.0, 25.0, 35.0, 35.0, 37.0, 30.0, 42.0, 43.0, 47.0, 54.0, 52.0, 57.0, 50.0, 48.0, 40.0, 36.0, 25.0, 25.0, 31.0, 28.0, 25.0, 21.0, 17.0, 10.0, 11.0, 12.0, 8.0, 3.0, 4.0, 8.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.35546875, -5.2034912109375, -5.051513671875, -4.8995361328125, -4.74755859375, -4.5955810546875, -4.443603515625, -4.2916259765625, -4.1396484375, -3.9876708984375, -3.835693359375, -3.6837158203125, -3.53173828125, -3.3797607421875, -3.227783203125, -3.0758056640625, -2.923828125, -2.7718505859375, -2.619873046875, -2.4678955078125, -2.31591796875, -2.1639404296875, -2.011962890625, -1.8599853515625, -1.7080078125, -1.5560302734375, -1.404052734375, -1.2520751953125, -1.10009765625, -0.9481201171875, -0.796142578125, -0.6441650390625, -0.4921875, -0.3402099609375, -0.188232421875, -0.0362548828125, 0.11572265625, 0.2677001953125, 0.419677734375, 0.5716552734375, 0.7236328125, 0.8756103515625, 1.027587890625, 1.1795654296875, 1.33154296875, 1.4835205078125, 1.635498046875, 1.7874755859375, 1.939453125, 2.0914306640625, 2.243408203125, 2.3953857421875, 2.54736328125, 2.6993408203125, 2.851318359375, 3.0032958984375, 3.1552734375, 3.3072509765625, 3.459228515625, 3.6112060546875, 3.76318359375, 3.9151611328125, 4.067138671875, 4.2191162109375, 4.37109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 10.0, 13.0, 12.0, 41.0, 95.0, 262.0, 750.0, 3548.0, 41102.0, 852351.0, 140329.0, 8151.0, 1257.0, 348.0, 152.0, 53.0, 33.0, 20.0, 11.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5498046875, -1.4894866943359375, -1.429168701171875, -1.3688507080078125, -1.30853271484375, -1.2482147216796875, -1.187896728515625, -1.1275787353515625, -1.0672607421875, -1.0069427490234375, -0.946624755859375, -0.8863067626953125, -0.82598876953125, -0.7656707763671875, -0.705352783203125, -0.6450347900390625, -0.584716796875, -0.5243988037109375, -0.464080810546875, -0.4037628173828125, -0.34344482421875, -0.2831268310546875, -0.222808837890625, -0.1624908447265625, -0.1021728515625, -0.0418548583984375, 0.018463134765625, 0.0787811279296875, 0.13909912109375, 0.1994171142578125, 0.259735107421875, 0.3200531005859375, 0.38037109375, 0.4406890869140625, 0.501007080078125, 0.5613250732421875, 0.62164306640625, 0.6819610595703125, 0.742279052734375, 0.8025970458984375, 0.8629150390625, 0.9232330322265625, 0.983551025390625, 1.0438690185546875, 1.10418701171875, 1.1645050048828125, 1.224822998046875, 1.2851409912109375, 1.345458984375, 1.4057769775390625, 1.466094970703125, 1.5264129638671875, 1.58673095703125, 1.6470489501953125, 1.707366943359375, 1.7676849365234375, 1.8280029296875, 1.8883209228515625, 1.948638916015625, 2.0089569091796875, 2.06927490234375, 2.1295928955078125, 2.189910888671875, 2.2502288818359375, 2.310546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 7.0, 10.0, 8.0, 11.0, 15.0, 10.0, 21.0, 22.0, 27.0, 33.0, 34.0, 48.0, 65.0, 104.0, 145.0, 100.0, 65.0, 46.0, 40.0, 45.0, 22.0, 16.0, 14.0, 13.0, 10.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001291036605834961, -0.00012534763664007187, -0.00012159161269664764, -0.00011783558875322342, -0.0001140795648097992, -0.00011032354086637497, -0.00010656751692295074, -0.00010281149297952652, -9.90554690361023e-05, -9.529944509267807e-05, -9.154342114925385e-05, -8.778739720582962e-05, -8.40313732624054e-05, -8.027534931898117e-05, -7.651932537555695e-05, -7.276330143213272e-05, -6.90072774887085e-05, -6.525125354528427e-05, -6.149522960186005e-05, -5.773920565843582e-05, -5.39831817150116e-05, -5.022715777158737e-05, -4.647113382816315e-05, -4.271510988473892e-05, -3.89590859413147e-05, -3.520306199789047e-05, -3.144703805446625e-05, -2.7691014111042023e-05, -2.3934990167617798e-05, -2.0178966224193573e-05, -1.6422942280769348e-05, -1.2666918337345123e-05, -8.910894393920898e-06, -5.154870450496674e-06, -1.3988465070724487e-06, 2.357177436351776e-06, 6.113201379776001e-06, 9.869225323200226e-06, 1.362524926662445e-05, 1.7381273210048676e-05, 2.11372971534729e-05, 2.4893321096897125e-05, 2.864934504032135e-05, 3.2405368983745575e-05, 3.61613929271698e-05, 3.9917416870594025e-05, 4.367344081401825e-05, 4.7429464757442474e-05, 5.11854887008667e-05, 5.4941512644290924e-05, 5.869753658771515e-05, 6.245356053113937e-05, 6.62095844745636e-05, 6.996560841798782e-05, 7.372163236141205e-05, 7.747765630483627e-05, 8.12336802482605e-05, 8.498970419168472e-05, 8.874572813510895e-05, 9.250175207853317e-05, 9.62577760219574e-05, 0.00010001379996538162, 0.00010376982390880585, 0.00010752584785223007, 0.0001112818717956543]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 17.0, 14.0, 20.0, 28.0, 43.0, 78.0, 175.0, 274.0, 650.0, 1458.0, 3808.0, 11444.0, 42376.0, 198356.0, 649376.0, 104214.0, 24532.0, 7082.0, 2545.0, 1026.0, 473.0, 224.0, 135.0, 59.0, 42.0, 37.0, 16.0, 11.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8623046875, -0.8318328857421875, -0.801361083984375, -0.7708892822265625, -0.74041748046875, -0.7099456787109375, -0.679473876953125, -0.6490020751953125, -0.6185302734375, -0.5880584716796875, -0.557586669921875, -0.5271148681640625, -0.49664306640625, -0.4661712646484375, -0.435699462890625, -0.4052276611328125, -0.374755859375, -0.3442840576171875, -0.313812255859375, -0.2833404541015625, -0.25286865234375, -0.2223968505859375, -0.191925048828125, -0.1614532470703125, -0.1309814453125, -0.1005096435546875, -0.070037841796875, -0.0395660400390625, -0.00909423828125, 0.0213775634765625, 0.051849365234375, 0.0823211669921875, 0.11279296875, 0.1432647705078125, 0.173736572265625, 0.2042083740234375, 0.23468017578125, 0.2651519775390625, 0.295623779296875, 0.3260955810546875, 0.3565673828125, 0.3870391845703125, 0.417510986328125, 0.4479827880859375, 0.47845458984375, 0.5089263916015625, 0.539398193359375, 0.5698699951171875, 0.600341796875, 0.6308135986328125, 0.661285400390625, 0.6917572021484375, 0.72222900390625, 0.7527008056640625, 0.783172607421875, 0.8136444091796875, 0.8441162109375, 0.8745880126953125, 0.905059814453125, 0.9355316162109375, 0.96600341796875, 0.9964752197265625, 1.026947021484375, 1.0574188232421875, 1.087890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 8.0, 6.0, 13.0, 16.0, 16.0, 23.0, 31.0, 35.0, 42.0, 77.0, 139.0, 195.0, 107.0, 78.0, 45.0, 44.0, 26.0, 16.0, 14.0, 15.0, 12.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4625053405761719, -0.44771575927734375, -0.4329261779785156, -0.4181365966796875, -0.4033470153808594, -0.38855743408203125, -0.3737678527832031, -0.358978271484375, -0.3441886901855469, -0.32939910888671875, -0.3146095275878906, -0.2998199462890625, -0.2850303649902344, -0.27024078369140625, -0.2554512023925781, -0.24066162109375, -0.22587203979492188, -0.21108245849609375, -0.19629287719726562, -0.1815032958984375, -0.16671371459960938, -0.15192413330078125, -0.13713455200195312, -0.122344970703125, -0.10755538940429688, -0.09276580810546875, -0.07797622680664062, -0.0631866455078125, -0.048397064208984375, -0.03360748291015625, -0.018817901611328125, -0.0040283203125, 0.010761260986328125, 0.02555084228515625, 0.040340423583984375, 0.0551300048828125, 0.06991958618164062, 0.08470916748046875, 0.09949874877929688, 0.114288330078125, 0.12907791137695312, 0.14386749267578125, 0.15865707397460938, 0.1734466552734375, 0.18823623657226562, 0.20302581787109375, 0.21781539916992188, 0.23260498046875, 0.24739456176757812, 0.26218414306640625, 0.2769737243652344, 0.2917633056640625, 0.3065528869628906, 0.32134246826171875, 0.3361320495605469, 0.350921630859375, 0.3657112121582031, 0.38050079345703125, 0.3952903747558594, 0.4100799560546875, 0.4248695373535156, 0.43965911865234375, 0.4544486999511719, 0.46923828125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 23.0, 64.0, 174.0, 297.0, 256.0, 123.0, 37.0, 9.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.123258590698242, -10.493622779846191, -9.863986015319824, -9.234350204467773, -8.604714393615723, -7.975078105926514, -7.345441818237305, -6.715806007385254, -6.086169719696045, -5.456533432006836, -4.826897621154785, -4.197261333465576, -3.5676252841949463, -2.9379892349243164, -2.3083529472351074, -1.6787171363830566, -1.0490808486938477, -0.419444739818573, 0.21019136905670166, 0.8398275375366211, 1.469463586807251, 2.099099636077881, 2.72873592376709, 3.3583717346191406, 3.9880080223083496, 4.617644309997559, 5.247280120849609, 5.876916408538818, 6.506552696228027, 7.136188507080078, 7.765824794769287, 8.39546012878418, 9.025096893310547, 9.654732704162598, 10.284369468688965, 10.914005279541016, 11.543641090393066, 12.173276901245117, 12.802913665771484, 13.432549476623535, 14.062185287475586, 14.691821098327637, 15.321457862854004, 15.951093673706055, 16.580730438232422, 17.210365295410156, 17.840002059936523, 18.46963882446289, 19.099273681640625, 19.728910446166992, 20.358545303344727, 20.988182067871094, 21.61781883239746, 22.247453689575195, 22.877090454101562, 23.506725311279297, 24.136363983154297, 24.766000747680664, 25.3956356048584, 26.025272369384766, 26.654909133911133, 27.284543991088867, 27.914180755615234, 28.54381561279297, 29.173452377319336]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 11.0, 11.0, 13.0, 14.0, 17.0, 17.0, 26.0, 28.0, 28.0, 34.0, 33.0, 35.0, 44.0, 49.0, 42.0, 34.0, 38.0, 49.0, 60.0, 35.0, 39.0, 45.0, 34.0, 26.0, 48.0, 24.0, 30.0, 17.0, 14.0, 19.0, 13.0, 20.0, 3.0, 9.0, 6.0, 1.0, 8.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.942437171936035, -8.68869686126709, -8.434956550598145, -8.1812162399292, -7.927475929260254, -7.673735618591309, -7.419994831085205, -7.16625452041626, -6.9125142097473145, -6.658773899078369, -6.405033588409424, -6.1512932777404785, -5.897552490234375, -5.64381217956543, -5.390071868896484, -5.136331558227539, -4.882591247558594, -4.628850936889648, -4.375110626220703, -4.121370315551758, -3.8676297664642334, -3.613889455795288, -3.3601489067077637, -3.1064085960388184, -2.852668285369873, -2.5989279747009277, -2.3451876640319824, -2.091447114944458, -1.8377068042755127, -1.5839664936065674, -1.3302260637283325, -1.0764856338500977, -0.8227453231811523, -0.5690049529075623, -0.31526458263397217, -0.06152421236038208, 0.192216157913208, 0.4459564685821533, 0.6996968984603882, 0.953437328338623, 1.2071776390075684, 1.4609179496765137, 1.7146583795547485, 1.9683988094329834, 2.2221391201019287, 2.475879430770874, 2.7296199798583984, 2.9833602905273438, 3.237100601196289, 3.4908409118652344, 3.7445812225341797, 3.998321771621704, 4.25206184387207, 4.505802154541016, 4.759542942047119, 5.0132832527160645, 5.26702356338501, 5.520763874053955, 5.7745041847229, 6.028244495391846, 6.281985282897949, 6.5357255935668945, 6.78946590423584, 7.043206214904785, 7.2969465255737305]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 6.0, 9.0, 7.0, 16.0, 14.0, 16.0, 24.0, 37.0, 51.0, 59.0, 84.0, 112.0, 132.0, 188.0, 322.0, 515.0, 902.0, 1700.0, 4074.0, 11781.0, 44854.0, 340536.0, 3369723.0, 352687.0, 46174.0, 11745.0, 4133.0, 1836.0, 923.0, 488.0, 311.0, 206.0, 169.0, 116.0, 86.0, 68.0, 39.0, 38.0, 30.0, 18.0, 15.0, 13.0, 10.0, 5.0, 4.0, 10.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.844329833984375, -3.71405029296875, -3.583770751953125, -3.4534912109375, -3.323211669921875, -3.19293212890625, -3.062652587890625, -2.932373046875, -2.802093505859375, -2.67181396484375, -2.541534423828125, -2.4112548828125, -2.280975341796875, -2.15069580078125, -2.020416259765625, -1.89013671875, -1.759857177734375, -1.62957763671875, -1.499298095703125, -1.3690185546875, -1.238739013671875, -1.10845947265625, -0.978179931640625, -0.847900390625, -0.717620849609375, -0.58734130859375, -0.457061767578125, -0.3267822265625, -0.196502685546875, -0.06622314453125, 0.064056396484375, 0.1943359375, 0.324615478515625, 0.45489501953125, 0.585174560546875, 0.7154541015625, 0.845733642578125, 0.97601318359375, 1.106292724609375, 1.236572265625, 1.366851806640625, 1.49713134765625, 1.627410888671875, 1.7576904296875, 1.887969970703125, 2.01824951171875, 2.148529052734375, 2.27880859375, 2.409088134765625, 2.53936767578125, 2.669647216796875, 2.7999267578125, 2.930206298828125, 3.06048583984375, 3.190765380859375, 3.321044921875, 3.451324462890625, 3.58160400390625, 3.711883544921875, 3.8421630859375, 3.972442626953125, 4.10272216796875, 4.233001708984375, 4.36328125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 4.0, 10.0, 4.0, 11.0, 23.0, 35.0, 23.0, 36.0, 48.0, 69.0, 53.0, 78.0, 78.0, 77.0, 73.0, 74.0, 56.0, 46.0, 32.0, 31.0, 30.0, 28.0, 15.0, 9.0, 8.0, 4.0, 9.0, 3.0, 7.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.583984375, -2.512451171875, -2.44091796875, -2.369384765625, -2.2978515625, -2.226318359375, -2.15478515625, -2.083251953125, -2.01171875, -1.940185546875, -1.86865234375, -1.797119140625, -1.7255859375, -1.654052734375, -1.58251953125, -1.510986328125, -1.439453125, -1.367919921875, -1.29638671875, -1.224853515625, -1.1533203125, -1.081787109375, -1.01025390625, -0.938720703125, -0.8671875, -0.795654296875, -0.72412109375, -0.652587890625, -0.5810546875, -0.509521484375, -0.43798828125, -0.366455078125, -0.294921875, -0.223388671875, -0.15185546875, -0.080322265625, -0.0087890625, 0.062744140625, 0.13427734375, 0.205810546875, 0.27734375, 0.348876953125, 0.42041015625, 0.491943359375, 0.5634765625, 0.635009765625, 0.70654296875, 0.778076171875, 0.849609375, 0.921142578125, 0.99267578125, 1.064208984375, 1.1357421875, 1.207275390625, 1.27880859375, 1.350341796875, 1.421875, 1.493408203125, 1.56494140625, 1.636474609375, 1.7080078125, 1.779541015625, 1.85107421875, 1.922607421875, 1.994140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 9.0, 25.0, 31.0, 60.0, 91.0, 192.0, 502.0, 1925.0, 17224.0, 1107932.0, 3034557.0, 27869.0, 2698.0, 605.0, 251.0, 133.0, 63.0, 46.0, 18.0, 8.0, 14.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.74853515625, -7.4267578125, -7.10498046875, -6.783203125, -6.46142578125, -6.1396484375, -5.81787109375, -5.49609375, -5.17431640625, -4.8525390625, -4.53076171875, -4.208984375, -3.88720703125, -3.5654296875, -3.24365234375, -2.921875, -2.60009765625, -2.2783203125, -1.95654296875, -1.634765625, -1.31298828125, -0.9912109375, -0.66943359375, -0.34765625, -0.02587890625, 0.2958984375, 0.61767578125, 0.939453125, 1.26123046875, 1.5830078125, 1.90478515625, 2.2265625, 2.54833984375, 2.8701171875, 3.19189453125, 3.513671875, 3.83544921875, 4.1572265625, 4.47900390625, 4.80078125, 5.12255859375, 5.4443359375, 5.76611328125, 6.087890625, 6.40966796875, 6.7314453125, 7.05322265625, 7.375, 7.69677734375, 8.0185546875, 8.34033203125, 8.662109375, 8.98388671875, 9.3056640625, 9.62744140625, 9.94921875, 10.27099609375, 10.5927734375, 10.91455078125, 11.236328125, 11.55810546875, 11.8798828125, 12.20166015625, 12.5234375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 11.0, 11.0, 18.0, 21.0, 29.0, 45.0, 67.0, 82.0, 174.0, 198.0, 346.0, 524.0, 816.0, 640.0, 398.0, 241.0, 131.0, 104.0, 68.0, 31.0, 49.0, 21.0, 8.0, 7.0, 12.0, 5.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.98828125, -1.9427566528320312, -1.8972320556640625, -1.8517074584960938, -1.806182861328125, -1.7606582641601562, -1.7151336669921875, -1.6696090698242188, -1.62408447265625, -1.5785598754882812, -1.5330352783203125, -1.4875106811523438, -1.441986083984375, -1.3964614868164062, -1.3509368896484375, -1.3054122924804688, -1.2598876953125, -1.2143630981445312, -1.1688385009765625, -1.1233139038085938, -1.077789306640625, -1.0322647094726562, -0.9867401123046875, -0.9412155151367188, -0.89569091796875, -0.8501663208007812, -0.8046417236328125, -0.7591171264648438, -0.713592529296875, -0.6680679321289062, -0.6225433349609375, -0.5770187377929688, -0.531494140625, -0.48596954345703125, -0.4404449462890625, -0.39492034912109375, -0.349395751953125, -0.30387115478515625, -0.2583465576171875, -0.21282196044921875, -0.16729736328125, -0.12177276611328125, -0.0762481689453125, -0.03072357177734375, 0.014801025390625, 0.06032562255859375, 0.1058502197265625, 0.15137481689453125, 0.1968994140625, 0.24242401123046875, 0.2879486083984375, 0.33347320556640625, 0.378997802734375, 0.42452239990234375, 0.4700469970703125, 0.5155715942382812, 0.56109619140625, 0.6066207885742188, 0.6521453857421875, 0.6976699829101562, 0.743194580078125, 0.7887191772460938, 0.8342437744140625, 0.8797683715820312, 0.92529296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 13.0, 19.0, 26.0, 35.0, 77.0, 79.0, 103.0, 108.0, 107.0, 90.0, 95.0, 61.0, 36.0, 45.0, 37.0, 19.0, 14.0, 6.0, 3.0, 7.0, 2.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.760065078735352, -4.594661712646484, -4.429258823394775, -4.263855457305908, -4.098452091217041, -3.933049201965332, -3.767645835876465, -3.6022427082061768, -3.4368395805358887, -3.2714364528656006, -3.1060330867767334, -2.9406299591064453, -2.7752268314361572, -2.609823703765869, -2.444420337677002, -2.279017210006714, -2.1136138439178467, -1.948210597038269, -1.782807469367981, -1.6174042224884033, -1.4520010948181152, -1.2865978479385376, -1.12119460105896, -0.9557914733886719, -0.7903882265090942, -0.6249850392341614, -0.45958182215690613, -0.2941786050796509, -0.12877541780471802, 0.036627769470214844, 0.20203101634979248, 0.36743414402008057, 0.5328373908996582, 0.6982405781745911, 0.8636437654495239, 1.0290470123291016, 1.1944501399993896, 1.3598533868789673, 1.525256633758545, 1.690659761428833, 1.8560630083084106, 2.0214662551879883, 2.1868693828582764, 2.3522725105285645, 2.5176758766174316, 2.6830790042877197, 2.848482131958008, 3.013885498046875, 3.179288625717163, 3.344691753387451, 3.5100951194763184, 3.6754982471466064, 3.8409013748168945, 4.006304740905762, 4.171708106994629, 4.337110996246338, 4.502514362335205, 4.667917728424072, 4.833320617675781, 4.998723983764648, 5.164127349853516, 5.329530239105225, 5.494933605194092, 5.660336494445801, 5.825739860534668]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 8.0, 8.0, 15.0, 19.0, 16.0, 18.0, 15.0, 27.0, 29.0, 37.0, 43.0, 39.0, 44.0, 38.0, 38.0, 35.0, 33.0, 48.0, 42.0, 41.0, 43.0, 46.0, 44.0, 27.0, 32.0, 32.0, 26.0, 30.0, 23.0, 19.0, 15.0, 6.0, 9.0, 6.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.64679217338562, -2.5657248497009277, -2.4846575260162354, -2.403590202331543, -2.3225231170654297, -2.2414557933807373, -2.160388469696045, -2.0793211460113525, -1.9982538223266602, -1.9171864986419678, -1.8361191749572754, -1.7550519704818726, -1.6739846467971802, -1.5929173231124878, -1.511850118637085, -1.4307827949523926, -1.3497154712677002, -1.2686481475830078, -1.1875808238983154, -1.1065136194229126, -1.0254462957382202, -0.9443789720535278, -0.8633117079734802, -0.7822444438934326, -0.7011771202087402, -0.6201097965240479, -0.5390425324440002, -0.45797523856163025, -0.37690794467926025, -0.29584065079689026, -0.21477335691452026, -0.13370609283447266, -0.05263853073120117, 0.028428763151168823, 0.10949605703353882, 0.1905633509159088, 0.2716306447982788, 0.3526979386806488, 0.4337652325630188, 0.5148324966430664, 0.5958998203277588, 0.6769671440124512, 0.7580344080924988, 0.8391016721725464, 0.9201689958572388, 1.0012363195419312, 1.082303524017334, 1.1633708477020264, 1.2444381713867188, 1.3255054950714111, 1.4065728187561035, 1.4876400232315063, 1.5687073469161987, 1.6497746706008911, 1.730841875076294, 1.8119091987609863, 1.8929765224456787, 1.974043846130371, 2.0551111698150635, 2.136178493499756, 2.217245578765869, 2.2983129024505615, 2.379380226135254, 2.4604475498199463, 2.5415148735046387]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 15.0, 17.0, 16.0, 33.0, 47.0, 59.0, 80.0, 145.0, 263.0, 530.0, 1404.0, 4078.0, 17745.0, 147672.0, 752720.0, 104055.0, 13859.0, 3445.0, 1198.0, 477.0, 264.0, 161.0, 78.0, 55.0, 43.0, 24.0, 17.0, 14.0, 6.0, 7.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.59326171875, -0.5755157470703125, -0.557769775390625, -0.5400238037109375, -0.52227783203125, -0.5045318603515625, -0.486785888671875, -0.4690399169921875, -0.4512939453125, -0.4335479736328125, -0.415802001953125, -0.3980560302734375, -0.38031005859375, -0.3625640869140625, -0.344818115234375, -0.3270721435546875, -0.309326171875, -0.2915802001953125, -0.273834228515625, -0.2560882568359375, -0.23834228515625, -0.2205963134765625, -0.202850341796875, -0.1851043701171875, -0.1673583984375, -0.1496124267578125, -0.131866455078125, -0.1141204833984375, -0.09637451171875, -0.0786285400390625, -0.060882568359375, -0.0431365966796875, -0.025390625, -0.0076446533203125, 0.010101318359375, 0.0278472900390625, 0.04559326171875, 0.0633392333984375, 0.081085205078125, 0.0988311767578125, 0.1165771484375, 0.1343231201171875, 0.152069091796875, 0.1698150634765625, 0.18756103515625, 0.2053070068359375, 0.223052978515625, 0.2407989501953125, 0.258544921875, 0.2762908935546875, 0.294036865234375, 0.3117828369140625, 0.32952880859375, 0.3472747802734375, 0.365020751953125, 0.3827667236328125, 0.4005126953125, 0.4182586669921875, 0.436004638671875, 0.4537506103515625, 0.47149658203125, 0.4892425537109375, 0.506988525390625, 0.5247344970703125, 0.54248046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 5.0, 9.0, 14.0, 10.0, 15.0, 17.0, 26.0, 23.0, 33.0, 40.0, 43.0, 52.0, 51.0, 60.0, 58.0, 55.0, 57.0, 58.0, 57.0, 50.0, 35.0, 40.0, 50.0, 30.0, 25.0, 23.0, 13.0, 12.0, 10.0, 8.0, 8.0, 2.0, 4.0, 0.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.259765625, -2.191162109375, -2.12255859375, -2.053955078125, -1.9853515625, -1.916748046875, -1.84814453125, -1.779541015625, -1.7109375, -1.642333984375, -1.57373046875, -1.505126953125, -1.4365234375, -1.367919921875, -1.29931640625, -1.230712890625, -1.162109375, -1.093505859375, -1.02490234375, -0.956298828125, -0.8876953125, -0.819091796875, -0.75048828125, -0.681884765625, -0.61328125, -0.544677734375, -0.47607421875, -0.407470703125, -0.3388671875, -0.270263671875, -0.20166015625, -0.133056640625, -0.064453125, 0.004150390625, 0.07275390625, 0.141357421875, 0.2099609375, 0.278564453125, 0.34716796875, 0.415771484375, 0.484375, 0.552978515625, 0.62158203125, 0.690185546875, 0.7587890625, 0.827392578125, 0.89599609375, 0.964599609375, 1.033203125, 1.101806640625, 1.17041015625, 1.239013671875, 1.3076171875, 1.376220703125, 1.44482421875, 1.513427734375, 1.58203125, 1.650634765625, 1.71923828125, 1.787841796875, 1.8564453125, 1.925048828125, 1.99365234375, 2.062255859375, 2.130859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 16.0, 13.0, 12.0, 16.0, 12.0, 26.0, 27.0, 63.0, 54.0, 88.0, 135.0, 180.0, 291.0, 546.0, 1429.0, 9542.0, 294528.0, 712951.0, 24179.0, 2445.0, 763.0, 386.0, 219.0, 184.0, 123.0, 57.0, 66.0, 44.0, 29.0, 29.0, 22.0, 11.0, 14.0, 10.0, 9.0, 8.0, 5.0, 3.0, 5.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5615234375, -0.5434951782226562, -0.5254669189453125, -0.5074386596679688, -0.489410400390625, -0.47138214111328125, -0.4533538818359375, -0.43532562255859375, -0.41729736328125, -0.39926910400390625, -0.3812408447265625, -0.36321258544921875, -0.345184326171875, -0.32715606689453125, -0.3091278076171875, -0.29109954833984375, -0.2730712890625, -0.25504302978515625, -0.2370147705078125, -0.21898651123046875, -0.200958251953125, -0.18292999267578125, -0.1649017333984375, -0.14687347412109375, -0.12884521484375, -0.11081695556640625, -0.0927886962890625, -0.07476043701171875, -0.056732177734375, -0.03870391845703125, -0.0206756591796875, -0.00264739990234375, 0.015380859375, 0.03340911865234375, 0.0514373779296875, 0.06946563720703125, 0.087493896484375, 0.10552215576171875, 0.1235504150390625, 0.14157867431640625, 0.15960693359375, 0.17763519287109375, 0.1956634521484375, 0.21369171142578125, 0.231719970703125, 0.24974822998046875, 0.2677764892578125, 0.28580474853515625, 0.3038330078125, 0.32186126708984375, 0.3398895263671875, 0.35791778564453125, 0.375946044921875, 0.39397430419921875, 0.4120025634765625, 0.43003082275390625, 0.44805908203125, 0.46608734130859375, 0.4841156005859375, 0.5021438598632812, 0.520172119140625, 0.5382003784179688, 0.5562286376953125, 0.5742568969726562, 0.59228515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 9.0, 17.0, 19.0, 27.0, 23.0, 29.0, 42.0, 30.0, 35.0, 57.0, 55.0, 57.0, 62.0, 60.0, 51.0, 44.0, 51.0, 52.0, 44.0, 40.0, 26.0, 33.0, 21.0, 15.0, 9.0, 13.0, 10.0, 8.0, 7.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.763671875, -3.632659912109375, -3.50164794921875, -3.370635986328125, -3.2396240234375, -3.108612060546875, -2.97760009765625, -2.846588134765625, -2.715576171875, -2.584564208984375, -2.45355224609375, -2.322540283203125, -2.1915283203125, -2.060516357421875, -1.92950439453125, -1.798492431640625, -1.66748046875, -1.536468505859375, -1.40545654296875, -1.274444580078125, -1.1434326171875, -1.012420654296875, -0.88140869140625, -0.750396728515625, -0.619384765625, -0.488372802734375, -0.35736083984375, -0.226348876953125, -0.0953369140625, 0.035675048828125, 0.16668701171875, 0.297698974609375, 0.4287109375, 0.559722900390625, 0.69073486328125, 0.821746826171875, 0.9527587890625, 1.083770751953125, 1.21478271484375, 1.345794677734375, 1.476806640625, 1.607818603515625, 1.73883056640625, 1.869842529296875, 2.0008544921875, 2.131866455078125, 2.26287841796875, 2.393890380859375, 2.52490234375, 2.655914306640625, 2.78692626953125, 2.917938232421875, 3.0489501953125, 3.179962158203125, 3.31097412109375, 3.441986083984375, 3.572998046875, 3.704010009765625, 3.83502197265625, 3.966033935546875, 4.0970458984375, 4.228057861328125, 4.35906982421875, 4.490081787109375, 4.62109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 13.0, 14.0, 21.0, 16.0, 23.0, 48.0, 89.0, 130.0, 256.0, 726.0, 5142.0, 1016832.0, 23238.0, 1192.0, 346.0, 169.0, 100.0, 69.0, 34.0, 21.0, 18.0, 17.0, 12.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2454833984375, -0.2355365753173828, -0.22558975219726562, -0.21564292907714844, -0.20569610595703125, -0.19574928283691406, -0.18580245971679688, -0.1758556365966797, -0.1659088134765625, -0.1559619903564453, -0.14601516723632812, -0.13606834411621094, -0.12612152099609375, -0.11617469787597656, -0.10622787475585938, -0.09628105163574219, -0.086334228515625, -0.07638740539550781, -0.06644058227539062, -0.05649375915527344, -0.04654693603515625, -0.03660011291503906, -0.026653289794921875, -0.016706466674804688, -0.0067596435546875, 0.0031871795654296875, 0.013134002685546875, 0.023080825805664062, 0.03302764892578125, 0.04297447204589844, 0.052921295166015625, 0.06286811828613281, 0.07281494140625, 0.08276176452636719, 0.09270858764648438, 0.10265541076660156, 0.11260223388671875, 0.12254905700683594, 0.13249588012695312, 0.1424427032470703, 0.1523895263671875, 0.1623363494873047, 0.17228317260742188, 0.18222999572753906, 0.19217681884765625, 0.20212364196777344, 0.21207046508789062, 0.2220172882080078, 0.231964111328125, 0.2419109344482422, 0.2518577575683594, 0.26180458068847656, 0.27175140380859375, 0.28169822692871094, 0.2916450500488281, 0.3015918731689453, 0.3115386962890625, 0.3214855194091797, 0.3314323425292969, 0.34137916564941406, 0.35132598876953125, 0.36127281188964844, 0.3712196350097656, 0.3811664581298828, 0.39111328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 8.0, 18.0, 33.0, 59.0, 118.0, 169.0, 221.0, 162.0, 87.0, 40.0, 30.0, 13.0, 10.0, 5.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011360645294189453, -0.00011071376502513885, -0.00010782107710838318, -0.0001049283891916275, -0.00010203570127487183, -9.914301335811615e-05, -9.625032544136047e-05, -9.33576375246048e-05, -9.046494960784912e-05, -8.757226169109344e-05, -8.467957377433777e-05, -8.178688585758209e-05, -7.889419794082642e-05, -7.600151002407074e-05, -7.310882210731506e-05, -7.021613419055939e-05, -6.732344627380371e-05, -6.443075835704803e-05, -6.153807044029236e-05, -5.864538252353668e-05, -5.5752694606781006e-05, -5.286000669002533e-05, -4.996731877326965e-05, -4.707463085651398e-05, -4.41819429397583e-05, -4.1289255023002625e-05, -3.839656710624695e-05, -3.550387918949127e-05, -3.2611191272735596e-05, -2.971850335597992e-05, -2.6825815439224243e-05, -2.3933127522468567e-05, -2.104043960571289e-05, -1.8147751688957214e-05, -1.5255063772201538e-05, -1.2362375855445862e-05, -9.469687938690186e-06, -6.577000021934509e-06, -3.684312105178833e-06, -7.916241884231567e-07, 2.1010637283325195e-06, 4.993751645088196e-06, 7.886439561843872e-06, 1.0779127478599548e-05, 1.3671815395355225e-05, 1.65645033121109e-05, 1.9457191228866577e-05, 2.2349879145622253e-05, 2.524256706237793e-05, 2.8135254979133606e-05, 3.102794289588928e-05, 3.392063081264496e-05, 3.6813318729400635e-05, 3.970600664615631e-05, 4.259869456291199e-05, 4.5491382479667664e-05, 4.838407039642334e-05, 5.1276758313179016e-05, 5.416944622993469e-05, 5.706213414669037e-05, 5.9954822063446045e-05, 6.284750998020172e-05, 6.57401978969574e-05, 6.863288581371307e-05, 7.152557373046875e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 13.0, 18.0, 30.0, 48.0, 45.0, 76.0, 117.0, 137.0, 239.0, 388.0, 708.0, 1681.0, 4975.0, 23406.0, 742428.0, 251455.0, 15845.0, 3899.0, 1405.0, 604.0, 318.0, 211.0, 154.0, 89.0, 88.0, 57.0, 30.0, 29.0, 16.0, 10.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1787109375, -0.17181015014648438, -0.16490936279296875, -0.15800857543945312, -0.1511077880859375, -0.14420700073242188, -0.13730621337890625, -0.13040542602539062, -0.123504638671875, -0.11660385131835938, -0.10970306396484375, -0.10280227661132812, -0.0959014892578125, -0.08900070190429688, -0.08209991455078125, -0.07519912719726562, -0.06829833984375, -0.061397552490234375, -0.05449676513671875, -0.047595977783203125, -0.0406951904296875, -0.033794403076171875, -0.02689361572265625, -0.019992828369140625, -0.013092041015625, -0.006191253662109375, 0.00070953369140625, 0.007610321044921875, 0.0145111083984375, 0.021411895751953125, 0.02831268310546875, 0.035213470458984375, 0.0421142578125, 0.049015045166015625, 0.05591583251953125, 0.06281661987304688, 0.0697174072265625, 0.07661819458007812, 0.08351898193359375, 0.09041976928710938, 0.097320556640625, 0.10422134399414062, 0.11112213134765625, 0.11802291870117188, 0.1249237060546875, 0.13182449340820312, 0.13872528076171875, 0.14562606811523438, 0.15252685546875, 0.15942764282226562, 0.16632843017578125, 0.17322921752929688, 0.1801300048828125, 0.18703079223632812, 0.19393157958984375, 0.20083236694335938, 0.207733154296875, 0.21463394165039062, 0.22153472900390625, 0.22843551635742188, 0.2353363037109375, 0.24223709106445312, 0.24913787841796875, 0.2560386657714844, 0.262939453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 14.0, 28.0, 46.0, 72.0, 262.0, 361.0, 91.0, 52.0, 25.0, 14.0, 12.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08349609375, -0.08130550384521484, -0.07911491394042969, -0.07692432403564453, -0.07473373413085938, -0.07254314422607422, -0.07035255432128906, -0.0681619644165039, -0.06597137451171875, -0.0637807846069336, -0.06159019470214844, -0.05939960479736328, -0.057209014892578125, -0.05501842498779297, -0.05282783508300781, -0.050637245178222656, -0.0484466552734375, -0.046256065368652344, -0.04406547546386719, -0.04187488555908203, -0.039684295654296875, -0.03749370574951172, -0.03530311584472656, -0.033112525939941406, -0.03092193603515625, -0.028731346130371094, -0.026540756225585938, -0.02435016632080078, -0.022159576416015625, -0.01996898651123047, -0.017778396606445312, -0.015587806701660156, -0.013397216796875, -0.011206626892089844, -0.009016036987304688, -0.006825447082519531, -0.004634857177734375, -0.0024442672729492188, -0.0002536773681640625, 0.0019369125366210938, 0.00412750244140625, 0.006318092346191406, 0.008508682250976562, 0.010699272155761719, 0.012889862060546875, 0.015080451965332031, 0.017271041870117188, 0.019461631774902344, 0.0216522216796875, 0.023842811584472656, 0.026033401489257812, 0.02822399139404297, 0.030414581298828125, 0.03260517120361328, 0.03479576110839844, 0.036986351013183594, 0.03917694091796875, 0.041367530822753906, 0.04355812072753906, 0.04574871063232422, 0.047939300537109375, 0.05012989044189453, 0.05232048034667969, 0.054511070251464844, 0.05670166015625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 10.0, 14.0, 29.0, 37.0, 71.0, 107.0, 119.0, 137.0, 111.0, 98.0, 70.0, 60.0, 45.0, 34.0, 13.0, 12.0, 4.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.265610218048096, -4.147425174713135, -4.029240131378174, -3.911054849624634, -3.792869806289673, -3.674684524536133, -3.556499481201172, -3.438314437866211, -3.32012939453125, -3.201944351196289, -3.083759069442749, -2.965574026107788, -2.847388982772827, -2.729203701019287, -2.611018657684326, -2.4928336143493652, -2.374648332595825, -2.2564632892608643, -2.138278007507324, -2.0200929641723633, -1.9019079208374023, -1.7837227582931519, -1.6655375957489014, -1.5473525524139404, -1.42916738986969, -1.3109822273254395, -1.1927971839904785, -1.074612021446228, -0.9564269185066223, -0.8382418155670166, -0.7200566530227661, -0.6018715500831604, -0.4836866855621338, -0.3655015826225281, -0.24731644988059998, -0.12913131713867188, -0.010946214199066162, 0.10723888874053955, 0.22542405128479004, 0.34360915422439575, 0.46179425716400146, 0.5799793601036072, 0.6981644630432129, 0.8163496255874634, 0.9345347285270691, 1.0527198314666748, 1.1709049940109253, 1.2890901565551758, 1.4072751998901367, 1.5254603624343872, 1.6436454057693481, 1.7618305683135986, 1.8800156116485596, 1.99820077419281, 2.1163859367370605, 2.2345709800720215, 2.3527560234069824, 2.4709410667419434, 2.5891263484954834, 2.7073113918304443, 2.8254964351654053, 2.9436817169189453, 3.0618667602539062, 3.180051803588867, 3.2982370853424072]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 6.0, 3.0, 10.0, 9.0, 10.0, 11.0, 17.0, 25.0, 23.0, 24.0, 37.0, 41.0, 44.0, 64.0, 56.0, 31.0, 50.0, 59.0, 54.0, 56.0, 55.0, 48.0, 47.0, 44.0, 33.0, 29.0, 23.0, 25.0, 20.0, 9.0, 9.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.0510823726654053, -1.9886244535446167, -1.9261665344238281, -1.8637086153030396, -1.801250696182251, -1.7387927770614624, -1.6763348579406738, -1.6138769388198853, -1.5514190196990967, -1.488961100578308, -1.4265031814575195, -1.364045262336731, -1.3015873432159424, -1.2391294240951538, -1.1766715049743652, -1.1142135858535767, -1.051755666732788, -0.9892977476119995, -0.9268398284912109, -0.8643819093704224, -0.8019239902496338, -0.7394660711288452, -0.6770081520080566, -0.6145502328872681, -0.5520923137664795, -0.4896343946456909, -0.42717647552490234, -0.36471855640411377, -0.3022606372833252, -0.23980271816253662, -0.17734479904174805, -0.11488687992095947, -0.05242908000946045, 0.010028839111328125, 0.0724867582321167, 0.13494467735290527, 0.19740259647369385, 0.2598605155944824, 0.322318434715271, 0.38477635383605957, 0.44723427295684814, 0.5096921920776367, 0.5721501111984253, 0.6346080303192139, 0.6970659494400024, 0.759523868560791, 0.8219817876815796, 0.8844397068023682, 0.9468976259231567, 1.0093555450439453, 1.0718134641647339, 1.1342713832855225, 1.196729302406311, 1.2591872215270996, 1.3216451406478882, 1.3841030597686768, 1.4465609788894653, 1.509018898010254, 1.5714768171310425, 1.633934736251831, 1.6963926553726196, 1.7588505744934082, 1.8213084936141968, 1.8837664127349854, 1.946224331855774]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 5.0, 11.0, 11.0, 14.0, 29.0, 53.0, 63.0, 107.0, 161.0, 308.0, 534.0, 973.0, 1823.0, 3580.0, 7513.0, 17190.0, 42301.0, 121520.0, 461153.0, 264161.0, 75153.0, 28548.0, 12164.0, 5513.0, 2639.0, 1361.0, 699.0, 391.0, 199.0, 137.0, 67.0, 59.0, 38.0, 25.0, 16.0, 4.0, 6.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.95074462890625, -2.8682861328125, -2.78582763671875, -2.703369140625, -2.62091064453125, -2.5384521484375, -2.45599365234375, -2.37353515625, -2.29107666015625, -2.2086181640625, -2.12615966796875, -2.043701171875, -1.96124267578125, -1.8787841796875, -1.79632568359375, -1.7138671875, -1.63140869140625, -1.5489501953125, -1.46649169921875, -1.384033203125, -1.30157470703125, -1.2191162109375, -1.13665771484375, -1.05419921875, -0.97174072265625, -0.8892822265625, -0.80682373046875, -0.724365234375, -0.64190673828125, -0.5594482421875, -0.47698974609375, -0.39453125, -0.31207275390625, -0.2296142578125, -0.14715576171875, -0.064697265625, 0.01776123046875, 0.1002197265625, 0.18267822265625, 0.26513671875, 0.34759521484375, 0.4300537109375, 0.51251220703125, 0.594970703125, 0.67742919921875, 0.7598876953125, 0.84234619140625, 0.9248046875, 1.00726318359375, 1.0897216796875, 1.17218017578125, 1.254638671875, 1.33709716796875, 1.4195556640625, 1.50201416015625, 1.58447265625, 1.66693115234375, 1.7493896484375, 1.83184814453125, 1.914306640625, 1.99676513671875, 2.0792236328125, 2.16168212890625, 2.244140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 27.0, 20.0, 18.0, 32.0, 36.0, 55.0, 51.0, 62.0, 54.0, 68.0, 68.0, 80.0, 57.0, 74.0, 49.0, 49.0, 32.0, 26.0, 31.0, 20.0, 11.0, 11.0, 9.0, 6.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.35162353515625, -5.1915283203125, -5.03143310546875, -4.871337890625, -4.71124267578125, -4.5511474609375, -4.39105224609375, -4.23095703125, -4.07086181640625, -3.9107666015625, -3.75067138671875, -3.590576171875, -3.43048095703125, -3.2703857421875, -3.11029052734375, -2.9501953125, -2.79010009765625, -2.6300048828125, -2.46990966796875, -2.309814453125, -2.14971923828125, -1.9896240234375, -1.82952880859375, -1.66943359375, -1.50933837890625, -1.3492431640625, -1.18914794921875, -1.029052734375, -0.86895751953125, -0.7088623046875, -0.54876708984375, -0.388671875, -0.22857666015625, -0.0684814453125, 0.09161376953125, 0.251708984375, 0.41180419921875, 0.5718994140625, 0.73199462890625, 0.89208984375, 1.05218505859375, 1.2122802734375, 1.37237548828125, 1.532470703125, 1.69256591796875, 1.8526611328125, 2.01275634765625, 2.1728515625, 2.33294677734375, 2.4930419921875, 2.65313720703125, 2.813232421875, 2.97332763671875, 3.1334228515625, 3.29351806640625, 3.45361328125, 3.61370849609375, 3.7738037109375, 3.93389892578125, 4.093994140625, 4.25408935546875, 4.4141845703125, 4.57427978515625, 4.734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 13.0, 25.0, 31.0, 46.0, 85.0, 148.0, 255.0, 584.0, 1630.0, 5165.0, 21628.0, 121396.0, 724651.0, 139970.0, 24192.0, 5807.0, 1661.0, 600.0, 274.0, 119.0, 80.0, 53.0, 33.0, 29.0, 14.0, 17.0, 9.0, 3.0, 0.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.43359375, -3.29364013671875, -3.1536865234375, -3.01373291015625, -2.873779296875, -2.73382568359375, -2.5938720703125, -2.45391845703125, -2.31396484375, -2.17401123046875, -2.0340576171875, -1.89410400390625, -1.754150390625, -1.61419677734375, -1.4742431640625, -1.33428955078125, -1.1943359375, -1.05438232421875, -0.9144287109375, -0.77447509765625, -0.634521484375, -0.49456787109375, -0.3546142578125, -0.21466064453125, -0.07470703125, 0.06524658203125, 0.2052001953125, 0.34515380859375, 0.485107421875, 0.62506103515625, 0.7650146484375, 0.90496826171875, 1.044921875, 1.18487548828125, 1.3248291015625, 1.46478271484375, 1.604736328125, 1.74468994140625, 1.8846435546875, 2.02459716796875, 2.16455078125, 2.30450439453125, 2.4444580078125, 2.58441162109375, 2.724365234375, 2.86431884765625, 3.0042724609375, 3.14422607421875, 3.2841796875, 3.42413330078125, 3.5640869140625, 3.70404052734375, 3.843994140625, 3.98394775390625, 4.1239013671875, 4.26385498046875, 4.40380859375, 4.54376220703125, 4.6837158203125, 4.82366943359375, 4.963623046875, 5.10357666015625, 5.2435302734375, 5.38348388671875, 5.5234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 11.0, 17.0, 12.0, 15.0, 25.0, 28.0, 26.0, 26.0, 38.0, 50.0, 58.0, 37.0, 61.0, 60.0, 54.0, 60.0, 42.0, 70.0, 36.0, 45.0, 34.0, 30.0, 23.0, 30.0, 26.0, 12.0, 10.0, 13.0, 8.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25390625, -5.080810546875, -4.90771484375, -4.734619140625, -4.5615234375, -4.388427734375, -4.21533203125, -4.042236328125, -3.869140625, -3.696044921875, -3.52294921875, -3.349853515625, -3.1767578125, -3.003662109375, -2.83056640625, -2.657470703125, -2.484375, -2.311279296875, -2.13818359375, -1.965087890625, -1.7919921875, -1.618896484375, -1.44580078125, -1.272705078125, -1.099609375, -0.926513671875, -0.75341796875, -0.580322265625, -0.4072265625, -0.234130859375, -0.06103515625, 0.112060546875, 0.28515625, 0.458251953125, 0.63134765625, 0.804443359375, 0.9775390625, 1.150634765625, 1.32373046875, 1.496826171875, 1.669921875, 1.843017578125, 2.01611328125, 2.189208984375, 2.3623046875, 2.535400390625, 2.70849609375, 2.881591796875, 3.0546875, 3.227783203125, 3.40087890625, 3.573974609375, 3.7470703125, 3.920166015625, 4.09326171875, 4.266357421875, 4.439453125, 4.612548828125, 4.78564453125, 4.958740234375, 5.1318359375, 5.304931640625, 5.47802734375, 5.651123046875, 5.82421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 11.0, 18.0, 28.0, 41.0, 50.0, 117.0, 175.0, 362.0, 802.0, 1809.0, 5402.0, 18549.0, 90802.0, 606331.0, 264820.0, 43245.0, 10326.0, 3210.0, 1269.0, 545.0, 265.0, 148.0, 87.0, 63.0, 20.0, 15.0, 14.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1215362548828125, -1.078033447265625, -1.0345306396484375, -0.99102783203125, -0.9475250244140625, -0.904022216796875, -0.8605194091796875, -0.8170166015625, -0.7735137939453125, -0.730010986328125, -0.6865081787109375, -0.64300537109375, -0.5995025634765625, -0.555999755859375, -0.5124969482421875, -0.468994140625, -0.4254913330078125, -0.381988525390625, -0.3384857177734375, -0.29498291015625, -0.2514801025390625, -0.207977294921875, -0.1644744873046875, -0.1209716796875, -0.0774688720703125, -0.033966064453125, 0.0095367431640625, 0.05303955078125, 0.0965423583984375, 0.140045166015625, 0.1835479736328125, 0.22705078125, 0.2705535888671875, 0.314056396484375, 0.3575592041015625, 0.40106201171875, 0.4445648193359375, 0.488067626953125, 0.5315704345703125, 0.5750732421875, 0.6185760498046875, 0.662078857421875, 0.7055816650390625, 0.74908447265625, 0.7925872802734375, 0.836090087890625, 0.8795928955078125, 0.923095703125, 0.9665985107421875, 1.010101318359375, 1.0536041259765625, 1.09710693359375, 1.1406097412109375, 1.184112548828125, 1.2276153564453125, 1.2711181640625, 1.3146209716796875, 1.358123779296875, 1.4016265869140625, 1.44512939453125, 1.4886322021484375, 1.532135009765625, 1.5756378173828125, 1.619140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 9.0, 19.0, 26.0, 39.0, 54.0, 82.0, 96.0, 125.0, 156.0, 106.0, 81.0, 51.0, 39.0, 20.0, 14.0, 21.0, 4.0, 13.0, 4.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0003135204315185547, -0.0003062523901462555, -0.0002989843487739563, -0.0002917163074016571, -0.0002844482660293579, -0.0002771802246570587, -0.0002699121832847595, -0.00026264414191246033, -0.00025537610054016113, -0.00024810805916786194, -0.00024084001779556274, -0.00023357197642326355, -0.00022630393505096436, -0.00021903589367866516, -0.00021176785230636597, -0.00020449981093406677, -0.00019723176956176758, -0.00018996372818946838, -0.0001826956868171692, -0.00017542764544487, -0.0001681596040725708, -0.0001608915627002716, -0.0001536235213279724, -0.00014635547995567322, -0.00013908743858337402, -0.00013181939721107483, -0.00012455135583877563, -0.00011728331446647644, -0.00011001527309417725, -0.00010274723172187805, -9.547919034957886e-05, -8.821114897727966e-05, -8.094310760498047e-05, -7.367506623268127e-05, -6.640702486038208e-05, -5.9138983488082886e-05, -5.187094211578369e-05, -4.46029007434845e-05, -3.73348593711853e-05, -3.006681799888611e-05, -2.2798776626586914e-05, -1.553073525428772e-05, -8.262693881988525e-06, -9.94652509689331e-07, 6.273388862609863e-06, 1.3541430234909058e-05, 2.0809471607208252e-05, 2.8077512979507446e-05, 3.534555435180664e-05, 4.2613595724105835e-05, 4.988163709640503e-05, 5.7149678468704224e-05, 6.441771984100342e-05, 7.168576121330261e-05, 7.89538025856018e-05, 8.6221843957901e-05, 9.34898853302002e-05, 0.00010075792670249939, 0.00010802596807479858, 0.00011529400944709778, 0.00012256205081939697, 0.00012983009219169617, 0.00013709813356399536, 0.00014436617493629456, 0.00015163421630859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 8.0, 12.0, 11.0, 16.0, 27.0, 38.0, 57.0, 148.0, 256.0, 578.0, 1461.0, 3741.0, 10680.0, 35543.0, 165314.0, 616802.0, 161938.0, 34991.0, 10597.0, 3639.0, 1472.0, 625.0, 279.0, 135.0, 60.0, 49.0, 22.0, 9.0, 12.0, 4.0, 1.0, 10.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.451171875, -1.411407470703125, -1.37164306640625, -1.331878662109375, -1.2921142578125, -1.252349853515625, -1.21258544921875, -1.172821044921875, -1.133056640625, -1.093292236328125, -1.05352783203125, -1.013763427734375, -0.9739990234375, -0.934234619140625, -0.89447021484375, -0.854705810546875, -0.81494140625, -0.775177001953125, -0.73541259765625, -0.695648193359375, -0.6558837890625, -0.616119384765625, -0.57635498046875, -0.536590576171875, -0.496826171875, -0.457061767578125, -0.41729736328125, -0.377532958984375, -0.3377685546875, -0.298004150390625, -0.25823974609375, -0.218475341796875, -0.1787109375, -0.138946533203125, -0.09918212890625, -0.059417724609375, -0.0196533203125, 0.020111083984375, 0.05987548828125, 0.099639892578125, 0.139404296875, 0.179168701171875, 0.21893310546875, 0.258697509765625, 0.2984619140625, 0.338226318359375, 0.37799072265625, 0.417755126953125, 0.45751953125, 0.497283935546875, 0.53704833984375, 0.576812744140625, 0.6165771484375, 0.656341552734375, 0.69610595703125, 0.735870361328125, 0.775634765625, 0.815399169921875, 0.85516357421875, 0.894927978515625, 0.9346923828125, 0.974456787109375, 1.01422119140625, 1.053985595703125, 1.09375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 7.0, 15.0, 14.0, 28.0, 37.0, 34.0, 49.0, 59.0, 75.0, 125.0, 146.0, 101.0, 68.0, 43.0, 35.0, 38.0, 25.0, 17.0, 12.0, 16.0, 3.0, 7.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56396484375, -0.543243408203125, -0.52252197265625, -0.501800537109375, -0.4810791015625, -0.460357666015625, -0.43963623046875, -0.418914794921875, -0.398193359375, -0.377471923828125, -0.35675048828125, -0.336029052734375, -0.3153076171875, -0.294586181640625, -0.27386474609375, -0.253143310546875, -0.232421875, -0.211700439453125, -0.19097900390625, -0.170257568359375, -0.1495361328125, -0.128814697265625, -0.10809326171875, -0.087371826171875, -0.066650390625, -0.045928955078125, -0.02520751953125, -0.004486083984375, 0.0162353515625, 0.036956787109375, 0.05767822265625, 0.078399658203125, 0.09912109375, 0.119842529296875, 0.14056396484375, 0.161285400390625, 0.1820068359375, 0.202728271484375, 0.22344970703125, 0.244171142578125, 0.264892578125, 0.285614013671875, 0.30633544921875, 0.327056884765625, 0.3477783203125, 0.368499755859375, 0.38922119140625, 0.409942626953125, 0.4306640625, 0.451385498046875, 0.47210693359375, 0.492828369140625, 0.5135498046875, 0.534271240234375, 0.55499267578125, 0.575714111328125, 0.596435546875, 0.617156982421875, 0.63787841796875, 0.658599853515625, 0.6793212890625, 0.700042724609375, 0.72076416015625, 0.741485595703125, 0.76220703125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 17.0, 89.0, 197.0, 375.0, 215.0, 77.0, 23.0, 9.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4956693649292, -7.688922882080078, -6.882176399230957, -6.075429916381836, -5.268683433532715, -4.461937427520752, -3.655190944671631, -2.8484444618225098, -2.0416979789733887, -1.2349514961242676, -0.42820513248443604, 0.3785412311553955, 1.1852877140045166, 1.9920339584350586, 2.7987804412841797, 3.605526924133301, 4.412273406982422, 5.219019889831543, 6.025766372680664, 6.832512855529785, 7.639259338378906, 8.446004867553711, 9.252752304077148, 10.059497833251953, 10.86624526977539, 11.672991752624512, 12.479738235473633, 13.286484718322754, 14.093231201171875, 14.89997673034668, 15.706724166870117, 16.513469696044922, 17.320215225219727, 18.12696075439453, 18.93370819091797, 19.740453720092773, 20.54720115661621, 21.353946685791016, 22.160694122314453, 22.967439651489258, 23.774187088012695, 24.5809326171875, 25.387680053710938, 26.194425582885742, 27.00117301940918, 27.807918548583984, 28.614665985107422, 29.421411514282227, 30.22815704345703, 31.034902572631836, 31.841650009155273, 32.64839553833008, 33.455142974853516, 34.26189041137695, 35.068634033203125, 35.87538146972656, 36.68212890625, 37.48887634277344, 38.29561996459961, 39.10236740112305, 39.909114837646484, 40.71586227416992, 41.522605895996094, 42.32935333251953, 43.13610076904297]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 1.0, 7.0, 10.0, 8.0, 5.0, 8.0, 6.0, 15.0, 13.0, 12.0, 11.0, 20.0, 18.0, 40.0, 37.0, 35.0, 38.0, 45.0, 35.0, 40.0, 43.0, 49.0, 43.0, 47.0, 35.0, 38.0, 55.0, 35.0, 27.0, 43.0, 22.0, 27.0, 27.0, 18.0, 17.0, 17.0, 8.0, 10.0, 9.0, 14.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.425134658813477, -8.175859451293945, -7.926583766937256, -7.677308559417725, -7.428032875061035, -7.178757667541504, -6.929482460021973, -6.680206775665283, -6.430931091308594, -6.1816558837890625, -5.932380199432373, -5.683104991912842, -5.433829307556152, -5.184554100036621, -4.93527889251709, -4.6860032081604, -4.436728000640869, -4.187452793121338, -3.9381771087646484, -3.688901901245117, -3.4396262168884277, -3.1903510093688965, -2.941075563430786, -2.691800117492676, -2.4425246715545654, -2.193249225616455, -1.9439737796783447, -1.694698452949524, -1.4454230070114136, -1.1961475610733032, -0.9468722343444824, -0.6975967884063721, -0.4483218193054199, -0.19904640316963196, 0.050229012966156006, 0.2995043992996216, 0.5487798452377319, 0.7980552911758423, 1.047330617904663, 1.2966060638427734, 1.5458815097808838, 1.7951569557189941, 2.0444324016571045, 2.293707847595215, 2.542983055114746, 2.7922587394714355, 3.041533946990967, 3.290809392929077, 3.5400848388671875, 3.789360284805298, 4.038635730743408, 4.2879109382629395, 4.537186622619629, 4.78646183013916, 5.035737037658691, 5.285012722015381, 5.53428840637207, 5.783563613891602, 6.032839298248291, 6.282114505767822, 6.531390190124512, 6.780665397644043, 7.029940605163574, 7.279216289520264, 7.528491497039795]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 6.0, 10.0, 6.0, 13.0, 11.0, 12.0, 22.0, 34.0, 35.0, 41.0, 47.0, 98.0, 158.0, 235.0, 470.0, 882.0, 2131.0, 5845.0, 19552.0, 92863.0, 1040458.0, 2778259.0, 203292.0, 34167.0, 9436.0, 3219.0, 1338.0, 647.0, 336.0, 199.0, 125.0, 76.0, 58.0, 42.0, 38.0, 14.0, 28.0, 17.0, 7.0, 6.0, 12.0, 2.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.4296875, -4.2921142578125, -4.154541015625, -4.0169677734375, -3.87939453125, -3.7418212890625, -3.604248046875, -3.4666748046875, -3.3291015625, -3.1915283203125, -3.053955078125, -2.9163818359375, -2.77880859375, -2.6412353515625, -2.503662109375, -2.3660888671875, -2.228515625, -2.0909423828125, -1.953369140625, -1.8157958984375, -1.67822265625, -1.5406494140625, -1.403076171875, -1.2655029296875, -1.1279296875, -0.9903564453125, -0.852783203125, -0.7152099609375, -0.57763671875, -0.4400634765625, -0.302490234375, -0.1649169921875, -0.02734375, 0.1102294921875, 0.247802734375, 0.3853759765625, 0.52294921875, 0.6605224609375, 0.798095703125, 0.9356689453125, 1.0732421875, 1.2108154296875, 1.348388671875, 1.4859619140625, 1.62353515625, 1.7611083984375, 1.898681640625, 2.0362548828125, 2.173828125, 2.3114013671875, 2.448974609375, 2.5865478515625, 2.72412109375, 2.8616943359375, 2.999267578125, 3.1368408203125, 3.2744140625, 3.4119873046875, 3.549560546875, 3.6871337890625, 3.82470703125, 3.9622802734375, 4.099853515625, 4.2374267578125, 4.375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 17.0, 7.0, 15.0, 30.0, 26.0, 35.0, 43.0, 47.0, 57.0, 59.0, 62.0, 60.0, 59.0, 60.0, 71.0, 57.0, 62.0, 42.0, 43.0, 30.0, 22.0, 21.0, 13.0, 10.0, 7.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.306640625, -2.24310302734375, -2.1795654296875, -2.11602783203125, -2.052490234375, -1.98895263671875, -1.9254150390625, -1.86187744140625, -1.79833984375, -1.73480224609375, -1.6712646484375, -1.60772705078125, -1.544189453125, -1.48065185546875, -1.4171142578125, -1.35357666015625, -1.2900390625, -1.22650146484375, -1.1629638671875, -1.09942626953125, -1.035888671875, -0.97235107421875, -0.9088134765625, -0.84527587890625, -0.78173828125, -0.71820068359375, -0.6546630859375, -0.59112548828125, -0.527587890625, -0.46405029296875, -0.4005126953125, -0.33697509765625, -0.2734375, -0.20989990234375, -0.1463623046875, -0.08282470703125, -0.019287109375, 0.04425048828125, 0.1077880859375, 0.17132568359375, 0.23486328125, 0.29840087890625, 0.3619384765625, 0.42547607421875, 0.489013671875, 0.55255126953125, 0.6160888671875, 0.67962646484375, 0.7431640625, 0.80670166015625, 0.8702392578125, 0.93377685546875, 0.997314453125, 1.06085205078125, 1.1243896484375, 1.18792724609375, 1.25146484375, 1.31500244140625, 1.3785400390625, 1.44207763671875, 1.505615234375, 1.56915283203125, 1.6326904296875, 1.69622802734375, 1.759765625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 7.0, 6.0, 11.0, 19.0, 15.0, 26.0, 41.0, 52.0, 107.0, 206.0, 442.0, 1247.0, 5468.0, 47873.0, 1403118.0, 2651573.0, 74034.0, 7572.0, 1501.0, 453.0, 216.0, 106.0, 62.0, 40.0, 20.0, 27.0, 10.0, 12.0, 6.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.58392333984375, -7.3475341796875, -7.11114501953125, -6.874755859375, -6.63836669921875, -6.4019775390625, -6.16558837890625, -5.92919921875, -5.69281005859375, -5.4564208984375, -5.22003173828125, -4.983642578125, -4.74725341796875, -4.5108642578125, -4.27447509765625, -4.0380859375, -3.80169677734375, -3.5653076171875, -3.32891845703125, -3.092529296875, -2.85614013671875, -2.6197509765625, -2.38336181640625, -2.14697265625, -1.91058349609375, -1.6741943359375, -1.43780517578125, -1.201416015625, -0.96502685546875, -0.7286376953125, -0.49224853515625, -0.255859375, -0.01947021484375, 0.2169189453125, 0.45330810546875, 0.689697265625, 0.92608642578125, 1.1624755859375, 1.39886474609375, 1.63525390625, 1.87164306640625, 2.1080322265625, 2.34442138671875, 2.580810546875, 2.81719970703125, 3.0535888671875, 3.28997802734375, 3.5263671875, 3.76275634765625, 3.9991455078125, 4.23553466796875, 4.471923828125, 4.70831298828125, 4.9447021484375, 5.18109130859375, 5.41748046875, 5.65386962890625, 5.8902587890625, 6.12664794921875, 6.363037109375, 6.59942626953125, 6.8358154296875, 7.07220458984375, 7.30859375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 5.0, 13.0, 19.0, 17.0, 32.0, 46.0, 60.0, 93.0, 120.0, 200.0, 317.0, 487.0, 645.0, 690.0, 395.0, 301.0, 188.0, 135.0, 104.0, 61.0, 43.0, 31.0, 21.0, 8.0, 15.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.4495391845703125, -1.401031494140625, -1.3525238037109375, -1.30401611328125, -1.2555084228515625, -1.207000732421875, -1.1584930419921875, -1.1099853515625, -1.0614776611328125, -1.012969970703125, -0.9644622802734375, -0.91595458984375, -0.8674468994140625, -0.818939208984375, -0.7704315185546875, -0.721923828125, -0.6734161376953125, -0.624908447265625, -0.5764007568359375, -0.52789306640625, -0.4793853759765625, -0.430877685546875, -0.3823699951171875, -0.3338623046875, -0.2853546142578125, -0.236846923828125, -0.1883392333984375, -0.13983154296875, -0.0913238525390625, -0.042816162109375, 0.0056915283203125, 0.05419921875, 0.1027069091796875, 0.151214599609375, 0.1997222900390625, 0.24822998046875, 0.2967376708984375, 0.345245361328125, 0.3937530517578125, 0.4422607421875, 0.4907684326171875, 0.539276123046875, 0.5877838134765625, 0.63629150390625, 0.6847991943359375, 0.733306884765625, 0.7818145751953125, 0.830322265625, 0.8788299560546875, 0.927337646484375, 0.9758453369140625, 1.02435302734375, 1.0728607177734375, 1.121368408203125, 1.1698760986328125, 1.2183837890625, 1.2668914794921875, 1.315399169921875, 1.3639068603515625, 1.41241455078125, 1.4609222412109375, 1.509429931640625, 1.5579376220703125, 1.6064453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 11.0, 11.0, 17.0, 18.0, 20.0, 33.0, 35.0, 36.0, 36.0, 57.0, 51.0, 59.0, 63.0, 63.0, 56.0, 58.0, 59.0, 39.0, 45.0, 45.0, 33.0, 30.0, 19.0, 24.0, 14.0, 12.0, 11.0, 3.0, 12.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8021485805511475, -3.694023847579956, -3.5858988761901855, -3.477774143218994, -3.3696494102478027, -3.2615246772766113, -3.153399705886841, -3.0452749729156494, -2.937150001525879, -2.8290252685546875, -2.720900297164917, -2.6127755641937256, -2.504650831222534, -2.3965258598327637, -2.2884011268615723, -2.180276393890381, -2.0721516609191895, -1.9640268087387085, -1.855902075767517, -1.7477772235870361, -1.6396524906158447, -1.5315276384353638, -1.4234027862548828, -1.3152780532836914, -1.2071532011032104, -1.0990283489227295, -0.9909036159515381, -0.8827787637710571, -0.774653971195221, -0.6665291786193848, -0.5584043264389038, -0.4502795338630676, -0.34215450286865234, -0.23402969539165497, -0.1259048879146576, -0.017780065536499023, 0.09034472703933716, 0.19846951961517334, 0.3065943717956543, 0.4147191643714905, 0.5228439569473267, 0.6309687495231628, 0.739093542098999, 0.84721839427948, 0.9553431868553162, 1.0634679794311523, 1.1715928316116333, 1.2797176837921143, 1.3878424167633057, 1.4959672689437866, 1.604092001914978, 1.712216854095459, 1.8203415870666504, 1.9284664392471313, 2.0365912914276123, 2.1447160243988037, 2.252840995788574, 2.3609657287597656, 2.469090700149536, 2.5772154331207275, 2.685340166091919, 2.7934651374816895, 2.901589870452881, 3.0097146034240723, 3.1178393363952637]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 7.0, 11.0, 13.0, 19.0, 17.0, 17.0, 25.0, 32.0, 23.0, 32.0, 36.0, 26.0, 21.0, 37.0, 33.0, 41.0, 49.0, 37.0, 40.0, 29.0, 30.0, 39.0, 38.0, 24.0, 28.0, 24.0, 45.0, 24.0, 25.0, 16.0, 22.0, 25.0, 20.0, 10.0, 16.0, 9.0, 12.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.507863998413086, -2.4301974773406982, -2.3525309562683105, -2.2748641967773438, -2.197197675704956, -2.1195311546325684, -2.0418646335601807, -1.964198112487793, -1.8865314722061157, -1.808864951133728, -1.7311983108520508, -1.653531789779663, -1.5758652687072754, -1.4981986284255981, -1.4205321073532104, -1.3428654670715332, -1.2651989459991455, -1.1875324249267578, -1.1098657846450806, -1.0321992635726929, -0.9545326828956604, -0.8768661022186279, -0.7991995811462402, -0.7215330004692078, -0.6438664197921753, -0.5661998391151428, -0.48853328824043274, -0.41086673736572266, -0.3332001566886902, -0.2555335760116577, -0.17786702513694763, -0.10020047426223755, -0.022533893585205078, 0.0551326721906662, 0.13279923796653748, 0.21046580374240875, 0.28813236951828003, 0.3657989501953125, 0.4434655010700226, 0.5211320519447327, 0.5987986326217651, 0.6764652132987976, 0.7541317939758301, 0.8317983150482178, 0.9094648957252502, 0.9871314764022827, 1.0647979974746704, 1.1424646377563477, 1.2201311588287354, 1.297797679901123, 1.3754643201828003, 1.453130841255188, 1.5307974815368652, 1.608464002609253, 1.6861305236816406, 1.7637970447540283, 1.8414636850357056, 1.9191302061080933, 1.9967968463897705, 2.074463367462158, 2.152129888534546, 2.2297964096069336, 2.3074631690979004, 2.385129690170288, 2.462796211242676]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 9.0, 17.0, 16.0, 15.0, 29.0, 31.0, 42.0, 60.0, 72.0, 100.0, 117.0, 175.0, 239.0, 392.0, 662.0, 1677.0, 7494.0, 187463.0, 814050.0, 29974.0, 3229.0, 1026.0, 506.0, 312.0, 210.0, 145.0, 104.0, 87.0, 54.0, 50.0, 36.0, 27.0, 28.0, 18.0, 17.0, 10.0, 4.0, 8.0, 9.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.849609375, -0.8224258422851562, -0.7952423095703125, -0.7680587768554688, -0.740875244140625, -0.7136917114257812, -0.6865081787109375, -0.6593246459960938, -0.63214111328125, -0.6049575805664062, -0.5777740478515625, -0.5505905151367188, -0.523406982421875, -0.49622344970703125, -0.4690399169921875, -0.44185638427734375, -0.4146728515625, -0.38748931884765625, -0.3603057861328125, -0.33312225341796875, -0.305938720703125, -0.27875518798828125, -0.2515716552734375, -0.22438812255859375, -0.19720458984375, -0.17002105712890625, -0.1428375244140625, -0.11565399169921875, -0.088470458984375, -0.06128692626953125, -0.0341033935546875, -0.00691986083984375, 0.020263671875, 0.04744720458984375, 0.0746307373046875, 0.10181427001953125, 0.128997802734375, 0.15618133544921875, 0.1833648681640625, 0.21054840087890625, 0.23773193359375, 0.26491546630859375, 0.2920989990234375, 0.31928253173828125, 0.346466064453125, 0.37364959716796875, 0.4008331298828125, 0.42801666259765625, 0.4552001953125, 0.48238372802734375, 0.5095672607421875, 0.5367507934570312, 0.563934326171875, 0.5911178588867188, 0.6183013916015625, 0.6454849243164062, 0.67266845703125, 0.6998519897460938, 0.7270355224609375, 0.7542190551757812, 0.781402587890625, 0.8085861206054688, 0.8357696533203125, 0.8629531860351562, 0.89013671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 9.0, 9.0, 5.0, 13.0, 18.0, 17.0, 16.0, 25.0, 19.0, 35.0, 28.0, 33.0, 35.0, 30.0, 40.0, 40.0, 37.0, 34.0, 38.0, 43.0, 41.0, 37.0, 35.0, 29.0, 32.0, 28.0, 34.0, 27.0, 31.0, 28.0, 18.0, 22.0, 21.0, 16.0, 10.0, 10.0, 8.0, 10.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-1.861328125, -1.8066864013671875, -1.752044677734375, -1.6974029541015625, -1.64276123046875, -1.5881195068359375, -1.533477783203125, -1.4788360595703125, -1.4241943359375, -1.3695526123046875, -1.314910888671875, -1.2602691650390625, -1.20562744140625, -1.1509857177734375, -1.096343994140625, -1.0417022705078125, -0.987060546875, -0.9324188232421875, -0.877777099609375, -0.8231353759765625, -0.76849365234375, -0.7138519287109375, -0.659210205078125, -0.6045684814453125, -0.5499267578125, -0.4952850341796875, -0.440643310546875, -0.3860015869140625, -0.33135986328125, -0.2767181396484375, -0.222076416015625, -0.1674346923828125, -0.11279296875, -0.0581512451171875, -0.003509521484375, 0.0511322021484375, 0.10577392578125, 0.1604156494140625, 0.215057373046875, 0.2696990966796875, 0.3243408203125, 0.3789825439453125, 0.433624267578125, 0.4882659912109375, 0.54290771484375, 0.5975494384765625, 0.652191162109375, 0.7068328857421875, 0.761474609375, 0.8161163330078125, 0.870758056640625, 0.9253997802734375, 0.98004150390625, 1.0346832275390625, 1.089324951171875, 1.1439666748046875, 1.1986083984375, 1.2532501220703125, 1.307891845703125, 1.3625335693359375, 1.41717529296875, 1.4718170166015625, 1.526458740234375, 1.5811004638671875, 1.6357421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 10.0, 6.0, 14.0, 14.0, 20.0, 19.0, 24.0, 31.0, 44.0, 48.0, 57.0, 83.0, 84.0, 114.0, 162.0, 248.0, 324.0, 563.0, 1242.0, 6709.0, 66522.0, 619126.0, 319244.0, 27679.0, 3610.0, 880.0, 463.0, 281.0, 196.0, 143.0, 116.0, 103.0, 90.0, 59.0, 42.0, 42.0, 36.0, 24.0, 16.0, 18.0, 9.0, 14.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.4150390625, -0.4015693664550781, -0.38809967041015625, -0.3746299743652344, -0.3611602783203125, -0.3476905822753906, -0.33422088623046875, -0.3207511901855469, -0.307281494140625, -0.2938117980957031, -0.28034210205078125, -0.2668724060058594, -0.2534027099609375, -0.23993301391601562, -0.22646331787109375, -0.21299362182617188, -0.19952392578125, -0.18605422973632812, -0.17258453369140625, -0.15911483764648438, -0.1456451416015625, -0.13217544555664062, -0.11870574951171875, -0.10523605346679688, -0.091766357421875, -0.07829666137695312, -0.06482696533203125, -0.051357269287109375, -0.0378875732421875, -0.024417877197265625, -0.01094818115234375, 0.002521514892578125, 0.0159912109375, 0.029460906982421875, 0.04293060302734375, 0.056400299072265625, 0.0698699951171875, 0.08333969116210938, 0.09680938720703125, 0.11027908325195312, 0.123748779296875, 0.13721847534179688, 0.15068817138671875, 0.16415786743164062, 0.1776275634765625, 0.19109725952148438, 0.20456695556640625, 0.21803665161132812, 0.23150634765625, 0.24497604370117188, 0.25844573974609375, 0.2719154357910156, 0.2853851318359375, 0.2988548278808594, 0.31232452392578125, 0.3257942199707031, 0.339263916015625, 0.3527336120605469, 0.36620330810546875, 0.3796730041503906, 0.3931427001953125, 0.4066123962402344, 0.42008209228515625, 0.4335517883300781, 0.447021484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 7.0, 5.0, 9.0, 15.0, 13.0, 20.0, 22.0, 25.0, 20.0, 28.0, 37.0, 37.0, 29.0, 33.0, 52.0, 47.0, 38.0, 50.0, 36.0, 48.0, 45.0, 40.0, 47.0, 43.0, 29.0, 27.0, 22.0, 20.0, 29.0, 21.0, 20.0, 9.0, 13.0, 16.0, 7.0, 8.0, 2.0, 5.0, 5.0, 2.0, 0.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73046875, -3.59600830078125, -3.4615478515625, -3.32708740234375, -3.192626953125, -3.05816650390625, -2.9237060546875, -2.78924560546875, -2.65478515625, -2.52032470703125, -2.3858642578125, -2.25140380859375, -2.116943359375, -1.98248291015625, -1.8480224609375, -1.71356201171875, -1.5791015625, -1.44464111328125, -1.3101806640625, -1.17572021484375, -1.041259765625, -0.90679931640625, -0.7723388671875, -0.63787841796875, -0.50341796875, -0.36895751953125, -0.2344970703125, -0.10003662109375, 0.034423828125, 0.16888427734375, 0.3033447265625, 0.43780517578125, 0.572265625, 0.70672607421875, 0.8411865234375, 0.97564697265625, 1.110107421875, 1.24456787109375, 1.3790283203125, 1.51348876953125, 1.64794921875, 1.78240966796875, 1.9168701171875, 2.05133056640625, 2.185791015625, 2.32025146484375, 2.4547119140625, 2.58917236328125, 2.7236328125, 2.85809326171875, 2.9925537109375, 3.12701416015625, 3.261474609375, 3.39593505859375, 3.5303955078125, 3.66485595703125, 3.79931640625, 3.93377685546875, 4.0682373046875, 4.20269775390625, 4.337158203125, 4.47161865234375, 4.6060791015625, 4.74053955078125, 4.875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 6.0, 11.0, 10.0, 14.0, 20.0, 19.0, 16.0, 31.0, 40.0, 73.0, 98.0, 164.0, 293.0, 708.0, 2583.0, 34644.0, 992516.0, 14293.0, 1740.0, 517.0, 266.0, 145.0, 82.0, 57.0, 48.0, 28.0, 23.0, 19.0, 14.0, 11.0, 10.0, 11.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.15114974975585938, -0.14519500732421875, -0.13924026489257812, -0.1332855224609375, -0.12733078002929688, -0.12137603759765625, -0.11542129516601562, -0.109466552734375, -0.10351181030273438, -0.09755706787109375, -0.09160232543945312, -0.0856475830078125, -0.07969284057617188, -0.07373809814453125, -0.06778335571289062, -0.06182861328125, -0.055873870849609375, -0.04991912841796875, -0.043964385986328125, -0.0380096435546875, -0.032054901123046875, -0.02610015869140625, -0.020145416259765625, -0.014190673828125, -0.008235931396484375, -0.00228118896484375, 0.003673553466796875, 0.0096282958984375, 0.015583038330078125, 0.02153778076171875, 0.027492523193359375, 0.033447265625, 0.039402008056640625, 0.04535675048828125, 0.051311492919921875, 0.0572662353515625, 0.06322097778320312, 0.06917572021484375, 0.07513046264648438, 0.081085205078125, 0.08703994750976562, 0.09299468994140625, 0.09894943237304688, 0.1049041748046875, 0.11085891723632812, 0.11681365966796875, 0.12276840209960938, 0.12872314453125, 0.13467788696289062, 0.14063262939453125, 0.14658737182617188, 0.1525421142578125, 0.15849685668945312, 0.16445159912109375, 0.17040634155273438, 0.176361083984375, 0.18231582641601562, 0.18827056884765625, 0.19422531127929688, 0.2001800537109375, 0.20613479614257812, 0.21208953857421875, 0.21804428100585938, 0.2239990234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 9.0, 13.0, 17.0, 19.0, 30.0, 31.0, 64.0, 91.0, 119.0, 157.0, 118.0, 85.0, 65.0, 46.0, 33.0, 25.0, 16.0, 13.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29425048828125e-05, -6.073620170354843e-05, -5.852989852428436e-05, -5.6323595345020294e-05, -5.4117292165756226e-05, -5.191098898649216e-05, -4.970468580722809e-05, -4.749838262796402e-05, -4.529207944869995e-05, -4.308577626943588e-05, -4.0879473090171814e-05, -3.8673169910907745e-05, -3.646686673164368e-05, -3.426056355237961e-05, -3.205426037311554e-05, -2.984795719385147e-05, -2.7641654014587402e-05, -2.5435350835323334e-05, -2.3229047656059265e-05, -2.1022744476795197e-05, -1.8816441297531128e-05, -1.661013811826706e-05, -1.440383493900299e-05, -1.2197531759738922e-05, -9.991228580474854e-06, -7.784925401210785e-06, -5.578622221946716e-06, -3.3723190426826477e-06, -1.166015863418579e-06, 1.0402873158454895e-06, 3.246590495109558e-06, 5.452893674373627e-06, 7.659196853637695e-06, 9.865500032901764e-06, 1.2071803212165833e-05, 1.4278106391429901e-05, 1.648440957069397e-05, 1.869071274995804e-05, 2.0897015929222107e-05, 2.3103319108486176e-05, 2.5309622287750244e-05, 2.7515925467014313e-05, 2.972222864627838e-05, 3.192853182554245e-05, 3.413483500480652e-05, 3.634113818407059e-05, 3.8547441363334656e-05, 4.0753744542598724e-05, 4.296004772186279e-05, 4.516635090112686e-05, 4.737265408039093e-05, 4.9578957259655e-05, 5.178526043891907e-05, 5.3991563618183136e-05, 5.6197866797447205e-05, 5.840416997671127e-05, 6.061047315597534e-05, 6.281677633523941e-05, 6.502307951450348e-05, 6.722938269376755e-05, 6.943568587303162e-05, 7.164198905229568e-05, 7.384829223155975e-05, 7.605459541082382e-05, 7.826089859008789e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 11.0, 7.0, 12.0, 16.0, 16.0, 33.0, 34.0, 58.0, 68.0, 112.0, 138.0, 205.0, 317.0, 430.0, 696.0, 1007.0, 1732.0, 3044.0, 6033.0, 12634.0, 34662.0, 157051.0, 672271.0, 106952.0, 27653.0, 10860.0, 5271.0, 2761.0, 1609.0, 975.0, 593.0, 380.0, 273.0, 183.0, 129.0, 88.0, 61.0, 46.0, 40.0, 29.0, 28.0, 10.0, 11.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.09027099609375, -0.087646484375, -0.08502197265625, -0.0823974609375, -0.07977294921875, -0.0771484375, -0.07452392578125, -0.0718994140625, -0.06927490234375, -0.066650390625, -0.06402587890625, -0.0614013671875, -0.05877685546875, -0.05615234375, -0.05352783203125, -0.0509033203125, -0.04827880859375, -0.045654296875, -0.04302978515625, -0.0404052734375, -0.03778076171875, -0.03515625, -0.03253173828125, -0.0299072265625, -0.02728271484375, -0.024658203125, -0.02203369140625, -0.0194091796875, -0.01678466796875, -0.01416015625, -0.01153564453125, -0.0089111328125, -0.00628662109375, -0.003662109375, -0.00103759765625, 0.0015869140625, 0.00421142578125, 0.0068359375, 0.00946044921875, 0.0120849609375, 0.01470947265625, 0.017333984375, 0.01995849609375, 0.0225830078125, 0.02520751953125, 0.02783203125, 0.03045654296875, 0.0330810546875, 0.03570556640625, 0.038330078125, 0.04095458984375, 0.0435791015625, 0.04620361328125, 0.048828125, 0.05145263671875, 0.0540771484375, 0.05670166015625, 0.059326171875, 0.06195068359375, 0.0645751953125, 0.06719970703125, 0.06982421875, 0.07244873046875, 0.0750732421875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 8.0, 17.0, 22.0, 29.0, 46.0, 75.0, 95.0, 208.0, 167.0, 82.0, 62.0, 44.0, 35.0, 26.0, 8.0, 18.0, 5.0, 5.0, 8.0, 2.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025970458984375, -0.02517986297607422, -0.024389266967773438, -0.023598670959472656, -0.022808074951171875, -0.022017478942871094, -0.021226882934570312, -0.02043628692626953, -0.01964569091796875, -0.01885509490966797, -0.018064498901367188, -0.017273902893066406, -0.016483306884765625, -0.015692710876464844, -0.014902114868164062, -0.014111518859863281, -0.0133209228515625, -0.012530326843261719, -0.011739730834960938, -0.010949134826660156, -0.010158538818359375, -0.009367942810058594, -0.008577346801757812, -0.007786750793457031, -0.00699615478515625, -0.006205558776855469, -0.0054149627685546875, -0.004624366760253906, -0.003833770751953125, -0.0030431747436523438, -0.0022525787353515625, -0.0014619827270507812, -0.00067138671875, 0.00011920928955078125, 0.0009098052978515625, 0.0017004013061523438, 0.002490997314453125, 0.0032815933227539062, 0.0040721893310546875, 0.004862785339355469, 0.00565338134765625, 0.006443977355957031, 0.0072345733642578125, 0.008025169372558594, 0.008815765380859375, 0.009606361389160156, 0.010396957397460938, 0.011187553405761719, 0.0119781494140625, 0.012768745422363281, 0.013559341430664062, 0.014349937438964844, 0.015140533447265625, 0.015931129455566406, 0.016721725463867188, 0.01751232147216797, 0.01830291748046875, 0.01909351348876953, 0.019884109497070312, 0.020674705505371094, 0.021465301513671875, 0.022255897521972656, 0.023046493530273438, 0.02383708953857422, 0.024627685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 13.0, 8.0, 14.0, 19.0, 25.0, 27.0, 32.0, 34.0, 45.0, 42.0, 59.0, 59.0, 58.0, 63.0, 55.0, 52.0, 55.0, 39.0, 45.0, 49.0, 28.0, 36.0, 21.0, 26.0, 16.0, 15.0, 9.0, 12.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3585026264190674, -2.2884914875030518, -2.218480348587036, -2.1484689712524414, -2.078457832336426, -2.00844669342041, -1.9384355545043945, -1.868424415588379, -1.7984131574630737, -1.728402018547058, -1.658390760421753, -1.5883796215057373, -1.5183684825897217, -1.4483572244644165, -1.3783460855484009, -1.3083348274230957, -1.23832368850708, -1.1683125495910645, -1.0983012914657593, -1.0282901525497437, -0.9582789540290833, -0.8882677555084229, -0.8182566165924072, -0.7482454180717468, -0.6782342195510864, -0.608223021030426, -0.5382118225097656, -0.46820068359375, -0.3981894850730896, -0.3281782865524292, -0.2581671178340912, -0.18815594911575317, -0.11814498901367188, -0.04813380539417267, 0.021877378225326538, 0.09188856184482574, 0.16189974546432495, 0.23191094398498535, 0.30192211270332336, 0.3719332814216614, 0.4419444799423218, 0.5119556784629822, 0.5819668769836426, 0.6519780158996582, 0.7219892144203186, 0.792000412940979, 0.8620115518569946, 0.932022750377655, 1.0020339488983154, 1.072045087814331, 1.1420563459396362, 1.2120674848556519, 1.282078742980957, 1.3520898818969727, 1.4221010208129883, 1.492112159729004, 1.562123417854309, 1.6321345567703247, 1.7021458148956299, 1.7721569538116455, 1.8421680927276611, 1.9121793508529663, 1.982190489768982, 2.052201747894287, 2.1222128868103027]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 2.0, 3.0, 10.0, 10.0, 8.0, 15.0, 13.0, 24.0, 22.0, 19.0, 27.0, 30.0, 30.0, 37.0, 34.0, 26.0, 29.0, 40.0, 41.0, 40.0, 49.0, 34.0, 30.0, 29.0, 49.0, 31.0, 27.0, 31.0, 34.0, 25.0, 27.0, 24.0, 23.0, 17.0, 19.0, 21.0, 14.0, 13.0, 10.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.67923903465271, -1.6262422800064087, -1.573245644569397, -1.5202488899230957, -1.467252254486084, -1.4142554998397827, -1.3612587451934814, -1.3082621097564697, -1.2552653551101685, -1.2022686004638672, -1.1492719650268555, -1.0962752103805542, -1.043278455734253, -0.9902818202972412, -0.9372850656509399, -0.8842883706092834, -0.831291675567627, -0.7782949805259705, -0.725298285484314, -0.6723015308380127, -0.6193048357963562, -0.5663081407546997, -0.5133113861083984, -0.46031469106674194, -0.40731799602508545, -0.35432130098342896, -0.3013245761394501, -0.24832786619663239, -0.1953311562538147, -0.1423344612121582, -0.08933773636817932, -0.03634101152420044, 0.016655802726745605, 0.0696525126695633, 0.12264922261238098, 0.17564593255519867, 0.22864264249801636, 0.28163933753967285, 0.33463606238365173, 0.3876327872276306, 0.4406294822692871, 0.4936261773109436, 0.5466228723526001, 0.5996196269989014, 0.6526163220405579, 0.7056130170822144, 0.7586097717285156, 0.8116064667701721, 0.8646031618118286, 0.9175998568534851, 0.9705965518951416, 1.0235933065414429, 1.0765900611877441, 1.1295866966247559, 1.1825834512710571, 1.2355802059173584, 1.2885768413543701, 1.3415735960006714, 1.394570231437683, 1.4475669860839844, 1.500563621520996, 1.5535603761672974, 1.6065571308135986, 1.6595537662506104, 1.7125505208969116]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 2.0, 9.0, 12.0, 17.0, 34.0, 37.0, 55.0, 61.0, 111.0, 165.0, 216.0, 402.0, 579.0, 929.0, 1552.0, 2720.0, 4814.0, 9587.0, 19446.0, 42033.0, 100158.0, 244254.0, 332824.0, 163915.0, 66006.0, 29008.0, 13564.0, 6841.0, 3757.0, 2129.0, 1218.0, 747.0, 457.0, 315.0, 186.0, 123.0, 70.0, 58.0, 48.0, 35.0, 18.0, 12.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0], "bins": [-3.138671875, -3.0521240234375, -2.965576171875, -2.8790283203125, -2.79248046875, -2.7059326171875, -2.619384765625, -2.5328369140625, -2.4462890625, -2.3597412109375, -2.273193359375, -2.1866455078125, -2.10009765625, -2.0135498046875, -1.927001953125, -1.8404541015625, -1.75390625, -1.6673583984375, -1.580810546875, -1.4942626953125, -1.40771484375, -1.3211669921875, -1.234619140625, -1.1480712890625, -1.0615234375, -0.9749755859375, -0.888427734375, -0.8018798828125, -0.71533203125, -0.6287841796875, -0.542236328125, -0.4556884765625, -0.369140625, -0.2825927734375, -0.196044921875, -0.1094970703125, -0.02294921875, 0.0635986328125, 0.150146484375, 0.2366943359375, 0.3232421875, 0.4097900390625, 0.496337890625, 0.5828857421875, 0.66943359375, 0.7559814453125, 0.842529296875, 0.9290771484375, 1.015625, 1.1021728515625, 1.188720703125, 1.2752685546875, 1.36181640625, 1.4483642578125, 1.534912109375, 1.6214599609375, 1.7080078125, 1.7945556640625, 1.881103515625, 1.9676513671875, 2.05419921875, 2.1407470703125, 2.227294921875, 2.3138427734375, 2.400390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 11.0, 10.0, 11.0, 11.0, 13.0, 8.0, 11.0, 21.0, 25.0, 25.0, 22.0, 23.0, 25.0, 32.0, 39.0, 31.0, 39.0, 31.0, 35.0, 38.0, 37.0, 39.0, 30.0, 27.0, 41.0, 46.0, 31.0, 24.0, 33.0, 21.0, 26.0, 26.0, 24.0, 20.0, 13.0, 20.0, 15.0, 15.0, 9.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.5234375, -2.43603515625, -2.3486328125, -2.26123046875, -2.173828125, -2.08642578125, -1.9990234375, -1.91162109375, -1.82421875, -1.73681640625, -1.6494140625, -1.56201171875, -1.474609375, -1.38720703125, -1.2998046875, -1.21240234375, -1.125, -1.03759765625, -0.9501953125, -0.86279296875, -0.775390625, -0.68798828125, -0.6005859375, -0.51318359375, -0.42578125, -0.33837890625, -0.2509765625, -0.16357421875, -0.076171875, 0.01123046875, 0.0986328125, 0.18603515625, 0.2734375, 0.36083984375, 0.4482421875, 0.53564453125, 0.623046875, 0.71044921875, 0.7978515625, 0.88525390625, 0.97265625, 1.06005859375, 1.1474609375, 1.23486328125, 1.322265625, 1.40966796875, 1.4970703125, 1.58447265625, 1.671875, 1.75927734375, 1.8466796875, 1.93408203125, 2.021484375, 2.10888671875, 2.1962890625, 2.28369140625, 2.37109375, 2.45849609375, 2.5458984375, 2.63330078125, 2.720703125, 2.80810546875, 2.8955078125, 2.98291015625, 3.0703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 5.0, 8.0, 16.0, 24.0, 28.0, 43.0, 73.0, 115.0, 193.0, 324.0, 615.0, 1202.0, 2297.0, 4990.0, 11442.0, 31759.0, 101234.0, 340863.0, 376974.0, 116872.0, 35900.0, 12741.0, 5459.0, 2532.0, 1224.0, 715.0, 353.0, 180.0, 125.0, 85.0, 44.0, 33.0, 29.0, 13.0, 10.0, 6.0, 4.0, 8.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.18359375, -3.07012939453125, -2.9566650390625, -2.84320068359375, -2.729736328125, -2.61627197265625, -2.5028076171875, -2.38934326171875, -2.27587890625, -2.16241455078125, -2.0489501953125, -1.93548583984375, -1.822021484375, -1.70855712890625, -1.5950927734375, -1.48162841796875, -1.3681640625, -1.25469970703125, -1.1412353515625, -1.02777099609375, -0.914306640625, -0.80084228515625, -0.6873779296875, -0.57391357421875, -0.46044921875, -0.34698486328125, -0.2335205078125, -0.12005615234375, -0.006591796875, 0.10687255859375, 0.2203369140625, 0.33380126953125, 0.447265625, 0.56072998046875, 0.6741943359375, 0.78765869140625, 0.901123046875, 1.01458740234375, 1.1280517578125, 1.24151611328125, 1.35498046875, 1.46844482421875, 1.5819091796875, 1.69537353515625, 1.808837890625, 1.92230224609375, 2.0357666015625, 2.14923095703125, 2.2626953125, 2.37615966796875, 2.4896240234375, 2.60308837890625, 2.716552734375, 2.83001708984375, 2.9434814453125, 3.05694580078125, 3.17041015625, 3.28387451171875, 3.3973388671875, 3.51080322265625, 3.624267578125, 3.73773193359375, 3.8511962890625, 3.96466064453125, 4.078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 4.0, 9.0, 11.0, 11.0, 16.0, 12.0, 31.0, 20.0, 22.0, 31.0, 34.0, 45.0, 42.0, 37.0, 43.0, 50.0, 58.0, 44.0, 48.0, 40.0, 34.0, 47.0, 35.0, 40.0, 38.0, 40.0, 32.0, 25.0, 14.0, 19.0, 17.0, 11.0, 11.0, 9.0, 4.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.31121826171875, -4.1654052734375, -4.01959228515625, -3.873779296875, -3.72796630859375, -3.5821533203125, -3.43634033203125, -3.29052734375, -3.14471435546875, -2.9989013671875, -2.85308837890625, -2.707275390625, -2.56146240234375, -2.4156494140625, -2.26983642578125, -2.1240234375, -1.97821044921875, -1.8323974609375, -1.68658447265625, -1.540771484375, -1.39495849609375, -1.2491455078125, -1.10333251953125, -0.95751953125, -0.81170654296875, -0.6658935546875, -0.52008056640625, -0.374267578125, -0.22845458984375, -0.0826416015625, 0.06317138671875, 0.208984375, 0.35479736328125, 0.5006103515625, 0.64642333984375, 0.792236328125, 0.93804931640625, 1.0838623046875, 1.22967529296875, 1.37548828125, 1.52130126953125, 1.6671142578125, 1.81292724609375, 1.958740234375, 2.10455322265625, 2.2503662109375, 2.39617919921875, 2.5419921875, 2.68780517578125, 2.8336181640625, 2.97943115234375, 3.125244140625, 3.27105712890625, 3.4168701171875, 3.56268310546875, 3.70849609375, 3.85430908203125, 4.0001220703125, 4.14593505859375, 4.291748046875, 4.43756103515625, 4.5833740234375, 4.72918701171875, 4.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 11.0, 20.0, 19.0, 30.0, 43.0, 54.0, 71.0, 98.0, 134.0, 222.0, 258.0, 411.0, 569.0, 840.0, 1145.0, 1691.0, 2642.0, 4356.0, 7719.0, 14437.0, 29521.0, 65183.0, 141733.0, 284105.0, 251499.0, 126315.0, 57719.0, 25984.0, 12973.0, 6875.0, 4069.0, 2411.0, 1662.0, 1139.0, 722.0, 535.0, 377.0, 267.0, 180.0, 123.0, 101.0, 69.0, 61.0, 42.0, 27.0, 31.0, 13.0, 11.0, 8.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0], "bins": [-0.7421875, -0.7196426391601562, -0.6970977783203125, -0.6745529174804688, -0.652008056640625, -0.6294631958007812, -0.6069183349609375, -0.5843734741210938, -0.56182861328125, -0.5392837524414062, -0.5167388916015625, -0.49419403076171875, -0.471649169921875, -0.44910430908203125, -0.4265594482421875, -0.40401458740234375, -0.3814697265625, -0.35892486572265625, -0.3363800048828125, -0.31383514404296875, -0.291290283203125, -0.26874542236328125, -0.2462005615234375, -0.22365570068359375, -0.20111083984375, -0.17856597900390625, -0.1560211181640625, -0.13347625732421875, -0.110931396484375, -0.08838653564453125, -0.0658416748046875, -0.04329681396484375, -0.020751953125, 0.00179290771484375, 0.0243377685546875, 0.04688262939453125, 0.069427490234375, 0.09197235107421875, 0.1145172119140625, 0.13706207275390625, 0.15960693359375, 0.18215179443359375, 0.2046966552734375, 0.22724151611328125, 0.249786376953125, 0.27233123779296875, 0.2948760986328125, 0.31742095947265625, 0.3399658203125, 0.36251068115234375, 0.3850555419921875, 0.40760040283203125, 0.430145263671875, 0.45269012451171875, 0.4752349853515625, 0.49777984619140625, 0.52032470703125, 0.5428695678710938, 0.5654144287109375, 0.5879592895507812, 0.610504150390625, 0.6330490112304688, 0.6555938720703125, 0.6781387329101562, 0.70068359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 7.0, 12.0, 17.0, 25.0, 31.0, 40.0, 42.0, 57.0, 73.0, 83.0, 120.0, 112.0, 79.0, 67.0, 46.0, 56.0, 36.0, 26.0, 12.0, 14.0, 11.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023639202117919922, -0.00022897683084011078, -0.00022156164050102234, -0.0002141464501619339, -0.00020673125982284546, -0.00019931606948375702, -0.00019190087914466858, -0.00018448568880558014, -0.0001770704984664917, -0.00016965530812740326, -0.00016224011778831482, -0.00015482492744922638, -0.00014740973711013794, -0.0001399945467710495, -0.00013257935643196106, -0.00012516416609287262, -0.00011774897575378418, -0.00011033378541469574, -0.0001029185950756073, -9.550340473651886e-05, -8.808821439743042e-05, -8.067302405834198e-05, -7.325783371925354e-05, -6.58426433801651e-05, -5.842745304107666e-05, -5.101226270198822e-05, -4.359707236289978e-05, -3.618188202381134e-05, -2.87666916847229e-05, -2.135150134563446e-05, -1.393631100654602e-05, -6.5211206674575806e-06, 8.940696716308594e-07, 8.3092600107193e-06, 1.572445034980774e-05, 2.313964068889618e-05, 3.055483102798462e-05, 3.797002136707306e-05, 4.53852117061615e-05, 5.280040204524994e-05, 6.021559238433838e-05, 6.763078272342682e-05, 7.504597306251526e-05, 8.24611634016037e-05, 8.987635374069214e-05, 9.729154407978058e-05, 0.00010470673441886902, 0.00011212192475795746, 0.0001195371150970459, 0.00012695230543613434, 0.00013436749577522278, 0.00014178268611431122, 0.00014919787645339966, 0.0001566130667924881, 0.00016402825713157654, 0.00017144344747066498, 0.00017885863780975342, 0.00018627382814884186, 0.0001936890184879303, 0.00020110420882701874, 0.00020851939916610718, 0.00021593458950519562, 0.00022334977984428406, 0.0002307649701833725, 0.00023818016052246094]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 11.0, 6.0, 9.0, 18.0, 15.0, 22.0, 41.0, 65.0, 79.0, 107.0, 164.0, 204.0, 349.0, 462.0, 737.0, 1044.0, 1648.0, 2764.0, 4693.0, 8605.0, 17008.0, 37690.0, 89439.0, 203768.0, 343782.0, 185863.0, 80162.0, 34389.0, 15734.0, 7995.0, 4347.0, 2616.0, 1523.0, 1058.0, 693.0, 450.0, 306.0, 217.0, 139.0, 94.0, 74.0, 46.0, 41.0, 26.0, 16.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.8212890625, -0.795166015625, -0.76904296875, -0.742919921875, -0.716796875, -0.690673828125, -0.66455078125, -0.638427734375, -0.6123046875, -0.586181640625, -0.56005859375, -0.533935546875, -0.5078125, -0.481689453125, -0.45556640625, -0.429443359375, -0.4033203125, -0.377197265625, -0.35107421875, -0.324951171875, -0.298828125, -0.272705078125, -0.24658203125, -0.220458984375, -0.1943359375, -0.168212890625, -0.14208984375, -0.115966796875, -0.08984375, -0.063720703125, -0.03759765625, -0.011474609375, 0.0146484375, 0.040771484375, 0.06689453125, 0.093017578125, 0.119140625, 0.145263671875, 0.17138671875, 0.197509765625, 0.2236328125, 0.249755859375, 0.27587890625, 0.302001953125, 0.328125, 0.354248046875, 0.38037109375, 0.406494140625, 0.4326171875, 0.458740234375, 0.48486328125, 0.510986328125, 0.537109375, 0.563232421875, 0.58935546875, 0.615478515625, 0.6416015625, 0.667724609375, 0.69384765625, 0.719970703125, 0.74609375, 0.772216796875, 0.79833984375, 0.824462890625, 0.8505859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 7.0, 16.0, 13.0, 19.0, 24.0, 38.0, 53.0, 66.0, 64.0, 84.0, 129.0, 125.0, 78.0, 64.0, 56.0, 37.0, 35.0, 23.0, 23.0, 9.0, 3.0, 6.0, 6.0, 3.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892578125, -0.8669586181640625, -0.841339111328125, -0.8157196044921875, -0.79010009765625, -0.7644805908203125, -0.738861083984375, -0.7132415771484375, -0.6876220703125, -0.6620025634765625, -0.636383056640625, -0.6107635498046875, -0.58514404296875, -0.5595245361328125, -0.533905029296875, -0.5082855224609375, -0.482666015625, -0.4570465087890625, -0.431427001953125, -0.4058074951171875, -0.38018798828125, -0.3545684814453125, -0.328948974609375, -0.3033294677734375, -0.2777099609375, -0.2520904541015625, -0.226470947265625, -0.2008514404296875, -0.17523193359375, -0.1496124267578125, -0.123992919921875, -0.0983734130859375, -0.07275390625, -0.0471343994140625, -0.021514892578125, 0.0041046142578125, 0.02972412109375, 0.0553436279296875, 0.080963134765625, 0.1065826416015625, 0.1322021484375, 0.1578216552734375, 0.183441162109375, 0.2090606689453125, 0.23468017578125, 0.2602996826171875, 0.285919189453125, 0.3115386962890625, 0.337158203125, 0.3627777099609375, 0.388397216796875, 0.4140167236328125, 0.43963623046875, 0.4652557373046875, 0.490875244140625, 0.5164947509765625, 0.5421142578125, 0.5677337646484375, 0.593353271484375, 0.6189727783203125, 0.64459228515625, 0.6702117919921875, 0.695831298828125, 0.7214508056640625, 0.7470703125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 14.0, 42.0, 94.0, 217.0, 271.0, 198.0, 104.0, 43.0, 12.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.770950317382812, -16.055702209472656, -15.340453147888184, -14.625204086303711, -13.909955978393555, -13.194706916809082, -12.47945785522461, -11.764209747314453, -11.04896068572998, -10.333711624145508, -9.618463516235352, -8.903214454650879, -8.187965393066406, -7.47271728515625, -6.757468223571777, -6.042219638824463, -5.326971054077148, -4.611722469329834, -3.8964736461639404, -3.181224822998047, -2.4659762382507324, -1.750727653503418, -1.0354785919189453, -0.32023000717163086, 0.3950185775756836, 1.1102672815322876, 1.8255159854888916, 2.540764808654785, 3.2560133934020996, 3.971261978149414, 4.686511039733887, 5.401759624481201, 6.117010116577148, 6.832258701324463, 7.547507286071777, 8.26275634765625, 8.978004455566406, 9.693253517150879, 10.408502578735352, 11.123750686645508, 11.83899974822998, 12.554248809814453, 13.26949691772461, 13.984745979309082, 14.699995040893555, 15.415243148803711, 16.1304931640625, 16.845741271972656, 17.560989379882812, 18.27623748779297, 18.991487503051758, 19.706735610961914, 20.42198371887207, 21.13723373413086, 21.852481842041016, 22.567729949951172, 23.282978057861328, 23.998226165771484, 24.713476181030273, 25.42872428894043, 26.143972396850586, 26.859222412109375, 27.57447052001953, 28.289718627929688, 29.004968643188477]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 8.0, 11.0, 8.0, 15.0, 12.0, 19.0, 15.0, 23.0, 25.0, 25.0, 30.0, 33.0, 31.0, 36.0, 33.0, 40.0, 37.0, 39.0, 42.0, 46.0, 43.0, 40.0, 39.0, 47.0, 31.0, 34.0, 30.0, 32.0, 25.0, 19.0, 19.0, 19.0, 12.0, 17.0, 11.0, 9.0, 8.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-8.28282356262207, -8.050165176391602, -7.817506313323975, -7.584847927093506, -7.352189064025879, -7.11953067779541, -6.886872291564941, -6.6542134284973145, -6.421555042266846, -6.188896656036377, -5.95623779296875, -5.723579406738281, -5.490920543670654, -5.2582621574401855, -5.025603294372559, -4.79294490814209, -4.560286521911621, -4.327628135681152, -4.094969272613525, -3.8623108863830566, -3.629652261734009, -3.396993637084961, -3.164335012435913, -2.9316763877868652, -2.6990175247192383, -2.4663589000701904, -2.2337002754211426, -2.001041889190674, -1.768383264541626, -1.5357246398925781, -1.3030660152435303, -1.070407509803772, -0.8377490043640137, -0.6050904393196106, -0.37243184447288513, -0.13977324962615967, 0.09288531541824341, 0.3255438804626465, 0.5582025051116943, 0.7908610105514526, 1.0235196352005005, 1.2561782598495483, 1.4888367652893066, 1.7214953899383545, 1.9541540145874023, 2.186812400817871, 2.419471263885498, 2.652129650115967, 2.8847882747650146, 3.1174468994140625, 3.3501055240631104, 3.582764148712158, 3.815422534942627, 4.048081398010254, 4.280739784240723, 4.513398170471191, 4.746057033538818, 4.978715419769287, 5.211374282836914, 5.444032669067383, 5.67669153213501, 5.9093499183654785, 6.1420087814331055, 6.374667167663574, 6.607325553894043]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 12.0, 10.0, 15.0, 15.0, 30.0, 29.0, 52.0, 73.0, 90.0, 144.0, 159.0, 249.0, 317.0, 473.0, 632.0, 899.0, 1230.0, 1648.0, 2235.0, 1030823.0, 3464.0, 2135.0, 1506.0, 1209.0, 846.0, 610.0, 479.0, 347.0, 227.0, 158.0, 128.0, 89.0, 64.0, 54.0, 35.0, 18.0, 33.0, 12.0, 12.0, 10.0, 5.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.166447639465332, -8.896451950073242, -8.626456260681152, -8.356460571289062, -8.086464881896973, -7.816469669342041, -7.546473979949951, -7.276478290557861, -7.00648307800293, -6.73648738861084, -6.46649169921875, -6.19649600982666, -5.9265007972717285, -5.656505107879639, -5.386509418487549, -5.116513729095459, -4.846518039703369, -4.576522350311279, -4.3065266609191895, -4.036531448364258, -3.766535758972168, -3.496540069580078, -3.2265443801879883, -2.9565486907958984, -2.6865532398223877, -2.416557550430298, -2.146562099456787, -1.8765664100646973, -1.606570839881897, -1.3365752696990967, -1.0665795803070068, -0.7965840101242065, -0.5265884399414062, -0.25659283995628357, 0.013402760028839111, 0.2833983898162842, 0.5533939599990845, 0.8233895301818848, 1.0933852195739746, 1.363380789756775, 1.6333763599395752, 1.9033719301223755, 2.173367500305176, 2.4433631896972656, 2.7133588790893555, 2.983354330062866, 3.253350019454956, 3.523345470428467, 3.7933411598205566, 4.0633368492126465, 4.333332538604736, 4.603327751159668, 4.873323440551758, 5.143319129943848, 5.4133148193359375, 5.683310508728027, 5.953306198120117, 6.223301887512207, 6.493297576904297, 6.763293266296387, 7.033288478851318, 7.303284168243408, 7.573279857635498, 7.843275547027588, 8.11327075958252]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 14.0, 21.0, 86.0, 64.0, 133.0, 300.0, 804.0, 2497.0, 10279.0, 224059.0, 51215700.0, 12807.0, 3330.0, 1001.0, 409.0, 151.0, 88.0, 45.0, 28.0, 17.0, 12.0, 6.0, 7.0, 8.0, 3.0, 2.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.785619735717773, -23.931493759155273, -23.07736587524414, -22.22323989868164, -21.36911392211914, -20.51498794555664, -19.660860061645508, -18.806734085083008, -17.952608108520508, -17.098482131958008, -16.244354248046875, -15.390228271484375, -14.536102294921875, -13.681975364685059, -12.827848434448242, -11.973722457885742, -11.119595527648926, -10.26546859741211, -9.41134262084961, -8.557215690612793, -7.703089714050293, -6.848962783813477, -5.994836330413818, -5.14070987701416, -4.286583423614502, -3.4324569702148438, -2.5783305168151855, -1.7242038249969482, -0.87007737159729, -0.015950679779052734, 0.8381757736206055, 1.6923022270202637, 2.546428680419922, 3.40055513381958, 4.254681587219238, 5.108808517456055, 5.962934494018555, 6.817061424255371, 7.671187877655029, 8.525314331054688, 9.379440307617188, 10.233567237854004, 11.087693214416504, 11.94182014465332, 12.79594612121582, 13.650073051452637, 14.504199981689453, 15.358325958251953, 16.212451934814453, 17.066577911376953, 17.920705795288086, 18.774831771850586, 19.628957748413086, 20.48308563232422, 21.33721160888672, 22.19133758544922, 23.04546546936035, 23.89959144592285, 24.753719329833984, 25.607845306396484, 26.461971282958984, 27.316097259521484, 28.170225143432617, 29.024351119995117, 29.878477096557617]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 8.0, 13.0, 15.0, 21.0, 29.0, 68.0, 74.0, 150.0, 166.0, 295.0, 500.0, 969.0, 1867.0, 4031.0, 9573.0, 26090.0, 76583.0, 237604.0, 672986.0, 4260742.0, 655291.0, 228803.0, 73978.0, 24699.0, 9151.0, 3686.0, 1699.0, 889.0, 529.0, 295.0, 188.0, 128.0, 99.0, 59.0, 45.0, 31.0, 26.0, 14.0, 17.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4130859375, -0.39858245849609375, -0.3840789794921875, -0.36957550048828125, -0.355072021484375, -0.34056854248046875, -0.3260650634765625, -0.31156158447265625, -0.29705810546875, -0.28255462646484375, -0.2680511474609375, -0.25354766845703125, -0.239044189453125, -0.22454071044921875, -0.2100372314453125, -0.19553375244140625, -0.1810302734375, -0.16652679443359375, -0.1520233154296875, -0.13751983642578125, -0.123016357421875, -0.10851287841796875, -0.0940093994140625, -0.07950592041015625, -0.06500244140625, -0.05049896240234375, -0.0359954833984375, -0.02149200439453125, -0.006988525390625, 0.00751495361328125, 0.0220184326171875, 0.03652191162109375, 0.051025390625, 0.06552886962890625, 0.0800323486328125, 0.09453582763671875, 0.109039306640625, 0.12354278564453125, 0.1380462646484375, 0.15254974365234375, 0.16705322265625, 0.18155670166015625, 0.1960601806640625, 0.21056365966796875, 0.225067138671875, 0.23957061767578125, 0.2540740966796875, 0.26857757568359375, 0.2830810546875, 0.29758453369140625, 0.3120880126953125, 0.32659149169921875, 0.341094970703125, 0.35559844970703125, 0.3701019287109375, 0.38460540771484375, 0.39910888671875, 0.41361236572265625, 0.4281158447265625, 0.44261932373046875, 0.457122802734375, 0.47162628173828125, 0.4861297607421875, 0.5006332397460938, 0.51513671875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 11.0, 10.0, 10.0, 18.0, 18.0, 13.0, 26.0, 21.0, 27.0, 22.0, 32.0, 32.0, 38.0, 36.0, 56.0, 42.0, 39.0, 51.0, 1074.0, 57.0, 33.0, 37.0, 43.0, 24.0, 34.0, 32.0, 25.0, 27.0, 21.0, 17.0, 23.0, 26.0, 11.0, 6.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-18.1875, -17.687255859375, -17.18701171875, -16.686767578125, -16.1865234375, -15.686279296875, -15.18603515625, -14.685791015625, -14.185546875, -13.685302734375, -13.18505859375, -12.684814453125, -12.1845703125, -11.684326171875, -11.18408203125, -10.683837890625, -10.18359375, -9.683349609375, -9.18310546875, -8.682861328125, -8.1826171875, -7.682373046875, -7.18212890625, -6.681884765625, -6.181640625, -5.681396484375, -5.18115234375, -4.680908203125, -4.1806640625, -3.680419921875, -3.18017578125, -2.679931640625, -2.1796875, -1.679443359375, -1.17919921875, -0.678955078125, -0.1787109375, 0.321533203125, 0.82177734375, 1.322021484375, 1.822265625, 2.322509765625, 2.82275390625, 3.322998046875, 3.8232421875, 4.323486328125, 4.82373046875, 5.323974609375, 5.82421875, 6.324462890625, 6.82470703125, 7.324951171875, 7.8251953125, 8.325439453125, 8.82568359375, 9.325927734375, 9.826171875, 10.326416015625, 10.82666015625, 11.326904296875, 11.8271484375, 12.327392578125, 12.82763671875, 13.327880859375, 13.828125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 10.0, 19.0, 15.0, 21.0, 35.0, 66.0, 78.0, 82.0, 92.0, 136.0, 159.0, 220.0, 245.0, 351.0, 553.0, 843.0, 1379.0, 2619.0, 6557.0, 22832.0, 106593.0, 541091.0, 4575349.0, 808669.0, 170840.0, 34903.0, 9305.0, 3392.0, 1621.0, 950.0, 626.0, 471.0, 321.0, 240.0, 182.0, 128.0, 93.0, 77.0, 64.0, 35.0, 43.0, 21.0, 18.0, 18.0, 25.0, 20.0, 12.0, 10.0, 3.0, 2.0, 2.0], "bins": [-0.5146484375, -0.5002098083496094, -0.48577117919921875, -0.4713325500488281, -0.4568939208984375, -0.4424552917480469, -0.42801666259765625, -0.4135780334472656, -0.399139404296875, -0.3847007751464844, -0.37026214599609375, -0.3558235168457031, -0.3413848876953125, -0.3269462585449219, -0.31250762939453125, -0.2980690002441406, -0.28363037109375, -0.2691917419433594, -0.25475311279296875, -0.24031448364257812, -0.2258758544921875, -0.21143722534179688, -0.19699859619140625, -0.18255996704101562, -0.168121337890625, -0.15368270874023438, -0.13924407958984375, -0.12480545043945312, -0.1103668212890625, -0.09592819213867188, -0.08148956298828125, -0.06705093383789062, -0.0526123046875, -0.038173675537109375, -0.02373504638671875, -0.009296417236328125, 0.0051422119140625, 0.019580841064453125, 0.03401947021484375, 0.048458099365234375, 0.062896728515625, 0.07733535766601562, 0.09177398681640625, 0.10621261596679688, 0.1206512451171875, 0.13508987426757812, 0.14952850341796875, 0.16396713256835938, 0.17840576171875, 0.19284439086914062, 0.20728302001953125, 0.22172164916992188, 0.2361602783203125, 0.2505989074707031, 0.26503753662109375, 0.2794761657714844, 0.293914794921875, 0.3083534240722656, 0.32279205322265625, 0.3372306823730469, 0.3516693115234375, 0.3661079406738281, 0.38054656982421875, 0.3949851989746094, 0.409423828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 5.0, 6.0, 5.0, 9.0, 7.0, 14.0, 19.0, 20.0, 25.0, 23.0, 37.0, 40.0, 38.0, 26.0, 63.0, 33.0, 44.0, 214.0, 910.0, 53.0, 53.0, 43.0, 42.0, 42.0, 35.0, 23.0, 40.0, 27.0, 31.0, 21.0, 19.0, 14.0, 10.0, 13.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.3203125, -13.8997802734375, -13.479248046875, -13.0587158203125, -12.63818359375, -12.2176513671875, -11.797119140625, -11.3765869140625, -10.9560546875, -10.5355224609375, -10.114990234375, -9.6944580078125, -9.27392578125, -8.8533935546875, -8.432861328125, -8.0123291015625, -7.591796875, -7.1712646484375, -6.750732421875, -6.3302001953125, -5.90966796875, -5.4891357421875, -5.068603515625, -4.6480712890625, -4.2275390625, -3.8070068359375, -3.386474609375, -2.9659423828125, -2.54541015625, -2.1248779296875, -1.704345703125, -1.2838134765625, -0.86328125, -0.4427490234375, -0.022216796875, 0.3983154296875, 0.81884765625, 1.2393798828125, 1.659912109375, 2.0804443359375, 2.5009765625, 2.9215087890625, 3.342041015625, 3.7625732421875, 4.18310546875, 4.6036376953125, 5.024169921875, 5.4447021484375, 5.865234375, 6.2857666015625, 6.706298828125, 7.1268310546875, 7.54736328125, 7.9678955078125, 8.388427734375, 8.8089599609375, 9.2294921875, 9.6500244140625, 10.070556640625, 10.4910888671875, 10.91162109375, 11.3321533203125, 11.752685546875, 12.1732177734375, 12.59375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 11.0, 14.0, 22.0, 30.0, 54.0, 66.0, 88.0, 149.0, 278.0, 431.0, 674.0, 1081.0, 1804.0, 3381.0, 10017.0, 109520.0, 6032581.0, 112775.0, 10199.0, 3601.0, 1810.0, 1088.0, 568.0, 357.0, 223.0, 173.0, 120.0, 94.0, 54.0, 36.0, 18.0, 21.0, 17.0, 15.0, 16.0, 10.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0], "bins": [-1.384765625, -1.3421630859375, -1.299560546875, -1.2569580078125, -1.21435546875, -1.1717529296875, -1.129150390625, -1.0865478515625, -1.0439453125, -1.0013427734375, -0.958740234375, -0.9161376953125, -0.87353515625, -0.8309326171875, -0.788330078125, -0.7457275390625, -0.703125, -0.6605224609375, -0.617919921875, -0.5753173828125, -0.53271484375, -0.4901123046875, -0.447509765625, -0.4049072265625, -0.3623046875, -0.3197021484375, -0.277099609375, -0.2344970703125, -0.19189453125, -0.1492919921875, -0.106689453125, -0.0640869140625, -0.021484375, 0.0211181640625, 0.063720703125, 0.1063232421875, 0.14892578125, 0.1915283203125, 0.234130859375, 0.2767333984375, 0.3193359375, 0.3619384765625, 0.404541015625, 0.4471435546875, 0.48974609375, 0.5323486328125, 0.574951171875, 0.6175537109375, 0.66015625, 0.7027587890625, 0.745361328125, 0.7879638671875, 0.83056640625, 0.8731689453125, 0.915771484375, 0.9583740234375, 1.0009765625, 1.0435791015625, 1.086181640625, 1.1287841796875, 1.17138671875, 1.2139892578125, 1.256591796875, 1.2991943359375, 1.341796875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 11.0, 14.0, 14.0, 15.0, 21.0, 23.0, 34.0, 21.0, 48.0, 38.0, 66.0, 66.0, 78.0, 1101.0, 60.0, 76.0, 60.0, 66.0, 53.0, 42.0, 32.0, 22.0, 13.0, 16.0, 7.0, 2.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7734375, -10.3118896484375, -9.850341796875, -9.3887939453125, -8.92724609375, -8.4656982421875, -8.004150390625, -7.5426025390625, -7.0810546875, -6.6195068359375, -6.157958984375, -5.6964111328125, -5.23486328125, -4.7733154296875, -4.311767578125, -3.8502197265625, -3.388671875, -2.9271240234375, -2.465576171875, -2.0040283203125, -1.54248046875, -1.0809326171875, -0.619384765625, -0.1578369140625, 0.3037109375, 0.7652587890625, 1.226806640625, 1.6883544921875, 2.14990234375, 2.6114501953125, 3.072998046875, 3.5345458984375, 3.99609375, 4.4576416015625, 4.919189453125, 5.3807373046875, 5.84228515625, 6.3038330078125, 6.765380859375, 7.2269287109375, 7.6884765625, 8.1500244140625, 8.611572265625, 9.0731201171875, 9.53466796875, 9.9962158203125, 10.457763671875, 10.9193115234375, 11.380859375, 11.8424072265625, 12.303955078125, 12.7655029296875, 13.22705078125, 13.6885986328125, 14.150146484375, 14.6116943359375, 15.0732421875, 15.5347900390625, 15.996337890625, 16.4578857421875, 16.91943359375, 17.3809814453125, 17.842529296875, 18.3040771484375, 18.765625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 540.0, 453.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.311052322387695, -24.666324615478516, -23.021596908569336, -21.376869201660156, -19.732139587402344, -18.087413787841797, -16.442684173583984, -14.797956466674805, -13.153228759765625, -11.508501052856445, -9.863773345947266, -8.21904468536377, -6.57431697845459, -4.92958927154541, -3.284860610961914, -1.6401329040527344, 0.0045948028564453125, 1.649322748184204, 3.294050693511963, 4.938778877258301, 6.5835065841674805, 8.22823429107666, 9.872962951660156, 11.517690658569336, 13.162418365478516, 14.807146072387695, 16.451873779296875, 18.096603393554688, 19.741329193115234, 21.386058807373047, 23.030786514282227, 24.675514221191406, 26.32024383544922, 27.9649715423584, 29.609699249267578, 31.25442886352539, 32.89915466308594, 34.54388427734375, 36.18861389160156, 37.83333969116211, 39.478065490722656, 41.12279510498047, 42.767520904541016, 44.41225051879883, 46.056976318359375, 47.70170593261719, 49.346435546875, 50.99116134643555, 52.63589096069336, 54.28062057495117, 55.92534637451172, 57.57007598876953, 59.21480178833008, 60.85953140258789, 62.50425720214844, 64.14898681640625, 65.79371643066406, 67.43844604492188, 69.08317565917969, 70.72789764404297, 72.37262725830078, 74.0173568725586, 75.6620864868164, 77.30680847167969, 78.9515380859375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 11.0, 18.0, 46.0, 73.0, 95.0, 154.0, 180.0, 154.0, 128.0, 76.0, 43.0, 16.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.068031311035156, -56.51930236816406, -54.97057342529297, -53.421844482421875, -51.87311553955078, -50.32439041137695, -48.77566146850586, -47.226932525634766, -45.67820358276367, -44.12947463989258, -42.580745697021484, -41.03201675415039, -39.48329162597656, -37.93456268310547, -36.385833740234375, -34.83710479736328, -33.28837585449219, -31.739646911621094, -30.19091796875, -28.64219093322754, -27.093461990356445, -25.54473304748535, -23.99600601196289, -22.447277069091797, -20.898548126220703, -19.34981918334961, -17.801090240478516, -16.252363204956055, -14.703634262084961, -13.154905319213867, -11.60617733001709, -10.057449340820312, -8.508720397949219, -6.959991931915283, -5.411263465881348, -3.862534999847412, -2.3138065338134766, -0.765078067779541, 0.7836503982543945, 2.332378387451172, 3.8811073303222656, 5.429835796356201, 6.978564262390137, 8.527292251586914, 10.076021194458008, 11.624750137329102, 13.173478126525879, 14.722206115722656, 16.27093505859375, 17.819664001464844, 19.368392944335938, 20.9171199798584, 22.465848922729492, 24.014577865600586, 25.563304901123047, 27.11203384399414, 28.660762786865234, 30.209491729736328, 31.758220672607422, 33.306949615478516, 34.855674743652344, 36.40440368652344, 37.95313262939453, 39.501861572265625, 41.05059051513672]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 7.0, 20.0, 47.0, 1433.0, 4399.0, 345409.0, 3827801.0, 9256.0, 3039.0, 1969.0, 854.0, 11.0, 9.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.09004020690917969, -0.08779525756835938, -0.08555030822753906, -0.08330535888671875, -0.08106040954589844, -0.07881546020507812, -0.07657051086425781, -0.0743255615234375, -0.07208061218261719, -0.06983566284179688, -0.06759071350097656, -0.06534576416015625, -0.06310081481933594, -0.060855865478515625, -0.05861091613769531, -0.056365966796875, -0.05412101745605469, -0.051876068115234375, -0.04963111877441406, -0.04738616943359375, -0.04514122009277344, -0.042896270751953125, -0.04065132141113281, -0.0384063720703125, -0.03616142272949219, -0.033916473388671875, -0.03167152404785156, -0.02942657470703125, -0.027181625366210938, -0.024936676025390625, -0.022691726684570312, -0.02044677734375, -0.018201828002929688, -0.015956878662109375, -0.013711929321289062, -0.01146697998046875, -0.009222030639648438, -0.006977081298828125, -0.0047321319580078125, -0.0024871826171875, -0.0002422332763671875, 0.002002716064453125, 0.0042476654052734375, 0.00649261474609375, 0.008737564086914062, 0.010982513427734375, 0.013227462768554688, 0.015472412109375, 0.017717361450195312, 0.019962310791015625, 0.022207260131835938, 0.02445220947265625, 0.026697158813476562, 0.028942108154296875, 0.031187057495117188, 0.0334320068359375, 0.03567695617675781, 0.037921905517578125, 0.04016685485839844, 0.04241180419921875, 0.04465675354003906, 0.046901702880859375, 0.04914665222167969, 0.0513916015625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 27.0, 113.0, 446.0, 276.0, 75.0, 22.0, 13.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055938720703125, -0.054533958435058594, -0.05312919616699219, -0.05172443389892578, -0.050319671630859375, -0.04891490936279297, -0.04751014709472656, -0.046105384826660156, -0.04470062255859375, -0.043295860290527344, -0.04189109802246094, -0.04048633575439453, -0.039081573486328125, -0.03767681121826172, -0.03627204895019531, -0.034867286682128906, -0.0334625244140625, -0.032057762145996094, -0.030652999877929688, -0.02924823760986328, -0.027843475341796875, -0.02643871307373047, -0.025033950805664062, -0.023629188537597656, -0.02222442626953125, -0.020819664001464844, -0.019414901733398438, -0.01801013946533203, -0.016605377197265625, -0.015200614929199219, -0.013795852661132812, -0.012391090393066406, -0.010986328125, -0.009581565856933594, -0.008176803588867188, -0.006772041320800781, -0.005367279052734375, -0.003962516784667969, -0.0025577545166015625, -0.0011529922485351562, 0.00025177001953125, 0.0016565322875976562, 0.0030612945556640625, 0.004466056823730469, 0.005870819091796875, 0.007275581359863281, 0.008680343627929688, 0.010085105895996094, 0.0114898681640625, 0.012894630432128906, 0.014299392700195312, 0.01570415496826172, 0.017108917236328125, 0.01851367950439453, 0.019918441772460938, 0.021323204040527344, 0.02272796630859375, 0.024132728576660156, 0.025537490844726562, 0.02694225311279297, 0.028347015380859375, 0.02975177764892578, 0.031156539916992188, 0.032561302185058594, 0.033966064453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 7.0, 7.0, 10.0, 17.0, 14.0, 32.0, 51.0, 66.0, 139.0, 258.0, 918.0, 4127527.0, 64063.0, 624.0, 244.0, 112.0, 57.0, 34.0, 25.0, 18.0, 12.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057830810546875, -0.05559682846069336, -0.05336284637451172, -0.05112886428833008, -0.04889488220214844, -0.0466609001159668, -0.044426918029785156, -0.042192935943603516, -0.039958953857421875, -0.037724971771240234, -0.035490989685058594, -0.03325700759887695, -0.031023025512695312, -0.028789043426513672, -0.02655506134033203, -0.02432107925415039, -0.02208709716796875, -0.01985311508178711, -0.01761913299560547, -0.015385150909423828, -0.013151168823242188, -0.010917186737060547, -0.008683204650878906, -0.006449222564697266, -0.004215240478515625, -0.0019812583923339844, 0.00025272369384765625, 0.002486705780029297, 0.0047206878662109375, 0.006954669952392578, 0.009188652038574219, 0.01142263412475586, 0.0136566162109375, 0.01589059829711914, 0.01812458038330078, 0.020358562469482422, 0.022592544555664062, 0.024826526641845703, 0.027060508728027344, 0.029294490814208984, 0.031528472900390625, 0.033762454986572266, 0.035996437072753906, 0.03823041915893555, 0.04046440124511719, 0.04269838333129883, 0.04493236541748047, 0.04716634750366211, 0.04940032958984375, 0.05163431167602539, 0.05386829376220703, 0.05610227584838867, 0.05833625793457031, 0.06057024002075195, 0.0628042221069336, 0.06503820419311523, 0.06727218627929688, 0.06950616836547852, 0.07174015045166016, 0.0739741325378418, 0.07620811462402344, 0.07844209671020508, 0.08067607879638672, 0.08291006088256836, 0.08514404296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 2.0, 11.0, 3.0, 8.0, 9.0, 16.0, 16.0, 22.0, 46.0, 62.0, 96.0, 209.0, 431.0, 912.0, 1157.0, 495.0, 253.0, 132.0, 62.0, 40.0, 24.0, 20.0, 12.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0124053955078125, -0.011930465698242188, -0.011455535888671875, -0.010980606079101562, -0.01050567626953125, -0.010030746459960938, -0.009555816650390625, -0.009080886840820312, -0.00860595703125, -0.008131027221679688, -0.007656097412109375, -0.0071811676025390625, -0.00670623779296875, -0.0062313079833984375, -0.005756378173828125, -0.0052814483642578125, -0.0048065185546875, -0.0043315887451171875, -0.003856658935546875, -0.0033817291259765625, -0.00290679931640625, -0.0024318695068359375, -0.001956939697265625, -0.0014820098876953125, -0.001007080078125, -0.0005321502685546875, -5.7220458984375e-05, 0.0004177093505859375, 0.00089263916015625, 0.0013675689697265625, 0.001842498779296875, 0.0023174285888671875, 0.0027923583984375, 0.0032672882080078125, 0.003742218017578125, 0.0042171478271484375, 0.00469207763671875, 0.0051670074462890625, 0.005641937255859375, 0.0061168670654296875, 0.006591796875, 0.0070667266845703125, 0.007541656494140625, 0.008016586303710938, 0.00849151611328125, 0.008966445922851562, 0.009441375732421875, 0.009916305541992188, 0.0103912353515625, 0.010866165161132812, 0.011341094970703125, 0.011816024780273438, 0.01229095458984375, 0.012765884399414062, 0.013240814208984375, 0.013715744018554688, 0.014190673828125, 0.014665603637695312, 0.015140533447265625, 0.015615463256835938, 0.01609039306640625, 0.016565322875976562, 0.017040252685546875, 0.017515182495117188, 0.0179901123046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 80.0, 937.0, 0.0, 0.0, 1.0], "bins": [-0.5009832382202148, -0.49267318844795227, -0.4843631088733673, -0.47605305910110474, -0.4677429795265198, -0.4594329297542572, -0.45112287998199463, -0.44281280040740967, -0.4345027506351471, -0.4261927008628845, -0.41788262128829956, -0.409572571516037, -0.4012625217437744, -0.39295244216918945, -0.3846423923969269, -0.3763323128223419, -0.36802226305007935, -0.3597122132778168, -0.3514021337032318, -0.34309208393096924, -0.3347820043563843, -0.3264719545841217, -0.31816190481185913, -0.30985182523727417, -0.3015417754650116, -0.293231725692749, -0.28492164611816406, -0.2766115963459015, -0.2683015465736389, -0.25999146699905396, -0.2516814172267914, -0.24337135255336761, -0.23506127297878265, -0.2267512083053589, -0.2184411585330963, -0.21013109385967255, -0.20182102918624878, -0.193510964512825, -0.18520089983940125, -0.17689085006713867, -0.1685807853937149, -0.16027072072029114, -0.15196067094802856, -0.1436506062746048, -0.13534054160118103, -0.12703047692775726, -0.11872041970491409, -0.11041036248207092, -0.10210029780864716, -0.09379023313522339, -0.08548017591238022, -0.07717011868953705, -0.06886005401611328, -0.06054999306797981, -0.052239932119846344, -0.043929871171712875, -0.03561981022357941, -0.027309749275445938, -0.01899968832731247, -0.010689627379179, -0.0023795664310455322, 0.005930494517087936, 0.014240555465221405, 0.022550616413354874, 0.030860677361488342]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 5.0, 15.0, 9.0, 11.0, 17.0, 21.0, 26.0, 37.0, 27.0, 22.0, 38.0, 39.0, 40.0, 45.0, 51.0, 52.0, 50.0, 42.0, 38.0, 43.0, 51.0, 35.0, 31.0, 35.0, 16.0, 33.0, 30.0, 21.0, 26.0, 8.0, 14.0, 8.0, 12.0, 8.0, 7.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03019261360168457, -0.029178205877542496, -0.028163796290755272, -0.027149386703968048, -0.026134978979825974, -0.0251205712556839, -0.024106161668896675, -0.02309175208210945, -0.022077344357967377, -0.021062936633825302, -0.02004852704703808, -0.019034117460250854, -0.01801970973610878, -0.017005302011966705, -0.01599089242517948, -0.014976483769714832, -0.013962075114250183, -0.012947666458785534, -0.011933257803320885, -0.010918849147856236, -0.009904440492391586, -0.008890031836926937, -0.007875623181462288, -0.006861214525997639, -0.0058468058705329895, -0.00483239721506834, -0.003817988559603691, -0.002803579904139042, -0.0017891712486743927, -0.0007747625932097435, 0.0002396460622549057, 0.001254054717719555, 0.002268463373184204, 0.0032828720286488533, 0.0042972806841135025, 0.005311689339578152, 0.006326097995042801, 0.00734050665050745, 0.0083549153059721, 0.009369323961436749, 0.010383732616901398, 0.011398141272366047, 0.012412549927830696, 0.013426958583295345, 0.014441367238759995, 0.015455775894224644, 0.016470184549689293, 0.017484594136476517, 0.01849900186061859, 0.019513409584760666, 0.02052781917154789, 0.021542228758335114, 0.022556636482477188, 0.023571044206619263, 0.024585453793406487, 0.02559986338019371, 0.026614271104335785, 0.02762867882847786, 0.028643088415265083, 0.029657498002052307, 0.03067190572619438, 0.031686313450336456, 0.03270072489976883, 0.033715132623910904, 0.03472954034805298]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 11.0, 12.0, 11.0, 14.0, 25.0, 38.0, 42.0, 71.0, 106.0, 149.0, 299.0, 655.0, 2004.0, 16734.0, 1011405.0, 13657.0, 1846.0, 612.0, 305.0, 177.0, 120.0, 65.0, 41.0, 24.0, 32.0, 17.0, 13.0, 12.0, 6.0, 12.0, 7.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.37890625, -2.318634033203125, -2.25836181640625, -2.198089599609375, -2.1378173828125, -2.077545166015625, -2.01727294921875, -1.957000732421875, -1.896728515625, -1.836456298828125, -1.77618408203125, -1.715911865234375, -1.6556396484375, -1.595367431640625, -1.53509521484375, -1.474822998046875, -1.41455078125, -1.354278564453125, -1.29400634765625, -1.233734130859375, -1.1734619140625, -1.113189697265625, -1.05291748046875, -0.992645263671875, -0.932373046875, -0.872100830078125, -0.81182861328125, -0.751556396484375, -0.6912841796875, -0.631011962890625, -0.57073974609375, -0.510467529296875, -0.4501953125, -0.389923095703125, -0.32965087890625, -0.269378662109375, -0.2091064453125, -0.148834228515625, -0.08856201171875, -0.028289794921875, 0.031982421875, 0.092254638671875, 0.15252685546875, 0.212799072265625, 0.2730712890625, 0.333343505859375, 0.39361572265625, 0.453887939453125, 0.51416015625, 0.574432373046875, 0.63470458984375, 0.694976806640625, 0.7552490234375, 0.815521240234375, 0.87579345703125, 0.936065673828125, 0.996337890625, 1.056610107421875, 1.11688232421875, 1.177154541015625, 1.2374267578125, 1.297698974609375, 1.35797119140625, 1.418243408203125, 1.478515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 13.0, 44.0, 151.0, 476.0, 212.0, 62.0, 18.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05645751953125, -0.05503225326538086, -0.05360698699951172, -0.05218172073364258, -0.05075645446777344, -0.0493311882019043, -0.047905921936035156, -0.046480655670166016, -0.045055389404296875, -0.043630123138427734, -0.042204856872558594, -0.04077959060668945, -0.03935432434082031, -0.03792905807495117, -0.03650379180908203, -0.03507852554321289, -0.03365325927734375, -0.03222799301147461, -0.03080272674560547, -0.029377460479736328, -0.027952194213867188, -0.026526927947998047, -0.025101661682128906, -0.023676395416259766, -0.022251129150390625, -0.020825862884521484, -0.019400596618652344, -0.017975330352783203, -0.016550064086914062, -0.015124797821044922, -0.013699531555175781, -0.01227426528930664, -0.0108489990234375, -0.00942373275756836, -0.007998466491699219, -0.006573200225830078, -0.0051479339599609375, -0.003722667694091797, -0.0022974014282226562, -0.0008721351623535156, 0.000553131103515625, 0.0019783973693847656, 0.0034036636352539062, 0.004828929901123047, 0.0062541961669921875, 0.007679462432861328, 0.009104728698730469, 0.01052999496459961, 0.01195526123046875, 0.01338052749633789, 0.014805793762207031, 0.016231060028076172, 0.017656326293945312, 0.019081592559814453, 0.020506858825683594, 0.021932125091552734, 0.023357391357421875, 0.024782657623291016, 0.026207923889160156, 0.027633190155029297, 0.029058456420898438, 0.030483722686767578, 0.03190898895263672, 0.03333425521850586, 0.034759521484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 13.0, 12.0, 21.0, 32.0, 49.0, 37.0, 81.0, 103.0, 228.0, 364.0, 659.0, 1214.0, 2395.0, 4874.0, 10190.0, 23529.0, 62400.0, 237999.0, 506739.0, 125926.0, 40439.0, 16294.0, 7399.0, 3555.0, 1704.0, 974.0, 524.0, 268.0, 191.0, 107.0, 62.0, 37.0, 36.0, 16.0, 21.0, 9.0, 10.0, 12.0, 3.0, 5.0, 4.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04282093048095703, -0.04145240783691406, -0.040083885192871094, -0.038715362548828125, -0.037346839904785156, -0.03597831726074219, -0.03460979461669922, -0.03324127197265625, -0.03187274932861328, -0.030504226684570312, -0.029135704040527344, -0.027767181396484375, -0.026398658752441406, -0.025030136108398438, -0.02366161346435547, -0.0222930908203125, -0.02092456817626953, -0.019556045532226562, -0.018187522888183594, -0.016819000244140625, -0.015450477600097656, -0.014081954956054688, -0.012713432312011719, -0.01134490966796875, -0.009976387023925781, -0.008607864379882812, -0.007239341735839844, -0.005870819091796875, -0.004502296447753906, -0.0031337738037109375, -0.0017652511596679688, -0.000396728515625, 0.0009717941284179688, 0.0023403167724609375, 0.0037088394165039062, 0.005077362060546875, 0.006445884704589844, 0.007814407348632812, 0.009182929992675781, 0.01055145263671875, 0.011919975280761719, 0.013288497924804688, 0.014657020568847656, 0.016025543212890625, 0.017394065856933594, 0.018762588500976562, 0.02013111114501953, 0.0214996337890625, 0.02286815643310547, 0.024236679077148438, 0.025605201721191406, 0.026973724365234375, 0.028342247009277344, 0.029710769653320312, 0.03107929229736328, 0.03244781494140625, 0.03381633758544922, 0.03518486022949219, 0.036553382873535156, 0.037921905517578125, 0.039290428161621094, 0.04065895080566406, 0.04202747344970703, 0.04339599609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 8.0, 20.0, 16.0, 24.0, 18.0, 25.0, 28.0, 27.0, 27.0, 36.0, 38.0, 31.0, 40.0, 44.0, 41.0, 39.0, 40.0, 39.0, 34.0, 34.0, 42.0, 42.0, 40.0, 33.0, 28.0, 32.0, 27.0, 12.0, 20.0, 17.0, 15.0, 10.0, 7.0, 7.0, 10.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.024810791015625, -0.024040937423706055, -0.02327108383178711, -0.022501230239868164, -0.02173137664794922, -0.020961523056030273, -0.020191669464111328, -0.019421815872192383, -0.018651962280273438, -0.017882108688354492, -0.017112255096435547, -0.0163424015045166, -0.015572547912597656, -0.014802694320678711, -0.014032840728759766, -0.01326298713684082, -0.012493133544921875, -0.01172327995300293, -0.010953426361083984, -0.010183572769165039, -0.009413719177246094, -0.008643865585327148, -0.007874011993408203, -0.007104158401489258, -0.0063343048095703125, -0.005564451217651367, -0.004794597625732422, -0.0040247440338134766, -0.0032548904418945312, -0.002485036849975586, -0.0017151832580566406, -0.0009453296661376953, -0.00017547607421875, 0.0005943775177001953, 0.0013642311096191406, 0.002134084701538086, 0.0029039382934570312, 0.0036737918853759766, 0.004443645477294922, 0.005213499069213867, 0.0059833526611328125, 0.006753206253051758, 0.007523059844970703, 0.008292913436889648, 0.009062767028808594, 0.009832620620727539, 0.010602474212646484, 0.01137232780456543, 0.012142181396484375, 0.01291203498840332, 0.013681888580322266, 0.014451742172241211, 0.015221595764160156, 0.0159914493560791, 0.016761302947998047, 0.017531156539916992, 0.018301010131835938, 0.019070863723754883, 0.019840717315673828, 0.020610570907592773, 0.02138042449951172, 0.022150278091430664, 0.02292013168334961, 0.023689985275268555, 0.0244598388671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 15.0, 11.0, 20.0, 40.0, 72.0, 132.0, 425.0, 1853.0, 17263.0, 960829.0, 63085.0, 3724.0, 683.0, 197.0, 89.0, 37.0, 33.0, 14.0, 10.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09763336181640625, -0.0952911376953125, -0.09294891357421875, -0.090606689453125, -0.08826446533203125, -0.0859222412109375, -0.08358001708984375, -0.08123779296875, -0.07889556884765625, -0.0765533447265625, -0.07421112060546875, -0.071868896484375, -0.06952667236328125, -0.0671844482421875, -0.06484222412109375, -0.0625, -0.06015777587890625, -0.0578155517578125, -0.05547332763671875, -0.053131103515625, -0.05078887939453125, -0.0484466552734375, -0.04610443115234375, -0.04376220703125, -0.04141998291015625, -0.0390777587890625, -0.03673553466796875, -0.034393310546875, -0.03205108642578125, -0.0297088623046875, -0.02736663818359375, -0.0250244140625, -0.02268218994140625, -0.0203399658203125, -0.01799774169921875, -0.015655517578125, -0.01331329345703125, -0.0109710693359375, -0.00862884521484375, -0.00628662109375, -0.00394439697265625, -0.0016021728515625, 0.00074005126953125, 0.003082275390625, 0.00542449951171875, 0.0077667236328125, 0.01010894775390625, 0.012451171875, 0.01479339599609375, 0.0171356201171875, 0.01947784423828125, 0.021820068359375, 0.02416229248046875, 0.0265045166015625, 0.02884674072265625, 0.03118896484375, 0.03353118896484375, 0.0358734130859375, 0.03821563720703125, 0.040557861328125, 0.04290008544921875, 0.0452423095703125, 0.04758453369140625, 0.0499267578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 4.0, 14.0, 11.0, 14.0, 25.0, 34.0, 52.0, 98.0, 123.0, 151.0, 143.0, 117.0, 77.0, 44.0, 31.0, 20.0, 15.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0001043081283569336, -0.00010197330266237259, -9.963847696781158e-05, -9.730365127325058e-05, -9.496882557868958e-05, -9.263399988412857e-05, -9.029917418956757e-05, -8.796434849500656e-05, -8.562952280044556e-05, -8.329469710588455e-05, -8.095987141132355e-05, -7.862504571676254e-05, -7.629022002220154e-05, -7.395539432764053e-05, -7.162056863307953e-05, -6.928574293851852e-05, -6.695091724395752e-05, -6.461609154939651e-05, -6.228126585483551e-05, -5.9946440160274506e-05, -5.76116144657135e-05, -5.5276788771152496e-05, -5.294196307659149e-05, -5.060713738203049e-05, -4.827231168746948e-05, -4.593748599290848e-05, -4.360266029834747e-05, -4.126783460378647e-05, -3.8933008909225464e-05, -3.659818321466446e-05, -3.4263357520103455e-05, -3.192853182554245e-05, -2.9593706130981445e-05, -2.725888043642044e-05, -2.4924054741859436e-05, -2.258922904729843e-05, -2.0254403352737427e-05, -1.7919577658176422e-05, -1.5584751963615417e-05, -1.3249926269054413e-05, -1.0915100574493408e-05, -8.580274879932404e-06, -6.245449185371399e-06, -3.910623490810394e-06, -1.5757977962493896e-06, 7.59027898311615e-07, 3.0938535928726196e-06, 5.428679287433624e-06, 7.763504981994629e-06, 1.0098330676555634e-05, 1.2433156371116638e-05, 1.4767982065677643e-05, 1.7102807760238647e-05, 1.9437633454799652e-05, 2.1772459149360657e-05, 2.410728484392166e-05, 2.6442110538482666e-05, 2.877693623304367e-05, 3.1111761927604675e-05, 3.344658762216568e-05, 3.5781413316726685e-05, 3.811623901128769e-05, 4.0451064705848694e-05, 4.27858904004097e-05, 4.51207160949707e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 10.0, 30.0, 32.0, 64.0, 103.0, 267.0, 697.0, 2394.0, 18046.0, 970248.0, 50674.0, 4255.0, 1042.0, 334.0, 144.0, 64.0, 49.0, 23.0, 20.0, 13.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.06137847900390625, -0.0586700439453125, -0.05596160888671875, -0.053253173828125, -0.05054473876953125, -0.0478363037109375, -0.04512786865234375, -0.04241943359375, -0.03971099853515625, -0.0370025634765625, -0.03429412841796875, -0.031585693359375, -0.02887725830078125, -0.0261688232421875, -0.02346038818359375, -0.020751953125, -0.01804351806640625, -0.0153350830078125, -0.01262664794921875, -0.009918212890625, -0.00720977783203125, -0.0045013427734375, -0.00179290771484375, 0.00091552734375, 0.00362396240234375, 0.0063323974609375, 0.00904083251953125, 0.011749267578125, 0.01445770263671875, 0.0171661376953125, 0.01987457275390625, 0.0225830078125, 0.02529144287109375, 0.0279998779296875, 0.03070831298828125, 0.033416748046875, 0.03612518310546875, 0.0388336181640625, 0.04154205322265625, 0.04425048828125, 0.04695892333984375, 0.0496673583984375, 0.05237579345703125, 0.055084228515625, 0.05779266357421875, 0.0605010986328125, 0.06320953369140625, 0.06591796875, 0.06862640380859375, 0.0713348388671875, 0.07404327392578125, 0.076751708984375, 0.07946014404296875, 0.0821685791015625, 0.08487701416015625, 0.08758544921875, 0.09029388427734375, 0.0930023193359375, 0.09571075439453125, 0.098419189453125, 0.10112762451171875, 0.1038360595703125, 0.10654449462890625, 0.1092529296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 14.0, 30.0, 32.0, 70.0, 267.0, 322.0, 121.0, 54.0, 34.0, 13.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030670166015625, -0.029346466064453125, -0.02802276611328125, -0.026699066162109375, -0.0253753662109375, -0.024051666259765625, -0.02272796630859375, -0.021404266357421875, -0.02008056640625, -0.018756866455078125, -0.01743316650390625, -0.016109466552734375, -0.0147857666015625, -0.013462066650390625, -0.01213836669921875, -0.010814666748046875, -0.009490966796875, -0.008167266845703125, -0.00684356689453125, -0.005519866943359375, -0.0041961669921875, -0.002872467041015625, -0.00154876708984375, -0.000225067138671875, 0.0010986328125, 0.002422332763671875, 0.00374603271484375, 0.005069732666015625, 0.0063934326171875, 0.007717132568359375, 0.00904083251953125, 0.010364532470703125, 0.011688232421875, 0.013011932373046875, 0.01433563232421875, 0.015659332275390625, 0.0169830322265625, 0.018306732177734375, 0.01963043212890625, 0.020954132080078125, 0.02227783203125, 0.023601531982421875, 0.02492523193359375, 0.026248931884765625, 0.0275726318359375, 0.028896331787109375, 0.03022003173828125, 0.031543731689453125, 0.032867431640625, 0.034191131591796875, 0.03551483154296875, 0.036838531494140625, 0.0381622314453125, 0.039485931396484375, 0.04080963134765625, 0.042133331298828125, 0.04345703125, 0.044780731201171875, 0.04610443115234375, 0.047428131103515625, 0.0487518310546875, 0.050075531005859375, 0.05139923095703125, 0.052722930908203125, 0.054046630859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 86.0, 864.0, 55.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0377006530761719, -0.9648602604866028, -0.8920198678970337, -0.8191795349121094, -0.7463391423225403, -0.6734987497329712, -0.6006584167480469, -0.5278180241584778, -0.4549776315689087, -0.3821372389793396, -0.3092968761920929, -0.236456498503685, -0.1636161208152771, -0.09077572822570801, -0.017935365438461304, 0.0549049973487854, 0.1277453899383545, 0.2005857676267624, 0.2734261453151703, 0.346266508102417, 0.4191069006919861, 0.4919472932815552, 0.5647876262664795, 0.6376280188560486, 0.7104684114456177, 0.7833088040351868, 0.8561491966247559, 0.9289895296096802, 1.0018298625946045, 1.0746703147888184, 1.1475106477737427, 1.220350980758667, 1.2931911945343018, 1.366031527519226, 1.43887197971344, 1.5117123126983643, 1.5845527648925781, 1.6573930978775024, 1.7302334308624268, 1.8030738830566406, 1.875914216041565, 1.9487545490264893, 2.021595001220703, 2.094435453414917, 2.1672756671905518, 2.2401161193847656, 2.3129565715789795, 2.3857967853546143, 2.458637237548828, 2.531477689743042, 2.6043179035186768, 2.6771583557128906, 2.7499988079071045, 2.8228392601013184, 2.895679473876953, 2.968519926071167, 3.041360378265381, 3.1142008304595947, 3.1870410442352295, 3.2598814964294434, 3.3327219486236572, 3.405562400817871, 3.478402614593506, 3.5512430667877197, 3.6240832805633545]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 7.0, 10.0, 10.0, 19.0, 23.0, 43.0, 41.0, 43.0, 72.0, 68.0, 62.0, 63.0, 71.0, 70.0, 69.0, 70.0, 63.0, 40.0, 32.0, 23.0, 33.0, 17.0, 19.0, 10.0, 7.0, 2.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166653394699097, -0.19291836023330688, -0.1841701865196228, -0.17542202770709991, -0.16667385399341583, -0.15792568027973175, -0.14917752146720886, -0.14042934775352478, -0.1316811740398407, -0.12293300032615662, -0.11418483406305313, -0.10543666779994965, -0.09668849408626556, -0.08794032037258148, -0.079192154109478, -0.07044398784637451, -0.06169581413269043, -0.052947644144296646, -0.04419947415590286, -0.03545130416750908, -0.026703134179115295, -0.017954964190721512, -0.009206794202327728, -0.0004586242139339447, 0.008289545774459839, 0.017037715762853622, 0.025785885751247406, 0.03453405573964119, 0.04328222572803497, 0.05203039571642876, 0.06077856570482254, 0.06952673196792603, 0.07827490568161011, 0.08702307939529419, 0.09577124565839767, 0.10451941192150116, 0.11326758563518524, 0.12201575934886932, 0.1307639181613922, 0.1395120918750763, 0.14826026558876038, 0.15700843930244446, 0.16575661301612854, 0.17450477182865143, 0.1832529455423355, 0.1920011192560196, 0.20074927806854248, 0.20949745178222656, 0.21824562549591064, 0.22699379920959473, 0.2357419729232788, 0.2444901317358017, 0.253238320350647, 0.26198646426200867, 0.27073463797569275, 0.27948281168937683, 0.2882309854030609, 0.296979159116745, 0.3057273328304291, 0.31447550654411316, 0.32322365045547485, 0.33197182416915894, 0.340719997882843, 0.3494681715965271, 0.3582163453102112]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 10.0, 7.0, 9.0, 10.0, 19.0, 21.0, 21.0, 35.0, 52.0, 67.0, 80.0, 125.0, 151.0, 314.0, 777.0, 3536.0, 748613.0, 3434289.0, 4643.0, 891.0, 296.0, 130.0, 58.0, 34.0, 22.0, 19.0, 12.0, 12.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251220703125, -0.24443435668945312, -0.23764801025390625, -0.23086166381835938, -0.2240753173828125, -0.21728897094726562, -0.21050262451171875, -0.20371627807617188, -0.196929931640625, -0.19014358520507812, -0.18335723876953125, -0.17657089233398438, -0.1697845458984375, -0.16299819946289062, -0.15621185302734375, -0.14942550659179688, -0.14263916015625, -0.13585281372070312, -0.12906646728515625, -0.12228012084960938, -0.1154937744140625, -0.10870742797851562, -0.10192108154296875, -0.09513473510742188, -0.088348388671875, -0.08156204223632812, -0.07477569580078125, -0.06798934936523438, -0.0612030029296875, -0.054416656494140625, -0.04763031005859375, -0.040843963623046875, -0.0340576171875, -0.027271270751953125, -0.02048492431640625, -0.013698577880859375, -0.0069122314453125, -0.000125885009765625, 0.00666046142578125, 0.013446807861328125, 0.020233154296875, 0.027019500732421875, 0.03380584716796875, 0.040592193603515625, 0.0473785400390625, 0.054164886474609375, 0.06095123291015625, 0.06773757934570312, 0.07452392578125, 0.08131027221679688, 0.08809661865234375, 0.09488296508789062, 0.1016693115234375, 0.10845565795898438, 0.11524200439453125, 0.12202835083007812, 0.128814697265625, 0.13560104370117188, 0.14238739013671875, 0.14917373657226562, 0.1559600830078125, 0.16274642944335938, 0.16953277587890625, 0.17631912231445312, 0.18310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 9.0, 17.0, 65.0, 216.0, 441.0, 180.0, 40.0, 22.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055267333984375, -0.05389833450317383, -0.052529335021972656, -0.051160335540771484, -0.04979133605957031, -0.04842233657836914, -0.04705333709716797, -0.0456843376159668, -0.044315338134765625, -0.04294633865356445, -0.04157733917236328, -0.04020833969116211, -0.03883934020996094, -0.037470340728759766, -0.036101341247558594, -0.03473234176635742, -0.03336334228515625, -0.03199434280395508, -0.030625343322753906, -0.029256343841552734, -0.027887344360351562, -0.02651834487915039, -0.02514934539794922, -0.023780345916748047, -0.022411346435546875, -0.021042346954345703, -0.01967334747314453, -0.01830434799194336, -0.016935348510742188, -0.015566349029541016, -0.014197349548339844, -0.012828350067138672, -0.0114593505859375, -0.010090351104736328, -0.008721351623535156, -0.007352352142333984, -0.0059833526611328125, -0.004614353179931641, -0.0032453536987304688, -0.0018763542175292969, -0.000507354736328125, 0.0008616447448730469, 0.0022306442260742188, 0.0035996437072753906, 0.0049686431884765625, 0.006337642669677734, 0.007706642150878906, 0.009075641632080078, 0.01044464111328125, 0.011813640594482422, 0.013182640075683594, 0.014551639556884766, 0.015920639038085938, 0.01728963851928711, 0.01865863800048828, 0.020027637481689453, 0.021396636962890625, 0.022765636444091797, 0.02413463592529297, 0.02550363540649414, 0.026872634887695312, 0.028241634368896484, 0.029610633850097656, 0.030979633331298828, 0.0323486328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 14.0, 9.0, 22.0, 40.0, 87.0, 145.0, 317.0, 812.0, 3065.0, 25275.0, 3696364.0, 452543.0, 12603.0, 2002.0, 530.0, 213.0, 97.0, 44.0, 26.0, 33.0, 17.0, 5.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06321334838867188, -0.06044769287109375, -0.057682037353515625, -0.0549163818359375, -0.052150726318359375, -0.04938507080078125, -0.046619415283203125, -0.043853759765625, -0.041088104248046875, -0.03832244873046875, -0.035556793212890625, -0.0327911376953125, -0.030025482177734375, -0.02725982666015625, -0.024494171142578125, -0.021728515625, -0.018962860107421875, -0.01619720458984375, -0.013431549072265625, -0.0106658935546875, -0.007900238037109375, -0.00513458251953125, -0.002368927001953125, 0.000396728515625, 0.003162384033203125, 0.00592803955078125, 0.008693695068359375, 0.0114593505859375, 0.014225006103515625, 0.01699066162109375, 0.019756317138671875, 0.02252197265625, 0.025287628173828125, 0.02805328369140625, 0.030818939208984375, 0.0335845947265625, 0.036350250244140625, 0.03911590576171875, 0.041881561279296875, 0.044647216796875, 0.047412872314453125, 0.05017852783203125, 0.052944183349609375, 0.0557098388671875, 0.058475494384765625, 0.06124114990234375, 0.06400680541992188, 0.0667724609375, 0.06953811645507812, 0.07230377197265625, 0.07506942749023438, 0.0778350830078125, 0.08060073852539062, 0.08336639404296875, 0.08613204956054688, 0.088897705078125, 0.09166336059570312, 0.09442901611328125, 0.09719467163085938, 0.0999603271484375, 0.10272598266601562, 0.10549163818359375, 0.10825729370117188, 0.11102294921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 10.0, 15.0, 29.0, 40.0, 83.0, 123.0, 198.0, 393.0, 1300.0, 1106.0, 305.0, 156.0, 96.0, 59.0, 43.0, 30.0, 15.0, 11.0, 14.0, 12.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0193328857421875, -0.018450021743774414, -0.017567157745361328, -0.016684293746948242, -0.015801429748535156, -0.01491856575012207, -0.014035701751708984, -0.013152837753295898, -0.012269973754882812, -0.011387109756469727, -0.01050424575805664, -0.009621381759643555, -0.008738517761230469, -0.007855653762817383, -0.006972789764404297, -0.006089925765991211, -0.005207061767578125, -0.004324197769165039, -0.003441333770751953, -0.002558469772338867, -0.0016756057739257812, -0.0007927417755126953, 9.012222290039062e-05, 0.0009729862213134766, 0.0018558502197265625, 0.0027387142181396484, 0.0036215782165527344, 0.00450444221496582, 0.005387306213378906, 0.006270170211791992, 0.007153034210205078, 0.008035898208618164, 0.00891876220703125, 0.009801626205444336, 0.010684490203857422, 0.011567354202270508, 0.012450218200683594, 0.01333308219909668, 0.014215946197509766, 0.015098810195922852, 0.015981674194335938, 0.016864538192749023, 0.01774740219116211, 0.018630266189575195, 0.01951313018798828, 0.020395994186401367, 0.021278858184814453, 0.02216172218322754, 0.023044586181640625, 0.02392745018005371, 0.024810314178466797, 0.025693178176879883, 0.02657604217529297, 0.027458906173706055, 0.02834177017211914, 0.029224634170532227, 0.030107498168945312, 0.0309903621673584, 0.031873226165771484, 0.03275609016418457, 0.033638954162597656, 0.03452181816101074, 0.03540468215942383, 0.036287546157836914, 0.03717041015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 26.0, 76.0, 327.0, 401.0, 122.0, 28.0, 16.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2483457326889038, -0.24064253270626068, -0.23293931782245636, -0.22523611783981323, -0.2175329029560089, -0.20982970297336578, -0.20212650299072266, -0.19442328810691833, -0.186720073223114, -0.1790168732404709, -0.17131365835666656, -0.16361045837402344, -0.15590724349021912, -0.148204043507576, -0.14050084352493286, -0.13279762864112854, -0.1250944286584854, -0.11739122122526169, -0.10968801379203796, -0.10198481380939484, -0.09428159892559052, -0.08657839894294739, -0.07887519150972366, -0.07117198407649994, -0.06346877664327621, -0.05576556921005249, -0.048062361776828766, -0.04035915806889534, -0.032655950635671616, -0.02495274320244789, -0.017249539494514465, -0.009546332061290741, -0.0018431097269058228, 0.005860096774995327, 0.013563303276896477, 0.021266508847475052, 0.028969716280698776, 0.0366729237139225, 0.044376127421855927, 0.05207933485507965, 0.059782542288303375, 0.0674857497215271, 0.07518895715475082, 0.08289216458797455, 0.09059536457061768, 0.098298579454422, 0.10600177943706512, 0.11370498687028885, 0.12140819430351257, 0.1291113942861557, 0.13681460916996002, 0.14451780915260315, 0.15222102403640747, 0.1599242240190506, 0.16762742400169373, 0.17533063888549805, 0.18303385376930237, 0.1907370537519455, 0.19844026863574982, 0.20614346861839294, 0.21384668350219727, 0.2215498834848404, 0.22925308346748352, 0.23695629835128784, 0.24465949833393097]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 13.0, 11.0, 9.0, 9.0, 12.0, 21.0, 22.0, 26.0, 30.0, 26.0, 29.0, 35.0, 27.0, 41.0, 25.0, 50.0, 46.0, 43.0, 37.0, 45.0, 42.0, 39.0, 26.0, 42.0, 37.0, 29.0, 26.0, 27.0, 29.0, 26.0, 22.0, 11.0, 14.0, 13.0, 9.0, 6.0, 12.0, 9.0, 7.0, 4.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.05230659246444702, -0.0504167377948761, -0.048526886850595474, -0.04663703590631485, -0.04474718123674393, -0.042857326567173004, -0.04096747562289238, -0.039077624678611755, -0.03718777000904083, -0.03529791533946991, -0.033408064395189285, -0.03151821345090866, -0.029628358781337738, -0.027738505974411964, -0.02584865316748619, -0.023958800360560417, -0.022068947553634644, -0.02017909474670887, -0.018289241939783096, -0.016399389132857323, -0.014509536325931549, -0.012619683519005775, -0.010729830712080002, -0.008839977905154228, -0.006950125098228455, -0.005060272291302681, -0.0031704194843769073, -0.0012805666774511337, 0.0006092861294746399, 0.0024991389364004135, 0.004388991743326187, 0.006278844550251961, 0.008168697357177734, 0.010058550164103508, 0.011948402971029282, 0.013838255777955055, 0.01572810858488083, 0.017617961391806602, 0.019507814198732376, 0.02139766700565815, 0.023287519812583923, 0.025177372619509697, 0.02706722542643547, 0.028957078233361244, 0.030846931040287018, 0.03273678570985794, 0.034626636654138565, 0.03651648759841919, 0.03840634226799011, 0.040296196937561035, 0.04218604788184166, 0.044075898826122284, 0.04596575349569321, 0.04785560816526413, 0.049745459109544754, 0.05163531005382538, 0.0535251647233963, 0.055415019392967224, 0.05730487033724785, 0.05919472128152847, 0.061084575951099396, 0.06297443062067032, 0.06486427783966064, 0.06675413250923157, 0.06864398717880249]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 5.0, 14.0, 16.0, 12.0, 14.0, 19.0, 34.0, 43.0, 55.0, 106.0, 149.0, 218.0, 332.0, 595.0, 1216.0, 4222.0, 67831.0, 945992.0, 22560.0, 2719.0, 915.0, 487.0, 330.0, 207.0, 127.0, 75.0, 60.0, 47.0, 28.0, 31.0, 22.0, 19.0, 17.0, 3.0, 10.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1507568359375, -0.14609718322753906, -0.14143753051757812, -0.1367778778076172, -0.13211822509765625, -0.1274585723876953, -0.12279891967773438, -0.11813926696777344, -0.1134796142578125, -0.10881996154785156, -0.10416030883789062, -0.09950065612792969, -0.09484100341796875, -0.09018135070800781, -0.08552169799804688, -0.08086204528808594, -0.076202392578125, -0.07154273986816406, -0.06688308715820312, -0.06222343444824219, -0.05756378173828125, -0.05290412902832031, -0.048244476318359375, -0.04358482360839844, -0.0389251708984375, -0.03426551818847656, -0.029605865478515625, -0.024946212768554688, -0.02028656005859375, -0.015626907348632812, -0.010967254638671875, -0.0063076019287109375, -0.00164794921875, 0.0030117034912109375, 0.007671356201171875, 0.012331008911132812, 0.01699066162109375, 0.021650314331054688, 0.026309967041015625, 0.030969619750976562, 0.0356292724609375, 0.04028892517089844, 0.044948577880859375, 0.04960823059082031, 0.05426788330078125, 0.05892753601074219, 0.06358718872070312, 0.06824684143066406, 0.072906494140625, 0.07756614685058594, 0.08222579956054688, 0.08688545227050781, 0.09154510498046875, 0.09620475769042969, 0.10086441040039062, 0.10552406311035156, 0.1101837158203125, 0.11484336853027344, 0.11950302124023438, 0.12416267395019531, 0.12882232666015625, 0.1334819793701172, 0.13814163208007812, 0.14280128479003906, 0.1474609375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 37.0, 143.0, 377.0, 298.0, 84.0, 29.0, 10.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052703857421875, -0.0513463020324707, -0.049988746643066406, -0.04863119125366211, -0.04727363586425781, -0.045916080474853516, -0.04455852508544922, -0.04320096969604492, -0.041843414306640625, -0.04048585891723633, -0.03912830352783203, -0.037770748138427734, -0.03641319274902344, -0.03505563735961914, -0.033698081970214844, -0.03234052658081055, -0.03098297119140625, -0.029625415802001953, -0.028267860412597656, -0.02691030502319336, -0.025552749633789062, -0.024195194244384766, -0.02283763885498047, -0.021480083465576172, -0.020122528076171875, -0.018764972686767578, -0.01740741729736328, -0.016049861907958984, -0.014692306518554688, -0.01333475112915039, -0.011977195739746094, -0.010619640350341797, -0.0092620849609375, -0.007904529571533203, -0.006546974182128906, -0.005189418792724609, -0.0038318634033203125, -0.0024743080139160156, -0.0011167526245117188, 0.00024080276489257812, 0.001598358154296875, 0.002955913543701172, 0.004313468933105469, 0.005671024322509766, 0.0070285797119140625, 0.00838613510131836, 0.009743690490722656, 0.011101245880126953, 0.01245880126953125, 0.013816356658935547, 0.015173912048339844, 0.01653146743774414, 0.017889022827148438, 0.019246578216552734, 0.02060413360595703, 0.021961688995361328, 0.023319244384765625, 0.024676799774169922, 0.02603435516357422, 0.027391910552978516, 0.028749465942382812, 0.03010702133178711, 0.031464576721191406, 0.0328221321105957, 0.0341796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 7.0, 3.0, 4.0, 6.0, 5.0, 13.0, 16.0, 18.0, 28.0, 26.0, 27.0, 34.0, 46.0, 62.0, 100.0, 146.0, 267.0, 661.0, 5728.0, 544978.0, 489430.0, 5559.0, 660.0, 237.0, 126.0, 81.0, 64.0, 54.0, 32.0, 29.0, 21.0, 22.0, 15.0, 13.0, 15.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.12929153442382812, -0.12467193603515625, -0.12005233764648438, -0.1154327392578125, -0.11081314086914062, -0.10619354248046875, -0.10157394409179688, -0.096954345703125, -0.09233474731445312, -0.08771514892578125, -0.08309555053710938, -0.0784759521484375, -0.07385635375976562, -0.06923675537109375, -0.06461715698242188, -0.05999755859375, -0.055377960205078125, -0.05075836181640625, -0.046138763427734375, -0.0415191650390625, -0.036899566650390625, -0.03227996826171875, -0.027660369873046875, -0.023040771484375, -0.018421173095703125, -0.01380157470703125, -0.009181976318359375, -0.0045623779296875, 5.7220458984375e-05, 0.00467681884765625, 0.009296417236328125, 0.013916015625, 0.018535614013671875, 0.02315521240234375, 0.027774810791015625, 0.0323944091796875, 0.037014007568359375, 0.04163360595703125, 0.046253204345703125, 0.050872802734375, 0.055492401123046875, 0.06011199951171875, 0.06473159790039062, 0.0693511962890625, 0.07397079467773438, 0.07859039306640625, 0.08320999145507812, 0.08782958984375, 0.09244918823242188, 0.09706878662109375, 0.10168838500976562, 0.1063079833984375, 0.11092758178710938, 0.11554718017578125, 0.12016677856445312, 0.124786376953125, 0.12940597534179688, 0.13402557373046875, 0.13864517211914062, 0.1432647705078125, 0.14788436889648438, 0.15250396728515625, 0.15712356567382812, 0.1617431640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 3.0, 6.0, 14.0, 8.0, 21.0, 24.0, 22.0, 22.0, 22.0, 29.0, 44.0, 40.0, 58.0, 52.0, 60.0, 55.0, 42.0, 55.0, 44.0, 47.0, 32.0, 44.0, 34.0, 34.0, 35.0, 22.0, 23.0, 16.0, 15.0, 20.0, 9.0, 7.0, 14.0, 10.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02252197265625, -0.021746158599853516, -0.02097034454345703, -0.020194530487060547, -0.019418716430664062, -0.018642902374267578, -0.017867088317871094, -0.01709127426147461, -0.016315460205078125, -0.01553964614868164, -0.014763832092285156, -0.013988018035888672, -0.013212203979492188, -0.012436389923095703, -0.011660575866699219, -0.010884761810302734, -0.01010894775390625, -0.009333133697509766, -0.008557319641113281, -0.007781505584716797, -0.0070056915283203125, -0.006229877471923828, -0.005454063415527344, -0.004678249359130859, -0.003902435302734375, -0.0031266212463378906, -0.0023508071899414062, -0.0015749931335449219, -0.0007991790771484375, -2.3365020751953125e-05, 0.0007524490356445312, 0.0015282630920410156, 0.0023040771484375, 0.0030798912048339844, 0.0038557052612304688, 0.004631519317626953, 0.0054073333740234375, 0.006183147430419922, 0.006958961486816406, 0.007734775543212891, 0.008510589599609375, 0.00928640365600586, 0.010062217712402344, 0.010838031768798828, 0.011613845825195312, 0.012389659881591797, 0.013165473937988281, 0.013941287994384766, 0.01471710205078125, 0.015492916107177734, 0.01626873016357422, 0.017044544219970703, 0.017820358276367188, 0.018596172332763672, 0.019371986389160156, 0.02014780044555664, 0.020923614501953125, 0.02169942855834961, 0.022475242614746094, 0.023251056671142578, 0.024026870727539062, 0.024802684783935547, 0.02557849884033203, 0.026354312896728516, 0.027130126953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 3.0, 11.0, 24.0, 39.0, 123.0, 322.0, 1045.0, 4210.0, 150629.0, 884806.0, 5438.0, 1275.0, 367.0, 133.0, 63.0, 22.0, 10.0, 4.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.100830078125, -0.09795570373535156, -0.09508132934570312, -0.09220695495605469, -0.08933258056640625, -0.08645820617675781, -0.08358383178710938, -0.08070945739746094, -0.0778350830078125, -0.07496070861816406, -0.07208633422851562, -0.06921195983886719, -0.06633758544921875, -0.06346321105957031, -0.060588836669921875, -0.05771446228027344, -0.054840087890625, -0.05196571350097656, -0.049091339111328125, -0.04621696472167969, -0.04334259033203125, -0.04046821594238281, -0.037593841552734375, -0.03471946716308594, -0.0318450927734375, -0.028970718383789062, -0.026096343994140625, -0.023221969604492188, -0.02034759521484375, -0.017473220825195312, -0.014598846435546875, -0.011724472045898438, -0.00885009765625, -0.0059757232666015625, -0.003101348876953125, -0.0002269744873046875, 0.00264739990234375, 0.0055217742919921875, 0.008396148681640625, 0.011270523071289062, 0.0141448974609375, 0.017019271850585938, 0.019893646240234375, 0.022768020629882812, 0.02564239501953125, 0.028516769409179688, 0.031391143798828125, 0.03426551818847656, 0.037139892578125, 0.04001426696777344, 0.042888641357421875, 0.04576301574707031, 0.04863739013671875, 0.05151176452636719, 0.054386138916015625, 0.05726051330566406, 0.0601348876953125, 0.06300926208496094, 0.06588363647460938, 0.06875801086425781, 0.07163238525390625, 0.07450675964355469, 0.07738113403320312, 0.08025550842285156, 0.0831298828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 10.0, 9.0, 8.0, 16.0, 25.0, 31.0, 46.0, 79.0, 99.0, 152.0, 130.0, 110.0, 80.0, 41.0, 28.0, 26.0, 17.0, 14.0, 24.0, 11.0, 14.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.922815322875977e-05, -8.591916412115097e-05, -8.261017501354218e-05, -7.930118590593338e-05, -7.599219679832458e-05, -7.268320769071579e-05, -6.9374218583107e-05, -6.60652294754982e-05, -6.27562403678894e-05, -5.944725126028061e-05, -5.6138262152671814e-05, -5.282927304506302e-05, -4.9520283937454224e-05, -4.621129482984543e-05, -4.290230572223663e-05, -3.959331661462784e-05, -3.628432750701904e-05, -3.297533839941025e-05, -2.9666349291801453e-05, -2.6357360184192657e-05, -2.3048371076583862e-05, -1.9739381968975067e-05, -1.6430392861366272e-05, -1.3121403753757477e-05, -9.812414646148682e-06, -6.5034255385398865e-06, -3.1944364309310913e-06, 1.1455267667770386e-07, 3.423541784286499e-06, 6.732530891895294e-06, 1.004151999950409e-05, 1.3350509107112885e-05, 1.665949821472168e-05, 1.9968487322330475e-05, 2.327747642993927e-05, 2.6586465537548065e-05, 2.989545464515686e-05, 3.3204443752765656e-05, 3.651343286037445e-05, 3.9822421967983246e-05, 4.313141107559204e-05, 4.6440400183200836e-05, 4.974938929080963e-05, 5.3058378398418427e-05, 5.636736750602722e-05, 5.967635661363602e-05, 6.298534572124481e-05, 6.629433482885361e-05, 6.96033239364624e-05, 7.29123130440712e-05, 7.622130215167999e-05, 7.953029125928879e-05, 8.283928036689758e-05, 8.614826947450638e-05, 8.945725858211517e-05, 9.276624768972397e-05, 9.607523679733276e-05, 9.938422590494156e-05, 0.00010269321501255035, 0.00010600220412015915, 0.00010931119322776794, 0.00011262018233537674, 0.00011592917144298553, 0.00011923816055059433, 0.00012254714965820312]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 6.0, 9.0, 14.0, 23.0, 29.0, 39.0, 63.0, 107.0, 194.0, 627.0, 3948.0, 363046.0, 674517.0, 4625.0, 727.0, 221.0, 106.0, 71.0, 29.0, 24.0, 24.0, 7.0, 17.0, 6.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.02616095542907715, -0.025344371795654297, -0.024527788162231445, -0.023711204528808594, -0.022894620895385742, -0.02207803726196289, -0.02126145362854004, -0.020444869995117188, -0.019628286361694336, -0.018811702728271484, -0.017995119094848633, -0.01717853546142578, -0.01636195182800293, -0.015545368194580078, -0.014728784561157227, -0.013912200927734375, -0.013095617294311523, -0.012279033660888672, -0.01146245002746582, -0.010645866394042969, -0.009829282760620117, -0.009012699127197266, -0.008196115493774414, -0.0073795318603515625, -0.006562948226928711, -0.005746364593505859, -0.004929780960083008, -0.004113197326660156, -0.0032966136932373047, -0.002480030059814453, -0.0016634464263916016, -0.00084686279296875, -3.0279159545898438e-05, 0.0007863044738769531, 0.0016028881072998047, 0.0024194717407226562, 0.003236055374145508, 0.004052639007568359, 0.004869222640991211, 0.0056858062744140625, 0.006502389907836914, 0.007318973541259766, 0.008135557174682617, 0.008952140808105469, 0.00976872444152832, 0.010585308074951172, 0.011401891708374023, 0.012218475341796875, 0.013035058975219727, 0.013851642608642578, 0.01466822624206543, 0.015484809875488281, 0.016301393508911133, 0.017117977142333984, 0.017934560775756836, 0.018751144409179688, 0.01956772804260254, 0.02038431167602539, 0.021200895309448242, 0.022017478942871094, 0.022834062576293945, 0.023650646209716797, 0.02446722984313965, 0.0252838134765625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 9.0, 5.0, 6.0, 7.0, 9.0, 17.0, 20.0, 31.0, 24.0, 42.0, 51.0, 62.0, 81.0, 103.0, 96.0, 83.0, 82.0, 73.0, 39.0, 40.0, 27.0, 17.0, 6.0, 14.0, 11.0, 4.0, 4.0, 3.0, 7.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003505706787109375, -0.0033894777297973633, -0.0032732486724853516, -0.00315701961517334, -0.003040790557861328, -0.0029245615005493164, -0.0028083324432373047, -0.002692103385925293, -0.0025758743286132812, -0.0024596452713012695, -0.002343416213989258, -0.002227187156677246, -0.0021109580993652344, -0.0019947290420532227, -0.001878499984741211, -0.0017622709274291992, -0.0016460418701171875, -0.0015298128128051758, -0.001413583755493164, -0.0012973546981811523, -0.0011811256408691406, -0.001064896583557129, -0.0009486675262451172, -0.0008324384689331055, -0.0007162094116210938, -0.000599980354309082, -0.0004837512969970703, -0.0003675222396850586, -0.0002512931823730469, -0.00013506412506103516, -1.8835067749023438e-05, 9.739398956298828e-05, 0.000213623046875, 0.0003298521041870117, 0.00044608116149902344, 0.0005623102188110352, 0.0006785392761230469, 0.0007947683334350586, 0.0009109973907470703, 0.001027226448059082, 0.0011434555053710938, 0.0012596845626831055, 0.0013759136199951172, 0.001492142677307129, 0.0016083717346191406, 0.0017246007919311523, 0.001840829849243164, 0.0019570589065551758, 0.0020732879638671875, 0.0021895170211791992, 0.002305746078491211, 0.0024219751358032227, 0.0025382041931152344, 0.002654433250427246, 0.002770662307739258, 0.0028868913650512695, 0.0030031204223632812, 0.003119349479675293, 0.0032355785369873047, 0.0033518075942993164, 0.003468036651611328, 0.00358426570892334, 0.0037004947662353516, 0.0038167238235473633, 0.003932952880859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 12.0, 43.0, 525.0, 409.0, 22.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29551321268081665, -0.26862838864326477, -0.24174357950687408, -0.2148587703704834, -0.18797394633293152, -0.16108912229537964, -0.13420431315898895, -0.10731950402259827, -0.08043467998504639, -0.053549863398075104, -0.02666504681110382, 0.00021976977586746216, 0.027104586362838745, 0.053989410400390625, 0.08087421953678131, 0.107759028673172, 0.13464385271072388, 0.16152867674827576, 0.18841348588466644, 0.21529829502105713, 0.242183119058609, 0.2690679430961609, 0.2959527373313904, 0.32283756136894226, 0.34972238540649414, 0.376607209444046, 0.4034920334815979, 0.4303768277168274, 0.4572616517543793, 0.48414647579193115, 0.5110312700271606, 0.5379160642623901, 0.5648009777069092, 0.5916857719421387, 0.6185706257820129, 0.6454554200172424, 0.6723402738571167, 0.6992250680923462, 0.7261098623275757, 0.7529946565628052, 0.7798795104026794, 0.8067643046379089, 0.8336491584777832, 0.8605339527130127, 0.8874187469482422, 0.9143036007881165, 0.941188395023346, 0.9680732488632202, 0.9949580430984497, 1.0218428373336792, 1.0487276315689087, 1.0756125450134277, 1.1024973392486572, 1.1293821334838867, 1.1562669277191162, 1.1831517219543457, 1.2100365161895752, 1.2369213104248047, 1.2638061046600342, 1.2906910181045532, 1.3175758123397827, 1.3444606065750122, 1.3713454008102417, 1.3982301950454712, 1.4251151084899902]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 15.0, 16.0, 23.0, 44.0, 34.0, 50.0, 57.0, 57.0, 78.0, 86.0, 75.0, 90.0, 85.0, 71.0, 59.0, 40.0, 37.0, 25.0, 17.0, 10.0, 11.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2028101682662964, -0.1975306123495102, -0.192251056432724, -0.1869715005159378, -0.1816919445991516, -0.17641238868236542, -0.17113283276557922, -0.16585326194763184, -0.16057372093200684, -0.15529416501522064, -0.15001460909843445, -0.14473505318164825, -0.13945549726486206, -0.13417594134807587, -0.12889638543128967, -0.12361682206392288, -0.11833725869655609, -0.1130577027797699, -0.1077781468629837, -0.10249859094619751, -0.09721903502941132, -0.09193947911262512, -0.08665991574525833, -0.08138035982847214, -0.07610080391168594, -0.07082124799489975, -0.06554169207811356, -0.060262132436037064, -0.05498257651925087, -0.049703020602464676, -0.044423460960388184, -0.03914390504360199, -0.033864349126815796, -0.028584793210029602, -0.02330523543059826, -0.018025677651166916, -0.012746121734380722, -0.007466565817594528, -0.002187006175518036, 0.003092549741268158, 0.008372105658054352, 0.01365166250616312, 0.01893121935427189, 0.024210777133703232, 0.029490333050489426, 0.03476988896727562, 0.04004944860935211, 0.045329004526138306, 0.0506085604429245, 0.05588811635971069, 0.06116767227649689, 0.06644722819328308, 0.07172678411006927, 0.07700634002685547, 0.08228590339422226, 0.08756545931100845, 0.09284501522779465, 0.09812457114458084, 0.10340412706136703, 0.10868369042873383, 0.11396324634552002, 0.11924280226230621, 0.12452235817909241, 0.1298019140958786, 0.1350814700126648]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 14.0, 25.0, 29.0, 36.0, 116.0, 206.0, 605.0, 2652.0, 2111813.0, 2074611.0, 3279.0, 589.0, 170.0, 53.0, 30.0, 18.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2164306640625, -0.210418701171875, -0.20440673828125, -0.198394775390625, -0.1923828125, -0.186370849609375, -0.18035888671875, -0.174346923828125, -0.1683349609375, -0.162322998046875, -0.15631103515625, -0.150299072265625, -0.144287109375, -0.138275146484375, -0.13226318359375, -0.126251220703125, -0.1202392578125, -0.114227294921875, -0.10821533203125, -0.102203369140625, -0.09619140625, -0.090179443359375, -0.08416748046875, -0.078155517578125, -0.0721435546875, -0.066131591796875, -0.06011962890625, -0.054107666015625, -0.048095703125, -0.042083740234375, -0.03607177734375, -0.030059814453125, -0.0240478515625, -0.018035888671875, -0.01202392578125, -0.006011962890625, 0.0, 0.006011962890625, 0.01202392578125, 0.018035888671875, 0.0240478515625, 0.030059814453125, 0.03607177734375, 0.042083740234375, 0.048095703125, 0.054107666015625, 0.06011962890625, 0.066131591796875, 0.0721435546875, 0.078155517578125, 0.08416748046875, 0.090179443359375, 0.09619140625, 0.102203369140625, 0.10821533203125, 0.114227294921875, 0.1202392578125, 0.126251220703125, 0.13226318359375, 0.138275146484375, 0.144287109375, 0.150299072265625, 0.15631103515625, 0.162322998046875, 0.1683349609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 45.0, 167.0, 397.0, 272.0, 66.0, 24.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0535888671875, -0.05227184295654297, -0.05095481872558594, -0.049637794494628906, -0.048320770263671875, -0.047003746032714844, -0.04568672180175781, -0.04436969757080078, -0.04305267333984375, -0.04173564910888672, -0.04041862487792969, -0.039101600646972656, -0.037784576416015625, -0.036467552185058594, -0.03515052795410156, -0.03383350372314453, -0.0325164794921875, -0.03119945526123047, -0.029882431030273438, -0.028565406799316406, -0.027248382568359375, -0.025931358337402344, -0.024614334106445312, -0.02329730987548828, -0.02198028564453125, -0.02066326141357422, -0.019346237182617188, -0.018029212951660156, -0.016712188720703125, -0.015395164489746094, -0.014078140258789062, -0.012761116027832031, -0.011444091796875, -0.010127067565917969, -0.008810043334960938, -0.007493019104003906, -0.006175994873046875, -0.004858970642089844, -0.0035419464111328125, -0.0022249221801757812, -0.00090789794921875, 0.00040912628173828125, 0.0017261505126953125, 0.0030431747436523438, 0.004360198974609375, 0.005677223205566406, 0.0069942474365234375, 0.008311271667480469, 0.0096282958984375, 0.010945320129394531, 0.012262344360351562, 0.013579368591308594, 0.014896392822265625, 0.016213417053222656, 0.017530441284179688, 0.01884746551513672, 0.02016448974609375, 0.02148151397705078, 0.022798538208007812, 0.024115562438964844, 0.025432586669921875, 0.026749610900878906, 0.028066635131835938, 0.02938365936279297, 0.03070068359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 9.0, 4.0, 20.0, 27.0, 35.0, 47.0, 72.0, 91.0, 139.0, 239.0, 341.0, 544.0, 1068.0, 2332.0, 6330.0, 24218.0, 155054.0, 3080885.0, 834818.0, 66543.0, 13578.0, 4160.0, 1572.0, 779.0, 471.0, 268.0, 181.0, 126.0, 68.0, 53.0, 58.0, 26.0, 20.0, 19.0, 12.0, 13.0, 11.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042694091796875, -0.041351318359375, -0.040008544921875, -0.038665771484375, -0.037322998046875, -0.035980224609375, -0.034637451171875, -0.033294677734375, -0.031951904296875, -0.030609130859375, -0.029266357421875, -0.027923583984375, -0.026580810546875, -0.025238037109375, -0.023895263671875, -0.022552490234375, -0.021209716796875, -0.019866943359375, -0.018524169921875, -0.017181396484375, -0.015838623046875, -0.014495849609375, -0.013153076171875, -0.011810302734375, -0.010467529296875, -0.009124755859375, -0.007781982421875, -0.006439208984375, -0.005096435546875, -0.003753662109375, -0.002410888671875, -0.001068115234375, 0.000274658203125, 0.001617431640625, 0.002960205078125, 0.004302978515625, 0.005645751953125, 0.006988525390625, 0.008331298828125, 0.009674072265625, 0.011016845703125, 0.012359619140625, 0.013702392578125, 0.015045166015625, 0.016387939453125, 0.017730712890625, 0.019073486328125, 0.020416259765625, 0.021759033203125, 0.023101806640625, 0.024444580078125, 0.025787353515625, 0.027130126953125, 0.028472900390625, 0.029815673828125, 0.031158447265625, 0.032501220703125, 0.033843994140625, 0.035186767578125, 0.036529541015625, 0.037872314453125, 0.039215087890625, 0.040557861328125, 0.041900634765625, 0.043243408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 6.0, 9.0, 18.0, 19.0, 25.0, 43.0, 38.0, 63.0, 76.0, 95.0, 132.0, 161.0, 262.0, 394.0, 603.0, 547.0, 411.0, 285.0, 230.0, 166.0, 110.0, 77.0, 73.0, 45.0, 35.0, 29.0, 27.0, 19.0, 11.0, 11.0, 8.0, 5.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155029296875, -0.014983654022216797, -0.014464378356933594, -0.01394510269165039, -0.013425827026367188, -0.012906551361083984, -0.012387275695800781, -0.011868000030517578, -0.011348724365234375, -0.010829448699951172, -0.010310173034667969, -0.009790897369384766, -0.009271621704101562, -0.00875234603881836, -0.008233070373535156, -0.007713794708251953, -0.00719451904296875, -0.006675243377685547, -0.006155967712402344, -0.005636692047119141, -0.0051174163818359375, -0.004598140716552734, -0.004078865051269531, -0.003559589385986328, -0.003040313720703125, -0.002521038055419922, -0.0020017623901367188, -0.0014824867248535156, -0.0009632110595703125, -0.0004439353942871094, 7.534027099609375e-05, 0.0005946159362792969, 0.0011138916015625, 0.0016331672668457031, 0.0021524429321289062, 0.0026717185974121094, 0.0031909942626953125, 0.0037102699279785156, 0.004229545593261719, 0.004748821258544922, 0.005268096923828125, 0.005787372589111328, 0.006306648254394531, 0.006825923919677734, 0.0073451995849609375, 0.00786447525024414, 0.008383750915527344, 0.008903026580810547, 0.00942230224609375, 0.009941577911376953, 0.010460853576660156, 0.01098012924194336, 0.011499404907226562, 0.012018680572509766, 0.012537956237792969, 0.013057231903076172, 0.013576507568359375, 0.014095783233642578, 0.014615058898925781, 0.015134334564208984, 0.015653610229492188, 0.01617288589477539, 0.016692161560058594, 0.017211437225341797, 0.017730712890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 19.0, 86.0, 368.0, 396.0, 103.0, 22.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23356427252292633, -0.22385922074317932, -0.21415415406227112, -0.20444908738136292, -0.1947440356016159, -0.1850389838218689, -0.1753339171409607, -0.1656288504600525, -0.15592379868030548, -0.14621874690055847, -0.13651368021965027, -0.12680861353874207, -0.11710356175899506, -0.10739850252866745, -0.09769344329833984, -0.08798838406801224, -0.07828332483768463, -0.06857826560735703, -0.05887320637702942, -0.04916814714670181, -0.03946308791637421, -0.0297580286860466, -0.020052969455718994, -0.010347910225391388, -0.0006428509950637817, 0.009062208235263824, 0.01876726746559143, 0.028472326695919037, 0.03817738592624664, 0.04788244515657425, 0.057587504386901855, 0.06729256361722946, 0.07699760794639587, 0.08670266717672348, 0.09640772640705109, 0.10611278563737869, 0.1158178448677063, 0.1255229115486145, 0.1352279633283615, 0.14493301510810852, 0.15463808178901672, 0.16434314846992493, 0.17404820024967194, 0.18375325202941895, 0.19345831871032715, 0.20316338539123535, 0.21286843717098236, 0.22257348895072937, 0.23227855563163757, 0.24198362231254578, 0.2516886591911316, 0.2613937258720398, 0.271098792552948, 0.2808038592338562, 0.2905089259147644, 0.3002139627933502, 0.3099190294742584, 0.3196240961551666, 0.32932913303375244, 0.33903419971466064, 0.34873926639556885, 0.35844433307647705, 0.36814939975738525, 0.37785443663597107, 0.3875595033168793]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 12.0, 11.0, 15.0, 22.0, 30.0, 35.0, 37.0, 38.0, 46.0, 58.0, 57.0, 57.0, 47.0, 67.0, 56.0, 52.0, 65.0, 41.0, 50.0, 53.0, 31.0, 28.0, 20.0, 22.0, 15.0, 16.0, 4.0, 2.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07740026712417603, -0.0749441385269165, -0.07248801738023758, -0.07003188878297806, -0.06757576763629913, -0.06511963903903961, -0.06266351044178009, -0.06020738556981087, -0.057751260697841644, -0.05529513582587242, -0.0528390109539032, -0.05038288235664368, -0.047926757484674454, -0.04547063261270523, -0.04301450401544571, -0.040558379143476486, -0.03810225427150726, -0.03564612939953804, -0.03319000452756882, -0.030733875930309296, -0.028277751058340073, -0.02582162618637085, -0.023365499451756477, -0.020909372717142105, -0.018453247845172882, -0.01599712297320366, -0.013540996238589287, -0.01108487043529749, -0.008628744632005692, -0.006172618828713894, -0.0037164930254220963, -0.001260366290807724, 0.001195758581161499, 0.0036518843844532967, 0.006108010187745094, 0.008564135991036892, 0.01102026179432869, 0.013476387597620487, 0.015932513400912285, 0.018388640135526657, 0.02084476500749588, 0.023300889879465103, 0.025757016614079475, 0.028213143348693848, 0.03066926822066307, 0.033125393092632294, 0.035581521689891815, 0.03803764656186104, 0.04049377143383026, 0.042949896305799484, 0.04540602117776871, 0.04786214977502823, 0.05031827464699745, 0.052774399518966675, 0.055230528116226196, 0.05768665298819542, 0.06014277786016464, 0.06259890645742416, 0.06505502760410309, 0.06751115620136261, 0.06996728479862213, 0.07242340594530106, 0.07487953454256058, 0.0773356556892395, 0.07979178428649902]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 7.0, 9.0, 9.0, 12.0, 19.0, 17.0, 20.0, 53.0, 62.0, 99.0, 136.0, 200.0, 382.0, 743.0, 2337.0, 29112.0, 995030.0, 16753.0, 1931.0, 664.0, 323.0, 215.0, 129.0, 78.0, 59.0, 41.0, 24.0, 28.0, 10.0, 9.0, 17.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.27001953125, -0.26194190979003906, -0.2538642883300781, -0.2457866668701172, -0.23770904541015625, -0.2296314239501953, -0.22155380249023438, -0.21347618103027344, -0.2053985595703125, -0.19732093811035156, -0.18924331665039062, -0.1811656951904297, -0.17308807373046875, -0.1650104522705078, -0.15693283081054688, -0.14885520935058594, -0.140777587890625, -0.13269996643066406, -0.12462234497070312, -0.11654472351074219, -0.10846710205078125, -0.10038948059082031, -0.09231185913085938, -0.08423423767089844, -0.0761566162109375, -0.06807899475097656, -0.060001373291015625, -0.05192375183105469, -0.04384613037109375, -0.03576850891113281, -0.027690887451171875, -0.019613265991210938, -0.01153564453125, -0.0034580230712890625, 0.004619598388671875, 0.012697219848632812, 0.02077484130859375, 0.028852462768554688, 0.036930084228515625, 0.04500770568847656, 0.0530853271484375, 0.06116294860839844, 0.06924057006835938, 0.07731819152832031, 0.08539581298828125, 0.09347343444824219, 0.10155105590820312, 0.10962867736816406, 0.117706298828125, 0.12578392028808594, 0.13386154174804688, 0.1419391632080078, 0.15001678466796875, 0.1580944061279297, 0.16617202758789062, 0.17424964904785156, 0.1823272705078125, 0.19040489196777344, 0.19848251342773438, 0.2065601348876953, 0.21463775634765625, 0.2227153778076172, 0.23079299926757812, 0.23887062072753906, 0.2469482421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 12.0, 45.0, 175.0, 366.0, 281.0, 72.0, 30.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050262451171875, -0.048996925354003906, -0.04773139953613281, -0.04646587371826172, -0.045200347900390625, -0.04393482208251953, -0.04266929626464844, -0.041403770446777344, -0.04013824462890625, -0.038872718811035156, -0.03760719299316406, -0.03634166717529297, -0.035076141357421875, -0.03381061553955078, -0.03254508972167969, -0.031279563903808594, -0.0300140380859375, -0.028748512268066406, -0.027482986450195312, -0.02621746063232422, -0.024951934814453125, -0.02368640899658203, -0.022420883178710938, -0.021155357360839844, -0.01988983154296875, -0.018624305725097656, -0.017358779907226562, -0.01609325408935547, -0.014827728271484375, -0.013562202453613281, -0.012296676635742188, -0.011031150817871094, -0.009765625, -0.008500099182128906, -0.0072345733642578125, -0.005969047546386719, -0.004703521728515625, -0.0034379959106445312, -0.0021724700927734375, -0.0009069442749023438, 0.00035858154296875, 0.0016241073608398438, 0.0028896331787109375, 0.004155158996582031, 0.005420684814453125, 0.006686210632324219, 0.007951736450195312, 0.009217262268066406, 0.0104827880859375, 0.011748313903808594, 0.013013839721679688, 0.014279365539550781, 0.015544891357421875, 0.01681041717529297, 0.018075942993164062, 0.019341468811035156, 0.02060699462890625, 0.021872520446777344, 0.023138046264648438, 0.02440357208251953, 0.025669097900390625, 0.02693462371826172, 0.028200149536132812, 0.029465675354003906, 0.030731201171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 5.0, 8.0, 8.0, 11.0, 25.0, 29.0, 37.0, 40.0, 75.0, 114.0, 129.0, 182.0, 306.0, 501.0, 1147.0, 3392.0, 14397.0, 149991.0, 795646.0, 68644.0, 9185.0, 2468.0, 867.0, 461.0, 260.0, 163.0, 100.0, 113.0, 72.0, 41.0, 35.0, 17.0, 22.0, 10.0, 4.0, 11.0, 6.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.1151123046875, -0.11185741424560547, -0.10860252380371094, -0.1053476333618164, -0.10209274291992188, -0.09883785247802734, -0.09558296203613281, -0.09232807159423828, -0.08907318115234375, -0.08581829071044922, -0.08256340026855469, -0.07930850982666016, -0.07605361938476562, -0.0727987289428711, -0.06954383850097656, -0.06628894805908203, -0.0630340576171875, -0.05977916717529297, -0.05652427673339844, -0.053269386291503906, -0.050014495849609375, -0.046759605407714844, -0.04350471496582031, -0.04024982452392578, -0.03699493408203125, -0.03374004364013672, -0.030485153198242188, -0.027230262756347656, -0.023975372314453125, -0.020720481872558594, -0.017465591430664062, -0.014210700988769531, -0.010955810546875, -0.007700920104980469, -0.0044460296630859375, -0.0011911392211914062, 0.002063751220703125, 0.005318641662597656, 0.008573532104492188, 0.011828422546386719, 0.01508331298828125, 0.01833820343017578, 0.021593093872070312, 0.024847984313964844, 0.028102874755859375, 0.031357765197753906, 0.03461265563964844, 0.03786754608154297, 0.0411224365234375, 0.04437732696533203, 0.04763221740722656, 0.050887107849121094, 0.054141998291015625, 0.057396888732910156, 0.06065177917480469, 0.06390666961669922, 0.06716156005859375, 0.07041645050048828, 0.07367134094238281, 0.07692623138427734, 0.08018112182617188, 0.0834360122680664, 0.08669090270996094, 0.08994579315185547, 0.09320068359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 14.0, 17.0, 17.0, 16.0, 19.0, 19.0, 35.0, 45.0, 63.0, 55.0, 55.0, 71.0, 61.0, 78.0, 64.0, 50.0, 50.0, 41.0, 47.0, 33.0, 23.0, 23.0, 18.0, 21.0, 12.0, 13.0, 10.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0284423828125, -0.027483463287353516, -0.02652454376220703, -0.025565624237060547, -0.024606704711914062, -0.023647785186767578, -0.022688865661621094, -0.02172994613647461, -0.020771026611328125, -0.01981210708618164, -0.018853187561035156, -0.017894268035888672, -0.016935348510742188, -0.015976428985595703, -0.015017509460449219, -0.014058589935302734, -0.01309967041015625, -0.012140750885009766, -0.011181831359863281, -0.010222911834716797, -0.009263992309570312, -0.008305072784423828, -0.007346153259277344, -0.006387233734130859, -0.005428314208984375, -0.004469394683837891, -0.0035104751586914062, -0.002551555633544922, -0.0015926361083984375, -0.0006337165832519531, 0.00032520294189453125, 0.0012841224670410156, 0.0022430419921875, 0.0032019615173339844, 0.004160881042480469, 0.005119800567626953, 0.0060787200927734375, 0.007037639617919922, 0.007996559143066406, 0.00895547866821289, 0.009914398193359375, 0.01087331771850586, 0.011832237243652344, 0.012791156768798828, 0.013750076293945312, 0.014708995819091797, 0.01566791534423828, 0.016626834869384766, 0.01758575439453125, 0.018544673919677734, 0.01950359344482422, 0.020462512969970703, 0.021421432495117188, 0.022380352020263672, 0.023339271545410156, 0.02429819107055664, 0.025257110595703125, 0.02621603012084961, 0.027174949645996094, 0.028133869171142578, 0.029092788696289062, 0.030051708221435547, 0.03101062774658203, 0.031969547271728516, 0.032928466796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 6.0, 7.0, 11.0, 13.0, 21.0, 42.0, 54.0, 93.0, 156.0, 323.0, 669.0, 1464.0, 3599.0, 9855.0, 64137.0, 931770.0, 24936.0, 6760.0, 2549.0, 1068.0, 453.0, 214.0, 123.0, 57.0, 50.0, 32.0, 12.0, 13.0, 14.0, 15.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.09385395050048828, -0.09041786193847656, -0.08698177337646484, -0.08354568481445312, -0.0801095962524414, -0.07667350769042969, -0.07323741912841797, -0.06980133056640625, -0.06636524200439453, -0.06292915344238281, -0.059493064880371094, -0.056056976318359375, -0.052620887756347656, -0.04918479919433594, -0.04574871063232422, -0.0423126220703125, -0.03887653350830078, -0.03544044494628906, -0.032004356384277344, -0.028568267822265625, -0.025132179260253906, -0.021696090698242188, -0.01826000213623047, -0.01482391357421875, -0.011387825012207031, -0.007951736450195312, -0.004515647888183594, -0.001079559326171875, 0.0023565292358398438, 0.0057926177978515625, 0.009228706359863281, 0.012664794921875, 0.01610088348388672, 0.019536972045898438, 0.022973060607910156, 0.026409149169921875, 0.029845237731933594, 0.03328132629394531, 0.03671741485595703, 0.04015350341796875, 0.04358959197998047, 0.04702568054199219, 0.050461769104003906, 0.053897857666015625, 0.057333946228027344, 0.06077003479003906, 0.06420612335205078, 0.0676422119140625, 0.07107830047607422, 0.07451438903808594, 0.07795047760009766, 0.08138656616210938, 0.0848226547241211, 0.08825874328613281, 0.09169483184814453, 0.09513092041015625, 0.09856700897216797, 0.10200309753417969, 0.1054391860961914, 0.10887527465820312, 0.11231136322021484, 0.11574745178222656, 0.11918354034423828, 0.12261962890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 2.0, 6.0, 18.0, 23.0, 31.0, 37.0, 50.0, 81.0, 124.0, 218.0, 128.0, 69.0, 50.0, 33.0, 32.0, 16.0, 14.0, 12.0, 8.0, 7.0, 1.0, 4.0, 4.0, 0.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.00017547607421875, -0.00017114076763391495, -0.0001668054610490799, -0.00016247015446424484, -0.0001581348478794098, -0.00015379954129457474, -0.00014946423470973969, -0.00014512892812490463, -0.00014079362154006958, -0.00013645831495523453, -0.00013212300837039948, -0.00012778770178556442, -0.00012345239520072937, -0.00011911708861589432, -0.00011478178203105927, -0.00011044647544622421, -0.00010611116886138916, -0.00010177586227655411, -9.744055569171906e-05, -9.3105249106884e-05, -8.876994252204895e-05, -8.44346359372139e-05, -8.009932935237885e-05, -7.576402276754379e-05, -7.142871618270874e-05, -6.709340959787369e-05, -6.275810301303864e-05, -5.842279642820358e-05, -5.408748984336853e-05, -4.975218325853348e-05, -4.5416876673698425e-05, -4.108157008886337e-05, -3.674626350402832e-05, -3.241095691919327e-05, -2.8075650334358215e-05, -2.3740343749523163e-05, -1.940503716468811e-05, -1.5069730579853058e-05, -1.0734423995018005e-05, -6.399117410182953e-06, -2.0638108253479004e-06, 2.271495759487152e-06, 6.606802344322205e-06, 1.0942108929157257e-05, 1.527741551399231e-05, 1.9612722098827362e-05, 2.3948028683662415e-05, 2.8283335268497467e-05, 3.261864185333252e-05, 3.695394843816757e-05, 4.1289255023002625e-05, 4.562456160783768e-05, 4.995986819267273e-05, 5.429517477750778e-05, 5.8630481362342834e-05, 6.296578794717789e-05, 6.730109453201294e-05, 7.163640111684799e-05, 7.597170770168304e-05, 8.03070142865181e-05, 8.464232087135315e-05, 8.89776274561882e-05, 9.331293404102325e-05, 9.764824062585831e-05, 0.00010198354721069336]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 11.0, 9.0, 11.0, 27.0, 37.0, 45.0, 69.0, 219.0, 471.0, 1433.0, 5744.0, 59570.0, 958876.0, 17324.0, 3143.0, 885.0, 322.0, 138.0, 59.0, 26.0, 28.0, 20.0, 16.0, 7.0, 7.0, 10.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09689903259277344, -0.09370040893554688, -0.09050178527832031, -0.08730316162109375, -0.08410453796386719, -0.08090591430664062, -0.07770729064941406, -0.0745086669921875, -0.07131004333496094, -0.06811141967773438, -0.06491279602050781, -0.06171417236328125, -0.05851554870605469, -0.055316925048828125, -0.05211830139160156, -0.048919677734375, -0.04572105407714844, -0.042522430419921875, -0.03932380676269531, -0.03612518310546875, -0.03292655944824219, -0.029727935791015625, -0.026529312133789062, -0.0233306884765625, -0.020132064819335938, -0.016933441162109375, -0.013734817504882812, -0.01053619384765625, -0.0073375701904296875, -0.004138946533203125, -0.0009403228759765625, 0.00225830078125, 0.0054569244384765625, 0.008655548095703125, 0.011854171752929688, 0.01505279541015625, 0.018251419067382812, 0.021450042724609375, 0.024648666381835938, 0.0278472900390625, 0.031045913696289062, 0.034244537353515625, 0.03744316101074219, 0.04064178466796875, 0.04384040832519531, 0.047039031982421875, 0.05023765563964844, 0.053436279296875, 0.05663490295410156, 0.059833526611328125, 0.06303215026855469, 0.06623077392578125, 0.06942939758300781, 0.07262802124023438, 0.07582664489746094, 0.0790252685546875, 0.08222389221191406, 0.08542251586914062, 0.08862113952636719, 0.09181976318359375, 0.09501838684082031, 0.09821701049804688, 0.10141563415527344, 0.1046142578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 11.0, 12.0, 19.0, 26.0, 43.0, 86.0, 203.0, 280.0, 124.0, 66.0, 47.0, 19.0, 16.0, 12.0, 3.0, 0.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032745361328125, -0.03179025650024414, -0.03083515167236328, -0.029880046844482422, -0.028924942016601562, -0.027969837188720703, -0.027014732360839844, -0.026059627532958984, -0.025104522705078125, -0.024149417877197266, -0.023194313049316406, -0.022239208221435547, -0.021284103393554688, -0.020328998565673828, -0.01937389373779297, -0.01841878890991211, -0.01746368408203125, -0.01650857925415039, -0.015553474426269531, -0.014598369598388672, -0.013643264770507812, -0.012688159942626953, -0.011733055114746094, -0.010777950286865234, -0.009822845458984375, -0.008867740631103516, -0.007912635803222656, -0.006957530975341797, -0.0060024261474609375, -0.005047321319580078, -0.004092216491699219, -0.0031371116638183594, -0.0021820068359375, -0.0012269020080566406, -0.00027179718017578125, 0.0006833076477050781, 0.0016384124755859375, 0.002593517303466797, 0.0035486221313476562, 0.004503726959228516, 0.005458831787109375, 0.006413936614990234, 0.007369041442871094, 0.008324146270751953, 0.009279251098632812, 0.010234355926513672, 0.011189460754394531, 0.01214456558227539, 0.01309967041015625, 0.01405477523803711, 0.015009880065917969, 0.015964984893798828, 0.016920089721679688, 0.017875194549560547, 0.018830299377441406, 0.019785404205322266, 0.020740509033203125, 0.021695613861083984, 0.022650718688964844, 0.023605823516845703, 0.024560928344726562, 0.025516033172607422, 0.02647113800048828, 0.02742624282836914, 0.02838134765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 21.0, 89.0, 357.0, 370.0, 122.0, 19.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6188273429870605, -0.6030632257461548, -0.5872991681098938, -0.571535050868988, -0.5557709336280823, -0.5400068759918213, -0.5242427587509155, -0.5084786415100098, -0.4927145540714264, -0.476950466632843, -0.46118634939193726, -0.4454222619533539, -0.4296581745147705, -0.41389405727386475, -0.39812996983528137, -0.382365882396698, -0.36660176515579224, -0.35083767771720886, -0.3350735604763031, -0.3193094730377197, -0.30354535579681396, -0.2877812683582306, -0.2720171809196472, -0.25625306367874146, -0.24048897624015808, -0.2247248739004135, -0.20896077156066895, -0.19319668412208557, -0.177432581782341, -0.16166847944259644, -0.14590439200401306, -0.1301402896642685, -0.1143762469291687, -0.09861214458942413, -0.08284804970026016, -0.06708395481109619, -0.051319852471351624, -0.035555750131607056, -0.019791655242443085, -0.004027560353279114, 0.011736541986465454, 0.027500640600919724, 0.04326473921537399, 0.05902883782982826, 0.07479293644428253, 0.0905570387840271, 0.10632113367319107, 0.12208522856235504, 0.1378493309020996, 0.15361343324184418, 0.16937753558158875, 0.18514162302017212, 0.2009057253599167, 0.21666982769966125, 0.23243391513824463, 0.2481980174779892, 0.26396211981773376, 0.27972620725631714, 0.2954903244972229, 0.3112544119358063, 0.32701849937438965, 0.3427826166152954, 0.3585467040538788, 0.37431079149246216, 0.3900749087333679]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 10.0, 13.0, 11.0, 21.0, 12.0, 24.0, 23.0, 25.0, 23.0, 36.0, 35.0, 48.0, 38.0, 46.0, 41.0, 38.0, 43.0, 55.0, 49.0, 47.0, 51.0, 39.0, 31.0, 22.0, 37.0, 37.0, 29.0, 18.0, 17.0, 17.0, 10.0, 16.0, 11.0, 8.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09061121940612793, -0.08812852948904037, -0.08564583957195282, -0.08316314965486526, -0.08068045973777771, -0.07819777727127075, -0.0757150873541832, -0.07323239743709564, -0.07074970752000809, -0.06826701760292053, -0.06578432768583298, -0.06330163776874542, -0.060818951576948166, -0.05833626165986061, -0.055853575468063354, -0.0533708855509758, -0.050888195633888245, -0.04840550571680069, -0.045922815799713135, -0.04344012960791588, -0.04095743969082832, -0.03847474977374077, -0.03599206358194351, -0.03350937366485596, -0.031026683747768402, -0.028543993830680847, -0.02606130577623844, -0.023578617721796036, -0.02109592780470848, -0.018613237887620926, -0.01613054983317852, -0.013647861778736115, -0.01116517186164856, -0.00868248287588358, -0.006199793890118599, -0.0037171049043536186, -0.0012344159185886383, 0.001248273067176342, 0.0037309620529413223, 0.006213650107383728, 0.008696340024471283, 0.011179029010236263, 0.013661717996001244, 0.01614440605044365, 0.018627095967531204, 0.02110978588461876, 0.023592473939061165, 0.02607516199350357, 0.028557851910591125, 0.03104054182767868, 0.033523231744766235, 0.03600591793656349, 0.03848860785365105, 0.0409712977707386, 0.04345398396253586, 0.04593667387962341, 0.04841936379671097, 0.05090205371379852, 0.05338474363088608, 0.055867429822683334, 0.05835011973977089, 0.060832809656858444, 0.0633154958486557, 0.06579818576574326, 0.06828087568283081]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 14.0, 12.0, 26.0, 38.0, 43.0, 90.0, 205.0, 423.0, 1066.0, 4756.0, 3954993.0, 227352.0, 4094.0, 773.0, 213.0, 113.0, 34.0, 17.0, 13.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.14531898498535156, -0.14061355590820312, -0.1359081268310547, -0.13120269775390625, -0.1264972686767578, -0.12179183959960938, -0.11708641052246094, -0.1123809814453125, -0.10767555236816406, -0.10297012329101562, -0.09826469421386719, -0.09355926513671875, -0.08885383605957031, -0.08414840698242188, -0.07944297790527344, -0.074737548828125, -0.07003211975097656, -0.06532669067382812, -0.06062126159667969, -0.05591583251953125, -0.05121040344238281, -0.046504974365234375, -0.04179954528808594, -0.0370941162109375, -0.03238868713378906, -0.027683258056640625, -0.022977828979492188, -0.01827239990234375, -0.013566970825195312, -0.008861541748046875, -0.0041561126708984375, 0.00054931640625, 0.0052547454833984375, 0.009960174560546875, 0.014665603637695312, 0.01937103271484375, 0.024076461791992188, 0.028781890869140625, 0.03348731994628906, 0.0381927490234375, 0.04289817810058594, 0.047603607177734375, 0.05230903625488281, 0.05701446533203125, 0.06171989440917969, 0.06642532348632812, 0.07113075256347656, 0.075836181640625, 0.08054161071777344, 0.08524703979492188, 0.08995246887207031, 0.09465789794921875, 0.09936332702636719, 0.10406875610351562, 0.10877418518066406, 0.1134796142578125, 0.11818504333496094, 0.12289047241210938, 0.1275959014892578, 0.13230133056640625, 0.1370067596435547, 0.14171218872070312, 0.14641761779785156, 0.151123046875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 32.0, 137.0, 332.0, 324.0, 110.0, 34.0, 13.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0509033203125, -0.049628496170043945, -0.04835367202758789, -0.047078847885131836, -0.04580402374267578, -0.04452919960021973, -0.04325437545776367, -0.04197955131530762, -0.04070472717285156, -0.03942990303039551, -0.03815507888793945, -0.0368802547454834, -0.035605430603027344, -0.03433060646057129, -0.033055782318115234, -0.03178095817565918, -0.030506134033203125, -0.02923130989074707, -0.027956485748291016, -0.02668166160583496, -0.025406837463378906, -0.02413201332092285, -0.022857189178466797, -0.021582365036010742, -0.020307540893554688, -0.019032716751098633, -0.017757892608642578, -0.016483068466186523, -0.015208244323730469, -0.013933420181274414, -0.01265859603881836, -0.011383771896362305, -0.01010894775390625, -0.008834123611450195, -0.007559299468994141, -0.006284475326538086, -0.005009651184082031, -0.0037348270416259766, -0.002460002899169922, -0.0011851787567138672, 8.96453857421875e-05, 0.0013644695281982422, 0.002639293670654297, 0.0039141178131103516, 0.005188941955566406, 0.006463766098022461, 0.007738590240478516, 0.00901341438293457, 0.010288238525390625, 0.01156306266784668, 0.012837886810302734, 0.014112710952758789, 0.015387535095214844, 0.0166623592376709, 0.017937183380126953, 0.019212007522583008, 0.020486831665039062, 0.021761655807495117, 0.023036479949951172, 0.024311304092407227, 0.02558612823486328, 0.026860952377319336, 0.02813577651977539, 0.029410600662231445, 0.0306854248046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 15.0, 14.0, 22.0, 45.0, 73.0, 82.0, 166.0, 295.0, 476.0, 923.0, 2295.0, 7761.0, 53380.0, 1406589.0, 2622254.0, 84811.0, 10199.0, 2647.0, 1042.0, 488.0, 253.0, 162.0, 97.0, 57.0, 50.0, 19.0, 19.0, 12.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04890298843383789, -0.04732990264892578, -0.04575681686401367, -0.04418373107910156, -0.04261064529418945, -0.041037559509277344, -0.039464473724365234, -0.037891387939453125, -0.036318302154541016, -0.034745216369628906, -0.0331721305847168, -0.03159904479980469, -0.030025959014892578, -0.02845287322998047, -0.02687978744506836, -0.02530670166015625, -0.02373361587524414, -0.02216053009033203, -0.020587444305419922, -0.019014358520507812, -0.017441272735595703, -0.015868186950683594, -0.014295101165771484, -0.012722015380859375, -0.011148929595947266, -0.009575843811035156, -0.008002758026123047, -0.0064296722412109375, -0.004856586456298828, -0.0032835006713867188, -0.0017104148864746094, -0.0001373291015625, 0.0014357566833496094, 0.0030088424682617188, 0.004581928253173828, 0.0061550140380859375, 0.007728099822998047, 0.009301185607910156, 0.010874271392822266, 0.012447357177734375, 0.014020442962646484, 0.015593528747558594, 0.017166614532470703, 0.018739700317382812, 0.020312786102294922, 0.02188587188720703, 0.02345895767211914, 0.02503204345703125, 0.02660512924194336, 0.02817821502685547, 0.029751300811767578, 0.03132438659667969, 0.0328974723815918, 0.034470558166503906, 0.036043643951416016, 0.037616729736328125, 0.039189815521240234, 0.040762901306152344, 0.04233598709106445, 0.04390907287597656, 0.04548215866088867, 0.04705524444580078, 0.04862833023071289, 0.050201416015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 8.0, 17.0, 26.0, 29.0, 23.0, 58.0, 64.0, 105.0, 139.0, 195.0, 229.0, 307.0, 457.0, 522.0, 440.0, 358.0, 283.0, 226.0, 149.0, 116.0, 90.0, 55.0, 36.0, 29.0, 29.0, 19.0, 15.0, 15.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0226287841796875, -0.02195429801940918, -0.02127981185913086, -0.02060532569885254, -0.01993083953857422, -0.0192563533782959, -0.018581867218017578, -0.017907381057739258, -0.017232894897460938, -0.016558408737182617, -0.015883922576904297, -0.015209436416625977, -0.014534950256347656, -0.013860464096069336, -0.013185977935791016, -0.012511491775512695, -0.011837005615234375, -0.011162519454956055, -0.010488033294677734, -0.009813547134399414, -0.009139060974121094, -0.008464574813842773, -0.007790088653564453, -0.007115602493286133, -0.0064411163330078125, -0.005766630172729492, -0.005092144012451172, -0.0044176578521728516, -0.0037431716918945312, -0.003068685531616211, -0.0023941993713378906, -0.0017197132110595703, -0.00104522705078125, -0.0003707408905029297, 0.0003037452697753906, 0.000978231430053711, 0.0016527175903320312, 0.0023272037506103516, 0.003001689910888672, 0.003676176071166992, 0.0043506622314453125, 0.005025148391723633, 0.005699634552001953, 0.0063741207122802734, 0.007048606872558594, 0.007723093032836914, 0.008397579193115234, 0.009072065353393555, 0.009746551513671875, 0.010421037673950195, 0.011095523834228516, 0.011770009994506836, 0.012444496154785156, 0.013118982315063477, 0.013793468475341797, 0.014467954635620117, 0.015142440795898438, 0.015816926956176758, 0.016491413116455078, 0.0171658992767334, 0.01784038543701172, 0.01851487159729004, 0.01918935775756836, 0.01986384391784668, 0.020538330078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 55.0, 702.0, 234.0, 17.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9157102108001709, -0.8893593549728394, -0.8630084991455078, -0.8366576433181763, -0.8103067874908447, -0.7839559316635132, -0.7576050758361816, -0.7312542200088501, -0.7049033641815186, -0.678552508354187, -0.6522016525268555, -0.6258507966995239, -0.5994999408721924, -0.5731490850448608, -0.5467982292175293, -0.5204473733901978, -0.494096577167511, -0.46774572134017944, -0.4413948655128479, -0.41504400968551636, -0.3886931538581848, -0.36234229803085327, -0.3359914720058441, -0.3096406161785126, -0.28328976035118103, -0.2569389045238495, -0.23058804869651794, -0.2042372077703476, -0.17788635194301605, -0.1515354961156845, -0.12518465518951416, -0.09883379936218262, -0.07248294353485107, -0.04613209143280983, -0.019781239330768585, 0.006569609045982361, 0.032920464873313904, 0.05927132070064545, 0.0856221616268158, 0.11197301745414734, 0.13832387328147888, 0.16467472910881042, 0.19102558493614197, 0.21737642586231232, 0.24372728168964386, 0.2700781226158142, 0.29642897844314575, 0.3227798342704773, 0.34913069009780884, 0.3754815459251404, 0.4018324017524719, 0.42818325757980347, 0.454534113407135, 0.48088496923446655, 0.5072357654571533, 0.5335866212844849, 0.5599374771118164, 0.586288332939148, 0.6126391887664795, 0.638990044593811, 0.6653409004211426, 0.6916917562484741, 0.7180426120758057, 0.7443934679031372, 0.7707443237304688]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 4.0, 15.0, 10.0, 15.0, 17.0, 29.0, 46.0, 41.0, 39.0, 46.0, 37.0, 49.0, 51.0, 65.0, 48.0, 74.0, 54.0, 51.0, 44.0, 42.0, 34.0, 23.0, 35.0, 26.0, 21.0, 22.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.09094744920730591, -0.08803810179233551, -0.08512875437736511, -0.08221940696239471, -0.07931005954742432, -0.07640070468187332, -0.07349135726690292, -0.07058200985193253, -0.06767266243696213, -0.06476331502199173, -0.06185396760702133, -0.058944616466760635, -0.05603526905179024, -0.05312592163681984, -0.05021657049655914, -0.047307223081588745, -0.04439787566661835, -0.04148852825164795, -0.03857918083667755, -0.035669829696416855, -0.03276048228144646, -0.02985113486647606, -0.026941785588860512, -0.024032436311244965, -0.021123088896274567, -0.01821374148130417, -0.015304392203688622, -0.012395043857395649, -0.009485695511102676, -0.006576347164809704, -0.0036669988185167313, -0.0007576495409011841, 0.002151697874069214, 0.005061046220362186, 0.007970394566655159, 0.010879742912948132, 0.013789091259241104, 0.016698438674211502, 0.01960778795182705, 0.022517137229442596, 0.025426484644412994, 0.028335832059383392, 0.03124518133699894, 0.03415453061461449, 0.037063878029584885, 0.03997322544455528, 0.04288257658481598, 0.04579192399978638, 0.048701271414756775, 0.05161061882972717, 0.05451996624469757, 0.05742931738495827, 0.060338664799928665, 0.06324801594018936, 0.06615736335515976, 0.06906671077013016, 0.07197605818510056, 0.07488540560007095, 0.07779475301504135, 0.08070410043001175, 0.08361345529556274, 0.08652280271053314, 0.08943215012550354, 0.09234149754047394, 0.09525084495544434]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 4.0, 14.0, 9.0, 11.0, 24.0, 44.0, 61.0, 85.0, 144.0, 235.0, 429.0, 792.0, 2711.0, 175018.0, 862442.0, 4339.0, 980.0, 463.0, 255.0, 173.0, 104.0, 76.0, 32.0, 27.0, 25.0, 9.0, 9.0, 11.0, 6.0, 6.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2732410430908203, -0.2652320861816406, -0.25722312927246094, -0.24921417236328125, -0.24120521545410156, -0.23319625854492188, -0.2251873016357422, -0.2171783447265625, -0.2091693878173828, -0.20116043090820312, -0.19315147399902344, -0.18514251708984375, -0.17713356018066406, -0.16912460327148438, -0.1611156463623047, -0.153106689453125, -0.1450977325439453, -0.13708877563476562, -0.12907981872558594, -0.12107086181640625, -0.11306190490722656, -0.10505294799804688, -0.09704399108886719, -0.0890350341796875, -0.08102607727050781, -0.07301712036132812, -0.06500816345214844, -0.05699920654296875, -0.04899024963378906, -0.040981292724609375, -0.03297233581542969, -0.02496337890625, -0.016954421997070312, -0.008945465087890625, -0.0009365081787109375, 0.00707244873046875, 0.015081405639648438, 0.023090362548828125, 0.031099319458007812, 0.0391082763671875, 0.04711723327636719, 0.055126190185546875, 0.06313514709472656, 0.07114410400390625, 0.07915306091308594, 0.08716201782226562, 0.09517097473144531, 0.103179931640625, 0.11118888854980469, 0.11919784545898438, 0.12720680236816406, 0.13521575927734375, 0.14322471618652344, 0.15123367309570312, 0.1592426300048828, 0.1672515869140625, 0.1752605438232422, 0.18326950073242188, 0.19127845764160156, 0.19928741455078125, 0.20729637145996094, 0.21530532836914062, 0.2233142852783203, 0.2313232421875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 27.0, 99.0, 265.0, 375.0, 154.0, 51.0, 19.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048828125, -0.047583580017089844, -0.04633903503417969, -0.04509449005126953, -0.043849945068359375, -0.04260540008544922, -0.04136085510253906, -0.040116310119628906, -0.03887176513671875, -0.037627220153808594, -0.03638267517089844, -0.03513813018798828, -0.033893585205078125, -0.03264904022216797, -0.03140449523925781, -0.030159950256347656, -0.0289154052734375, -0.027670860290527344, -0.026426315307617188, -0.02518177032470703, -0.023937225341796875, -0.02269268035888672, -0.021448135375976562, -0.020203590393066406, -0.01895904541015625, -0.017714500427246094, -0.016469955444335938, -0.015225410461425781, -0.013980865478515625, -0.012736320495605469, -0.011491775512695312, -0.010247230529785156, -0.009002685546875, -0.007758140563964844, -0.0065135955810546875, -0.005269050598144531, -0.004024505615234375, -0.0027799606323242188, -0.0015354156494140625, -0.00029087066650390625, 0.00095367431640625, 0.0021982192993164062, 0.0034427642822265625, 0.004687309265136719, 0.005931854248046875, 0.007176399230957031, 0.008420944213867188, 0.009665489196777344, 0.0109100341796875, 0.012154579162597656, 0.013399124145507812, 0.014643669128417969, 0.015888214111328125, 0.01713275909423828, 0.018377304077148438, 0.019621849060058594, 0.02086639404296875, 0.022110939025878906, 0.023355484008789062, 0.02460002899169922, 0.025844573974609375, 0.02708911895751953, 0.028333663940429688, 0.029578208923339844, 0.03082275390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 8.0, 13.0, 14.0, 12.0, 20.0, 29.0, 39.0, 53.0, 64.0, 102.0, 125.0, 215.0, 304.0, 443.0, 817.0, 1936.0, 6537.0, 35825.0, 384359.0, 551030.0, 53057.0, 8474.0, 2433.0, 990.0, 535.0, 336.0, 220.0, 162.0, 104.0, 72.0, 44.0, 39.0, 29.0, 22.0, 26.0, 16.0, 12.0, 6.0, 8.0, 2.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08642578125, -0.08373260498046875, -0.0810394287109375, -0.07834625244140625, -0.075653076171875, -0.07295989990234375, -0.0702667236328125, -0.06757354736328125, -0.06488037109375, -0.06218719482421875, -0.0594940185546875, -0.05680084228515625, -0.054107666015625, -0.05141448974609375, -0.0487213134765625, -0.04602813720703125, -0.0433349609375, -0.04064178466796875, -0.0379486083984375, -0.03525543212890625, -0.032562255859375, -0.02986907958984375, -0.0271759033203125, -0.02448272705078125, -0.02178955078125, -0.01909637451171875, -0.0164031982421875, -0.01371002197265625, -0.011016845703125, -0.00832366943359375, -0.0056304931640625, -0.00293731689453125, -0.000244140625, 0.00244903564453125, 0.0051422119140625, 0.00783538818359375, 0.010528564453125, 0.01322174072265625, 0.0159149169921875, 0.01860809326171875, 0.02130126953125, 0.02399444580078125, 0.0266876220703125, 0.02938079833984375, 0.032073974609375, 0.03476715087890625, 0.0374603271484375, 0.04015350341796875, 0.0428466796875, 0.04553985595703125, 0.0482330322265625, 0.05092620849609375, 0.053619384765625, 0.05631256103515625, 0.0590057373046875, 0.06169891357421875, 0.06439208984375, 0.06708526611328125, 0.0697784423828125, 0.07247161865234375, 0.075164794921875, 0.07785797119140625, 0.0805511474609375, 0.08324432373046875, 0.0859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 5.0, 7.0, 12.0, 11.0, 10.0, 14.0, 19.0, 22.0, 24.0, 28.0, 37.0, 41.0, 43.0, 52.0, 45.0, 39.0, 37.0, 54.0, 45.0, 53.0, 45.0, 51.0, 42.0, 47.0, 25.0, 38.0, 27.0, 21.0, 14.0, 18.0, 8.0, 13.0, 6.0, 14.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299835205078125, -0.029099464416503906, -0.028215408325195312, -0.02733135223388672, -0.026447296142578125, -0.02556324005126953, -0.024679183959960938, -0.023795127868652344, -0.02291107177734375, -0.022027015686035156, -0.021142959594726562, -0.02025890350341797, -0.019374847412109375, -0.01849079132080078, -0.017606735229492188, -0.016722679138183594, -0.015838623046875, -0.014954566955566406, -0.014070510864257812, -0.013186454772949219, -0.012302398681640625, -0.011418342590332031, -0.010534286499023438, -0.009650230407714844, -0.00876617431640625, -0.007882118225097656, -0.0069980621337890625, -0.006114006042480469, -0.005229949951171875, -0.004345893859863281, -0.0034618377685546875, -0.0025777816772460938, -0.0016937255859375, -0.0008096694946289062, 7.43865966796875e-05, 0.0009584426879882812, 0.001842498779296875, 0.0027265548706054688, 0.0036106109619140625, 0.004494667053222656, 0.00537872314453125, 0.006262779235839844, 0.0071468353271484375, 0.008030891418457031, 0.008914947509765625, 0.009799003601074219, 0.010683059692382812, 0.011567115783691406, 0.012451171875, 0.013335227966308594, 0.014219284057617188, 0.015103340148925781, 0.015987396240234375, 0.01687145233154297, 0.017755508422851562, 0.018639564514160156, 0.01952362060546875, 0.020407676696777344, 0.021291732788085938, 0.02217578887939453, 0.023059844970703125, 0.02394390106201172, 0.024827957153320312, 0.025712013244628906, 0.0265960693359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 12.0, 12.0, 22.0, 27.0, 34.0, 56.0, 97.0, 143.0, 207.0, 322.0, 612.0, 1088.0, 2042.0, 4144.0, 8655.0, 19806.0, 59407.0, 394927.0, 453875.0, 63628.0, 21326.0, 8972.0, 4207.0, 2160.0, 1126.0, 628.0, 372.0, 188.0, 132.0, 100.0, 57.0, 45.0, 29.0, 27.0, 15.0, 9.0, 10.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.03485870361328125, -0.0336151123046875, -0.03237152099609375, -0.0311279296875, -0.02988433837890625, -0.0286407470703125, -0.02739715576171875, -0.026153564453125, -0.02490997314453125, -0.0236663818359375, -0.02242279052734375, -0.02117919921875, -0.01993560791015625, -0.0186920166015625, -0.01744842529296875, -0.016204833984375, -0.01496124267578125, -0.0137176513671875, -0.01247406005859375, -0.01123046875, -0.00998687744140625, -0.0087432861328125, -0.00749969482421875, -0.006256103515625, -0.00501251220703125, -0.0037689208984375, -0.00252532958984375, -0.00128173828125, -3.814697265625e-05, 0.0012054443359375, 0.00244903564453125, 0.003692626953125, 0.00493621826171875, 0.0061798095703125, 0.00742340087890625, 0.0086669921875, 0.00991058349609375, 0.0111541748046875, 0.01239776611328125, 0.013641357421875, 0.01488494873046875, 0.0161285400390625, 0.01737213134765625, 0.01861572265625, 0.01985931396484375, 0.0211029052734375, 0.02234649658203125, 0.023590087890625, 0.02483367919921875, 0.0260772705078125, 0.02732086181640625, 0.028564453125, 0.02980804443359375, 0.0310516357421875, 0.03229522705078125, 0.033538818359375, 0.03478240966796875, 0.0360260009765625, 0.03726959228515625, 0.03851318359375, 0.03975677490234375, 0.0410003662109375, 0.04224395751953125, 0.043487548828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 6.0, 1.0, 5.0, 5.0, 8.0, 4.0, 8.0, 13.0, 19.0, 21.0, 14.0, 32.0, 39.0, 28.0, 36.0, 47.0, 51.0, 72.0, 90.0, 87.0, 73.0, 58.0, 47.0, 41.0, 26.0, 38.0, 29.0, 29.0, 16.0, 11.0, 13.0, 7.0, 4.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.490945816040039e-05, -6.260816007852554e-05, -6.0306861996650696e-05, -5.800556391477585e-05, -5.5704265832901e-05, -5.3402967751026154e-05, -5.1101669669151306e-05, -4.880037158727646e-05, -4.649907350540161e-05, -4.4197775423526764e-05, -4.1896477341651917e-05, -3.959517925977707e-05, -3.729388117790222e-05, -3.4992583096027374e-05, -3.269128501415253e-05, -3.038998693227768e-05, -2.8088688850402832e-05, -2.5787390768527985e-05, -2.3486092686653137e-05, -2.118479460477829e-05, -1.8883496522903442e-05, -1.6582198441028595e-05, -1.4280900359153748e-05, -1.19796022772789e-05, -9.678304195404053e-06, -7.377006113529205e-06, -5.075708031654358e-06, -2.7744099497795105e-06, -4.731118679046631e-07, 1.8281862139701843e-06, 4.129484295845032e-06, 6.430782377719879e-06, 8.732080459594727e-06, 1.1033378541469574e-05, 1.3334676623344421e-05, 1.563597470521927e-05, 1.7937272787094116e-05, 2.0238570868968964e-05, 2.253986895084381e-05, 2.484116703271866e-05, 2.7142465114593506e-05, 2.9443763196468353e-05, 3.17450612783432e-05, 3.404635936021805e-05, 3.6347657442092896e-05, 3.864895552396774e-05, 4.095025360584259e-05, 4.325155168771744e-05, 4.5552849769592285e-05, 4.785414785146713e-05, 5.015544593334198e-05, 5.245674401521683e-05, 5.4758042097091675e-05, 5.705934017896652e-05, 5.936063826084137e-05, 6.166193634271622e-05, 6.396323442459106e-05, 6.626453250646591e-05, 6.856583058834076e-05, 7.08671286702156e-05, 7.316842675209045e-05, 7.54697248339653e-05, 7.777102291584015e-05, 8.0072320997715e-05, 8.237361907958984e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 6.0, 5.0, 9.0, 13.0, 14.0, 28.0, 36.0, 69.0, 110.0, 223.0, 467.0, 1360.0, 4672.0, 25412.0, 856053.0, 145282.0, 10804.0, 2422.0, 771.0, 331.0, 169.0, 78.0, 67.0, 29.0, 26.0, 15.0, 13.0, 10.0, 6.0, 10.0, 5.0, 10.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07439041137695312, -0.07138824462890625, -0.06838607788085938, -0.0653839111328125, -0.062381744384765625, -0.05937957763671875, -0.056377410888671875, -0.053375244140625, -0.050373077392578125, -0.04737091064453125, -0.044368743896484375, -0.0413665771484375, -0.038364410400390625, -0.03536224365234375, -0.032360076904296875, -0.02935791015625, -0.026355743408203125, -0.02335357666015625, -0.020351409912109375, -0.0173492431640625, -0.014347076416015625, -0.01134490966796875, -0.008342742919921875, -0.005340576171875, -0.002338409423828125, 0.00066375732421875, 0.003665924072265625, 0.0066680908203125, 0.009670257568359375, 0.01267242431640625, 0.015674591064453125, 0.0186767578125, 0.021678924560546875, 0.02468109130859375, 0.027683258056640625, 0.0306854248046875, 0.033687591552734375, 0.03668975830078125, 0.039691925048828125, 0.042694091796875, 0.045696258544921875, 0.04869842529296875, 0.051700592041015625, 0.0547027587890625, 0.057704925537109375, 0.06070709228515625, 0.06370925903320312, 0.06671142578125, 0.06971359252929688, 0.07271575927734375, 0.07571792602539062, 0.0787200927734375, 0.08172225952148438, 0.08472442626953125, 0.08772659301757812, 0.090728759765625, 0.09373092651367188, 0.09673309326171875, 0.09973526000976562, 0.1027374267578125, 0.10573959350585938, 0.10874176025390625, 0.11174392700195312, 0.11474609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 10.0, 11.0, 11.0, 24.0, 39.0, 68.0, 119.0, 221.0, 241.0, 114.0, 47.0, 24.0, 18.0, 7.0, 13.0, 3.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0560302734375, -0.05455589294433594, -0.053081512451171875, -0.05160713195800781, -0.05013275146484375, -0.04865837097167969, -0.047183990478515625, -0.04570960998535156, -0.0442352294921875, -0.04276084899902344, -0.041286468505859375, -0.03981208801269531, -0.03833770751953125, -0.03686332702636719, -0.035388946533203125, -0.03391456604003906, -0.032440185546875, -0.030965805053710938, -0.029491424560546875, -0.028017044067382812, -0.02654266357421875, -0.025068283081054688, -0.023593902587890625, -0.022119522094726562, -0.0206451416015625, -0.019170761108398438, -0.017696380615234375, -0.016222000122070312, -0.01474761962890625, -0.013273239135742188, -0.011798858642578125, -0.010324478149414062, -0.00885009765625, -0.0073757171630859375, -0.005901336669921875, -0.0044269561767578125, -0.00295257568359375, -0.0014781951904296875, -3.814697265625e-06, 0.0014705657958984375, 0.0029449462890625, 0.0044193267822265625, 0.005893707275390625, 0.0073680877685546875, 0.00884246826171875, 0.010316848754882812, 0.011791229248046875, 0.013265609741210938, 0.014739990234375, 0.016214370727539062, 0.017688751220703125, 0.019163131713867188, 0.02063751220703125, 0.022111892700195312, 0.023586273193359375, 0.025060653686523438, 0.0265350341796875, 0.028009414672851562, 0.029483795166015625, 0.030958175659179688, 0.03243255615234375, 0.03390693664550781, 0.035381317138671875, 0.03685569763183594, 0.038330078125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 12.0, 31.0, 404.0, 482.0, 67.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24406927824020386, -0.2137887328863144, -0.18350818753242493, -0.15322764217853546, -0.122947096824646, -0.09266655147075653, -0.062386006116867065, -0.0321054607629776, -0.0018249154090881348, 0.02845562994480133, 0.058736175298690796, 0.08901672065258026, 0.11929726600646973, 0.1495778113603592, 0.17985835671424866, 0.21013890206813812, 0.2404194474220276, 0.27069997787475586, 0.3009805381298065, 0.3312610983848572, 0.36154162883758545, 0.3918221592903137, 0.4221027195453644, 0.45238327980041504, 0.4826638102531433, 0.5129443407058716, 0.5432249307632446, 0.5735054612159729, 0.6037859916687012, 0.6340665221214294, 0.6643470525741577, 0.6946276426315308, 0.7249081134796143, 0.7551886439323425, 0.7854691743850708, 0.8157497644424438, 0.8460302948951721, 0.8763108253479004, 0.9065914154052734, 0.9368719458580017, 0.96715247631073, 0.9974330067634583, 1.0277135372161865, 1.0579941272735596, 1.0882747173309326, 1.1185551881790161, 1.1488357782363892, 1.1791162490844727, 1.2093968391418457, 1.2396774291992188, 1.2699579000473022, 1.3002384901046753, 1.3305189609527588, 1.3607995510101318, 1.3910801410675049, 1.4213606119155884, 1.4516412019729614, 1.4819217920303345, 1.512202262878418, 1.542482852935791, 1.572763442993164, 1.6030439138412476, 1.6333245038986206, 1.663604974746704, 1.6938855648040771]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 10.0, 10.0, 16.0, 18.0, 19.0, 40.0, 42.0, 52.0, 65.0, 73.0, 72.0, 65.0, 63.0, 74.0, 67.0, 66.0, 53.0, 53.0, 45.0, 20.0, 25.0, 16.0, 9.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17111057043075562, -0.16573134064674377, -0.16035212576389313, -0.1549728959798813, -0.14959366619586945, -0.1442144513130188, -0.13883522152900696, -0.13345599174499512, -0.12807676196098328, -0.12269753962755203, -0.11731830984354019, -0.11193908751010895, -0.1065598577260971, -0.10118063539266586, -0.09580141305923462, -0.09042218327522278, -0.08504296839237213, -0.07966374605894089, -0.07428451627492905, -0.0689052939414978, -0.06352606415748596, -0.05814684182405472, -0.052767619490623474, -0.04738839343190193, -0.04200916737318039, -0.03662994131445885, -0.031250715255737305, -0.02587149292230606, -0.02049226686358452, -0.015113040804862976, -0.009733818471431732, -0.00435459241271019, 0.0010246336460113525, 0.00640385877341032, 0.011783083900809288, 0.01716230809688568, 0.022541534155607224, 0.027920760214328766, 0.03329998254776001, 0.03867920860648155, 0.044058434665203094, 0.04943766072392464, 0.05481688678264618, 0.06019610911607742, 0.06557533144950867, 0.07095456123352051, 0.07633378356695175, 0.081713005900383, 0.08709223568439484, 0.09247145801782608, 0.09785068780183792, 0.10322991013526917, 0.108609139919281, 0.11398836225271225, 0.1193675845861435, 0.12474681437015533, 0.13012602925300598, 0.13550525903701782, 0.14088447391986847, 0.1462637037038803, 0.15164293348789215, 0.1570221483707428, 0.16240137815475464, 0.16778060793876648, 0.17315983772277832]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 13.0, 13.0, 17.0, 37.0, 42.0, 92.0, 142.0, 338.0, 734.0, 1865.0, 8913.0, 2471805.0, 1696666.0, 9973.0, 2540.0, 650.0, 238.0, 107.0, 46.0, 22.0, 9.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06939697265625, -0.06691646575927734, -0.06443595886230469, -0.06195545196533203, -0.059474945068359375, -0.05699443817138672, -0.05451393127441406, -0.052033424377441406, -0.04955291748046875, -0.047072410583496094, -0.04459190368652344, -0.04211139678955078, -0.039630889892578125, -0.03715038299560547, -0.03466987609863281, -0.032189369201660156, -0.0297088623046875, -0.027228355407714844, -0.024747848510742188, -0.02226734161376953, -0.019786834716796875, -0.01730632781982422, -0.014825820922851562, -0.012345314025878906, -0.00986480712890625, -0.007384300231933594, -0.0049037933349609375, -0.0024232864379882812, 5.7220458984375e-05, 0.0025377273559570312, 0.0050182342529296875, 0.007498741149902344, 0.009979248046875, 0.012459754943847656, 0.014940261840820312, 0.01742076873779297, 0.019901275634765625, 0.02238178253173828, 0.024862289428710938, 0.027342796325683594, 0.02982330322265625, 0.032303810119628906, 0.03478431701660156, 0.03726482391357422, 0.039745330810546875, 0.04222583770751953, 0.04470634460449219, 0.047186851501464844, 0.0496673583984375, 0.052147865295410156, 0.05462837219238281, 0.05710887908935547, 0.059589385986328125, 0.06206989288330078, 0.06455039978027344, 0.0670309066772461, 0.06951141357421875, 0.0719919204711914, 0.07447242736816406, 0.07695293426513672, 0.07943344116210938, 0.08191394805908203, 0.08439445495605469, 0.08687496185302734, 0.08935546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 40.0, 119.0, 235.0, 307.0, 186.0, 71.0, 22.0, 8.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04815673828125, -0.04696083068847656, -0.045764923095703125, -0.04456901550292969, -0.04337310791015625, -0.04217720031738281, -0.040981292724609375, -0.03978538513183594, -0.0385894775390625, -0.03739356994628906, -0.036197662353515625, -0.03500175476074219, -0.03380584716796875, -0.03260993957519531, -0.031414031982421875, -0.030218124389648438, -0.029022216796875, -0.027826309204101562, -0.026630401611328125, -0.025434494018554688, -0.02423858642578125, -0.023042678833007812, -0.021846771240234375, -0.020650863647460938, -0.0194549560546875, -0.018259048461914062, -0.017063140869140625, -0.015867233276367188, -0.01467132568359375, -0.013475418090820312, -0.012279510498046875, -0.011083602905273438, -0.0098876953125, -0.008691787719726562, -0.007495880126953125, -0.0062999725341796875, -0.00510406494140625, -0.0039081573486328125, -0.002712249755859375, -0.0015163421630859375, -0.0003204345703125, 0.0008754730224609375, 0.002071380615234375, 0.0032672882080078125, 0.00446319580078125, 0.0056591033935546875, 0.006855010986328125, 0.008050918579101562, 0.009246826171875, 0.010442733764648438, 0.011638641357421875, 0.012834548950195312, 0.01403045654296875, 0.015226364135742188, 0.016422271728515625, 0.017618179321289062, 0.0188140869140625, 0.020009994506835938, 0.021205902099609375, 0.022401809692382812, 0.02359771728515625, 0.024793624877929688, 0.025989532470703125, 0.027185440063476562, 0.02838134765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 2.0, 6.0, 13.0, 8.0, 11.0, 15.0, 31.0, 39.0, 51.0, 79.0, 143.0, 270.0, 495.0, 1102.0, 2879.0, 11775.0, 107253.0, 2912580.0, 1101435.0, 45332.0, 6877.0, 1978.0, 854.0, 404.0, 239.0, 134.0, 91.0, 48.0, 39.0, 33.0, 19.0, 12.0, 11.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046630859375, -0.04525279998779297, -0.04387474060058594, -0.042496681213378906, -0.041118621826171875, -0.039740562438964844, -0.03836250305175781, -0.03698444366455078, -0.03560638427734375, -0.03422832489013672, -0.03285026550292969, -0.031472206115722656, -0.030094146728515625, -0.028716087341308594, -0.027338027954101562, -0.02595996856689453, -0.0245819091796875, -0.02320384979248047, -0.021825790405273438, -0.020447731018066406, -0.019069671630859375, -0.017691612243652344, -0.016313552856445312, -0.014935493469238281, -0.01355743408203125, -0.012179374694824219, -0.010801315307617188, -0.009423255920410156, -0.008045196533203125, -0.006667137145996094, -0.0052890777587890625, -0.003911018371582031, -0.002532958984375, -0.0011548995971679688, 0.0002231597900390625, 0.0016012191772460938, 0.002979278564453125, 0.004357337951660156, 0.0057353973388671875, 0.007113456726074219, 0.00849151611328125, 0.009869575500488281, 0.011247634887695312, 0.012625694274902344, 0.014003753662109375, 0.015381813049316406, 0.016759872436523438, 0.01813793182373047, 0.0195159912109375, 0.02089405059814453, 0.022272109985351562, 0.023650169372558594, 0.025028228759765625, 0.026406288146972656, 0.027784347534179688, 0.02916240692138672, 0.03054046630859375, 0.03191852569580078, 0.03329658508300781, 0.034674644470214844, 0.036052703857421875, 0.037430763244628906, 0.03880882263183594, 0.04018688201904297, 0.04156494140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 13.0, 11.0, 9.0, 27.0, 58.0, 52.0, 80.0, 130.0, 156.0, 210.0, 281.0, 372.0, 465.0, 527.0, 430.0, 349.0, 258.0, 171.0, 146.0, 86.0, 68.0, 51.0, 32.0, 26.0, 14.0, 9.0, 13.0, 3.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.019622802734375, -0.018996477127075195, -0.01837015151977539, -0.017743825912475586, -0.01711750030517578, -0.016491174697875977, -0.015864849090576172, -0.015238523483276367, -0.014612197875976562, -0.013985872268676758, -0.013359546661376953, -0.012733221054077148, -0.012106895446777344, -0.011480569839477539, -0.010854244232177734, -0.01022791862487793, -0.009601593017578125, -0.00897526741027832, -0.008348941802978516, -0.007722616195678711, -0.007096290588378906, -0.0064699649810791016, -0.005843639373779297, -0.005217313766479492, -0.0045909881591796875, -0.003964662551879883, -0.003338336944580078, -0.0027120113372802734, -0.0020856857299804688, -0.001459360122680664, -0.0008330345153808594, -0.0002067089080810547, 0.00041961669921875, 0.0010459423065185547, 0.0016722679138183594, 0.002298593521118164, 0.0029249191284179688, 0.0035512447357177734, 0.004177570343017578, 0.004803895950317383, 0.0054302215576171875, 0.006056547164916992, 0.006682872772216797, 0.0073091983795166016, 0.007935523986816406, 0.008561849594116211, 0.009188175201416016, 0.00981450080871582, 0.010440826416015625, 0.01106715202331543, 0.011693477630615234, 0.012319803237915039, 0.012946128845214844, 0.013572454452514648, 0.014198780059814453, 0.014825105667114258, 0.015451431274414062, 0.016077756881713867, 0.016704082489013672, 0.017330408096313477, 0.01795673370361328, 0.018583059310913086, 0.01920938491821289, 0.019835710525512695, 0.0204620361328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 36.0, 135.0, 347.0, 315.0, 123.0, 26.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3070932924747467, -0.2980409264564514, -0.28898856043815613, -0.27993619441986084, -0.27088382840156555, -0.26183146238327026, -0.252779096364975, -0.2437267154455185, -0.2346743494272232, -0.22562198340892792, -0.21656961739063263, -0.20751725137233734, -0.19846487045288086, -0.18941250443458557, -0.18036013841629028, -0.171307772397995, -0.1622554063796997, -0.15320304036140442, -0.14415067434310913, -0.13509830832481384, -0.12604594230651855, -0.11699356883764267, -0.10794119536876678, -0.0988888293504715, -0.08983646333217621, -0.08078409731388092, -0.07173173129558563, -0.06267935782670975, -0.05362699180841446, -0.04457462579011917, -0.035522256046533585, -0.026469886302947998, -0.017417550086975098, -0.00836518220603466, 0.000687185674905777, 0.009739553555846214, 0.01879192143678665, 0.02784428745508194, 0.036896657198667526, 0.04594902694225311, 0.0550013929605484, 0.06405375897884369, 0.07310612499713898, 0.08215849846601486, 0.09121086448431015, 0.10026323050260544, 0.10931560397148132, 0.11836796998977661, 0.1274203360080719, 0.1364727020263672, 0.14552506804466248, 0.15457743406295776, 0.16362980008125305, 0.17268216609954834, 0.18173454701900482, 0.1907869130373001, 0.1998392790555954, 0.20889164507389069, 0.21794401109218597, 0.22699637711048126, 0.23604875802993774, 0.24510112404823303, 0.2541534900665283, 0.2632058560848236, 0.2722582221031189]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 5.0, 15.0, 16.0, 17.0, 37.0, 30.0, 27.0, 29.0, 53.0, 51.0, 54.0, 56.0, 54.0, 55.0, 54.0, 55.0, 50.0, 53.0, 47.0, 43.0, 33.0, 31.0, 34.0, 28.0, 10.0, 16.0, 13.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07462972402572632, -0.0718650296330452, -0.06910032778978348, -0.06633563339710236, -0.06357093155384064, -0.060806237161159515, -0.058041542768478394, -0.05527684465050697, -0.05251214653253555, -0.04974744841456413, -0.04698275029659271, -0.04421805590391159, -0.04145335778594017, -0.03868865966796875, -0.03592396527528763, -0.03315926715731621, -0.030394569039344788, -0.027629870921373367, -0.024865174666047096, -0.022100478410720825, -0.019335780292749405, -0.016571082174777985, -0.013806385919451714, -0.011041689664125443, -0.008276991546154022, -0.0055122943595051765, -0.002747597172856331, 1.71000137925148e-05, 0.0027817972004413605, 0.005546494387090206, 0.008311191573739052, 0.011075887829065323, 0.013840585947036743, 0.016605284065008163, 0.019369980320334435, 0.022134676575660706, 0.024899374693632126, 0.027664072811603546, 0.030428769066929817, 0.03319346532225609, 0.03595816344022751, 0.03872286155819893, 0.04148755967617035, 0.04425225406885147, 0.04701695218682289, 0.04978165030479431, 0.05254634469747543, 0.055311042815446854, 0.058075740933418274, 0.060840439051389694, 0.06360513716936111, 0.06636983156204224, 0.06913453340530396, 0.07189922779798508, 0.0746639221906662, 0.07742862403392792, 0.08019331842660904, 0.08295801281929016, 0.08572271466255188, 0.088487409055233, 0.09125210344791412, 0.09401680529117584, 0.09678149968385696, 0.09954619407653809, 0.1023108959197998]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 2.0, 4.0, 10.0, 7.0, 4.0, 11.0, 16.0, 16.0, 23.0, 47.0, 40.0, 67.0, 91.0, 164.0, 227.0, 336.0, 555.0, 1024.0, 2601.0, 23984.0, 859314.0, 150412.0, 6175.0, 1456.0, 709.0, 395.0, 275.0, 162.0, 123.0, 83.0, 69.0, 33.0, 29.0, 22.0, 18.0, 10.0, 10.0, 8.0, 6.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.116455078125, -0.11289787292480469, -0.10934066772460938, -0.10578346252441406, -0.10222625732421875, -0.09866905212402344, -0.09511184692382812, -0.09155464172363281, -0.0879974365234375, -0.08444023132324219, -0.08088302612304688, -0.07732582092285156, -0.07376861572265625, -0.07021141052246094, -0.06665420532226562, -0.06309700012207031, -0.059539794921875, -0.05598258972167969, -0.052425384521484375, -0.04886817932128906, -0.04531097412109375, -0.04175376892089844, -0.038196563720703125, -0.03463935852050781, -0.0310821533203125, -0.027524948120117188, -0.023967742919921875, -0.020410537719726562, -0.01685333251953125, -0.013296127319335938, -0.009738922119140625, -0.0061817169189453125, -0.00262451171875, 0.0009326934814453125, 0.004489898681640625, 0.008047103881835938, 0.01160430908203125, 0.015161514282226562, 0.018718719482421875, 0.022275924682617188, 0.0258331298828125, 0.029390335083007812, 0.032947540283203125, 0.03650474548339844, 0.04006195068359375, 0.04361915588378906, 0.047176361083984375, 0.05073356628417969, 0.054290771484375, 0.05784797668457031, 0.061405181884765625, 0.06496238708496094, 0.06851959228515625, 0.07207679748535156, 0.07563400268554688, 0.07919120788574219, 0.0827484130859375, 0.08630561828613281, 0.08986282348632812, 0.09342002868652344, 0.09697723388671875, 0.10053443908691406, 0.10409164428710938, 0.10764884948730469, 0.1112060546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 25.0, 86.0, 206.0, 306.0, 239.0, 93.0, 29.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04620361328125, -0.04503464698791504, -0.04386568069458008, -0.04269671440124512, -0.041527748107910156, -0.040358781814575195, -0.039189815521240234, -0.03802084922790527, -0.03685188293457031, -0.03568291664123535, -0.03451395034790039, -0.03334498405456543, -0.03217601776123047, -0.031007051467895508, -0.029838085174560547, -0.028669118881225586, -0.027500152587890625, -0.026331186294555664, -0.025162220001220703, -0.023993253707885742, -0.02282428741455078, -0.02165532112121582, -0.02048635482788086, -0.0193173885345459, -0.018148422241210938, -0.016979455947875977, -0.015810489654541016, -0.014641523361206055, -0.013472557067871094, -0.012303590774536133, -0.011134624481201172, -0.009965658187866211, -0.00879669189453125, -0.007627725601196289, -0.006458759307861328, -0.005289793014526367, -0.004120826721191406, -0.0029518604278564453, -0.0017828941345214844, -0.0006139278411865234, 0.0005550384521484375, 0.0017240047454833984, 0.0028929710388183594, 0.00406193733215332, 0.005230903625488281, 0.006399869918823242, 0.007568836212158203, 0.008737802505493164, 0.009906768798828125, 0.011075735092163086, 0.012244701385498047, 0.013413667678833008, 0.014582633972167969, 0.01575160026550293, 0.01692056655883789, 0.01808953285217285, 0.019258499145507812, 0.020427465438842773, 0.021596431732177734, 0.022765398025512695, 0.023934364318847656, 0.025103330612182617, 0.026272296905517578, 0.02744126319885254, 0.0286102294921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 10.0, 18.0, 18.0, 23.0, 71.0, 74.0, 128.0, 228.0, 380.0, 696.0, 1521.0, 5594.0, 58748.0, 787130.0, 178100.0, 11419.0, 2239.0, 926.0, 484.0, 256.0, 129.0, 97.0, 77.0, 41.0, 32.0, 18.0, 19.0, 14.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.106201171875, -0.1032247543334961, -0.10024833679199219, -0.09727191925048828, -0.09429550170898438, -0.09131908416748047, -0.08834266662597656, -0.08536624908447266, -0.08238983154296875, -0.07941341400146484, -0.07643699645996094, -0.07346057891845703, -0.07048416137695312, -0.06750774383544922, -0.06453132629394531, -0.061554908752441406, -0.0585784912109375, -0.055602073669433594, -0.05262565612792969, -0.04964923858642578, -0.046672821044921875, -0.04369640350341797, -0.04071998596191406, -0.037743568420410156, -0.03476715087890625, -0.031790733337402344, -0.028814315795898438, -0.02583789825439453, -0.022861480712890625, -0.01988506317138672, -0.016908645629882812, -0.013932228088378906, -0.010955810546875, -0.007979393005371094, -0.0050029754638671875, -0.0020265579223632812, 0.000949859619140625, 0.003926277160644531, 0.0069026947021484375, 0.009879112243652344, 0.01285552978515625, 0.015831947326660156, 0.018808364868164062, 0.02178478240966797, 0.024761199951171875, 0.02773761749267578, 0.030714035034179688, 0.033690452575683594, 0.0366668701171875, 0.039643287658691406, 0.04261970520019531, 0.04559612274169922, 0.048572540283203125, 0.05154895782470703, 0.05452537536621094, 0.057501792907714844, 0.06047821044921875, 0.06345462799072266, 0.06643104553222656, 0.06940746307373047, 0.07238388061523438, 0.07536029815673828, 0.07833671569824219, 0.0813131332397461, 0.08428955078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 8.0, 6.0, 12.0, 13.0, 29.0, 20.0, 29.0, 32.0, 36.0, 44.0, 41.0, 34.0, 40.0, 41.0, 53.0, 66.0, 65.0, 70.0, 48.0, 39.0, 47.0, 40.0, 37.0, 28.0, 27.0, 14.0, 14.0, 12.0, 13.0, 8.0, 9.0, 8.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291595458984375, -0.028212308883666992, -0.027265071868896484, -0.026317834854125977, -0.02537059783935547, -0.02442336082458496, -0.023476123809814453, -0.022528886795043945, -0.021581649780273438, -0.02063441276550293, -0.019687175750732422, -0.018739938735961914, -0.017792701721191406, -0.0168454647064209, -0.01589822769165039, -0.014950990676879883, -0.014003753662109375, -0.013056516647338867, -0.01210927963256836, -0.011162042617797852, -0.010214805603027344, -0.009267568588256836, -0.008320331573486328, -0.00737309455871582, -0.0064258575439453125, -0.005478620529174805, -0.004531383514404297, -0.003584146499633789, -0.0026369094848632812, -0.0016896724700927734, -0.0007424354553222656, 0.0002048015594482422, 0.00115203857421875, 0.002099275588989258, 0.0030465126037597656, 0.0039937496185302734, 0.004940986633300781, 0.005888223648071289, 0.006835460662841797, 0.007782697677612305, 0.008729934692382812, 0.00967717170715332, 0.010624408721923828, 0.011571645736694336, 0.012518882751464844, 0.013466119766235352, 0.01441335678100586, 0.015360593795776367, 0.016307830810546875, 0.017255067825317383, 0.01820230484008789, 0.0191495418548584, 0.020096778869628906, 0.021044015884399414, 0.021991252899169922, 0.02293848991394043, 0.023885726928710938, 0.024832963943481445, 0.025780200958251953, 0.02672743797302246, 0.02767467498779297, 0.028621912002563477, 0.029569149017333984, 0.030516386032104492, 0.031463623046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 4.0, 16.0, 21.0, 29.0, 40.0, 57.0, 104.0, 184.0, 317.0, 545.0, 1160.0, 2481.0, 5576.0, 14875.0, 59288.0, 693428.0, 224366.0, 29070.0, 9537.0, 3952.0, 1708.0, 824.0, 397.0, 211.0, 129.0, 53.0, 44.0, 33.0, 22.0, 15.0, 7.0, 17.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037750244140625, -0.036632537841796875, -0.03551483154296875, -0.034397125244140625, -0.0332794189453125, -0.032161712646484375, -0.03104400634765625, -0.029926300048828125, -0.02880859375, -0.027690887451171875, -0.02657318115234375, -0.025455474853515625, -0.0243377685546875, -0.023220062255859375, -0.02210235595703125, -0.020984649658203125, -0.019866943359375, -0.018749237060546875, -0.01763153076171875, -0.016513824462890625, -0.0153961181640625, -0.014278411865234375, -0.01316070556640625, -0.012042999267578125, -0.01092529296875, -0.009807586669921875, -0.00868988037109375, -0.007572174072265625, -0.0064544677734375, -0.005336761474609375, -0.00421905517578125, -0.003101348876953125, -0.001983642578125, -0.000865936279296875, 0.00025177001953125, 0.001369476318359375, 0.0024871826171875, 0.003604888916015625, 0.00472259521484375, 0.005840301513671875, 0.0069580078125, 0.008075714111328125, 0.00919342041015625, 0.010311126708984375, 0.0114288330078125, 0.012546539306640625, 0.01366424560546875, 0.014781951904296875, 0.015899658203125, 0.017017364501953125, 0.01813507080078125, 0.019252777099609375, 0.0203704833984375, 0.021488189697265625, 0.02260589599609375, 0.023723602294921875, 0.02484130859375, 0.025959014892578125, 0.02707672119140625, 0.028194427490234375, 0.0293121337890625, 0.030429840087890625, 0.03154754638671875, 0.032665252685546875, 0.033782958984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 5.0, 11.0, 5.0, 12.0, 13.0, 12.0, 17.0, 18.0, 40.0, 42.0, 58.0, 58.0, 89.0, 87.0, 92.0, 86.0, 79.0, 64.0, 37.0, 30.0, 22.0, 20.0, 13.0, 6.0, 12.0, 11.0, 12.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.5789947509765625e-05, -5.4108910262584686e-05, -5.242787301540375e-05, -5.074683576822281e-05, -4.906579852104187e-05, -4.738476127386093e-05, -4.570372402667999e-05, -4.4022686779499054e-05, -4.2341649532318115e-05, -4.0660612285137177e-05, -3.897957503795624e-05, -3.72985377907753e-05, -3.561750054359436e-05, -3.393646329641342e-05, -3.225542604923248e-05, -3.0574388802051544e-05, -2.8893351554870605e-05, -2.7212314307689667e-05, -2.5531277060508728e-05, -2.385023981332779e-05, -2.216920256614685e-05, -2.0488165318965912e-05, -1.8807128071784973e-05, -1.7126090824604034e-05, -1.5445053577423096e-05, -1.3764016330242157e-05, -1.2082979083061218e-05, -1.040194183588028e-05, -8.72090458869934e-06, -7.039867341518402e-06, -5.358830094337463e-06, -3.6777928471565247e-06, -1.996755599975586e-06, -3.157183527946472e-07, 1.3653188943862915e-06, 3.0463561415672302e-06, 4.727393388748169e-06, 6.408430635929108e-06, 8.089467883110046e-06, 9.770505130290985e-06, 1.1451542377471924e-05, 1.3132579624652863e-05, 1.4813616871833801e-05, 1.649465411901474e-05, 1.817569136619568e-05, 1.9856728613376617e-05, 2.1537765860557556e-05, 2.3218803107738495e-05, 2.4899840354919434e-05, 2.6580877602100372e-05, 2.826191484928131e-05, 2.994295209646225e-05, 3.162398934364319e-05, 3.330502659082413e-05, 3.4986063838005066e-05, 3.6667101085186005e-05, 3.834813833236694e-05, 4.002917557954788e-05, 4.171021282672882e-05, 4.339125007390976e-05, 4.50722873210907e-05, 4.675332456827164e-05, 4.8434361815452576e-05, 5.0115399062633514e-05, 5.179643630981445e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 9.0, 15.0, 10.0, 18.0, 25.0, 37.0, 37.0, 65.0, 104.0, 177.0, 341.0, 750.0, 1937.0, 5346.0, 20298.0, 150537.0, 787614.0, 62424.0, 12484.0, 3746.0, 1288.0, 559.0, 275.0, 164.0, 80.0, 40.0, 42.0, 28.0, 22.0, 24.0, 11.0, 8.0, 13.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0458984375, -0.04456138610839844, -0.043224334716796875, -0.04188728332519531, -0.04055023193359375, -0.03921318054199219, -0.037876129150390625, -0.03653907775878906, -0.0352020263671875, -0.03386497497558594, -0.032527923583984375, -0.031190872192382812, -0.02985382080078125, -0.028516769409179688, -0.027179718017578125, -0.025842666625976562, -0.024505615234375, -0.023168563842773438, -0.021831512451171875, -0.020494461059570312, -0.01915740966796875, -0.017820358276367188, -0.016483306884765625, -0.015146255493164062, -0.0138092041015625, -0.012472152709960938, -0.011135101318359375, -0.009798049926757812, -0.00846099853515625, -0.0071239471435546875, -0.005786895751953125, -0.0044498443603515625, -0.00311279296875, -0.0017757415771484375, -0.000438690185546875, 0.0008983612060546875, 0.00223541259765625, 0.0035724639892578125, 0.004909515380859375, 0.0062465667724609375, 0.0075836181640625, 0.008920669555664062, 0.010257720947265625, 0.011594772338867188, 0.01293182373046875, 0.014268875122070312, 0.015605926513671875, 0.016942977905273438, 0.018280029296875, 0.019617080688476562, 0.020954132080078125, 0.022291183471679688, 0.02362823486328125, 0.024965286254882812, 0.026302337646484375, 0.027639389038085938, 0.0289764404296875, 0.030313491821289062, 0.031650543212890625, 0.03298759460449219, 0.03432464599609375, 0.03566169738769531, 0.036998748779296875, 0.03833580017089844, 0.0396728515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 8.0, 13.0, 11.0, 17.0, 13.0, 23.0, 21.0, 27.0, 62.0, 67.0, 89.0, 127.0, 135.0, 86.0, 68.0, 40.0, 34.0, 27.0, 14.0, 10.0, 20.0, 11.0, 5.0, 11.0, 6.0, 8.0, 6.0, 2.0, 8.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0177001953125, -0.017191648483276367, -0.016683101654052734, -0.0161745548248291, -0.01566600799560547, -0.015157461166381836, -0.014648914337158203, -0.01414036750793457, -0.013631820678710938, -0.013123273849487305, -0.012614727020263672, -0.012106180191040039, -0.011597633361816406, -0.011089086532592773, -0.01058053970336914, -0.010071992874145508, -0.009563446044921875, -0.009054899215698242, -0.00854635238647461, -0.008037805557250977, -0.007529258728027344, -0.007020711898803711, -0.006512165069580078, -0.006003618240356445, -0.0054950714111328125, -0.00498652458190918, -0.004477977752685547, -0.003969430923461914, -0.0034608840942382812, -0.0029523372650146484, -0.0024437904357910156, -0.0019352436065673828, -0.00142669677734375, -0.0009181499481201172, -0.0004096031188964844, 9.894371032714844e-05, 0.0006074905395507812, 0.001116037368774414, 0.0016245841979980469, 0.0021331310272216797, 0.0026416778564453125, 0.0031502246856689453, 0.003658771514892578, 0.004167318344116211, 0.004675865173339844, 0.0051844120025634766, 0.005692958831787109, 0.006201505661010742, 0.006710052490234375, 0.007218599319458008, 0.007727146148681641, 0.008235692977905273, 0.008744239807128906, 0.009252786636352539, 0.009761333465576172, 0.010269880294799805, 0.010778427124023438, 0.01128697395324707, 0.011795520782470703, 0.012304067611694336, 0.012812614440917969, 0.013321161270141602, 0.013829708099365234, 0.014338254928588867, 0.0148468017578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 22.0, 142.0, 588.0, 227.0, 13.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1434255838394165, -1.1221356391906738, -1.1008458137512207, -1.079555869102478, -1.0582659244537354, -1.0369760990142822, -1.0156861543655396, -0.9943962097167969, -0.973106324672699, -0.9518164396286011, -0.9305264949798584, -0.9092366099357605, -0.8879466652870178, -0.8666567802429199, -0.8453668355941772, -0.8240769505500793, -0.8027870655059814, -0.7814971804618835, -0.7602072358131409, -0.738917350769043, -0.7176274061203003, -0.6963375210762024, -0.6750476360321045, -0.6537576913833618, -0.6324677467346191, -0.6111778616905212, -0.5898879170417786, -0.5685980319976807, -0.547308087348938, -0.5260182023048401, -0.5047283172607422, -0.4834383726119995, -0.4621484875679016, -0.4408585727214813, -0.41956865787506104, -0.39827877283096313, -0.37698885798454285, -0.35569894313812256, -0.33440902829170227, -0.313119113445282, -0.2918292284011841, -0.2705393135547638, -0.2492494136095047, -0.2279594987630844, -0.20666959881782532, -0.18537968397140503, -0.16408976912498474, -0.14279986917972565, -0.12150995433330536, -0.10022004693746567, -0.07893013954162598, -0.05764022469520569, -0.036350317299366, -0.015060409903526306, 0.006229504942893982, 0.027519404888153076, 0.048809319734573364, 0.07009922713041306, 0.09138913452625275, 0.11267904937267303, 0.13396894931793213, 0.15525886416435242, 0.1765487790107727, 0.1978386789560318, 0.2191285938024521]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 8.0, 5.0, 8.0, 9.0, 12.0, 19.0, 13.0, 27.0, 27.0, 39.0, 33.0, 38.0, 46.0, 51.0, 49.0, 61.0, 46.0, 40.0, 45.0, 57.0, 50.0, 42.0, 30.0, 33.0, 37.0, 31.0, 29.0, 19.0, 14.0, 14.0, 7.0, 10.0, 9.0, 9.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08443325757980347, -0.08162000775337219, -0.07880675792694092, -0.07599350810050964, -0.07318025827407837, -0.07036701589822769, -0.06755376607179642, -0.06474051624536514, -0.06192726641893387, -0.059114016592502594, -0.05630076676607132, -0.053487520664930344, -0.05067427083849907, -0.047861021012067795, -0.04504777491092682, -0.042234525084495544, -0.03942127525806427, -0.036608025431632996, -0.03379477560520172, -0.030981529504060745, -0.02816827967762947, -0.025355029851198196, -0.02254178188741207, -0.019728533923625946, -0.01691528409719467, -0.014102035202085972, -0.011288786306977272, -0.008475537411868572, -0.0056622885167598724, -0.0028490396216511726, -3.579072654247284e-05, 0.0027774572372436523, 0.005590707063674927, 0.008403955958783627, 0.011217204853892326, 0.014030453749001026, 0.016843702644109726, 0.019656952470541, 0.022470200434327126, 0.02528344839811325, 0.028096698224544525, 0.0309099480509758, 0.033723197877407074, 0.03653644397854805, 0.039349693804979324, 0.0421629436314106, 0.044976189732551575, 0.04778943955898285, 0.050602689385414124, 0.0534159392118454, 0.05622918903827667, 0.05904243513941765, 0.06185568496584892, 0.0646689310669899, 0.06748218089342117, 0.07029543071985245, 0.07310868054628372, 0.075921930372715, 0.07873518019914627, 0.08154843002557755, 0.08436167240142822, 0.0871749222278595, 0.08998817205429077, 0.09280142188072205, 0.09561467170715332]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 11.0, 12.0, 12.0, 10.0, 24.0, 42.0, 73.0, 94.0, 145.0, 280.0, 490.0, 940.0, 2413.0, 9919.0, 289603.0, 3846701.0, 34815.0, 6052.0, 1586.0, 550.0, 214.0, 126.0, 62.0, 33.0, 24.0, 18.0, 13.0, 7.0, 9.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05763816833496094, -0.055522918701171875, -0.05340766906738281, -0.05129241943359375, -0.04917716979980469, -0.047061920166015625, -0.04494667053222656, -0.0428314208984375, -0.04071617126464844, -0.038600921630859375, -0.03648567199707031, -0.03437042236328125, -0.03225517272949219, -0.030139923095703125, -0.028024673461914062, -0.025909423828125, -0.023794174194335938, -0.021678924560546875, -0.019563674926757812, -0.01744842529296875, -0.015333175659179688, -0.013217926025390625, -0.011102676391601562, -0.0089874267578125, -0.0068721771240234375, -0.004756927490234375, -0.0026416778564453125, -0.00052642822265625, 0.0015888214111328125, 0.003704071044921875, 0.0058193206787109375, 0.0079345703125, 0.010049819946289062, 0.012165069580078125, 0.014280319213867188, 0.01639556884765625, 0.018510818481445312, 0.020626068115234375, 0.022741317749023438, 0.0248565673828125, 0.026971817016601562, 0.029087066650390625, 0.031202316284179688, 0.03331756591796875, 0.03543281555175781, 0.037548065185546875, 0.03966331481933594, 0.041778564453125, 0.04389381408691406, 0.046009063720703125, 0.04812431335449219, 0.05023956298828125, 0.05235481262207031, 0.054470062255859375, 0.05658531188964844, 0.0587005615234375, 0.06081581115722656, 0.06293106079101562, 0.06504631042480469, 0.06716156005859375, 0.06927680969238281, 0.07139205932617188, 0.07350730895996094, 0.07562255859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 11.0, 17.0, 66.0, 146.0, 254.0, 282.0, 146.0, 55.0, 13.0, 10.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0433349609375, -0.042249202728271484, -0.04116344451904297, -0.04007768630981445, -0.03899192810058594, -0.03790616989135742, -0.036820411682128906, -0.03573465347290039, -0.034648895263671875, -0.03356313705444336, -0.032477378845214844, -0.03139162063598633, -0.030305862426757812, -0.029220104217529297, -0.02813434600830078, -0.027048587799072266, -0.02596282958984375, -0.024877071380615234, -0.02379131317138672, -0.022705554962158203, -0.021619796752929688, -0.020534038543701172, -0.019448280334472656, -0.01836252212524414, -0.017276763916015625, -0.01619100570678711, -0.015105247497558594, -0.014019489288330078, -0.012933731079101562, -0.011847972869873047, -0.010762214660644531, -0.009676456451416016, -0.0085906982421875, -0.007504940032958984, -0.006419181823730469, -0.005333423614501953, -0.0042476654052734375, -0.003161907196044922, -0.0020761489868164062, -0.0009903907775878906, 9.5367431640625e-05, 0.0011811256408691406, 0.0022668838500976562, 0.003352642059326172, 0.0044384002685546875, 0.005524158477783203, 0.006609916687011719, 0.007695674896240234, 0.00878143310546875, 0.009867191314697266, 0.010952949523925781, 0.012038707733154297, 0.013124465942382812, 0.014210224151611328, 0.015295982360839844, 0.01638174057006836, 0.017467498779296875, 0.01855325698852539, 0.019639015197753906, 0.020724773406982422, 0.021810531616210938, 0.022896289825439453, 0.02398204803466797, 0.025067806243896484, 0.026153564453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 12.0, 13.0, 20.0, 25.0, 41.0, 51.0, 80.0, 126.0, 201.0, 389.0, 998.0, 4292.0, 61682.0, 3732268.0, 381244.0, 9953.0, 1655.0, 556.0, 263.0, 141.0, 70.0, 55.0, 35.0, 23.0, 18.0, 22.0, 14.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0721435546875, -0.07027959823608398, -0.06841564178466797, -0.06655168533325195, -0.06468772888183594, -0.06282377243041992, -0.060959815979003906, -0.05909585952758789, -0.057231903076171875, -0.05536794662475586, -0.053503990173339844, -0.05164003372192383, -0.04977607727050781, -0.0479121208190918, -0.04604816436767578, -0.044184207916259766, -0.04232025146484375, -0.040456295013427734, -0.03859233856201172, -0.0367283821105957, -0.03486442565917969, -0.03300046920776367, -0.031136512756347656, -0.02927255630493164, -0.027408599853515625, -0.02554464340209961, -0.023680686950683594, -0.021816730499267578, -0.019952774047851562, -0.018088817596435547, -0.01622486114501953, -0.014360904693603516, -0.0124969482421875, -0.010632991790771484, -0.008769035339355469, -0.006905078887939453, -0.0050411224365234375, -0.003177165985107422, -0.0013132095336914062, 0.0005507469177246094, 0.002414703369140625, 0.004278659820556641, 0.006142616271972656, 0.008006572723388672, 0.009870529174804688, 0.011734485626220703, 0.013598442077636719, 0.015462398529052734, 0.01732635498046875, 0.019190311431884766, 0.02105426788330078, 0.022918224334716797, 0.024782180786132812, 0.026646137237548828, 0.028510093688964844, 0.03037405014038086, 0.032238006591796875, 0.03410196304321289, 0.035965919494628906, 0.03782987594604492, 0.03969383239746094, 0.04155778884887695, 0.04342174530029297, 0.045285701751708984, 0.047149658203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 11.0, 15.0, 14.0, 21.0, 24.0, 45.0, 68.0, 83.0, 132.0, 197.0, 257.0, 392.0, 560.0, 616.0, 502.0, 322.0, 228.0, 181.0, 110.0, 73.0, 80.0, 42.0, 26.0, 22.0, 17.0, 8.0, 12.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.01259160041809082, -0.01199960708618164, -0.011407613754272461, -0.010815620422363281, -0.010223627090454102, -0.009631633758544922, -0.009039640426635742, -0.008447647094726562, -0.007855653762817383, -0.007263660430908203, -0.0066716670989990234, -0.006079673767089844, -0.005487680435180664, -0.004895687103271484, -0.004303693771362305, -0.003711700439453125, -0.0031197071075439453, -0.0025277137756347656, -0.001935720443725586, -0.0013437271118164062, -0.0007517337799072266, -0.00015974044799804688, 0.0004322528839111328, 0.0010242462158203125, 0.0016162395477294922, 0.002208232879638672, 0.0028002262115478516, 0.0033922195434570312, 0.003984212875366211, 0.004576206207275391, 0.00516819953918457, 0.00576019287109375, 0.00635218620300293, 0.006944179534912109, 0.007536172866821289, 0.008128166198730469, 0.008720159530639648, 0.009312152862548828, 0.009904146194458008, 0.010496139526367188, 0.011088132858276367, 0.011680126190185547, 0.012272119522094727, 0.012864112854003906, 0.013456106185913086, 0.014048099517822266, 0.014640092849731445, 0.015232086181640625, 0.015824079513549805, 0.016416072845458984, 0.017008066177368164, 0.017600059509277344, 0.018192052841186523, 0.018784046173095703, 0.019376039505004883, 0.019968032836914062, 0.020560026168823242, 0.021152019500732422, 0.0217440128326416, 0.02233600616455078, 0.02292799949645996, 0.02351999282836914, 0.02411198616027832, 0.0247039794921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 25.0, 238.0, 570.0, 156.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5299005508422852, -0.5164393186569214, -0.5029780268669128, -0.4895167648792267, -0.4760555028915405, -0.46259427070617676, -0.4491329789161682, -0.43567174673080444, -0.4222104847431183, -0.40874922275543213, -0.39528796076774597, -0.3818266987800598, -0.36836543679237366, -0.3549041748046875, -0.34144294261932373, -0.3279816806316376, -0.3145204186439514, -0.30105915665626526, -0.2875978946685791, -0.27413663268089294, -0.2606753706932068, -0.24721412360668182, -0.23375286161899567, -0.2202916145324707, -0.20683032274246216, -0.193369060754776, -0.17990779876708984, -0.1664465367794037, -0.15298528969287872, -0.13952402770519257, -0.1260627657175064, -0.11260151118040085, -0.09914025664329529, -0.08567899465560913, -0.07221774011850357, -0.05875647813081741, -0.045295219868421555, -0.031833961606025696, -0.01837269961833954, -0.004911445081233978, 0.008549816906452179, 0.022011075168848038, 0.035472333431243896, 0.048933595418930054, 0.06239485368132591, 0.07585611194372177, 0.08931737393140793, 0.10277862846851349, 0.11623989045619965, 0.1297011524438858, 0.14316241443157196, 0.15662366151809692, 0.17008492350578308, 0.18354618549346924, 0.1970074474811554, 0.21046870946884155, 0.2239299714565277, 0.23739123344421387, 0.2508524954319, 0.2643137574195862, 0.27777501940727234, 0.2912362813949585, 0.30469751358032227, 0.3181587755680084, 0.3316200375556946]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 13.0, 8.0, 11.0, 12.0, 24.0, 23.0, 30.0, 32.0, 43.0, 50.0, 46.0, 69.0, 45.0, 51.0, 54.0, 56.0, 46.0, 50.0, 51.0, 42.0, 43.0, 31.0, 29.0, 31.0, 26.0, 11.0, 15.0, 13.0, 13.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443386435508728, -0.042285285890102386, -0.04023193195462227, -0.03817857801914215, -0.036125220358371735, -0.03407186269760132, -0.0320185087621212, -0.029965152963995934, -0.027911797165870667, -0.0258584413677454, -0.023805085569620132, -0.021751729771494865, -0.0196983739733696, -0.01764501817524433, -0.015591662377119064, -0.013538306578993797, -0.01148495078086853, -0.009431594982743263, -0.007378239184617996, -0.005324883386492729, -0.003271527588367462, -0.0012181717902421951, 0.0008351840078830719, 0.002888539806008339, 0.004941895604133606, 0.006995251402258873, 0.00904860720038414, 0.011101962998509407, 0.013155318796634674, 0.015208674594759941, 0.017262030392885208, 0.019315386191010475, 0.021368741989135742, 0.02342209778726101, 0.025475453585386276, 0.027528809383511543, 0.02958216518163681, 0.03163552284240723, 0.033688876777887344, 0.03574223071336746, 0.03779558837413788, 0.039848946034908295, 0.04190229997038841, 0.04395565390586853, 0.04600901156663895, 0.04806236922740936, 0.05011572316288948, 0.0521690770983696, 0.054222434759140015, 0.05627579241991043, 0.05832914635539055, 0.060382500290870667, 0.06243585795164108, 0.0644892156124115, 0.06654256582260132, 0.06859592348337173, 0.07064928114414215, 0.07270263880491257, 0.07475599646568298, 0.0768093466758728, 0.07886270433664322, 0.08091606199741364, 0.08296941220760345, 0.08502276986837387, 0.08707612752914429]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 6.0, 6.0, 9.0, 18.0, 13.0, 23.0, 25.0, 41.0, 62.0, 83.0, 106.0, 110.0, 195.0, 322.0, 399.0, 631.0, 1066.0, 2290.0, 10523.0, 159307.0, 801976.0, 60897.0, 5911.0, 1777.0, 950.0, 539.0, 354.0, 242.0, 167.0, 135.0, 98.0, 52.0, 60.0, 47.0, 26.0, 17.0, 10.0, 12.0, 7.0, 10.0, 13.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.074951171875, -0.0727691650390625, -0.070587158203125, -0.0684051513671875, -0.06622314453125, -0.0640411376953125, -0.061859130859375, -0.0596771240234375, -0.0574951171875, -0.0553131103515625, -0.053131103515625, -0.0509490966796875, -0.04876708984375, -0.0465850830078125, -0.044403076171875, -0.0422210693359375, -0.0400390625, -0.0378570556640625, -0.035675048828125, -0.0334930419921875, -0.03131103515625, -0.0291290283203125, -0.026947021484375, -0.0247650146484375, -0.0225830078125, -0.0204010009765625, -0.018218994140625, -0.0160369873046875, -0.01385498046875, -0.0116729736328125, -0.009490966796875, -0.0073089599609375, -0.005126953125, -0.0029449462890625, -0.000762939453125, 0.0014190673828125, 0.00360107421875, 0.0057830810546875, 0.007965087890625, 0.0101470947265625, 0.0123291015625, 0.0145111083984375, 0.016693115234375, 0.0188751220703125, 0.02105712890625, 0.0232391357421875, 0.025421142578125, 0.0276031494140625, 0.02978515625, 0.0319671630859375, 0.034149169921875, 0.0363311767578125, 0.03851318359375, 0.0406951904296875, 0.042877197265625, 0.0450592041015625, 0.0472412109375, 0.0494232177734375, 0.051605224609375, 0.0537872314453125, 0.05596923828125, 0.0581512451171875, 0.060333251953125, 0.0625152587890625, 0.064697265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 19.0, 57.0, 143.0, 251.0, 274.0, 169.0, 50.0, 18.0, 6.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03993391990661621, -0.03888273239135742, -0.03783154487609863, -0.036780357360839844, -0.035729169845581055, -0.034677982330322266, -0.03362679481506348, -0.03257560729980469, -0.0315244197845459, -0.03047323226928711, -0.02942204475402832, -0.02837085723876953, -0.027319669723510742, -0.026268482208251953, -0.025217294692993164, -0.024166107177734375, -0.023114919662475586, -0.022063732147216797, -0.021012544631958008, -0.01996135711669922, -0.01891016960144043, -0.01785898208618164, -0.01680779457092285, -0.015756607055664062, -0.014705419540405273, -0.013654232025146484, -0.012603044509887695, -0.011551856994628906, -0.010500669479370117, -0.009449481964111328, -0.008398294448852539, -0.00734710693359375, -0.006295919418334961, -0.005244731903076172, -0.004193544387817383, -0.0031423568725585938, -0.0020911693572998047, -0.0010399818420410156, 1.1205673217773438e-05, 0.0010623931884765625, 0.0021135807037353516, 0.0031647682189941406, 0.00421595573425293, 0.005267143249511719, 0.006318330764770508, 0.007369518280029297, 0.008420705795288086, 0.009471893310546875, 0.010523080825805664, 0.011574268341064453, 0.012625455856323242, 0.013676643371582031, 0.01472783088684082, 0.01577901840209961, 0.0168302059173584, 0.017881393432617188, 0.018932580947875977, 0.019983768463134766, 0.021034955978393555, 0.022086143493652344, 0.023137331008911133, 0.024188518524169922, 0.02523970603942871, 0.0262908935546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 9.0, 7.0, 8.0, 12.0, 18.0, 27.0, 31.0, 32.0, 50.0, 63.0, 84.0, 94.0, 137.0, 201.0, 313.0, 450.0, 846.0, 1462.0, 3351.0, 8446.0, 24925.0, 83126.0, 272943.0, 407810.0, 168915.0, 48900.0, 15459.0, 5527.0, 2302.0, 1086.0, 621.0, 393.0, 230.0, 168.0, 113.0, 102.0, 69.0, 52.0, 30.0, 26.0, 22.0, 22.0, 17.0, 15.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.027923583984375, -0.027109146118164062, -0.026294708251953125, -0.025480270385742188, -0.02466583251953125, -0.023851394653320312, -0.023036956787109375, -0.022222518920898438, -0.0214080810546875, -0.020593643188476562, -0.019779205322265625, -0.018964767456054688, -0.01815032958984375, -0.017335891723632812, -0.016521453857421875, -0.015707015991210938, -0.014892578125, -0.014078140258789062, -0.013263702392578125, -0.012449264526367188, -0.01163482666015625, -0.010820388793945312, -0.010005950927734375, -0.009191513061523438, -0.0083770751953125, -0.0075626373291015625, -0.006748199462890625, -0.0059337615966796875, -0.00511932373046875, -0.0043048858642578125, -0.003490447998046875, -0.0026760101318359375, -0.001861572265625, -0.0010471343994140625, -0.000232696533203125, 0.0005817413330078125, 0.00139617919921875, 0.0022106170654296875, 0.003025054931640625, 0.0038394927978515625, 0.0046539306640625, 0.0054683685302734375, 0.006282806396484375, 0.0070972442626953125, 0.00791168212890625, 0.008726119995117188, 0.009540557861328125, 0.010354995727539062, 0.01116943359375, 0.011983871459960938, 0.012798309326171875, 0.013612747192382812, 0.01442718505859375, 0.015241622924804688, 0.016056060791015625, 0.016870498657226562, 0.0176849365234375, 0.018499374389648438, 0.019313812255859375, 0.020128250122070312, 0.02094268798828125, 0.021757125854492188, 0.022571563720703125, 0.023386001586914062, 0.024200439453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 8.0, 9.0, 6.0, 10.0, 19.0, 16.0, 23.0, 31.0, 31.0, 37.0, 29.0, 26.0, 51.0, 42.0, 26.0, 59.0, 26.0, 47.0, 38.0, 52.0, 39.0, 38.0, 42.0, 39.0, 29.0, 27.0, 33.0, 21.0, 26.0, 20.0, 23.0, 16.0, 6.0, 12.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01871180534362793, -0.01806020736694336, -0.01740860939025879, -0.01675701141357422, -0.01610541343688965, -0.015453815460205078, -0.014802217483520508, -0.014150619506835938, -0.013499021530151367, -0.012847423553466797, -0.012195825576782227, -0.011544227600097656, -0.010892629623413086, -0.010241031646728516, -0.009589433670043945, -0.008937835693359375, -0.008286237716674805, -0.007634639739990234, -0.006983041763305664, -0.006331443786621094, -0.0056798458099365234, -0.005028247833251953, -0.004376649856567383, -0.0037250518798828125, -0.003073453903198242, -0.002421855926513672, -0.0017702579498291016, -0.0011186599731445312, -0.00046706199645996094, 0.00018453598022460938, 0.0008361339569091797, 0.00148773193359375, 0.0021393299102783203, 0.0027909278869628906, 0.003442525863647461, 0.004094123840332031, 0.0047457218170166016, 0.005397319793701172, 0.006048917770385742, 0.0067005157470703125, 0.007352113723754883, 0.008003711700439453, 0.008655309677124023, 0.009306907653808594, 0.009958505630493164, 0.010610103607177734, 0.011261701583862305, 0.011913299560546875, 0.012564897537231445, 0.013216495513916016, 0.013868093490600586, 0.014519691467285156, 0.015171289443969727, 0.015822887420654297, 0.016474485397338867, 0.017126083374023438, 0.017777681350708008, 0.018429279327392578, 0.01908087730407715, 0.01973247528076172, 0.02038407325744629, 0.02103567123413086, 0.02168726921081543, 0.0223388671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 18.0, 39.0, 43.0, 67.0, 113.0, 194.0, 290.0, 465.0, 844.0, 1449.0, 2962.0, 6418.0, 16510.0, 52575.0, 223693.0, 505188.0, 170411.0, 42113.0, 13863.0, 5545.0, 2523.0, 1307.0, 748.0, 458.0, 272.0, 155.0, 99.0, 46.0, 42.0, 26.0, 18.0, 11.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01338958740234375, -0.012934327125549316, -0.012479066848754883, -0.01202380657196045, -0.011568546295166016, -0.011113286018371582, -0.010658025741577148, -0.010202765464782715, -0.009747505187988281, -0.009292244911193848, -0.008836984634399414, -0.00838172435760498, -0.007926464080810547, -0.007471203804016113, -0.00701594352722168, -0.006560683250427246, -0.0061054229736328125, -0.005650162696838379, -0.005194902420043945, -0.004739642143249512, -0.004284381866455078, -0.0038291215896606445, -0.003373861312866211, -0.0029186010360717773, -0.0024633407592773438, -0.00200808048248291, -0.0015528202056884766, -0.001097559928894043, -0.0006422996520996094, -0.00018703937530517578, 0.0002682209014892578, 0.0007234811782836914, 0.001178741455078125, 0.0016340017318725586, 0.002089262008666992, 0.0025445222854614258, 0.0029997825622558594, 0.003455042839050293, 0.0039103031158447266, 0.00436556339263916, 0.004820823669433594, 0.005276083946228027, 0.005731344223022461, 0.0061866044998168945, 0.006641864776611328, 0.007097125053405762, 0.007552385330200195, 0.008007645606994629, 0.008462905883789062, 0.008918166160583496, 0.00937342643737793, 0.009828686714172363, 0.010283946990966797, 0.01073920726776123, 0.011194467544555664, 0.011649727821350098, 0.012104988098144531, 0.012560248374938965, 0.013015508651733398, 0.013470768928527832, 0.013926029205322266, 0.0143812894821167, 0.014836549758911133, 0.015291810035705566, 0.0157470703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 10.0, 14.0, 8.0, 7.0, 8.0, 18.0, 30.0, 39.0, 47.0, 44.0, 62.0, 97.0, 165.0, 105.0, 69.0, 48.0, 59.0, 36.0, 22.0, 22.0, 17.0, 9.0, 8.0, 7.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.918741226196289e-05, -5.711149424314499e-05, -5.503557622432709e-05, -5.2959658205509186e-05, -5.0883740186691284e-05, -4.880782216787338e-05, -4.673190414905548e-05, -4.465598613023758e-05, -4.258006811141968e-05, -4.0504150092601776e-05, -3.8428232073783875e-05, -3.635231405496597e-05, -3.427639603614807e-05, -3.220047801733017e-05, -3.0124559998512268e-05, -2.8048641979694366e-05, -2.5972723960876465e-05, -2.3896805942058563e-05, -2.182088792324066e-05, -1.974496990442276e-05, -1.766905188560486e-05, -1.5593133866786957e-05, -1.3517215847969055e-05, -1.1441297829151154e-05, -9.365379810333252e-06, -7.28946179151535e-06, -5.213543772697449e-06, -3.137625753879547e-06, -1.0617077350616455e-06, 1.014210283756256e-06, 3.0901283025741577e-06, 5.166046321392059e-06, 7.241964340209961e-06, 9.317882359027863e-06, 1.1393800377845764e-05, 1.3469718396663666e-05, 1.5545636415481567e-05, 1.762155443429947e-05, 1.969747245311737e-05, 2.1773390471935272e-05, 2.3849308490753174e-05, 2.5925226509571075e-05, 2.8001144528388977e-05, 3.007706254720688e-05, 3.215298056602478e-05, 3.422889858484268e-05, 3.6304816603660583e-05, 3.8380734622478485e-05, 4.045665264129639e-05, 4.253257066011429e-05, 4.460848867893219e-05, 4.668440669775009e-05, 4.876032471656799e-05, 5.0836242735385895e-05, 5.2912160754203796e-05, 5.49880787730217e-05, 5.70639967918396e-05, 5.91399148106575e-05, 6.12158328294754e-05, 6.32917508482933e-05, 6.53676688671112e-05, 6.744358688592911e-05, 6.951950490474701e-05, 7.159542292356491e-05, 7.367134094238281e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 5.0, 13.0, 14.0, 13.0, 21.0, 14.0, 47.0, 64.0, 123.0, 247.0, 492.0, 1160.0, 2703.0, 8834.0, 47565.0, 463384.0, 462325.0, 47837.0, 8829.0, 2601.0, 1137.0, 563.0, 244.0, 143.0, 52.0, 30.0, 25.0, 17.0, 11.0, 9.0, 4.0, 2.0, 4.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191192626953125, -0.018436431884765625, -0.01775360107421875, -0.017070770263671875, -0.016387939453125, -0.015705108642578125, -0.01502227783203125, -0.014339447021484375, -0.0136566162109375, -0.012973785400390625, -0.01229095458984375, -0.011608123779296875, -0.01092529296875, -0.010242462158203125, -0.00955963134765625, -0.008876800537109375, -0.0081939697265625, -0.007511138916015625, -0.00682830810546875, -0.006145477294921875, -0.005462646484375, -0.004779815673828125, -0.00409698486328125, -0.003414154052734375, -0.0027313232421875, -0.002048492431640625, -0.00136566162109375, -0.000682830810546875, 0.0, 0.000682830810546875, 0.00136566162109375, 0.002048492431640625, 0.0027313232421875, 0.003414154052734375, 0.00409698486328125, 0.004779815673828125, 0.005462646484375, 0.006145477294921875, 0.00682830810546875, 0.007511138916015625, 0.0081939697265625, 0.008876800537109375, 0.00955963134765625, 0.010242462158203125, 0.01092529296875, 0.011608123779296875, 0.01229095458984375, 0.012973785400390625, 0.0136566162109375, 0.014339447021484375, 0.01502227783203125, 0.015705108642578125, 0.016387939453125, 0.017070770263671875, 0.01775360107421875, 0.018436431884765625, 0.0191192626953125, 0.019802093505859375, 0.02048492431640625, 0.021167755126953125, 0.0218505859375, 0.022533416748046875, 0.02321624755859375, 0.023899078369140625, 0.0245819091796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 5.0, 9.0, 9.0, 12.0, 18.0, 27.0, 38.0, 65.0, 63.0, 85.0, 75.0, 99.0, 102.0, 85.0, 74.0, 56.0, 31.0, 31.0, 25.0, 23.0, 15.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01430511474609375, -0.013894438743591309, -0.013483762741088867, -0.013073086738586426, -0.012662410736083984, -0.012251734733581543, -0.011841058731079102, -0.01143038272857666, -0.011019706726074219, -0.010609030723571777, -0.010198354721069336, -0.009787678718566895, -0.009377002716064453, -0.008966326713562012, -0.00855565071105957, -0.008144974708557129, -0.0077342987060546875, -0.007323622703552246, -0.006912946701049805, -0.006502270698547363, -0.006091594696044922, -0.0056809186935424805, -0.005270242691040039, -0.004859566688537598, -0.004448890686035156, -0.004038214683532715, -0.0036275386810302734, -0.003216862678527832, -0.0028061866760253906, -0.0023955106735229492, -0.001984834671020508, -0.0015741586685180664, -0.001163482666015625, -0.0007528066635131836, -0.0003421306610107422, 6.854534149169922e-05, 0.0004792213439941406, 0.000889897346496582, 0.0013005733489990234, 0.0017112493515014648, 0.0021219253540039062, 0.0025326013565063477, 0.002943277359008789, 0.0033539533615112305, 0.003764629364013672, 0.004175305366516113, 0.004585981369018555, 0.004996657371520996, 0.0054073333740234375, 0.005818009376525879, 0.00622868537902832, 0.006639361381530762, 0.007050037384033203, 0.0074607133865356445, 0.007871389389038086, 0.008282065391540527, 0.008692741394042969, 0.00910341739654541, 0.009514093399047852, 0.009924769401550293, 0.010335445404052734, 0.010746121406555176, 0.011156797409057617, 0.011567473411560059, 0.0119781494140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 142.0, 621.0, 223.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0956953763961792, -1.076025128364563, -1.0563548803329468, -1.0366846323013306, -1.0170142650604248, -0.9973440170288086, -0.9776737689971924, -0.9580035209655762, -0.93833327293396, -0.9186630249023438, -0.8989927172660828, -0.8793224692344666, -0.8596522212028503, -0.8399819135665894, -0.8203116655349731, -0.8006414175033569, -0.780971109867096, -0.7613008618354797, -0.7416305541992188, -0.7219603061676025, -0.7022900581359863, -0.6826198101043701, -0.6629495024681091, -0.6432792544364929, -0.6236089468002319, -0.6039386987686157, -0.5842683911323547, -0.5645981431007385, -0.5449278950691223, -0.5252575874328613, -0.5055873394012451, -0.4859170913696289, -0.4662468135356903, -0.4465765357017517, -0.4269062876701355, -0.4072360098361969, -0.3875657320022583, -0.3678954839706421, -0.3482252061367035, -0.3285549283027649, -0.3088846802711487, -0.2892144024372101, -0.26954415440559387, -0.24987387657165527, -0.23020361363887787, -0.21053335070610046, -0.19086307287216187, -0.17119280993938446, -0.15152254700660706, -0.13185228407382965, -0.11218201369047165, -0.09251174330711365, -0.07284148037433624, -0.05317121744155884, -0.033500947058200836, -0.013830676674842834, 0.00583958625793457, 0.025509852916002274, 0.04518011957406998, 0.06485038995742798, 0.08452065289020538, 0.10419091582298279, 0.12386118620634079, 0.1435314565896988, 0.1632017195224762]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 13.0, 18.0, 13.0, 28.0, 38.0, 38.0, 46.0, 57.0, 45.0, 50.0, 55.0, 63.0, 65.0, 67.0, 59.0, 57.0, 42.0, 47.0, 43.0, 37.0, 27.0, 17.0, 20.0, 11.0, 10.0, 7.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.11531573534011841, -0.11205366253852844, -0.10879159718751907, -0.1055295318365097, -0.10226745903491974, -0.09900538623332977, -0.0957433208823204, -0.09248125553131104, -0.08921918272972107, -0.0859571099281311, -0.08269504457712173, -0.07943297922611237, -0.0761709064245224, -0.07290883362293243, -0.06964676827192307, -0.0663847029209137, -0.06312263011932373, -0.05986056104302406, -0.056598491966724396, -0.05333642289042473, -0.05007435381412506, -0.046812284737825394, -0.043550215661525726, -0.04028814658522606, -0.03702607750892639, -0.033764008432626724, -0.030501939356327057, -0.02723987028002739, -0.023977801203727722, -0.020715732127428055, -0.017453663051128387, -0.01419159397482872, -0.010929524898529053, -0.007667455822229385, -0.004405386745929718, -0.0011433176696300507, 0.0021187514066696167, 0.005380820482969284, 0.008642889559268951, 0.011904958635568619, 0.015167027711868286, 0.018429096788167953, 0.02169116586446762, 0.024953234940767288, 0.028215304017066956, 0.03147737309336662, 0.03473944216966629, 0.03800151124596596, 0.041263580322265625, 0.04452564939856529, 0.04778771847486496, 0.05104978755116463, 0.054311856627464294, 0.05757392570376396, 0.06083599478006363, 0.064098060131073, 0.06736013293266296, 0.07062220573425293, 0.0738842710852623, 0.07714633643627167, 0.08040840923786163, 0.0836704820394516, 0.08693254739046097, 0.09019461274147034, 0.0934566855430603]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 13.0, 16.0, 17.0, 50.0, 64.0, 141.0, 204.0, 378.0, 786.0, 1750.0, 6308.0, 84020.0, 4023336.0, 66988.0, 7225.0, 1803.0, 597.0, 261.0, 110.0, 66.0, 51.0, 27.0, 14.0, 10.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07012939453125, -0.06796932220458984, -0.06580924987792969, -0.06364917755126953, -0.061489105224609375, -0.05932903289794922, -0.05716896057128906, -0.055008888244628906, -0.05284881591796875, -0.050688743591308594, -0.04852867126464844, -0.04636859893798828, -0.044208526611328125, -0.04204845428466797, -0.03988838195800781, -0.037728309631347656, -0.0355682373046875, -0.033408164978027344, -0.031248092651367188, -0.02908802032470703, -0.026927947998046875, -0.02476787567138672, -0.022607803344726562, -0.020447731018066406, -0.01828765869140625, -0.016127586364746094, -0.013967514038085938, -0.011807441711425781, -0.009647369384765625, -0.007487297058105469, -0.0053272247314453125, -0.0031671524047851562, -0.001007080078125, 0.0011529922485351562, 0.0033130645751953125, 0.005473136901855469, 0.007633209228515625, 0.009793281555175781, 0.011953353881835938, 0.014113426208496094, 0.01627349853515625, 0.018433570861816406, 0.020593643188476562, 0.02275371551513672, 0.024913787841796875, 0.02707386016845703, 0.029233932495117188, 0.031394004821777344, 0.0335540771484375, 0.035714149475097656, 0.03787422180175781, 0.04003429412841797, 0.042194366455078125, 0.04435443878173828, 0.04651451110839844, 0.048674583435058594, 0.05083465576171875, 0.052994728088378906, 0.05515480041503906, 0.05731487274169922, 0.059474945068359375, 0.06163501739501953, 0.06379508972167969, 0.06595516204833984, 0.068115234375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 19.0, 44.0, 123.0, 230.0, 277.0, 200.0, 74.0, 19.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042510986328125, -0.04142618179321289, -0.04034137725830078, -0.03925657272338867, -0.03817176818847656, -0.03708696365356445, -0.036002159118652344, -0.034917354583740234, -0.033832550048828125, -0.032747745513916016, -0.031662940979003906, -0.030578136444091797, -0.029493331909179688, -0.028408527374267578, -0.02732372283935547, -0.02623891830444336, -0.02515411376953125, -0.02406930923461914, -0.02298450469970703, -0.021899700164794922, -0.020814895629882812, -0.019730091094970703, -0.018645286560058594, -0.017560482025146484, -0.016475677490234375, -0.015390872955322266, -0.014306068420410156, -0.013221263885498047, -0.012136459350585938, -0.011051654815673828, -0.009966850280761719, -0.00888204574584961, -0.0077972412109375, -0.006712436676025391, -0.005627632141113281, -0.004542827606201172, -0.0034580230712890625, -0.002373218536376953, -0.0012884140014648438, -0.00020360946655273438, 0.000881195068359375, 0.0019659996032714844, 0.0030508041381835938, 0.004135608673095703, 0.0052204132080078125, 0.006305217742919922, 0.007390022277832031, 0.00847482681274414, 0.00955963134765625, 0.01064443588256836, 0.011729240417480469, 0.012814044952392578, 0.013898849487304688, 0.014983654022216797, 0.016068458557128906, 0.017153263092041016, 0.018238067626953125, 0.019322872161865234, 0.020407676696777344, 0.021492481231689453, 0.022577285766601562, 0.023662090301513672, 0.02474689483642578, 0.02583169937133789, 0.02691650390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 5.0, 10.0, 11.0, 14.0, 20.0, 23.0, 18.0, 41.0, 47.0, 57.0, 90.0, 119.0, 177.0, 425.0, 1060.0, 3965.0, 37258.0, 2053402.0, 2054234.0, 37053.0, 4092.0, 1066.0, 387.0, 222.0, 139.0, 101.0, 65.0, 46.0, 31.0, 24.0, 23.0, 8.0, 8.0, 8.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04522705078125, -0.04381370544433594, -0.042400360107421875, -0.04098701477050781, -0.03957366943359375, -0.03816032409667969, -0.036746978759765625, -0.03533363342285156, -0.0339202880859375, -0.03250694274902344, -0.031093597412109375, -0.029680252075195312, -0.02826690673828125, -0.026853561401367188, -0.025440216064453125, -0.024026870727539062, -0.022613525390625, -0.021200180053710938, -0.019786834716796875, -0.018373489379882812, -0.01696014404296875, -0.015546798706054688, -0.014133453369140625, -0.012720108032226562, -0.0113067626953125, -0.009893417358398438, -0.008480072021484375, -0.0070667266845703125, -0.00565338134765625, -0.0042400360107421875, -0.002826690673828125, -0.0014133453369140625, 0.0, 0.0014133453369140625, 0.002826690673828125, 0.0042400360107421875, 0.00565338134765625, 0.0070667266845703125, 0.008480072021484375, 0.009893417358398438, 0.0113067626953125, 0.012720108032226562, 0.014133453369140625, 0.015546798706054688, 0.01696014404296875, 0.018373489379882812, 0.019786834716796875, 0.021200180053710938, 0.022613525390625, 0.024026870727539062, 0.025440216064453125, 0.026853561401367188, 0.02826690673828125, 0.029680252075195312, 0.031093597412109375, 0.03250694274902344, 0.0339202880859375, 0.03533363342285156, 0.036746978759765625, 0.03816032409667969, 0.03957366943359375, 0.04098701477050781, 0.042400360107421875, 0.04381370544433594, 0.04522705078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 18.0, 14.0, 21.0, 29.0, 35.0, 51.0, 61.0, 107.0, 86.0, 169.0, 224.0, 258.0, 399.0, 524.0, 531.0, 414.0, 280.0, 200.0, 153.0, 124.0, 96.0, 46.0, 41.0, 39.0, 22.0, 13.0, 23.0, 17.0, 19.0, 13.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01287078857421875, -0.01244211196899414, -0.012013435363769531, -0.011584758758544922, -0.011156082153320312, -0.010727405548095703, -0.010298728942871094, -0.009870052337646484, -0.009441375732421875, -0.009012699127197266, -0.008584022521972656, -0.008155345916748047, -0.0077266693115234375, -0.007297992706298828, -0.006869316101074219, -0.006440639495849609, -0.006011962890625, -0.005583286285400391, -0.005154609680175781, -0.004725933074951172, -0.0042972564697265625, -0.003868579864501953, -0.0034399032592773438, -0.0030112266540527344, -0.002582550048828125, -0.0021538734436035156, -0.0017251968383789062, -0.0012965202331542969, -0.0008678436279296875, -0.0004391670227050781, -1.049041748046875e-05, 0.0004181861877441406, 0.00084686279296875, 0.0012755393981933594, 0.0017042160034179688, 0.002132892608642578, 0.0025615692138671875, 0.002990245819091797, 0.0034189224243164062, 0.0038475990295410156, 0.004276275634765625, 0.004704952239990234, 0.005133628845214844, 0.005562305450439453, 0.0059909820556640625, 0.006419658660888672, 0.006848335266113281, 0.007277011871337891, 0.0077056884765625, 0.00813436508178711, 0.008563041687011719, 0.008991718292236328, 0.009420394897460938, 0.009849071502685547, 0.010277748107910156, 0.010706424713134766, 0.011135101318359375, 0.011563777923583984, 0.011992454528808594, 0.012421131134033203, 0.012849807739257812, 0.013278484344482422, 0.013707160949707031, 0.01413583755493164, 0.01456451416015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 20.0, 43.0, 144.0, 259.0, 278.0, 153.0, 68.0, 20.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2224159985780716, -0.21640627086162567, -0.21039652824401855, -0.20438680052757263, -0.1983770728111267, -0.1923673450946808, -0.18635761737823486, -0.18034787476062775, -0.17433814704418182, -0.1683284193277359, -0.16231867671012878, -0.15630894899368286, -0.15029922127723694, -0.14428949356079102, -0.1382797658443451, -0.13227002322673798, -0.12626029551029205, -0.12025056779384613, -0.11424083262681961, -0.10823109745979309, -0.10222136974334717, -0.09621164202690125, -0.09020190685987473, -0.0841921716928482, -0.07818244397640228, -0.07217271625995636, -0.06616298109292984, -0.06015324965119362, -0.0541435182094574, -0.048133786767721176, -0.042124055325984955, -0.036114323884248734, -0.030104592442512512, -0.02409486100077629, -0.01808512955904007, -0.012075398117303848, -0.006065666675567627, -5.593523383140564e-05, 0.005953796207904816, 0.011963527649641037, 0.01797325909137726, 0.02398299053311348, 0.0299927219748497, 0.03600245341658592, 0.042012184858322144, 0.048021916300058365, 0.054031647741794586, 0.06004137918353081, 0.06605111062526703, 0.07206083834171295, 0.07807057350873947, 0.08408030867576599, 0.09009003639221191, 0.09609976410865784, 0.10210949927568436, 0.10811923444271088, 0.1141289621591568, 0.12013868987560272, 0.12614843249320984, 0.13215816020965576, 0.13816788792610168, 0.1441776156425476, 0.15018734335899353, 0.15619708597660065, 0.16220681369304657]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 8.0, 10.0, 14.0, 15.0, 19.0, 20.0, 22.0, 38.0, 48.0, 38.0, 52.0, 39.0, 50.0, 68.0, 37.0, 53.0, 55.0, 37.0, 51.0, 45.0, 41.0, 43.0, 48.0, 32.0, 20.0, 17.0, 22.0, 18.0, 5.0, 9.0, 2.0, 9.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053300559520721436, -0.05148433521389961, -0.04966811090707779, -0.047851886600255966, -0.04603566229343414, -0.04421943798661232, -0.0424032136797905, -0.040586989372968674, -0.03877076506614685, -0.03695454075932503, -0.035138316452503204, -0.03332209214568138, -0.03150586783885956, -0.029689643532037735, -0.027873419225215912, -0.02605719491839409, -0.024240970611572266, -0.022424746304750443, -0.02060852199792862, -0.018792297691106796, -0.016976073384284973, -0.01515984907746315, -0.013343624770641327, -0.011527400463819504, -0.00971117615699768, -0.007894951850175858, -0.006078727543354034, -0.004262503236532211, -0.002446278929710388, -0.0006300546228885651, 0.001186169683933258, 0.003002393990755081, 0.004818618297576904, 0.006634842604398727, 0.00845106691122055, 0.010267291218042374, 0.012083515524864197, 0.01389973983168602, 0.015715964138507843, 0.017532188445329666, 0.01934841275215149, 0.021164637058973312, 0.022980861365795135, 0.02479708567261696, 0.026613309979438782, 0.028429534286260605, 0.030245758593082428, 0.03206198289990425, 0.033878207206726074, 0.0356944315135479, 0.03751065582036972, 0.039326880127191544, 0.04114310443401337, 0.04295932874083519, 0.04477555304765701, 0.046591777354478836, 0.04840800166130066, 0.05022422596812248, 0.052040450274944305, 0.05385667458176613, 0.05567289888858795, 0.057489123195409775, 0.0593053475022316, 0.06112157180905342, 0.06293779611587524]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 9.0, 13.0, 21.0, 24.0, 25.0, 33.0, 55.0, 82.0, 103.0, 142.0, 194.0, 366.0, 557.0, 820.0, 1742.0, 5749.0, 86109.0, 862436.0, 80523.0, 5358.0, 1690.0, 833.0, 531.0, 315.0, 256.0, 171.0, 97.0, 88.0, 53.0, 37.0, 33.0, 22.0, 20.0, 10.0, 5.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.09458065032958984, -0.09126091003417969, -0.08794116973876953, -0.08462142944335938, -0.08130168914794922, -0.07798194885253906, -0.0746622085571289, -0.07134246826171875, -0.0680227279663086, -0.06470298767089844, -0.06138324737548828, -0.058063507080078125, -0.05474376678466797, -0.05142402648925781, -0.048104286193847656, -0.0447845458984375, -0.041464805603027344, -0.03814506530761719, -0.03482532501220703, -0.031505584716796875, -0.02818584442138672, -0.024866104125976562, -0.021546363830566406, -0.01822662353515625, -0.014906883239746094, -0.011587142944335938, -0.008267402648925781, -0.004947662353515625, -0.0016279220581054688, 0.0016918182373046875, 0.005011558532714844, 0.008331298828125, 0.011651039123535156, 0.014970779418945312, 0.01829051971435547, 0.021610260009765625, 0.02493000030517578, 0.028249740600585938, 0.031569480895996094, 0.03488922119140625, 0.038208961486816406, 0.04152870178222656, 0.04484844207763672, 0.048168182373046875, 0.05148792266845703, 0.05480766296386719, 0.058127403259277344, 0.0614471435546875, 0.06476688385009766, 0.06808662414550781, 0.07140636444091797, 0.07472610473632812, 0.07804584503173828, 0.08136558532714844, 0.0846853256225586, 0.08800506591796875, 0.0913248062133789, 0.09464454650878906, 0.09796428680419922, 0.10128402709960938, 0.10460376739501953, 0.10792350769042969, 0.11124324798583984, 0.11456298828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 16.0, 48.0, 114.0, 215.0, 282.0, 216.0, 78.0, 17.0, 5.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.0413060188293457, -0.040253639221191406, -0.03920125961303711, -0.03814888000488281, -0.037096500396728516, -0.03604412078857422, -0.03499174118041992, -0.033939361572265625, -0.03288698196411133, -0.03183460235595703, -0.030782222747802734, -0.029729843139648438, -0.02867746353149414, -0.027625083923339844, -0.026572704315185547, -0.02552032470703125, -0.024467945098876953, -0.023415565490722656, -0.02236318588256836, -0.021310806274414062, -0.020258426666259766, -0.01920604705810547, -0.018153667449951172, -0.017101287841796875, -0.016048908233642578, -0.014996528625488281, -0.013944149017333984, -0.012891769409179688, -0.01183938980102539, -0.010787010192871094, -0.009734630584716797, -0.0086822509765625, -0.007629871368408203, -0.006577491760253906, -0.005525112152099609, -0.0044727325439453125, -0.0034203529357910156, -0.0023679733276367188, -0.0013155937194824219, -0.000263214111328125, 0.0007891654968261719, 0.0018415451049804688, 0.0028939247131347656, 0.0039463043212890625, 0.004998683929443359, 0.006051063537597656, 0.007103443145751953, 0.00815582275390625, 0.009208202362060547, 0.010260581970214844, 0.01131296157836914, 0.012365341186523438, 0.013417720794677734, 0.014470100402832031, 0.015522480010986328, 0.016574859619140625, 0.017627239227294922, 0.01867961883544922, 0.019731998443603516, 0.020784378051757812, 0.02183675765991211, 0.022889137268066406, 0.023941516876220703, 0.024993896484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 12.0, 5.0, 11.0, 19.0, 39.0, 46.0, 41.0, 67.0, 109.0, 142.0, 226.0, 300.0, 424.0, 690.0, 1186.0, 2467.0, 7682.0, 32020.0, 169057.0, 520476.0, 248107.0, 48141.0, 10297.0, 3137.0, 1431.0, 771.0, 490.0, 363.0, 232.0, 163.0, 104.0, 72.0, 66.0, 39.0, 43.0, 13.0, 12.0, 11.0, 7.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0477294921875, -0.04638957977294922, -0.04504966735839844, -0.043709754943847656, -0.042369842529296875, -0.041029930114746094, -0.03969001770019531, -0.03835010528564453, -0.03701019287109375, -0.03567028045654297, -0.03433036804199219, -0.032990455627441406, -0.031650543212890625, -0.030310630798339844, -0.028970718383789062, -0.02763080596923828, -0.0262908935546875, -0.02495098114013672, -0.023611068725585938, -0.022271156311035156, -0.020931243896484375, -0.019591331481933594, -0.018251419067382812, -0.01691150665283203, -0.01557159423828125, -0.014231681823730469, -0.012891769409179688, -0.011551856994628906, -0.010211944580078125, -0.008872032165527344, -0.0075321197509765625, -0.006192207336425781, -0.004852294921875, -0.0035123825073242188, -0.0021724700927734375, -0.0008325576782226562, 0.000507354736328125, 0.0018472671508789062, 0.0031871795654296875, 0.004527091979980469, 0.00586700439453125, 0.007206916809082031, 0.008546829223632812, 0.009886741638183594, 0.011226654052734375, 0.012566566467285156, 0.013906478881835938, 0.015246391296386719, 0.0165863037109375, 0.01792621612548828, 0.019266128540039062, 0.020606040954589844, 0.021945953369140625, 0.023285865783691406, 0.024625778198242188, 0.02596569061279297, 0.02730560302734375, 0.02864551544189453, 0.029985427856445312, 0.031325340270996094, 0.032665252685546875, 0.034005165100097656, 0.03534507751464844, 0.03668498992919922, 0.03802490234375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 6.0, 8.0, 13.0, 11.0, 9.0, 17.0, 23.0, 19.0, 29.0, 24.0, 30.0, 27.0, 36.0, 47.0, 47.0, 39.0, 55.0, 53.0, 47.0, 40.0, 48.0, 41.0, 39.0, 46.0, 36.0, 38.0, 27.0, 22.0, 17.0, 20.0, 14.0, 13.0, 13.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0247650146484375, -0.024018049240112305, -0.02327108383178711, -0.022524118423461914, -0.02177715301513672, -0.021030187606811523, -0.020283222198486328, -0.019536256790161133, -0.018789291381835938, -0.018042325973510742, -0.017295360565185547, -0.01654839515686035, -0.015801429748535156, -0.015054464340209961, -0.014307498931884766, -0.01356053352355957, -0.012813568115234375, -0.01206660270690918, -0.011319637298583984, -0.010572671890258789, -0.009825706481933594, -0.009078741073608398, -0.008331775665283203, -0.007584810256958008, -0.0068378448486328125, -0.006090879440307617, -0.005343914031982422, -0.0045969486236572266, -0.0038499832153320312, -0.003103017807006836, -0.0023560523986816406, -0.0016090869903564453, -0.00086212158203125, -0.00011515617370605469, 0.0006318092346191406, 0.001378774642944336, 0.0021257400512695312, 0.0028727054595947266, 0.003619670867919922, 0.004366636276245117, 0.0051136016845703125, 0.005860567092895508, 0.006607532501220703, 0.0073544979095458984, 0.008101463317871094, 0.008848428726196289, 0.009595394134521484, 0.01034235954284668, 0.011089324951171875, 0.01183629035949707, 0.012583255767822266, 0.013330221176147461, 0.014077186584472656, 0.014824151992797852, 0.015571117401123047, 0.016318082809448242, 0.017065048217773438, 0.017812013626098633, 0.018558979034423828, 0.019305944442749023, 0.02005290985107422, 0.020799875259399414, 0.02154684066772461, 0.022293806076049805, 0.023040771484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 9.0, 3.0, 6.0, 10.0, 16.0, 10.0, 25.0, 26.0, 44.0, 85.0, 109.0, 249.0, 427.0, 797.0, 1740.0, 3845.0, 9797.0, 27139.0, 93771.0, 456774.0, 346049.0, 71314.0, 21854.0, 8074.0, 3290.0, 1438.0, 712.0, 370.0, 203.0, 120.0, 89.0, 42.0, 33.0, 27.0, 17.0, 8.0, 14.0, 4.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018157958984375, -0.01755070686340332, -0.01694345474243164, -0.01633620262145996, -0.01572895050048828, -0.015121698379516602, -0.014514446258544922, -0.013907194137573242, -0.013299942016601562, -0.012692689895629883, -0.012085437774658203, -0.011478185653686523, -0.010870933532714844, -0.010263681411743164, -0.009656429290771484, -0.009049177169799805, -0.008441925048828125, -0.007834672927856445, -0.007227420806884766, -0.006620168685913086, -0.006012916564941406, -0.0054056644439697266, -0.004798412322998047, -0.004191160202026367, -0.0035839080810546875, -0.002976655960083008, -0.002369403839111328, -0.0017621517181396484, -0.0011548995971679688, -0.0005476474761962891, 5.9604644775390625e-05, 0.0006668567657470703, 0.00127410888671875, 0.0018813610076904297, 0.0024886131286621094, 0.003095865249633789, 0.0037031173706054688, 0.0043103694915771484, 0.004917621612548828, 0.005524873733520508, 0.0061321258544921875, 0.006739377975463867, 0.007346630096435547, 0.007953882217407227, 0.008561134338378906, 0.009168386459350586, 0.009775638580322266, 0.010382890701293945, 0.010990142822265625, 0.011597394943237305, 0.012204647064208984, 0.012811899185180664, 0.013419151306152344, 0.014026403427124023, 0.014633655548095703, 0.015240907669067383, 0.015848159790039062, 0.016455411911010742, 0.017062664031982422, 0.0176699161529541, 0.01827716827392578, 0.01888442039489746, 0.01949167251586914, 0.02009892463684082, 0.0207061767578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 11.0, 2.0, 8.0, 18.0, 27.0, 27.0, 72.0, 96.0, 149.0, 218.0, 153.0, 83.0, 47.0, 37.0, 11.0, 14.0, 9.0, 9.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.840726852416992e-05, -9.438116103410721e-05, -9.03550535440445e-05, -8.632894605398178e-05, -8.230283856391907e-05, -7.827673107385635e-05, -7.425062358379364e-05, -7.022451609373093e-05, -6.619840860366821e-05, -6.21723011136055e-05, -5.8146193623542786e-05, -5.412008613348007e-05, -5.009397864341736e-05, -4.6067871153354645e-05, -4.204176366329193e-05, -3.801565617322922e-05, -3.3989548683166504e-05, -2.996344119310379e-05, -2.5937333703041077e-05, -2.1911226212978363e-05, -1.788511872291565e-05, -1.3859011232852936e-05, -9.832903742790222e-06, -5.8067962527275085e-06, -1.780688762664795e-06, 2.2454187273979187e-06, 6.271526217460632e-06, 1.0297633707523346e-05, 1.432374119758606e-05, 1.8349848687648773e-05, 2.2375956177711487e-05, 2.64020636677742e-05, 3.0428171157836914e-05, 3.445427864789963e-05, 3.848038613796234e-05, 4.2506493628025055e-05, 4.653260111808777e-05, 5.055870860815048e-05, 5.4584816098213196e-05, 5.861092358827591e-05, 6.263703107833862e-05, 6.666313856840134e-05, 7.068924605846405e-05, 7.471535354852676e-05, 7.874146103858948e-05, 8.276756852865219e-05, 8.67936760187149e-05, 9.081978350877762e-05, 9.484589099884033e-05, 9.887199848890305e-05, 0.00010289810597896576, 0.00010692421346902847, 0.00011095032095909119, 0.0001149764284491539, 0.00011900253593921661, 0.00012302864342927933, 0.00012705475091934204, 0.00013108085840940475, 0.00013510696589946747, 0.00013913307338953018, 0.0001431591808795929, 0.0001471852883696556, 0.00015121139585971832, 0.00015523750334978104, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 11.0, 5.0, 15.0, 22.0, 32.0, 66.0, 82.0, 152.0, 339.0, 843.0, 3092.0, 21425.0, 588687.0, 412862.0, 16884.0, 2614.0, 736.0, 306.0, 144.0, 81.0, 44.0, 38.0, 27.0, 11.0, 11.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03468179702758789, -0.03329181671142578, -0.03190183639526367, -0.030511856079101562, -0.029121875762939453, -0.027731895446777344, -0.026341915130615234, -0.024951934814453125, -0.023561954498291016, -0.022171974182128906, -0.020781993865966797, -0.019392013549804688, -0.018002033233642578, -0.01661205291748047, -0.01522207260131836, -0.01383209228515625, -0.01244211196899414, -0.011052131652832031, -0.009662151336669922, -0.008272171020507812, -0.006882190704345703, -0.005492210388183594, -0.004102230072021484, -0.002712249755859375, -0.0013222694396972656, 6.771087646484375e-05, 0.0014576911926269531, 0.0028476715087890625, 0.004237651824951172, 0.005627632141113281, 0.007017612457275391, 0.0084075927734375, 0.00979757308959961, 0.011187553405761719, 0.012577533721923828, 0.013967514038085938, 0.015357494354248047, 0.016747474670410156, 0.018137454986572266, 0.019527435302734375, 0.020917415618896484, 0.022307395935058594, 0.023697376251220703, 0.025087356567382812, 0.026477336883544922, 0.02786731719970703, 0.02925729751586914, 0.03064727783203125, 0.03203725814819336, 0.03342723846435547, 0.03481721878051758, 0.03620719909667969, 0.0375971794128418, 0.038987159729003906, 0.040377140045166016, 0.041767120361328125, 0.043157100677490234, 0.044547080993652344, 0.04593706130981445, 0.04732704162597656, 0.04871702194213867, 0.05010700225830078, 0.05149698257446289, 0.052886962890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 8.0, 7.0, 13.0, 12.0, 27.0, 38.0, 44.0, 76.0, 97.0, 99.0, 142.0, 100.0, 76.0, 63.0, 49.0, 37.0, 14.0, 16.0, 11.0, 8.0, 5.0, 5.0, 2.0, 8.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015839576721191406, -0.015352249145507812, -0.014864921569824219, -0.014377593994140625, -0.013890266418457031, -0.013402938842773438, -0.012915611267089844, -0.01242828369140625, -0.011940956115722656, -0.011453628540039062, -0.010966300964355469, -0.010478973388671875, -0.009991645812988281, -0.009504318237304688, -0.009016990661621094, -0.0085296630859375, -0.008042335510253906, -0.0075550079345703125, -0.007067680358886719, -0.006580352783203125, -0.006093025207519531, -0.0056056976318359375, -0.005118370056152344, -0.00463104248046875, -0.004143714904785156, -0.0036563873291015625, -0.0031690597534179688, -0.002681732177734375, -0.0021944046020507812, -0.0017070770263671875, -0.0012197494506835938, -0.000732421875, -0.00024509429931640625, 0.0002422332763671875, 0.0007295608520507812, 0.001216888427734375, 0.0017042160034179688, 0.0021915435791015625, 0.0026788711547851562, 0.00316619873046875, 0.0036535263061523438, 0.0041408538818359375, 0.004628181457519531, 0.005115509033203125, 0.005602836608886719, 0.0060901641845703125, 0.006577491760253906, 0.0070648193359375, 0.007552146911621094, 0.008039474487304688, 0.008526802062988281, 0.009014129638671875, 0.009501457214355469, 0.009988784790039062, 0.010476112365722656, 0.01096343994140625, 0.011450767517089844, 0.011938095092773438, 0.012425422668457031, 0.012912750244140625, 0.013400077819824219, 0.013887405395507812, 0.014374732971191406, 0.014862060546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 50.0, 207.0, 470.0, 215.0, 37.0, 14.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5916694402694702, -0.5754954814910889, -0.5593215823173523, -0.543147623538971, -0.5269736647605896, -0.510799765586853, -0.4946258068084717, -0.4784518778324127, -0.46227794885635376, -0.4461040198802948, -0.42993006110191345, -0.4137561321258545, -0.39758220314979553, -0.3814082741737366, -0.3652343153953552, -0.34906038641929626, -0.3328864276409149, -0.31671249866485596, -0.3005385398864746, -0.28436461091041565, -0.2681906819343567, -0.25201672315597534, -0.23584279417991638, -0.21966886520385742, -0.20349492132663727, -0.18732097744941711, -0.17114704847335815, -0.154973104596138, -0.13879916071891785, -0.12262523174285889, -0.10645128786563873, -0.09027735143899918, -0.07410341501235962, -0.05792947858572006, -0.04175553843379021, -0.02558159828186035, -0.009407661855220795, 0.006766274571418762, 0.022940218448638916, 0.03911415487527847, 0.05528809130191803, 0.07146202772855759, 0.08763596415519714, 0.1038099080324173, 0.11998384445905685, 0.1361577808856964, 0.15233172476291656, 0.16850566864013672, 0.18467959761619568, 0.20085354149341583, 0.2170274704694748, 0.23320141434669495, 0.2493753433227539, 0.26554930210113525, 0.2817232310771942, 0.2978971600532532, 0.3140711188316345, 0.3302450478076935, 0.34641900658607483, 0.3625929355621338, 0.37876686453819275, 0.3949407935142517, 0.41111475229263306, 0.427288681268692, 0.443462610244751]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 14.0, 14.0, 31.0, 33.0, 44.0, 58.0, 58.0, 68.0, 73.0, 79.0, 104.0, 94.0, 73.0, 53.0, 61.0, 44.0, 41.0, 18.0, 14.0, 16.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18112850189208984, -0.17565332353115082, -0.17017816007137299, -0.16470298171043396, -0.15922781825065613, -0.1537526398897171, -0.14827746152877808, -0.14280229806900024, -0.1373271346092224, -0.1318519562482834, -0.12637679278850555, -0.12090161442756653, -0.1154264509677887, -0.10995127260684967, -0.10447610169649124, -0.09900093078613281, -0.09352575242519379, -0.08805058151483536, -0.08257541060447693, -0.0771002322435379, -0.07162506878376007, -0.06614989042282104, -0.060674719512462616, -0.05519954860210419, -0.04972437769174576, -0.04424920678138733, -0.0387740358710289, -0.03329886123538017, -0.027823690325021744, -0.022348519414663315, -0.016873344779014587, -0.011398173868656158, -0.0059230029582977295, -0.0004478311166167259, 0.005027340725064278, 0.010502513498067856, 0.015977684408426285, 0.021452855318784714, 0.02692802995443344, 0.03240320086479187, 0.0378783717751503, 0.04335354268550873, 0.04882871359586716, 0.054303888231515884, 0.05977905914187431, 0.06525422632694244, 0.07072940468788147, 0.0762045755982399, 0.08167974650859833, 0.08715491741895676, 0.09263008832931519, 0.09810526669025421, 0.10358043015003204, 0.10905560851097107, 0.1145307794213295, 0.12000595033168793, 0.12548112869262695, 0.13095630705356598, 0.1364314705133438, 0.14190664887428284, 0.14738181233406067, 0.1528569906949997, 0.15833216905593872, 0.16380733251571655, 0.16928249597549438]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 3.0, 9.0, 9.0, 13.0, 20.0, 29.0, 26.0, 42.0, 79.0, 111.0, 159.0, 245.0, 420.0, 751.0, 1811.0, 5292.0, 29911.0, 2134991.0, 1977712.0, 31248.0, 6789.0, 2629.0, 1100.0, 391.0, 188.0, 106.0, 61.0, 39.0, 33.0, 11.0, 6.0, 15.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.050445556640625, -0.049044132232666016, -0.04764270782470703, -0.04624128341674805, -0.04483985900878906, -0.04343843460083008, -0.042037010192871094, -0.04063558578491211, -0.039234161376953125, -0.03783273696899414, -0.036431312561035156, -0.03502988815307617, -0.03362846374511719, -0.0322270393371582, -0.03082561492919922, -0.029424190521240234, -0.02802276611328125, -0.026621341705322266, -0.02521991729736328, -0.023818492889404297, -0.022417068481445312, -0.021015644073486328, -0.019614219665527344, -0.01821279525756836, -0.016811370849609375, -0.01540994644165039, -0.014008522033691406, -0.012607097625732422, -0.011205673217773438, -0.009804248809814453, -0.008402824401855469, -0.007001399993896484, -0.0055999755859375, -0.004198551177978516, -0.0027971267700195312, -0.0013957023620605469, 5.7220458984375e-06, 0.0014071464538574219, 0.0028085708618164062, 0.004209995269775391, 0.005611419677734375, 0.007012844085693359, 0.008414268493652344, 0.009815692901611328, 0.011217117309570312, 0.012618541717529297, 0.014019966125488281, 0.015421390533447266, 0.01682281494140625, 0.018224239349365234, 0.01962566375732422, 0.021027088165283203, 0.022428512573242188, 0.023829936981201172, 0.025231361389160156, 0.02663278579711914, 0.028034210205078125, 0.02943563461303711, 0.030837059020996094, 0.03223848342895508, 0.03363990783691406, 0.03504133224487305, 0.03644275665283203, 0.037844181060791016, 0.03924560546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 32.0, 80.0, 184.0, 252.0, 246.0, 130.0, 46.0, 13.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043701171875, -0.0425717830657959, -0.0414423942565918, -0.040313005447387695, -0.039183616638183594, -0.03805422782897949, -0.03692483901977539, -0.03579545021057129, -0.03466606140136719, -0.033536672592163086, -0.032407283782958984, -0.03127789497375488, -0.03014850616455078, -0.02901911735534668, -0.027889728546142578, -0.026760339736938477, -0.025630950927734375, -0.024501562118530273, -0.023372173309326172, -0.02224278450012207, -0.02111339569091797, -0.019984006881713867, -0.018854618072509766, -0.017725229263305664, -0.016595840454101562, -0.015466451644897461, -0.01433706283569336, -0.013207674026489258, -0.012078285217285156, -0.010948896408081055, -0.009819507598876953, -0.008690118789672852, -0.00756072998046875, -0.0064313411712646484, -0.005301952362060547, -0.004172563552856445, -0.0030431747436523438, -0.0019137859344482422, -0.0007843971252441406, 0.00034499168395996094, 0.0014743804931640625, 0.002603769302368164, 0.0037331581115722656, 0.004862546920776367, 0.005991935729980469, 0.00712132453918457, 0.008250713348388672, 0.009380102157592773, 0.010509490966796875, 0.011638879776000977, 0.012768268585205078, 0.01389765739440918, 0.015027046203613281, 0.016156435012817383, 0.017285823822021484, 0.018415212631225586, 0.019544601440429688, 0.02067399024963379, 0.02180337905883789, 0.022932767868041992, 0.024062156677246094, 0.025191545486450195, 0.026320934295654297, 0.0274503231048584, 0.0285797119140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 13.0, 22.0, 15.0, 26.0, 40.0, 67.0, 76.0, 136.0, 278.0, 605.0, 1690.0, 7210.0, 61812.0, 2736355.0, 1334571.0, 43069.0, 5805.0, 1420.0, 493.0, 210.0, 127.0, 77.0, 48.0, 38.0, 22.0, 15.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.044189453125, -0.04305434226989746, -0.04191923141479492, -0.04078412055969238, -0.039649009704589844, -0.038513898849487305, -0.037378787994384766, -0.03624367713928223, -0.03510856628417969, -0.03397345542907715, -0.03283834457397461, -0.03170323371887207, -0.03056812286376953, -0.029433012008666992, -0.028297901153564453, -0.027162790298461914, -0.026027679443359375, -0.024892568588256836, -0.023757457733154297, -0.022622346878051758, -0.02148723602294922, -0.02035212516784668, -0.01921701431274414, -0.0180819034576416, -0.016946792602539062, -0.015811681747436523, -0.014676570892333984, -0.013541460037231445, -0.012406349182128906, -0.011271238327026367, -0.010136127471923828, -0.009001016616821289, -0.00786590576171875, -0.006730794906616211, -0.005595684051513672, -0.004460573196411133, -0.0033254623413085938, -0.0021903514862060547, -0.0010552406311035156, 7.987022399902344e-05, 0.0012149810791015625, 0.0023500919342041016, 0.0034852027893066406, 0.00462031364440918, 0.005755424499511719, 0.006890535354614258, 0.008025646209716797, 0.009160757064819336, 0.010295867919921875, 0.011430978775024414, 0.012566089630126953, 0.013701200485229492, 0.014836311340332031, 0.01597142219543457, 0.01710653305053711, 0.01824164390563965, 0.019376754760742188, 0.020511865615844727, 0.021646976470947266, 0.022782087326049805, 0.023917198181152344, 0.025052309036254883, 0.026187419891357422, 0.02732253074645996, 0.0284576416015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 5.0, 14.0, 18.0, 25.0, 46.0, 61.0, 64.0, 102.0, 145.0, 235.0, 420.0, 654.0, 765.0, 520.0, 274.0, 202.0, 134.0, 76.0, 82.0, 50.0, 50.0, 30.0, 19.0, 16.0, 13.0, 7.0, 10.0, 4.0, 1.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0128631591796875, -0.012372732162475586, -0.011882305145263672, -0.011391878128051758, -0.010901451110839844, -0.01041102409362793, -0.009920597076416016, -0.009430170059204102, -0.008939743041992188, -0.008449316024780273, -0.00795888900756836, -0.007468461990356445, -0.006978034973144531, -0.006487607955932617, -0.005997180938720703, -0.005506753921508789, -0.005016326904296875, -0.004525899887084961, -0.004035472869873047, -0.003545045852661133, -0.0030546188354492188, -0.0025641918182373047, -0.0020737648010253906, -0.0015833377838134766, -0.0010929107666015625, -0.0006024837493896484, -0.00011205673217773438, 0.0003783702850341797, 0.0008687973022460938, 0.0013592243194580078, 0.0018496513366699219, 0.002340078353881836, 0.00283050537109375, 0.003320932388305664, 0.003811359405517578, 0.004301786422729492, 0.004792213439941406, 0.00528264045715332, 0.005773067474365234, 0.0062634944915771484, 0.0067539215087890625, 0.0072443485260009766, 0.007734775543212891, 0.008225202560424805, 0.008715629577636719, 0.009206056594848633, 0.009696483612060547, 0.010186910629272461, 0.010677337646484375, 0.011167764663696289, 0.011658191680908203, 0.012148618698120117, 0.012639045715332031, 0.013129472732543945, 0.01361989974975586, 0.014110326766967773, 0.014600753784179688, 0.015091180801391602, 0.015581607818603516, 0.01607203483581543, 0.016562461853027344, 0.017052888870239258, 0.017543315887451172, 0.018033742904663086, 0.018524169921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 100.0, 370.0, 402.0, 98.0, 17.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2900851368904114, -0.2803795635700226, -0.2706739604473114, -0.2609683871269226, -0.2512628138065338, -0.24155721068382263, -0.23185163736343384, -0.22214604914188385, -0.21244046092033386, -0.20273487269878387, -0.19302929937839508, -0.1833237111568451, -0.1736181229352951, -0.16391253471374512, -0.15420696139335632, -0.14450137317180634, -0.13479579985141754, -0.12509021162986755, -0.11538463085889816, -0.10567905008792877, -0.09597346186637878, -0.0862678810954094, -0.07656230032444, -0.06685671210289001, -0.057151131331920624, -0.047445546835660934, -0.037739962339401245, -0.028034381568431854, -0.018328797072172165, -0.008623212575912476, 0.0010823681950569153, 0.010787956416606903, 0.020493537187576294, 0.030199121683835983, 0.03990470618009567, 0.049610286951065063, 0.05931587144732475, 0.06902145594358444, 0.07872703671455383, 0.08843262493610382, 0.09813820570707321, 0.1078437864780426, 0.11754937469959259, 0.12725496292114258, 0.13696053624153137, 0.14666612446308136, 0.15637171268463135, 0.16607728600502014, 0.17578287422657013, 0.18548846244812012, 0.1951940357685089, 0.2048996239900589, 0.2146052122116089, 0.22431078553199768, 0.23401637375354767, 0.24372196197509766, 0.25342753529548645, 0.26313310861587524, 0.2728387117385864, 0.2825442850589752, 0.292249858379364, 0.3019554615020752, 0.311661034822464, 0.3213666081428528, 0.33107221126556396]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 16.0, 20.0, 40.0, 40.0, 52.0, 65.0, 71.0, 77.0, 90.0, 81.0, 77.0, 67.0, 68.0, 44.0, 54.0, 34.0, 26.0, 20.0, 12.0, 12.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06291890144348145, -0.06021612137556076, -0.057513341307640076, -0.05481056496500969, -0.052107784897089005, -0.04940500482916832, -0.04670222848653793, -0.04399944841861725, -0.041296668350696564, -0.03859388828277588, -0.035891108214855194, -0.03318833187222481, -0.030485551804304123, -0.027782771736383438, -0.025079993531107903, -0.022377215325832367, -0.019674435257911682, -0.016971655189990997, -0.014268876984715462, -0.011566097848117352, -0.008863318711519241, -0.006160539574921131, -0.003457760438323021, -0.0007549822330474854, 0.0019477978348731995, 0.00465057697147131, 0.00735335610806942, 0.01005613524466753, 0.01275891438126564, 0.01546169351786375, 0.01816447265446186, 0.020867250859737396, 0.02357003092765808, 0.026272810995578766, 0.0289755892008543, 0.03167836740612984, 0.03438114747405052, 0.03708392754197121, 0.03978670388460159, 0.04248948395252228, 0.04519226402044296, 0.04789504408836365, 0.05059782415628433, 0.05330060049891472, 0.0560033805668354, 0.05870616063475609, 0.061408936977386475, 0.06411171704530716, 0.06681449711322784, 0.06951727718114853, 0.07222005724906921, 0.0749228373169899, 0.07762561738491058, 0.08032839000225067, 0.08303117007017136, 0.08573395013809204, 0.08843673020601273, 0.09113951027393341, 0.0938422903418541, 0.09654507040977478, 0.09924784302711487, 0.10195062309503555, 0.10465340316295624, 0.10735618323087692, 0.11005896329879761]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 11.0, 7.0, 15.0, 15.0, 22.0, 32.0, 35.0, 77.0, 93.0, 125.0, 141.0, 223.0, 345.0, 461.0, 688.0, 1296.0, 3566.0, 24814.0, 530105.0, 458047.0, 21688.0, 3314.0, 1235.0, 693.0, 438.0, 318.0, 229.0, 135.0, 104.0, 81.0, 38.0, 38.0, 28.0, 21.0, 11.0, 13.0, 6.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06781005859375, -0.0656890869140625, -0.063568115234375, -0.0614471435546875, -0.059326171875, -0.0572052001953125, -0.055084228515625, -0.0529632568359375, -0.05084228515625, -0.0487213134765625, -0.046600341796875, -0.0444793701171875, -0.0423583984375, -0.0402374267578125, -0.038116455078125, -0.0359954833984375, -0.03387451171875, -0.0317535400390625, -0.029632568359375, -0.0275115966796875, -0.025390625, -0.0232696533203125, -0.021148681640625, -0.0190277099609375, -0.01690673828125, -0.0147857666015625, -0.012664794921875, -0.0105438232421875, -0.0084228515625, -0.0063018798828125, -0.004180908203125, -0.0020599365234375, 6.103515625e-05, 0.0021820068359375, 0.004302978515625, 0.0064239501953125, 0.008544921875, 0.0106658935546875, 0.012786865234375, 0.0149078369140625, 0.01702880859375, 0.0191497802734375, 0.021270751953125, 0.0233917236328125, 0.0255126953125, 0.0276336669921875, 0.029754638671875, 0.0318756103515625, 0.03399658203125, 0.0361175537109375, 0.038238525390625, 0.0403594970703125, 0.04248046875, 0.0446014404296875, 0.046722412109375, 0.0488433837890625, 0.05096435546875, 0.0530853271484375, 0.055206298828125, 0.0573272705078125, 0.0594482421875, 0.0615692138671875, 0.063690185546875, 0.0658111572265625, 0.06793212890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 41.0, 99.0, 196.0, 258.0, 252.0, 96.0, 34.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0439453125, -0.042832136154174805, -0.04171895980834961, -0.040605783462524414, -0.03949260711669922, -0.03837943077087402, -0.03726625442504883, -0.03615307807922363, -0.03503990173339844, -0.03392672538757324, -0.03281354904174805, -0.03170037269592285, -0.030587196350097656, -0.02947402000427246, -0.028360843658447266, -0.02724766731262207, -0.026134490966796875, -0.02502131462097168, -0.023908138275146484, -0.02279496192932129, -0.021681785583496094, -0.0205686092376709, -0.019455432891845703, -0.018342256546020508, -0.017229080200195312, -0.016115903854370117, -0.015002727508544922, -0.013889551162719727, -0.012776374816894531, -0.011663198471069336, -0.01055002212524414, -0.009436845779418945, -0.00832366943359375, -0.007210493087768555, -0.006097316741943359, -0.004984140396118164, -0.0038709640502929688, -0.0027577877044677734, -0.0016446113586425781, -0.0005314350128173828, 0.0005817413330078125, 0.0016949176788330078, 0.002808094024658203, 0.0039212703704833984, 0.005034446716308594, 0.006147623062133789, 0.007260799407958984, 0.00837397575378418, 0.009487152099609375, 0.01060032844543457, 0.011713504791259766, 0.012826681137084961, 0.013939857482910156, 0.015053033828735352, 0.016166210174560547, 0.017279386520385742, 0.018392562866210938, 0.019505739212036133, 0.020618915557861328, 0.021732091903686523, 0.02284526824951172, 0.023958444595336914, 0.02507162094116211, 0.026184797286987305, 0.0272979736328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 12.0, 8.0, 16.0, 18.0, 29.0, 45.0, 66.0, 80.0, 132.0, 232.0, 434.0, 967.0, 2911.0, 17602.0, 231560.0, 709908.0, 73613.0, 7544.0, 1822.0, 660.0, 352.0, 184.0, 110.0, 55.0, 46.0, 36.0, 22.0, 16.0, 11.0, 5.0, 7.0, 7.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055206298828125, -0.0534968376159668, -0.051787376403808594, -0.05007791519165039, -0.04836845397949219, -0.046658992767333984, -0.04494953155517578, -0.04324007034301758, -0.041530609130859375, -0.03982114791870117, -0.03811168670654297, -0.036402225494384766, -0.03469276428222656, -0.03298330307006836, -0.031273841857910156, -0.029564380645751953, -0.02785491943359375, -0.026145458221435547, -0.024435997009277344, -0.02272653579711914, -0.021017074584960938, -0.019307613372802734, -0.01759815216064453, -0.015888690948486328, -0.014179229736328125, -0.012469768524169922, -0.010760307312011719, -0.009050846099853516, -0.0073413848876953125, -0.005631923675537109, -0.003922462463378906, -0.002213001251220703, -0.0005035400390625, 0.0012059211730957031, 0.0029153823852539062, 0.004624843597412109, 0.0063343048095703125, 0.008043766021728516, 0.009753227233886719, 0.011462688446044922, 0.013172149658203125, 0.014881610870361328, 0.01659107208251953, 0.018300533294677734, 0.020009994506835938, 0.02171945571899414, 0.023428916931152344, 0.025138378143310547, 0.02684783935546875, 0.028557300567626953, 0.030266761779785156, 0.03197622299194336, 0.03368568420410156, 0.035395145416259766, 0.03710460662841797, 0.03881406784057617, 0.040523529052734375, 0.04223299026489258, 0.04394245147705078, 0.045651912689208984, 0.04736137390136719, 0.04907083511352539, 0.050780296325683594, 0.0524897575378418, 0.05419921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 9.0, 19.0, 15.0, 15.0, 17.0, 13.0, 20.0, 30.0, 28.0, 33.0, 38.0, 31.0, 36.0, 39.0, 45.0, 41.0, 49.0, 39.0, 38.0, 48.0, 30.0, 40.0, 30.0, 45.0, 28.0, 26.0, 23.0, 23.0, 17.0, 12.0, 15.0, 13.0, 8.0, 5.0, 11.0, 11.0, 6.0, 6.0, 4.0, 4.0, 2.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.020599365234375, -0.019969463348388672, -0.019339561462402344, -0.018709659576416016, -0.018079757690429688, -0.01744985580444336, -0.01681995391845703, -0.016190052032470703, -0.015560150146484375, -0.014930248260498047, -0.014300346374511719, -0.01367044448852539, -0.013040542602539062, -0.012410640716552734, -0.011780738830566406, -0.011150836944580078, -0.01052093505859375, -0.009891033172607422, -0.009261131286621094, -0.008631229400634766, -0.008001327514648438, -0.007371425628662109, -0.006741523742675781, -0.006111621856689453, -0.005481719970703125, -0.004851818084716797, -0.004221916198730469, -0.0035920143127441406, -0.0029621124267578125, -0.0023322105407714844, -0.0017023086547851562, -0.0010724067687988281, -0.0004425048828125, 0.00018739700317382812, 0.0008172988891601562, 0.0014472007751464844, 0.0020771026611328125, 0.0027070045471191406, 0.0033369064331054688, 0.003966808319091797, 0.004596710205078125, 0.005226612091064453, 0.005856513977050781, 0.006486415863037109, 0.0071163177490234375, 0.007746219635009766, 0.008376121520996094, 0.009006023406982422, 0.00963592529296875, 0.010265827178955078, 0.010895729064941406, 0.011525630950927734, 0.012155532836914062, 0.01278543472290039, 0.013415336608886719, 0.014045238494873047, 0.014675140380859375, 0.015305042266845703, 0.01593494415283203, 0.01656484603881836, 0.017194747924804688, 0.017824649810791016, 0.018454551696777344, 0.019084453582763672, 0.01971435546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 11.0, 10.0, 10.0, 16.0, 29.0, 29.0, 39.0, 80.0, 137.0, 213.0, 393.0, 753.0, 1436.0, 3057.0, 6692.0, 16700.0, 60081.0, 455004.0, 419333.0, 56033.0, 16057.0, 6416.0, 2926.0, 1398.0, 710.0, 397.0, 226.0, 137.0, 73.0, 50.0, 25.0, 26.0, 16.0, 15.0, 9.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0211029052734375, -0.020462989807128906, -0.019823074340820312, -0.01918315887451172, -0.018543243408203125, -0.01790332794189453, -0.017263412475585938, -0.016623497009277344, -0.01598358154296875, -0.015343666076660156, -0.014703750610351562, -0.014063835144042969, -0.013423919677734375, -0.012784004211425781, -0.012144088745117188, -0.011504173278808594, -0.0108642578125, -0.010224342346191406, -0.009584426879882812, -0.008944511413574219, -0.008304595947265625, -0.007664680480957031, -0.0070247650146484375, -0.006384849548339844, -0.00574493408203125, -0.005105018615722656, -0.0044651031494140625, -0.0038251876831054688, -0.003185272216796875, -0.0025453567504882812, -0.0019054412841796875, -0.0012655258178710938, -0.0006256103515625, 1.430511474609375e-05, 0.0006542205810546875, 0.0012941360473632812, 0.001934051513671875, 0.0025739669799804688, 0.0032138824462890625, 0.0038537979125976562, 0.00449371337890625, 0.005133628845214844, 0.0057735443115234375, 0.006413459777832031, 0.007053375244140625, 0.007693290710449219, 0.008333206176757812, 0.008973121643066406, 0.009613037109375, 0.010252952575683594, 0.010892868041992188, 0.011532783508300781, 0.012172698974609375, 0.012812614440917969, 0.013452529907226562, 0.014092445373535156, 0.01473236083984375, 0.015372276306152344, 0.016012191772460938, 0.01665210723876953, 0.017292022705078125, 0.01793193817138672, 0.018571853637695312, 0.019211769104003906, 0.0198516845703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 15.0, 14.0, 20.0, 21.0, 23.0, 26.0, 55.0, 53.0, 63.0, 96.0, 107.0, 110.0, 71.0, 58.0, 55.0, 56.0, 46.0, 22.0, 15.0, 17.0, 9.0, 13.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.860494613647461e-05, -6.664451211690903e-05, -6.468407809734344e-05, -6.272364407777786e-05, -6.076321005821228e-05, -5.88027760386467e-05, -5.6842342019081116e-05, -5.4881907999515533e-05, -5.292147397994995e-05, -5.096103996038437e-05, -4.900060594081879e-05, -4.7040171921253204e-05, -4.507973790168762e-05, -4.311930388212204e-05, -4.115886986255646e-05, -3.9198435842990875e-05, -3.723800182342529e-05, -3.527756780385971e-05, -3.331713378429413e-05, -3.1356699764728546e-05, -2.9396265745162964e-05, -2.743583172559738e-05, -2.54753977060318e-05, -2.3514963686466217e-05, -2.1554529666900635e-05, -1.9594095647335052e-05, -1.763366162776947e-05, -1.5673227608203888e-05, -1.3712793588638306e-05, -1.1752359569072723e-05, -9.791925549507141e-06, -7.831491529941559e-06, -5.8710575103759766e-06, -3.910623490810394e-06, -1.950189471244812e-06, 1.0244548320770264e-08, 1.9706785678863525e-06, 3.931112587451935e-06, 5.891546607017517e-06, 7.8519806265831e-06, 9.812414646148682e-06, 1.1772848665714264e-05, 1.3733282685279846e-05, 1.569371670484543e-05, 1.765415072441101e-05, 1.9614584743976593e-05, 2.1575018763542175e-05, 2.3535452783107758e-05, 2.549588680267334e-05, 2.7456320822238922e-05, 2.9416754841804504e-05, 3.137718886137009e-05, 3.333762288093567e-05, 3.529805690050125e-05, 3.7258490920066833e-05, 3.9218924939632416e-05, 4.1179358959198e-05, 4.313979297876358e-05, 4.510022699832916e-05, 4.7060661017894745e-05, 4.902109503746033e-05, 5.098152905702591e-05, 5.294196307659149e-05, 5.4902397096157074e-05, 5.6862831115722656e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 9.0, 9.0, 14.0, 24.0, 23.0, 48.0, 49.0, 85.0, 126.0, 239.0, 389.0, 707.0, 1402.0, 2953.0, 7322.0, 20524.0, 90919.0, 684459.0, 190272.0, 31039.0, 10058.0, 3974.0, 1842.0, 904.0, 467.0, 259.0, 153.0, 90.0, 61.0, 45.0, 28.0, 17.0, 11.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.02486562728881836, -0.02412700653076172, -0.023388385772705078, -0.022649765014648438, -0.021911144256591797, -0.021172523498535156, -0.020433902740478516, -0.019695281982421875, -0.018956661224365234, -0.018218040466308594, -0.017479419708251953, -0.016740798950195312, -0.016002178192138672, -0.015263557434082031, -0.01452493667602539, -0.01378631591796875, -0.01304769515991211, -0.012309074401855469, -0.011570453643798828, -0.010831832885742188, -0.010093212127685547, -0.009354591369628906, -0.008615970611572266, -0.007877349853515625, -0.007138729095458984, -0.006400108337402344, -0.005661487579345703, -0.0049228668212890625, -0.004184246063232422, -0.0034456253051757812, -0.0027070045471191406, -0.0019683837890625, -0.0012297630310058594, -0.0004911422729492188, 0.0002474784851074219, 0.0009860992431640625, 0.0017247200012207031, 0.0024633407592773438, 0.0032019615173339844, 0.003940582275390625, 0.004679203033447266, 0.005417823791503906, 0.006156444549560547, 0.0068950653076171875, 0.007633686065673828, 0.008372306823730469, 0.00911092758178711, 0.00984954833984375, 0.01058816909790039, 0.011326789855957031, 0.012065410614013672, 0.012804031372070312, 0.013542652130126953, 0.014281272888183594, 0.015019893646240234, 0.015758514404296875, 0.016497135162353516, 0.017235755920410156, 0.017974376678466797, 0.018712997436523438, 0.019451618194580078, 0.02019023895263672, 0.02092885971069336, 0.02166748046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 7.0, 4.0, 8.0, 11.0, 10.0, 12.0, 11.0, 14.0, 32.0, 22.0, 33.0, 47.0, 63.0, 63.0, 89.0, 92.0, 93.0, 86.0, 55.0, 46.0, 41.0, 30.0, 25.0, 17.0, 15.0, 11.0, 7.0, 6.0, 11.0, 4.0, 8.0, 2.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01202392578125, -0.011667966842651367, -0.011312007904052734, -0.010956048965454102, -0.010600090026855469, -0.010244131088256836, -0.009888172149658203, -0.00953221321105957, -0.009176254272460938, -0.008820295333862305, -0.008464336395263672, -0.008108377456665039, -0.007752418518066406, -0.0073964595794677734, -0.007040500640869141, -0.006684541702270508, -0.006328582763671875, -0.005972623825073242, -0.005616664886474609, -0.0052607059478759766, -0.004904747009277344, -0.004548788070678711, -0.004192829132080078, -0.0038368701934814453, -0.0034809112548828125, -0.0031249523162841797, -0.002768993377685547, -0.002413034439086914, -0.0020570755004882812, -0.0017011165618896484, -0.0013451576232910156, -0.0009891986846923828, -0.00063323974609375, -0.0002772808074951172, 7.867813110351562e-05, 0.00043463706970214844, 0.0007905960083007812, 0.001146554946899414, 0.0015025138854980469, 0.0018584728240966797, 0.0022144317626953125, 0.0025703907012939453, 0.002926349639892578, 0.003282308578491211, 0.0036382675170898438, 0.0039942264556884766, 0.004350185394287109, 0.004706144332885742, 0.005062103271484375, 0.005418062210083008, 0.005774021148681641, 0.0061299800872802734, 0.006485939025878906, 0.006841897964477539, 0.007197856903076172, 0.007553815841674805, 0.007909774780273438, 0.00826573371887207, 0.008621692657470703, 0.008977651596069336, 0.009333610534667969, 0.009689569473266602, 0.010045528411865234, 0.010401487350463867, 0.0107574462890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 10.0, 22.0, 56.0, 113.0, 161.0, 242.0, 197.0, 119.0, 46.0, 15.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3078640103340149, -0.30131030082702637, -0.29475662112236023, -0.2882029116153717, -0.28164923191070557, -0.27509552240371704, -0.2685418128967285, -0.2619881331920624, -0.25543442368507385, -0.24888072907924652, -0.2423270344734192, -0.23577332496643066, -0.22921963036060333, -0.222665935754776, -0.21611224114894867, -0.20955854654312134, -0.2030048668384552, -0.19645117223262787, -0.18989747762680054, -0.183343768119812, -0.17679007351398468, -0.17023637890815735, -0.16368268430233002, -0.15712898969650269, -0.15057528018951416, -0.14402158558368683, -0.1374678909778595, -0.13091418147087097, -0.12436049431562424, -0.11780679225921631, -0.11125309765338898, -0.10469940304756165, -0.09814571589231491, -0.09159202128648758, -0.08503831923007965, -0.07848462462425232, -0.07193093001842499, -0.06537723541259766, -0.05882353335618973, -0.052269838750362396, -0.045716140419244766, -0.039162442088127136, -0.032608747482299805, -0.026055049151182175, -0.019501352682709694, -0.012947656214237213, -0.006393957883119583, 0.0001597367227077484, 0.006713435053825378, 0.01326713152229786, 0.01982082799077034, 0.02637452632188797, 0.0329282209277153, 0.03948191925883293, 0.04603561758995056, 0.05258931219577789, 0.05914301052689552, 0.06569670885801315, 0.07225040346384048, 0.07880410552024841, 0.08535780012607574, 0.09191149473190308, 0.09846518933773041, 0.10501888394355774, 0.11157258599996567]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 11.0, 5.0, 12.0, 6.0, 16.0, 16.0, 21.0, 29.0, 34.0, 26.0, 24.0, 37.0, 42.0, 48.0, 40.0, 43.0, 48.0, 42.0, 42.0, 39.0, 37.0, 39.0, 34.0, 32.0, 33.0, 42.0, 38.0, 19.0, 27.0, 18.0, 15.0, 12.0, 9.0, 10.0, 14.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06885600090026855, -0.0666867271065712, -0.06451745331287384, -0.06234818324446678, -0.060178909450769424, -0.05800963565707207, -0.05584036558866501, -0.05367109179496765, -0.051501818001270294, -0.04933254420757294, -0.04716327041387558, -0.04499400034546852, -0.042824726551771164, -0.04065545275807381, -0.03848618268966675, -0.03631690889596939, -0.034147635102272034, -0.031978361308574677, -0.02980908937752247, -0.02763981744647026, -0.025470543652772903, -0.023301269859075546, -0.02113199792802334, -0.01896272599697113, -0.016793452203273773, -0.01462417934089899, -0.012454906478524208, -0.010285633616149426, -0.008116360753774643, -0.00594708789139986, -0.003777815029025078, -0.0016085421666502953, 0.0005607306957244873, 0.00273000355809927, 0.004899276420474052, 0.007068549282848835, 0.009237822145223618, 0.0114070950075984, 0.013576367869973183, 0.01574563980102539, 0.017914913594722748, 0.020084187388420105, 0.022253459319472313, 0.02442273125052452, 0.026592005044221878, 0.028761278837919235, 0.030930550768971443, 0.03309982270002365, 0.03526909649372101, 0.037438370287418365, 0.03960764408111572, 0.04177691414952278, 0.04394618794322014, 0.046115461736917496, 0.048284731805324554, 0.05045400559902191, 0.05262327939271927, 0.054792553186416626, 0.05696182698011398, 0.05913109704852104, 0.0613003708422184, 0.06346964091062546, 0.06563891470432281, 0.06780818849802017, 0.06997746229171753]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 16.0, 11.0, 14.0, 13.0, 28.0, 36.0, 54.0, 78.0, 129.0, 236.0, 411.0, 823.0, 2074.0, 7289.0, 66766.0, 3925301.0, 172072.0, 12949.0, 3685.0, 1280.0, 450.0, 238.0, 105.0, 71.0, 42.0, 26.0, 21.0, 18.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.05145263671875, -0.04982566833496094, -0.048198699951171875, -0.04657173156738281, -0.04494476318359375, -0.04331779479980469, -0.041690826416015625, -0.04006385803222656, -0.0384368896484375, -0.03680992126464844, -0.035182952880859375, -0.03355598449707031, -0.03192901611328125, -0.030302047729492188, -0.028675079345703125, -0.027048110961914062, -0.025421142578125, -0.023794174194335938, -0.022167205810546875, -0.020540237426757812, -0.01891326904296875, -0.017286300659179688, -0.015659332275390625, -0.014032363891601562, -0.0124053955078125, -0.010778427124023438, -0.009151458740234375, -0.0075244903564453125, -0.00589752197265625, -0.0042705535888671875, -0.002643585205078125, -0.0010166168212890625, 0.0006103515625, 0.0022373199462890625, 0.003864288330078125, 0.0054912567138671875, 0.00711822509765625, 0.008745193481445312, 0.010372161865234375, 0.011999130249023438, 0.0136260986328125, 0.015253067016601562, 0.016880035400390625, 0.018507003784179688, 0.02013397216796875, 0.021760940551757812, 0.023387908935546875, 0.025014877319335938, 0.026641845703125, 0.028268814086914062, 0.029895782470703125, 0.03152275085449219, 0.03314971923828125, 0.03477668762207031, 0.036403656005859375, 0.03803062438964844, 0.0396575927734375, 0.04128456115722656, 0.042911529541015625, 0.04453849792480469, 0.04616546630859375, 0.04779243469238281, 0.049419403076171875, 0.05104637145996094, 0.05267333984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 16.0, 61.0, 154.0, 233.0, 285.0, 155.0, 68.0, 12.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.04165816307067871, -0.04056119918823242, -0.03946423530578613, -0.038367271423339844, -0.037270307540893555, -0.036173343658447266, -0.03507637977600098, -0.03397941589355469, -0.0328824520111084, -0.03178548812866211, -0.03068852424621582, -0.02959156036376953, -0.028494596481323242, -0.027397632598876953, -0.026300668716430664, -0.025203704833984375, -0.024106740951538086, -0.023009777069091797, -0.021912813186645508, -0.02081584930419922, -0.01971888542175293, -0.01862192153930664, -0.01752495765686035, -0.016427993774414062, -0.015331029891967773, -0.014234066009521484, -0.013137102127075195, -0.012040138244628906, -0.010943174362182617, -0.009846210479736328, -0.008749246597290039, -0.00765228271484375, -0.006555318832397461, -0.005458354949951172, -0.004361391067504883, -0.0032644271850585938, -0.0021674633026123047, -0.0010704994201660156, 2.6464462280273438e-05, 0.0011234283447265625, 0.0022203922271728516, 0.0033173561096191406, 0.00441431999206543, 0.005511283874511719, 0.006608247756958008, 0.007705211639404297, 0.008802175521850586, 0.009899139404296875, 0.010996103286743164, 0.012093067169189453, 0.013190031051635742, 0.014286994934082031, 0.01538395881652832, 0.01648092269897461, 0.0175778865814209, 0.018674850463867188, 0.019771814346313477, 0.020868778228759766, 0.021965742111206055, 0.023062705993652344, 0.024159669876098633, 0.025256633758544922, 0.02635359764099121, 0.0274505615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 14.0, 22.0, 24.0, 38.0, 42.0, 71.0, 150.0, 237.0, 427.0, 814.0, 1799.0, 4307.0, 14023.0, 73115.0, 892424.0, 3011274.0, 159581.0, 24493.0, 6592.0, 2475.0, 1044.0, 532.0, 315.0, 164.0, 97.0, 60.0, 31.0, 27.0, 21.0, 21.0, 9.0, 9.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0307159423828125, -0.029911518096923828, -0.029107093811035156, -0.028302669525146484, -0.027498245239257812, -0.02669382095336914, -0.02588939666748047, -0.025084972381591797, -0.024280548095703125, -0.023476123809814453, -0.02267169952392578, -0.02186727523803711, -0.021062850952148438, -0.020258426666259766, -0.019454002380371094, -0.018649578094482422, -0.01784515380859375, -0.017040729522705078, -0.016236305236816406, -0.015431880950927734, -0.014627456665039062, -0.01382303237915039, -0.013018608093261719, -0.012214183807373047, -0.011409759521484375, -0.010605335235595703, -0.009800910949707031, -0.00899648666381836, -0.008192062377929688, -0.007387638092041016, -0.006583213806152344, -0.005778789520263672, -0.004974365234375, -0.004169940948486328, -0.0033655166625976562, -0.0025610923767089844, -0.0017566680908203125, -0.0009522438049316406, -0.00014781951904296875, 0.0006566047668457031, 0.001461029052734375, 0.002265453338623047, 0.0030698776245117188, 0.0038743019104003906, 0.0046787261962890625, 0.005483150482177734, 0.006287574768066406, 0.007091999053955078, 0.00789642333984375, 0.008700847625732422, 0.009505271911621094, 0.010309696197509766, 0.011114120483398438, 0.01191854476928711, 0.012722969055175781, 0.013527393341064453, 0.014331817626953125, 0.015136241912841797, 0.01594066619873047, 0.01674509048461914, 0.017549514770507812, 0.018353939056396484, 0.019158363342285156, 0.019962787628173828, 0.0207672119140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 12.0, 7.0, 11.0, 30.0, 36.0, 62.0, 86.0, 135.0, 229.0, 425.0, 890.0, 972.0, 441.0, 245.0, 143.0, 92.0, 69.0, 71.0, 46.0, 17.0, 15.0, 13.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01522064208984375, -0.014614462852478027, -0.014008283615112305, -0.013402104377746582, -0.01279592514038086, -0.012189745903015137, -0.011583566665649414, -0.010977387428283691, -0.010371208190917969, -0.009765028953552246, -0.009158849716186523, -0.0085526704788208, -0.007946491241455078, -0.0073403120040893555, -0.006734132766723633, -0.00612795352935791, -0.0055217742919921875, -0.004915595054626465, -0.004309415817260742, -0.0037032365798950195, -0.003097057342529297, -0.0024908781051635742, -0.0018846988677978516, -0.001278519630432129, -0.0006723403930664062, -6.61611557006836e-05, 0.0005400180816650391, 0.0011461973190307617, 0.0017523765563964844, 0.002358555793762207, 0.0029647350311279297, 0.0035709142684936523, 0.004177093505859375, 0.004783272743225098, 0.00538945198059082, 0.005995631217956543, 0.006601810455322266, 0.007207989692687988, 0.007814168930053711, 0.008420348167419434, 0.009026527404785156, 0.009632706642150879, 0.010238885879516602, 0.010845065116882324, 0.011451244354248047, 0.01205742359161377, 0.012663602828979492, 0.013269782066345215, 0.013875961303710938, 0.01448214054107666, 0.015088319778442383, 0.015694499015808105, 0.016300678253173828, 0.01690685749053955, 0.017513036727905273, 0.018119215965270996, 0.01872539520263672, 0.01933157444000244, 0.019937753677368164, 0.020543932914733887, 0.02115011215209961, 0.021756291389465332, 0.022362470626831055, 0.022968649864196777, 0.0235748291015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 11.0, 75.0, 206.0, 313.0, 242.0, 97.0, 33.0, 16.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18169555068016052, -0.17504625022411346, -0.1683969348669052, -0.16174763441085815, -0.1550983339548111, -0.14844903349876404, -0.1417997181415558, -0.13515041768550873, -0.12850111722946167, -0.12185180932283401, -0.11520250886678696, -0.1085532009601593, -0.10190390050411224, -0.09525459259748459, -0.08860528469085693, -0.08195598423480988, -0.07530666887760162, -0.06865736097097397, -0.06200806051492691, -0.055358752608299255, -0.0487094484269619, -0.04206014424562454, -0.03541083633899689, -0.02876153215765953, -0.022112227976322174, -0.015462922863662243, -0.008813617751002312, -0.002164311707019806, 0.004484992474317551, 0.011134296655654907, 0.017783604562282562, 0.02443290874361992, 0.03108219802379608, 0.03773150220513344, 0.044380806386470795, 0.05103011429309845, 0.057679418474435806, 0.06432872265577316, 0.07097803056240082, 0.07762733101844788, 0.08427663892507553, 0.09092594683170319, 0.09757524728775024, 0.1042245551943779, 0.11087386310100555, 0.11752316355705261, 0.12417247146368027, 0.13082177937030792, 0.13747107982635498, 0.14412038028240204, 0.1507696956396103, 0.15741899609565735, 0.1640682965517044, 0.17071759700775146, 0.17736691236495972, 0.18401621282100677, 0.19066551327705383, 0.1973148137331009, 0.20396412909030914, 0.2106134295463562, 0.21726273000240326, 0.22391203045845032, 0.23056134581565857, 0.23721064627170563, 0.24385996162891388]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 18.0, 12.0, 21.0, 27.0, 32.0, 29.0, 38.0, 46.0, 41.0, 62.0, 60.0, 57.0, 53.0, 44.0, 52.0, 50.0, 55.0, 53.0, 43.0, 36.0, 19.0, 27.0, 34.0, 19.0, 11.0, 13.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06785237789154053, -0.06599041074514389, -0.06412844359874725, -0.062266476452350616, -0.06040450930595398, -0.05854254215955734, -0.056680575013160706, -0.05481860786676407, -0.05295664072036743, -0.051094673573970795, -0.04923270642757416, -0.04737073928117752, -0.045508772134780884, -0.04364680498838425, -0.04178483784198761, -0.03992287069559097, -0.038060903549194336, -0.0361989364027977, -0.03433696925640106, -0.032475002110004425, -0.030613034963607788, -0.02875106781721115, -0.026889100670814514, -0.025027133524417877, -0.02316516637802124, -0.021303199231624603, -0.019441232085227966, -0.01757926493883133, -0.015717297792434692, -0.013855330646038055, -0.011993363499641418, -0.010131396353244781, -0.008269429206848145, -0.006407462060451508, -0.004545494914054871, -0.0026835277676582336, -0.0008215606212615967, 0.0010404065251350403, 0.0029023736715316772, 0.004764340817928314, 0.006626307964324951, 0.008488275110721588, 0.010350242257118225, 0.012212209403514862, 0.014074176549911499, 0.015936143696308136, 0.017798110842704773, 0.01966007798910141, 0.021522045135498047, 0.023384012281894684, 0.02524597942829132, 0.027107946574687958, 0.028969913721084595, 0.03083188086748123, 0.03269384801387787, 0.034555815160274506, 0.03641778230667114, 0.03827974945306778, 0.040141716599464417, 0.04200368374586105, 0.04386565089225769, 0.04572761803865433, 0.047589585185050964, 0.0494515523314476, 0.05131351947784424]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 0.0, 12.0, 12.0, 13.0, 22.0, 22.0, 39.0, 57.0, 80.0, 126.0, 127.0, 176.0, 257.0, 387.0, 561.0, 834.0, 1378.0, 3537.0, 20609.0, 271936.0, 666619.0, 69000.0, 7326.0, 2137.0, 1041.0, 639.0, 408.0, 325.0, 231.0, 172.0, 131.0, 93.0, 55.0, 49.0, 32.0, 28.0, 24.0, 19.0, 9.0, 5.0, 2.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055023193359375, -0.05326223373413086, -0.05150127410888672, -0.04974031448364258, -0.04797935485839844, -0.0462183952331543, -0.044457435607910156, -0.042696475982666016, -0.040935516357421875, -0.039174556732177734, -0.037413597106933594, -0.03565263748168945, -0.03389167785644531, -0.03213071823120117, -0.03036975860595703, -0.02860879898071289, -0.02684783935546875, -0.02508687973022461, -0.02332592010498047, -0.021564960479736328, -0.019804000854492188, -0.018043041229248047, -0.016282081604003906, -0.014521121978759766, -0.012760162353515625, -0.010999202728271484, -0.009238243103027344, -0.007477283477783203, -0.0057163238525390625, -0.003955364227294922, -0.0021944046020507812, -0.0004334449768066406, 0.0013275146484375, 0.0030884742736816406, 0.004849433898925781, 0.006610393524169922, 0.008371353149414062, 0.010132312774658203, 0.011893272399902344, 0.013654232025146484, 0.015415191650390625, 0.017176151275634766, 0.018937110900878906, 0.020698070526123047, 0.022459030151367188, 0.024219989776611328, 0.02598094940185547, 0.02774190902709961, 0.02950286865234375, 0.03126382827758789, 0.03302478790283203, 0.03478574752807617, 0.03654670715332031, 0.03830766677856445, 0.040068626403808594, 0.041829586029052734, 0.043590545654296875, 0.045351505279541016, 0.047112464904785156, 0.0488734245300293, 0.05063438415527344, 0.05239534378051758, 0.05415630340576172, 0.05591726303100586, 0.05767822265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 17.0, 65.0, 143.0, 226.0, 268.0, 177.0, 72.0, 16.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0421142578125, -0.04103493690490723, -0.03995561599731445, -0.03887629508972168, -0.037796974182128906, -0.03671765327453613, -0.03563833236694336, -0.034559011459350586, -0.03347969055175781, -0.03240036964416504, -0.031321048736572266, -0.030241727828979492, -0.02916240692138672, -0.028083086013793945, -0.027003765106201172, -0.0259244441986084, -0.024845123291015625, -0.02376580238342285, -0.022686481475830078, -0.021607160568237305, -0.02052783966064453, -0.019448518753051758, -0.018369197845458984, -0.01728987693786621, -0.016210556030273438, -0.015131235122680664, -0.01405191421508789, -0.012972593307495117, -0.011893272399902344, -0.01081395149230957, -0.009734630584716797, -0.008655309677124023, -0.00757598876953125, -0.0064966678619384766, -0.005417346954345703, -0.00433802604675293, -0.0032587051391601562, -0.002179384231567383, -0.0011000633239746094, -2.0742416381835938e-05, 0.0010585784912109375, 0.002137899398803711, 0.0032172203063964844, 0.004296541213989258, 0.005375862121582031, 0.006455183029174805, 0.007534503936767578, 0.008613824844360352, 0.009693145751953125, 0.010772466659545898, 0.011851787567138672, 0.012931108474731445, 0.014010429382324219, 0.015089750289916992, 0.016169071197509766, 0.01724839210510254, 0.018327713012695312, 0.019407033920288086, 0.02048635482788086, 0.021565675735473633, 0.022644996643066406, 0.02372431755065918, 0.024803638458251953, 0.025882959365844727, 0.0269622802734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 8.0, 5.0, 11.0, 12.0, 25.0, 23.0, 50.0, 53.0, 78.0, 120.0, 214.0, 418.0, 905.0, 2898.0, 12529.0, 72831.0, 387355.0, 454490.0, 94931.0, 16043.0, 3431.0, 1091.0, 436.0, 227.0, 131.0, 74.0, 54.0, 41.0, 23.0, 19.0, 8.0, 5.0, 4.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03662109375, -0.035546302795410156, -0.03447151184082031, -0.03339672088623047, -0.032321929931640625, -0.03124713897705078, -0.030172348022460938, -0.029097557067871094, -0.02802276611328125, -0.026947975158691406, -0.025873184204101562, -0.02479839324951172, -0.023723602294921875, -0.02264881134033203, -0.021574020385742188, -0.020499229431152344, -0.0194244384765625, -0.018349647521972656, -0.017274856567382812, -0.01620006561279297, -0.015125274658203125, -0.014050483703613281, -0.012975692749023438, -0.011900901794433594, -0.01082611083984375, -0.009751319885253906, -0.008676528930664062, -0.007601737976074219, -0.006526947021484375, -0.005452156066894531, -0.0043773651123046875, -0.0033025741577148438, -0.002227783203125, -0.0011529922485351562, -7.82012939453125e-05, 0.0009965896606445312, 0.002071380615234375, 0.0031461715698242188, 0.0042209625244140625, 0.005295753479003906, 0.00637054443359375, 0.007445335388183594, 0.008520126342773438, 0.009594917297363281, 0.010669708251953125, 0.011744499206542969, 0.012819290161132812, 0.013894081115722656, 0.0149688720703125, 0.016043663024902344, 0.017118453979492188, 0.01819324493408203, 0.019268035888671875, 0.02034282684326172, 0.021417617797851562, 0.022492408752441406, 0.02356719970703125, 0.024641990661621094, 0.025716781616210938, 0.02679157257080078, 0.027866363525390625, 0.02894115447998047, 0.030015945434570312, 0.031090736389160156, 0.03216552734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 10.0, 15.0, 9.0, 11.0, 21.0, 26.0, 28.0, 31.0, 37.0, 52.0, 42.0, 71.0, 72.0, 59.0, 54.0, 57.0, 67.0, 63.0, 48.0, 39.0, 33.0, 32.0, 29.0, 28.0, 15.0, 19.0, 7.0, 8.0, 4.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.025726318359375, -0.024872541427612305, -0.02401876449584961, -0.023164987564086914, -0.02231121063232422, -0.021457433700561523, -0.020603656768798828, -0.019749879837036133, -0.018896102905273438, -0.018042325973510742, -0.017188549041748047, -0.01633477210998535, -0.015480995178222656, -0.014627218246459961, -0.013773441314697266, -0.01291966438293457, -0.012065887451171875, -0.01121211051940918, -0.010358333587646484, -0.009504556655883789, -0.008650779724121094, -0.0077970027923583984, -0.006943225860595703, -0.006089448928833008, -0.0052356719970703125, -0.004381895065307617, -0.003528118133544922, -0.0026743412017822266, -0.0018205642700195312, -0.0009667873382568359, -0.00011301040649414062, 0.0007407665252685547, 0.00159454345703125, 0.0024483203887939453, 0.0033020973205566406, 0.004155874252319336, 0.005009651184082031, 0.0058634281158447266, 0.006717205047607422, 0.007570981979370117, 0.008424758911132812, 0.009278535842895508, 0.010132312774658203, 0.010986089706420898, 0.011839866638183594, 0.012693643569946289, 0.013547420501708984, 0.01440119743347168, 0.015254974365234375, 0.01610875129699707, 0.016962528228759766, 0.01781630516052246, 0.018670082092285156, 0.01952385902404785, 0.020377635955810547, 0.021231412887573242, 0.022085189819335938, 0.022938966751098633, 0.023792743682861328, 0.024646520614624023, 0.02550029754638672, 0.026354074478149414, 0.02720785140991211, 0.028061628341674805, 0.0289154052734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 8.0, 23.0, 30.0, 55.0, 58.0, 95.0, 156.0, 259.0, 518.0, 863.0, 1697.0, 3303.0, 7208.0, 15896.0, 40792.0, 120497.0, 398429.0, 310554.0, 90838.0, 32038.0, 13184.0, 5923.0, 2809.0, 1412.0, 768.0, 422.0, 284.0, 145.0, 94.0, 62.0, 34.0, 28.0, 21.0, 12.0, 15.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01055145263671875, -0.01017296314239502, -0.009794473648071289, -0.009415984153747559, -0.009037494659423828, -0.008659005165100098, -0.008280515670776367, -0.007902026176452637, -0.007523536682128906, -0.007145047187805176, -0.006766557693481445, -0.006388068199157715, -0.006009578704833984, -0.005631089210510254, -0.0052525997161865234, -0.004874110221862793, -0.0044956207275390625, -0.004117131233215332, -0.0037386417388916016, -0.003360152244567871, -0.0029816627502441406, -0.00260317325592041, -0.0022246837615966797, -0.0018461942672729492, -0.0014677047729492188, -0.0010892152786254883, -0.0007107257843017578, -0.00033223628997802734, 4.6253204345703125e-05, 0.0004247426986694336, 0.0008032321929931641, 0.0011817216873168945, 0.001560211181640625, 0.0019387006759643555, 0.002317190170288086, 0.0026956796646118164, 0.003074169158935547, 0.0034526586532592773, 0.003831148147583008, 0.004209637641906738, 0.004588127136230469, 0.004966616630554199, 0.00534510612487793, 0.00572359561920166, 0.006102085113525391, 0.006480574607849121, 0.0068590641021728516, 0.007237553596496582, 0.0076160430908203125, 0.007994532585144043, 0.008373022079467773, 0.008751511573791504, 0.009130001068115234, 0.009508490562438965, 0.009886980056762695, 0.010265469551086426, 0.010643959045410156, 0.011022448539733887, 0.011400938034057617, 0.011779427528381348, 0.012157917022705078, 0.012536406517028809, 0.012914896011352539, 0.01329338550567627, 0.013671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 19.0, 23.0, 20.0, 32.0, 46.0, 50.0, 54.0, 86.0, 62.0, 81.0, 77.0, 68.0, 65.0, 56.0, 39.0, 37.0, 27.0, 19.0, 22.0, 15.0, 11.0, 10.0, 7.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.765127182006836e-05, -6.553810089826584e-05, -6.342492997646332e-05, -6.13117590546608e-05, -5.9198588132858276e-05, -5.7085417211055756e-05, -5.4972246289253235e-05, -5.2859075367450714e-05, -5.074590444564819e-05, -4.863273352384567e-05, -4.651956260204315e-05, -4.440639168024063e-05, -4.229322075843811e-05, -4.018004983663559e-05, -3.806687891483307e-05, -3.595370799303055e-05, -3.384053707122803e-05, -3.1727366149425507e-05, -2.9614195227622986e-05, -2.7501024305820465e-05, -2.5387853384017944e-05, -2.3274682462215424e-05, -2.1161511540412903e-05, -1.9048340618610382e-05, -1.693516969680786e-05, -1.482199877500534e-05, -1.270882785320282e-05, -1.0595656931400299e-05, -8.482486009597778e-06, -6.3693150877952576e-06, -4.256144165992737e-06, -2.142973244190216e-06, -2.9802322387695312e-08, 2.0833685994148254e-06, 4.196539521217346e-06, 6.309710443019867e-06, 8.422881364822388e-06, 1.0536052286624908e-05, 1.264922320842743e-05, 1.476239413022995e-05, 1.687556505203247e-05, 1.898873597383499e-05, 2.1101906895637512e-05, 2.3215077817440033e-05, 2.5328248739242554e-05, 2.7441419661045074e-05, 2.9554590582847595e-05, 3.1667761504650116e-05, 3.378093242645264e-05, 3.589410334825516e-05, 3.800727427005768e-05, 4.01204451918602e-05, 4.223361611366272e-05, 4.434678703546524e-05, 4.645995795726776e-05, 4.857312887907028e-05, 5.06862998008728e-05, 5.2799470722675323e-05, 5.4912641644477844e-05, 5.7025812566280365e-05, 5.9138983488082886e-05, 6.12521544098854e-05, 6.336532533168793e-05, 6.547849625349045e-05, 6.759166717529297e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 8.0, 8.0, 17.0, 21.0, 44.0, 51.0, 90.0, 112.0, 208.0, 448.0, 921.0, 1949.0, 4917.0, 14916.0, 53913.0, 226015.0, 516044.0, 168932.0, 40706.0, 11740.0, 4078.0, 1653.0, 789.0, 385.0, 224.0, 125.0, 77.0, 46.0, 38.0, 25.0, 13.0, 12.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0157470703125, -0.015314459800720215, -0.01488184928894043, -0.014449238777160645, -0.01401662826538086, -0.013584017753601074, -0.013151407241821289, -0.012718796730041504, -0.012286186218261719, -0.011853575706481934, -0.011420965194702148, -0.010988354682922363, -0.010555744171142578, -0.010123133659362793, -0.009690523147583008, -0.009257912635803223, -0.008825302124023438, -0.008392691612243652, -0.007960081100463867, -0.007527470588684082, -0.007094860076904297, -0.006662249565124512, -0.0062296390533447266, -0.005797028541564941, -0.005364418029785156, -0.004931807518005371, -0.004499197006225586, -0.004066586494445801, -0.0036339759826660156, -0.0032013654708862305, -0.0027687549591064453, -0.00233614444732666, -0.001903533935546875, -0.0014709234237670898, -0.0010383129119873047, -0.0006057024002075195, -0.00017309188842773438, 0.0002595186233520508, 0.0006921291351318359, 0.001124739646911621, 0.0015573501586914062, 0.0019899606704711914, 0.0024225711822509766, 0.0028551816940307617, 0.003287792205810547, 0.003720402717590332, 0.004153013229370117, 0.004585623741149902, 0.0050182342529296875, 0.005450844764709473, 0.005883455276489258, 0.006316065788269043, 0.006748676300048828, 0.007181286811828613, 0.0076138973236083984, 0.008046507835388184, 0.008479118347167969, 0.008911728858947754, 0.009344339370727539, 0.009776949882507324, 0.01020956039428711, 0.010642170906066895, 0.01107478141784668, 0.011507391929626465, 0.01194000244140625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 10.0, 4.0, 15.0, 13.0, 26.0, 23.0, 29.0, 38.0, 38.0, 54.0, 85.0, 78.0, 97.0, 92.0, 75.0, 56.0, 47.0, 52.0, 37.0, 18.0, 17.0, 15.0, 13.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01104736328125, -0.010728597640991211, -0.010409832000732422, -0.010091066360473633, -0.009772300720214844, -0.009453535079956055, -0.009134769439697266, -0.008816003799438477, -0.008497238159179688, -0.008178472518920898, -0.00785970687866211, -0.00754094123840332, -0.007222175598144531, -0.006903409957885742, -0.006584644317626953, -0.006265878677368164, -0.005947113037109375, -0.005628347396850586, -0.005309581756591797, -0.004990816116333008, -0.004672050476074219, -0.00435328483581543, -0.004034519195556641, -0.0037157535552978516, -0.0033969879150390625, -0.0030782222747802734, -0.0027594566345214844, -0.0024406909942626953, -0.0021219253540039062, -0.0018031597137451172, -0.0014843940734863281, -0.001165628433227539, -0.00084686279296875, -0.0005280971527099609, -0.00020933151245117188, 0.00010943412780761719, 0.00042819976806640625, 0.0007469654083251953, 0.0010657310485839844, 0.0013844966888427734, 0.0017032623291015625, 0.0020220279693603516, 0.0023407936096191406, 0.0026595592498779297, 0.0029783248901367188, 0.003297090530395508, 0.003615856170654297, 0.003934621810913086, 0.004253387451171875, 0.004572153091430664, 0.004890918731689453, 0.005209684371948242, 0.005528450012207031, 0.00584721565246582, 0.006165981292724609, 0.0064847469329833984, 0.0068035125732421875, 0.0071222782135009766, 0.007441043853759766, 0.007759809494018555, 0.008078575134277344, 0.008397340774536133, 0.008716106414794922, 0.009034872055053711, 0.0093536376953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 11.0, 24.0, 38.0, 77.0, 144.0, 224.0, 208.0, 149.0, 63.0, 48.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.30767813324928284, -0.3015662133693695, -0.29545432329177856, -0.28934240341186523, -0.2832304835319519, -0.27711859345436096, -0.27100667357444763, -0.2648947536945343, -0.25878286361694336, -0.25267094373703003, -0.2465590387582779, -0.24044713377952576, -0.23433522880077362, -0.2282233089208603, -0.22211140394210815, -0.21599948406219482, -0.2098875641822815, -0.20377565920352936, -0.19766373932361603, -0.1915518343448639, -0.18543992936611176, -0.17932800948619843, -0.1732161045074463, -0.16710418462753296, -0.16099229454994202, -0.15488038957118988, -0.14876846969127655, -0.14265656471252441, -0.13654465973377228, -0.13043273985385895, -0.12432083487510681, -0.11820892244577408, -0.11209701001644135, -0.10598509758710861, -0.09987319260835648, -0.09376128017902374, -0.08764936774969101, -0.08153745532035828, -0.07542555034160614, -0.06931363791227341, -0.06320172548294067, -0.05708981677889824, -0.050977904349565506, -0.04486599564552307, -0.03875408321619034, -0.0326421745121479, -0.02653026580810547, -0.020418353378772736, -0.0143064484000206, -0.008194537833333015, -0.002082628197968006, 0.004029281437397003, 0.010141192004084587, 0.01625310257077217, 0.022365011274814606, 0.02847692370414734, 0.034588832408189774, 0.04070074111223221, 0.04681265354156494, 0.052924562245607376, 0.05903647094964981, 0.06514838337898254, 0.07126028835773468, 0.07737220823764801, 0.08348411321640015]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 8.0, 17.0, 12.0, 13.0, 13.0, 23.0, 20.0, 11.0, 26.0, 24.0, 15.0, 36.0, 41.0, 30.0, 48.0, 47.0, 34.0, 52.0, 51.0, 48.0, 39.0, 34.0, 30.0, 43.0, 30.0, 32.0, 22.0, 23.0, 26.0, 22.0, 22.0, 16.0, 11.0, 9.0, 11.0, 11.0, 7.0, 6.0, 6.0, 9.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0], "bins": [-0.0684361457824707, -0.06653998792171478, -0.06464383751153946, -0.06274768710136414, -0.060851529240608215, -0.05895537510514259, -0.05705922096967697, -0.05516306683421135, -0.05326691269874573, -0.051370758563280106, -0.049474604427814484, -0.04757845029234886, -0.04568229615688324, -0.04378614202141762, -0.041889987885951996, -0.039993833750486374, -0.03809767961502075, -0.03620152547955513, -0.03430537134408951, -0.032409217208623886, -0.030513063073158264, -0.028616908937692642, -0.02672075480222702, -0.0248246006667614, -0.022928446531295776, -0.021032292395830154, -0.019136138260364532, -0.01723998412489891, -0.015343829989433289, -0.013447675853967667, -0.011551521718502045, -0.009655367583036423, -0.007759213447570801, -0.005863059312105179, -0.003966905176639557, -0.002070751041173935, -0.000174596905708313, 0.001721557229757309, 0.003617711365222931, 0.005513865500688553, 0.007410019636154175, 0.009306173771619797, 0.011202327907085419, 0.01309848204255104, 0.014994636178016663, 0.016890790313482285, 0.018786944448947906, 0.02068309858441353, 0.02257925271987915, 0.024475406855344772, 0.026371560990810394, 0.028267715126276016, 0.030163869261741638, 0.03206002339720726, 0.03395617753267288, 0.035852331668138504, 0.037748485803604126, 0.03964463993906975, 0.04154079407453537, 0.04343694821000099, 0.045333102345466614, 0.047229256480932236, 0.04912541061639786, 0.05102156475186348, 0.0529177188873291]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 4.0, 15.0, 14.0, 24.0, 30.0, 43.0, 72.0, 163.0, 249.0, 585.0, 1842.0, 7668.0, 157810.0, 3981877.0, 36139.0, 5193.0, 1623.0, 474.0, 212.0, 96.0, 52.0, 32.0, 15.0, 11.0, 11.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061279296875, -0.059543609619140625, -0.05780792236328125, -0.056072235107421875, -0.0543365478515625, -0.052600860595703125, -0.05086517333984375, -0.049129486083984375, -0.047393798828125, -0.045658111572265625, -0.04392242431640625, -0.042186737060546875, -0.0404510498046875, -0.038715362548828125, -0.03697967529296875, -0.035243988037109375, -0.03350830078125, -0.031772613525390625, -0.03003692626953125, -0.028301239013671875, -0.0265655517578125, -0.024829864501953125, -0.02309417724609375, -0.021358489990234375, -0.019622802734375, -0.017887115478515625, -0.01615142822265625, -0.014415740966796875, -0.0126800537109375, -0.010944366455078125, -0.00920867919921875, -0.007472991943359375, -0.0057373046875, -0.004001617431640625, -0.00226593017578125, -0.000530242919921875, 0.0012054443359375, 0.002941131591796875, 0.00467681884765625, 0.006412506103515625, 0.008148193359375, 0.009883880615234375, 0.01161956787109375, 0.013355255126953125, 0.0150909423828125, 0.016826629638671875, 0.01856231689453125, 0.020298004150390625, 0.02203369140625, 0.023769378662109375, 0.02550506591796875, 0.027240753173828125, 0.0289764404296875, 0.030712127685546875, 0.03244781494140625, 0.034183502197265625, 0.035919189453125, 0.037654876708984375, 0.03939056396484375, 0.041126251220703125, 0.0428619384765625, 0.044597625732421875, 0.04633331298828125, 0.048069000244140625, 0.0498046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 24.0, 68.0, 166.0, 250.0, 265.0, 150.0, 48.0, 10.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042572021484375, -0.04147505760192871, -0.04037809371948242, -0.03928112983703613, -0.038184165954589844, -0.037087202072143555, -0.035990238189697266, -0.03489327430725098, -0.03379631042480469, -0.0326993465423584, -0.03160238265991211, -0.03050541877746582, -0.02940845489501953, -0.028311491012573242, -0.027214527130126953, -0.026117563247680664, -0.025020599365234375, -0.023923635482788086, -0.022826671600341797, -0.021729707717895508, -0.02063274383544922, -0.01953577995300293, -0.01843881607055664, -0.01734185218811035, -0.016244888305664062, -0.015147924423217773, -0.014050960540771484, -0.012953996658325195, -0.011857032775878906, -0.010760068893432617, -0.009663105010986328, -0.008566141128540039, -0.00746917724609375, -0.006372213363647461, -0.005275249481201172, -0.004178285598754883, -0.0030813217163085938, -0.0019843578338623047, -0.0008873939514160156, 0.00020956993103027344, 0.0013065338134765625, 0.0024034976959228516, 0.0035004615783691406, 0.00459742546081543, 0.005694389343261719, 0.006791353225708008, 0.007888317108154297, 0.008985280990600586, 0.010082244873046875, 0.011179208755493164, 0.012276172637939453, 0.013373136520385742, 0.014470100402832031, 0.01556706428527832, 0.01666402816772461, 0.0177609920501709, 0.018857955932617188, 0.019954919815063477, 0.021051883697509766, 0.022148847579956055, 0.023245811462402344, 0.024342775344848633, 0.025439739227294922, 0.02653670310974121, 0.0276336669921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 9.0, 9.0, 18.0, 26.0, 29.0, 39.0, 49.0, 86.0, 103.0, 184.0, 341.0, 576.0, 1153.0, 2605.0, 7104.0, 25239.0, 125710.0, 1837490.0, 2023115.0, 131938.0, 25921.0, 7268.0, 2655.0, 1161.0, 552.0, 309.0, 190.0, 119.0, 84.0, 41.0, 37.0, 29.0, 26.0, 11.0, 19.0, 10.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0210418701171875, -0.020423173904418945, -0.01980447769165039, -0.019185781478881836, -0.01856708526611328, -0.017948389053344727, -0.017329692840576172, -0.016710996627807617, -0.016092300415039062, -0.015473604202270508, -0.014854907989501953, -0.014236211776733398, -0.013617515563964844, -0.012998819351196289, -0.012380123138427734, -0.01176142692565918, -0.011142730712890625, -0.01052403450012207, -0.009905338287353516, -0.009286642074584961, -0.008667945861816406, -0.008049249649047852, -0.007430553436279297, -0.006811857223510742, -0.0061931610107421875, -0.005574464797973633, -0.004955768585205078, -0.0043370723724365234, -0.0037183761596679688, -0.003099679946899414, -0.0024809837341308594, -0.0018622875213623047, -0.00124359130859375, -0.0006248950958251953, -6.198883056640625e-06, 0.0006124973297119141, 0.0012311935424804688, 0.0018498897552490234, 0.002468585968017578, 0.003087282180786133, 0.0037059783935546875, 0.004324674606323242, 0.004943370819091797, 0.0055620670318603516, 0.006180763244628906, 0.006799459457397461, 0.007418155670166016, 0.00803685188293457, 0.008655548095703125, 0.00927424430847168, 0.009892940521240234, 0.010511636734008789, 0.011130332946777344, 0.011749029159545898, 0.012367725372314453, 0.012986421585083008, 0.013605117797851562, 0.014223814010620117, 0.014842510223388672, 0.015461206436157227, 0.01607990264892578, 0.016698598861694336, 0.01731729507446289, 0.017935991287231445, 0.0185546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 7.0, 13.0, 10.0, 37.0, 45.0, 52.0, 87.0, 125.0, 183.0, 409.0, 864.0, 970.0, 516.0, 270.0, 140.0, 98.0, 66.0, 52.0, 39.0, 22.0, 12.0, 16.0, 7.0, 10.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00981903076171875, -0.009374737739562988, -0.008930444717407227, -0.008486151695251465, -0.008041858673095703, -0.007597565650939941, -0.00715327262878418, -0.006708979606628418, -0.006264686584472656, -0.0058203935623168945, -0.005376100540161133, -0.004931807518005371, -0.004487514495849609, -0.004043221473693848, -0.003598928451538086, -0.0031546354293823242, -0.0027103424072265625, -0.0022660493850708008, -0.001821756362915039, -0.0013774633407592773, -0.0009331703186035156, -0.0004888772964477539, -4.458427429199219e-05, 0.00039970874786376953, 0.0008440017700195312, 0.001288294792175293, 0.0017325878143310547, 0.0021768808364868164, 0.002621173858642578, 0.00306546688079834, 0.0035097599029541016, 0.003954052925109863, 0.004398345947265625, 0.004842638969421387, 0.0052869319915771484, 0.00573122501373291, 0.006175518035888672, 0.006619811058044434, 0.007064104080200195, 0.007508397102355957, 0.007952690124511719, 0.00839698314666748, 0.008841276168823242, 0.009285569190979004, 0.009729862213134766, 0.010174155235290527, 0.010618448257446289, 0.01106274127960205, 0.011507034301757812, 0.011951327323913574, 0.012395620346069336, 0.012839913368225098, 0.01328420639038086, 0.013728499412536621, 0.014172792434692383, 0.014617085456848145, 0.015061378479003906, 0.015505671501159668, 0.01594996452331543, 0.01639425754547119, 0.016838550567626953, 0.017282843589782715, 0.017727136611938477, 0.01817142963409424, 0.01861572265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 14.0, 66.0, 265.0, 397.0, 192.0, 46.0, 14.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16530798375606537, -0.15923459827899933, -0.1531612128019333, -0.14708782732486725, -0.1410144418478012, -0.13494105637073517, -0.12886765599250793, -0.12279427796602249, -0.11672089248895645, -0.11064750701189041, -0.10457412153482437, -0.09850072860717773, -0.0924273431301117, -0.08635395765304565, -0.08028057217597961, -0.07420718669891357, -0.06813380122184753, -0.062060415744781494, -0.055987030267715454, -0.049913641065359116, -0.043840255588293076, -0.037766870111227036, -0.0316934809088707, -0.025620095431804657, -0.019546709954738617, -0.013473323546350002, -0.007399937137961388, -0.0013265497982501984, 0.004746835678815842, 0.010820221155881882, 0.01689361035823822, 0.02296699583530426, 0.029040366411209106, 0.035113751888275146, 0.041187137365341187, 0.047260526567697525, 0.053333912044763565, 0.059407297521829605, 0.06548068672418594, 0.07155407220125198, 0.07762745767831802, 0.08370084315538406, 0.0897742286324501, 0.09584762156009674, 0.10192100703716278, 0.10799439251422882, 0.11406777799129486, 0.1201411634683609, 0.12621454894542694, 0.13228793442249298, 0.13836131989955902, 0.14443470537662506, 0.1505080908536911, 0.15658147633075714, 0.16265487670898438, 0.16872826218605042, 0.17480164766311646, 0.1808750331401825, 0.18694841861724854, 0.19302180409431458, 0.19909518957138062, 0.20516857504844666, 0.2112419605255127, 0.21731534600257874, 0.22338873147964478]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 6.0, 8.0, 11.0, 15.0, 15.0, 26.0, 28.0, 28.0, 40.0, 46.0, 37.0, 56.0, 49.0, 63.0, 53.0, 63.0, 45.0, 52.0, 73.0, 43.0, 47.0, 36.0, 37.0, 27.0, 25.0, 17.0, 14.0, 12.0, 6.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04286658763885498, -0.041534166783094406, -0.04020174592733383, -0.03886932507157326, -0.03753690421581268, -0.03620448336005211, -0.034872062504291534, -0.03353964164853096, -0.032207220792770386, -0.03087479993700981, -0.029542379081249237, -0.028209958225488663, -0.02687753736972809, -0.025545116513967514, -0.02421269565820694, -0.022880274802446365, -0.02154785394668579, -0.020215433090925217, -0.018883012235164642, -0.017550591379404068, -0.016218170523643494, -0.01488574966788292, -0.013553328812122345, -0.01222090795636177, -0.010888487100601196, -0.009556066244840622, -0.008223645389080048, -0.006891224533319473, -0.005558803677558899, -0.004226382821798325, -0.0028939619660377502, -0.001561541110277176, -0.00022912025451660156, 0.0011033006012439728, 0.002435721457004547, 0.0037681423127651215, 0.005100563168525696, 0.00643298402428627, 0.0077654048800468445, 0.009097825735807419, 0.010430246591567993, 0.011762667447328568, 0.013095088303089142, 0.014427509158849716, 0.01575993001461029, 0.017092350870370865, 0.01842477172613144, 0.019757192581892014, 0.021089613437652588, 0.022422034293413162, 0.023754455149173737, 0.02508687600493431, 0.026419296860694885, 0.02775171771645546, 0.029084138572216034, 0.03041655942797661, 0.03174898028373718, 0.03308140113949776, 0.03441382199525833, 0.035746242851018906, 0.03707866370677948, 0.038411084562540054, 0.03974350541830063, 0.0410759262740612, 0.04240834712982178]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 11.0, 9.0, 24.0, 17.0, 22.0, 40.0, 46.0, 92.0, 98.0, 127.0, 209.0, 304.0, 396.0, 606.0, 1040.0, 2548.0, 9293.0, 78308.0, 735044.0, 196700.0, 16316.0, 3448.0, 1413.0, 792.0, 489.0, 334.0, 236.0, 152.0, 122.0, 80.0, 60.0, 48.0, 22.0, 26.0, 18.0, 18.0, 6.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.044158935546875, -0.04276418685913086, -0.04136943817138672, -0.03997468948364258, -0.03857994079589844, -0.0371851921081543, -0.035790443420410156, -0.034395694732666016, -0.033000946044921875, -0.031606197357177734, -0.030211448669433594, -0.028816699981689453, -0.027421951293945312, -0.026027202606201172, -0.02463245391845703, -0.02323770523071289, -0.02184295654296875, -0.02044820785522461, -0.01905345916748047, -0.017658710479736328, -0.016263961791992188, -0.014869213104248047, -0.013474464416503906, -0.012079715728759766, -0.010684967041015625, -0.009290218353271484, -0.007895469665527344, -0.006500720977783203, -0.0051059722900390625, -0.003711223602294922, -0.0023164749145507812, -0.0009217262268066406, 0.0004730224609375, 0.0018677711486816406, 0.0032625198364257812, 0.004657268524169922, 0.0060520172119140625, 0.007446765899658203, 0.008841514587402344, 0.010236263275146484, 0.011631011962890625, 0.013025760650634766, 0.014420509338378906, 0.015815258026123047, 0.017210006713867188, 0.018604755401611328, 0.01999950408935547, 0.02139425277709961, 0.02278900146484375, 0.02418375015258789, 0.02557849884033203, 0.026973247528076172, 0.028367996215820312, 0.029762744903564453, 0.031157493591308594, 0.032552242279052734, 0.033946990966796875, 0.035341739654541016, 0.036736488342285156, 0.0381312370300293, 0.03952598571777344, 0.04092073440551758, 0.04231548309326172, 0.04371023178100586, 0.04510498046875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 35.0, 86.0, 196.0, 255.0, 231.0, 139.0, 30.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.0412602424621582, -0.040162086486816406, -0.03906393051147461, -0.03796577453613281, -0.036867618560791016, -0.03576946258544922, -0.03467130661010742, -0.033573150634765625, -0.03247499465942383, -0.03137683868408203, -0.030278682708740234, -0.029180526733398438, -0.02808237075805664, -0.026984214782714844, -0.025886058807373047, -0.02478790283203125, -0.023689746856689453, -0.022591590881347656, -0.02149343490600586, -0.020395278930664062, -0.019297122955322266, -0.01819896697998047, -0.017100811004638672, -0.016002655029296875, -0.014904499053955078, -0.013806343078613281, -0.012708187103271484, -0.011610031127929688, -0.01051187515258789, -0.009413719177246094, -0.008315563201904297, -0.0072174072265625, -0.006119251251220703, -0.005021095275878906, -0.003922939300537109, -0.0028247833251953125, -0.0017266273498535156, -0.0006284713745117188, 0.0004696846008300781, 0.001567840576171875, 0.002665996551513672, 0.0037641525268554688, 0.004862308502197266, 0.0059604644775390625, 0.007058620452880859, 0.008156776428222656, 0.009254932403564453, 0.01035308837890625, 0.011451244354248047, 0.012549400329589844, 0.01364755630493164, 0.014745712280273438, 0.015843868255615234, 0.01694202423095703, 0.018040180206298828, 0.019138336181640625, 0.020236492156982422, 0.02133464813232422, 0.022432804107666016, 0.023530960083007812, 0.02462911605834961, 0.025727272033691406, 0.026825428009033203, 0.027923583984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 11.0, 18.0, 25.0, 16.0, 29.0, 22.0, 57.0, 63.0, 84.0, 87.0, 136.0, 250.0, 563.0, 1456.0, 4576.0, 17635.0, 80643.0, 346841.0, 439814.0, 120649.0, 25694.0, 6318.0, 1874.0, 729.0, 343.0, 176.0, 113.0, 65.0, 62.0, 47.0, 24.0, 26.0, 17.0, 13.0, 25.0, 5.0, 9.0, 6.0, 11.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0229644775390625, -0.022249698638916016, -0.02153491973876953, -0.020820140838623047, -0.020105361938476562, -0.019390583038330078, -0.018675804138183594, -0.01796102523803711, -0.017246246337890625, -0.01653146743774414, -0.015816688537597656, -0.015101909637451172, -0.014387130737304688, -0.013672351837158203, -0.012957572937011719, -0.012242794036865234, -0.01152801513671875, -0.010813236236572266, -0.010098457336425781, -0.009383678436279297, -0.008668899536132812, -0.007954120635986328, -0.007239341735839844, -0.006524562835693359, -0.005809783935546875, -0.005095005035400391, -0.004380226135253906, -0.003665447235107422, -0.0029506683349609375, -0.002235889434814453, -0.0015211105346679688, -0.0008063316345214844, -9.1552734375e-05, 0.0006232261657714844, 0.0013380050659179688, 0.002052783966064453, 0.0027675628662109375, 0.003482341766357422, 0.004197120666503906, 0.004911899566650391, 0.005626678466796875, 0.006341457366943359, 0.007056236267089844, 0.007771015167236328, 0.008485794067382812, 0.009200572967529297, 0.009915351867675781, 0.010630130767822266, 0.01134490966796875, 0.012059688568115234, 0.012774467468261719, 0.013489246368408203, 0.014204025268554688, 0.014918804168701172, 0.015633583068847656, 0.01634836196899414, 0.017063140869140625, 0.01777791976928711, 0.018492698669433594, 0.019207477569580078, 0.019922256469726562, 0.020637035369873047, 0.02135181427001953, 0.022066593170166016, 0.0227813720703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 3.0, 14.0, 16.0, 7.0, 12.0, 16.0, 22.0, 28.0, 28.0, 26.0, 35.0, 40.0, 33.0, 26.0, 45.0, 44.0, 45.0, 38.0, 46.0, 43.0, 47.0, 36.0, 45.0, 38.0, 35.0, 22.0, 24.0, 29.0, 15.0, 24.0, 15.0, 16.0, 11.0, 12.0, 8.0, 15.0, 6.0, 3.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0175933837890625, -0.017058610916137695, -0.01652383804321289, -0.015989065170288086, -0.015454292297363281, -0.014919519424438477, -0.014384746551513672, -0.013849973678588867, -0.013315200805664062, -0.012780427932739258, -0.012245655059814453, -0.011710882186889648, -0.011176109313964844, -0.010641336441040039, -0.010106563568115234, -0.00957179069519043, -0.009037017822265625, -0.00850224494934082, -0.007967472076416016, -0.007432699203491211, -0.006897926330566406, -0.0063631534576416016, -0.005828380584716797, -0.005293607711791992, -0.0047588348388671875, -0.004224061965942383, -0.003689289093017578, -0.0031545162200927734, -0.0026197433471679688, -0.002084970474243164, -0.0015501976013183594, -0.0010154247283935547, -0.00048065185546875, 5.412101745605469e-05, 0.0005888938903808594, 0.001123666763305664, 0.0016584396362304688, 0.0021932125091552734, 0.002727985382080078, 0.003262758255004883, 0.0037975311279296875, 0.004332304000854492, 0.004867076873779297, 0.0054018497467041016, 0.005936622619628906, 0.006471395492553711, 0.007006168365478516, 0.00754094123840332, 0.008075714111328125, 0.00861048698425293, 0.009145259857177734, 0.009680032730102539, 0.010214805603027344, 0.010749578475952148, 0.011284351348876953, 0.011819124221801758, 0.012353897094726562, 0.012888669967651367, 0.013423442840576172, 0.013958215713500977, 0.014492988586425781, 0.015027761459350586, 0.01556253433227539, 0.016097307205200195, 0.016632080078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 7.0, 11.0, 17.0, 19.0, 40.0, 53.0, 77.0, 108.0, 157.0, 215.0, 360.0, 582.0, 884.0, 1571.0, 3197.0, 6859.0, 16518.0, 49548.0, 207068.0, 529925.0, 162990.0, 40946.0, 14467.0, 6062.0, 2894.0, 1549.0, 899.0, 510.0, 359.0, 231.0, 147.0, 96.0, 63.0, 43.0, 28.0, 22.0, 15.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00937652587890625, -0.009078145027160645, -0.008779764175415039, -0.008481383323669434, -0.008183002471923828, -0.007884621620178223, -0.007586240768432617, -0.007287859916687012, -0.006989479064941406, -0.006691098213195801, -0.006392717361450195, -0.00609433650970459, -0.005795955657958984, -0.005497574806213379, -0.0051991939544677734, -0.004900813102722168, -0.0046024322509765625, -0.004304051399230957, -0.0040056705474853516, -0.003707289695739746, -0.0034089088439941406, -0.003110527992248535, -0.0028121471405029297, -0.0025137662887573242, -0.0022153854370117188, -0.0019170045852661133, -0.0016186237335205078, -0.0013202428817749023, -0.0010218620300292969, -0.0007234811782836914, -0.00042510032653808594, -0.00012671947479248047, 0.000171661376953125, 0.00047004222869873047, 0.0007684230804443359, 0.0010668039321899414, 0.0013651847839355469, 0.0016635656356811523, 0.001961946487426758, 0.0022603273391723633, 0.0025587081909179688, 0.0028570890426635742, 0.0031554698944091797, 0.003453850746154785, 0.0037522315979003906, 0.004050612449645996, 0.0043489933013916016, 0.004647374153137207, 0.0049457550048828125, 0.005244135856628418, 0.0055425167083740234, 0.005840897560119629, 0.006139278411865234, 0.00643765926361084, 0.006736040115356445, 0.007034420967102051, 0.007332801818847656, 0.007631182670593262, 0.007929563522338867, 0.008227944374084473, 0.008526325225830078, 0.008824706077575684, 0.009123086929321289, 0.009421467781066895, 0.0097198486328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 3.0, 4.0, 13.0, 12.0, 11.0, 12.0, 16.0, 17.0, 22.0, 24.0, 36.0, 41.0, 36.0, 42.0, 63.0, 56.0, 57.0, 59.0, 65.0, 63.0, 51.0, 34.0, 36.0, 37.0, 31.0, 28.0, 17.0, 20.0, 15.0, 18.0, 10.0, 4.0, 9.0, 8.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.612041473388672e-05, -3.492273390293121e-05, -3.372505307197571e-05, -3.25273722410202e-05, -3.13296914100647e-05, -3.0132010579109192e-05, -2.8934329748153687e-05, -2.773664891719818e-05, -2.6538968086242676e-05, -2.534128725528717e-05, -2.4143606424331665e-05, -2.294592559337616e-05, -2.1748244762420654e-05, -2.055056393146515e-05, -1.9352883100509644e-05, -1.8155202269554138e-05, -1.6957521438598633e-05, -1.5759840607643127e-05, -1.4562159776687622e-05, -1.3364478945732117e-05, -1.2166798114776611e-05, -1.0969117283821106e-05, -9.7714364528656e-06, -8.573755621910095e-06, -7.37607479095459e-06, -6.1783939599990845e-06, -4.980713129043579e-06, -3.7830322980880737e-06, -2.5853514671325684e-06, -1.387670636177063e-06, -1.8998980522155762e-07, 1.0076910257339478e-06, 2.205371856689453e-06, 3.4030526876449585e-06, 4.600733518600464e-06, 5.798414349555969e-06, 6.996095180511475e-06, 8.19377601146698e-06, 9.391456842422485e-06, 1.058913767337799e-05, 1.1786818504333496e-05, 1.2984499335289001e-05, 1.4182180166244507e-05, 1.5379860997200012e-05, 1.6577541828155518e-05, 1.7775222659111023e-05, 1.897290349006653e-05, 2.0170584321022034e-05, 2.136826515197754e-05, 2.2565945982933044e-05, 2.376362681388855e-05, 2.4961307644844055e-05, 2.615898847579956e-05, 2.7356669306755066e-05, 2.855435013771057e-05, 2.9752030968666077e-05, 3.094971179962158e-05, 3.214739263057709e-05, 3.334507346153259e-05, 3.45427542924881e-05, 3.5740435123443604e-05, 3.693811595439911e-05, 3.8135796785354614e-05, 3.933347761631012e-05, 4.0531158447265625e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 5.0, 10.0, 13.0, 23.0, 31.0, 58.0, 82.0, 172.0, 349.0, 675.0, 1481.0, 3511.0, 9000.0, 27729.0, 129061.0, 642353.0, 181375.0, 34325.0, 10818.0, 4178.0, 1698.0, 796.0, 367.0, 177.0, 84.0, 55.0, 37.0, 18.0, 15.0, 8.0, 6.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01335906982421875, -0.012922286987304688, -0.012485504150390625, -0.012048721313476562, -0.0116119384765625, -0.011175155639648438, -0.010738372802734375, -0.010301589965820312, -0.00986480712890625, -0.009428024291992188, -0.008991241455078125, -0.008554458618164062, -0.00811767578125, -0.0076808929443359375, -0.007244110107421875, -0.0068073272705078125, -0.00637054443359375, -0.0059337615966796875, -0.005496978759765625, -0.0050601959228515625, -0.0046234130859375, -0.0041866302490234375, -0.003749847412109375, -0.0033130645751953125, -0.00287628173828125, -0.0024394989013671875, -0.002002716064453125, -0.0015659332275390625, -0.001129150390625, -0.0006923675537109375, -0.000255584716796875, 0.0001811981201171875, 0.00061798095703125, 0.0010547637939453125, 0.001491546630859375, 0.0019283294677734375, 0.0023651123046875, 0.0028018951416015625, 0.003238677978515625, 0.0036754608154296875, 0.00411224365234375, 0.0045490264892578125, 0.004985809326171875, 0.0054225921630859375, 0.005859375, 0.0062961578369140625, 0.006732940673828125, 0.0071697235107421875, 0.00760650634765625, 0.008043289184570312, 0.008480072021484375, 0.008916854858398438, 0.0093536376953125, 0.009790420532226562, 0.010227203369140625, 0.010663986206054688, 0.01110076904296875, 0.011537551879882812, 0.011974334716796875, 0.012411117553710938, 0.012847900390625, 0.013284683227539062, 0.013721466064453125, 0.014158248901367188, 0.01459503173828125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 8.0, 9.0, 11.0, 24.0, 23.0, 59.0, 81.0, 101.0, 115.0, 125.0, 97.0, 79.0, 69.0, 35.0, 28.0, 30.0, 22.0, 13.0, 4.0, 12.0, 9.0, 4.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01129150390625, -0.011002719402313232, -0.010713934898376465, -0.010425150394439697, -0.01013636589050293, -0.009847581386566162, -0.009558796882629395, -0.009270012378692627, -0.00898122787475586, -0.008692443370819092, -0.008403658866882324, -0.008114874362945557, -0.007826089859008789, -0.0075373053550720215, -0.007248520851135254, -0.006959736347198486, -0.006670951843261719, -0.006382167339324951, -0.006093382835388184, -0.005804598331451416, -0.0055158138275146484, -0.005227029323577881, -0.004938244819641113, -0.004649460315704346, -0.004360675811767578, -0.0040718913078308105, -0.003783106803894043, -0.0034943222999572754, -0.003205537796020508, -0.0029167532920837402, -0.0026279687881469727, -0.002339184284210205, -0.0020503997802734375, -0.00176161527633667, -0.0014728307723999023, -0.0011840462684631348, -0.0008952617645263672, -0.0006064772605895996, -0.00031769275665283203, -2.8908252716064453e-05, 0.0002598762512207031, 0.0005486607551574707, 0.0008374452590942383, 0.0011262297630310059, 0.0014150142669677734, 0.001703798770904541, 0.0019925832748413086, 0.002281367778778076, 0.0025701522827148438, 0.0028589367866516113, 0.003147721290588379, 0.0034365057945251465, 0.003725290298461914, 0.004014074802398682, 0.004302859306335449, 0.004591643810272217, 0.004880428314208984, 0.005169212818145752, 0.0054579973220825195, 0.005746781826019287, 0.006035566329956055, 0.006324350833892822, 0.00661313533782959, 0.006901919841766357, 0.007190704345703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 35.0, 115.0, 346.0, 351.0, 123.0, 20.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07965835928916931, -0.07075013220310211, -0.06184190511703491, -0.05293367803096771, -0.04402545094490051, -0.03511722385883331, -0.026208996772766113, -0.017300769686698914, -0.008392542600631714, 0.0005156844854354858, 0.009423911571502686, 0.018332138657569885, 0.027240365743637085, 0.036148592829704285, 0.045056819915771484, 0.053965047001838684, 0.06287327408790588, 0.07178150117397308, 0.08068972826004028, 0.08959795534610748, 0.09850618243217468, 0.10741440951824188, 0.11632263660430908, 0.12523086369037628, 0.13413909077644348, 0.14304731786251068, 0.15195554494857788, 0.16086377203464508, 0.16977199912071228, 0.17868022620677948, 0.18758845329284668, 0.19649668037891388, 0.20540493726730347, 0.21431316435337067, 0.22322139143943787, 0.23212961852550507, 0.24103784561157227, 0.24994607269763947, 0.25885429978370667, 0.26776254177093506, 0.27667075395584106, 0.28557896614074707, 0.29448720812797546, 0.30339545011520386, 0.31230366230010986, 0.32121187448501587, 0.33012011647224426, 0.33902835845947266, 0.34793657064437866, 0.35684478282928467, 0.36575302481651306, 0.37466126680374146, 0.38356947898864746, 0.39247769117355347, 0.40138593316078186, 0.41029417514801025, 0.41920238733291626, 0.42811059951782227, 0.43701884150505066, 0.44592708349227905, 0.45483529567718506, 0.46374350786209106, 0.47265174984931946, 0.48155999183654785, 0.49046820402145386]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 12.0, 5.0, 8.0, 9.0, 11.0, 18.0, 16.0, 25.0, 22.0, 33.0, 41.0, 33.0, 39.0, 47.0, 55.0, 54.0, 49.0, 49.0, 36.0, 50.0, 44.0, 56.0, 35.0, 34.0, 37.0, 26.0, 23.0, 26.0, 23.0, 21.0, 13.0, 15.0, 9.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057605743408203125, -0.05559876561164856, -0.053591787815093994, -0.05158481374382973, -0.04957783594727516, -0.047570858150720596, -0.04556388407945633, -0.043556906282901764, -0.0415499284863472, -0.03954295068979263, -0.03753597289323807, -0.0355289988219738, -0.033522021025419235, -0.03151504322886467, -0.029508067294955254, -0.027501091361045837, -0.025494113564491272, -0.023487135767936707, -0.02148015983402729, -0.019473183900117874, -0.01746620610356331, -0.015459229238331318, -0.013452252373099327, -0.011445275507867336, -0.009438298642635345, -0.007431321777403355, -0.005424344912171364, -0.003417368046939373, -0.0014103911817073822, 0.0005965856835246086, 0.0026035625487565994, 0.00461053941398859, 0.006617516279220581, 0.008624493144452572, 0.010631470009684563, 0.012638446874916553, 0.014645423740148544, 0.01665240153670311, 0.018659377470612526, 0.020666353404521942, 0.022673331201076508, 0.024680308997631073, 0.02668728493154049, 0.028694260865449905, 0.03070123866200447, 0.032708216458559036, 0.0347151905298233, 0.03672216832637787, 0.038729146122932434, 0.040736123919487, 0.042743101716041565, 0.04475007578730583, 0.0467570535838604, 0.04876403138041496, 0.05077100545167923, 0.052777983248233795, 0.05478496104478836, 0.056791938841342926, 0.05879891663789749, 0.06080589070916176, 0.06281286478042603, 0.06481984257698059, 0.06682682037353516, 0.06883379817008972, 0.07084077596664429]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 3.0, 3.0, 4.0, 13.0, 16.0, 13.0, 21.0, 38.0, 58.0, 111.0, 175.0, 407.0, 1133.0, 4686.0, 74569.0, 4074687.0, 32392.0, 4062.0, 1123.0, 351.0, 175.0, 81.0, 59.0, 31.0, 24.0, 12.0, 10.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06512451171875, -0.06328392028808594, -0.061443328857421875, -0.05960273742675781, -0.05776214599609375, -0.05592155456542969, -0.054080963134765625, -0.05224037170410156, -0.0503997802734375, -0.04855918884277344, -0.046718597412109375, -0.04487800598144531, -0.04303741455078125, -0.04119682312011719, -0.039356231689453125, -0.03751564025878906, -0.035675048828125, -0.03383445739746094, -0.031993865966796875, -0.030153274536132812, -0.02831268310546875, -0.026472091674804688, -0.024631500244140625, -0.022790908813476562, -0.0209503173828125, -0.019109725952148438, -0.017269134521484375, -0.015428543090820312, -0.01358795166015625, -0.011747360229492188, -0.009906768798828125, -0.008066177368164062, -0.0062255859375, -0.0043849945068359375, -0.002544403076171875, -0.0007038116455078125, 0.00113677978515625, 0.0029773712158203125, 0.004817962646484375, 0.0066585540771484375, 0.0084991455078125, 0.010339736938476562, 0.012180328369140625, 0.014020919799804688, 0.01586151123046875, 0.017702102661132812, 0.019542694091796875, 0.021383285522460938, 0.023223876953125, 0.025064468383789062, 0.026905059814453125, 0.028745651245117188, 0.03058624267578125, 0.03242683410644531, 0.034267425537109375, 0.03610801696777344, 0.0379486083984375, 0.03978919982910156, 0.041629791259765625, 0.04347038269042969, 0.04531097412109375, 0.04715156555175781, 0.048992156982421875, 0.05083274841308594, 0.05267333984375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 11.0, 36.0, 103.0, 218.0, 259.0, 208.0, 128.0, 24.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043182373046875, -0.04208731651306152, -0.04099225997924805, -0.03989720344543457, -0.038802146911621094, -0.03770709037780762, -0.03661203384399414, -0.035516977310180664, -0.03442192077636719, -0.03332686424255371, -0.032231807708740234, -0.031136751174926758, -0.03004169464111328, -0.028946638107299805, -0.027851581573486328, -0.02675652503967285, -0.025661468505859375, -0.0245664119720459, -0.023471355438232422, -0.022376298904418945, -0.02128124237060547, -0.020186185836791992, -0.019091129302978516, -0.01799607276916504, -0.016901016235351562, -0.015805959701538086, -0.01471090316772461, -0.013615846633911133, -0.012520790100097656, -0.01142573356628418, -0.010330677032470703, -0.009235620498657227, -0.00814056396484375, -0.0070455074310302734, -0.005950450897216797, -0.00485539436340332, -0.0037603378295898438, -0.002665281295776367, -0.0015702247619628906, -0.00047516822814941406, 0.0006198883056640625, 0.001714944839477539, 0.0028100013732910156, 0.003905057907104492, 0.005000114440917969, 0.006095170974731445, 0.007190227508544922, 0.008285284042358398, 0.009380340576171875, 0.010475397109985352, 0.011570453643798828, 0.012665510177612305, 0.013760566711425781, 0.014855623245239258, 0.015950679779052734, 0.01704573631286621, 0.018140792846679688, 0.019235849380493164, 0.02033090591430664, 0.021425962448120117, 0.022521018981933594, 0.02361607551574707, 0.024711132049560547, 0.025806188583374023, 0.0269012451171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 5.0, 15.0, 11.0, 15.0, 29.0, 33.0, 46.0, 50.0, 90.0, 115.0, 221.0, 300.0, 497.0, 860.0, 1596.0, 3289.0, 7172.0, 18744.0, 56012.0, 219673.0, 3021580.0, 700965.0, 109278.0, 32114.0, 11661.0, 4809.0, 2163.0, 1165.0, 663.0, 383.0, 239.0, 156.0, 84.0, 65.0, 55.0, 38.0, 19.0, 14.0, 11.0, 15.0, 9.0, 7.0, 8.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0116119384765625, -0.011208176612854004, -0.010804414749145508, -0.010400652885437012, -0.009996891021728516, -0.00959312915802002, -0.009189367294311523, -0.008785605430603027, -0.008381843566894531, -0.007978081703186035, -0.007574319839477539, -0.007170557975769043, -0.006766796112060547, -0.006363034248352051, -0.005959272384643555, -0.005555510520935059, -0.0051517486572265625, -0.004747986793518066, -0.00434422492980957, -0.003940463066101074, -0.003536701202392578, -0.003132939338684082, -0.002729177474975586, -0.00232541561126709, -0.0019216537475585938, -0.0015178918838500977, -0.0011141300201416016, -0.0007103681564331055, -0.0003066062927246094, 9.715557098388672e-05, 0.0005009174346923828, 0.0009046792984008789, 0.001308441162109375, 0.001712203025817871, 0.002115964889526367, 0.0025197267532348633, 0.0029234886169433594, 0.0033272504806518555, 0.0037310123443603516, 0.004134774208068848, 0.004538536071777344, 0.00494229793548584, 0.005346059799194336, 0.005749821662902832, 0.006153583526611328, 0.006557345390319824, 0.00696110725402832, 0.007364869117736816, 0.0077686309814453125, 0.008172392845153809, 0.008576154708862305, 0.0089799165725708, 0.009383678436279297, 0.009787440299987793, 0.010191202163696289, 0.010594964027404785, 0.010998725891113281, 0.011402487754821777, 0.011806249618530273, 0.01221001148223877, 0.012613773345947266, 0.013017535209655762, 0.013421297073364258, 0.013825058937072754, 0.01422882080078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 9.0, 6.0, 12.0, 16.0, 26.0, 27.0, 42.0, 64.0, 83.0, 123.0, 217.0, 449.0, 1148.0, 940.0, 361.0, 176.0, 99.0, 70.0, 50.0, 44.0, 27.0, 15.0, 11.0, 13.0, 5.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01171875, -0.011425018310546875, -0.01113128662109375, -0.010837554931640625, -0.0105438232421875, -0.010250091552734375, -0.00995635986328125, -0.009662628173828125, -0.009368896484375, -0.009075164794921875, -0.00878143310546875, -0.008487701416015625, -0.0081939697265625, -0.007900238037109375, -0.00760650634765625, -0.007312774658203125, -0.00701904296875, -0.006725311279296875, -0.00643157958984375, -0.006137847900390625, -0.0058441162109375, -0.005550384521484375, -0.00525665283203125, -0.004962921142578125, -0.004669189453125, -0.004375457763671875, -0.00408172607421875, -0.003787994384765625, -0.0034942626953125, -0.003200531005859375, -0.00290679931640625, -0.002613067626953125, -0.0023193359375, -0.002025604248046875, -0.00173187255859375, -0.001438140869140625, -0.0011444091796875, -0.000850677490234375, -0.00055694580078125, -0.000263214111328125, 3.0517578125e-05, 0.000324249267578125, 0.00061798095703125, 0.000911712646484375, 0.0012054443359375, 0.001499176025390625, 0.00179290771484375, 0.002086639404296875, 0.00238037109375, 0.002674102783203125, 0.00296783447265625, 0.003261566162109375, 0.0035552978515625, 0.003849029541015625, 0.00414276123046875, 0.004436492919921875, 0.004730224609375, 0.005023956298828125, 0.00531768798828125, 0.005611419677734375, 0.0059051513671875, 0.006198883056640625, 0.00649261474609375, 0.006786346435546875, 0.007080078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 31.0, 86.0, 163.0, 256.0, 245.0, 122.0, 54.0, 17.0, 13.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07017068564891815, -0.06733938306570053, -0.06450808793306351, -0.061676785349845886, -0.058845486491918564, -0.05601418763399124, -0.05318288505077362, -0.0503515861928463, -0.047520287334918976, -0.04468898847699165, -0.04185768589377403, -0.03902638703584671, -0.03619508817791939, -0.033363789319992065, -0.030532486736774445, -0.027701187878847122, -0.0248698852956295, -0.02203858457505703, -0.019207285717129707, -0.016375984996557236, -0.013544685207307339, -0.010713385418057442, -0.00788208469748497, -0.005050785839557648, -0.002219485118985176, 0.0006118149030953646, 0.0034431149251759052, 0.0062744151800870895, 0.009105714969336987, 0.011937014758586884, 0.014768315479159355, 0.017599614337086678, 0.02043091505765915, 0.02326221577823162, 0.026093514636158943, 0.028924815356731415, 0.03175611421465874, 0.03458741307258606, 0.03741871565580368, 0.040250014513731, 0.043081313371658325, 0.04591261222958565, 0.04874391481280327, 0.05157521367073059, 0.05440651252865791, 0.057237811386585236, 0.060069113969802856, 0.06290040910243988, 0.0657317191362381, 0.06856302171945572, 0.07139431685209274, 0.07422561943531036, 0.07705692201852798, 0.07988821715116501, 0.08271951973438263, 0.08555081486701965, 0.08838211745023727, 0.0912134200334549, 0.09404471516609192, 0.09687601774930954, 0.09970732033252716, 0.10253861546516418, 0.1053699180483818, 0.10820122063159943, 0.11103251576423645]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 15.0, 12.0, 12.0, 15.0, 27.0, 29.0, 29.0, 47.0, 40.0, 30.0, 62.0, 47.0, 37.0, 40.0, 40.0, 54.0, 51.0, 46.0, 50.0, 23.0, 34.0, 47.0, 26.0, 31.0, 22.0, 23.0, 20.0, 21.0, 14.0, 10.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.028755545616149902, -0.028004396706819534, -0.027253245934844017, -0.0265020951628685, -0.02575094625353813, -0.024999797344207764, -0.024248646572232246, -0.02349749580025673, -0.02274634689092636, -0.021995197981595993, -0.021244047209620476, -0.02049289643764496, -0.01974174752831459, -0.018990598618984222, -0.018239447847008705, -0.017488297075033188, -0.01673714816570282, -0.015985999256372452, -0.015234848484396935, -0.014483698643743992, -0.01373254880309105, -0.012981398962438107, -0.012230249121785164, -0.011479099281132221, -0.010727949440479279, -0.009976799599826336, -0.009225649759173393, -0.00847449991852045, -0.007723350077867508, -0.006972200237214565, -0.006221050396561623, -0.00546990055590868, -0.004718750715255737, -0.003967600874602795, -0.003216451033949852, -0.0024653011932969093, -0.0017141513526439667, -0.000963001511991024, -0.00021185167133808136, 0.0005392981693148613, 0.001290448009967804, 0.0020415978506207466, 0.0027927476912736893, 0.003543897531926632, 0.004295047372579575, 0.005046197213232517, 0.00579734705388546, 0.0065484968945384026, 0.007299646735191345, 0.008050796575844288, 0.00880194641649723, 0.009553096257150173, 0.010304246097803116, 0.011055395938456059, 0.011806545779109001, 0.012557695619761944, 0.013308845460414886, 0.014059995301067829, 0.014811145141720772, 0.015562294982373714, 0.016313444823026657, 0.017064593732357025, 0.017815744504332542, 0.01856689527630806, 0.019318044185638428]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 12.0, 18.0, 20.0, 32.0, 45.0, 66.0, 76.0, 112.0, 137.0, 201.0, 268.0, 385.0, 625.0, 1101.0, 2149.0, 7587.0, 65372.0, 702387.0, 241531.0, 18974.0, 3514.0, 1424.0, 781.0, 483.0, 356.0, 247.0, 169.0, 125.0, 92.0, 52.0, 50.0, 32.0, 34.0, 21.0, 16.0, 11.0, 11.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.03997802734375, -0.038793087005615234, -0.03760814666748047, -0.0364232063293457, -0.03523826599121094, -0.03405332565307617, -0.032868385314941406, -0.03168344497680664, -0.030498504638671875, -0.02931356430053711, -0.028128623962402344, -0.026943683624267578, -0.025758743286132812, -0.024573802947998047, -0.02338886260986328, -0.022203922271728516, -0.02101898193359375, -0.019834041595458984, -0.01864910125732422, -0.017464160919189453, -0.016279220581054688, -0.015094280242919922, -0.013909339904785156, -0.01272439956665039, -0.011539459228515625, -0.01035451889038086, -0.009169578552246094, -0.007984638214111328, -0.0067996978759765625, -0.005614757537841797, -0.004429817199707031, -0.0032448768615722656, -0.0020599365234375, -0.0008749961853027344, 0.00030994415283203125, 0.0014948844909667969, 0.0026798248291015625, 0.003864765167236328, 0.005049705505371094, 0.006234645843505859, 0.007419586181640625, 0.00860452651977539, 0.009789466857910156, 0.010974407196044922, 0.012159347534179688, 0.013344287872314453, 0.014529228210449219, 0.015714168548583984, 0.01689910888671875, 0.018084049224853516, 0.01926898956298828, 0.020453929901123047, 0.021638870239257812, 0.022823810577392578, 0.024008750915527344, 0.02519369125366211, 0.026378631591796875, 0.02756357192993164, 0.028748512268066406, 0.029933452606201172, 0.031118392944335938, 0.0323033332824707, 0.03348827362060547, 0.034673213958740234, 0.035858154296875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 24.0, 54.0, 148.0, 258.0, 239.0, 176.0, 68.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041168212890625, -0.04011249542236328, -0.03905677795410156, -0.038001060485839844, -0.036945343017578125, -0.035889625549316406, -0.03483390808105469, -0.03377819061279297, -0.03272247314453125, -0.03166675567626953, -0.030611038208007812, -0.029555320739746094, -0.028499603271484375, -0.027443885803222656, -0.026388168334960938, -0.02533245086669922, -0.0242767333984375, -0.02322101593017578, -0.022165298461914062, -0.021109580993652344, -0.020053863525390625, -0.018998146057128906, -0.017942428588867188, -0.01688671112060547, -0.01583099365234375, -0.014775276184082031, -0.013719558715820312, -0.012663841247558594, -0.011608123779296875, -0.010552406311035156, -0.009496688842773438, -0.008440971374511719, -0.00738525390625, -0.006329536437988281, -0.0052738189697265625, -0.004218101501464844, -0.003162384033203125, -0.0021066665649414062, -0.0010509490966796875, 4.76837158203125e-06, 0.00106048583984375, 0.0021162033081054688, 0.0031719207763671875, 0.004227638244628906, 0.005283355712890625, 0.006339073181152344, 0.0073947906494140625, 0.008450508117675781, 0.0095062255859375, 0.010561943054199219, 0.011617660522460938, 0.012673377990722656, 0.013729095458984375, 0.014784812927246094, 0.015840530395507812, 0.01689624786376953, 0.01795196533203125, 0.01900768280029297, 0.020063400268554688, 0.021119117736816406, 0.022174835205078125, 0.023230552673339844, 0.024286270141601562, 0.02534198760986328, 0.026397705078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 12.0, 9.0, 24.0, 21.0, 24.0, 52.0, 57.0, 76.0, 82.0, 122.0, 267.0, 604.0, 1819.0, 7412.0, 36915.0, 238498.0, 587351.0, 143913.0, 23739.0, 4973.0, 1409.0, 432.0, 226.0, 125.0, 85.0, 70.0, 51.0, 44.0, 26.0, 25.0, 19.0, 13.0, 19.0, 11.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02484130859375, -0.02407383918762207, -0.02330636978149414, -0.02253890037536621, -0.02177143096923828, -0.02100396156311035, -0.020236492156982422, -0.019469022750854492, -0.018701553344726562, -0.017934083938598633, -0.017166614532470703, -0.016399145126342773, -0.015631675720214844, -0.014864206314086914, -0.014096736907958984, -0.013329267501831055, -0.012561798095703125, -0.011794328689575195, -0.011026859283447266, -0.010259389877319336, -0.009491920471191406, -0.008724451065063477, -0.007956981658935547, -0.007189512252807617, -0.0064220428466796875, -0.005654573440551758, -0.004887104034423828, -0.0041196346282958984, -0.0033521652221679688, -0.002584695816040039, -0.0018172264099121094, -0.0010497570037841797, -0.00028228759765625, 0.0004851818084716797, 0.0012526512145996094, 0.002020120620727539, 0.0027875900268554688, 0.0035550594329833984, 0.004322528839111328, 0.005089998245239258, 0.0058574676513671875, 0.006624937057495117, 0.007392406463623047, 0.008159875869750977, 0.008927345275878906, 0.009694814682006836, 0.010462284088134766, 0.011229753494262695, 0.011997222900390625, 0.012764692306518555, 0.013532161712646484, 0.014299631118774414, 0.015067100524902344, 0.015834569931030273, 0.016602039337158203, 0.017369508743286133, 0.018136978149414062, 0.018904447555541992, 0.019671916961669922, 0.02043938636779785, 0.02120685577392578, 0.02197432518005371, 0.02274179458618164, 0.02350926399230957, 0.0242767333984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 4.0, 15.0, 12.0, 10.0, 18.0, 20.0, 29.0, 38.0, 39.0, 48.0, 43.0, 48.0, 47.0, 52.0, 50.0, 42.0, 60.0, 64.0, 50.0, 50.0, 43.0, 38.0, 38.0, 30.0, 19.0, 20.0, 13.0, 11.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.019025325775146484, -0.01839733123779297, -0.017769336700439453, -0.017141342163085938, -0.016513347625732422, -0.015885353088378906, -0.01525735855102539, -0.014629364013671875, -0.01400136947631836, -0.013373374938964844, -0.012745380401611328, -0.012117385864257812, -0.011489391326904297, -0.010861396789550781, -0.010233402252197266, -0.00960540771484375, -0.008977413177490234, -0.008349418640136719, -0.007721424102783203, -0.0070934295654296875, -0.006465435028076172, -0.005837440490722656, -0.005209445953369141, -0.004581451416015625, -0.003953456878662109, -0.0033254623413085938, -0.002697467803955078, -0.0020694732666015625, -0.0014414787292480469, -0.0008134841918945312, -0.00018548965454101562, 0.0004425048828125, 0.0010704994201660156, 0.0016984939575195312, 0.002326488494873047, 0.0029544830322265625, 0.003582477569580078, 0.004210472106933594, 0.004838466644287109, 0.005466461181640625, 0.006094455718994141, 0.006722450256347656, 0.007350444793701172, 0.007978439331054688, 0.008606433868408203, 0.009234428405761719, 0.009862422943115234, 0.01049041748046875, 0.011118412017822266, 0.011746406555175781, 0.012374401092529297, 0.013002395629882812, 0.013630390167236328, 0.014258384704589844, 0.01488637924194336, 0.015514373779296875, 0.01614236831665039, 0.016770362854003906, 0.017398357391357422, 0.018026351928710938, 0.018654346466064453, 0.01928234100341797, 0.019910335540771484, 0.020538330078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 13.0, 11.0, 16.0, 27.0, 65.0, 86.0, 127.0, 232.0, 446.0, 859.0, 1860.0, 4843.0, 34402.0, 898134.0, 95535.0, 7304.0, 2325.0, 1021.0, 536.0, 285.0, 175.0, 92.0, 47.0, 35.0, 29.0, 14.0, 7.0, 9.0, 5.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0259552001953125, -0.02510833740234375, -0.024261474609375, -0.02341461181640625, -0.0225677490234375, -0.02172088623046875, -0.0208740234375, -0.02002716064453125, -0.0191802978515625, -0.01833343505859375, -0.017486572265625, -0.01663970947265625, -0.0157928466796875, -0.01494598388671875, -0.01409912109375, -0.01325225830078125, -0.0124053955078125, -0.01155853271484375, -0.010711669921875, -0.00986480712890625, -0.0090179443359375, -0.00817108154296875, -0.00732421875, -0.00647735595703125, -0.0056304931640625, -0.00478363037109375, -0.003936767578125, -0.00308990478515625, -0.0022430419921875, -0.00139617919921875, -0.00054931640625, 0.00029754638671875, 0.0011444091796875, 0.00199127197265625, 0.002838134765625, 0.00368499755859375, 0.0045318603515625, 0.00537872314453125, 0.0062255859375, 0.00707244873046875, 0.0079193115234375, 0.00876617431640625, 0.009613037109375, 0.01045989990234375, 0.0113067626953125, 0.01215362548828125, 0.01300048828125, 0.01384735107421875, 0.0146942138671875, 0.01554107666015625, 0.016387939453125, 0.01723480224609375, 0.0180816650390625, 0.01892852783203125, 0.019775390625, 0.02062225341796875, 0.0214691162109375, 0.02231597900390625, 0.023162841796875, 0.02400970458984375, 0.0248565673828125, 0.02570343017578125, 0.02655029296875, 0.02739715576171875, 0.0282440185546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 7.0, 3.0, 4.0, 16.0, 21.0, 22.0, 33.0, 49.0, 60.0, 63.0, 82.0, 122.0, 110.0, 106.0, 64.0, 54.0, 48.0, 30.0, 16.0, 17.0, 15.0, 12.0, 9.0, 6.0, 4.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.543231964111328e-05, -5.3120777010917664e-05, -5.0809234380722046e-05, -4.849769175052643e-05, -4.618614912033081e-05, -4.387460649013519e-05, -4.1563063859939575e-05, -3.925152122974396e-05, -3.693997859954834e-05, -3.462843596935272e-05, -3.2316893339157104e-05, -3.0005350708961487e-05, -2.769380807876587e-05, -2.538226544857025e-05, -2.3070722818374634e-05, -2.0759180188179016e-05, -1.84476375579834e-05, -1.613609492778778e-05, -1.3824552297592163e-05, -1.1513009667396545e-05, -9.201467037200928e-06, -6.88992440700531e-06, -4.578381776809692e-06, -2.2668391466140747e-06, 4.470348358154297e-08, 2.3562461137771606e-06, 4.667788743972778e-06, 6.979331374168396e-06, 9.290874004364014e-06, 1.1602416634559631e-05, 1.3913959264755249e-05, 1.6225501894950867e-05, 1.8537044525146484e-05, 2.0848587155342102e-05, 2.316012978553772e-05, 2.5471672415733337e-05, 2.7783215045928955e-05, 3.0094757676124573e-05, 3.240630030632019e-05, 3.471784293651581e-05, 3.7029385566711426e-05, 3.9340928196907043e-05, 4.165247082710266e-05, 4.396401345729828e-05, 4.6275556087493896e-05, 4.8587098717689514e-05, 5.089864134788513e-05, 5.321018397808075e-05, 5.552172660827637e-05, 5.7833269238471985e-05, 6.01448118686676e-05, 6.245635449886322e-05, 6.476789712905884e-05, 6.707943975925446e-05, 6.939098238945007e-05, 7.170252501964569e-05, 7.401406764984131e-05, 7.632561028003693e-05, 7.863715291023254e-05, 8.094869554042816e-05, 8.326023817062378e-05, 8.55717808008194e-05, 8.788332343101501e-05, 9.019486606121063e-05, 9.250640869140625e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 20.0, 12.0, 21.0, 36.0, 55.0, 63.0, 103.0, 166.0, 192.0, 313.0, 427.0, 719.0, 1189.0, 2084.0, 3961.0, 9358.0, 31247.0, 179457.0, 658802.0, 120516.0, 23568.0, 7833.0, 3397.0, 1835.0, 1177.0, 675.0, 388.0, 257.0, 219.0, 149.0, 101.0, 56.0, 35.0, 39.0, 23.0, 18.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.01378631591796875, -0.013407588005065918, -0.013028860092163086, -0.012650132179260254, -0.012271404266357422, -0.01189267635345459, -0.011513948440551758, -0.011135220527648926, -0.010756492614746094, -0.010377764701843262, -0.00999903678894043, -0.009620308876037598, -0.009241580963134766, -0.008862853050231934, -0.008484125137329102, -0.00810539722442627, -0.0077266693115234375, -0.0073479413986206055, -0.0069692134857177734, -0.006590485572814941, -0.006211757659912109, -0.005833029747009277, -0.005454301834106445, -0.005075573921203613, -0.004696846008300781, -0.004318118095397949, -0.003939390182495117, -0.003560662269592285, -0.003181934356689453, -0.002803206443786621, -0.002424478530883789, -0.002045750617980957, -0.001667022705078125, -0.001288294792175293, -0.0009095668792724609, -0.0005308389663696289, -0.00015211105346679688, 0.00022661685943603516, 0.0006053447723388672, 0.0009840726852416992, 0.0013628005981445312, 0.0017415285110473633, 0.0021202564239501953, 0.0024989843368530273, 0.0028777122497558594, 0.0032564401626586914, 0.0036351680755615234, 0.0040138959884643555, 0.0043926239013671875, 0.0047713518142700195, 0.0051500797271728516, 0.005528807640075684, 0.005907535552978516, 0.006286263465881348, 0.00666499137878418, 0.007043719291687012, 0.007422447204589844, 0.007801175117492676, 0.008179903030395508, 0.00855863094329834, 0.008937358856201172, 0.009316086769104004, 0.009694814682006836, 0.010073542594909668, 0.0104522705078125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 10.0, 25.0, 29.0, 49.0, 100.0, 143.0, 220.0, 148.0, 87.0, 68.0, 27.0, 25.0, 12.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01192474365234375, -0.01153409481048584, -0.01114344596862793, -0.01075279712677002, -0.01036214828491211, -0.0099714994430542, -0.009580850601196289, -0.009190201759338379, -0.008799552917480469, -0.008408904075622559, -0.008018255233764648, -0.007627606391906738, -0.007236957550048828, -0.006846308708190918, -0.006455659866333008, -0.006065011024475098, -0.0056743621826171875, -0.005283713340759277, -0.004893064498901367, -0.004502415657043457, -0.004111766815185547, -0.0037211179733276367, -0.0033304691314697266, -0.0029398202896118164, -0.0025491714477539062, -0.002158522605895996, -0.001767873764038086, -0.0013772249221801758, -0.0009865760803222656, -0.0005959272384643555, -0.0002052783966064453, 0.00018537044525146484, 0.000576019287109375, 0.0009666681289672852, 0.0013573169708251953, 0.0017479658126831055, 0.0021386146545410156, 0.0025292634963989258, 0.002919912338256836, 0.003310561180114746, 0.0037012100219726562, 0.004091858863830566, 0.0044825077056884766, 0.004873156547546387, 0.005263805389404297, 0.005654454231262207, 0.006045103073120117, 0.006435751914978027, 0.0068264007568359375, 0.007217049598693848, 0.007607698440551758, 0.007998347282409668, 0.008388996124267578, 0.008779644966125488, 0.009170293807983398, 0.009560942649841309, 0.009951591491699219, 0.010342240333557129, 0.010732889175415039, 0.01112353801727295, 0.01151418685913086, 0.01190483570098877, 0.01229548454284668, 0.01268613338470459, 0.0130767822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 49.0, 308.0, 528.0, 97.0, 12.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24851584434509277, -0.2355944961309433, -0.22267313301563263, -0.20975178480148315, -0.19683042168617249, -0.183909073472023, -0.17098772525787354, -0.15806636214256287, -0.1451449990272522, -0.13222365081310272, -0.11930228769779205, -0.10638093948364258, -0.09345957636833191, -0.08053822815418243, -0.06761687248945236, -0.05469551682472229, -0.041774168610572815, -0.028852812945842743, -0.01593145914375782, -0.0030101053416728973, 0.009911250323057175, 0.022832602262496948, 0.03575395792722702, 0.04867531359195709, 0.061596669256687164, 0.07451802492141724, 0.08743938058614731, 0.10036073625087738, 0.11328208446502686, 0.12620344758033752, 0.139124795794487, 0.15204614400863647, 0.16496750712394714, 0.17788885533809662, 0.1908102184534073, 0.20373156666755676, 0.21665292978286743, 0.2295742779970169, 0.24249562621116638, 0.25541698932647705, 0.2683383524417877, 0.2812597155570984, 0.29418104887008667, 0.30710241198539734, 0.320023775100708, 0.3329451084136963, 0.34586647152900696, 0.3587878346443176, 0.3717091679573059, 0.3846305310726166, 0.39755186438560486, 0.4104732275009155, 0.4233945906162262, 0.43631595373153687, 0.44923728704452515, 0.4621586501598358, 0.4750800132751465, 0.48800137639045715, 0.5009227395057678, 0.5138440728187561, 0.5267654061317444, 0.5396867990493774, 0.5526081323623657, 0.565529465675354, 0.5784508585929871]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 8.0, 13.0, 12.0, 7.0, 7.0, 18.0, 18.0, 16.0, 14.0, 20.0, 39.0, 26.0, 32.0, 25.0, 46.0, 46.0, 46.0, 31.0, 38.0, 45.0, 36.0, 24.0, 42.0, 47.0, 35.0, 36.0, 28.0, 19.0, 29.0, 23.0, 25.0, 26.0, 9.0, 24.0, 12.0, 17.0, 11.0, 5.0, 6.0, 11.0, 3.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.052956461906433105, -0.05148741602897644, -0.05001836642622948, -0.04854931682348251, -0.04708027094602585, -0.04561122506856918, -0.04414217546582222, -0.042673125863075256, -0.04120407998561859, -0.039735034108161926, -0.03826598450541496, -0.036796934902668, -0.035327889025211334, -0.03385884314775467, -0.032389793545007706, -0.03092074580490589, -0.029451698064804077, -0.027982650324702263, -0.02651360258460045, -0.025044554844498634, -0.02357550710439682, -0.022106459364295006, -0.02063741162419319, -0.019168363884091377, -0.017699316143989563, -0.01623026840388775, -0.014761220663785934, -0.01329217292368412, -0.011823125183582306, -0.010354077443480492, -0.008885029703378677, -0.007415981963276863, -0.005946934223175049, -0.0044778864830732346, -0.0030088387429714203, -0.001539791002869606, -7.074326276779175e-05, 0.0013983044773340225, 0.002867352217435837, 0.004336399957537651, 0.005805447697639465, 0.00727449543774128, 0.008743543177843094, 0.010212590917944908, 0.011681638658046722, 0.013150686398148537, 0.014619734138250351, 0.016088781878352165, 0.01755782961845398, 0.019026877358555794, 0.020495925098657608, 0.021964972838759422, 0.023434020578861237, 0.02490306831896305, 0.026372116059064865, 0.02784116379916668, 0.029310211539268494, 0.030779259279370308, 0.03224830701947212, 0.033717356622219086, 0.03518640249967575, 0.036655448377132416, 0.03812449797987938, 0.03959354758262634, 0.04106259346008301]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 11.0, 14.0, 31.0, 54.0, 83.0, 156.0, 272.0, 652.0, 2427.0, 21735.0, 4058389.0, 102240.0, 5844.0, 1500.0, 469.0, 152.0, 109.0, 48.0, 34.0, 21.0, 5.0, 10.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047332763671875, -0.045623779296875, -0.043914794921875, -0.042205810546875, -0.040496826171875, -0.038787841796875, -0.037078857421875, -0.035369873046875, -0.033660888671875, -0.031951904296875, -0.030242919921875, -0.028533935546875, -0.026824951171875, -0.025115966796875, -0.023406982421875, -0.021697998046875, -0.019989013671875, -0.018280029296875, -0.016571044921875, -0.014862060546875, -0.013153076171875, -0.011444091796875, -0.009735107421875, -0.008026123046875, -0.006317138671875, -0.004608154296875, -0.002899169921875, -0.001190185546875, 0.000518798828125, 0.002227783203125, 0.003936767578125, 0.005645751953125, 0.007354736328125, 0.009063720703125, 0.010772705078125, 0.012481689453125, 0.014190673828125, 0.015899658203125, 0.017608642578125, 0.019317626953125, 0.021026611328125, 0.022735595703125, 0.024444580078125, 0.026153564453125, 0.027862548828125, 0.029571533203125, 0.031280517578125, 0.032989501953125, 0.034698486328125, 0.036407470703125, 0.038116455078125, 0.039825439453125, 0.041534423828125, 0.043243408203125, 0.044952392578125, 0.046661376953125, 0.048370361328125, 0.050079345703125, 0.051788330078125, 0.053497314453125, 0.055206298828125, 0.056915283203125, 0.058624267578125, 0.060333251953125, 0.062042236328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 20.0, 49.0, 163.0, 252.0, 246.0, 173.0, 67.0, 15.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04248046875, -0.04139089584350586, -0.04030132293701172, -0.03921175003051758, -0.03812217712402344, -0.0370326042175293, -0.035943031311035156, -0.034853458404541016, -0.033763885498046875, -0.032674312591552734, -0.031584739685058594, -0.030495166778564453, -0.029405593872070312, -0.028316020965576172, -0.02722644805908203, -0.02613687515258789, -0.02504730224609375, -0.02395772933959961, -0.02286815643310547, -0.021778583526611328, -0.020689010620117188, -0.019599437713623047, -0.018509864807128906, -0.017420291900634766, -0.016330718994140625, -0.015241146087646484, -0.014151573181152344, -0.013062000274658203, -0.011972427368164062, -0.010882854461669922, -0.009793281555175781, -0.00870370864868164, -0.0076141357421875, -0.006524562835693359, -0.005434989929199219, -0.004345417022705078, -0.0032558441162109375, -0.002166271209716797, -0.0010766983032226562, 1.2874603271484375e-05, 0.001102447509765625, 0.0021920204162597656, 0.0032815933227539062, 0.004371166229248047, 0.0054607391357421875, 0.006550312042236328, 0.007639884948730469, 0.00872945785522461, 0.00981903076171875, 0.01090860366821289, 0.011998176574707031, 0.013087749481201172, 0.014177322387695312, 0.015266895294189453, 0.016356468200683594, 0.017446041107177734, 0.018535614013671875, 0.019625186920166016, 0.020714759826660156, 0.021804332733154297, 0.022893905639648438, 0.023983478546142578, 0.02507305145263672, 0.02616262435913086, 0.027252197265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 14.0, 21.0, 27.0, 49.0, 67.0, 136.0, 245.0, 384.0, 798.0, 1611.0, 3376.0, 8172.0, 22300.0, 73347.0, 361860.0, 3342008.0, 282590.0, 63396.0, 19998.0, 7313.0, 3246.0, 1507.0, 774.0, 446.0, 222.0, 126.0, 80.0, 55.0, 39.0, 15.0, 11.0, 13.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0161285400390625, -0.01571965217590332, -0.01531076431274414, -0.014901876449584961, -0.014492988586425781, -0.014084100723266602, -0.013675212860107422, -0.013266324996948242, -0.012857437133789062, -0.012448549270629883, -0.012039661407470703, -0.011630773544311523, -0.011221885681152344, -0.010812997817993164, -0.010404109954833984, -0.009995222091674805, -0.009586334228515625, -0.009177446365356445, -0.008768558502197266, -0.008359670639038086, -0.007950782775878906, -0.0075418949127197266, -0.007133007049560547, -0.006724119186401367, -0.0063152313232421875, -0.005906343460083008, -0.005497455596923828, -0.0050885677337646484, -0.004679679870605469, -0.004270792007446289, -0.0038619041442871094, -0.0034530162811279297, -0.00304412841796875, -0.0026352405548095703, -0.0022263526916503906, -0.001817464828491211, -0.0014085769653320312, -0.0009996891021728516, -0.0005908012390136719, -0.0001819133758544922, 0.0002269744873046875, 0.0006358623504638672, 0.0010447502136230469, 0.0014536380767822266, 0.0018625259399414062, 0.002271413803100586, 0.0026803016662597656, 0.0030891895294189453, 0.003498077392578125, 0.003906965255737305, 0.004315853118896484, 0.004724740982055664, 0.005133628845214844, 0.0055425167083740234, 0.005951404571533203, 0.006360292434692383, 0.0067691802978515625, 0.007178068161010742, 0.007586956024169922, 0.007995843887329102, 0.008404731750488281, 0.008813619613647461, 0.00922250747680664, 0.00963139533996582, 0.010040283203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 17.0, 8.0, 12.0, 27.0, 36.0, 51.0, 78.0, 128.0, 185.0, 518.0, 1553.0, 795.0, 263.0, 140.0, 70.0, 53.0, 38.0, 24.0, 19.0, 10.0, 13.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.012226462364196777, -0.011910200119018555, -0.011593937873840332, -0.01127767562866211, -0.010961413383483887, -0.010645151138305664, -0.010328888893127441, -0.010012626647949219, -0.009696364402770996, -0.009380102157592773, -0.00906383991241455, -0.008747577667236328, -0.008431315422058105, -0.008115053176879883, -0.00779879093170166, -0.0074825286865234375, -0.007166266441345215, -0.006850004196166992, -0.0065337419509887695, -0.006217479705810547, -0.005901217460632324, -0.0055849552154541016, -0.005268692970275879, -0.004952430725097656, -0.004636168479919434, -0.004319906234741211, -0.004003643989562988, -0.0036873817443847656, -0.003371119499206543, -0.0030548572540283203, -0.0027385950088500977, -0.002422332763671875, -0.0021060705184936523, -0.0017898082733154297, -0.001473546028137207, -0.0011572837829589844, -0.0008410215377807617, -0.0005247592926025391, -0.0002084970474243164, 0.00010776519775390625, 0.0004240274429321289, 0.0007402896881103516, 0.0010565519332885742, 0.0013728141784667969, 0.0016890764236450195, 0.002005338668823242, 0.002321600914001465, 0.0026378631591796875, 0.00295412540435791, 0.003270387649536133, 0.0035866498947143555, 0.003902912139892578, 0.004219174385070801, 0.0045354366302490234, 0.004851698875427246, 0.005167961120605469, 0.005484223365783691, 0.005800485610961914, 0.006116747856140137, 0.006433010101318359, 0.006749272346496582, 0.007065534591674805, 0.007381796836853027, 0.00769805908203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 10.0, 18.0, 58.0, 122.0, 219.0, 221.0, 208.0, 91.0, 48.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035044461488723755, -0.032751962542533875, -0.030459459871053696, -0.028166960924863815, -0.025874460116028786, -0.023581959307193756, -0.021289460361003876, -0.018996959552168846, -0.016704458743333817, -0.014411957934498787, -0.012119458056986332, -0.009826958179473877, -0.007534457370638847, -0.005241956561803818, -0.0029494566842913628, -0.0006569568067789078, 0.0016355440020561218, 0.003928044345229864, 0.006220544688403606, 0.008513044565916061, 0.010805545374751091, 0.01309804618358612, 0.015390546061098576, 0.01768304593861103, 0.01997554674744606, 0.02226804755628109, 0.02456054836511612, 0.026853047311306, 0.02914554812014103, 0.03143804892897606, 0.03373054787516594, 0.03602305054664612, 0.0383155420422554, 0.04060804098844528, 0.04290054365992546, 0.04519304260611534, 0.04748554527759552, 0.0497780442237854, 0.05207054316997528, 0.05436304211616516, 0.05665554478764534, 0.05894804373383522, 0.0612405464053154, 0.06353304535150528, 0.06582554429769516, 0.06811805069446564, 0.07041054964065552, 0.0727030485868454, 0.07499554753303528, 0.07728804647922516, 0.07958054542541504, 0.08187305182218552, 0.0841655507683754, 0.08645804971456528, 0.08875054866075516, 0.09104304760694504, 0.09333555400371552, 0.0956280529499054, 0.09792055189609528, 0.10021305829286575, 0.10250555723905563, 0.10479805618524551, 0.1070905551314354, 0.10938305407762527, 0.11167555302381516]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 3.0, 6.0, 18.0, 8.0, 14.0, 10.0, 18.0, 27.0, 21.0, 23.0, 26.0, 30.0, 30.0, 37.0, 26.0, 41.0, 32.0, 50.0, 37.0, 33.0, 43.0, 48.0, 39.0, 35.0, 25.0, 26.0, 29.0, 30.0, 24.0, 20.0, 19.0, 19.0, 20.0, 18.0, 25.0, 14.0, 9.0, 7.0, 6.0, 10.0, 10.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.014193177223205566, -0.013718122616410255, -0.013243068009614944, -0.012768013402819633, -0.012292958796024323, -0.011817904189229012, -0.0113428495824337, -0.01086779497563839, -0.010392740368843079, -0.009917685762047768, -0.009442631155252457, -0.008967576548457146, -0.008492521941661835, -0.008017467334866524, -0.007542412728071213, -0.007067358121275902, -0.006592303514480591, -0.00611724890768528, -0.005642194300889969, -0.005167139694094658, -0.004692085087299347, -0.004217030480504036, -0.003741975873708725, -0.003266921266913414, -0.002791866660118103, -0.002316812053322792, -0.001841757446527481, -0.00136670283973217, -0.0008916482329368591, -0.00041659362614154816, 5.846098065376282e-05, 0.0005335155874490738, 0.0010085701942443848, 0.0014836248010396957, 0.0019586794078350067, 0.0024337340146303177, 0.0029087886214256287, 0.0033838432282209396, 0.0038588978350162506, 0.004333952441811562, 0.0048090070486068726, 0.0052840616554021835, 0.0057591162621974945, 0.0062341708689928055, 0.0067092254757881165, 0.007184280082583427, 0.007659334689378738, 0.00813438929617405, 0.00860944390296936, 0.009084498509764671, 0.009559553116559982, 0.010034607723355293, 0.010509662330150604, 0.010984716936945915, 0.011459771543741226, 0.011934826150536537, 0.012409880757331848, 0.012884935364127159, 0.01335998997092247, 0.013835044577717781, 0.014310099184513092, 0.014785153791308403, 0.015260208398103714, 0.015735263004899025, 0.016210317611694336]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 9.0, 8.0, 17.0, 24.0, 43.0, 40.0, 57.0, 60.0, 77.0, 120.0, 169.0, 239.0, 350.0, 537.0, 911.0, 1770.0, 5382.0, 29930.0, 409090.0, 548416.0, 39742.0, 6602.0, 2026.0, 977.0, 605.0, 396.0, 268.0, 196.0, 123.0, 96.0, 63.0, 55.0, 23.0, 28.0, 20.0, 11.0, 11.0, 10.0, 11.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.034912109375, -0.03375101089477539, -0.03258991241455078, -0.03142881393432617, -0.030267715454101562, -0.029106616973876953, -0.027945518493652344, -0.026784420013427734, -0.025623321533203125, -0.024462223052978516, -0.023301124572753906, -0.022140026092529297, -0.020978927612304688, -0.019817829132080078, -0.01865673065185547, -0.01749563217163086, -0.01633453369140625, -0.01517343521118164, -0.014012336730957031, -0.012851238250732422, -0.011690139770507812, -0.010529041290283203, -0.009367942810058594, -0.008206844329833984, -0.007045745849609375, -0.005884647369384766, -0.004723548889160156, -0.003562450408935547, -0.0024013519287109375, -0.0012402534484863281, -7.915496826171875e-05, 0.0010819435119628906, 0.0022430419921875, 0.0034041404724121094, 0.004565238952636719, 0.005726337432861328, 0.0068874359130859375, 0.008048534393310547, 0.009209632873535156, 0.010370731353759766, 0.011531829833984375, 0.012692928314208984, 0.013854026794433594, 0.015015125274658203, 0.016176223754882812, 0.017337322235107422, 0.01849842071533203, 0.01965951919555664, 0.02082061767578125, 0.02198171615600586, 0.02314281463623047, 0.024303913116455078, 0.025465011596679688, 0.026626110076904297, 0.027787208557128906, 0.028948307037353516, 0.030109405517578125, 0.031270503997802734, 0.032431602478027344, 0.03359270095825195, 0.03475379943847656, 0.03591489791870117, 0.03707599639892578, 0.03823709487915039, 0.039398193359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 9.0, 13.0, 54.0, 145.0, 238.0, 242.0, 183.0, 87.0, 21.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04095458984375, -0.03990745544433594, -0.038860321044921875, -0.03781318664550781, -0.03676605224609375, -0.03571891784667969, -0.034671783447265625, -0.03362464904785156, -0.0325775146484375, -0.03153038024902344, -0.030483245849609375, -0.029436111450195312, -0.02838897705078125, -0.027341842651367188, -0.026294708251953125, -0.025247573852539062, -0.024200439453125, -0.023153305053710938, -0.022106170654296875, -0.021059036254882812, -0.02001190185546875, -0.018964767456054688, -0.017917633056640625, -0.016870498657226562, -0.0158233642578125, -0.014776229858398438, -0.013729095458984375, -0.012681961059570312, -0.01163482666015625, -0.010587692260742188, -0.009540557861328125, -0.008493423461914062, -0.0074462890625, -0.0063991546630859375, -0.005352020263671875, -0.0043048858642578125, -0.00325775146484375, -0.0022106170654296875, -0.001163482666015625, -0.0001163482666015625, 0.0009307861328125, 0.0019779205322265625, 0.003025054931640625, 0.0040721893310546875, 0.00511932373046875, 0.0061664581298828125, 0.007213592529296875, 0.008260726928710938, 0.009307861328125, 0.010354995727539062, 0.011402130126953125, 0.012449264526367188, 0.01349639892578125, 0.014543533325195312, 0.015590667724609375, 0.016637802124023438, 0.0176849365234375, 0.018732070922851562, 0.019779205322265625, 0.020826339721679688, 0.02187347412109375, 0.022920608520507812, 0.023967742919921875, 0.025014877319335938, 0.02606201171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 9.0, 11.0, 21.0, 28.0, 57.0, 72.0, 89.0, 216.0, 491.0, 1678.0, 6469.0, 38228.0, 312316.0, 576905.0, 94394.0, 13149.0, 2868.0, 768.0, 327.0, 136.0, 99.0, 68.0, 34.0, 33.0, 18.0, 20.0, 12.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030462026596069336, -0.029643535614013672, -0.028825044631958008, -0.028006553649902344, -0.02718806266784668, -0.026369571685791016, -0.02555108070373535, -0.024732589721679688, -0.023914098739624023, -0.02309560775756836, -0.022277116775512695, -0.02145862579345703, -0.020640134811401367, -0.019821643829345703, -0.01900315284729004, -0.018184661865234375, -0.01736617088317871, -0.016547679901123047, -0.015729188919067383, -0.014910697937011719, -0.014092206954956055, -0.01327371597290039, -0.012455224990844727, -0.011636734008789062, -0.010818243026733398, -0.009999752044677734, -0.00918126106262207, -0.008362770080566406, -0.007544279098510742, -0.006725788116455078, -0.005907297134399414, -0.00508880615234375, -0.004270315170288086, -0.003451824188232422, -0.002633333206176758, -0.0018148422241210938, -0.0009963512420654297, -0.00017786026000976562, 0.0006406307220458984, 0.0014591217041015625, 0.0022776126861572266, 0.0030961036682128906, 0.003914594650268555, 0.004733085632324219, 0.005551576614379883, 0.006370067596435547, 0.007188558578491211, 0.008007049560546875, 0.008825540542602539, 0.009644031524658203, 0.010462522506713867, 0.011281013488769531, 0.012099504470825195, 0.01291799545288086, 0.013736486434936523, 0.014554977416992188, 0.015373468399047852, 0.016191959381103516, 0.01701045036315918, 0.017828941345214844, 0.018647432327270508, 0.019465923309326172, 0.020284414291381836, 0.0211029052734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 6.0, 5.0, 6.0, 5.0, 10.0, 8.0, 9.0, 13.0, 21.0, 17.0, 14.0, 22.0, 22.0, 28.0, 26.0, 33.0, 38.0, 50.0, 49.0, 48.0, 39.0, 37.0, 42.0, 43.0, 42.0, 47.0, 48.0, 37.0, 41.0, 26.0, 29.0, 26.0, 18.0, 7.0, 18.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 8.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01403045654296875, -0.013564467430114746, -0.013098478317260742, -0.012632489204406738, -0.012166500091552734, -0.01170051097869873, -0.011234521865844727, -0.010768532752990723, -0.010302543640136719, -0.009836554527282715, -0.009370565414428711, -0.008904576301574707, -0.008438587188720703, -0.0079725980758667, -0.007506608963012695, -0.007040619850158691, -0.0065746307373046875, -0.006108641624450684, -0.00564265251159668, -0.005176663398742676, -0.004710674285888672, -0.004244685173034668, -0.003778696060180664, -0.00331270694732666, -0.0028467178344726562, -0.0023807287216186523, -0.0019147396087646484, -0.0014487504959106445, -0.0009827613830566406, -0.0005167722702026367, -5.078315734863281e-05, 0.0004152059555053711, 0.000881195068359375, 0.001347184181213379, 0.0018131732940673828, 0.0022791624069213867, 0.0027451515197753906, 0.0032111406326293945, 0.0036771297454833984, 0.004143118858337402, 0.004609107971191406, 0.00507509708404541, 0.005541086196899414, 0.006007075309753418, 0.006473064422607422, 0.006939053535461426, 0.00740504264831543, 0.007871031761169434, 0.008337020874023438, 0.008803009986877441, 0.009268999099731445, 0.00973498821258545, 0.010200977325439453, 0.010666966438293457, 0.011132955551147461, 0.011598944664001465, 0.012064933776855469, 0.012530922889709473, 0.012996912002563477, 0.01346290111541748, 0.013928890228271484, 0.014394879341125488, 0.014860868453979492, 0.015326857566833496, 0.0157928466796875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 11.0, 12.0, 16.0, 22.0, 48.0, 89.0, 125.0, 233.0, 312.0, 557.0, 875.0, 1459.0, 2667.0, 5297.0, 13234.0, 44754.0, 313752.0, 554872.0, 76805.0, 18522.0, 7110.0, 3275.0, 1799.0, 1033.0, 635.0, 399.0, 252.0, 165.0, 68.0, 54.0, 28.0, 29.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.009185791015625, -0.008859634399414062, -0.008533477783203125, -0.008207321166992188, -0.00788116455078125, -0.0075550079345703125, -0.007228851318359375, -0.0069026947021484375, -0.0065765380859375, -0.0062503814697265625, -0.005924224853515625, -0.0055980682373046875, -0.00527191162109375, -0.0049457550048828125, -0.004619598388671875, -0.0042934417724609375, -0.00396728515625, -0.0036411285400390625, -0.003314971923828125, -0.0029888153076171875, -0.00266265869140625, -0.0023365020751953125, -0.002010345458984375, -0.0016841888427734375, -0.0013580322265625, -0.0010318756103515625, -0.000705718994140625, -0.0003795623779296875, -5.340576171875e-05, 0.0002727508544921875, 0.000598907470703125, 0.0009250640869140625, 0.001251220703125, 0.0015773773193359375, 0.001903533935546875, 0.0022296905517578125, 0.00255584716796875, 0.0028820037841796875, 0.003208160400390625, 0.0035343170166015625, 0.0038604736328125, 0.0041866302490234375, 0.004512786865234375, 0.0048389434814453125, 0.00516510009765625, 0.0054912567138671875, 0.005817413330078125, 0.0061435699462890625, 0.0064697265625, 0.0067958831787109375, 0.007122039794921875, 0.0074481964111328125, 0.00777435302734375, 0.008100509643554688, 0.008426666259765625, 0.008752822875976562, 0.0090789794921875, 0.009405136108398438, 0.009731292724609375, 0.010057449340820312, 0.01038360595703125, 0.010709762573242188, 0.011035919189453125, 0.011362075805664062, 0.011688232421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 11.0, 26.0, 35.0, 63.0, 71.0, 112.0, 163.0, 152.0, 114.0, 87.0, 68.0, 36.0, 33.0, 14.0, 9.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010836124420166016, -0.00010476727038621902, -0.00010117329657077789, -9.757932275533676e-05, -9.398534893989563e-05, -9.03913751244545e-05, -8.679740130901337e-05, -8.320342749357224e-05, -7.96094536781311e-05, -7.601547986268997e-05, -7.242150604724884e-05, -6.882753223180771e-05, -6.523355841636658e-05, -6.163958460092545e-05, -5.8045610785484314e-05, -5.445163697004318e-05, -5.085766315460205e-05, -4.726368933916092e-05, -4.366971552371979e-05, -4.0075741708278656e-05, -3.6481767892837524e-05, -3.288779407739639e-05, -2.929382026195526e-05, -2.569984644651413e-05, -2.2105872631072998e-05, -1.8511898815631866e-05, -1.4917925000190735e-05, -1.1323951184749603e-05, -7.729977369308472e-06, -4.13600355386734e-06, -5.420297384262085e-07, 3.051944077014923e-06, 6.645917892456055e-06, 1.0239891707897186e-05, 1.3833865523338318e-05, 1.742783933877945e-05, 2.102181315422058e-05, 2.4615786969661713e-05, 2.8209760785102844e-05, 3.1803734600543976e-05, 3.539770841598511e-05, 3.899168223142624e-05, 4.258565604686737e-05, 4.61796298623085e-05, 4.9773603677749634e-05, 5.3367577493190765e-05, 5.69615513086319e-05, 6.055552512407303e-05, 6.414949893951416e-05, 6.774347275495529e-05, 7.133744657039642e-05, 7.493142038583755e-05, 7.852539420127869e-05, 8.211936801671982e-05, 8.571334183216095e-05, 8.930731564760208e-05, 9.290128946304321e-05, 9.649526327848434e-05, 0.00010008923709392548, 0.00010368321090936661, 0.00010727718472480774, 0.00011087115854024887, 0.00011446513235569, 0.00011805910617113113, 0.00012165307998657227]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 18.0, 43.0, 55.0, 85.0, 178.0, 328.0, 584.0, 1164.0, 2442.0, 5733.0, 18711.0, 102101.0, 693181.0, 183537.0, 26937.0, 7616.0, 2935.0, 1386.0, 700.0, 343.0, 206.0, 98.0, 65.0, 30.0, 24.0, 8.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01219940185546875, -0.01180112361907959, -0.01140284538269043, -0.01100456714630127, -0.01060628890991211, -0.01020801067352295, -0.009809732437133789, -0.009411454200744629, -0.009013175964355469, -0.008614897727966309, -0.008216619491577148, -0.007818341255187988, -0.007420063018798828, -0.007021784782409668, -0.006623506546020508, -0.006225228309631348, -0.0058269500732421875, -0.005428671836853027, -0.005030393600463867, -0.004632115364074707, -0.004233837127685547, -0.0038355588912963867, -0.0034372806549072266, -0.0030390024185180664, -0.0026407241821289062, -0.002242445945739746, -0.001844167709350586, -0.0014458894729614258, -0.0010476112365722656, -0.0006493330001831055, -0.0002510547637939453, 0.00014722347259521484, 0.000545501708984375, 0.0009437799453735352, 0.0013420581817626953, 0.0017403364181518555, 0.0021386146545410156, 0.0025368928909301758, 0.002935171127319336, 0.003333449363708496, 0.0037317276000976562, 0.004130005836486816, 0.0045282840728759766, 0.004926562309265137, 0.005324840545654297, 0.005723118782043457, 0.006121397018432617, 0.006519675254821777, 0.0069179534912109375, 0.007316231727600098, 0.007714509963989258, 0.008112788200378418, 0.008511066436767578, 0.008909344673156738, 0.009307622909545898, 0.009705901145935059, 0.010104179382324219, 0.010502457618713379, 0.010900735855102539, 0.0112990140914917, 0.01169729232788086, 0.01209557056427002, 0.01249384880065918, 0.01289212703704834, 0.0132904052734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 7.0, 13.0, 8.0, 21.0, 27.0, 45.0, 52.0, 89.0, 134.0, 125.0, 137.0, 94.0, 67.0, 48.0, 30.0, 16.0, 18.0, 12.0, 6.0, 6.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0086669921875, -0.008392810821533203, -0.008118629455566406, -0.00784444808959961, -0.0075702667236328125, -0.007296085357666016, -0.007021903991699219, -0.006747722625732422, -0.006473541259765625, -0.006199359893798828, -0.005925178527832031, -0.005650997161865234, -0.0053768157958984375, -0.005102634429931641, -0.004828453063964844, -0.004554271697998047, -0.00428009033203125, -0.004005908966064453, -0.0037317276000976562, -0.0034575462341308594, -0.0031833648681640625, -0.0029091835021972656, -0.0026350021362304688, -0.002360820770263672, -0.002086639404296875, -0.0018124580383300781, -0.0015382766723632812, -0.0012640953063964844, -0.0009899139404296875, -0.0007157325744628906, -0.00044155120849609375, -0.00016736984252929688, 0.0001068115234375, 0.0003809928894042969, 0.0006551742553710938, 0.0009293556213378906, 0.0012035369873046875, 0.0014777183532714844, 0.0017518997192382812, 0.002026081085205078, 0.002300262451171875, 0.002574443817138672, 0.0028486251831054688, 0.0031228065490722656, 0.0033969879150390625, 0.0036711692810058594, 0.003945350646972656, 0.004219532012939453, 0.00449371337890625, 0.004767894744873047, 0.005042076110839844, 0.005316257476806641, 0.0055904388427734375, 0.005864620208740234, 0.006138801574707031, 0.006412982940673828, 0.006687164306640625, 0.006961345672607422, 0.007235527038574219, 0.007509708404541016, 0.0077838897705078125, 0.00805807113647461, 0.008332252502441406, 0.008606433868408203, 0.008880615234375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 126.0, 596.0, 257.0, 24.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11658167093992233, -0.10318668931722641, -0.08979170024394989, -0.07639671862125397, -0.06300173699855804, -0.04960675537586212, -0.0362117663025856, -0.02281678467988968, -0.009421803057193756, 0.003973180428147316, 0.017368163913488388, 0.03076314926147461, 0.04415813088417053, 0.057553112506866455, 0.07094810158014297, 0.0843430832028389, 0.09773806482553482, 0.11113304644823074, 0.12452803552150726, 0.13792301714420319, 0.1513179987668991, 0.16471298038959503, 0.17810797691345215, 0.19150295853614807, 0.204897940158844, 0.21829292178153992, 0.23168790340423584, 0.24508288502693176, 0.2584778666496277, 0.2718728482723236, 0.28526782989501953, 0.29866284132003784, 0.3120577931404114, 0.3254527747631073, 0.3388477563858032, 0.35224273800849915, 0.36563771963119507, 0.379032701253891, 0.3924276828765869, 0.4058226943016052, 0.41921764612197876, 0.4326126277446747, 0.4460076093673706, 0.45940259099006653, 0.47279757261276245, 0.4861925542354584, 0.4995875358581543, 0.5129825472831726, 0.5263775587081909, 0.5397725701332092, 0.5531675219535828, 0.5665625333786011, 0.5799574851989746, 0.5933524966239929, 0.6067474484443665, 0.6201424598693848, 0.6335374116897583, 0.6469324231147766, 0.6603273749351501, 0.6737223863601685, 0.687117338180542, 0.7005123496055603, 0.7139073014259338, 0.7273023128509521, 0.7406972646713257]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 0.0, 6.0, 3.0, 9.0, 9.0, 7.0, 8.0, 15.0, 14.0, 20.0, 23.0, 20.0, 35.0, 34.0, 48.0, 36.0, 31.0, 41.0, 43.0, 52.0, 44.0, 43.0, 40.0, 37.0, 43.0, 38.0, 43.0, 34.0, 28.0, 34.0, 21.0, 16.0, 27.0, 16.0, 11.0, 12.0, 10.0, 15.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03747373819351196, -0.03609912469983101, -0.034724511206150055, -0.0333498977124691, -0.03197528421878815, -0.030600670725107193, -0.02922605723142624, -0.027851443737745285, -0.02647683024406433, -0.025102216750383377, -0.023727603256702423, -0.02235298976302147, -0.020978376269340515, -0.01960376277565956, -0.018229149281978607, -0.016854535788297653, -0.0154799222946167, -0.014105308800935745, -0.012730695307254791, -0.011356081813573837, -0.009981468319892883, -0.00860685482621193, -0.007232241332530975, -0.005857627838850021, -0.004483014345169067, -0.0031084008514881134, -0.0017337873578071594, -0.00035917386412620544, 0.0010154396295547485, 0.0023900531232357025, 0.0037646666169166565, 0.0051392801105976105, 0.0065138936042785645, 0.007888507097959518, 0.009263120591640472, 0.010637734085321426, 0.01201234757900238, 0.013386961072683334, 0.014761574566364288, 0.016136188060045242, 0.017510801553726196, 0.01888541504740715, 0.020260028541088104, 0.021634642034769058, 0.023009255528450012, 0.024383869022130966, 0.02575848251581192, 0.027133096009492874, 0.028507709503173828, 0.029882322996854782, 0.031256936490535736, 0.03263154998421669, 0.034006163477897644, 0.0353807769715786, 0.03675539046525955, 0.038130003958940506, 0.03950461745262146, 0.040879230946302414, 0.04225384443998337, 0.04362845793366432, 0.045003071427345276, 0.04637768492102623, 0.047752298414707184, 0.04912691190838814, 0.05050152540206909]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 20.0, 15.0, 23.0, 24.0, 30.0, 56.0, 73.0, 102.0, 173.0, 315.0, 708.0, 1710.0, 5739.0, 37967.0, 3711244.0, 409592.0, 18683.0, 4548.0, 1612.0, 795.0, 359.0, 162.0, 108.0, 50.0, 35.0, 34.0, 20.0, 14.0, 11.0, 11.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034332275390625, -0.03325319290161133, -0.032174110412597656, -0.031095027923583984, -0.030015945434570312, -0.02893686294555664, -0.02785778045654297, -0.026778697967529297, -0.025699615478515625, -0.024620532989501953, -0.02354145050048828, -0.02246236801147461, -0.021383285522460938, -0.020304203033447266, -0.019225120544433594, -0.018146038055419922, -0.01706695556640625, -0.015987873077392578, -0.014908790588378906, -0.013829708099365234, -0.012750625610351562, -0.01167154312133789, -0.010592460632324219, -0.009513378143310547, -0.008434295654296875, -0.007355213165283203, -0.006276130676269531, -0.005197048187255859, -0.0041179656982421875, -0.0030388832092285156, -0.0019598007202148438, -0.0008807182312011719, 0.0001983642578125, 0.0012774467468261719, 0.0023565292358398438, 0.0034356117248535156, 0.0045146942138671875, 0.005593776702880859, 0.006672859191894531, 0.007751941680908203, 0.008831024169921875, 0.009910106658935547, 0.010989189147949219, 0.01206827163696289, 0.013147354125976562, 0.014226436614990234, 0.015305519104003906, 0.016384601593017578, 0.01746368408203125, 0.018542766571044922, 0.019621849060058594, 0.020700931549072266, 0.021780014038085938, 0.02285909652709961, 0.02393817901611328, 0.025017261505126953, 0.026096343994140625, 0.027175426483154297, 0.02825450897216797, 0.02933359146118164, 0.030412673950195312, 0.031491756439208984, 0.032570838928222656, 0.03364992141723633, 0.03472900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 8.0, 44.0, 104.0, 217.0, 247.0, 205.0, 121.0, 39.0, 7.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041534423828125, -0.0404813289642334, -0.0394282341003418, -0.038375139236450195, -0.037322044372558594, -0.03626894950866699, -0.03521585464477539, -0.03416275978088379, -0.03310966491699219, -0.032056570053100586, -0.031003475189208984, -0.029950380325317383, -0.02889728546142578, -0.02784419059753418, -0.026791095733642578, -0.025738000869750977, -0.024684906005859375, -0.023631811141967773, -0.022578716278076172, -0.02152562141418457, -0.02047252655029297, -0.019419431686401367, -0.018366336822509766, -0.017313241958618164, -0.016260147094726562, -0.015207052230834961, -0.01415395736694336, -0.013100862503051758, -0.012047767639160156, -0.010994672775268555, -0.009941577911376953, -0.008888483047485352, -0.00783538818359375, -0.0067822933197021484, -0.005729198455810547, -0.004676103591918945, -0.0036230087280273438, -0.002569913864135742, -0.0015168190002441406, -0.00046372413635253906, 0.0005893707275390625, 0.001642465591430664, 0.0026955604553222656, 0.003748655319213867, 0.004801750183105469, 0.00585484504699707, 0.006907939910888672, 0.007961034774780273, 0.009014129638671875, 0.010067224502563477, 0.011120319366455078, 0.01217341423034668, 0.013226509094238281, 0.014279603958129883, 0.015332698822021484, 0.016385793685913086, 0.017438888549804688, 0.01849198341369629, 0.01954507827758789, 0.020598173141479492, 0.021651268005371094, 0.022704362869262695, 0.023757457733154297, 0.0248105525970459, 0.0258636474609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 7.0, 13.0, 15.0, 21.0, 29.0, 45.0, 75.0, 112.0, 164.0, 253.0, 437.0, 747.0, 1396.0, 2978.0, 6960.0, 19926.0, 69798.0, 378072.0, 3360462.0, 267238.0, 56672.0, 17002.0, 6118.0, 2711.0, 1256.0, 727.0, 377.0, 242.0, 134.0, 103.0, 62.0, 36.0, 23.0, 17.0, 14.0, 8.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.013092041015625, -0.01266169548034668, -0.01223134994506836, -0.011801004409790039, -0.011370658874511719, -0.010940313339233398, -0.010509967803955078, -0.010079622268676758, -0.009649276733398438, -0.009218931198120117, -0.008788585662841797, -0.008358240127563477, -0.007927894592285156, -0.007497549057006836, -0.007067203521728516, -0.006636857986450195, -0.006206512451171875, -0.005776166915893555, -0.005345821380615234, -0.004915475845336914, -0.004485130310058594, -0.0040547847747802734, -0.003624439239501953, -0.003194093704223633, -0.0027637481689453125, -0.002333402633666992, -0.0019030570983886719, -0.0014727115631103516, -0.0010423660278320312, -0.0006120204925537109, -0.00018167495727539062, 0.0002486705780029297, 0.00067901611328125, 0.0011093616485595703, 0.0015397071838378906, 0.001970052719116211, 0.0024003982543945312, 0.0028307437896728516, 0.003261089324951172, 0.003691434860229492, 0.0041217803955078125, 0.004552125930786133, 0.004982471466064453, 0.0054128170013427734, 0.005843162536621094, 0.006273508071899414, 0.006703853607177734, 0.007134199142456055, 0.007564544677734375, 0.007994890213012695, 0.008425235748291016, 0.008855581283569336, 0.009285926818847656, 0.009716272354125977, 0.010146617889404297, 0.010576963424682617, 0.011007308959960938, 0.011437654495239258, 0.011868000030517578, 0.012298345565795898, 0.012728691101074219, 0.013159036636352539, 0.01358938217163086, 0.01401972770690918, 0.0144500732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 12.0, 11.0, 14.0, 43.0, 56.0, 82.0, 151.0, 369.0, 1570.0, 1166.0, 265.0, 129.0, 67.0, 46.0, 34.0, 23.0, 14.0, 5.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01904296875, -0.01851201057434082, -0.01798105239868164, -0.01745009422302246, -0.01691913604736328, -0.0163881778717041, -0.015857219696044922, -0.015326261520385742, -0.014795303344726562, -0.014264345169067383, -0.013733386993408203, -0.013202428817749023, -0.012671470642089844, -0.012140512466430664, -0.011609554290771484, -0.011078596115112305, -0.010547637939453125, -0.010016679763793945, -0.009485721588134766, -0.008954763412475586, -0.008423805236816406, -0.007892847061157227, -0.007361888885498047, -0.006830930709838867, -0.0062999725341796875, -0.005769014358520508, -0.005238056182861328, -0.0047070980072021484, -0.004176139831542969, -0.003645181655883789, -0.0031142234802246094, -0.0025832653045654297, -0.00205230712890625, -0.0015213489532470703, -0.0009903907775878906, -0.00045943260192871094, 7.152557373046875e-05, 0.0006024837493896484, 0.0011334419250488281, 0.0016644001007080078, 0.0021953582763671875, 0.002726316452026367, 0.003257274627685547, 0.0037882328033447266, 0.004319190979003906, 0.004850149154663086, 0.005381107330322266, 0.005912065505981445, 0.006443023681640625, 0.006973981857299805, 0.007504940032958984, 0.008035898208618164, 0.008566856384277344, 0.009097814559936523, 0.009628772735595703, 0.010159730911254883, 0.010690689086914062, 0.011221647262573242, 0.011752605438232422, 0.012283563613891602, 0.012814521789550781, 0.013345479965209961, 0.01387643814086914, 0.01440739631652832, 0.0149383544921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 20.0, 69.0, 135.0, 270.0, 249.0, 143.0, 69.0, 23.0, 14.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10573011636734009, -0.10251280665397644, -0.0992954894900322, -0.09607817977666855, -0.0928608626127243, -0.08964355289936066, -0.08642624318599701, -0.08320892602205276, -0.07999160885810852, -0.07677429914474487, -0.07355698198080063, -0.07033967226743698, -0.06712235510349274, -0.06390504539012909, -0.06068773195147514, -0.0574704185128212, -0.05425310879945755, -0.051035795360803604, -0.04781848192214966, -0.04460117220878601, -0.041383855044841766, -0.03816654533147812, -0.03494923189282417, -0.03173191845417023, -0.02851460501551628, -0.025297291576862335, -0.02207997813820839, -0.018862666562199593, -0.015645353123545647, -0.0124280396848917, -0.009210728108882904, -0.005993414670228958, -0.002776101231575012, 0.0004412117414176464, 0.003658524714410305, 0.006875837221741676, 0.010093150660395622, 0.013310464099049568, 0.016527775675058365, 0.01974508911371231, 0.022962402552366257, 0.026179715991020203, 0.02939702942967415, 0.032614342868328094, 0.03583165258169174, 0.039048969745635986, 0.042266279458999634, 0.04548359289765358, 0.048700906336307526, 0.05191821977496147, 0.05513553321361542, 0.058352842926979065, 0.06157016009092331, 0.06478746980428696, 0.0680047869682312, 0.07122209668159485, 0.0744394063949585, 0.07765671610832214, 0.08087403327226639, 0.08409134298563004, 0.08730866014957428, 0.09052596986293793, 0.09374327957630157, 0.09696059674024582, 0.10017791390419006]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 10.0, 19.0, 14.0, 23.0, 24.0, 27.0, 47.0, 41.0, 63.0, 55.0, 48.0, 56.0, 40.0, 58.0, 72.0, 64.0, 49.0, 47.0, 41.0, 28.0, 25.0, 28.0, 19.0, 24.0, 22.0, 8.0, 4.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03852194547653198, -0.03750026971101761, -0.036478593945503235, -0.03545691445469856, -0.03443523868918419, -0.033413562923669815, -0.03239188343286514, -0.03137020766735077, -0.030348531901836395, -0.02932685613632202, -0.0283051785081625, -0.027283500880002975, -0.0262618251144886, -0.025240149348974228, -0.024218471720814705, -0.023196794092655182, -0.022175118327140808, -0.021153442561626434, -0.02013176493346691, -0.01911008730530739, -0.018088411539793015, -0.01706673577427864, -0.016045058146119118, -0.01502338144928217, -0.014001704752445221, -0.012980028055608273, -0.011958351358771324, -0.010936674661934376, -0.009914997965097427, -0.008893321268260479, -0.00787164457142353, -0.006849967874586582, -0.005828291177749634, -0.004806614480912685, -0.003784937784075737, -0.0027632610872387886, -0.0017415843904018402, -0.0007199076935648918, 0.0003017690032720566, 0.001323445700109005, 0.0023451223969459534, 0.0033667990937829018, 0.00438847579061985, 0.0054101524874567986, 0.006431829184293747, 0.007453505881130695, 0.008475182577967644, 0.009496859274804592, 0.01051853597164154, 0.011540212668478489, 0.012561889365315437, 0.013583566062152386, 0.014605242758989334, 0.015626918524503708, 0.01664859615266323, 0.017670273780822754, 0.018691949546337128, 0.0197136253118515, 0.020735302940011024, 0.021756980568170547, 0.02277865633368492, 0.023800332099199295, 0.024822009727358818, 0.02584368735551834, 0.026865363121032715]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 5.0, 9.0, 18.0, 17.0, 36.0, 28.0, 54.0, 86.0, 109.0, 145.0, 241.0, 350.0, 586.0, 1116.0, 2731.0, 11544.0, 131478.0, 806315.0, 80297.0, 8596.0, 2250.0, 950.0, 534.0, 337.0, 205.0, 151.0, 98.0, 72.0, 41.0, 32.0, 36.0, 21.0, 13.0, 13.0, 10.0, 2.0, 2.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047821044921875, -0.04619550704956055, -0.044569969177246094, -0.04294443130493164, -0.04131889343261719, -0.039693355560302734, -0.03806781768798828, -0.03644227981567383, -0.034816741943359375, -0.03319120407104492, -0.03156566619873047, -0.029940128326416016, -0.028314590454101562, -0.02668905258178711, -0.025063514709472656, -0.023437976837158203, -0.02181243896484375, -0.020186901092529297, -0.018561363220214844, -0.01693582534790039, -0.015310287475585938, -0.013684749603271484, -0.012059211730957031, -0.010433673858642578, -0.008808135986328125, -0.007182598114013672, -0.005557060241699219, -0.003931522369384766, -0.0023059844970703125, -0.0006804466247558594, 0.0009450912475585938, 0.002570629119873047, 0.0041961669921875, 0.005821704864501953, 0.007447242736816406, 0.00907278060913086, 0.010698318481445312, 0.012323856353759766, 0.013949394226074219, 0.015574932098388672, 0.017200469970703125, 0.018826007843017578, 0.02045154571533203, 0.022077083587646484, 0.023702621459960938, 0.02532815933227539, 0.026953697204589844, 0.028579235076904297, 0.03020477294921875, 0.0318303108215332, 0.033455848693847656, 0.03508138656616211, 0.03670692443847656, 0.038332462310791016, 0.03995800018310547, 0.04158353805541992, 0.043209075927734375, 0.04483461380004883, 0.04646015167236328, 0.048085689544677734, 0.04971122741699219, 0.05133676528930664, 0.052962303161621094, 0.05458784103393555, 0.05621337890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 19.0, 59.0, 177.0, 238.0, 229.0, 180.0, 63.0, 20.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04144287109375, -0.04037928581237793, -0.03931570053100586, -0.03825211524963379, -0.03718852996826172, -0.03612494468688965, -0.03506135940551758, -0.03399777412414551, -0.03293418884277344, -0.03187060356140137, -0.030807018280029297, -0.029743432998657227, -0.028679847717285156, -0.027616262435913086, -0.026552677154541016, -0.025489091873168945, -0.024425506591796875, -0.023361921310424805, -0.022298336029052734, -0.021234750747680664, -0.020171165466308594, -0.019107580184936523, -0.018043994903564453, -0.016980409622192383, -0.015916824340820312, -0.014853239059448242, -0.013789653778076172, -0.012726068496704102, -0.011662483215332031, -0.010598897933959961, -0.00953531265258789, -0.00847172737121582, -0.00740814208984375, -0.00634455680847168, -0.005280971527099609, -0.004217386245727539, -0.0031538009643554688, -0.0020902156829833984, -0.0010266304016113281, 3.695487976074219e-05, 0.0011005401611328125, 0.002164125442504883, 0.003227710723876953, 0.0042912960052490234, 0.005354881286621094, 0.006418466567993164, 0.007482051849365234, 0.008545637130737305, 0.009609222412109375, 0.010672807693481445, 0.011736392974853516, 0.012799978256225586, 0.013863563537597656, 0.014927148818969727, 0.015990734100341797, 0.017054319381713867, 0.018117904663085938, 0.019181489944458008, 0.020245075225830078, 0.02130866050720215, 0.02237224578857422, 0.02343583106994629, 0.02449941635131836, 0.02556300163269043, 0.0266265869140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 1.0, 6.0, 13.0, 10.0, 15.0, 31.0, 36.0, 81.0, 137.0, 305.0, 655.0, 1851.0, 5546.0, 23341.0, 200826.0, 669009.0, 123166.0, 16582.0, 4320.0, 1459.0, 597.0, 258.0, 118.0, 55.0, 41.0, 18.0, 15.0, 10.0, 5.0, 7.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.033416748046875, -0.03227996826171875, -0.0311431884765625, -0.03000640869140625, -0.02886962890625, -0.02773284912109375, -0.0265960693359375, -0.02545928955078125, -0.024322509765625, -0.02318572998046875, -0.0220489501953125, -0.02091217041015625, -0.019775390625, -0.01863861083984375, -0.0175018310546875, -0.01636505126953125, -0.015228271484375, -0.01409149169921875, -0.0129547119140625, -0.01181793212890625, -0.01068115234375, -0.00954437255859375, -0.0084075927734375, -0.00727081298828125, -0.006134033203125, -0.00499725341796875, -0.0038604736328125, -0.00272369384765625, -0.0015869140625, -0.00045013427734375, 0.0006866455078125, 0.00182342529296875, 0.002960205078125, 0.00409698486328125, 0.0052337646484375, 0.00637054443359375, 0.00750732421875, 0.00864410400390625, 0.0097808837890625, 0.01091766357421875, 0.012054443359375, 0.01319122314453125, 0.0143280029296875, 0.01546478271484375, 0.0166015625, 0.01773834228515625, 0.0188751220703125, 0.02001190185546875, 0.021148681640625, 0.02228546142578125, 0.0234222412109375, 0.02455902099609375, 0.02569580078125, 0.02683258056640625, 0.0279693603515625, 0.02910614013671875, 0.030242919921875, 0.03137969970703125, 0.0325164794921875, 0.03365325927734375, 0.0347900390625, 0.03592681884765625, 0.0370635986328125, 0.03820037841796875, 0.039337158203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 7.0, 4.0, 6.0, 19.0, 10.0, 16.0, 16.0, 16.0, 21.0, 33.0, 32.0, 44.0, 30.0, 42.0, 54.0, 60.0, 59.0, 60.0, 48.0, 55.0, 53.0, 43.0, 40.0, 31.0, 36.0, 31.0, 20.0, 17.0, 18.0, 14.0, 10.0, 9.0, 9.0, 6.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02130126953125, -0.02065873146057129, -0.020016193389892578, -0.019373655319213867, -0.018731117248535156, -0.018088579177856445, -0.017446041107177734, -0.016803503036499023, -0.016160964965820312, -0.015518426895141602, -0.01487588882446289, -0.01423335075378418, -0.013590812683105469, -0.012948274612426758, -0.012305736541748047, -0.011663198471069336, -0.011020660400390625, -0.010378122329711914, -0.009735584259033203, -0.009093046188354492, -0.008450508117675781, -0.00780797004699707, -0.007165431976318359, -0.0065228939056396484, -0.0058803558349609375, -0.0052378177642822266, -0.004595279693603516, -0.003952741622924805, -0.0033102035522460938, -0.002667665481567383, -0.002025127410888672, -0.001382589340209961, -0.00074005126953125, -9.751319885253906e-05, 0.0005450248718261719, 0.0011875629425048828, 0.0018301010131835938, 0.0024726390838623047, 0.0031151771545410156, 0.0037577152252197266, 0.0044002532958984375, 0.0050427913665771484, 0.005685329437255859, 0.00632786750793457, 0.006970405578613281, 0.007612943649291992, 0.008255481719970703, 0.008898019790649414, 0.009540557861328125, 0.010183095932006836, 0.010825634002685547, 0.011468172073364258, 0.012110710144042969, 0.01275324821472168, 0.01339578628540039, 0.014038324356079102, 0.014680862426757812, 0.015323400497436523, 0.015965938568115234, 0.016608476638793945, 0.017251014709472656, 0.017893552780151367, 0.018536090850830078, 0.01917862892150879, 0.0198211669921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 15.0, 17.0, 19.0, 33.0, 38.0, 52.0, 75.0, 82.0, 121.0, 217.0, 320.0, 438.0, 683.0, 1075.0, 1841.0, 3041.0, 5687.0, 11337.0, 27492.0, 114548.0, 687379.0, 137549.0, 29893.0, 12130.0, 5872.0, 3330.0, 1915.0, 1160.0, 721.0, 450.0, 309.0, 203.0, 142.0, 103.0, 65.0, 54.0, 42.0, 30.0, 25.0, 10.0, 13.0, 4.0, 5.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.012979388236999512, -0.012508153915405273, -0.012036919593811035, -0.011565685272216797, -0.011094450950622559, -0.01062321662902832, -0.010151982307434082, -0.009680747985839844, -0.009209513664245605, -0.008738279342651367, -0.008267045021057129, -0.007795810699462891, -0.007324576377868652, -0.006853342056274414, -0.006382107734680176, -0.0059108734130859375, -0.005439639091491699, -0.004968404769897461, -0.004497170448303223, -0.004025936126708984, -0.003554701805114746, -0.003083467483520508, -0.0026122331619262695, -0.0021409988403320312, -0.001669764518737793, -0.0011985301971435547, -0.0007272958755493164, -0.0002560615539550781, 0.00021517276763916016, 0.0006864070892333984, 0.0011576414108276367, 0.001628875732421875, 0.0021001100540161133, 0.0025713443756103516, 0.00304257869720459, 0.003513813018798828, 0.003985047340393066, 0.004456281661987305, 0.004927515983581543, 0.005398750305175781, 0.0058699846267700195, 0.006341218948364258, 0.006812453269958496, 0.007283687591552734, 0.007754921913146973, 0.008226156234741211, 0.00869739055633545, 0.009168624877929688, 0.009639859199523926, 0.010111093521118164, 0.010582327842712402, 0.01105356216430664, 0.011524796485900879, 0.011996030807495117, 0.012467265129089355, 0.012938499450683594, 0.013409733772277832, 0.01388096809387207, 0.014352202415466309, 0.014823436737060547, 0.015294671058654785, 0.015765905380249023, 0.01623713970184326, 0.0167083740234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 5.0, 10.0, 7.0, 12.0, 14.0, 19.0, 18.0, 33.0, 31.0, 44.0, 86.0, 67.0, 86.0, 80.0, 70.0, 76.0, 51.0, 65.0, 59.0, 45.0, 22.0, 21.0, 21.0, 8.0, 15.0, 14.0, 7.0, 5.0, 2.0, 1.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.753206253051758e-05, -6.52587041258812e-05, -6.298534572124481e-05, -6.071198731660843e-05, -5.8438628911972046e-05, -5.616527050733566e-05, -5.389191210269928e-05, -5.16185536980629e-05, -4.9345195293426514e-05, -4.707183688879013e-05, -4.479847848415375e-05, -4.2525120079517365e-05, -4.025176167488098e-05, -3.79784032702446e-05, -3.5705044865608215e-05, -3.343168646097183e-05, -3.115832805633545e-05, -2.8884969651699066e-05, -2.6611611247062683e-05, -2.43382528424263e-05, -2.2064894437789917e-05, -1.9791536033153534e-05, -1.751817762851715e-05, -1.5244819223880768e-05, -1.2971460819244385e-05, -1.0698102414608002e-05, -8.424744009971619e-06, -6.151385605335236e-06, -3.8780272006988525e-06, -1.6046687960624695e-06, 6.686896085739136e-07, 2.9420480132102966e-06, 5.21540641784668e-06, 7.488764822483063e-06, 9.762123227119446e-06, 1.2035481631755829e-05, 1.4308840036392212e-05, 1.6582198441028595e-05, 1.8855556845664978e-05, 2.112891525030136e-05, 2.3402273654937744e-05, 2.5675632059574127e-05, 2.794899046421051e-05, 3.0222348868846893e-05, 3.2495707273483276e-05, 3.476906567811966e-05, 3.704242408275604e-05, 3.9315782487392426e-05, 4.158914089202881e-05, 4.386249929666519e-05, 4.6135857701301575e-05, 4.840921610593796e-05, 5.068257451057434e-05, 5.2955932915210724e-05, 5.522929131984711e-05, 5.750264972448349e-05, 5.977600812911987e-05, 6.204936653375626e-05, 6.432272493839264e-05, 6.659608334302902e-05, 6.88694417476654e-05, 7.114280015230179e-05, 7.341615855693817e-05, 7.568951696157455e-05, 7.796287536621094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 8.0, 7.0, 10.0, 9.0, 28.0, 35.0, 52.0, 92.0, 151.0, 228.0, 385.0, 596.0, 1066.0, 1817.0, 3368.0, 6336.0, 13436.0, 32492.0, 107862.0, 565432.0, 227436.0, 50265.0, 18809.0, 8593.0, 4333.0, 2384.0, 1289.0, 758.0, 519.0, 283.0, 165.0, 106.0, 66.0, 36.0, 25.0, 23.0, 10.0, 12.0, 12.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0120849609375, -0.011703848838806152, -0.011322736740112305, -0.010941624641418457, -0.01056051254272461, -0.010179400444030762, -0.009798288345336914, -0.009417176246643066, -0.009036064147949219, -0.008654952049255371, -0.008273839950561523, -0.007892727851867676, -0.007511615753173828, -0.0071305036544799805, -0.006749391555786133, -0.006368279457092285, -0.0059871673583984375, -0.00560605525970459, -0.005224943161010742, -0.0048438310623168945, -0.004462718963623047, -0.004081606864929199, -0.0037004947662353516, -0.003319382667541504, -0.0029382705688476562, -0.0025571584701538086, -0.002176046371459961, -0.0017949342727661133, -0.0014138221740722656, -0.001032710075378418, -0.0006515979766845703, -0.00027048587799072266, 0.000110626220703125, 0.0004917383193969727, 0.0008728504180908203, 0.001253962516784668, 0.0016350746154785156, 0.0020161867141723633, 0.002397298812866211, 0.0027784109115600586, 0.0031595230102539062, 0.003540635108947754, 0.0039217472076416016, 0.004302859306335449, 0.004683971405029297, 0.0050650835037231445, 0.005446195602416992, 0.00582730770111084, 0.0062084197998046875, 0.006589531898498535, 0.006970643997192383, 0.0073517560958862305, 0.007732868194580078, 0.008113980293273926, 0.008495092391967773, 0.008876204490661621, 0.009257316589355469, 0.009638428688049316, 0.010019540786743164, 0.010400652885437012, 0.01078176498413086, 0.011162877082824707, 0.011543989181518555, 0.011925101280212402, 0.01230621337890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 11.0, 9.0, 4.0, 16.0, 11.0, 25.0, 40.0, 81.0, 164.0, 223.0, 151.0, 75.0, 39.0, 24.0, 19.0, 11.0, 13.0, 8.0, 10.0, 3.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.014251708984375, -0.013826489448547363, -0.013401269912719727, -0.01297605037689209, -0.012550830841064453, -0.012125611305236816, -0.01170039176940918, -0.011275172233581543, -0.010849952697753906, -0.01042473316192627, -0.009999513626098633, -0.009574294090270996, -0.00914907455444336, -0.008723855018615723, -0.008298635482788086, -0.00787341594696045, -0.0074481964111328125, -0.007022976875305176, -0.006597757339477539, -0.006172537803649902, -0.005747318267822266, -0.005322098731994629, -0.004896879196166992, -0.0044716596603393555, -0.004046440124511719, -0.003621220588684082, -0.0031960010528564453, -0.0027707815170288086, -0.002345561981201172, -0.0019203424453735352, -0.0014951229095458984, -0.0010699033737182617, -0.000644683837890625, -0.00021946430206298828, 0.00020575523376464844, 0.0006309747695922852, 0.0010561943054199219, 0.0014814138412475586, 0.0019066333770751953, 0.002331852912902832, 0.0027570724487304688, 0.0031822919845581055, 0.003607511520385742, 0.004032731056213379, 0.004457950592041016, 0.004883170127868652, 0.005308389663696289, 0.005733609199523926, 0.0061588287353515625, 0.006584048271179199, 0.007009267807006836, 0.007434487342834473, 0.00785970687866211, 0.008284926414489746, 0.008710145950317383, 0.00913536548614502, 0.009560585021972656, 0.009985804557800293, 0.01041102409362793, 0.010836243629455566, 0.011261463165283203, 0.01168668270111084, 0.012111902236938477, 0.012537121772766113, 0.01296234130859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 12.0, 82.0, 519.0, 353.0, 39.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2535634934902191, -0.23243510723114014, -0.21130673587322235, -0.19017834961414337, -0.16904997825622559, -0.1479215919971466, -0.12679320573806763, -0.10566483438014984, -0.08453644812107086, -0.06340806931257248, -0.0422796867787838, -0.021151304244995117, -2.292543649673462e-05, 0.021105453372001648, 0.04223383963108063, 0.06336221098899841, 0.08449059724807739, 0.10561897605657578, 0.12674735486507416, 0.14787574112415314, 0.16900411248207092, 0.1901324987411499, 0.21126088500022888, 0.23238925635814667, 0.25351762771606445, 0.27464601397514343, 0.2957744002342224, 0.316902756690979, 0.338031142950058, 0.35915952920913696, 0.38028791546821594, 0.4014163017272949, 0.4225446581840515, 0.4436730444431305, 0.4648014307022095, 0.48592978715896606, 0.5070582032203674, 0.528186559677124, 0.5493149757385254, 0.570443332195282, 0.5915716886520386, 0.6127000451087952, 0.6338284611701965, 0.6549568176269531, 0.6760852336883545, 0.6972135901451111, 0.7183419466018677, 0.739470362663269, 0.7605987787246704, 0.781727135181427, 0.8028555512428284, 0.823983907699585, 0.8451123237609863, 0.8662406802177429, 0.8873690366744995, 0.9084974527359009, 0.9296258091926575, 0.9507541656494141, 0.9718825817108154, 0.993010938167572, 1.0141392946243286, 1.03526771068573, 1.0563961267471313, 1.0775244235992432, 1.0986528396606445]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 8.0, 15.0, 16.0, 22.0, 31.0, 18.0, 30.0, 45.0, 33.0, 59.0, 45.0, 52.0, 50.0, 59.0, 41.0, 37.0, 40.0, 49.0, 32.0, 28.0, 28.0, 32.0, 36.0, 34.0, 23.0, 32.0, 15.0, 12.0, 10.0, 7.0, 4.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05206841230392456, -0.050088535994291306, -0.04810865968465805, -0.046128787100315094, -0.04414891079068184, -0.042169034481048584, -0.04018916189670563, -0.03820928558707237, -0.03622940927743912, -0.03424953296780586, -0.03226965665817261, -0.03028978407382965, -0.028309907764196396, -0.02633003145456314, -0.024350157007575035, -0.02237028256058693, -0.020390406250953674, -0.01841052994132042, -0.016430655494332314, -0.014450780116021633, -0.012470904737710953, -0.010491029359400272, -0.008511153981089592, -0.006531278602778912, -0.004551403224468231, -0.002571527846157551, -0.0005916524678468704, 0.00138822291046381, 0.0033680982887744904, 0.005347973667085171, 0.007327849045395851, 0.009307724423706532, 0.011287599802017212, 0.013267475180327892, 0.015247350558638573, 0.01722722500562668, 0.019207101315259933, 0.02118697762489319, 0.023166852071881294, 0.0251467265188694, 0.027126602828502655, 0.02910647913813591, 0.031086353585124016, 0.03306622803211212, 0.03504610434174538, 0.03702598065137863, 0.03900585323572159, 0.04098572954535484, 0.0429656058549881, 0.04494548216462135, 0.04692535847425461, 0.048905231058597565, 0.05088510736823082, 0.052864983677864075, 0.05484485626220703, 0.056824732571840286, 0.05880460888147354, 0.060784485191106796, 0.06276436150074005, 0.06474423408508301, 0.06672410666942596, 0.06870398670434952, 0.07068385928869247, 0.07266373932361603, 0.07464361190795898]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 13.0, 23.0, 28.0, 29.0, 35.0, 52.0, 109.0, 164.0, 279.0, 532.0, 1118.0, 2951.0, 11087.0, 97873.0, 3886780.0, 169458.0, 16260.0, 4284.0, 1686.0, 715.0, 327.0, 147.0, 84.0, 64.0, 47.0, 45.0, 16.0, 8.0, 10.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03831815719604492, -0.037177085876464844, -0.036036014556884766, -0.03489494323730469, -0.03375387191772461, -0.03261280059814453, -0.03147172927856445, -0.030330657958984375, -0.029189586639404297, -0.02804851531982422, -0.02690744400024414, -0.025766372680664062, -0.024625301361083984, -0.023484230041503906, -0.022343158721923828, -0.02120208740234375, -0.020061016082763672, -0.018919944763183594, -0.017778873443603516, -0.016637802124023438, -0.01549673080444336, -0.014355659484863281, -0.013214588165283203, -0.012073516845703125, -0.010932445526123047, -0.009791374206542969, -0.00865030288696289, -0.0075092315673828125, -0.006368160247802734, -0.005227088928222656, -0.004086017608642578, -0.0029449462890625, -0.0018038749694824219, -0.0006628036499023438, 0.0004782676696777344, 0.0016193389892578125, 0.0027604103088378906, 0.0039014816284179688, 0.005042552947998047, 0.006183624267578125, 0.007324695587158203, 0.008465766906738281, 0.00960683822631836, 0.010747909545898438, 0.011888980865478516, 0.013030052185058594, 0.014171123504638672, 0.01531219482421875, 0.016453266143798828, 0.017594337463378906, 0.018735408782958984, 0.019876480102539062, 0.02101755142211914, 0.02215862274169922, 0.023299694061279297, 0.024440765380859375, 0.025581836700439453, 0.02672290802001953, 0.02786397933959961, 0.029005050659179688, 0.030146121978759766, 0.031287193298339844, 0.03242826461791992, 0.0335693359375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 30.0, 99.0, 197.0, 260.0, 218.0, 120.0, 49.0, 10.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0418701171875, -0.04078531265258789, -0.03970050811767578, -0.03861570358276367, -0.03753089904785156, -0.03644609451293945, -0.035361289978027344, -0.034276485443115234, -0.033191680908203125, -0.032106876373291016, -0.031022071838378906, -0.029937267303466797, -0.028852462768554688, -0.027767658233642578, -0.02668285369873047, -0.02559804916381836, -0.02451324462890625, -0.02342844009399414, -0.02234363555908203, -0.021258831024169922, -0.020174026489257812, -0.019089221954345703, -0.018004417419433594, -0.016919612884521484, -0.015834808349609375, -0.014750003814697266, -0.013665199279785156, -0.012580394744873047, -0.011495590209960938, -0.010410785675048828, -0.009325981140136719, -0.00824117660522461, -0.0071563720703125, -0.006071567535400391, -0.004986763000488281, -0.003901958465576172, -0.0028171539306640625, -0.0017323493957519531, -0.0006475448608398438, 0.0004372596740722656, 0.001522064208984375, 0.0026068687438964844, 0.0036916732788085938, 0.004776477813720703, 0.0058612823486328125, 0.006946086883544922, 0.008030891418457031, 0.00911569595336914, 0.01020050048828125, 0.01128530502319336, 0.012370109558105469, 0.013454914093017578, 0.014539718627929688, 0.015624523162841797, 0.016709327697753906, 0.017794132232666016, 0.018878936767578125, 0.019963741302490234, 0.021048545837402344, 0.022133350372314453, 0.023218154907226562, 0.024302959442138672, 0.02538776397705078, 0.02647256851196289, 0.027557373046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 12.0, 9.0, 14.0, 20.0, 30.0, 48.0, 71.0, 76.0, 123.0, 220.0, 326.0, 505.0, 895.0, 1456.0, 2618.0, 4942.0, 9975.0, 22516.0, 56667.0, 177322.0, 1279409.0, 2281007.0, 233746.0, 70800.0, 26894.0, 11891.0, 5569.0, 3018.0, 1533.0, 939.0, 574.0, 355.0, 237.0, 152.0, 109.0, 74.0, 43.0, 30.0, 25.0, 12.0, 5.0, 4.0, 8.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01238250732421875, -0.01201939582824707, -0.01165628433227539, -0.011293172836303711, -0.010930061340332031, -0.010566949844360352, -0.010203838348388672, -0.009840726852416992, -0.009477615356445312, -0.009114503860473633, -0.008751392364501953, -0.008388280868530273, -0.008025169372558594, -0.007662057876586914, -0.007298946380615234, -0.006935834884643555, -0.006572723388671875, -0.006209611892700195, -0.005846500396728516, -0.005483388900756836, -0.005120277404785156, -0.0047571659088134766, -0.004394054412841797, -0.004030942916870117, -0.0036678314208984375, -0.003304719924926758, -0.002941608428955078, -0.0025784969329833984, -0.0022153854370117188, -0.001852273941040039, -0.0014891624450683594, -0.0011260509490966797, -0.000762939453125, -0.0003998279571533203, -3.6716461181640625e-05, 0.00032639503479003906, 0.0006895065307617188, 0.0010526180267333984, 0.0014157295227050781, 0.0017788410186767578, 0.0021419525146484375, 0.002505064010620117, 0.002868175506591797, 0.0032312870025634766, 0.0035943984985351562, 0.003957509994506836, 0.004320621490478516, 0.004683732986450195, 0.005046844482421875, 0.005409955978393555, 0.005773067474365234, 0.006136178970336914, 0.006499290466308594, 0.0068624019622802734, 0.007225513458251953, 0.007588624954223633, 0.007951736450195312, 0.008314847946166992, 0.008677959442138672, 0.009041070938110352, 0.009404182434082031, 0.009767293930053711, 0.01013040542602539, 0.01049351692199707, 0.01085662841796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 10.0, 15.0, 27.0, 30.0, 62.0, 71.0, 140.0, 194.0, 439.0, 1204.0, 1002.0, 327.0, 177.0, 110.0, 63.0, 54.0, 36.0, 29.0, 15.0, 14.0, 9.0, 10.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147857666015625, -0.014335870742797852, -0.013885974884033203, -0.013436079025268555, -0.012986183166503906, -0.012536287307739258, -0.01208639144897461, -0.011636495590209961, -0.011186599731445312, -0.010736703872680664, -0.010286808013916016, -0.009836912155151367, -0.009387016296386719, -0.00893712043762207, -0.008487224578857422, -0.008037328720092773, -0.007587432861328125, -0.0071375370025634766, -0.006687641143798828, -0.00623774528503418, -0.005787849426269531, -0.005337953567504883, -0.004888057708740234, -0.004438161849975586, -0.0039882659912109375, -0.003538370132446289, -0.0030884742736816406, -0.002638578414916992, -0.0021886825561523438, -0.0017387866973876953, -0.0012888908386230469, -0.0008389949798583984, -0.00038909912109375, 6.079673767089844e-05, 0.0005106925964355469, 0.0009605884552001953, 0.0014104843139648438, 0.0018603801727294922, 0.0023102760314941406, 0.002760171890258789, 0.0032100677490234375, 0.003659963607788086, 0.004109859466552734, 0.004559755325317383, 0.005009651184082031, 0.00545954704284668, 0.005909442901611328, 0.0063593387603759766, 0.006809234619140625, 0.0072591304779052734, 0.007709026336669922, 0.00815892219543457, 0.008608818054199219, 0.009058713912963867, 0.009508609771728516, 0.009958505630493164, 0.010408401489257812, 0.010858297348022461, 0.01130819320678711, 0.011758089065551758, 0.012207984924316406, 0.012657880783081055, 0.013107776641845703, 0.013557672500610352, 0.014007568359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 23.0, 73.0, 152.0, 232.0, 217.0, 152.0, 64.0, 45.0, 12.0, 9.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.122259221971035, -0.11855294555425644, -0.11484666913747787, -0.11114039272069931, -0.10743411630392075, -0.10372783988714218, -0.10002155601978302, -0.09631527960300446, -0.09260900318622589, -0.08890272676944733, -0.08519645035266876, -0.0814901739358902, -0.07778389751911163, -0.07407762110233307, -0.0703713446855545, -0.06666506826877594, -0.06295879185199738, -0.05925251543521881, -0.05554623901844025, -0.05183996260166168, -0.04813368618488312, -0.04442740976810455, -0.04072112962603569, -0.037014853209257126, -0.03330857679247856, -0.029602300375699997, -0.025896023958921432, -0.02218974567949772, -0.018483469262719154, -0.01477719284594059, -0.011070914566516876, -0.007364638149738312, -0.0036583691835403442, 4.790769889950752e-05, 0.0037541845813393593, 0.007460461929440498, 0.011166738346219063, 0.014873014762997627, 0.01857929304242134, 0.022285569459199905, 0.02599184587597847, 0.029698122292757034, 0.0334043987095356, 0.03711067885160446, 0.040816955268383026, 0.04452323168516159, 0.048229508101940155, 0.05193578451871872, 0.055642060935497284, 0.05934833735227585, 0.06305461376905441, 0.06676089018583298, 0.07046716660261154, 0.0741734430193901, 0.07787972688674927, 0.08158600330352783, 0.0852922797203064, 0.08899855613708496, 0.09270483255386353, 0.09641110897064209, 0.10011738538742065, 0.10382366180419922, 0.10752993822097778, 0.11123621463775635, 0.11494249105453491]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 17.0, 13.0, 17.0, 25.0, 36.0, 32.0, 35.0, 38.0, 45.0, 45.0, 57.0, 52.0, 59.0, 57.0, 47.0, 64.0, 59.0, 49.0, 34.0, 31.0, 31.0, 26.0, 24.0, 23.0, 13.0, 8.0, 13.0, 11.0, 10.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042626380920410156, -0.041429273784160614, -0.04023216292262077, -0.03903505206108093, -0.03783794492483139, -0.03664083778858185, -0.03544372692704201, -0.03424661606550217, -0.033049508929252625, -0.03185240179300308, -0.03065529093146324, -0.02945818193256855, -0.02826107293367386, -0.027063963934779167, -0.025866854935884476, -0.024669745936989784, -0.023472636938095093, -0.0222755279392004, -0.02107841894030571, -0.01988130994141102, -0.018684200942516327, -0.017487091943621635, -0.016289982944726944, -0.015092873945832253, -0.013895764946937561, -0.01269865594804287, -0.011501546949148178, -0.010304437950253487, -0.009107328951358795, -0.007910219952464104, -0.006713110953569412, -0.005516001954674721, -0.004318892955780029, -0.003121783956885338, -0.0019246749579906464, -0.0007275659590959549, 0.00046954303979873657, 0.001666652038693428, 0.0028637610375881195, 0.004060870036482811, 0.0052579790353775024, 0.006455088034272194, 0.007652197033166885, 0.008849306032061577, 0.010046415030956268, 0.01124352402985096, 0.012440633028745651, 0.013637742027640343, 0.014834851026535034, 0.016031960025429726, 0.017229069024324417, 0.01842617802321911, 0.0196232870221138, 0.02082039602100849, 0.022017505019903183, 0.023214614018797874, 0.024411723017692566, 0.025608832016587257, 0.02680594101548195, 0.02800305001437664, 0.029200159013271332, 0.030397268012166023, 0.031594377011060715, 0.032791487872600555, 0.0339885950088501]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 4.0, 14.0, 32.0, 21.0, 39.0, 43.0, 69.0, 101.0, 160.0, 177.0, 313.0, 490.0, 841.0, 1721.0, 4792.0, 26078.0, 328252.0, 623343.0, 49813.0, 7385.0, 2150.0, 1010.0, 525.0, 377.0, 245.0, 152.0, 99.0, 78.0, 55.0, 43.0, 32.0, 22.0, 15.0, 16.0, 6.0, 8.0, 5.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.046875, -0.045416831970214844, -0.04395866394042969, -0.04250049591064453, -0.041042327880859375, -0.03958415985107422, -0.03812599182128906, -0.036667823791503906, -0.03520965576171875, -0.033751487731933594, -0.03229331970214844, -0.03083515167236328, -0.029376983642578125, -0.02791881561279297, -0.026460647583007812, -0.025002479553222656, -0.0235443115234375, -0.022086143493652344, -0.020627975463867188, -0.01916980743408203, -0.017711639404296875, -0.01625347137451172, -0.014795303344726562, -0.013337135314941406, -0.01187896728515625, -0.010420799255371094, -0.008962631225585938, -0.007504463195800781, -0.006046295166015625, -0.004588127136230469, -0.0031299591064453125, -0.0016717910766601562, -0.000213623046875, 0.0012445449829101562, 0.0027027130126953125, 0.004160881042480469, 0.005619049072265625, 0.007077217102050781, 0.008535385131835938, 0.009993553161621094, 0.01145172119140625, 0.012909889221191406, 0.014368057250976562, 0.01582622528076172, 0.017284393310546875, 0.01874256134033203, 0.020200729370117188, 0.021658897399902344, 0.0231170654296875, 0.024575233459472656, 0.026033401489257812, 0.02749156951904297, 0.028949737548828125, 0.03040790557861328, 0.03186607360839844, 0.033324241638183594, 0.03478240966796875, 0.036240577697753906, 0.03769874572753906, 0.03915691375732422, 0.040615081787109375, 0.04207324981689453, 0.04353141784667969, 0.044989585876464844, 0.04644775390625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 10.0, 11.0, 54.0, 152.0, 232.0, 251.0, 170.0, 87.0, 25.0, 9.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043121337890625, -0.042018890380859375, -0.04091644287109375, -0.039813995361328125, -0.0387115478515625, -0.037609100341796875, -0.03650665283203125, -0.035404205322265625, -0.0343017578125, -0.033199310302734375, -0.03209686279296875, -0.030994415283203125, -0.0298919677734375, -0.028789520263671875, -0.02768707275390625, -0.026584625244140625, -0.025482177734375, -0.024379730224609375, -0.02327728271484375, -0.022174835205078125, -0.0210723876953125, -0.019969940185546875, -0.01886749267578125, -0.017765045166015625, -0.01666259765625, -0.015560150146484375, -0.01445770263671875, -0.013355255126953125, -0.0122528076171875, -0.011150360107421875, -0.01004791259765625, -0.008945465087890625, -0.007843017578125, -0.006740570068359375, -0.00563812255859375, -0.004535675048828125, -0.0034332275390625, -0.002330780029296875, -0.00122833251953125, -0.000125885009765625, 0.0009765625, 0.002079010009765625, 0.00318145751953125, 0.004283905029296875, 0.0053863525390625, 0.006488800048828125, 0.00759124755859375, 0.008693695068359375, 0.009796142578125, 0.010898590087890625, 0.01200103759765625, 0.013103485107421875, 0.0142059326171875, 0.015308380126953125, 0.01641082763671875, 0.017513275146484375, 0.01861572265625, 0.019718170166015625, 0.02082061767578125, 0.021923065185546875, 0.0230255126953125, 0.024127960205078125, 0.02523040771484375, 0.026332855224609375, 0.027435302734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 5.0, 13.0, 20.0, 37.0, 37.0, 85.0, 175.0, 307.0, 718.0, 1911.0, 5837.0, 22530.0, 135076.0, 614311.0, 221807.0, 33633.0, 7768.0, 2513.0, 918.0, 410.0, 171.0, 106.0, 43.0, 27.0, 22.0, 20.0, 11.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03076171875, -0.029788970947265625, -0.02881622314453125, -0.027843475341796875, -0.0268707275390625, -0.025897979736328125, -0.02492523193359375, -0.023952484130859375, -0.022979736328125, -0.022006988525390625, -0.02103424072265625, -0.020061492919921875, -0.0190887451171875, -0.018115997314453125, -0.01714324951171875, -0.016170501708984375, -0.01519775390625, -0.014225006103515625, -0.01325225830078125, -0.012279510498046875, -0.0113067626953125, -0.010334014892578125, -0.00936126708984375, -0.008388519287109375, -0.007415771484375, -0.006443023681640625, -0.00547027587890625, -0.004497528076171875, -0.0035247802734375, -0.002552032470703125, -0.00157928466796875, -0.000606536865234375, 0.0003662109375, 0.001338958740234375, 0.00231170654296875, 0.003284454345703125, 0.0042572021484375, 0.005229949951171875, 0.00620269775390625, 0.007175445556640625, 0.008148193359375, 0.009120941162109375, 0.01009368896484375, 0.011066436767578125, 0.0120391845703125, 0.013011932373046875, 0.01398468017578125, 0.014957427978515625, 0.01593017578125, 0.016902923583984375, 0.01787567138671875, 0.018848419189453125, 0.0198211669921875, 0.020793914794921875, 0.02176666259765625, 0.022739410400390625, 0.023712158203125, 0.024684906005859375, 0.02565765380859375, 0.026630401611328125, 0.0276031494140625, 0.028575897216796875, 0.02954864501953125, 0.030521392822265625, 0.031494140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 17.0, 15.0, 22.0, 21.0, 37.0, 40.0, 43.0, 52.0, 59.0, 65.0, 71.0, 88.0, 71.0, 79.0, 46.0, 50.0, 37.0, 45.0, 35.0, 25.0, 13.0, 13.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032470703125, -0.03155374526977539, -0.03063678741455078, -0.029719829559326172, -0.028802871704101562, -0.027885913848876953, -0.026968955993652344, -0.026051998138427734, -0.025135040283203125, -0.024218082427978516, -0.023301124572753906, -0.022384166717529297, -0.021467208862304688, -0.020550251007080078, -0.01963329315185547, -0.01871633529663086, -0.01779937744140625, -0.01688241958618164, -0.01596546173095703, -0.015048503875732422, -0.014131546020507812, -0.013214588165283203, -0.012297630310058594, -0.011380672454833984, -0.010463714599609375, -0.009546756744384766, -0.008629798889160156, -0.007712841033935547, -0.0067958831787109375, -0.005878925323486328, -0.004961967468261719, -0.004045009613037109, -0.0031280517578125, -0.0022110939025878906, -0.0012941360473632812, -0.0003771781921386719, 0.0005397796630859375, 0.0014567375183105469, 0.0023736953735351562, 0.0032906532287597656, 0.004207611083984375, 0.005124568939208984, 0.006041526794433594, 0.006958484649658203, 0.007875442504882812, 0.008792400360107422, 0.009709358215332031, 0.01062631607055664, 0.01154327392578125, 0.01246023178100586, 0.013377189636230469, 0.014294147491455078, 0.015211105346679688, 0.016128063201904297, 0.017045021057128906, 0.017961978912353516, 0.018878936767578125, 0.019795894622802734, 0.020712852478027344, 0.021629810333251953, 0.022546768188476562, 0.023463726043701172, 0.02438068389892578, 0.02529764175415039, 0.026214599609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 9.0, 6.0, 32.0, 40.0, 62.0, 117.0, 229.0, 437.0, 952.0, 1809.0, 3887.0, 8684.0, 26164.0, 140934.0, 714989.0, 112494.0, 22663.0, 7994.0, 3549.0, 1705.0, 841.0, 427.0, 236.0, 126.0, 65.0, 27.0, 20.0, 14.0, 8.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019927978515625, -0.019365787506103516, -0.01880359649658203, -0.018241405487060547, -0.017679214477539062, -0.017117023468017578, -0.016554832458496094, -0.01599264144897461, -0.015430450439453125, -0.01486825942993164, -0.014306068420410156, -0.013743877410888672, -0.013181686401367188, -0.012619495391845703, -0.012057304382324219, -0.011495113372802734, -0.01093292236328125, -0.010370731353759766, -0.009808540344238281, -0.009246349334716797, -0.008684158325195312, -0.008121967315673828, -0.007559776306152344, -0.006997585296630859, -0.006435394287109375, -0.005873203277587891, -0.005311012268066406, -0.004748821258544922, -0.0041866302490234375, -0.003624439239501953, -0.0030622482299804688, -0.0025000572204589844, -0.0019378662109375, -0.0013756752014160156, -0.0008134841918945312, -0.0002512931823730469, 0.0003108978271484375, 0.0008730888366699219, 0.0014352798461914062, 0.0019974708557128906, 0.002559661865234375, 0.0031218528747558594, 0.0036840438842773438, 0.004246234893798828, 0.0048084259033203125, 0.005370616912841797, 0.005932807922363281, 0.006494998931884766, 0.00705718994140625, 0.007619380950927734, 0.008181571960449219, 0.008743762969970703, 0.009305953979492188, 0.009868144989013672, 0.010430335998535156, 0.01099252700805664, 0.011554718017578125, 0.01211690902709961, 0.012679100036621094, 0.013241291046142578, 0.013803482055664062, 0.014365673065185547, 0.014927864074707031, 0.015490055084228516, 0.01605224609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 9.0, 7.0, 6.0, 8.0, 17.0, 21.0, 33.0, 36.0, 61.0, 83.0, 85.0, 98.0, 129.0, 101.0, 64.0, 58.0, 32.0, 44.0, 22.0, 24.0, 7.0, 12.0, 6.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.832050323486328e-05, -7.60173425078392e-05, -7.371418178081512e-05, -7.141102105379105e-05, -6.910786032676697e-05, -6.680469959974289e-05, -6.450153887271881e-05, -6.219837814569473e-05, -5.9895217418670654e-05, -5.7592056691646576e-05, -5.52888959646225e-05, -5.298573523759842e-05, -5.068257451057434e-05, -4.837941378355026e-05, -4.6076253056526184e-05, -4.3773092329502106e-05, -4.146993160247803e-05, -3.916677087545395e-05, -3.686361014842987e-05, -3.456044942140579e-05, -3.2257288694381714e-05, -2.9954127967357635e-05, -2.7650967240333557e-05, -2.534780651330948e-05, -2.30446457862854e-05, -2.0741485059261322e-05, -1.8438324332237244e-05, -1.6135163605213165e-05, -1.3832002878189087e-05, -1.1528842151165009e-05, -9.22568142414093e-06, -6.922520697116852e-06, -4.6193599700927734e-06, -2.316199243068695e-06, -1.30385160446167e-08, 2.2901222109794617e-06, 4.59328293800354e-06, 6.896443665027618e-06, 9.199604392051697e-06, 1.1502765119075775e-05, 1.3805925846099854e-05, 1.6109086573123932e-05, 1.841224730014801e-05, 2.071540802717209e-05, 2.3018568754196167e-05, 2.5321729481220245e-05, 2.7624890208244324e-05, 2.9928050935268402e-05, 3.223121166229248e-05, 3.453437238931656e-05, 3.683753311634064e-05, 3.9140693843364716e-05, 4.1443854570388794e-05, 4.374701529741287e-05, 4.605017602443695e-05, 4.835333675146103e-05, 5.065649747848511e-05, 5.2959658205509186e-05, 5.5262818932533264e-05, 5.756597965955734e-05, 5.986914038658142e-05, 6.21723011136055e-05, 6.447546184062958e-05, 6.677862256765366e-05, 6.908178329467773e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 10.0, 15.0, 19.0, 34.0, 60.0, 109.0, 234.0, 387.0, 828.0, 1857.0, 4155.0, 11138.0, 38319.0, 269418.0, 627249.0, 67458.0, 16687.0, 5959.0, 2437.0, 1122.0, 495.0, 239.0, 145.0, 71.0, 39.0, 21.0, 12.0, 7.0, 8.0, 1.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017425537109375, -0.016828298568725586, -0.016231060028076172, -0.015633821487426758, -0.015036582946777344, -0.01443934440612793, -0.013842105865478516, -0.013244867324829102, -0.012647628784179688, -0.012050390243530273, -0.01145315170288086, -0.010855913162231445, -0.010258674621582031, -0.009661436080932617, -0.009064197540283203, -0.008466958999633789, -0.007869720458984375, -0.007272481918334961, -0.006675243377685547, -0.006078004837036133, -0.005480766296386719, -0.004883527755737305, -0.004286289215087891, -0.0036890506744384766, -0.0030918121337890625, -0.0024945735931396484, -0.0018973350524902344, -0.0013000965118408203, -0.0007028579711914062, -0.00010561943054199219, 0.0004916191101074219, 0.001088857650756836, 0.00168609619140625, 0.002283334732055664, 0.002880573272705078, 0.003477811813354492, 0.004075050354003906, 0.00467228889465332, 0.005269527435302734, 0.0058667659759521484, 0.0064640045166015625, 0.0070612430572509766, 0.007658481597900391, 0.008255720138549805, 0.008852958679199219, 0.009450197219848633, 0.010047435760498047, 0.010644674301147461, 0.011241912841796875, 0.011839151382446289, 0.012436389923095703, 0.013033628463745117, 0.013630867004394531, 0.014228105545043945, 0.01482534408569336, 0.015422582626342773, 0.016019821166992188, 0.0166170597076416, 0.017214298248291016, 0.01781153678894043, 0.018408775329589844, 0.019006013870239258, 0.019603252410888672, 0.020200490951538086, 0.0207977294921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 3.0, 9.0, 8.0, 2.0, 8.0, 11.0, 16.0, 36.0, 44.0, 71.0, 130.0, 242.0, 171.0, 83.0, 48.0, 31.0, 17.0, 18.0, 6.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01788330078125, -0.017351627349853516, -0.01681995391845703, -0.016288280487060547, -0.015756607055664062, -0.015224933624267578, -0.014693260192871094, -0.01416158676147461, -0.013629913330078125, -0.01309823989868164, -0.012566566467285156, -0.012034893035888672, -0.011503219604492188, -0.010971546173095703, -0.010439872741699219, -0.009908199310302734, -0.00937652587890625, -0.008844852447509766, -0.008313179016113281, -0.007781505584716797, -0.0072498321533203125, -0.006718158721923828, -0.006186485290527344, -0.005654811859130859, -0.005123138427734375, -0.004591464996337891, -0.004059791564941406, -0.003528118133544922, -0.0029964447021484375, -0.002464771270751953, -0.0019330978393554688, -0.0014014244079589844, -0.0008697509765625, -0.0003380775451660156, 0.00019359588623046875, 0.0007252693176269531, 0.0012569427490234375, 0.0017886161804199219, 0.0023202896118164062, 0.0028519630432128906, 0.003383636474609375, 0.003915309906005859, 0.004446983337402344, 0.004978656768798828, 0.0055103302001953125, 0.006042003631591797, 0.006573677062988281, 0.007105350494384766, 0.00763702392578125, 0.008168697357177734, 0.008700370788574219, 0.009232044219970703, 0.009763717651367188, 0.010295391082763672, 0.010827064514160156, 0.01135873794555664, 0.011890411376953125, 0.01242208480834961, 0.012953758239746094, 0.013485431671142578, 0.014017105102539062, 0.014548778533935547, 0.015080451965332031, 0.015612125396728516, 0.016143798828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 27.0, 765.0, 218.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24215254187583923, -0.2005024403333664, -0.15885233879089355, -0.11720222234725952, -0.07555212080478668, -0.03390201926231384, 0.00774809718132019, 0.049398183822631836, 0.09104830026626587, 0.1326984018087387, 0.17434850335121155, 0.21599861979484558, 0.2576487064361572, 0.29929882287979126, 0.3409489393234253, 0.38259902596473694, 0.42424914240837097, 0.465899258852005, 0.5075493454933167, 0.5491994619369507, 0.5908495783805847, 0.6324996948242188, 0.674149751663208, 0.715799868106842, 0.7574499845504761, 0.7991001009941101, 0.8407502174377441, 0.8824002742767334, 0.9240503907203674, 0.9657005071640015, 1.0073506832122803, 1.0490007400512695, 1.0906509160995483, 1.1323009729385376, 1.1739511489868164, 1.2156012058258057, 1.2572513818740845, 1.2989014387130737, 1.3405516147613525, 1.3822016716003418, 1.423851728439331, 1.4655017852783203, 1.5071519613265991, 1.5488020181655884, 1.5904521942138672, 1.6321022510528564, 1.6737523078918457, 1.7154024839401245, 1.7570526599884033, 1.7987027168273926, 1.8403528928756714, 1.8820029497146606, 1.9236531257629395, 1.9653031826019287, 2.006953239440918, 2.0486032962799072, 2.0902533531188965, 2.1319034099578857, 2.173553466796875, 2.2152037620544434, 2.2568538188934326, 2.298503875732422, 2.340153932571411, 2.3818039894104004, 2.4234542846679688]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 0.0, 8.0, 4.0, 6.0, 10.0, 11.0, 12.0, 18.0, 23.0, 24.0, 24.0, 22.0, 26.0, 46.0, 46.0, 45.0, 37.0, 49.0, 52.0, 53.0, 45.0, 41.0, 44.0, 43.0, 47.0, 44.0, 28.0, 30.0, 28.0, 26.0, 23.0, 13.0, 17.0, 14.0, 17.0, 8.0, 8.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08045566082000732, -0.07813984900712967, -0.07582403719425201, -0.07350822538137436, -0.0711924135684967, -0.06887660175561905, -0.0665607899427414, -0.06424497812986374, -0.061929166316986084, -0.05961335450410843, -0.057297542691230774, -0.05498173087835312, -0.052665919065475464, -0.05035010725259781, -0.048034295439720154, -0.0457184836268425, -0.043402671813964844, -0.04108686000108719, -0.038771048188209534, -0.03645523637533188, -0.034139424562454224, -0.03182361274957657, -0.029507800936698914, -0.02719198912382126, -0.024876177310943604, -0.02256036549806595, -0.020244553685188293, -0.01792874187231064, -0.015612930059432983, -0.013297118246555328, -0.010981306433677673, -0.008665494620800018, -0.006349682807922363, -0.004033870995044708, -0.0017180591821670532, 0.0005977526307106018, 0.002913564443588257, 0.005229376256465912, 0.007545188069343567, 0.009860999882221222, 0.012176811695098877, 0.014492623507976532, 0.016808435320854187, 0.019124247133731842, 0.021440058946609497, 0.023755870759487152, 0.026071682572364807, 0.028387494385242462, 0.030703306198120117, 0.03301911801099777, 0.03533492982387543, 0.03765074163675308, 0.03996655344963074, 0.04228236526250839, 0.04459817707538605, 0.0469139888882637, 0.04922980070114136, 0.05154561251401901, 0.05386142432689667, 0.05617723613977432, 0.05849304795265198, 0.06080885976552963, 0.06312467157840729, 0.06544048339128494, 0.0677562952041626]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 12.0, 15.0, 28.0, 72.0, 111.0, 331.0, 1032.0, 9465.0, 3977194.0, 200307.0, 4610.0, 771.0, 195.0, 78.0, 35.0, 13.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08599853515625, -0.08337783813476562, -0.08075714111328125, -0.07813644409179688, -0.0755157470703125, -0.07289505004882812, -0.07027435302734375, -0.06765365600585938, -0.065032958984375, -0.062412261962890625, -0.05979156494140625, -0.057170867919921875, -0.0545501708984375, -0.051929473876953125, -0.04930877685546875, -0.046688079833984375, -0.0440673828125, -0.041446685791015625, -0.03882598876953125, -0.036205291748046875, -0.0335845947265625, -0.030963897705078125, -0.02834320068359375, -0.025722503662109375, -0.023101806640625, -0.020481109619140625, -0.01786041259765625, -0.015239715576171875, -0.0126190185546875, -0.009998321533203125, -0.00737762451171875, -0.004756927490234375, -0.00213623046875, 0.000484466552734375, 0.00310516357421875, 0.005725860595703125, 0.0083465576171875, 0.010967254638671875, 0.01358795166015625, 0.016208648681640625, 0.018829345703125, 0.021450042724609375, 0.02407073974609375, 0.026691436767578125, 0.0293121337890625, 0.031932830810546875, 0.03455352783203125, 0.037174224853515625, 0.039794921875, 0.042415618896484375, 0.04503631591796875, 0.047657012939453125, 0.0502777099609375, 0.052898406982421875, 0.05551910400390625, 0.058139801025390625, 0.060760498046875, 0.06338119506835938, 0.06600189208984375, 0.06862258911132812, 0.0712432861328125, 0.07386398315429688, 0.07648468017578125, 0.07910537719726562, 0.08172607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 23.0, 56.0, 146.0, 224.0, 249.0, 174.0, 81.0, 33.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04217529296875, -0.04109692573547363, -0.040018558502197266, -0.0389401912689209, -0.03786182403564453, -0.036783456802368164, -0.0357050895690918, -0.03462672233581543, -0.03354835510253906, -0.032469987869262695, -0.03139162063598633, -0.03031325340270996, -0.029234886169433594, -0.028156518936157227, -0.02707815170288086, -0.025999784469604492, -0.024921417236328125, -0.023843050003051758, -0.02276468276977539, -0.021686315536499023, -0.020607948303222656, -0.01952958106994629, -0.018451213836669922, -0.017372846603393555, -0.016294479370117188, -0.01521611213684082, -0.014137744903564453, -0.013059377670288086, -0.011981010437011719, -0.010902643203735352, -0.009824275970458984, -0.008745908737182617, -0.00766754150390625, -0.006589174270629883, -0.005510807037353516, -0.0044324398040771484, -0.0033540725708007812, -0.002275705337524414, -0.0011973381042480469, -0.00011897087097167969, 0.0009593963623046875, 0.0020377635955810547, 0.003116130828857422, 0.004194498062133789, 0.005272865295410156, 0.0063512325286865234, 0.007429599761962891, 0.008507966995239258, 0.009586334228515625, 0.010664701461791992, 0.01174306869506836, 0.012821435928344727, 0.013899803161621094, 0.014978170394897461, 0.016056537628173828, 0.017134904861450195, 0.018213272094726562, 0.01929163932800293, 0.020370006561279297, 0.021448373794555664, 0.02252674102783203, 0.0236051082611084, 0.024683475494384766, 0.025761842727661133, 0.0268402099609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 3.0, 12.0, 26.0, 22.0, 26.0, 31.0, 61.0, 99.0, 120.0, 170.0, 253.0, 420.0, 627.0, 999.0, 1801.0, 3672.0, 8166.0, 21239.0, 66483.0, 285304.0, 3055242.0, 594814.0, 103157.0, 30498.0, 10873.0, 4625.0, 2212.0, 1191.0, 720.0, 437.0, 287.0, 216.0, 128.0, 103.0, 78.0, 55.0, 28.0, 17.0, 13.0, 9.0, 13.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01421356201171875, -0.01373445987701416, -0.01325535774230957, -0.01277625560760498, -0.01229715347290039, -0.0118180513381958, -0.011338949203491211, -0.010859847068786621, -0.010380744934082031, -0.009901642799377441, -0.009422540664672852, -0.008943438529968262, -0.008464336395263672, -0.007985234260559082, -0.007506132125854492, -0.007027029991149902, -0.0065479278564453125, -0.006068825721740723, -0.005589723587036133, -0.005110621452331543, -0.004631519317626953, -0.004152417182922363, -0.0036733150482177734, -0.0031942129135131836, -0.0027151107788085938, -0.002236008644104004, -0.001756906509399414, -0.0012778043746948242, -0.0007987022399902344, -0.00031960010528564453, 0.0001595020294189453, 0.0006386041641235352, 0.001117706298828125, 0.0015968084335327148, 0.0020759105682373047, 0.0025550127029418945, 0.0030341148376464844, 0.0035132169723510742, 0.003992319107055664, 0.004471421241760254, 0.004950523376464844, 0.005429625511169434, 0.0059087276458740234, 0.006387829780578613, 0.006866931915283203, 0.007346034049987793, 0.007825136184692383, 0.008304238319396973, 0.008783340454101562, 0.009262442588806152, 0.009741544723510742, 0.010220646858215332, 0.010699748992919922, 0.011178851127624512, 0.011657953262329102, 0.012137055397033691, 0.012616157531738281, 0.013095259666442871, 0.013574361801147461, 0.01405346393585205, 0.01453256607055664, 0.01501166820526123, 0.01549077033996582, 0.01596987247467041, 0.016448974609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 18.0, 15.0, 32.0, 39.0, 62.0, 73.0, 153.0, 269.0, 718.0, 1405.0, 618.0, 252.0, 127.0, 99.0, 61.0, 37.0, 26.0, 18.0, 12.0, 8.0, 11.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.016993045806884766, -0.01646900177001953, -0.015944957733154297, -0.015420913696289062, -0.014896869659423828, -0.014372825622558594, -0.01384878158569336, -0.013324737548828125, -0.01280069351196289, -0.012276649475097656, -0.011752605438232422, -0.011228561401367188, -0.010704517364501953, -0.010180473327636719, -0.009656429290771484, -0.00913238525390625, -0.008608341217041016, -0.008084297180175781, -0.007560253143310547, -0.0070362091064453125, -0.006512165069580078, -0.005988121032714844, -0.005464076995849609, -0.004940032958984375, -0.004415988922119141, -0.0038919448852539062, -0.003367900848388672, -0.0028438568115234375, -0.002319812774658203, -0.0017957687377929688, -0.0012717247009277344, -0.0007476806640625, -0.00022363662719726562, 0.00030040740966796875, 0.0008244514465332031, 0.0013484954833984375, 0.0018725395202636719, 0.0023965835571289062, 0.0029206275939941406, 0.003444671630859375, 0.003968715667724609, 0.004492759704589844, 0.005016803741455078, 0.0055408477783203125, 0.006064891815185547, 0.006588935852050781, 0.007112979888916016, 0.00763702392578125, 0.008161067962646484, 0.008685111999511719, 0.009209156036376953, 0.009733200073242188, 0.010257244110107422, 0.010781288146972656, 0.01130533218383789, 0.011829376220703125, 0.01235342025756836, 0.012877464294433594, 0.013401508331298828, 0.013925552368164062, 0.014449596405029297, 0.014973640441894531, 0.015497684478759766, 0.016021728515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 17.0, 27.0, 52.0, 96.0, 138.0, 153.0, 169.0, 149.0, 93.0, 51.0, 23.0, 12.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0438237302005291, -0.04082870110869408, -0.037833672016859055, -0.03483864292502403, -0.03184361383318901, -0.02884858474135399, -0.025853553786873817, -0.022858524695038795, -0.019863495603203773, -0.01686846651136875, -0.01387343741953373, -0.010878407396376133, -0.007883378304541111, -0.004888349212706089, -0.0018933191895484924, 0.0011017099022865295, 0.0040967389941215515, 0.0070917680859565735, 0.010086797177791595, 0.013081827200949192, 0.01607685536146164, 0.01907188445329666, 0.022066915407776833, 0.025061944499611855, 0.028056973591446877, 0.0310520026832819, 0.03404703363776207, 0.03704206272959709, 0.040037091821432114, 0.043032120913267136, 0.04602715000510216, 0.04902217909693718, 0.0520172044634819, 0.055012233555316925, 0.05800726264715195, 0.06100229173898697, 0.06399732083082199, 0.06699234992265701, 0.06998737901449203, 0.07298240810632706, 0.07597743719816208, 0.0789724662899971, 0.08196749538183212, 0.08496252447366714, 0.08795755356550217, 0.09095258265733719, 0.09394761174917221, 0.09694264084100723, 0.09993767738342285, 0.10293270647525787, 0.1059277355670929, 0.10892276465892792, 0.11191779375076294, 0.11491282284259796, 0.11790785193443298, 0.120902881026268, 0.12389791011810303, 0.12689293920993805, 0.12988796830177307, 0.1328829973936081, 0.13587802648544312, 0.13887305557727814, 0.14186808466911316, 0.14486311376094818, 0.1478581428527832]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 6.0, 6.0, 15.0, 15.0, 20.0, 24.0, 27.0, 31.0, 33.0, 35.0, 26.0, 38.0, 41.0, 44.0, 40.0, 41.0, 32.0, 45.0, 48.0, 38.0, 45.0, 42.0, 39.0, 27.0, 27.0, 28.0, 26.0, 24.0, 16.0, 21.0, 12.0, 18.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03086036443710327, -0.02982611395418644, -0.028791863471269608, -0.027757612988352776, -0.026723362505435944, -0.02568911202251911, -0.02465486153960228, -0.023620611056685448, -0.022586360573768616, -0.021552110090851784, -0.020517859607934952, -0.01948360912501812, -0.018449358642101288, -0.017415108159184456, -0.016380857676267624, -0.015346607193350792, -0.01431235671043396, -0.013278106227517128, -0.012243855744600296, -0.011209605261683464, -0.010175354778766632, -0.0091411042958498, -0.008106853812932968, -0.007072603330016136, -0.006038352847099304, -0.005004102364182472, -0.00396985188126564, -0.0029356013983488083, -0.0019013509154319763, -0.0008671004325151443, 0.00016715005040168762, 0.0012014005333185196, 0.0022356510162353516, 0.0032699014991521835, 0.0043041519820690155, 0.0053384024649858475, 0.0063726529479026794, 0.007406903430819511, 0.008441153913736343, 0.009475404396653175, 0.010509654879570007, 0.01154390536248684, 0.012578155845403671, 0.013612406328320503, 0.014646656811237335, 0.015680907294154167, 0.016715157777071, 0.01774940825998783, 0.018783658742904663, 0.019817909225821495, 0.020852159708738327, 0.02188641019165516, 0.02292066067457199, 0.023954911157488823, 0.024989161640405655, 0.026023412123322487, 0.02705766260623932, 0.02809191308915615, 0.029126163572072983, 0.030160414054989815, 0.031194664537906647, 0.03222891688346863, 0.03326316550374031, 0.03429741412401199, 0.035331666469573975]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 5.0, 18.0, 19.0, 31.0, 39.0, 59.0, 71.0, 106.0, 185.0, 281.0, 429.0, 760.0, 1734.0, 5929.0, 47588.0, 715044.0, 254229.0, 15998.0, 3177.0, 1176.0, 627.0, 382.0, 190.0, 146.0, 98.0, 67.0, 43.0, 33.0, 18.0, 14.0, 18.0, 12.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055511474609375, -0.05376434326171875, -0.0520172119140625, -0.05027008056640625, -0.04852294921875, -0.04677581787109375, -0.0450286865234375, -0.04328155517578125, -0.041534423828125, -0.03978729248046875, -0.0380401611328125, -0.03629302978515625, -0.0345458984375, -0.03279876708984375, -0.0310516357421875, -0.02930450439453125, -0.027557373046875, -0.02581024169921875, -0.0240631103515625, -0.02231597900390625, -0.02056884765625, -0.01882171630859375, -0.0170745849609375, -0.01532745361328125, -0.013580322265625, -0.01183319091796875, -0.0100860595703125, -0.00833892822265625, -0.006591796875, -0.00484466552734375, -0.0030975341796875, -0.00135040283203125, 0.000396728515625, 0.00214385986328125, 0.0038909912109375, 0.00563812255859375, 0.00738525390625, 0.00913238525390625, 0.0108795166015625, 0.01262664794921875, 0.014373779296875, 0.01612091064453125, 0.0178680419921875, 0.01961517333984375, 0.0213623046875, 0.02310943603515625, 0.0248565673828125, 0.02660369873046875, 0.028350830078125, 0.03009796142578125, 0.0318450927734375, 0.03359222412109375, 0.03533935546875, 0.03708648681640625, 0.0388336181640625, 0.04058074951171875, 0.042327880859375, 0.04407501220703125, 0.0458221435546875, 0.04756927490234375, 0.04931640625, 0.05106353759765625, 0.0528106689453125, 0.05455780029296875, 0.056304931640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 12.0, 30.0, 84.0, 158.0, 243.0, 227.0, 154.0, 57.0, 27.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.04031658172607422, -0.03925132751464844, -0.038186073303222656, -0.037120819091796875, -0.036055564880371094, -0.03499031066894531, -0.03392505645751953, -0.03285980224609375, -0.03179454803466797, -0.030729293823242188, -0.029664039611816406, -0.028598785400390625, -0.027533531188964844, -0.026468276977539062, -0.02540302276611328, -0.0243377685546875, -0.02327251434326172, -0.022207260131835938, -0.021142005920410156, -0.020076751708984375, -0.019011497497558594, -0.017946243286132812, -0.01688098907470703, -0.01581573486328125, -0.014750480651855469, -0.013685226440429688, -0.012619972229003906, -0.011554718017578125, -0.010489463806152344, -0.009424209594726562, -0.008358955383300781, -0.007293701171875, -0.006228446960449219, -0.0051631927490234375, -0.004097938537597656, -0.003032684326171875, -0.0019674301147460938, -0.0009021759033203125, 0.00016307830810546875, 0.00122833251953125, 0.0022935867309570312, 0.0033588409423828125, 0.004424095153808594, 0.005489349365234375, 0.006554603576660156, 0.0076198577880859375, 0.008685111999511719, 0.0097503662109375, 0.010815620422363281, 0.011880874633789062, 0.012946128845214844, 0.014011383056640625, 0.015076637268066406, 0.016141891479492188, 0.01720714569091797, 0.01827239990234375, 0.01933765411376953, 0.020402908325195312, 0.021468162536621094, 0.022533416748046875, 0.023598670959472656, 0.024663925170898438, 0.02572917938232422, 0.02679443359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 7.0, 5.0, 8.0, 4.0, 8.0, 14.0, 17.0, 26.0, 22.0, 57.0, 80.0, 159.0, 288.0, 526.0, 1211.0, 2903.0, 7534.0, 22415.0, 79831.0, 299449.0, 431137.0, 145474.0, 37779.0, 11845.0, 4248.0, 1819.0, 788.0, 358.0, 206.0, 106.0, 73.0, 42.0, 23.0, 17.0, 18.0, 12.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0225372314453125, -0.02181529998779297, -0.021093368530273438, -0.020371437072753906, -0.019649505615234375, -0.018927574157714844, -0.018205642700195312, -0.01748371124267578, -0.01676177978515625, -0.01603984832763672, -0.015317916870117188, -0.014595985412597656, -0.013874053955078125, -0.013152122497558594, -0.012430191040039062, -0.011708259582519531, -0.010986328125, -0.010264396667480469, -0.009542465209960938, -0.008820533752441406, -0.008098602294921875, -0.007376670837402344, -0.0066547393798828125, -0.005932807922363281, -0.00521087646484375, -0.004488945007324219, -0.0037670135498046875, -0.0030450820922851562, -0.002323150634765625, -0.0016012191772460938, -0.0008792877197265625, -0.00015735626220703125, 0.0005645751953125, 0.0012865066528320312, 0.0020084381103515625, 0.0027303695678710938, 0.003452301025390625, 0.004174232482910156, 0.0048961639404296875, 0.005618095397949219, 0.00634002685546875, 0.007061958312988281, 0.0077838897705078125, 0.008505821228027344, 0.009227752685546875, 0.009949684143066406, 0.010671615600585938, 0.011393547058105469, 0.012115478515625, 0.012837409973144531, 0.013559341430664062, 0.014281272888183594, 0.015003204345703125, 0.015725135803222656, 0.016447067260742188, 0.01716899871826172, 0.01789093017578125, 0.01861286163330078, 0.019334793090820312, 0.020056724548339844, 0.020778656005859375, 0.021500587463378906, 0.022222518920898438, 0.02294445037841797, 0.0236663818359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 10.0, 11.0, 13.0, 16.0, 15.0, 17.0, 20.0, 21.0, 37.0, 36.0, 51.0, 48.0, 51.0, 49.0, 50.0, 56.0, 61.0, 43.0, 49.0, 45.0, 37.0, 31.0, 35.0, 33.0, 23.0, 16.0, 14.0, 14.0, 17.0, 11.0, 9.0, 13.0, 7.0, 7.0, 2.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02447509765625, -0.02374863624572754, -0.023022174835205078, -0.022295713424682617, -0.021569252014160156, -0.020842790603637695, -0.020116329193115234, -0.019389867782592773, -0.018663406372070312, -0.01793694496154785, -0.01721048355102539, -0.01648402214050293, -0.01575756072998047, -0.015031099319458008, -0.014304637908935547, -0.013578176498413086, -0.012851715087890625, -0.012125253677368164, -0.011398792266845703, -0.010672330856323242, -0.009945869445800781, -0.00921940803527832, -0.00849294662475586, -0.0077664852142333984, -0.0070400238037109375, -0.0063135623931884766, -0.005587100982666016, -0.004860639572143555, -0.004134178161621094, -0.003407716751098633, -0.002681255340576172, -0.001954793930053711, -0.00122833251953125, -0.0005018711090087891, 0.00022459030151367188, 0.0009510517120361328, 0.0016775131225585938, 0.0024039745330810547, 0.0031304359436035156, 0.0038568973541259766, 0.0045833587646484375, 0.0053098201751708984, 0.006036281585693359, 0.00676274299621582, 0.007489204406738281, 0.008215665817260742, 0.008942127227783203, 0.009668588638305664, 0.010395050048828125, 0.011121511459350586, 0.011847972869873047, 0.012574434280395508, 0.013300895690917969, 0.01402735710144043, 0.01475381851196289, 0.015480279922485352, 0.016206741333007812, 0.016933202743530273, 0.017659664154052734, 0.018386125564575195, 0.019112586975097656, 0.019839048385620117, 0.020565509796142578, 0.02129197120666504, 0.0220184326171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 7.0, 1.0, 5.0, 13.0, 3.0, 18.0, 40.0, 65.0, 109.0, 210.0, 446.0, 1008.0, 2239.0, 5477.0, 14826.0, 54587.0, 388011.0, 485995.0, 67482.0, 17505.0, 5982.0, 2486.0, 1022.0, 478.0, 252.0, 127.0, 70.0, 31.0, 26.0, 16.0, 7.0, 7.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0196533203125, -0.019137024879455566, -0.018620729446411133, -0.0181044340133667, -0.017588138580322266, -0.017071843147277832, -0.0165555477142334, -0.016039252281188965, -0.015522956848144531, -0.015006661415100098, -0.014490365982055664, -0.01397407054901123, -0.013457775115966797, -0.012941479682922363, -0.01242518424987793, -0.011908888816833496, -0.011392593383789062, -0.010876297950744629, -0.010360002517700195, -0.009843707084655762, -0.009327411651611328, -0.008811116218566895, -0.008294820785522461, -0.007778525352478027, -0.007262229919433594, -0.00674593448638916, -0.0062296390533447266, -0.005713343620300293, -0.005197048187255859, -0.004680752754211426, -0.004164457321166992, -0.0036481618881225586, -0.003131866455078125, -0.0026155710220336914, -0.002099275588989258, -0.0015829801559448242, -0.0010666847229003906, -0.000550389289855957, -3.409385681152344e-05, 0.00048220157623291016, 0.0009984970092773438, 0.0015147924423217773, 0.002031087875366211, 0.0025473833084106445, 0.003063678741455078, 0.0035799741744995117, 0.004096269607543945, 0.004612565040588379, 0.0051288604736328125, 0.005645155906677246, 0.00616145133972168, 0.006677746772766113, 0.007194042205810547, 0.0077103376388549805, 0.008226633071899414, 0.008742928504943848, 0.009259223937988281, 0.009775519371032715, 0.010291814804077148, 0.010808110237121582, 0.011324405670166016, 0.01184070110321045, 0.012356996536254883, 0.012873291969299316, 0.01338958740234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 10.0, 4.0, 7.0, 12.0, 19.0, 18.0, 24.0, 35.0, 43.0, 71.0, 90.0, 94.0, 90.0, 99.0, 93.0, 83.0, 48.0, 41.0, 27.0, 22.0, 19.0, 13.0, 3.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.16908073425293e-05, -5.980487912893295e-05, -5.791895091533661e-05, -5.6033022701740265e-05, -5.414709448814392e-05, -5.226116627454758e-05, -5.037523806095123e-05, -4.848930984735489e-05, -4.6603381633758545e-05, -4.47174534201622e-05, -4.283152520656586e-05, -4.094559699296951e-05, -3.905966877937317e-05, -3.7173740565776825e-05, -3.528781235218048e-05, -3.340188413858414e-05, -3.151595592498779e-05, -2.963002771139145e-05, -2.7744099497795105e-05, -2.585817128419876e-05, -2.3972243070602417e-05, -2.2086314857006073e-05, -2.020038664340973e-05, -1.8314458429813385e-05, -1.642853021621704e-05, -1.4542602002620697e-05, -1.2656673789024353e-05, -1.0770745575428009e-05, -8.884817361831665e-06, -6.998889148235321e-06, -5.112960934638977e-06, -3.227032721042633e-06, -1.341104507446289e-06, 5.448237061500549e-07, 2.430751919746399e-06, 4.316680133342743e-06, 6.202608346939087e-06, 8.088536560535431e-06, 9.974464774131775e-06, 1.1860392987728119e-05, 1.3746321201324463e-05, 1.5632249414920807e-05, 1.751817762851715e-05, 1.9404105842113495e-05, 2.129003405570984e-05, 2.3175962269306183e-05, 2.5061890482902527e-05, 2.694781869649887e-05, 2.8833746910095215e-05, 3.071967512369156e-05, 3.26056033372879e-05, 3.449153155088425e-05, 3.637745976448059e-05, 3.8263387978076935e-05, 4.014931619167328e-05, 4.203524440526962e-05, 4.392117261886597e-05, 4.580710083246231e-05, 4.7693029046058655e-05, 4.9578957259655e-05, 5.146488547325134e-05, 5.335081368684769e-05, 5.523674190044403e-05, 5.7122670114040375e-05, 5.900859832763672e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 4.0, 11.0, 11.0, 28.0, 36.0, 43.0, 80.0, 144.0, 239.0, 365.0, 617.0, 1132.0, 2203.0, 4223.0, 9211.0, 22877.0, 66167.0, 247910.0, 468334.0, 150584.0, 44071.0, 16012.0, 6981.0, 3331.0, 1740.0, 934.0, 516.0, 282.0, 154.0, 109.0, 60.0, 47.0, 24.0, 18.0, 11.0, 11.0, 6.0, 2.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01018524169921875, -0.009825587272644043, -0.009465932846069336, -0.009106278419494629, -0.008746623992919922, -0.008386969566345215, -0.008027315139770508, -0.007667660713195801, -0.007308006286621094, -0.006948351860046387, -0.00658869743347168, -0.006229043006896973, -0.005869388580322266, -0.005509734153747559, -0.0051500797271728516, -0.0047904253005981445, -0.0044307708740234375, -0.0040711164474487305, -0.0037114620208740234, -0.0033518075942993164, -0.0029921531677246094, -0.0026324987411499023, -0.0022728443145751953, -0.0019131898880004883, -0.0015535354614257812, -0.0011938810348510742, -0.0008342266082763672, -0.00047457218170166016, -0.00011491775512695312, 0.0002447366714477539, 0.0006043910980224609, 0.000964045524597168, 0.001323699951171875, 0.001683354377746582, 0.002043008804321289, 0.002402663230895996, 0.002762317657470703, 0.00312197208404541, 0.003481626510620117, 0.0038412809371948242, 0.004200935363769531, 0.004560589790344238, 0.004920244216918945, 0.005279898643493652, 0.005639553070068359, 0.005999207496643066, 0.0063588619232177734, 0.0067185163497924805, 0.0070781707763671875, 0.0074378252029418945, 0.0077974796295166016, 0.008157134056091309, 0.008516788482666016, 0.008876442909240723, 0.00923609733581543, 0.009595751762390137, 0.009955406188964844, 0.01031506061553955, 0.010674715042114258, 0.011034369468688965, 0.011394023895263672, 0.011753678321838379, 0.012113332748413086, 0.012472987174987793, 0.0128326416015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 7.0, 1.0, 5.0, 10.0, 7.0, 6.0, 13.0, 11.0, 8.0, 21.0, 26.0, 29.0, 50.0, 72.0, 100.0, 109.0, 112.0, 100.0, 88.0, 54.0, 32.0, 24.0, 19.0, 17.0, 18.0, 6.0, 5.0, 11.0, 10.0, 5.0, 5.0, 8.0, 1.0, 5.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0130767822265625, -0.012671709060668945, -0.01226663589477539, -0.011861562728881836, -0.011456489562988281, -0.011051416397094727, -0.010646343231201172, -0.010241270065307617, -0.009836196899414062, -0.009431123733520508, -0.009026050567626953, -0.008620977401733398, -0.008215904235839844, -0.007810831069946289, -0.007405757904052734, -0.00700068473815918, -0.006595611572265625, -0.00619053840637207, -0.005785465240478516, -0.005380392074584961, -0.004975318908691406, -0.0045702457427978516, -0.004165172576904297, -0.003760099411010742, -0.0033550262451171875, -0.002949953079223633, -0.002544879913330078, -0.0021398067474365234, -0.0017347335815429688, -0.001329660415649414, -0.0009245872497558594, -0.0005195140838623047, -0.00011444091796875, 0.0002906322479248047, 0.0006957054138183594, 0.001100778579711914, 0.0015058517456054688, 0.0019109249114990234, 0.002315998077392578, 0.002721071243286133, 0.0031261444091796875, 0.003531217575073242, 0.003936290740966797, 0.0043413639068603516, 0.004746437072753906, 0.005151510238647461, 0.005556583404541016, 0.00596165657043457, 0.006366729736328125, 0.00677180290222168, 0.007176876068115234, 0.007581949234008789, 0.007987022399902344, 0.008392095565795898, 0.008797168731689453, 0.009202241897583008, 0.009607315063476562, 0.010012388229370117, 0.010417461395263672, 0.010822534561157227, 0.011227607727050781, 0.011632680892944336, 0.01203775405883789, 0.012442827224731445, 0.012847900390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 16.0, 25.0, 38.0, 94.0, 159.0, 220.0, 199.0, 127.0, 71.0, 23.0, 12.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15328632295131683, -0.14713303744792938, -0.14097975194454193, -0.13482646644115448, -0.12867318093776703, -0.12251989543437958, -0.11636660993099213, -0.11021332442760468, -0.10406003892421722, -0.09790675342082977, -0.09175346791744232, -0.08560018241405487, -0.07944689691066742, -0.07329361140727997, -0.06714032590389252, -0.060987040400505066, -0.054833754897117615, -0.048680469393730164, -0.04252718389034271, -0.03637389838695526, -0.03022061288356781, -0.02406732738018036, -0.017914041876792908, -0.011760756373405457, -0.005607470870018005, 0.0005458146333694458, 0.006699100136756897, 0.012852385640144348, 0.0190056711435318, 0.02515895664691925, 0.0313122421503067, 0.03746552765369415, 0.0436188280582428, 0.04977211356163025, 0.0559253990650177, 0.06207868456840515, 0.0682319700717926, 0.07438525557518005, 0.0805385410785675, 0.08669182658195496, 0.09284511208534241, 0.09899839758872986, 0.10515168309211731, 0.11130496859550476, 0.11745825409889221, 0.12361153960227966, 0.12976482510566711, 0.13591811060905457, 0.14207139611244202, 0.14822468161582947, 0.15437796711921692, 0.16053125262260437, 0.16668453812599182, 0.17283782362937927, 0.17899110913276672, 0.18514439463615417, 0.19129768013954163, 0.19745096564292908, 0.20360425114631653, 0.20975753664970398, 0.21591082215309143, 0.22206410765647888, 0.22821739315986633, 0.23437067866325378, 0.24052396416664124]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 8.0, 7.0, 7.0, 10.0, 19.0, 15.0, 17.0, 11.0, 24.0, 19.0, 26.0, 26.0, 30.0, 30.0, 35.0, 33.0, 30.0, 35.0, 39.0, 37.0, 41.0, 35.0, 49.0, 38.0, 37.0, 34.0, 22.0, 30.0, 30.0, 25.0, 24.0, 25.0, 20.0, 25.0, 15.0, 12.0, 11.0, 11.0, 6.0, 7.0, 8.0, 4.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05563068389892578, -0.053804561495780945, -0.05197844281792641, -0.05015232414007187, -0.04832620173692703, -0.046500079333782196, -0.04467396065592766, -0.04284784197807312, -0.041021719574928284, -0.03919559717178345, -0.03736947849392891, -0.03554335981607437, -0.033717237412929535, -0.0318911150097847, -0.03006499633193016, -0.028238875791430473, -0.026412755250930786, -0.0245866347104311, -0.022760514169931412, -0.020934393629431725, -0.019108273088932037, -0.01728215254843235, -0.015456032007932663, -0.013629911467432976, -0.011803790926933289, -0.009977670386433601, -0.008151549845933914, -0.006325429305434227, -0.00449930876493454, -0.0026731882244348526, -0.0008470676839351654, 0.0009790528565645218, 0.002805173397064209, 0.004631293937563896, 0.006457414478063583, 0.00828353501856327, 0.010109655559062958, 0.011935776099562645, 0.013761896640062332, 0.01558801718056202, 0.017414137721061707, 0.019240258261561394, 0.02106637880206108, 0.022892499342560768, 0.024718619883060455, 0.026544740423560143, 0.02837086096405983, 0.030196981504559517, 0.032023102045059204, 0.03384922444820404, 0.03567534312605858, 0.037501461803913116, 0.03932758420705795, 0.04115370661020279, 0.04297982528805733, 0.044805943965911865, 0.0466320663690567, 0.04845818877220154, 0.050284307450056076, 0.052110426127910614, 0.05393654853105545, 0.05576267093420029, 0.057588789612054825, 0.05941490828990936, 0.0612410306930542]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 15.0, 23.0, 41.0, 116.0, 308.0, 929.0, 5564.0, 3851131.0, 331018.0, 4074.0, 700.0, 208.0, 91.0, 20.0, 14.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11968994140625, -0.11625862121582031, -0.11282730102539062, -0.10939598083496094, -0.10596466064453125, -0.10253334045410156, -0.09910202026367188, -0.09567070007324219, -0.0922393798828125, -0.08880805969238281, -0.08537673950195312, -0.08194541931152344, -0.07851409912109375, -0.07508277893066406, -0.07165145874023438, -0.06822013854980469, -0.064788818359375, -0.06135749816894531, -0.057926177978515625, -0.05449485778808594, -0.05106353759765625, -0.04763221740722656, -0.044200897216796875, -0.04076957702636719, -0.0373382568359375, -0.03390693664550781, -0.030475616455078125, -0.027044296264648438, -0.02361297607421875, -0.020181655883789062, -0.016750335693359375, -0.013319015502929688, -0.0098876953125, -0.0064563751220703125, -0.003025054931640625, 0.0004062652587890625, 0.00383758544921875, 0.0072689056396484375, 0.010700225830078125, 0.014131546020507812, 0.0175628662109375, 0.020994186401367188, 0.024425506591796875, 0.027856826782226562, 0.03128814697265625, 0.03471946716308594, 0.038150787353515625, 0.04158210754394531, 0.045013427734375, 0.04844474792480469, 0.051876068115234375, 0.05530738830566406, 0.05873870849609375, 0.06217002868652344, 0.06560134887695312, 0.06903266906738281, 0.0724639892578125, 0.07589530944824219, 0.07932662963867188, 0.08275794982910156, 0.08618927001953125, 0.08962059020996094, 0.09305191040039062, 0.09648323059082031, 0.09991455078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 14.0, 55.0, 115.0, 199.0, 224.0, 184.0, 122.0, 57.0, 22.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040618896484375, -0.03956246376037598, -0.03850603103637695, -0.03744959831237793, -0.036393165588378906, -0.03533673286437988, -0.03428030014038086, -0.033223867416381836, -0.03216743469238281, -0.03111100196838379, -0.030054569244384766, -0.028998136520385742, -0.02794170379638672, -0.026885271072387695, -0.025828838348388672, -0.02477240562438965, -0.023715972900390625, -0.0226595401763916, -0.021603107452392578, -0.020546674728393555, -0.01949024200439453, -0.018433809280395508, -0.017377376556396484, -0.01632094383239746, -0.015264511108398438, -0.014208078384399414, -0.01315164566040039, -0.012095212936401367, -0.011038780212402344, -0.00998234748840332, -0.008925914764404297, -0.007869482040405273, -0.00681304931640625, -0.0057566165924072266, -0.004700183868408203, -0.0036437511444091797, -0.0025873184204101562, -0.0015308856964111328, -0.0004744529724121094, 0.0005819797515869141, 0.0016384124755859375, 0.002694845199584961, 0.0037512779235839844, 0.004807710647583008, 0.005864143371582031, 0.006920576095581055, 0.007977008819580078, 0.009033441543579102, 0.010089874267578125, 0.011146306991577148, 0.012202739715576172, 0.013259172439575195, 0.014315605163574219, 0.015372037887573242, 0.016428470611572266, 0.01748490333557129, 0.018541336059570312, 0.019597768783569336, 0.02065420150756836, 0.021710634231567383, 0.022767066955566406, 0.02382349967956543, 0.024879932403564453, 0.025936365127563477, 0.0269927978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 9.0, 16.0, 14.0, 21.0, 27.0, 33.0, 69.0, 93.0, 107.0, 183.0, 276.0, 438.0, 743.0, 1334.0, 2338.0, 4589.0, 9775.0, 23605.0, 68455.0, 268071.0, 2531398.0, 1050329.0, 154512.0, 45789.0, 16666.0, 7168.0, 3536.0, 1895.0, 1022.0, 663.0, 379.0, 243.0, 139.0, 114.0, 65.0, 44.0, 31.0, 29.0, 15.0, 7.0, 10.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01361083984375, -0.013154387474060059, -0.012697935104370117, -0.012241482734680176, -0.011785030364990234, -0.011328577995300293, -0.010872125625610352, -0.01041567325592041, -0.009959220886230469, -0.009502768516540527, -0.009046316146850586, -0.008589863777160645, -0.008133411407470703, -0.007676959037780762, -0.00722050666809082, -0.006764054298400879, -0.0063076019287109375, -0.005851149559020996, -0.005394697189331055, -0.004938244819641113, -0.004481792449951172, -0.0040253400802612305, -0.003568887710571289, -0.0031124353408813477, -0.0026559829711914062, -0.002199530601501465, -0.0017430782318115234, -0.001286625862121582, -0.0008301734924316406, -0.0003737211227416992, 8.273124694824219e-05, 0.0005391836166381836, 0.000995635986328125, 0.0014520883560180664, 0.0019085407257080078, 0.0023649930953979492, 0.0028214454650878906, 0.003277897834777832, 0.0037343502044677734, 0.004190802574157715, 0.004647254943847656, 0.005103707313537598, 0.005560159683227539, 0.0060166120529174805, 0.006473064422607422, 0.006929516792297363, 0.007385969161987305, 0.007842421531677246, 0.008298873901367188, 0.008755326271057129, 0.00921177864074707, 0.009668231010437012, 0.010124683380126953, 0.010581135749816895, 0.011037588119506836, 0.011494040489196777, 0.011950492858886719, 0.01240694522857666, 0.012863397598266602, 0.013319849967956543, 0.013776302337646484, 0.014232754707336426, 0.014689207077026367, 0.015145659446716309, 0.01560211181640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 4.0, 9.0, 11.0, 21.0, 29.0, 44.0, 78.0, 91.0, 145.0, 266.0, 545.0, 1114.0, 828.0, 371.0, 186.0, 118.0, 53.0, 46.0, 42.0, 25.0, 16.0, 7.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0229339599609375, -0.02234208583831787, -0.021750211715698242, -0.021158337593078613, -0.020566463470458984, -0.019974589347839355, -0.019382715225219727, -0.018790841102600098, -0.01819896697998047, -0.01760709285736084, -0.01701521873474121, -0.016423344612121582, -0.015831470489501953, -0.015239596366882324, -0.014647722244262695, -0.014055848121643066, -0.013463973999023438, -0.012872099876403809, -0.01228022575378418, -0.01168835163116455, -0.011096477508544922, -0.010504603385925293, -0.009912729263305664, -0.009320855140686035, -0.008728981018066406, -0.008137106895446777, -0.0075452327728271484, -0.0069533586502075195, -0.006361484527587891, -0.005769610404968262, -0.005177736282348633, -0.004585862159729004, -0.003993988037109375, -0.003402113914489746, -0.002810239791870117, -0.0022183656692504883, -0.0016264915466308594, -0.0010346174240112305, -0.00044274330139160156, 0.00014913082122802734, 0.0007410049438476562, 0.0013328790664672852, 0.001924753189086914, 0.002516627311706543, 0.003108501434326172, 0.0037003755569458008, 0.00429224967956543, 0.004884123802185059, 0.0054759979248046875, 0.006067872047424316, 0.006659746170043945, 0.007251620292663574, 0.007843494415283203, 0.008435368537902832, 0.009027242660522461, 0.00961911678314209, 0.010210990905761719, 0.010802865028381348, 0.011394739151000977, 0.011986613273620605, 0.012578487396240234, 0.013170361518859863, 0.013762235641479492, 0.014354109764099121, 0.01494598388671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 22.0, 32.0, 87.0, 171.0, 199.0, 229.0, 123.0, 72.0, 29.0, 24.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12743130326271057, -0.1228400319814682, -0.11824875324964523, -0.11365748196840286, -0.1090662032365799, -0.10447493195533752, -0.09988366067409515, -0.09529238939285278, -0.09070111066102982, -0.08610983937978745, -0.08151856064796448, -0.0769272893667221, -0.07233601808547974, -0.06774473935365677, -0.0631534680724144, -0.05856219306588173, -0.05397091805934906, -0.04937964305281639, -0.04478836804628372, -0.04019709676504135, -0.03560582175850868, -0.031014546751976013, -0.026423273608088493, -0.021832000464200974, -0.017240725457668304, -0.01264945138245821, -0.008058177307248116, -0.003466903232038021, 0.0011243708431720734, 0.005715645849704742, 0.010306918993592262, 0.014898192137479782, 0.01948946714401245, 0.02408074215054512, 0.02867201529443264, 0.03326328843832016, 0.03785456344485283, 0.0424458384513855, 0.04703710973262787, 0.05162838473916054, 0.05621965974569321, 0.060810934752225876, 0.06540220975875854, 0.06999348104000092, 0.07458475232124329, 0.07917603105306625, 0.08376730233430862, 0.08835858106613159, 0.09294985234737396, 0.09754112362861633, 0.1021324023604393, 0.10672367364168167, 0.11131495237350464, 0.11590622365474701, 0.12049749493598938, 0.12508876621723175, 0.12968003749847412, 0.1342713087797165, 0.13886258006095886, 0.14345386624336243, 0.1480451375246048, 0.15263640880584717, 0.15722768008708954, 0.1618189513683319, 0.16641023755073547]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 14.0, 15.0, 23.0, 18.0, 20.0, 27.0, 31.0, 30.0, 36.0, 38.0, 56.0, 38.0, 50.0, 40.0, 36.0, 47.0, 44.0, 39.0, 41.0, 43.0, 28.0, 34.0, 30.0, 27.0, 29.0, 28.0, 18.0, 18.0, 14.0, 11.0, 7.0, 11.0, 11.0, 3.0, 7.0, 5.0, 9.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.04679727554321289, -0.0455031618475914, -0.04420904815196991, -0.04291493445634842, -0.04162082076072693, -0.04032670706510544, -0.03903259336948395, -0.03773847967386246, -0.03644436597824097, -0.035150252282619476, -0.033856138586997986, -0.032562024891376495, -0.031267911195755005, -0.029973797500133514, -0.028679683804512024, -0.027385570108890533, -0.026091456413269043, -0.024797342717647552, -0.023503229022026062, -0.02220911532640457, -0.02091500163078308, -0.01962088793516159, -0.0183267742395401, -0.01703266054391861, -0.01573854684829712, -0.014444433152675629, -0.013150319457054138, -0.011856205761432648, -0.010562092065811157, -0.009267978370189667, -0.007973864674568176, -0.006679750978946686, -0.005385637283325195, -0.004091523587703705, -0.0027974098920822144, -0.0015032961964607239, -0.0002091825008392334, 0.001084931194782257, 0.0023790448904037476, 0.003673158586025238, 0.0049672722816467285, 0.006261385977268219, 0.0075554996728897095, 0.0088496133685112, 0.01014372706413269, 0.011437840759754181, 0.012731954455375671, 0.014026068150997162, 0.015320181846618652, 0.016614295542240143, 0.017908409237861633, 0.019202522933483124, 0.020496636629104614, 0.021790750324726105, 0.023084864020347595, 0.024378977715969086, 0.025673091411590576, 0.026967205107212067, 0.028261318802833557, 0.029555432498455048, 0.030849546194076538, 0.03214365988969803, 0.03343777358531952, 0.03473188728094101, 0.0360260009765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 1.0, 3.0, 6.0, 11.0, 5.0, 12.0, 12.0, 21.0, 30.0, 30.0, 65.0, 71.0, 88.0, 110.0, 181.0, 251.0, 373.0, 650.0, 1159.0, 2915.0, 11205.0, 65192.0, 617961.0, 304808.0, 32353.0, 6695.0, 1976.0, 824.0, 475.0, 306.0, 209.0, 119.0, 111.0, 82.0, 68.0, 45.0, 27.0, 27.0, 21.0, 11.0, 12.0, 10.0, 6.0, 2.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056060791015625, -0.05424165725708008, -0.052422523498535156, -0.050603389739990234, -0.04878425598144531, -0.04696512222290039, -0.04514598846435547, -0.04332685470581055, -0.041507720947265625, -0.0396885871887207, -0.03786945343017578, -0.03605031967163086, -0.03423118591308594, -0.032412052154541016, -0.030592918395996094, -0.028773784637451172, -0.02695465087890625, -0.025135517120361328, -0.023316383361816406, -0.021497249603271484, -0.019678115844726562, -0.01785898208618164, -0.01603984832763672, -0.014220714569091797, -0.012401580810546875, -0.010582447052001953, -0.008763313293457031, -0.006944179534912109, -0.0051250457763671875, -0.0033059120178222656, -0.0014867782592773438, 0.0003323554992675781, 0.0021514892578125, 0.003970623016357422, 0.005789756774902344, 0.007608890533447266, 0.009428024291992188, 0.01124715805053711, 0.013066291809082031, 0.014885425567626953, 0.016704559326171875, 0.018523693084716797, 0.02034282684326172, 0.02216196060180664, 0.023981094360351562, 0.025800228118896484, 0.027619361877441406, 0.029438495635986328, 0.03125762939453125, 0.03307676315307617, 0.034895896911621094, 0.036715030670166016, 0.03853416442871094, 0.04035329818725586, 0.04217243194580078, 0.0439915657043457, 0.045810699462890625, 0.04762983322143555, 0.04944896697998047, 0.05126810073852539, 0.05308723449707031, 0.054906368255615234, 0.056725502014160156, 0.05854463577270508, 0.06036376953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 28.0, 70.0, 162.0, 205.0, 227.0, 160.0, 86.0, 39.0, 11.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042572021484375, -0.04150867462158203, -0.04044532775878906, -0.039381980895996094, -0.038318634033203125, -0.037255287170410156, -0.03619194030761719, -0.03512859344482422, -0.03406524658203125, -0.03300189971923828, -0.03193855285644531, -0.030875205993652344, -0.029811859130859375, -0.028748512268066406, -0.027685165405273438, -0.02662181854248047, -0.0255584716796875, -0.02449512481689453, -0.023431777954101562, -0.022368431091308594, -0.021305084228515625, -0.020241737365722656, -0.019178390502929688, -0.01811504364013672, -0.01705169677734375, -0.01598834991455078, -0.014925003051757812, -0.013861656188964844, -0.012798309326171875, -0.011734962463378906, -0.010671615600585938, -0.009608268737792969, -0.008544921875, -0.007481575012207031, -0.0064182281494140625, -0.005354881286621094, -0.004291534423828125, -0.0032281875610351562, -0.0021648406982421875, -0.0011014938354492188, -3.814697265625e-05, 0.0010251998901367188, 0.0020885467529296875, 0.0031518936157226562, 0.004215240478515625, 0.005278587341308594, 0.0063419342041015625, 0.007405281066894531, 0.0084686279296875, 0.009531974792480469, 0.010595321655273438, 0.011658668518066406, 0.012722015380859375, 0.013785362243652344, 0.014848709106445312, 0.01591205596923828, 0.01697540283203125, 0.01803874969482422, 0.019102096557617188, 0.020165443420410156, 0.021228790283203125, 0.022292137145996094, 0.023355484008789062, 0.02441883087158203, 0.025482177734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 10.0, 8.0, 27.0, 26.0, 58.0, 97.0, 245.0, 663.0, 3268.0, 23068.0, 346531.0, 625736.0, 42335.0, 4894.0, 994.0, 296.0, 125.0, 58.0, 40.0, 18.0, 13.0, 14.0, 7.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06717777252197266, -0.06501960754394531, -0.06286144256591797, -0.060703277587890625, -0.05854511260986328, -0.05638694763183594, -0.054228782653808594, -0.05207061767578125, -0.049912452697753906, -0.04775428771972656, -0.04559612274169922, -0.043437957763671875, -0.04127979278564453, -0.03912162780761719, -0.036963462829589844, -0.0348052978515625, -0.032647132873535156, -0.030488967895507812, -0.02833080291748047, -0.026172637939453125, -0.02401447296142578, -0.021856307983398438, -0.019698143005371094, -0.01753997802734375, -0.015381813049316406, -0.013223648071289062, -0.011065483093261719, -0.008907318115234375, -0.006749153137207031, -0.0045909881591796875, -0.0024328231811523438, -0.000274658203125, 0.0018835067749023438, 0.0040416717529296875, 0.006199836730957031, 0.008358001708984375, 0.010516166687011719, 0.012674331665039062, 0.014832496643066406, 0.01699066162109375, 0.019148826599121094, 0.021306991577148438, 0.02346515655517578, 0.025623321533203125, 0.02778148651123047, 0.029939651489257812, 0.032097816467285156, 0.0342559814453125, 0.036414146423339844, 0.03857231140136719, 0.04073047637939453, 0.042888641357421875, 0.04504680633544922, 0.04720497131347656, 0.049363136291503906, 0.05152130126953125, 0.053679466247558594, 0.05583763122558594, 0.05799579620361328, 0.060153961181640625, 0.06231212615966797, 0.06447029113769531, 0.06662845611572266, 0.06878662109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 11.0, 8.0, 8.0, 7.0, 13.0, 14.0, 18.0, 23.0, 18.0, 34.0, 34.0, 39.0, 32.0, 38.0, 41.0, 58.0, 53.0, 53.0, 48.0, 53.0, 48.0, 46.0, 40.0, 46.0, 37.0, 26.0, 26.0, 20.0, 12.0, 14.0, 17.0, 16.0, 7.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02911376953125, -0.028299331665039062, -0.027484893798828125, -0.026670455932617188, -0.02585601806640625, -0.025041580200195312, -0.024227142333984375, -0.023412704467773438, -0.0225982666015625, -0.021783828735351562, -0.020969390869140625, -0.020154953002929688, -0.01934051513671875, -0.018526077270507812, -0.017711639404296875, -0.016897201538085938, -0.016082763671875, -0.015268325805664062, -0.014453887939453125, -0.013639450073242188, -0.01282501220703125, -0.012010574340820312, -0.011196136474609375, -0.010381698608398438, -0.0095672607421875, -0.008752822875976562, -0.007938385009765625, -0.0071239471435546875, -0.00630950927734375, -0.0054950714111328125, -0.004680633544921875, -0.0038661956787109375, -0.0030517578125, -0.0022373199462890625, -0.001422882080078125, -0.0006084442138671875, 0.00020599365234375, 0.0010204315185546875, 0.001834869384765625, 0.0026493072509765625, 0.0034637451171875, 0.0042781829833984375, 0.005092620849609375, 0.0059070587158203125, 0.00672149658203125, 0.0075359344482421875, 0.008350372314453125, 0.009164810180664062, 0.009979248046875, 0.010793685913085938, 0.011608123779296875, 0.012422561645507812, 0.01323699951171875, 0.014051437377929688, 0.014865875244140625, 0.015680313110351562, 0.0164947509765625, 0.017309188842773438, 0.018123626708984375, 0.018938064575195312, 0.01975250244140625, 0.020566940307617188, 0.021381378173828125, 0.022195816040039062, 0.02301025390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 4.0, 11.0, 10.0, 10.0, 31.0, 43.0, 58.0, 83.0, 153.0, 201.0, 334.0, 537.0, 904.0, 1678.0, 2806.0, 5223.0, 9487.0, 18954.0, 41821.0, 103015.0, 264486.0, 338941.0, 148711.0, 58450.0, 25039.0, 12415.0, 6475.0, 3578.0, 2079.0, 1155.0, 707.0, 388.0, 285.0, 165.0, 77.0, 73.0, 49.0, 34.0, 30.0, 16.0, 8.0, 7.0, 6.0, 6.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.0119171142578125, -0.0115966796875, -0.0112762451171875, -0.010955810546875, -0.0106353759765625, -0.01031494140625, -0.0099945068359375, -0.009674072265625, -0.0093536376953125, -0.009033203125, -0.0087127685546875, -0.008392333984375, -0.0080718994140625, -0.00775146484375, -0.0074310302734375, -0.007110595703125, -0.0067901611328125, -0.0064697265625, -0.0061492919921875, -0.005828857421875, -0.0055084228515625, -0.00518798828125, -0.0048675537109375, -0.004547119140625, -0.0042266845703125, -0.00390625, -0.0035858154296875, -0.003265380859375, -0.0029449462890625, -0.00262451171875, -0.0023040771484375, -0.001983642578125, -0.0016632080078125, -0.0013427734375, -0.0010223388671875, -0.000701904296875, -0.0003814697265625, -6.103515625e-05, 0.0002593994140625, 0.000579833984375, 0.0009002685546875, 0.001220703125, 0.0015411376953125, 0.001861572265625, 0.0021820068359375, 0.00250244140625, 0.0028228759765625, 0.003143310546875, 0.0034637451171875, 0.0037841796875, 0.0041046142578125, 0.004425048828125, 0.0047454833984375, 0.00506591796875, 0.0053863525390625, 0.005706787109375, 0.0060272216796875, 0.00634765625, 0.0066680908203125, 0.006988525390625, 0.0073089599609375, 0.00762939453125, 0.0079498291015625, 0.008270263671875, 0.0085906982421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 12.0, 13.0, 19.0, 17.0, 25.0, 22.0, 21.0, 25.0, 38.0, 59.0, 76.0, 95.0, 101.0, 103.0, 72.0, 64.0, 44.0, 35.0, 26.0, 26.0, 10.0, 25.0, 23.0, 18.0, 15.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.941225051879883e-05, -4.7946348786354065e-05, -4.64804470539093e-05, -4.501454532146454e-05, -4.3548643589019775e-05, -4.208274185657501e-05, -4.061684012413025e-05, -3.9150938391685486e-05, -3.768503665924072e-05, -3.621913492679596e-05, -3.4753233194351196e-05, -3.328733146190643e-05, -3.182142972946167e-05, -3.0355527997016907e-05, -2.8889626264572144e-05, -2.742372453212738e-05, -2.5957822799682617e-05, -2.4491921067237854e-05, -2.302601933479309e-05, -2.1560117602348328e-05, -2.0094215869903564e-05, -1.86283141374588e-05, -1.7162412405014038e-05, -1.5696510672569275e-05, -1.4230608940124512e-05, -1.2764707207679749e-05, -1.1298805475234985e-05, -9.832903742790222e-06, -8.367002010345459e-06, -6.901100277900696e-06, -5.435198545455933e-06, -3.9692968130111694e-06, -2.5033950805664062e-06, -1.037493348121643e-06, 4.284083843231201e-07, 1.8943101167678833e-06, 3.3602118492126465e-06, 4.82611358165741e-06, 6.292015314102173e-06, 7.757917046546936e-06, 9.2238187789917e-06, 1.0689720511436462e-05, 1.2155622243881226e-05, 1.3621523976325989e-05, 1.5087425708770752e-05, 1.6553327441215515e-05, 1.801922917366028e-05, 1.948513090610504e-05, 2.0951032638549805e-05, 2.2416934370994568e-05, 2.388283610343933e-05, 2.5348737835884094e-05, 2.6814639568328857e-05, 2.828054130077362e-05, 2.9746443033218384e-05, 3.121234476566315e-05, 3.267824649810791e-05, 3.414414823055267e-05, 3.5610049962997437e-05, 3.70759516954422e-05, 3.854185342788696e-05, 4.0007755160331726e-05, 4.147365689277649e-05, 4.293955862522125e-05, 4.4405460357666016e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 11.0, 13.0, 20.0, 17.0, 30.0, 43.0, 59.0, 97.0, 159.0, 247.0, 378.0, 699.0, 1276.0, 2272.0, 4773.0, 10179.0, 23580.0, 63126.0, 211578.0, 457256.0, 178530.0, 54605.0, 21152.0, 9185.0, 4273.0, 2230.0, 1082.0, 667.0, 373.0, 218.0, 140.0, 95.0, 58.0, 44.0, 34.0, 15.0, 11.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01343536376953125, -0.012978911399841309, -0.012522459030151367, -0.012066006660461426, -0.011609554290771484, -0.011153101921081543, -0.010696649551391602, -0.01024019718170166, -0.009783744812011719, -0.009327292442321777, -0.008870840072631836, -0.008414387702941895, -0.007957935333251953, -0.007501482963562012, -0.00704503059387207, -0.006588578224182129, -0.0061321258544921875, -0.005675673484802246, -0.005219221115112305, -0.004762768745422363, -0.004306316375732422, -0.0038498640060424805, -0.003393411636352539, -0.0029369592666625977, -0.0024805068969726562, -0.002024054527282715, -0.0015676021575927734, -0.001111149787902832, -0.0006546974182128906, -0.00019824504852294922, 0.0002582073211669922, 0.0007146596908569336, 0.001171112060546875, 0.0016275644302368164, 0.002084016799926758, 0.0025404691696166992, 0.0029969215393066406, 0.003453373908996582, 0.0039098262786865234, 0.004366278648376465, 0.004822731018066406, 0.005279183387756348, 0.005735635757446289, 0.0061920881271362305, 0.006648540496826172, 0.007104992866516113, 0.007561445236206055, 0.008017897605895996, 0.008474349975585938, 0.008930802345275879, 0.00938725471496582, 0.009843707084655762, 0.010300159454345703, 0.010756611824035645, 0.011213064193725586, 0.011669516563415527, 0.012125968933105469, 0.01258242130279541, 0.013038873672485352, 0.013495326042175293, 0.013951778411865234, 0.014408230781555176, 0.014864683151245117, 0.015321135520935059, 0.015777587890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 10.0, 7.0, 12.0, 17.0, 19.0, 36.0, 50.0, 81.0, 102.0, 126.0, 137.0, 97.0, 94.0, 59.0, 44.0, 27.0, 20.0, 12.0, 9.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0213165283203125, -0.02069377899169922, -0.020071029663085938, -0.019448280334472656, -0.018825531005859375, -0.018202781677246094, -0.017580032348632812, -0.01695728302001953, -0.01633453369140625, -0.01571178436279297, -0.015089035034179688, -0.014466285705566406, -0.013843536376953125, -0.013220787048339844, -0.012598037719726562, -0.011975288391113281, -0.0113525390625, -0.010729789733886719, -0.010107040405273438, -0.009484291076660156, -0.008861541748046875, -0.008238792419433594, -0.0076160430908203125, -0.006993293762207031, -0.00637054443359375, -0.005747795104980469, -0.0051250457763671875, -0.004502296447753906, -0.003879547119140625, -0.0032567977905273438, -0.0026340484619140625, -0.0020112991333007812, -0.0013885498046875, -0.0007658004760742188, -0.0001430511474609375, 0.00047969818115234375, 0.001102447509765625, 0.0017251968383789062, 0.0023479461669921875, 0.0029706954956054688, 0.00359344482421875, 0.004216194152832031, 0.0048389434814453125, 0.005461692810058594, 0.006084442138671875, 0.006707191467285156, 0.0073299407958984375, 0.007952690124511719, 0.008575439453125, 0.009198188781738281, 0.009820938110351562, 0.010443687438964844, 0.011066436767578125, 0.011689186096191406, 0.012311935424804688, 0.012934684753417969, 0.01355743408203125, 0.014180183410644531, 0.014802932739257812, 0.015425682067871094, 0.016048431396484375, 0.016671180725097656, 0.017293930053710938, 0.01791667938232422, 0.0185394287109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 24.0, 48.0, 112.0, 196.0, 222.0, 203.0, 92.0, 49.0, 24.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18874108791351318, -0.18003621697425842, -0.17133136093616486, -0.1626265048980713, -0.15392163395881653, -0.14521676301956177, -0.1365119069814682, -0.12780705094337463, -0.11910218000411987, -0.11039731651544571, -0.10169245302677155, -0.09298758953809738, -0.08428272604942322, -0.07557786256074905, -0.06687299907207489, -0.058168135583400726, -0.04946327209472656, -0.0407584086060524, -0.032053545117378235, -0.02334868162870407, -0.014643818140029907, -0.005938954651355743, 0.0027659088373184204, 0.011470772325992584, 0.020175635814666748, 0.028880499303340912, 0.037585362792015076, 0.04629022628068924, 0.0549950897693634, 0.06369995325803757, 0.07240481674671173, 0.0811096802353859, 0.08981457352638245, 0.09851943701505661, 0.10722430050373077, 0.11592916399240494, 0.1246340274810791, 0.13333889842033386, 0.14204375445842743, 0.150748610496521, 0.15945348143577576, 0.16815835237503052, 0.17686320841312408, 0.18556806445121765, 0.1942729353904724, 0.20297780632972717, 0.21168266236782074, 0.2203875184059143, 0.22909238934516907, 0.23779726028442383, 0.2465021163225174, 0.25520697236061096, 0.2639118432998657, 0.2726167142391205, 0.28132158517837524, 0.2900264263153076, 0.2987312972545624, 0.30743616819381714, 0.3161410093307495, 0.3248458802700043, 0.33355075120925903, 0.3422556221485138, 0.35096049308776855, 0.3596653342247009, 0.3683702051639557]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 9.0, 7.0, 12.0, 10.0, 14.0, 10.0, 20.0, 34.0, 28.0, 25.0, 29.0, 26.0, 48.0, 41.0, 43.0, 40.0, 43.0, 58.0, 31.0, 37.0, 49.0, 36.0, 39.0, 36.0, 43.0, 33.0, 32.0, 29.0, 35.0, 18.0, 14.0, 14.0, 16.0, 14.0, 7.0, 5.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08456116914749146, -0.08184190839529037, -0.0791226476430893, -0.07640337944030762, -0.07368411868810654, -0.07096485793590546, -0.06824558973312378, -0.0655263289809227, -0.06280706822872162, -0.06008780747652054, -0.05736854299902916, -0.05464927852153778, -0.0519300177693367, -0.04921075701713562, -0.04649149253964424, -0.04377222806215286, -0.04105296730995178, -0.0383337065577507, -0.03561444208025932, -0.032895177602767944, -0.030175916850566864, -0.027456654235720634, -0.024737391620874405, -0.022018129006028175, -0.019298866391181946, -0.016579603776335716, -0.013860341161489487, -0.011141078546643257, -0.008421815931797028, -0.005702553316950798, -0.0029832907021045685, -0.00026402808725833893, 0.0024552345275878906, 0.00517449714243412, 0.00789375975728035, 0.01061302237212658, 0.013332284986972809, 0.01605154760181904, 0.018770810216665268, 0.021490072831511497, 0.024209335446357727, 0.026928598061203957, 0.029647860676050186, 0.032367125153541565, 0.035086385905742645, 0.037805646657943726, 0.040524911135435104, 0.04324417561292648, 0.045963436365127563, 0.048682697117328644, 0.05140196159482002, 0.0541212260723114, 0.05684048682451248, 0.05955974757671356, 0.06227901205420494, 0.06499827653169632, 0.0677175372838974, 0.07043679803609848, 0.07315605878829956, 0.07587532699108124, 0.07859458774328232, 0.0813138484954834, 0.08403311669826508, 0.08675237745046616, 0.08947163820266724]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 17.0, 25.0, 46.0, 134.0, 350.0, 1027.0, 8835.0, 3777842.0, 399195.0, 5679.0, 771.0, 233.0, 80.0, 19.0, 8.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1053466796875, -0.10223579406738281, -0.09912490844726562, -0.09601402282714844, -0.09290313720703125, -0.08979225158691406, -0.08668136596679688, -0.08357048034667969, -0.0804595947265625, -0.07734870910644531, -0.07423782348632812, -0.07112693786621094, -0.06801605224609375, -0.06490516662597656, -0.061794281005859375, -0.05868339538574219, -0.055572509765625, -0.05246162414550781, -0.049350738525390625, -0.04623985290527344, -0.04312896728515625, -0.04001808166503906, -0.036907196044921875, -0.03379631042480469, -0.0306854248046875, -0.027574539184570312, -0.024463653564453125, -0.021352767944335938, -0.01824188232421875, -0.015130996704101562, -0.012020111083984375, -0.008909225463867188, -0.00579833984375, -0.0026874542236328125, 0.000423431396484375, 0.0035343170166015625, 0.00664520263671875, 0.009756088256835938, 0.012866973876953125, 0.015977859497070312, 0.0190887451171875, 0.022199630737304688, 0.025310516357421875, 0.028421401977539062, 0.03153228759765625, 0.03464317321777344, 0.037754058837890625, 0.04086494445800781, 0.043975830078125, 0.04708671569824219, 0.050197601318359375, 0.05330848693847656, 0.05641937255859375, 0.05953025817871094, 0.06264114379882812, 0.06575202941894531, 0.0688629150390625, 0.07197380065917969, 0.07508468627929688, 0.07819557189941406, 0.08130645751953125, 0.08441734313964844, 0.08752822875976562, 0.09063911437988281, 0.09375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 12.0, 34.0, 57.0, 131.0, 209.0, 218.0, 156.0, 108.0, 55.0, 16.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.043975830078125, -0.042882680892944336, -0.04178953170776367, -0.04069638252258301, -0.039603233337402344, -0.03851008415222168, -0.037416934967041016, -0.03632378578186035, -0.03523063659667969, -0.03413748741149902, -0.03304433822631836, -0.031951189041137695, -0.03085803985595703, -0.029764890670776367, -0.028671741485595703, -0.02757859230041504, -0.026485443115234375, -0.02539229393005371, -0.024299144744873047, -0.023205995559692383, -0.02211284637451172, -0.021019697189331055, -0.01992654800415039, -0.018833398818969727, -0.017740249633789062, -0.0166471004486084, -0.015553951263427734, -0.01446080207824707, -0.013367652893066406, -0.012274503707885742, -0.011181354522705078, -0.010088205337524414, -0.00899505615234375, -0.007901906967163086, -0.006808757781982422, -0.005715608596801758, -0.004622459411621094, -0.0035293102264404297, -0.0024361610412597656, -0.0013430118560791016, -0.0002498626708984375, 0.0008432865142822266, 0.0019364356994628906, 0.0030295848846435547, 0.004122734069824219, 0.005215883255004883, 0.006309032440185547, 0.007402181625366211, 0.008495330810546875, 0.009588479995727539, 0.010681629180908203, 0.011774778366088867, 0.012867927551269531, 0.013961076736450195, 0.01505422592163086, 0.016147375106811523, 0.017240524291992188, 0.01833367347717285, 0.019426822662353516, 0.02051997184753418, 0.021613121032714844, 0.022706270217895508, 0.023799419403076172, 0.024892568588256836, 0.0259857177734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 15.0, 21.0, 32.0, 52.0, 69.0, 102.0, 161.0, 297.0, 391.0, 727.0, 1232.0, 2479.0, 5141.0, 11797.0, 30904.0, 95327.0, 390473.0, 2671200.0, 761375.0, 148687.0, 43884.0, 16261.0, 6700.0, 3057.0, 1598.0, 908.0, 565.0, 324.0, 190.0, 109.0, 60.0, 39.0, 26.0, 12.0, 16.0, 9.0, 7.0, 11.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751708984375, -0.01699686050415039, -0.01647663116455078, -0.015956401824951172, -0.015436172485351562, -0.014915943145751953, -0.014395713806152344, -0.013875484466552734, -0.013355255126953125, -0.012835025787353516, -0.012314796447753906, -0.011794567108154297, -0.011274337768554688, -0.010754108428955078, -0.010233879089355469, -0.00971364974975586, -0.00919342041015625, -0.00867319107055664, -0.008152961730957031, -0.007632732391357422, -0.0071125030517578125, -0.006592273712158203, -0.006072044372558594, -0.005551815032958984, -0.005031585693359375, -0.004511356353759766, -0.003991127014160156, -0.003470897674560547, -0.0029506683349609375, -0.002430438995361328, -0.0019102096557617188, -0.0013899803161621094, -0.0008697509765625, -0.0003495216369628906, 0.00017070770263671875, 0.0006909370422363281, 0.0012111663818359375, 0.0017313957214355469, 0.0022516250610351562, 0.0027718544006347656, 0.003292083740234375, 0.0038123130798339844, 0.004332542419433594, 0.004852771759033203, 0.0053730010986328125, 0.005893230438232422, 0.006413459777832031, 0.006933689117431641, 0.00745391845703125, 0.00797414779663086, 0.008494377136230469, 0.009014606475830078, 0.009534835815429688, 0.010055065155029297, 0.010575294494628906, 0.011095523834228516, 0.011615753173828125, 0.012135982513427734, 0.012656211853027344, 0.013176441192626953, 0.013696670532226562, 0.014216899871826172, 0.014737129211425781, 0.01525735855102539, 0.015777587890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 10.0, 6.0, 6.0, 10.0, 23.0, 20.0, 34.0, 40.0, 63.0, 72.0, 99.0, 134.0, 191.0, 370.0, 596.0, 782.0, 583.0, 340.0, 193.0, 131.0, 84.0, 65.0, 45.0, 42.0, 30.0, 22.0, 21.0, 13.0, 11.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0158233642578125, -0.015320301055908203, -0.014817237854003906, -0.01431417465209961, -0.013811111450195312, -0.013308048248291016, -0.012804985046386719, -0.012301921844482422, -0.011798858642578125, -0.011295795440673828, -0.010792732238769531, -0.010289669036865234, -0.009786605834960938, -0.00928354263305664, -0.008780479431152344, -0.008277416229248047, -0.00777435302734375, -0.007271289825439453, -0.006768226623535156, -0.006265163421630859, -0.0057621002197265625, -0.005259037017822266, -0.004755973815917969, -0.004252910614013672, -0.003749847412109375, -0.003246784210205078, -0.0027437210083007812, -0.0022406578063964844, -0.0017375946044921875, -0.0012345314025878906, -0.0007314682006835938, -0.00022840499877929688, 0.000274658203125, 0.0007777214050292969, 0.0012807846069335938, 0.0017838478088378906, 0.0022869110107421875, 0.0027899742126464844, 0.0032930374145507812, 0.003796100616455078, 0.004299163818359375, 0.004802227020263672, 0.005305290222167969, 0.005808353424072266, 0.0063114166259765625, 0.006814479827880859, 0.007317543029785156, 0.007820606231689453, 0.00832366943359375, 0.008826732635498047, 0.009329795837402344, 0.00983285903930664, 0.010335922241210938, 0.010838985443115234, 0.011342048645019531, 0.011845111846923828, 0.012348175048828125, 0.012851238250732422, 0.013354301452636719, 0.013857364654541016, 0.014360427856445312, 0.01486349105834961, 0.015366554260253906, 0.015869617462158203, 0.0163726806640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 8.0, 5.0, 17.0, 56.0, 99.0, 165.0, 203.0, 198.0, 135.0, 65.0, 26.0, 14.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19494816660881042, -0.18960313498973846, -0.1842581033706665, -0.17891307175159454, -0.17356804013252258, -0.16822299361228943, -0.16287797689437866, -0.1575329303741455, -0.15218789875507355, -0.1468428671360016, -0.14149783551692963, -0.13615280389785767, -0.1308077722787857, -0.12546274065971375, -0.12011770159006119, -0.11477266252040863, -0.10942763835191727, -0.1040826067328453, -0.09873757511377335, -0.09339253604412079, -0.08804750442504883, -0.08270247280597687, -0.07735744118690491, -0.07201240956783295, -0.06666737794876099, -0.061322346329689026, -0.05597731098532677, -0.050632279366254807, -0.04528724402189255, -0.03994221240282059, -0.03459718078374863, -0.029252145439386368, -0.02390711009502411, -0.018562076613307, -0.013217044062912464, -0.007872011512517929, -0.0025269780308008194, 0.0028180554509162903, 0.00816308706998825, 0.01350812241435051, 0.01885315403342247, 0.02419818751513958, 0.02954322099685669, 0.03488825261592865, 0.04023328423500061, 0.04557831957936287, 0.05092335119843483, 0.05626838654279709, 0.06161341816186905, 0.06695844978094101, 0.07230348140001297, 0.07764852046966553, 0.08299355208873749, 0.08833858370780945, 0.09368361532688141, 0.09902864694595337, 0.10437367856502533, 0.10971871018409729, 0.11506374180316925, 0.12040877342224121, 0.12575380504131317, 0.13109883666038513, 0.1364438831806183, 0.14178891479969025, 0.1471339464187622]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 7.0, 7.0, 10.0, 19.0, 14.0, 27.0, 31.0, 16.0, 33.0, 28.0, 40.0, 41.0, 37.0, 41.0, 41.0, 41.0, 46.0, 36.0, 44.0, 50.0, 35.0, 44.0, 25.0, 31.0, 41.0, 22.0, 22.0, 30.0, 21.0, 13.0, 19.0, 12.0, 12.0, 11.0, 9.0, 3.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.041091322898864746, -0.03955479711294174, -0.03801827132701874, -0.03648174926638603, -0.03494522348046303, -0.033408697694540024, -0.03187217563390732, -0.030335649847984314, -0.02879912406206131, -0.027262598276138306, -0.02572607435286045, -0.024189550429582596, -0.02265302464365959, -0.021116498857736588, -0.019579974934458733, -0.018043451011180878, -0.016506925225257874, -0.014970400370657444, -0.013433875516057014, -0.011897350661456585, -0.010360825806856155, -0.008824300952255726, -0.007287776097655296, -0.005751251243054867, -0.004214726388454437, -0.0026782015338540077, -0.0011416766792535782, 0.00039484817534685135, 0.0019313730299472809, 0.0034678978845477104, 0.00500442273914814, 0.0065409475937485695, 0.008077472448348999, 0.009613997302949429, 0.011150522157549858, 0.012687047012150288, 0.014223571866750717, 0.01576009765267372, 0.017296621575951576, 0.01883314549922943, 0.020369671285152435, 0.02190619707107544, 0.023442720994353294, 0.02497924491763115, 0.026515770703554153, 0.028052296489477158, 0.029588820412755013, 0.031125344336032867, 0.03266187012195587, 0.034198395907878876, 0.03573492169380188, 0.037271443754434586, 0.03880796954035759, 0.040344495326280594, 0.0418810173869133, 0.043417543172836304, 0.04495406895875931, 0.04649059474468231, 0.048027120530605316, 0.04956364259123802, 0.051100168377161026, 0.05263669416308403, 0.054173216223716736, 0.05570974200963974, 0.057246267795562744]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 12.0, 13.0, 12.0, 37.0, 46.0, 49.0, 85.0, 113.0, 211.0, 280.0, 455.0, 968.0, 2546.0, 8640.0, 52676.0, 662196.0, 286995.0, 24412.0, 5246.0, 1666.0, 720.0, 398.0, 249.0, 167.0, 99.0, 85.0, 41.0, 50.0, 22.0, 14.0, 13.0, 10.0, 6.0, 0.0, 6.0, 0.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08245849609375, -0.07994556427001953, -0.07743263244628906, -0.0749197006225586, -0.07240676879882812, -0.06989383697509766, -0.06738090515136719, -0.06486797332763672, -0.06235504150390625, -0.05984210968017578, -0.05732917785644531, -0.054816246032714844, -0.052303314208984375, -0.049790382385253906, -0.04727745056152344, -0.04476451873779297, -0.0422515869140625, -0.03973865509033203, -0.03722572326660156, -0.034712791442871094, -0.032199859619140625, -0.029686927795410156, -0.027173995971679688, -0.02466106414794922, -0.02214813232421875, -0.01963520050048828, -0.017122268676757812, -0.014609336853027344, -0.012096405029296875, -0.009583473205566406, -0.0070705413818359375, -0.004557609558105469, -0.002044677734375, 0.00046825408935546875, 0.0029811859130859375, 0.005494117736816406, 0.008007049560546875, 0.010519981384277344, 0.013032913208007812, 0.015545845031738281, 0.01805877685546875, 0.02057170867919922, 0.023084640502929688, 0.025597572326660156, 0.028110504150390625, 0.030623435974121094, 0.03313636779785156, 0.03564929962158203, 0.0381622314453125, 0.04067516326904297, 0.04318809509277344, 0.045701026916503906, 0.048213958740234375, 0.050726890563964844, 0.05323982238769531, 0.05575275421142578, 0.05826568603515625, 0.06077861785888672, 0.06329154968261719, 0.06580448150634766, 0.06831741333007812, 0.0708303451538086, 0.07334327697753906, 0.07585620880126953, 0.078369140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 13.0, 36.0, 80.0, 149.0, 200.0, 199.0, 162.0, 92.0, 50.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04388427734375, -0.04278898239135742, -0.041693687438964844, -0.040598392486572266, -0.03950309753417969, -0.03840780258178711, -0.03731250762939453, -0.03621721267700195, -0.035121917724609375, -0.0340266227722168, -0.03293132781982422, -0.03183603286743164, -0.030740737915039062, -0.029645442962646484, -0.028550148010253906, -0.027454853057861328, -0.02635955810546875, -0.025264263153076172, -0.024168968200683594, -0.023073673248291016, -0.021978378295898438, -0.02088308334350586, -0.01978778839111328, -0.018692493438720703, -0.017597198486328125, -0.016501903533935547, -0.015406608581542969, -0.01431131362915039, -0.013216018676757812, -0.012120723724365234, -0.011025428771972656, -0.009930133819580078, -0.0088348388671875, -0.007739543914794922, -0.006644248962402344, -0.005548954010009766, -0.0044536590576171875, -0.0033583641052246094, -0.0022630691528320312, -0.0011677742004394531, -7.2479248046875e-05, 0.0010228157043457031, 0.0021181106567382812, 0.0032134056091308594, 0.0043087005615234375, 0.005403995513916016, 0.006499290466308594, 0.007594585418701172, 0.00868988037109375, 0.009785175323486328, 0.010880470275878906, 0.011975765228271484, 0.013071060180664062, 0.01416635513305664, 0.015261650085449219, 0.016356945037841797, 0.017452239990234375, 0.018547534942626953, 0.01964282989501953, 0.02073812484741211, 0.021833419799804688, 0.022928714752197266, 0.024024009704589844, 0.025119304656982422, 0.026214599609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 17.0, 19.0, 24.0, 28.0, 54.0, 107.0, 157.0, 232.0, 477.0, 925.0, 2206.0, 5622.0, 15487.0, 53709.0, 258707.0, 525886.0, 135506.0, 32048.0, 10195.0, 3813.0, 1657.0, 743.0, 368.0, 201.0, 106.0, 77.0, 35.0, 32.0, 24.0, 12.0, 15.0, 13.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.041229248046875, -0.039868831634521484, -0.03850841522216797, -0.03714799880981445, -0.03578758239746094, -0.03442716598510742, -0.033066749572753906, -0.03170633316040039, -0.030345916748046875, -0.02898550033569336, -0.027625083923339844, -0.026264667510986328, -0.024904251098632812, -0.023543834686279297, -0.02218341827392578, -0.020823001861572266, -0.01946258544921875, -0.018102169036865234, -0.01674175262451172, -0.015381336212158203, -0.014020919799804688, -0.012660503387451172, -0.011300086975097656, -0.00993967056274414, -0.008579254150390625, -0.007218837738037109, -0.005858421325683594, -0.004498004913330078, -0.0031375885009765625, -0.0017771720886230469, -0.00041675567626953125, 0.0009436607360839844, 0.0023040771484375, 0.0036644935607910156, 0.005024909973144531, 0.006385326385498047, 0.0077457427978515625, 0.009106159210205078, 0.010466575622558594, 0.01182699203491211, 0.013187408447265625, 0.01454782485961914, 0.015908241271972656, 0.017268657684326172, 0.018629074096679688, 0.019989490509033203, 0.02134990692138672, 0.022710323333740234, 0.02407073974609375, 0.025431156158447266, 0.02679157257080078, 0.028151988983154297, 0.029512405395507812, 0.030872821807861328, 0.032233238220214844, 0.03359365463256836, 0.034954071044921875, 0.03631448745727539, 0.037674903869628906, 0.03903532028198242, 0.04039573669433594, 0.04175615310668945, 0.04311656951904297, 0.044476985931396484, 0.04583740234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 10.0, 10.0, 13.0, 15.0, 26.0, 19.0, 27.0, 25.0, 26.0, 61.0, 44.0, 50.0, 54.0, 63.0, 69.0, 64.0, 72.0, 46.0, 48.0, 46.0, 34.0, 28.0, 31.0, 20.0, 16.0, 14.0, 8.0, 9.0, 14.0, 5.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.033416748046875, -0.032242774963378906, -0.031068801879882812, -0.02989482879638672, -0.028720855712890625, -0.02754688262939453, -0.026372909545898438, -0.025198936462402344, -0.02402496337890625, -0.022850990295410156, -0.021677017211914062, -0.02050304412841797, -0.019329071044921875, -0.01815509796142578, -0.016981124877929688, -0.015807151794433594, -0.0146331787109375, -0.013459205627441406, -0.012285232543945312, -0.011111259460449219, -0.009937286376953125, -0.008763313293457031, -0.0075893402099609375, -0.006415367126464844, -0.00524139404296875, -0.004067420959472656, -0.0028934478759765625, -0.0017194747924804688, -0.000545501708984375, 0.0006284713745117188, 0.0018024444580078125, 0.0029764175415039062, 0.004150390625, 0.005324363708496094, 0.0064983367919921875, 0.007672309875488281, 0.008846282958984375, 0.010020256042480469, 0.011194229125976562, 0.012368202209472656, 0.01354217529296875, 0.014716148376464844, 0.015890121459960938, 0.01706409454345703, 0.018238067626953125, 0.01941204071044922, 0.020586013793945312, 0.021759986877441406, 0.0229339599609375, 0.024107933044433594, 0.025281906127929688, 0.02645587921142578, 0.027629852294921875, 0.02880382537841797, 0.029977798461914062, 0.031151771545410156, 0.03232574462890625, 0.033499717712402344, 0.03467369079589844, 0.03584766387939453, 0.037021636962890625, 0.03819561004638672, 0.03936958312988281, 0.040543556213378906, 0.041717529296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 17.0, 23.0, 30.0, 65.0, 108.0, 212.0, 361.0, 730.0, 1463.0, 2962.0, 7149.0, 18576.0, 68336.0, 585936.0, 296519.0, 42405.0, 13419.0, 5484.0, 2369.0, 1153.0, 545.0, 318.0, 173.0, 93.0, 35.0, 29.0, 13.0, 9.0, 8.0, 1.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032257080078125, -0.031176090240478516, -0.03009510040283203, -0.029014110565185547, -0.027933120727539062, -0.026852130889892578, -0.025771141052246094, -0.02469015121459961, -0.023609161376953125, -0.02252817153930664, -0.021447181701660156, -0.020366191864013672, -0.019285202026367188, -0.018204212188720703, -0.01712322235107422, -0.016042232513427734, -0.01496124267578125, -0.013880252838134766, -0.012799263000488281, -0.011718273162841797, -0.010637283325195312, -0.009556293487548828, -0.008475303649902344, -0.007394313812255859, -0.006313323974609375, -0.005232334136962891, -0.004151344299316406, -0.003070354461669922, -0.0019893646240234375, -0.0009083747863769531, 0.00017261505126953125, 0.0012536048889160156, 0.0023345947265625, 0.0034155845642089844, 0.004496574401855469, 0.005577564239501953, 0.0066585540771484375, 0.007739543914794922, 0.008820533752441406, 0.00990152359008789, 0.010982513427734375, 0.01206350326538086, 0.013144493103027344, 0.014225482940673828, 0.015306472778320312, 0.016387462615966797, 0.01746845245361328, 0.018549442291259766, 0.01963043212890625, 0.020711421966552734, 0.02179241180419922, 0.022873401641845703, 0.023954391479492188, 0.025035381317138672, 0.026116371154785156, 0.02719736099243164, 0.028278350830078125, 0.02935934066772461, 0.030440330505371094, 0.03152132034301758, 0.03260231018066406, 0.03368330001831055, 0.03476428985595703, 0.035845279693603516, 0.03692626953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 10.0, 4.0, 5.0, 6.0, 11.0, 22.0, 21.0, 31.0, 24.0, 52.0, 63.0, 61.0, 95.0, 119.0, 81.0, 72.0, 72.0, 38.0, 39.0, 36.0, 36.0, 23.0, 9.0, 15.0, 10.0, 4.0, 3.0, 6.0, 1.0, 3.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3795833587646484e-05, -3.254413604736328e-05, -3.129243850708008e-05, -3.0040740966796875e-05, -2.8789043426513672e-05, -2.753734588623047e-05, -2.6285648345947266e-05, -2.5033950805664062e-05, -2.378225326538086e-05, -2.2530555725097656e-05, -2.1278858184814453e-05, -2.002716064453125e-05, -1.8775463104248047e-05, -1.7523765563964844e-05, -1.627206802368164e-05, -1.5020370483398438e-05, -1.3768672943115234e-05, -1.2516975402832031e-05, -1.1265277862548828e-05, -1.0013580322265625e-05, -8.761882781982422e-06, -7.510185241699219e-06, -6.258487701416016e-06, -5.0067901611328125e-06, -3.7550926208496094e-06, -2.5033950805664062e-06, -1.2516975402832031e-06, 0.0, 1.2516975402832031e-06, 2.5033950805664062e-06, 3.7550926208496094e-06, 5.0067901611328125e-06, 6.258487701416016e-06, 7.510185241699219e-06, 8.761882781982422e-06, 1.0013580322265625e-05, 1.1265277862548828e-05, 1.2516975402832031e-05, 1.3768672943115234e-05, 1.5020370483398438e-05, 1.627206802368164e-05, 1.7523765563964844e-05, 1.8775463104248047e-05, 2.002716064453125e-05, 2.1278858184814453e-05, 2.2530555725097656e-05, 2.378225326538086e-05, 2.5033950805664062e-05, 2.6285648345947266e-05, 2.753734588623047e-05, 2.8789043426513672e-05, 3.0040740966796875e-05, 3.129243850708008e-05, 3.254413604736328e-05, 3.3795833587646484e-05, 3.504753112792969e-05, 3.629922866821289e-05, 3.7550926208496094e-05, 3.88026237487793e-05, 4.00543212890625e-05, 4.13060188293457e-05, 4.2557716369628906e-05, 4.380941390991211e-05, 4.506111145019531e-05, 4.6312808990478516e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 6.0, 2.0, 14.0, 12.0, 17.0, 30.0, 51.0, 50.0, 82.0, 125.0, 210.0, 377.0, 632.0, 1375.0, 2646.0, 6047.0, 14250.0, 37514.0, 141514.0, 587588.0, 182296.0, 44433.0, 16026.0, 6871.0, 3056.0, 1512.0, 739.0, 442.0, 231.0, 132.0, 84.0, 48.0, 40.0, 28.0, 7.0, 12.0, 12.0, 9.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0258331298828125, -0.024988174438476562, -0.024143218994140625, -0.023298263549804688, -0.02245330810546875, -0.021608352661132812, -0.020763397216796875, -0.019918441772460938, -0.019073486328125, -0.018228530883789062, -0.017383575439453125, -0.016538619995117188, -0.01569366455078125, -0.014848709106445312, -0.014003753662109375, -0.013158798217773438, -0.0123138427734375, -0.011468887329101562, -0.010623931884765625, -0.009778976440429688, -0.00893402099609375, -0.008089065551757812, -0.007244110107421875, -0.0063991546630859375, -0.00555419921875, -0.0047092437744140625, -0.003864288330078125, -0.0030193328857421875, -0.00217437744140625, -0.0013294219970703125, -0.000484466552734375, 0.0003604888916015625, 0.0012054443359375, 0.0020503997802734375, 0.002895355224609375, 0.0037403106689453125, 0.00458526611328125, 0.0054302215576171875, 0.006275177001953125, 0.0071201324462890625, 0.007965087890625, 0.008810043334960938, 0.009654998779296875, 0.010499954223632812, 0.01134490966796875, 0.012189865112304688, 0.013034820556640625, 0.013879776000976562, 0.0147247314453125, 0.015569686889648438, 0.016414642333984375, 0.017259597778320312, 0.01810455322265625, 0.018949508666992188, 0.019794464111328125, 0.020639419555664062, 0.021484375, 0.022329330444335938, 0.023174285888671875, 0.024019241333007812, 0.02486419677734375, 0.025709152221679688, 0.026554107666015625, 0.027399063110351562, 0.0282440185546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 6.0, 8.0, 18.0, 14.0, 29.0, 39.0, 54.0, 87.0, 135.0, 170.0, 143.0, 74.0, 39.0, 46.0, 26.0, 21.0, 18.0, 7.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036285400390625, -0.03523540496826172, -0.03418540954589844, -0.033135414123535156, -0.032085418701171875, -0.031035423278808594, -0.029985427856445312, -0.02893543243408203, -0.02788543701171875, -0.02683544158935547, -0.025785446166992188, -0.024735450744628906, -0.023685455322265625, -0.022635459899902344, -0.021585464477539062, -0.02053546905517578, -0.0194854736328125, -0.01843547821044922, -0.017385482788085938, -0.016335487365722656, -0.015285491943359375, -0.014235496520996094, -0.013185501098632812, -0.012135505676269531, -0.01108551025390625, -0.010035514831542969, -0.008985519409179688, -0.007935523986816406, -0.006885528564453125, -0.005835533142089844, -0.0047855377197265625, -0.0037355422973632812, -0.002685546875, -0.0016355514526367188, -0.0005855560302734375, 0.00046443939208984375, 0.001514434814453125, 0.0025644302368164062, 0.0036144256591796875, 0.004664421081542969, 0.00571441650390625, 0.006764411926269531, 0.007814407348632812, 0.008864402770996094, 0.009914398193359375, 0.010964393615722656, 0.012014389038085938, 0.013064384460449219, 0.0141143798828125, 0.015164375305175781, 0.016214370727539062, 0.017264366149902344, 0.018314361572265625, 0.019364356994628906, 0.020414352416992188, 0.02146434783935547, 0.02251434326171875, 0.02356433868408203, 0.024614334106445312, 0.025664329528808594, 0.026714324951171875, 0.027764320373535156, 0.028814315795898438, 0.02986431121826172, 0.030914306640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 18.0, 37.0, 73.0, 177.0, 285.0, 247.0, 107.0, 31.0, 11.0, 7.0, 3.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32874804735183716, -0.3120640814304352, -0.2953801155090332, -0.2786961495876312, -0.26201218366622925, -0.24532820284366608, -0.2286442220211029, -0.21196025609970093, -0.19527629017829895, -0.17859232425689697, -0.161908358335495, -0.14522437751293182, -0.12854041159152985, -0.11185644567012787, -0.0951724722981453, -0.07848849892616272, -0.06180453300476074, -0.045120563358068466, -0.02843659371137619, -0.011752624064683914, 0.004931345582008362, 0.02161531150341034, 0.038299284875392914, 0.05498325824737549, 0.07166722416877747, 0.08835119009017944, 0.10503516346216202, 0.12171913683414459, 0.13840310275554657, 0.15508706867694855, 0.17177104949951172, 0.1884550154209137, 0.2051389217376709, 0.22182288765907288, 0.23850685358047485, 0.25519081950187683, 0.2718747854232788, 0.2885587811470032, 0.30524274706840515, 0.32192671298980713, 0.3386106789112091, 0.3552946448326111, 0.37197861075401306, 0.38866257667541504, 0.4053465723991394, 0.422030508518219, 0.43871450424194336, 0.45539847016334534, 0.4720824360847473, 0.4887664020061493, 0.5054503679275513, 0.5221343636512756, 0.5388182997703552, 0.5555022954940796, 0.5721862316131592, 0.5888702273368835, 0.6055542230606079, 0.6222382187843323, 0.6389221549034119, 0.6556061506271362, 0.6722900867462158, 0.6889740824699402, 0.7056580185890198, 0.7223420143127441, 0.7390259504318237]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 7.0, 6.0, 5.0, 7.0, 13.0, 12.0, 27.0, 23.0, 30.0, 27.0, 29.0, 40.0, 51.0, 60.0, 30.0, 50.0, 49.0, 51.0, 44.0, 52.0, 54.0, 46.0, 33.0, 36.0, 29.0, 29.0, 31.0, 18.0, 21.0, 21.0, 11.0, 18.0, 12.0, 7.0, 6.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14844787120819092, -0.14396806061267853, -0.13948823511600494, -0.13500842452049255, -0.13052861392498016, -0.12604880332946777, -0.12156897783279419, -0.1170891672372818, -0.11260934919118881, -0.10812953114509583, -0.10364972054958344, -0.09916990250349045, -0.09469008445739746, -0.09021027386188507, -0.08573045581579208, -0.0812506377696991, -0.0767708271741867, -0.07229100912809372, -0.06781119853258133, -0.06333138048648834, -0.058851566165685654, -0.054371751844882965, -0.04989193379878998, -0.04541211947798729, -0.0409323051571846, -0.03645249083638191, -0.031972676515579224, -0.027492858469486237, -0.023013044148683548, -0.01853322982788086, -0.014053413644433022, -0.009573597460985184, -0.005093783140182495, -0.0006139678880572319, 0.0038658473640680313, 0.008345662616193295, 0.012825477868318558, 0.017305292189121246, 0.021785108372569084, 0.026264924556016922, 0.03074473887681961, 0.0352245531976223, 0.03970436751842499, 0.044184185564517975, 0.04866399988532066, 0.05314381420612335, 0.05762363225221634, 0.06210344657301903, 0.06658326089382172, 0.0710630789399147, 0.0755428895354271, 0.08002270758152008, 0.08450251817703247, 0.08898233622312546, 0.09346215426921844, 0.09794196486473083, 0.10242178291082382, 0.10690160095691681, 0.1113814115524292, 0.11586122959852219, 0.12034104764461517, 0.12482085824012756, 0.12930066883563995, 0.13378049433231354, 0.13826030492782593]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 11.0, 8.0, 9.0, 12.0, 9.0, 17.0, 17.0, 37.0, 32.0, 57.0, 92.0, 122.0, 245.0, 354.0, 629.0, 1189.0, 3027.0, 8982.0, 37960.0, 321473.0, 3389123.0, 368630.0, 43960.0, 11021.0, 3965.0, 1684.0, 711.0, 366.0, 199.0, 120.0, 75.0, 40.0, 46.0, 18.0, 9.0, 14.0, 7.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039794921875, -0.03867483139038086, -0.03755474090576172, -0.03643465042114258, -0.03531455993652344, -0.0341944694519043, -0.033074378967285156, -0.031954288482666016, -0.030834197998046875, -0.029714107513427734, -0.028594017028808594, -0.027473926544189453, -0.026353836059570312, -0.025233745574951172, -0.02411365509033203, -0.02299356460571289, -0.02187347412109375, -0.02075338363647461, -0.01963329315185547, -0.018513202667236328, -0.017393112182617188, -0.016273021697998047, -0.015152931213378906, -0.014032840728759766, -0.012912750244140625, -0.011792659759521484, -0.010672569274902344, -0.009552478790283203, -0.008432388305664062, -0.007312297821044922, -0.006192207336425781, -0.005072116851806641, -0.0039520263671875, -0.0028319358825683594, -0.0017118453979492188, -0.0005917549133300781, 0.0005283355712890625, 0.0016484260559082031, 0.0027685165405273438, 0.0038886070251464844, 0.005008697509765625, 0.006128787994384766, 0.007248878479003906, 0.008368968963623047, 0.009489059448242188, 0.010609149932861328, 0.011729240417480469, 0.01284933090209961, 0.01396942138671875, 0.01508951187133789, 0.01620960235595703, 0.017329692840576172, 0.018449783325195312, 0.019569873809814453, 0.020689964294433594, 0.021810054779052734, 0.022930145263671875, 0.024050235748291016, 0.025170326232910156, 0.026290416717529297, 0.027410507202148438, 0.028530597686767578, 0.02965068817138672, 0.03077077865600586, 0.031890869140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 19.0, 40.0, 80.0, 130.0, 152.0, 179.0, 145.0, 109.0, 77.0, 29.0, 20.0, 9.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04071044921875, -0.03967642784118652, -0.03864240646362305, -0.03760838508605957, -0.036574363708496094, -0.03554034233093262, -0.03450632095336914, -0.033472299575805664, -0.03243827819824219, -0.03140425682067871, -0.030370235443115234, -0.029336214065551758, -0.02830219268798828, -0.027268171310424805, -0.026234149932861328, -0.02520012855529785, -0.024166107177734375, -0.0231320858001709, -0.022098064422607422, -0.021064043045043945, -0.02003002166748047, -0.018996000289916992, -0.017961978912353516, -0.01692795753479004, -0.015893936157226562, -0.014859914779663086, -0.01382589340209961, -0.012791872024536133, -0.011757850646972656, -0.01072382926940918, -0.009689807891845703, -0.008655786514282227, -0.00762176513671875, -0.0065877437591552734, -0.005553722381591797, -0.00451970100402832, -0.0034856796264648438, -0.002451658248901367, -0.0014176368713378906, -0.00038361549377441406, 0.0006504058837890625, 0.001684427261352539, 0.0027184486389160156, 0.003752470016479492, 0.004786491394042969, 0.005820512771606445, 0.006854534149169922, 0.007888555526733398, 0.008922576904296875, 0.009956598281860352, 0.010990619659423828, 0.012024641036987305, 0.013058662414550781, 0.014092683792114258, 0.015126705169677734, 0.01616072654724121, 0.017194747924804688, 0.018228769302368164, 0.01926279067993164, 0.020296812057495117, 0.021330833435058594, 0.02236485481262207, 0.023398876190185547, 0.024432897567749023, 0.0254669189453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 15.0, 7.0, 26.0, 28.0, 49.0, 78.0, 127.0, 207.0, 360.0, 765.0, 1447.0, 3517.0, 9151.0, 30624.0, 139943.0, 1149751.0, 2539407.0, 248674.0, 48299.0, 13246.0, 4578.0, 1892.0, 918.0, 488.0, 263.0, 146.0, 104.0, 59.0, 42.0, 18.0, 16.0, 12.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024658203125, -0.02375030517578125, -0.0228424072265625, -0.02193450927734375, -0.021026611328125, -0.02011871337890625, -0.0192108154296875, -0.01830291748046875, -0.01739501953125, -0.01648712158203125, -0.0155792236328125, -0.01467132568359375, -0.013763427734375, -0.01285552978515625, -0.0119476318359375, -0.01103973388671875, -0.0101318359375, -0.00922393798828125, -0.0083160400390625, -0.00740814208984375, -0.006500244140625, -0.00559234619140625, -0.0046844482421875, -0.00377655029296875, -0.00286865234375, -0.00196075439453125, -0.0010528564453125, -0.00014495849609375, 0.000762939453125, 0.00167083740234375, 0.0025787353515625, 0.00348663330078125, 0.00439453125, 0.00530242919921875, 0.0062103271484375, 0.00711822509765625, 0.008026123046875, 0.00893402099609375, 0.0098419189453125, 0.01074981689453125, 0.01165771484375, 0.01256561279296875, 0.0134735107421875, 0.01438140869140625, 0.015289306640625, 0.01619720458984375, 0.0171051025390625, 0.01801300048828125, 0.0189208984375, 0.01982879638671875, 0.0207366943359375, 0.02164459228515625, 0.022552490234375, 0.02346038818359375, 0.0243682861328125, 0.02527618408203125, 0.02618408203125, 0.02709197998046875, 0.0279998779296875, 0.02890777587890625, 0.029815673828125, 0.03072357177734375, 0.0316314697265625, 0.03253936767578125, 0.033447265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 10.0, 8.0, 9.0, 17.0, 17.0, 38.0, 45.0, 54.0, 74.0, 109.0, 154.0, 252.0, 409.0, 599.0, 764.0, 515.0, 305.0, 185.0, 145.0, 106.0, 56.0, 47.0, 34.0, 30.0, 28.0, 9.0, 11.0, 13.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.024505615234375, -0.023789405822753906, -0.023073196411132812, -0.02235698699951172, -0.021640777587890625, -0.02092456817626953, -0.020208358764648438, -0.019492149353027344, -0.01877593994140625, -0.018059730529785156, -0.017343521118164062, -0.01662731170654297, -0.015911102294921875, -0.015194892883300781, -0.014478683471679688, -0.013762474060058594, -0.0130462646484375, -0.012330055236816406, -0.011613845825195312, -0.010897636413574219, -0.010181427001953125, -0.009465217590332031, -0.008749008178710938, -0.008032798767089844, -0.00731658935546875, -0.006600379943847656, -0.0058841705322265625, -0.005167961120605469, -0.004451751708984375, -0.0037355422973632812, -0.0030193328857421875, -0.0023031234741210938, -0.0015869140625, -0.0008707046508789062, -0.0001544952392578125, 0.0005617141723632812, 0.001277923583984375, 0.0019941329956054688, 0.0027103424072265625, 0.0034265518188476562, 0.00414276123046875, 0.004858970642089844, 0.0055751800537109375, 0.006291389465332031, 0.007007598876953125, 0.007723808288574219, 0.008440017700195312, 0.009156227111816406, 0.0098724365234375, 0.010588645935058594, 0.011304855346679688, 0.012021064758300781, 0.012737274169921875, 0.013453483581542969, 0.014169692993164062, 0.014885902404785156, 0.01560211181640625, 0.016318321228027344, 0.017034530639648438, 0.01775074005126953, 0.018466949462890625, 0.01918315887451172, 0.019899368286132812, 0.020615577697753906, 0.021331787109375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 13.0, 27.0, 34.0, 102.0, 165.0, 163.0, 195.0, 140.0, 83.0, 43.0, 15.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2875499129295349, -0.28025999665260315, -0.2729701101779938, -0.265680193901062, -0.25839030742645264, -0.2511003911495209, -0.2438104897737503, -0.23652058839797974, -0.22923068702220917, -0.2219407856464386, -0.21465088427066803, -0.20736098289489746, -0.2000710666179657, -0.19278118014335632, -0.18549126386642456, -0.178201362490654, -0.17091146111488342, -0.16362155973911285, -0.15633165836334229, -0.14904175698757172, -0.14175185561180115, -0.13446193933486938, -0.12717203795909882, -0.11988213658332825, -0.11259223520755768, -0.10530233383178711, -0.09801243245601654, -0.09072252362966537, -0.0834326222538948, -0.07614272087812424, -0.06885281205177307, -0.0615629106760025, -0.05427302420139313, -0.04698312282562256, -0.03969321772456169, -0.032403312623500824, -0.025113411247730255, -0.017823509871959686, -0.010533604770898819, -0.0032436996698379517, 0.004046201705932617, 0.011336104944348335, 0.018626008182764053, 0.02591591142117977, 0.03320581465959549, 0.04049571603536606, 0.047785621136426926, 0.05507552623748779, 0.06236542761325836, 0.06965532898902893, 0.0769452303647995, 0.08423513919115067, 0.09152504056692123, 0.0988149419426918, 0.10610485076904297, 0.11339475214481354, 0.1206846535205841, 0.12797455489635468, 0.13526445627212524, 0.1425543576478958, 0.14984425902366638, 0.15713417530059814, 0.1644240766763687, 0.17171397805213928, 0.17900387942790985]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 1.0, 7.0, 2.0, 5.0, 4.0, 9.0, 7.0, 10.0, 14.0, 16.0, 13.0, 17.0, 18.0, 18.0, 20.0, 31.0, 25.0, 40.0, 39.0, 20.0, 31.0, 46.0, 44.0, 47.0, 43.0, 26.0, 45.0, 33.0, 38.0, 50.0, 35.0, 35.0, 17.0, 24.0, 26.0, 20.0, 16.0, 22.0, 13.0, 10.0, 9.0, 5.0, 8.0, 10.0, 9.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056313395500183105, -0.05434640869498253, -0.05237942188978195, -0.050412435084581375, -0.0484454482793808, -0.04647846147418022, -0.044511474668979645, -0.04254448786377907, -0.04057750105857849, -0.038610514253377914, -0.03664352744817734, -0.03467654064297676, -0.032709553837776184, -0.030742567032575607, -0.02877558022737503, -0.026808593422174454, -0.024841606616973877, -0.0228746198117733, -0.020907633006572723, -0.018940646201372147, -0.01697365939617157, -0.015006672590970993, -0.013039685785770416, -0.01107269898056984, -0.009105712175369263, -0.007138725370168686, -0.005171738564968109, -0.0032047517597675323, -0.0012377649545669556, 0.0007292218506336212, 0.002696208655834198, 0.004663195461034775, 0.0066301822662353516, 0.008597169071435928, 0.010564155876636505, 0.012531142681837082, 0.014498129487037659, 0.016465116292238235, 0.018432103097438812, 0.02039908990263939, 0.022366076707839966, 0.024333063513040543, 0.02630005031824112, 0.028267037123441696, 0.030234023928642273, 0.03220101073384285, 0.034167997539043427, 0.036134984344244, 0.03810197114944458, 0.04006895795464516, 0.042035944759845734, 0.04400293156504631, 0.04596991837024689, 0.047936905175447464, 0.04990389198064804, 0.05187087878584862, 0.053837865591049194, 0.05580485239624977, 0.05777183920145035, 0.059738826006650925, 0.0617058128118515, 0.06367279589176178, 0.06563978642225266, 0.06760677695274353, 0.06957376003265381]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 3.0, 8.0, 11.0, 16.0, 31.0, 39.0, 64.0, 100.0, 164.0, 225.0, 377.0, 840.0, 2107.0, 7275.0, 35724.0, 386705.0, 550349.0, 50543.0, 9174.0, 2529.0, 998.0, 486.0, 251.0, 177.0, 100.0, 70.0, 57.0, 38.0, 18.0, 18.0, 9.0, 8.0, 8.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09368705749511719, -0.09093856811523438, -0.08819007873535156, -0.08544158935546875, -0.08269309997558594, -0.07994461059570312, -0.07719612121582031, -0.0744476318359375, -0.07169914245605469, -0.06895065307617188, -0.06620216369628906, -0.06345367431640625, -0.06070518493652344, -0.057956695556640625, -0.05520820617675781, -0.052459716796875, -0.04971122741699219, -0.046962738037109375, -0.04421424865722656, -0.04146575927734375, -0.03871726989746094, -0.035968780517578125, -0.03322029113769531, -0.0304718017578125, -0.027723312377929688, -0.024974822998046875, -0.022226333618164062, -0.01947784423828125, -0.016729354858398438, -0.013980865478515625, -0.011232376098632812, -0.00848388671875, -0.0057353973388671875, -0.002986907958984375, -0.0002384185791015625, 0.00251007080078125, 0.0052585601806640625, 0.008007049560546875, 0.010755538940429688, 0.0135040283203125, 0.016252517700195312, 0.019001007080078125, 0.021749496459960938, 0.02449798583984375, 0.027246475219726562, 0.029994964599609375, 0.03274345397949219, 0.035491943359375, 0.03824043273925781, 0.040988922119140625, 0.04373741149902344, 0.04648590087890625, 0.04923439025878906, 0.051982879638671875, 0.05473136901855469, 0.0574798583984375, 0.06022834777832031, 0.06297683715820312, 0.06572532653808594, 0.06847381591796875, 0.07122230529785156, 0.07397079467773438, 0.07671928405761719, 0.0794677734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 22.0, 56.0, 82.0, 133.0, 157.0, 196.0, 119.0, 104.0, 64.0, 31.0, 17.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0426025390625, -0.04154157638549805, -0.040480613708496094, -0.03941965103149414, -0.03835868835449219, -0.037297725677490234, -0.03623676300048828, -0.03517580032348633, -0.034114837646484375, -0.03305387496948242, -0.03199291229248047, -0.030931949615478516, -0.029870986938476562, -0.02881002426147461, -0.027749061584472656, -0.026688098907470703, -0.02562713623046875, -0.024566173553466797, -0.023505210876464844, -0.02244424819946289, -0.021383285522460938, -0.020322322845458984, -0.01926136016845703, -0.018200397491455078, -0.017139434814453125, -0.016078472137451172, -0.015017509460449219, -0.013956546783447266, -0.012895584106445312, -0.01183462142944336, -0.010773658752441406, -0.009712696075439453, -0.0086517333984375, -0.007590770721435547, -0.006529808044433594, -0.005468845367431641, -0.0044078826904296875, -0.0033469200134277344, -0.0022859573364257812, -0.0012249946594238281, -0.000164031982421875, 0.0008969306945800781, 0.0019578933715820312, 0.0030188560485839844, 0.0040798187255859375, 0.005140781402587891, 0.006201744079589844, 0.007262706756591797, 0.00832366943359375, 0.009384632110595703, 0.010445594787597656, 0.01150655746459961, 0.012567520141601562, 0.013628482818603516, 0.014689445495605469, 0.015750408172607422, 0.016811370849609375, 0.017872333526611328, 0.01893329620361328, 0.019994258880615234, 0.021055221557617188, 0.02211618423461914, 0.023177146911621094, 0.024238109588623047, 0.025299072265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 0.0, 4.0, 5.0, 10.0, 14.0, 21.0, 28.0, 46.0, 54.0, 96.0, 224.0, 422.0, 1212.0, 3652.0, 12903.0, 57831.0, 418022.0, 467736.0, 66005.0, 13989.0, 3990.0, 1282.0, 491.0, 213.0, 110.0, 71.0, 36.0, 22.0, 15.0, 19.0, 10.0, 5.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06671142578125, -0.06456184387207031, -0.062412261962890625, -0.06026268005371094, -0.05811309814453125, -0.05596351623535156, -0.053813934326171875, -0.05166435241699219, -0.0495147705078125, -0.04736518859863281, -0.045215606689453125, -0.04306602478027344, -0.04091644287109375, -0.03876686096191406, -0.036617279052734375, -0.03446769714355469, -0.032318115234375, -0.030168533325195312, -0.028018951416015625, -0.025869369506835938, -0.02371978759765625, -0.021570205688476562, -0.019420623779296875, -0.017271041870117188, -0.0151214599609375, -0.012971878051757812, -0.010822296142578125, -0.008672714233398438, -0.00652313232421875, -0.0043735504150390625, -0.002223968505859375, -7.43865966796875e-05, 0.0020751953125, 0.0042247772216796875, 0.006374359130859375, 0.008523941040039062, 0.01067352294921875, 0.012823104858398438, 0.014972686767578125, 0.017122268676757812, 0.0192718505859375, 0.021421432495117188, 0.023571014404296875, 0.025720596313476562, 0.02787017822265625, 0.030019760131835938, 0.032169342041015625, 0.03431892395019531, 0.036468505859375, 0.03861808776855469, 0.040767669677734375, 0.04291725158691406, 0.04506683349609375, 0.04721641540527344, 0.049365997314453125, 0.05151557922363281, 0.0536651611328125, 0.05581474304199219, 0.057964324951171875, 0.06011390686035156, 0.06226348876953125, 0.06441307067871094, 0.06656265258789062, 0.06871223449707031, 0.07086181640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 5.0, 4.0, 6.0, 9.0, 12.0, 16.0, 12.0, 21.0, 18.0, 33.0, 27.0, 36.0, 43.0, 55.0, 66.0, 69.0, 70.0, 76.0, 59.0, 52.0, 40.0, 58.0, 39.0, 23.0, 40.0, 21.0, 14.0, 16.0, 11.0, 12.0, 8.0, 6.0, 4.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.05108642578125, -0.049653053283691406, -0.04821968078613281, -0.04678630828857422, -0.045352935791015625, -0.04391956329345703, -0.04248619079589844, -0.041052818298339844, -0.03961944580078125, -0.038186073303222656, -0.03675270080566406, -0.03531932830810547, -0.033885955810546875, -0.03245258331298828, -0.031019210815429688, -0.029585838317871094, -0.0281524658203125, -0.026719093322753906, -0.025285720825195312, -0.02385234832763672, -0.022418975830078125, -0.02098560333251953, -0.019552230834960938, -0.018118858337402344, -0.01668548583984375, -0.015252113342285156, -0.013818740844726562, -0.012385368347167969, -0.010951995849609375, -0.009518623352050781, -0.008085250854492188, -0.006651878356933594, -0.005218505859375, -0.0037851333618164062, -0.0023517608642578125, -0.0009183883666992188, 0.000514984130859375, 0.0019483566284179688, 0.0033817291259765625, 0.004815101623535156, 0.00624847412109375, 0.007681846618652344, 0.009115219116210938, 0.010548591613769531, 0.011981964111328125, 0.013415336608886719, 0.014848709106445312, 0.016282081604003906, 0.0177154541015625, 0.019148826599121094, 0.020582199096679688, 0.02201557159423828, 0.023448944091796875, 0.02488231658935547, 0.026315689086914062, 0.027749061584472656, 0.02918243408203125, 0.030615806579589844, 0.03204917907714844, 0.03348255157470703, 0.034915924072265625, 0.03634929656982422, 0.03778266906738281, 0.039216041564941406, 0.0406494140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 12.0, 5.0, 17.0, 28.0, 35.0, 41.0, 72.0, 108.0, 131.0, 202.0, 360.0, 569.0, 877.0, 1408.0, 2642.0, 4851.0, 9780.0, 21785.0, 61049.0, 278287.0, 499026.0, 106888.0, 32521.0, 13368.0, 6321.0, 3344.0, 1961.0, 1014.0, 612.0, 405.0, 282.0, 174.0, 114.0, 87.0, 49.0, 39.0, 25.0, 14.0, 11.0, 11.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.032958984375, -0.031995534896850586, -0.031032085418701172, -0.030068635940551758, -0.029105186462402344, -0.02814173698425293, -0.027178287506103516, -0.0262148380279541, -0.025251388549804688, -0.024287939071655273, -0.02332448959350586, -0.022361040115356445, -0.02139759063720703, -0.020434141159057617, -0.019470691680908203, -0.01850724220275879, -0.017543792724609375, -0.01658034324645996, -0.015616893768310547, -0.014653444290161133, -0.013689994812011719, -0.012726545333862305, -0.01176309585571289, -0.010799646377563477, -0.009836196899414062, -0.008872747421264648, -0.007909297943115234, -0.00694584846496582, -0.005982398986816406, -0.005018949508666992, -0.004055500030517578, -0.003092050552368164, -0.00212860107421875, -0.001165151596069336, -0.00020170211791992188, 0.0007617473602294922, 0.0017251968383789062, 0.0026886463165283203, 0.0036520957946777344, 0.0046155452728271484, 0.0055789947509765625, 0.0065424442291259766, 0.007505893707275391, 0.008469343185424805, 0.009432792663574219, 0.010396242141723633, 0.011359691619873047, 0.012323141098022461, 0.013286590576171875, 0.014250040054321289, 0.015213489532470703, 0.016176939010620117, 0.01714038848876953, 0.018103837966918945, 0.01906728744506836, 0.020030736923217773, 0.020994186401367188, 0.0219576358795166, 0.022921085357666016, 0.02388453483581543, 0.024847984313964844, 0.025811433792114258, 0.026774883270263672, 0.027738332748413086, 0.0287017822265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 10.0, 13.0, 19.0, 16.0, 28.0, 26.0, 34.0, 31.0, 44.0, 43.0, 62.0, 66.0, 86.0, 61.0, 72.0, 56.0, 53.0, 38.0, 31.0, 31.0, 28.0, 20.0, 17.0, 20.0, 17.0, 17.0, 8.0, 8.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2724270820617676e-05, -2.1904706954956055e-05, -2.1085143089294434e-05, -2.0265579223632812e-05, -1.944601535797119e-05, -1.862645149230957e-05, -1.780688762664795e-05, -1.6987323760986328e-05, -1.6167759895324707e-05, -1.5348196029663086e-05, -1.4528632164001465e-05, -1.3709068298339844e-05, -1.2889504432678223e-05, -1.2069940567016602e-05, -1.125037670135498e-05, -1.043081283569336e-05, -9.611248970031738e-06, -8.791685104370117e-06, -7.972121238708496e-06, -7.152557373046875e-06, -6.332993507385254e-06, -5.513429641723633e-06, -4.693865776062012e-06, -3.874301910400391e-06, -3.0547380447387695e-06, -2.2351741790771484e-06, -1.4156103134155273e-06, -5.960464477539062e-07, 2.2351741790771484e-07, 1.043081283569336e-06, 1.862645149230957e-06, 2.682209014892578e-06, 3.5017728805541992e-06, 4.32133674621582e-06, 5.140900611877441e-06, 5.9604644775390625e-06, 6.780028343200684e-06, 7.599592208862305e-06, 8.419156074523926e-06, 9.238719940185547e-06, 1.0058283805847168e-05, 1.0877847671508789e-05, 1.169741153717041e-05, 1.2516975402832031e-05, 1.3336539268493652e-05, 1.4156103134155273e-05, 1.4975666999816895e-05, 1.5795230865478516e-05, 1.6614794731140137e-05, 1.7434358596801758e-05, 1.825392246246338e-05, 1.9073486328125e-05, 1.989305019378662e-05, 2.0712614059448242e-05, 2.1532177925109863e-05, 2.2351741790771484e-05, 2.3171305656433105e-05, 2.3990869522094727e-05, 2.4810433387756348e-05, 2.562999725341797e-05, 2.644956111907959e-05, 2.726912498474121e-05, 2.8088688850402832e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 11.0, 17.0, 12.0, 22.0, 24.0, 44.0, 42.0, 55.0, 89.0, 134.0, 206.0, 300.0, 474.0, 764.0, 1252.0, 2199.0, 4053.0, 8190.0, 17940.0, 43039.0, 125452.0, 463331.0, 256956.0, 71283.0, 27358.0, 11942.0, 5876.0, 3043.0, 1651.0, 931.0, 602.0, 394.0, 272.0, 185.0, 118.0, 75.0, 51.0, 37.0, 26.0, 23.0, 13.0, 17.0, 14.0, 13.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.024749755859375, -0.02388906478881836, -0.02302837371826172, -0.022167682647705078, -0.021306991577148438, -0.020446300506591797, -0.019585609436035156, -0.018724918365478516, -0.017864227294921875, -0.017003536224365234, -0.016142845153808594, -0.015282154083251953, -0.014421463012695312, -0.013560771942138672, -0.012700080871582031, -0.01183938980102539, -0.01097869873046875, -0.01011800765991211, -0.009257316589355469, -0.008396625518798828, -0.0075359344482421875, -0.006675243377685547, -0.005814552307128906, -0.004953861236572266, -0.004093170166015625, -0.0032324790954589844, -0.0023717880249023438, -0.0015110969543457031, -0.0006504058837890625, 0.00021028518676757812, 0.0010709762573242188, 0.0019316673278808594, 0.0027923583984375, 0.0036530494689941406, 0.004513740539550781, 0.005374431610107422, 0.0062351226806640625, 0.007095813751220703, 0.007956504821777344, 0.008817195892333984, 0.009677886962890625, 0.010538578033447266, 0.011399269104003906, 0.012259960174560547, 0.013120651245117188, 0.013981342315673828, 0.014842033386230469, 0.01570272445678711, 0.01656341552734375, 0.01742410659790039, 0.01828479766845703, 0.019145488739013672, 0.020006179809570312, 0.020866870880126953, 0.021727561950683594, 0.022588253021240234, 0.023448944091796875, 0.024309635162353516, 0.025170326232910156, 0.026031017303466797, 0.026891708374023438, 0.027752399444580078, 0.02861309051513672, 0.02947378158569336, 0.03033447265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 18.0, 29.0, 44.0, 38.0, 63.0, 131.0, 209.0, 152.0, 90.0, 57.0, 32.0, 23.0, 13.0, 14.0, 4.0, 8.0, 8.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.04030036926269531, -0.038944244384765625, -0.03758811950683594, -0.03623199462890625, -0.03487586975097656, -0.033519744873046875, -0.03216361999511719, -0.0308074951171875, -0.029451370239257812, -0.028095245361328125, -0.026739120483398438, -0.02538299560546875, -0.024026870727539062, -0.022670745849609375, -0.021314620971679688, -0.01995849609375, -0.018602371215820312, -0.017246246337890625, -0.015890121459960938, -0.01453399658203125, -0.013177871704101562, -0.011821746826171875, -0.010465621948242188, -0.0091094970703125, -0.0077533721923828125, -0.006397247314453125, -0.0050411224365234375, -0.00368499755859375, -0.0023288726806640625, -0.000972747802734375, 0.0003833770751953125, 0.001739501953125, 0.0030956268310546875, 0.004451751708984375, 0.0058078765869140625, 0.00716400146484375, 0.008520126342773438, 0.009876251220703125, 0.011232376098632812, 0.0125885009765625, 0.013944625854492188, 0.015300750732421875, 0.016656875610351562, 0.01801300048828125, 0.019369125366210938, 0.020725250244140625, 0.022081375122070312, 0.0234375, 0.024793624877929688, 0.026149749755859375, 0.027505874633789062, 0.02886199951171875, 0.030218124389648438, 0.031574249267578125, 0.03293037414550781, 0.0342864990234375, 0.03564262390136719, 0.036998748779296875, 0.03835487365722656, 0.03971099853515625, 0.04106712341308594, 0.042423248291015625, 0.04377937316894531, 0.045135498046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 14.0, 24.0, 100.0, 313.0, 370.0, 133.0, 37.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5977062582969666, -0.5707470774650574, -0.543787956237793, -0.5168287754058838, -0.4898695945739746, -0.46291041374206543, -0.43595126271247864, -0.40899211168289185, -0.38203293085098267, -0.3550737500190735, -0.3281145989894867, -0.3011554479598999, -0.2741962671279907, -0.24723710119724274, -0.22027793526649475, -0.19331876933574677, -0.16635960340499878, -0.1394004374742508, -0.11244127154350281, -0.08548210561275482, -0.058522939682006836, -0.03156377375125885, -0.004604607820510864, 0.02235455811023712, 0.04931372404098511, 0.0762728899717331, 0.10323205590248108, 0.13019122183322906, 0.15715038776397705, 0.18410955369472504, 0.21106871962547302, 0.238027885556221, 0.2649869918823242, 0.2919461727142334, 0.3189053237438202, 0.345864474773407, 0.37282365560531616, 0.39978283643722534, 0.42674198746681213, 0.4537011384963989, 0.4806603193283081, 0.5076195001602173, 0.5345786809921265, 0.5615378022193909, 0.5884969830513, 0.6154561638832092, 0.6424152851104736, 0.6693744659423828, 0.696333646774292, 0.7232928276062012, 0.7502520084381104, 0.7772111296653748, 0.8041703104972839, 0.8311294913291931, 0.8580886125564575, 0.8850477933883667, 0.9120069742202759, 0.9389661550521851, 0.9659253358840942, 0.9928844571113586, 1.019843578338623, 1.0468027591705322, 1.0737619400024414, 1.1007211208343506, 1.1276803016662598]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 8.0, 6.0, 20.0, 16.0, 17.0, 23.0, 29.0, 28.0, 33.0, 31.0, 42.0, 47.0, 48.0, 44.0, 51.0, 35.0, 53.0, 54.0, 48.0, 40.0, 39.0, 32.0, 34.0, 31.0, 25.0, 32.0, 18.0, 18.0, 20.0, 16.0, 5.0, 6.0, 6.0, 5.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.14711350202560425, -0.14252473413944244, -0.13793596625328064, -0.13334721326828003, -0.12875844538211823, -0.12416967749595642, -0.11958090960979462, -0.11499214172363281, -0.1104033812880516, -0.1058146134018898, -0.1012258529663086, -0.09663708508014679, -0.09204831719398499, -0.08745955675840378, -0.08287078887224197, -0.07828202843666077, -0.07369326055049896, -0.06910449266433716, -0.06451573222875595, -0.05992696434259415, -0.05533820018172264, -0.050749436020851135, -0.04616066813468933, -0.041571903973817825, -0.03698313981294632, -0.032394375652074814, -0.02780560962855816, -0.023216843605041504, -0.018628079444169998, -0.014039315283298492, -0.009450549259781837, -0.0048617832362651825, -0.00027301907539367676, 0.004315746016800404, 0.008904511108994484, 0.013493276201188564, 0.018082041293382645, 0.02267080545425415, 0.027259571477770805, 0.03184833750128746, 0.036437101662158966, 0.04102586582303047, 0.04561462998390198, 0.05020339787006378, 0.05479216203093529, 0.05938092619180679, 0.0639696940779686, 0.0685584545135498, 0.07314722239971161, 0.07773599028587341, 0.08232475072145462, 0.08691351860761642, 0.09150227904319763, 0.09609104692935944, 0.10067981481552124, 0.10526858270168304, 0.10985734313726425, 0.11444611102342606, 0.11903487145900726, 0.12362363934516907, 0.12821240723133087, 0.13280117511749268, 0.1373899281024933, 0.1419786959886551, 0.1465674638748169]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 8.0, 16.0, 29.0, 31.0, 55.0, 89.0, 184.0, 493.0, 1479.0, 7633.0, 100200.0, 3854815.0, 212609.0, 13421.0, 2283.0, 575.0, 192.0, 81.0, 31.0, 25.0, 15.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0911865234375, -0.0887613296508789, -0.08633613586425781, -0.08391094207763672, -0.08148574829101562, -0.07906055450439453, -0.07663536071777344, -0.07421016693115234, -0.07178497314453125, -0.06935977935791016, -0.06693458557128906, -0.06450939178466797, -0.062084197998046875, -0.05965900421142578, -0.05723381042480469, -0.054808616638183594, -0.0523834228515625, -0.049958229064941406, -0.04753303527832031, -0.04510784149169922, -0.042682647705078125, -0.04025745391845703, -0.03783226013183594, -0.035407066345214844, -0.03298187255859375, -0.030556678771972656, -0.028131484985351562, -0.02570629119873047, -0.023281097412109375, -0.02085590362548828, -0.018430709838867188, -0.016005516052246094, -0.013580322265625, -0.011155128479003906, -0.008729934692382812, -0.006304740905761719, -0.003879547119140625, -0.0014543533325195312, 0.0009708404541015625, 0.0033960342407226562, 0.00582122802734375, 0.008246421813964844, 0.010671615600585938, 0.013096809387207031, 0.015522003173828125, 0.01794719696044922, 0.020372390747070312, 0.022797584533691406, 0.0252227783203125, 0.027647972106933594, 0.030073165893554688, 0.03249835968017578, 0.034923553466796875, 0.03734874725341797, 0.03977394104003906, 0.042199134826660156, 0.04462432861328125, 0.047049522399902344, 0.04947471618652344, 0.05189990997314453, 0.054325103759765625, 0.05675029754638672, 0.05917549133300781, 0.061600685119628906, 0.06402587890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 8.0, 29.0, 42.0, 61.0, 115.0, 126.0, 133.0, 129.0, 102.0, 79.0, 71.0, 50.0, 21.0, 19.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037841796875, -0.03689384460449219, -0.035945892333984375, -0.03499794006347656, -0.03404998779296875, -0.03310203552246094, -0.032154083251953125, -0.031206130981445312, -0.0302581787109375, -0.029310226440429688, -0.028362274169921875, -0.027414321899414062, -0.02646636962890625, -0.025518417358398438, -0.024570465087890625, -0.023622512817382812, -0.022674560546875, -0.021726608276367188, -0.020778656005859375, -0.019830703735351562, -0.01888275146484375, -0.017934799194335938, -0.016986846923828125, -0.016038894653320312, -0.0150909423828125, -0.014142990112304688, -0.013195037841796875, -0.012247085571289062, -0.01129913330078125, -0.010351181030273438, -0.009403228759765625, -0.008455276489257812, -0.00750732421875, -0.0065593719482421875, -0.005611419677734375, -0.0046634674072265625, -0.00371551513671875, -0.0027675628662109375, -0.001819610595703125, -0.0008716583251953125, 7.62939453125e-05, 0.0010242462158203125, 0.001972198486328125, 0.0029201507568359375, 0.00386810302734375, 0.0048160552978515625, 0.005764007568359375, 0.0067119598388671875, 0.007659912109375, 0.008607864379882812, 0.009555816650390625, 0.010503768920898438, 0.01145172119140625, 0.012399673461914062, 0.013347625732421875, 0.014295578002929688, 0.0152435302734375, 0.016191482543945312, 0.017139434814453125, 0.018087387084960938, 0.01903533935546875, 0.019983291625976562, 0.020931243896484375, 0.021879196166992188, 0.0228271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 9.0, 6.0, 9.0, 11.0, 20.0, 35.0, 61.0, 94.0, 172.0, 264.0, 477.0, 952.0, 1853.0, 4172.0, 11235.0, 42059.0, 235356.0, 2844409.0, 913693.0, 103905.0, 22639.0, 7099.0, 2779.0, 1373.0, 740.0, 355.0, 210.0, 112.0, 75.0, 36.0, 25.0, 17.0, 9.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.04132080078125, -0.040097713470458984, -0.03887462615966797, -0.03765153884887695, -0.03642845153808594, -0.03520536422729492, -0.033982276916503906, -0.03275918960571289, -0.031536102294921875, -0.03031301498413086, -0.029089927673339844, -0.027866840362548828, -0.026643753051757812, -0.025420665740966797, -0.02419757843017578, -0.022974491119384766, -0.02175140380859375, -0.020528316497802734, -0.01930522918701172, -0.018082141876220703, -0.016859054565429688, -0.015635967254638672, -0.014412879943847656, -0.01318979263305664, -0.011966705322265625, -0.01074361801147461, -0.009520530700683594, -0.008297443389892578, -0.0070743560791015625, -0.005851268768310547, -0.004628181457519531, -0.0034050941467285156, -0.0021820068359375, -0.0009589195251464844, 0.00026416778564453125, 0.0014872550964355469, 0.0027103424072265625, 0.003933429718017578, 0.005156517028808594, 0.006379604339599609, 0.007602691650390625, 0.00882577896118164, 0.010048866271972656, 0.011271953582763672, 0.012495040893554688, 0.013718128204345703, 0.014941215515136719, 0.016164302825927734, 0.01738739013671875, 0.018610477447509766, 0.01983356475830078, 0.021056652069091797, 0.022279739379882812, 0.023502826690673828, 0.024725914001464844, 0.02594900131225586, 0.027172088623046875, 0.02839517593383789, 0.029618263244628906, 0.030841350555419922, 0.03206443786621094, 0.03328752517700195, 0.03451061248779297, 0.035733699798583984, 0.036956787109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 9.0, 12.0, 11.0, 29.0, 29.0, 44.0, 54.0, 87.0, 93.0, 134.0, 208.0, 340.0, 596.0, 815.0, 549.0, 332.0, 198.0, 144.0, 103.0, 79.0, 49.0, 33.0, 31.0, 21.0, 16.0, 10.0, 7.0, 5.0, 5.0, 11.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.031097412109375, -0.03022027015686035, -0.029343128204345703, -0.028465986251831055, -0.027588844299316406, -0.026711702346801758, -0.02583456039428711, -0.02495741844177246, -0.024080276489257812, -0.023203134536743164, -0.022325992584228516, -0.021448850631713867, -0.02057170867919922, -0.01969456672668457, -0.018817424774169922, -0.017940282821655273, -0.017063140869140625, -0.016185998916625977, -0.015308856964111328, -0.01443171501159668, -0.013554573059082031, -0.012677431106567383, -0.011800289154052734, -0.010923147201538086, -0.010046005249023438, -0.009168863296508789, -0.00829172134399414, -0.007414579391479492, -0.006537437438964844, -0.005660295486450195, -0.004783153533935547, -0.0039060115814208984, -0.00302886962890625, -0.0021517276763916016, -0.0012745857238769531, -0.0003974437713623047, 0.00047969818115234375, 0.0013568401336669922, 0.0022339820861816406, 0.003111124038696289, 0.0039882659912109375, 0.004865407943725586, 0.005742549896240234, 0.006619691848754883, 0.007496833801269531, 0.00837397575378418, 0.009251117706298828, 0.010128259658813477, 0.011005401611328125, 0.011882543563842773, 0.012759685516357422, 0.01363682746887207, 0.014513969421386719, 0.015391111373901367, 0.016268253326416016, 0.017145395278930664, 0.018022537231445312, 0.01889967918395996, 0.01977682113647461, 0.020653963088989258, 0.021531105041503906, 0.022408246994018555, 0.023285388946533203, 0.02416253089904785, 0.0250396728515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 19.0, 45.0, 103.0, 202.0, 275.0, 196.0, 100.0, 34.0, 13.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.365337073802948, -0.35331130027770996, -0.3412855267524719, -0.3292597532272339, -0.31723397970199585, -0.3052082061767578, -0.2931824326515198, -0.28115662932395935, -0.2691308557987213, -0.2571050822734833, -0.24507930874824524, -0.2330535352230072, -0.22102774679660797, -0.20900197327136993, -0.1969761997461319, -0.18495041131973267, -0.17292465269565582, -0.16089887917041779, -0.14887310564517975, -0.13684731721878052, -0.12482154369354248, -0.11279577016830444, -0.1007699966430664, -0.08874421566724777, -0.07671844214200974, -0.0646926686167717, -0.052666887640953064, -0.04064111411571503, -0.02861533686518669, -0.016589559614658356, -0.004563786089420319, 0.007461994886398315, 0.019487768411636353, 0.03151354566216469, 0.043539322912693024, 0.05556509643793106, 0.0675908774137497, 0.07961665093898773, 0.09164242446422577, 0.1036682054400444, 0.11569397896528244, 0.12771975994110107, 0.1397455334663391, 0.15177130699157715, 0.16379708051681519, 0.17582285404205322, 0.18784862756729126, 0.1998744159936905, 0.21190018951892853, 0.22392596304416656, 0.2359517365694046, 0.24797752499580383, 0.26000329852104187, 0.2720290720462799, 0.28405484557151794, 0.296080619096756, 0.308106392621994, 0.32013216614723206, 0.3321579396724701, 0.34418371319770813, 0.35620948672294617, 0.3682352900505066, 0.38026106357574463, 0.39228683710098267, 0.4043126106262207]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 17.0, 14.0, 17.0, 18.0, 15.0, 26.0, 34.0, 30.0, 30.0, 37.0, 35.0, 31.0, 43.0, 42.0, 57.0, 45.0, 38.0, 46.0, 46.0, 44.0, 47.0, 37.0, 31.0, 30.0, 31.0, 30.0, 21.0, 12.0, 13.0, 11.0, 8.0, 11.0, 13.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10475194454193115, -0.10175108164548874, -0.09875021874904633, -0.09574934840202332, -0.0927484855055809, -0.08974762260913849, -0.08674675226211548, -0.08374588936567307, -0.08074502646923065, -0.07774416357278824, -0.07474330067634583, -0.07174243032932281, -0.0687415674328804, -0.06574070453643799, -0.06273983418941498, -0.059738971292972565, -0.05673810839653015, -0.05373724550008774, -0.050736378878355026, -0.047735512256622314, -0.0447346493601799, -0.04173378646373749, -0.038732919842004776, -0.035732053220272064, -0.03273119032382965, -0.02973032556474209, -0.026729460805654526, -0.023728596046566963, -0.0207277312874794, -0.017726866528391838, -0.014726001769304276, -0.011725137010216713, -0.00872427225112915, -0.005723407492041588, -0.0027225427329540253, 0.0002783220261335373, 0.0032791867852211, 0.006280051544308662, 0.009280916303396225, 0.012281781062483788, 0.01528264582157135, 0.018283510580658913, 0.021284375339746475, 0.024285240098834038, 0.0272861048579216, 0.030286969617009163, 0.033287834376096725, 0.03628870099782944, 0.03928956389427185, 0.042290426790714264, 0.045291293412446976, 0.04829216003417969, 0.0512930229306221, 0.054293885827064514, 0.057294752448797226, 0.06029561907052994, 0.06329648196697235, 0.06629734486341476, 0.06929820775985718, 0.07229907810688019, 0.0752999410033226, 0.07830080389976501, 0.08130167424678802, 0.08430253714323044, 0.08730340003967285]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 16.0, 23.0, 36.0, 52.0, 102.0, 176.0, 317.0, 598.0, 1430.0, 5764.0, 50008.0, 599285.0, 358443.0, 26388.0, 3778.0, 1041.0, 503.0, 238.0, 143.0, 71.0, 44.0, 21.0, 18.0, 13.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14111328125, -0.13681983947753906, -0.13252639770507812, -0.1282329559326172, -0.12393951416015625, -0.11964607238769531, -0.11535263061523438, -0.11105918884277344, -0.1067657470703125, -0.10247230529785156, -0.09817886352539062, -0.09388542175292969, -0.08959197998046875, -0.08529853820800781, -0.08100509643554688, -0.07671165466308594, -0.072418212890625, -0.06812477111816406, -0.06383132934570312, -0.05953788757324219, -0.05524444580078125, -0.05095100402832031, -0.046657562255859375, -0.04236412048339844, -0.0380706787109375, -0.03377723693847656, -0.029483795166015625, -0.025190353393554688, -0.02089691162109375, -0.016603469848632812, -0.012310028076171875, -0.008016586303710938, -0.00372314453125, 0.0005702972412109375, 0.004863739013671875, 0.009157180786132812, 0.01345062255859375, 0.017744064331054688, 0.022037506103515625, 0.026330947875976562, 0.0306243896484375, 0.03491783142089844, 0.039211273193359375, 0.04350471496582031, 0.04779815673828125, 0.05209159851074219, 0.056385040283203125, 0.06067848205566406, 0.064971923828125, 0.06926536560058594, 0.07355880737304688, 0.07785224914550781, 0.08214569091796875, 0.08643913269042969, 0.09073257446289062, 0.09502601623535156, 0.0993194580078125, 0.10361289978027344, 0.10790634155273438, 0.11219978332519531, 0.11649322509765625, 0.12078666687011719, 0.12508010864257812, 0.12937355041503906, 0.1336669921875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 13.0, 23.0, 55.0, 63.0, 105.0, 112.0, 144.0, 129.0, 107.0, 74.0, 69.0, 49.0, 31.0, 10.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.037872314453125, -0.03689837455749512, -0.035924434661865234, -0.03495049476623535, -0.03397655487060547, -0.033002614974975586, -0.0320286750793457, -0.03105473518371582, -0.030080795288085938, -0.029106855392456055, -0.028132915496826172, -0.02715897560119629, -0.026185035705566406, -0.025211095809936523, -0.02423715591430664, -0.023263216018676758, -0.022289276123046875, -0.021315336227416992, -0.02034139633178711, -0.019367456436157227, -0.018393516540527344, -0.01741957664489746, -0.016445636749267578, -0.015471696853637695, -0.014497756958007812, -0.01352381706237793, -0.012549877166748047, -0.011575937271118164, -0.010601997375488281, -0.009628057479858398, -0.008654117584228516, -0.007680177688598633, -0.00670623779296875, -0.005732297897338867, -0.004758358001708984, -0.0037844181060791016, -0.0028104782104492188, -0.001836538314819336, -0.0008625984191894531, 0.00011134147644042969, 0.0010852813720703125, 0.0020592212677001953, 0.003033161163330078, 0.004007101058959961, 0.004981040954589844, 0.0059549808502197266, 0.006928920745849609, 0.007902860641479492, 0.008876800537109375, 0.009850740432739258, 0.01082468032836914, 0.011798620223999023, 0.012772560119628906, 0.013746500015258789, 0.014720439910888672, 0.015694379806518555, 0.016668319702148438, 0.01764225959777832, 0.018616199493408203, 0.019590139389038086, 0.02056407928466797, 0.02153801918029785, 0.022511959075927734, 0.023485898971557617, 0.0244598388671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 15.0, 19.0, 32.0, 61.0, 113.0, 178.0, 434.0, 1096.0, 3153.0, 10012.0, 36912.0, 156167.0, 467567.0, 280690.0, 67202.0, 17073.0, 5009.0, 1665.0, 606.0, 249.0, 114.0, 84.0, 44.0, 24.0, 14.0, 9.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.06188201904296875, -0.0597991943359375, -0.05771636962890625, -0.055633544921875, -0.05355072021484375, -0.0514678955078125, -0.04938507080078125, -0.04730224609375, -0.04521942138671875, -0.0431365966796875, -0.04105377197265625, -0.038970947265625, -0.03688812255859375, -0.0348052978515625, -0.03272247314453125, -0.0306396484375, -0.02855682373046875, -0.0264739990234375, -0.02439117431640625, -0.022308349609375, -0.02022552490234375, -0.0181427001953125, -0.01605987548828125, -0.01397705078125, -0.01189422607421875, -0.0098114013671875, -0.00772857666015625, -0.005645751953125, -0.00356292724609375, -0.0014801025390625, 0.00060272216796875, 0.002685546875, 0.00476837158203125, 0.0068511962890625, 0.00893402099609375, 0.011016845703125, 0.01309967041015625, 0.0151824951171875, 0.01726531982421875, 0.01934814453125, 0.02143096923828125, 0.0235137939453125, 0.02559661865234375, 0.027679443359375, 0.02976226806640625, 0.0318450927734375, 0.03392791748046875, 0.0360107421875, 0.03809356689453125, 0.0401763916015625, 0.04225921630859375, 0.044342041015625, 0.04642486572265625, 0.0485076904296875, 0.05059051513671875, 0.05267333984375, 0.05475616455078125, 0.0568389892578125, 0.05892181396484375, 0.061004638671875, 0.06308746337890625, 0.0651702880859375, 0.06725311279296875, 0.0693359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 18.0, 12.0, 24.0, 20.0, 28.0, 29.0, 41.0, 31.0, 40.0, 44.0, 51.0, 47.0, 51.0, 49.0, 48.0, 65.0, 50.0, 46.0, 39.0, 34.0, 38.0, 34.0, 23.0, 17.0, 24.0, 13.0, 16.0, 12.0, 10.0, 10.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.051910400390625, -0.05044364929199219, -0.048976898193359375, -0.04751014709472656, -0.04604339599609375, -0.04457664489746094, -0.043109893798828125, -0.04164314270019531, -0.0401763916015625, -0.03870964050292969, -0.037242889404296875, -0.03577613830566406, -0.03430938720703125, -0.03284263610839844, -0.031375885009765625, -0.029909133911132812, -0.0284423828125, -0.026975631713867188, -0.025508880615234375, -0.024042129516601562, -0.02257537841796875, -0.021108627319335938, -0.019641876220703125, -0.018175125122070312, -0.0167083740234375, -0.015241622924804688, -0.013774871826171875, -0.012308120727539062, -0.01084136962890625, -0.009374618530273438, -0.007907867431640625, -0.0064411163330078125, -0.004974365234375, -0.0035076141357421875, -0.002040863037109375, -0.0005741119384765625, 0.00089263916015625, 0.0023593902587890625, 0.003826141357421875, 0.0052928924560546875, 0.0067596435546875, 0.008226394653320312, 0.009693145751953125, 0.011159896850585938, 0.01262664794921875, 0.014093399047851562, 0.015560150146484375, 0.017026901245117188, 0.01849365234375, 0.019960403442382812, 0.021427154541015625, 0.022893905639648438, 0.02436065673828125, 0.025827407836914062, 0.027294158935546875, 0.028760910034179688, 0.0302276611328125, 0.03169441223144531, 0.033161163330078125, 0.03462791442871094, 0.03609466552734375, 0.03756141662597656, 0.039028167724609375, 0.04049491882324219, 0.041961669921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 11.0, 6.0, 23.0, 30.0, 51.0, 80.0, 108.0, 145.0, 249.0, 376.0, 623.0, 1109.0, 1935.0, 3400.0, 6456.0, 13911.0, 32219.0, 86741.0, 249403.0, 389191.0, 161322.0, 57418.0, 22468.0, 9833.0, 4944.0, 2691.0, 1483.0, 834.0, 539.0, 361.0, 222.0, 130.0, 79.0, 45.0, 37.0, 31.0, 14.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.024810791015625, -0.023991823196411133, -0.023172855377197266, -0.0223538875579834, -0.02153491973876953, -0.020715951919555664, -0.019896984100341797, -0.01907801628112793, -0.018259048461914062, -0.017440080642700195, -0.016621112823486328, -0.01580214500427246, -0.014983177185058594, -0.014164209365844727, -0.01334524154663086, -0.012526273727416992, -0.011707305908203125, -0.010888338088989258, -0.01006937026977539, -0.009250402450561523, -0.008431434631347656, -0.007612466812133789, -0.006793498992919922, -0.005974531173706055, -0.0051555633544921875, -0.00433659553527832, -0.003517627716064453, -0.002698659896850586, -0.0018796920776367188, -0.0010607242584228516, -0.00024175643920898438, 0.0005772113800048828, 0.00139617919921875, 0.002215147018432617, 0.0030341148376464844, 0.0038530826568603516, 0.004672050476074219, 0.005491018295288086, 0.006309986114501953, 0.00712895393371582, 0.007947921752929688, 0.008766889572143555, 0.009585857391357422, 0.010404825210571289, 0.011223793029785156, 0.012042760848999023, 0.01286172866821289, 0.013680696487426758, 0.014499664306640625, 0.015318632125854492, 0.01613759994506836, 0.016956567764282227, 0.017775535583496094, 0.01859450340270996, 0.019413471221923828, 0.020232439041137695, 0.021051406860351562, 0.02187037467956543, 0.022689342498779297, 0.023508310317993164, 0.02432727813720703, 0.0251462459564209, 0.025965213775634766, 0.026784181594848633, 0.0276031494140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 6.0, 10.0, 12.0, 12.0, 16.0, 22.0, 24.0, 28.0, 30.0, 34.0, 44.0, 36.0, 51.0, 79.0, 70.0, 72.0, 53.0, 62.0, 58.0, 48.0, 45.0, 50.0, 18.0, 27.0, 18.0, 11.0, 8.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3365020751953125e-05, -2.2436492145061493e-05, -2.150796353816986e-05, -2.057943493127823e-05, -1.9650906324386597e-05, -1.8722377717494965e-05, -1.7793849110603333e-05, -1.68653205037117e-05, -1.593679189682007e-05, -1.5008263289928436e-05, -1.4079734683036804e-05, -1.3151206076145172e-05, -1.222267746925354e-05, -1.1294148862361908e-05, -1.0365620255470276e-05, -9.437091648578644e-06, -8.508563041687012e-06, -7.58003443479538e-06, -6.6515058279037476e-06, -5.7229772210121155e-06, -4.794448614120483e-06, -3.865920007228851e-06, -2.9373914003372192e-06, -2.008862793445587e-06, -1.080334186553955e-06, -1.51805579662323e-07, 7.767230272293091e-07, 1.7052516341209412e-06, 2.6337802410125732e-06, 3.5623088479042053e-06, 4.490837454795837e-06, 5.4193660616874695e-06, 6.3478946685791016e-06, 7.276423275470734e-06, 8.204951882362366e-06, 9.133480489253998e-06, 1.006200909614563e-05, 1.0990537703037262e-05, 1.1919066309928894e-05, 1.2847594916820526e-05, 1.3776123523712158e-05, 1.470465213060379e-05, 1.5633180737495422e-05, 1.6561709344387054e-05, 1.7490237951278687e-05, 1.841876655817032e-05, 1.934729516506195e-05, 2.0275823771953583e-05, 2.1204352378845215e-05, 2.2132880985736847e-05, 2.306140959262848e-05, 2.398993819952011e-05, 2.4918466806411743e-05, 2.5846995413303375e-05, 2.6775524020195007e-05, 2.770405262708664e-05, 2.863258123397827e-05, 2.9561109840869904e-05, 3.0489638447761536e-05, 3.141816705465317e-05, 3.23466956615448e-05, 3.327522426843643e-05, 3.4203752875328064e-05, 3.5132281482219696e-05, 3.606081008911133e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 9.0, 10.0, 26.0, 39.0, 73.0, 106.0, 253.0, 576.0, 1391.0, 3710.0, 11234.0, 39626.0, 171706.0, 553234.0, 201352.0, 45540.0, 12742.0, 4190.0, 1526.0, 639.0, 267.0, 130.0, 59.0, 31.0, 26.0, 13.0, 6.0, 8.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04278564453125, -0.04158210754394531, -0.040378570556640625, -0.03917503356933594, -0.03797149658203125, -0.03676795959472656, -0.035564422607421875, -0.03436088562011719, -0.0331573486328125, -0.03195381164550781, -0.030750274658203125, -0.029546737670898438, -0.02834320068359375, -0.027139663696289062, -0.025936126708984375, -0.024732589721679688, -0.023529052734375, -0.022325515747070312, -0.021121978759765625, -0.019918441772460938, -0.01871490478515625, -0.017511367797851562, -0.016307830810546875, -0.015104293823242188, -0.0139007568359375, -0.012697219848632812, -0.011493682861328125, -0.010290145874023438, -0.00908660888671875, -0.007883071899414062, -0.006679534912109375, -0.0054759979248046875, -0.0042724609375, -0.0030689239501953125, -0.001865386962890625, -0.0006618499755859375, 0.00054168701171875, 0.0017452239990234375, 0.002948760986328125, 0.0041522979736328125, 0.0053558349609375, 0.0065593719482421875, 0.007762908935546875, 0.008966445922851562, 0.01016998291015625, 0.011373519897460938, 0.012577056884765625, 0.013780593872070312, 0.014984130859375, 0.016187667846679688, 0.017391204833984375, 0.018594741821289062, 0.01979827880859375, 0.021001815795898438, 0.022205352783203125, 0.023408889770507812, 0.0246124267578125, 0.025815963745117188, 0.027019500732421875, 0.028223037719726562, 0.02942657470703125, 0.030630111694335938, 0.031833648681640625, 0.03303718566894531, 0.03424072265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 10.0, 11.0, 6.0, 17.0, 13.0, 16.0, 19.0, 21.0, 37.0, 41.0, 38.0, 57.0, 74.0, 65.0, 84.0, 89.0, 62.0, 68.0, 56.0, 35.0, 21.0, 28.0, 17.0, 21.0, 15.0, 13.0, 7.0, 8.0, 6.0, 10.0, 2.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02728271484375, -0.026511669158935547, -0.025740623474121094, -0.02496957778930664, -0.024198532104492188, -0.023427486419677734, -0.02265644073486328, -0.021885395050048828, -0.021114349365234375, -0.020343303680419922, -0.01957225799560547, -0.018801212310791016, -0.018030166625976562, -0.01725912094116211, -0.016488075256347656, -0.015717029571533203, -0.01494598388671875, -0.014174938201904297, -0.013403892517089844, -0.01263284683227539, -0.011861801147460938, -0.011090755462646484, -0.010319709777832031, -0.009548664093017578, -0.008777618408203125, -0.008006572723388672, -0.007235527038574219, -0.006464481353759766, -0.0056934356689453125, -0.004922389984130859, -0.004151344299316406, -0.003380298614501953, -0.0026092529296875, -0.0018382072448730469, -0.0010671615600585938, -0.0002961158752441406, 0.0004749298095703125, 0.0012459754943847656, 0.0020170211791992188, 0.002788066864013672, 0.003559112548828125, 0.004330158233642578, 0.005101203918457031, 0.005872249603271484, 0.0066432952880859375, 0.007414340972900391, 0.008185386657714844, 0.008956432342529297, 0.00972747802734375, 0.010498523712158203, 0.011269569396972656, 0.01204061508178711, 0.012811660766601562, 0.013582706451416016, 0.014353752136230469, 0.015124797821044922, 0.015895843505859375, 0.016666889190673828, 0.01743793487548828, 0.018208980560302734, 0.018980026245117188, 0.01975107192993164, 0.020522117614746094, 0.021293163299560547, 0.022064208984375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 16.0, 28.0, 77.0, 198.0, 270.0, 234.0, 115.0, 41.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5151578187942505, -0.4925801753997803, -0.47000253200531006, -0.44742491841316223, -0.424847275018692, -0.4022696316242218, -0.379692018032074, -0.35711437463760376, -0.33453673124313354, -0.31195908784866333, -0.2893814444541931, -0.2668038308620453, -0.24422618746757507, -0.22164854407310486, -0.19907091557979584, -0.17649328708648682, -0.1539156436920166, -0.1313380002975464, -0.10876037180423737, -0.08618273586034775, -0.06360509991645813, -0.04102746397256851, -0.018449828028678894, 0.004127800464630127, 0.026705443859100342, 0.04928307980298996, 0.07186071574687958, 0.0944383516907692, 0.11701598763465881, 0.13959363102912903, 0.16217125952243805, 0.18474888801574707, 0.20732659101486206, 0.22990423440933228, 0.2524818778038025, 0.2750594913959503, 0.29763713479042053, 0.32021477818489075, 0.3427923917770386, 0.3653700351715088, 0.387947678565979, 0.4105253219604492, 0.43310296535491943, 0.45568057894706726, 0.4782582223415375, 0.5008358359336853, 0.5234134793281555, 0.5459911227226257, 0.568568766117096, 0.5911464095115662, 0.6137240529060364, 0.6363016963005066, 0.658879280090332, 0.6814569234848022, 0.7040345668792725, 0.7266122102737427, 0.7491898536682129, 0.7717674970626831, 0.7943451404571533, 0.8169227838516235, 0.8395004272460938, 0.8620780110359192, 0.8846556544303894, 0.9072332978248596, 0.9298109412193298]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 5.0, 6.0, 13.0, 9.0, 16.0, 16.0, 17.0, 20.0, 26.0, 15.0, 30.0, 22.0, 35.0, 35.0, 33.0, 45.0, 38.0, 43.0, 43.0, 45.0, 47.0, 51.0, 46.0, 33.0, 39.0, 39.0, 25.0, 31.0, 30.0, 18.0, 15.0, 21.0, 16.0, 16.0, 12.0, 13.0, 10.0, 8.0, 3.0, 4.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13818055391311646, -0.13354575634002686, -0.12891094386577606, -0.12427613884210587, -0.11964133381843567, -0.11500652879476547, -0.11037172377109528, -0.10573691874742508, -0.10110211372375488, -0.09646730870008469, -0.09183250367641449, -0.0871976986527443, -0.0825628936290741, -0.0779280886054039, -0.0732932835817337, -0.06865847855806351, -0.06402367353439331, -0.059388868510723114, -0.05475406348705292, -0.05011925846338272, -0.045484453439712524, -0.04084964841604233, -0.03621484339237213, -0.031580038368701935, -0.02694523334503174, -0.022310428321361542, -0.017675623297691345, -0.013040818274021149, -0.008406013250350952, -0.0037712082266807556, 0.0008635967969894409, 0.0054984018206596375, 0.010133206844329834, 0.01476801186800003, 0.019402816891670227, 0.024037621915340424, 0.02867242693901062, 0.03330723196268082, 0.03794203698635101, 0.04257684201002121, 0.047211647033691406, 0.0518464520573616, 0.0564812570810318, 0.061116062104701996, 0.06575086712837219, 0.07038567215204239, 0.07502047717571259, 0.07965528219938278, 0.08429008722305298, 0.08892489224672318, 0.09355969727039337, 0.09819450229406357, 0.10282930731773376, 0.10746411234140396, 0.11209891736507416, 0.11673372238874435, 0.12136852741241455, 0.12600332498550415, 0.13063813745975494, 0.13527294993400574, 0.13990774750709534, 0.14454254508018494, 0.14917735755443573, 0.15381217002868652, 0.15844696760177612]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 2.0, 4.0, 10.0, 8.0, 8.0, 21.0, 32.0, 52.0, 86.0, 161.0, 363.0, 870.0, 2876.0, 14226.0, 135004.0, 3560913.0, 440714.0, 31132.0, 5578.0, 1419.0, 427.0, 185.0, 91.0, 52.0, 17.0, 8.0, 11.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08447265625, -0.08239603042602539, -0.08031940460205078, -0.07824277877807617, -0.07616615295410156, -0.07408952713012695, -0.07201290130615234, -0.06993627548217773, -0.06785964965820312, -0.06578302383422852, -0.0637063980102539, -0.0616297721862793, -0.05955314636230469, -0.05747652053833008, -0.05539989471435547, -0.05332326889038086, -0.05124664306640625, -0.04917001724243164, -0.04709339141845703, -0.04501676559448242, -0.04294013977050781, -0.0408635139465332, -0.038786888122558594, -0.036710262298583984, -0.034633636474609375, -0.032557010650634766, -0.030480384826660156, -0.028403759002685547, -0.026327133178710938, -0.024250507354736328, -0.02217388153076172, -0.02009725570678711, -0.0180206298828125, -0.01594400405883789, -0.013867378234863281, -0.011790752410888672, -0.009714126586914062, -0.007637500762939453, -0.005560874938964844, -0.0034842491149902344, -0.001407623291015625, 0.0006690025329589844, 0.0027456283569335938, 0.004822254180908203, 0.0068988800048828125, 0.008975505828857422, 0.011052131652832031, 0.01312875747680664, 0.01520538330078125, 0.01728200912475586, 0.01935863494873047, 0.021435260772705078, 0.023511886596679688, 0.025588512420654297, 0.027665138244628906, 0.029741764068603516, 0.031818389892578125, 0.033895015716552734, 0.035971641540527344, 0.03804826736450195, 0.04012489318847656, 0.04220151901245117, 0.04427814483642578, 0.04635477066040039, 0.048431396484375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 10.0, 6.0, 28.0, 35.0, 57.0, 62.0, 89.0, 100.0, 106.0, 112.0, 92.0, 99.0, 65.0, 50.0, 40.0, 23.0, 15.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03948974609375, -0.03850269317626953, -0.03751564025878906, -0.036528587341308594, -0.035541534423828125, -0.034554481506347656, -0.03356742858886719, -0.03258037567138672, -0.03159332275390625, -0.03060626983642578, -0.029619216918945312, -0.028632164001464844, -0.027645111083984375, -0.026658058166503906, -0.025671005249023438, -0.02468395233154297, -0.0236968994140625, -0.02270984649658203, -0.021722793579101562, -0.020735740661621094, -0.019748687744140625, -0.018761634826660156, -0.017774581909179688, -0.01678752899169922, -0.01580047607421875, -0.014813423156738281, -0.013826370239257812, -0.012839317321777344, -0.011852264404296875, -0.010865211486816406, -0.009878158569335938, -0.008891105651855469, -0.007904052734375, -0.006916999816894531, -0.0059299468994140625, -0.004942893981933594, -0.003955841064453125, -0.0029687881469726562, -0.0019817352294921875, -0.0009946823120117188, -7.62939453125e-06, 0.0009794235229492188, 0.0019664764404296875, 0.0029535293579101562, 0.003940582275390625, 0.004927635192871094, 0.0059146881103515625, 0.006901741027832031, 0.0078887939453125, 0.008875846862792969, 0.009862899780273438, 0.010849952697753906, 0.011837005615234375, 0.012824058532714844, 0.013811111450195312, 0.014798164367675781, 0.01578521728515625, 0.01677227020263672, 0.017759323120117188, 0.018746376037597656, 0.019733428955078125, 0.020720481872558594, 0.021707534790039062, 0.02269458770751953, 0.023681640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 7.0, 17.0, 28.0, 40.0, 76.0, 110.0, 187.0, 312.0, 619.0, 1069.0, 2315.0, 5305.0, 14000.0, 45887.0, 189008.0, 1515153.0, 2105181.0, 232922.0, 54518.0, 16392.0, 6020.0, 2429.0, 1214.0, 633.0, 327.0, 191.0, 118.0, 60.0, 36.0, 36.0, 22.0, 10.0, 10.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.031597137451171875, -0.03050994873046875, -0.029422760009765625, -0.0283355712890625, -0.027248382568359375, -0.02616119384765625, -0.025074005126953125, -0.02398681640625, -0.022899627685546875, -0.02181243896484375, -0.020725250244140625, -0.0196380615234375, -0.018550872802734375, -0.01746368408203125, -0.016376495361328125, -0.015289306640625, -0.014202117919921875, -0.01311492919921875, -0.012027740478515625, -0.0109405517578125, -0.009853363037109375, -0.00876617431640625, -0.007678985595703125, -0.006591796875, -0.005504608154296875, -0.00441741943359375, -0.003330230712890625, -0.0022430419921875, -0.001155853271484375, -6.866455078125e-05, 0.001018524169921875, 0.002105712890625, 0.003192901611328125, 0.00428009033203125, 0.005367279052734375, 0.0064544677734375, 0.007541656494140625, 0.00862884521484375, 0.009716033935546875, 0.01080322265625, 0.011890411376953125, 0.01297760009765625, 0.014064788818359375, 0.0151519775390625, 0.016239166259765625, 0.01732635498046875, 0.018413543701171875, 0.019500732421875, 0.020587921142578125, 0.02167510986328125, 0.022762298583984375, 0.0238494873046875, 0.024936676025390625, 0.02602386474609375, 0.027111053466796875, 0.0281982421875, 0.029285430908203125, 0.03037261962890625, 0.031459808349609375, 0.0325469970703125, 0.033634185791015625, 0.03472137451171875, 0.035808563232421875, 0.036895751953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 12.0, 16.0, 22.0, 36.0, 33.0, 51.0, 66.0, 88.0, 110.0, 170.0, 276.0, 482.0, 762.0, 635.0, 397.0, 230.0, 182.0, 129.0, 96.0, 60.0, 40.0, 35.0, 27.0, 22.0, 17.0, 19.0, 11.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029449462890625, -0.028578996658325195, -0.02770853042602539, -0.026838064193725586, -0.02596759796142578, -0.025097131729125977, -0.024226665496826172, -0.023356199264526367, -0.022485733032226562, -0.021615266799926758, -0.020744800567626953, -0.01987433433532715, -0.019003868103027344, -0.01813340187072754, -0.017262935638427734, -0.01639246940612793, -0.015522003173828125, -0.01465153694152832, -0.013781070709228516, -0.012910604476928711, -0.012040138244628906, -0.011169672012329102, -0.010299205780029297, -0.009428739547729492, -0.008558273315429688, -0.007687807083129883, -0.006817340850830078, -0.0059468746185302734, -0.005076408386230469, -0.004205942153930664, -0.0033354759216308594, -0.0024650096893310547, -0.00159454345703125, -0.0007240772247314453, 0.00014638900756835938, 0.001016855239868164, 0.0018873214721679688, 0.0027577877044677734, 0.003628253936767578, 0.004498720169067383, 0.0053691864013671875, 0.006239652633666992, 0.007110118865966797, 0.007980585098266602, 0.008851051330566406, 0.009721517562866211, 0.010591983795166016, 0.01146245002746582, 0.012332916259765625, 0.01320338249206543, 0.014073848724365234, 0.014944314956665039, 0.015814781188964844, 0.01668524742126465, 0.017555713653564453, 0.018426179885864258, 0.019296646118164062, 0.020167112350463867, 0.021037578582763672, 0.021908044815063477, 0.02277851104736328, 0.023648977279663086, 0.02451944351196289, 0.025389909744262695, 0.0262603759765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 27.0, 82.0, 144.0, 235.0, 236.0, 151.0, 69.0, 33.0, 10.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3945617079734802, -0.38248586654663086, -0.3704100251197815, -0.35833415389060974, -0.3462583124637604, -0.334182471036911, -0.32210659980773926, -0.3100307583808899, -0.2979549169540405, -0.28587907552719116, -0.2738032341003418, -0.26172736287117004, -0.24965152144432068, -0.2375756800174713, -0.22549982368946075, -0.2134239673614502, -0.20134812593460083, -0.18927228450775146, -0.1771964281797409, -0.16512057185173035, -0.15304473042488098, -0.14096888899803162, -0.12889303267002106, -0.1168171837925911, -0.10474133491516113, -0.09266548603773117, -0.08058963716030121, -0.06851378828287125, -0.056437939405441284, -0.04436209052801132, -0.03228624165058136, -0.020210392773151398, -0.008134543895721436, 0.003941304981708527, 0.01601715385913849, 0.02809300273656845, 0.04016885161399841, 0.052244700491428375, 0.06432054936885834, 0.0763963982462883, 0.08847224712371826, 0.10054809600114822, 0.11262394487857819, 0.12469979375600815, 0.1367756426334381, 0.14885148406028748, 0.16092734038829803, 0.1730031967163086, 0.18507903814315796, 0.19715487957000732, 0.20923073589801788, 0.22130659222602844, 0.2333824336528778, 0.24545827507972717, 0.2575341463088989, 0.2696099877357483, 0.28168582916259766, 0.293761670589447, 0.3058375120162964, 0.31791338324546814, 0.3299892246723175, 0.34206506609916687, 0.3541409373283386, 0.366216778755188, 0.37829262018203735]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 3.0, 13.0, 9.0, 13.0, 22.0, 18.0, 21.0, 27.0, 30.0, 31.0, 40.0, 39.0, 53.0, 52.0, 56.0, 47.0, 52.0, 46.0, 48.0, 52.0, 52.0, 41.0, 37.0, 38.0, 25.0, 20.0, 25.0, 27.0, 15.0, 19.0, 6.0, 6.0, 3.0, 5.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.1480148434638977, -0.14447817206382751, -0.14094151556491852, -0.13740484416484833, -0.13386818766593933, -0.13033151626586914, -0.12679485976696014, -0.12325818836688995, -0.11972152441740036, -0.11618486046791077, -0.11264819651842117, -0.10911153256893158, -0.10557486116886139, -0.10203820466995239, -0.0985015332698822, -0.09496486932039261, -0.09142820537090302, -0.08789154142141342, -0.08435487747192383, -0.08081821352243423, -0.07728154957294464, -0.07374487817287445, -0.07020821422338486, -0.06667155027389526, -0.06313488632440567, -0.05959822237491608, -0.05606155842542648, -0.05252489075064659, -0.048988226801157, -0.045451562851667404, -0.04191489517688751, -0.03837823122739792, -0.034841567277908325, -0.03130490332841873, -0.02776823751628399, -0.024231571704149246, -0.020694907754659653, -0.01715824380517006, -0.013621577993035316, -0.010084912180900574, -0.00654824823141098, -0.003011583350598812, 0.000525081530213356, 0.004061746411025524, 0.007598411291837692, 0.011135075241327286, 0.014671741053462029, 0.01820840686559677, 0.021745070815086365, 0.025281734764575958, 0.0288184005767107, 0.032355066388845444, 0.03589173033833504, 0.03942839428782463, 0.04296506196260452, 0.046501725912094116, 0.05003838986158371, 0.0535750538110733, 0.0571117177605629, 0.06064838543534279, 0.06418505311012268, 0.06772170960903168, 0.07125838100910187, 0.07479504495859146, 0.07833170890808105]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 6.0, 16.0, 6.0, 16.0, 24.0, 33.0, 36.0, 43.0, 62.0, 129.0, 193.0, 304.0, 584.0, 1136.0, 2341.0, 6525.0, 22254.0, 95648.0, 389391.0, 395827.0, 99246.0, 23027.0, 6601.0, 2510.0, 1099.0, 559.0, 315.0, 185.0, 128.0, 88.0, 81.0, 39.0, 32.0, 28.0, 11.0, 12.0, 3.0, 7.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.090850830078125, -0.0880126953125, -0.085174560546875, -0.08233642578125, -0.079498291015625, -0.07666015625, -0.073822021484375, -0.07098388671875, -0.068145751953125, -0.0653076171875, -0.062469482421875, -0.05963134765625, -0.056793212890625, -0.053955078125, -0.051116943359375, -0.04827880859375, -0.045440673828125, -0.0426025390625, -0.039764404296875, -0.03692626953125, -0.034088134765625, -0.03125, -0.028411865234375, -0.02557373046875, -0.022735595703125, -0.0198974609375, -0.017059326171875, -0.01422119140625, -0.011383056640625, -0.008544921875, -0.005706787109375, -0.00286865234375, -3.0517578125e-05, 0.0028076171875, 0.005645751953125, 0.00848388671875, 0.011322021484375, 0.01416015625, 0.016998291015625, 0.01983642578125, 0.022674560546875, 0.0255126953125, 0.028350830078125, 0.03118896484375, 0.034027099609375, 0.036865234375, 0.039703369140625, 0.04254150390625, 0.045379638671875, 0.0482177734375, 0.051055908203125, 0.05389404296875, 0.056732177734375, 0.0595703125, 0.062408447265625, 0.06524658203125, 0.068084716796875, 0.0709228515625, 0.073760986328125, 0.07659912109375, 0.079437255859375, 0.082275390625, 0.085113525390625, 0.08795166015625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 8.0, 12.0, 22.0, 44.0, 49.0, 74.0, 76.0, 103.0, 105.0, 92.0, 94.0, 77.0, 80.0, 57.0, 43.0, 27.0, 16.0, 10.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03814697265625, -0.03719615936279297, -0.03624534606933594, -0.035294532775878906, -0.034343719482421875, -0.033392906188964844, -0.03244209289550781, -0.03149127960205078, -0.03054046630859375, -0.02958965301513672, -0.028638839721679688, -0.027688026428222656, -0.026737213134765625, -0.025786399841308594, -0.024835586547851562, -0.02388477325439453, -0.0229339599609375, -0.02198314666748047, -0.021032333374023438, -0.020081520080566406, -0.019130706787109375, -0.018179893493652344, -0.017229080200195312, -0.01627826690673828, -0.01532745361328125, -0.014376640319824219, -0.013425827026367188, -0.012475013732910156, -0.011524200439453125, -0.010573387145996094, -0.009622573852539062, -0.008671760559082031, -0.007720947265625, -0.006770133972167969, -0.0058193206787109375, -0.004868507385253906, -0.003917694091796875, -0.0029668807983398438, -0.0020160675048828125, -0.0010652542114257812, -0.00011444091796875, 0.0008363723754882812, 0.0017871856689453125, 0.0027379989624023438, 0.003688812255859375, 0.004639625549316406, 0.0055904388427734375, 0.006541252136230469, 0.0074920654296875, 0.008442878723144531, 0.009393692016601562, 0.010344505310058594, 0.011295318603515625, 0.012246131896972656, 0.013196945190429688, 0.014147758483886719, 0.01509857177734375, 0.01604938507080078, 0.017000198364257812, 0.017951011657714844, 0.018901824951171875, 0.019852638244628906, 0.020803451538085938, 0.02175426483154297, 0.022705078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 5.0, 11.0, 13.0, 25.0, 31.0, 40.0, 51.0, 79.0, 142.0, 211.0, 319.0, 532.0, 1037.0, 1850.0, 3483.0, 7054.0, 14484.0, 31045.0, 67192.0, 146840.0, 272196.0, 255794.0, 131429.0, 60203.0, 27741.0, 13166.0, 6348.0, 3235.0, 1689.0, 880.0, 526.0, 309.0, 177.0, 130.0, 77.0, 68.0, 41.0, 32.0, 21.0, 16.0, 8.0, 13.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.051910400390625, -0.05046558380126953, -0.04902076721191406, -0.047575950622558594, -0.046131134033203125, -0.044686317443847656, -0.04324150085449219, -0.04179668426513672, -0.04035186767578125, -0.03890705108642578, -0.03746223449707031, -0.036017417907714844, -0.034572601318359375, -0.033127784729003906, -0.03168296813964844, -0.03023815155029297, -0.0287933349609375, -0.02734851837158203, -0.025903701782226562, -0.024458885192871094, -0.023014068603515625, -0.021569252014160156, -0.020124435424804688, -0.01867961883544922, -0.01723480224609375, -0.01578998565673828, -0.014345169067382812, -0.012900352478027344, -0.011455535888671875, -0.010010719299316406, -0.008565902709960938, -0.007121086120605469, -0.00567626953125, -0.004231452941894531, -0.0027866363525390625, -0.0013418197631835938, 0.000102996826171875, 0.0015478134155273438, 0.0029926300048828125, 0.004437446594238281, 0.00588226318359375, 0.007327079772949219, 0.008771896362304688, 0.010216712951660156, 0.011661529541015625, 0.013106346130371094, 0.014551162719726562, 0.01599597930908203, 0.0174407958984375, 0.01888561248779297, 0.020330429077148438, 0.021775245666503906, 0.023220062255859375, 0.024664878845214844, 0.026109695434570312, 0.02755451202392578, 0.02899932861328125, 0.03044414520263672, 0.03188896179199219, 0.033333778381347656, 0.034778594970703125, 0.036223411560058594, 0.03766822814941406, 0.03911304473876953, 0.040557861328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 18.0, 9.0, 8.0, 17.0, 18.0, 15.0, 17.0, 31.0, 27.0, 27.0, 24.0, 44.0, 32.0, 28.0, 33.0, 39.0, 50.0, 48.0, 39.0, 53.0, 39.0, 38.0, 33.0, 31.0, 43.0, 28.0, 28.0, 25.0, 25.0, 17.0, 28.0, 13.0, 16.0, 11.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.046417236328125, -0.04493141174316406, -0.043445587158203125, -0.04195976257324219, -0.04047393798828125, -0.03898811340332031, -0.037502288818359375, -0.03601646423339844, -0.0345306396484375, -0.03304481506347656, -0.031558990478515625, -0.030073165893554688, -0.02858734130859375, -0.027101516723632812, -0.025615692138671875, -0.024129867553710938, -0.02264404296875, -0.021158218383789062, -0.019672393798828125, -0.018186569213867188, -0.01670074462890625, -0.015214920043945312, -0.013729095458984375, -0.012243270874023438, -0.0107574462890625, -0.009271621704101562, -0.007785797119140625, -0.0062999725341796875, -0.00481414794921875, -0.0033283233642578125, -0.001842498779296875, -0.0003566741943359375, 0.001129150390625, 0.0026149749755859375, 0.004100799560546875, 0.0055866241455078125, 0.00707244873046875, 0.008558273315429688, 0.010044097900390625, 0.011529922485351562, 0.0130157470703125, 0.014501571655273438, 0.015987396240234375, 0.017473220825195312, 0.01895904541015625, 0.020444869995117188, 0.021930694580078125, 0.023416519165039062, 0.02490234375, 0.026388168334960938, 0.027873992919921875, 0.029359817504882812, 0.03084564208984375, 0.03233146667480469, 0.033817291259765625, 0.03530311584472656, 0.0367889404296875, 0.03827476501464844, 0.039760589599609375, 0.04124641418457031, 0.04273223876953125, 0.04421806335449219, 0.045703887939453125, 0.04718971252441406, 0.048675537109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 12.0, 22.0, 22.0, 35.0, 86.0, 132.0, 236.0, 410.0, 886.0, 1891.0, 4315.0, 10627.0, 29102.0, 95917.0, 399278.0, 371366.0, 88777.0, 27678.0, 10141.0, 3913.0, 1821.0, 904.0, 451.0, 204.0, 121.0, 82.0, 40.0, 30.0, 18.0, 7.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050750732421875, -0.0491633415222168, -0.047575950622558594, -0.04598855972290039, -0.04440116882324219, -0.042813777923583984, -0.04122638702392578, -0.03963899612426758, -0.038051605224609375, -0.03646421432495117, -0.03487682342529297, -0.033289432525634766, -0.03170204162597656, -0.03011465072631836, -0.028527259826660156, -0.026939868927001953, -0.02535247802734375, -0.023765087127685547, -0.022177696228027344, -0.02059030532836914, -0.019002914428710938, -0.017415523529052734, -0.01582813262939453, -0.014240741729736328, -0.012653350830078125, -0.011065959930419922, -0.009478569030761719, -0.007891178131103516, -0.0063037872314453125, -0.004716396331787109, -0.0031290054321289062, -0.0015416145324707031, 4.57763671875e-05, 0.0016331672668457031, 0.0032205581665039062, 0.004807949066162109, 0.0063953399658203125, 0.007982730865478516, 0.009570121765136719, 0.011157512664794922, 0.012744903564453125, 0.014332294464111328, 0.01591968536376953, 0.017507076263427734, 0.019094467163085938, 0.02068185806274414, 0.022269248962402344, 0.023856639862060547, 0.02544403076171875, 0.027031421661376953, 0.028618812561035156, 0.03020620346069336, 0.03179359436035156, 0.033380985260009766, 0.03496837615966797, 0.03655576705932617, 0.038143157958984375, 0.03973054885864258, 0.04131793975830078, 0.042905330657958984, 0.04449272155761719, 0.04608011245727539, 0.047667503356933594, 0.0492548942565918, 0.05084228515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 11.0, 6.0, 12.0, 17.0, 21.0, 32.0, 40.0, 55.0, 62.0, 78.0, 88.0, 88.0, 110.0, 64.0, 67.0, 62.0, 41.0, 25.0, 21.0, 21.0, 15.0, 15.0, 4.0, 8.0, 10.0, 0.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9591064453125e-05, -4.8022717237472534e-05, -4.645437002182007e-05, -4.48860228061676e-05, -4.331767559051514e-05, -4.174932837486267e-05, -4.0180981159210205e-05, -3.861263394355774e-05, -3.7044286727905273e-05, -3.547593951225281e-05, -3.390759229660034e-05, -3.2339245080947876e-05, -3.077089786529541e-05, -2.9202550649642944e-05, -2.763420343399048e-05, -2.6065856218338013e-05, -2.4497509002685547e-05, -2.292916178703308e-05, -2.1360814571380615e-05, -1.979246735572815e-05, -1.8224120140075684e-05, -1.6655772924423218e-05, -1.5087425708770752e-05, -1.3519078493118286e-05, -1.195073127746582e-05, -1.0382384061813354e-05, -8.814036846160889e-06, -7.245689630508423e-06, -5.677342414855957e-06, -4.108995199203491e-06, -2.5406479835510254e-06, -9.723007678985596e-07, 5.960464477539062e-07, 2.164393663406372e-06, 3.732740879058838e-06, 5.301088094711304e-06, 6.8694353103637695e-06, 8.437782526016235e-06, 1.0006129741668701e-05, 1.1574476957321167e-05, 1.3142824172973633e-05, 1.4711171388626099e-05, 1.6279518604278564e-05, 1.784786581993103e-05, 1.9416213035583496e-05, 2.0984560251235962e-05, 2.2552907466888428e-05, 2.4121254682540894e-05, 2.568960189819336e-05, 2.7257949113845825e-05, 2.882629632949829e-05, 3.0394643545150757e-05, 3.196299076080322e-05, 3.353133797645569e-05, 3.5099685192108154e-05, 3.666803240776062e-05, 3.8236379623413086e-05, 3.980472683906555e-05, 4.137307405471802e-05, 4.2941421270370483e-05, 4.450976848602295e-05, 4.6078115701675415e-05, 4.764646291732788e-05, 4.921481013298035e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 11.0, 11.0, 16.0, 22.0, 36.0, 60.0, 89.0, 103.0, 203.0, 310.0, 488.0, 721.0, 1190.0, 2034.0, 3542.0, 6045.0, 10868.0, 19936.0, 38432.0, 78581.0, 177222.0, 310412.0, 210344.0, 92052.0, 44587.0, 22891.0, 11998.0, 6711.0, 3804.0, 2286.0, 1298.0, 791.0, 522.0, 320.0, 195.0, 135.0, 95.0, 57.0, 50.0, 23.0, 23.0, 11.0, 10.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0267181396484375, -0.02592301368713379, -0.025127887725830078, -0.024332761764526367, -0.023537635803222656, -0.022742509841918945, -0.021947383880615234, -0.021152257919311523, -0.020357131958007812, -0.0195620059967041, -0.01876688003540039, -0.01797175407409668, -0.01717662811279297, -0.016381502151489258, -0.015586376190185547, -0.014791250228881836, -0.013996124267578125, -0.013200998306274414, -0.012405872344970703, -0.011610746383666992, -0.010815620422363281, -0.01002049446105957, -0.00922536849975586, -0.008430242538452148, -0.0076351165771484375, -0.0068399906158447266, -0.006044864654541016, -0.005249738693237305, -0.004454612731933594, -0.003659486770629883, -0.002864360809326172, -0.002069234848022461, -0.00127410888671875, -0.00047898292541503906, 0.0003161430358886719, 0.0011112689971923828, 0.0019063949584960938, 0.0027015209197998047, 0.0034966468811035156, 0.0042917728424072266, 0.0050868988037109375, 0.0058820247650146484, 0.006677150726318359, 0.00747227668762207, 0.008267402648925781, 0.009062528610229492, 0.009857654571533203, 0.010652780532836914, 0.011447906494140625, 0.012243032455444336, 0.013038158416748047, 0.013833284378051758, 0.014628410339355469, 0.01542353630065918, 0.01621866226196289, 0.0170137882232666, 0.017808914184570312, 0.018604040145874023, 0.019399166107177734, 0.020194292068481445, 0.020989418029785156, 0.021784543991088867, 0.022579669952392578, 0.02337479591369629, 0.024169921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 7.0, 5.0, 4.0, 3.0, 14.0, 12.0, 16.0, 29.0, 33.0, 36.0, 40.0, 49.0, 82.0, 96.0, 93.0, 78.0, 72.0, 70.0, 53.0, 42.0, 40.0, 25.0, 20.0, 17.0, 20.0, 6.0, 6.0, 8.0, 4.0, 1.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.030586719512939453, -0.029252052307128906, -0.02791738510131836, -0.026582717895507812, -0.025248050689697266, -0.02391338348388672, -0.022578716278076172, -0.021244049072265625, -0.019909381866455078, -0.01857471466064453, -0.017240047454833984, -0.015905380249023438, -0.01457071304321289, -0.013236045837402344, -0.011901378631591797, -0.01056671142578125, -0.009232044219970703, -0.007897377014160156, -0.006562709808349609, -0.0052280426025390625, -0.0038933753967285156, -0.0025587081909179688, -0.0012240409851074219, 0.000110626220703125, 0.0014452934265136719, 0.0027799606323242188, 0.004114627838134766, 0.0054492950439453125, 0.006783962249755859, 0.008118629455566406, 0.009453296661376953, 0.0107879638671875, 0.012122631072998047, 0.013457298278808594, 0.01479196548461914, 0.016126632690429688, 0.017461299896240234, 0.01879596710205078, 0.020130634307861328, 0.021465301513671875, 0.022799968719482422, 0.02413463592529297, 0.025469303131103516, 0.026803970336914062, 0.02813863754272461, 0.029473304748535156, 0.030807971954345703, 0.03214263916015625, 0.0334773063659668, 0.034811973571777344, 0.03614664077758789, 0.03748130798339844, 0.038815975189208984, 0.04015064239501953, 0.04148530960083008, 0.042819976806640625, 0.04415464401245117, 0.04548931121826172, 0.046823978424072266, 0.04815864562988281, 0.04949331283569336, 0.050827980041503906, 0.05216264724731445, 0.053497314453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 15.0, 22.0, 47.0, 82.0, 156.0, 179.0, 170.0, 139.0, 97.0, 44.0, 10.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36915159225463867, -0.34852245450019836, -0.32789331674575806, -0.30726417899131775, -0.28663504123687744, -0.2660059332847595, -0.2453767955303192, -0.2247476577758789, -0.2041185200214386, -0.1834893822669983, -0.16286024451255798, -0.14223112165927887, -0.12160198390483856, -0.10097284615039825, -0.08034371584653854, -0.05971458554267883, -0.039085447788238525, -0.018456313759088516, 0.002172820270061493, 0.022801954299211502, 0.04343108832836151, 0.06406022608280182, 0.08468935638666153, 0.10531848669052124, 0.12594762444496155, 0.14657676219940186, 0.16720589995384216, 0.18783502280712128, 0.20846416056156158, 0.2290932983160019, 0.249722421169281, 0.2703515589237213, 0.29098063707351685, 0.31160977482795715, 0.33223891258239746, 0.35286805033683777, 0.3734971880912781, 0.394126296043396, 0.4147554337978363, 0.4353845715522766, 0.4560137093067169, 0.4766428470611572, 0.49727198481559753, 0.5179011225700378, 0.5385302305221558, 0.5591593980789185, 0.5797885060310364, 0.6004176139831543, 0.621046781539917, 0.6416758894920349, 0.6623050570487976, 0.6829341650009155, 0.7035633325576782, 0.7241924405097961, 0.7448216080665588, 0.7654507160186768, 0.7860798835754395, 0.8067089915275574, 0.8273381590843201, 0.847967267036438, 0.8685964345932007, 0.8892255425453186, 0.9098547101020813, 0.9304838180541992, 0.9511129260063171]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 3.0, 2.0, 9.0, 8.0, 9.0, 17.0, 17.0, 25.0, 27.0, 35.0, 39.0, 28.0, 39.0, 40.0, 45.0, 51.0, 49.0, 49.0, 54.0, 57.0, 48.0, 42.0, 33.0, 40.0, 29.0, 25.0, 25.0, 30.0, 18.0, 29.0, 10.0, 12.0, 10.0, 5.0, 8.0, 5.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19132137298583984, -0.1847739815711975, -0.17822657525539398, -0.17167916893959045, -0.16513177752494812, -0.1585843861103058, -0.15203697979450226, -0.14548957347869873, -0.1389421820640564, -0.13239479064941406, -0.12584738433361053, -0.1192999854683876, -0.11275258660316467, -0.10620518773794174, -0.09965778887271881, -0.09311039000749588, -0.08656299114227295, -0.08001559227705002, -0.07346819341182709, -0.06692079454660416, -0.060373395681381226, -0.053825996816158295, -0.047278597950935364, -0.04073119908571243, -0.0341838002204895, -0.02763640135526657, -0.02108900249004364, -0.01454160362482071, -0.007994204759597778, -0.0014468058943748474, 0.0051005929708480835, 0.011647991836071014, 0.018195390701293945, 0.024742789566516876, 0.03129018843173981, 0.03783758729696274, 0.04438498616218567, 0.0509323850274086, 0.05747978389263153, 0.06402718275785446, 0.07057458162307739, 0.07712198048830032, 0.08366937935352325, 0.09021677821874619, 0.09676417708396912, 0.10331157594919205, 0.10985897481441498, 0.11640637367963791, 0.12295377254486084, 0.12950116395950317, 0.1360485702753067, 0.14259597659111023, 0.14914336800575256, 0.1556907594203949, 0.16223816573619843, 0.16878557205200195, 0.1753329634666443, 0.18188035488128662, 0.18842776119709015, 0.19497516751289368, 0.201522558927536, 0.20806995034217834, 0.21461735665798187, 0.2211647629737854, 0.22771215438842773]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 2.0, 13.0, 11.0, 11.0, 29.0, 59.0, 114.0, 240.0, 784.0, 2738.0, 11991.0, 79498.0, 2251930.0, 1762420.0, 69466.0, 11324.0, 2498.0, 708.0, 254.0, 90.0, 36.0, 26.0, 10.0, 11.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07861328125, -0.07629871368408203, -0.07398414611816406, -0.0716695785522461, -0.06935501098632812, -0.06704044342041016, -0.06472587585449219, -0.06241130828857422, -0.06009674072265625, -0.05778217315673828, -0.05546760559082031, -0.053153038024902344, -0.050838470458984375, -0.048523902893066406, -0.04620933532714844, -0.04389476776123047, -0.0415802001953125, -0.03926563262939453, -0.03695106506347656, -0.034636497497558594, -0.032321929931640625, -0.030007362365722656, -0.027692794799804688, -0.02537822723388672, -0.02306365966796875, -0.02074909210205078, -0.018434524536132812, -0.016119956970214844, -0.013805389404296875, -0.011490821838378906, -0.009176254272460938, -0.006861686706542969, -0.004547119140625, -0.0022325515747070312, 8.20159912109375e-05, 0.0023965835571289062, 0.004711151123046875, 0.007025718688964844, 0.009340286254882812, 0.011654853820800781, 0.01396942138671875, 0.01628398895263672, 0.018598556518554688, 0.020913124084472656, 0.023227691650390625, 0.025542259216308594, 0.027856826782226562, 0.03017139434814453, 0.0324859619140625, 0.03480052947998047, 0.03711509704589844, 0.039429664611816406, 0.041744232177734375, 0.044058799743652344, 0.04637336730957031, 0.04868793487548828, 0.05100250244140625, 0.05331707000732422, 0.05563163757324219, 0.057946205139160156, 0.060260772705078125, 0.0625753402709961, 0.06488990783691406, 0.06720447540283203, 0.06951904296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 7.0, 7.0, 13.0, 25.0, 36.0, 50.0, 49.0, 69.0, 68.0, 92.0, 80.0, 90.0, 78.0, 65.0, 55.0, 50.0, 44.0, 34.0, 26.0, 34.0, 10.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.038330078125, -0.03739738464355469, -0.036464691162109375, -0.03553199768066406, -0.03459930419921875, -0.03366661071777344, -0.032733917236328125, -0.03180122375488281, -0.0308685302734375, -0.029935836791992188, -0.029003143310546875, -0.028070449829101562, -0.02713775634765625, -0.026205062866210938, -0.025272369384765625, -0.024339675903320312, -0.023406982421875, -0.022474288940429688, -0.021541595458984375, -0.020608901977539062, -0.01967620849609375, -0.018743515014648438, -0.017810821533203125, -0.016878128051757812, -0.0159454345703125, -0.015012741088867188, -0.014080047607421875, -0.013147354125976562, -0.01221466064453125, -0.011281967163085938, -0.010349273681640625, -0.009416580200195312, -0.00848388671875, -0.0075511932373046875, -0.006618499755859375, -0.0056858062744140625, -0.00475311279296875, -0.0038204193115234375, -0.002887725830078125, -0.0019550323486328125, -0.0010223388671875, -8.96453857421875e-05, 0.000843048095703125, 0.0017757415771484375, 0.00270843505859375, 0.0036411285400390625, 0.004573822021484375, 0.0055065155029296875, 0.006439208984375, 0.0073719024658203125, 0.008304595947265625, 0.009237289428710938, 0.01016998291015625, 0.011102676391601562, 0.012035369873046875, 0.012968063354492188, 0.0139007568359375, 0.014833450317382812, 0.015766143798828125, 0.016698837280273438, 0.01763153076171875, 0.018564224243164062, 0.019496917724609375, 0.020429611206054688, 0.0213623046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 14.0, 17.0, 29.0, 52.0, 59.0, 115.0, 224.0, 308.0, 574.0, 1163.0, 2509.0, 6029.0, 16891.0, 57561.0, 285178.0, 2721516.0, 927684.0, 125942.0, 31009.0, 10054.0, 3811.0, 1632.0, 815.0, 410.0, 232.0, 154.0, 91.0, 51.0, 44.0, 37.0, 23.0, 9.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.053924560546875, -0.05241680145263672, -0.05090904235839844, -0.049401283264160156, -0.047893524169921875, -0.046385765075683594, -0.04487800598144531, -0.04337024688720703, -0.04186248779296875, -0.04035472869873047, -0.03884696960449219, -0.037339210510253906, -0.035831451416015625, -0.034323692321777344, -0.03281593322753906, -0.03130817413330078, -0.0298004150390625, -0.02829265594482422, -0.026784896850585938, -0.025277137756347656, -0.023769378662109375, -0.022261619567871094, -0.020753860473632812, -0.01924610137939453, -0.01773834228515625, -0.01623058319091797, -0.014722824096679688, -0.013215065002441406, -0.011707305908203125, -0.010199546813964844, -0.008691787719726562, -0.007184028625488281, -0.00567626953125, -0.004168510437011719, -0.0026607513427734375, -0.0011529922485351562, 0.000354766845703125, 0.0018625259399414062, 0.0033702850341796875, 0.004878044128417969, 0.00638580322265625, 0.007893562316894531, 0.009401321411132812, 0.010909080505371094, 0.012416839599609375, 0.013924598693847656, 0.015432357788085938, 0.01694011688232422, 0.0184478759765625, 0.01995563507080078, 0.021463394165039062, 0.022971153259277344, 0.024478912353515625, 0.025986671447753906, 0.027494430541992188, 0.02900218963623047, 0.03050994873046875, 0.03201770782470703, 0.03352546691894531, 0.035033226013183594, 0.036540985107421875, 0.038048744201660156, 0.03955650329589844, 0.04106426239013672, 0.042572021484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 18.0, 20.0, 23.0, 27.0, 41.0, 48.0, 58.0, 110.0, 132.0, 158.0, 274.0, 458.0, 648.0, 652.0, 434.0, 285.0, 170.0, 115.0, 97.0, 55.0, 49.0, 44.0, 26.0, 16.0, 13.0, 18.0, 12.0, 7.0, 8.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.031595706939697266, -0.03050708770751953, -0.029418468475341797, -0.028329849243164062, -0.027241230010986328, -0.026152610778808594, -0.02506399154663086, -0.023975372314453125, -0.02288675308227539, -0.021798133850097656, -0.020709514617919922, -0.019620895385742188, -0.018532276153564453, -0.01744365692138672, -0.016355037689208984, -0.01526641845703125, -0.014177799224853516, -0.013089179992675781, -0.012000560760498047, -0.010911941528320312, -0.009823322296142578, -0.008734703063964844, -0.007646083831787109, -0.006557464599609375, -0.005468845367431641, -0.004380226135253906, -0.003291606903076172, -0.0022029876708984375, -0.0011143684387207031, -2.574920654296875e-05, 0.0010628700256347656, 0.0021514892578125, 0.0032401084899902344, 0.004328727722167969, 0.005417346954345703, 0.0065059661865234375, 0.007594585418701172, 0.008683204650878906, 0.00977182388305664, 0.010860443115234375, 0.01194906234741211, 0.013037681579589844, 0.014126300811767578, 0.015214920043945312, 0.016303539276123047, 0.01739215850830078, 0.018480777740478516, 0.01956939697265625, 0.020658016204833984, 0.02174663543701172, 0.022835254669189453, 0.023923873901367188, 0.025012493133544922, 0.026101112365722656, 0.02718973159790039, 0.028278350830078125, 0.02936697006225586, 0.030455589294433594, 0.03154420852661133, 0.03263282775878906, 0.0337214469909668, 0.03481006622314453, 0.035898685455322266, 0.0369873046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 7.0, 10.0, 21.0, 39.0, 73.0, 141.0, 185.0, 209.0, 154.0, 82.0, 41.0, 18.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.7030559778213501, -0.6887065768241882, -0.6743571758270264, -0.6600077748298645, -0.6456583738327026, -0.631308913230896, -0.6169595718383789, -0.6026101112365723, -0.5882607102394104, -0.5739113092422485, -0.5595619082450867, -0.5452125072479248, -0.5308631062507629, -0.5165137052536011, -0.5021642446517944, -0.48781487345695496, -0.4734654724597931, -0.4591160714626312, -0.44476667046546936, -0.4304172396659851, -0.41606783866882324, -0.4017184376716614, -0.3873690366744995, -0.37301963567733765, -0.3586702346801758, -0.3443208336830139, -0.32997143268585205, -0.3156220316886902, -0.30127260088920593, -0.28692319989204407, -0.2725737988948822, -0.25822439789772034, -0.24387499690055847, -0.2295255959033966, -0.21517618000507355, -0.20082677900791168, -0.18647736310958862, -0.17212796211242676, -0.1577785611152649, -0.14342916011810303, -0.12907974421977997, -0.1147303357720375, -0.10038092732429504, -0.08603152632713318, -0.07168211787939072, -0.057332709431648254, -0.04298330843448639, -0.028633899986743927, -0.014284491539001465, 6.491504609584808e-05, 0.014414321631193161, 0.028763726353645325, 0.04311313480138779, 0.05746254324913025, 0.07181194424629211, 0.08616135269403458, 0.10051076114177704, 0.1148601695895195, 0.12920957803726196, 0.14355897903442383, 0.1579083800315857, 0.17225779592990875, 0.18660719692707062, 0.20095661282539368, 0.21530601382255554]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 10.0, 11.0, 8.0, 16.0, 17.0, 23.0, 34.0, 38.0, 29.0, 35.0, 52.0, 50.0, 56.0, 50.0, 51.0, 57.0, 55.0, 40.0, 49.0, 41.0, 44.0, 41.0, 31.0, 40.0, 19.0, 26.0, 15.0, 8.0, 9.0, 12.0, 8.0, 5.0, 12.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.19820666313171387, -0.1929558664560318, -0.18770508468151093, -0.18245428800582886, -0.17720350623130798, -0.17195270955562592, -0.16670191287994385, -0.16145113110542297, -0.1562003344297409, -0.15094953775405884, -0.14569875597953796, -0.1404479593038559, -0.13519716262817383, -0.12994638085365295, -0.12469558417797089, -0.11944479495286942, -0.11419400572776794, -0.10894321650266647, -0.103692427277565, -0.09844163060188293, -0.09319084137678146, -0.08794005215167999, -0.08268925547599792, -0.07743846625089645, -0.07218767702579498, -0.06693688780069351, -0.06168609485030174, -0.05643530189990997, -0.0511845126748085, -0.04593372344970703, -0.04068293049931526, -0.03543213754892349, -0.03018134832382202, -0.0249305572360754, -0.01967976614832878, -0.014428975060582161, -0.00917818397283554, -0.003927392885088921, 0.0013233982026576996, 0.006574191153049469, 0.01182498037815094, 0.01707577146589756, 0.02232656255364418, 0.0275773536413908, 0.03282814472913742, 0.03807893395423889, 0.04332972690463066, 0.04858051985502243, 0.0538313090801239, 0.05908209830522537, 0.06433288753032684, 0.06958368420600891, 0.07483447343111038, 0.08008526265621185, 0.08533605933189392, 0.09058684855699539, 0.09583763778209686, 0.10108842700719833, 0.1063392162322998, 0.11159001290798187, 0.11684080213308334, 0.12209159135818481, 0.12734238803386688, 0.13259318470954895, 0.13784396648406982]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 11.0, 5.0, 17.0, 18.0, 35.0, 41.0, 64.0, 75.0, 104.0, 219.0, 323.0, 613.0, 1164.0, 2611.0, 5708.0, 13537.0, 34915.0, 94287.0, 230520.0, 328553.0, 203754.0, 80787.0, 29740.0, 11718.0, 4899.0, 2232.0, 1133.0, 619.0, 309.0, 198.0, 108.0, 89.0, 36.0, 29.0, 24.0, 13.0, 5.0, 13.0, 11.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06817626953125, -0.06585884094238281, -0.06354141235351562, -0.06122398376464844, -0.05890655517578125, -0.05658912658691406, -0.054271697998046875, -0.05195426940917969, -0.0496368408203125, -0.04731941223144531, -0.045001983642578125, -0.04268455505371094, -0.04036712646484375, -0.03804969787597656, -0.035732269287109375, -0.03341484069824219, -0.031097412109375, -0.028779983520507812, -0.026462554931640625, -0.024145126342773438, -0.02182769775390625, -0.019510269165039062, -0.017192840576171875, -0.014875411987304688, -0.0125579833984375, -0.010240554809570312, -0.007923126220703125, -0.0056056976318359375, -0.00328826904296875, -0.0009708404541015625, 0.001346588134765625, 0.0036640167236328125, 0.0059814453125, 0.008298873901367188, 0.010616302490234375, 0.012933731079101562, 0.01525115966796875, 0.017568588256835938, 0.019886016845703125, 0.022203445434570312, 0.0245208740234375, 0.026838302612304688, 0.029155731201171875, 0.03147315979003906, 0.03379058837890625, 0.03610801696777344, 0.038425445556640625, 0.04074287414550781, 0.043060302734375, 0.04537773132324219, 0.047695159912109375, 0.05001258850097656, 0.05233001708984375, 0.05464744567871094, 0.056964874267578125, 0.05928230285644531, 0.0615997314453125, 0.06391716003417969, 0.06623458862304688, 0.06855201721191406, 0.07086944580078125, 0.07318687438964844, 0.07550430297851562, 0.07782173156738281, 0.08013916015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 10.0, 16.0, 26.0, 22.0, 51.0, 42.0, 72.0, 73.0, 64.0, 83.0, 70.0, 77.0, 81.0, 60.0, 50.0, 36.0, 44.0, 34.0, 23.0, 16.0, 14.0, 13.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0379638671875, -0.03702497482299805, -0.036086082458496094, -0.03514719009399414, -0.03420829772949219, -0.033269405364990234, -0.03233051300048828, -0.03139162063598633, -0.030452728271484375, -0.029513835906982422, -0.02857494354248047, -0.027636051177978516, -0.026697158813476562, -0.02575826644897461, -0.024819374084472656, -0.023880481719970703, -0.02294158935546875, -0.022002696990966797, -0.021063804626464844, -0.02012491226196289, -0.019186019897460938, -0.018247127532958984, -0.01730823516845703, -0.016369342803955078, -0.015430450439453125, -0.014491558074951172, -0.013552665710449219, -0.012613773345947266, -0.011674880981445312, -0.01073598861694336, -0.009797096252441406, -0.008858203887939453, -0.0079193115234375, -0.006980419158935547, -0.006041526794433594, -0.005102634429931641, -0.0041637420654296875, -0.0032248497009277344, -0.0022859573364257812, -0.0013470649719238281, -0.000408172607421875, 0.0005307197570800781, 0.0014696121215820312, 0.0024085044860839844, 0.0033473968505859375, 0.004286289215087891, 0.005225181579589844, 0.006164073944091797, 0.00710296630859375, 0.008041858673095703, 0.008980751037597656, 0.00991964340209961, 0.010858535766601562, 0.011797428131103516, 0.012736320495605469, 0.013675212860107422, 0.014614105224609375, 0.015552997589111328, 0.01649188995361328, 0.017430782318115234, 0.018369674682617188, 0.01930856704711914, 0.020247459411621094, 0.021186351776123047, 0.022125244140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 12.0, 20.0, 36.0, 27.0, 58.0, 76.0, 110.0, 158.0, 282.0, 497.0, 936.0, 1927.0, 4514.0, 11458.0, 31577.0, 93570.0, 250231.0, 360738.0, 188524.0, 65874.0, 22702.0, 8382.0, 3474.0, 1437.0, 783.0, 412.0, 251.0, 154.0, 100.0, 56.0, 43.0, 30.0, 24.0, 11.0, 16.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.082763671875, -0.08028125762939453, -0.07779884338378906, -0.0753164291381836, -0.07283401489257812, -0.07035160064697266, -0.06786918640136719, -0.06538677215576172, -0.06290435791015625, -0.06042194366455078, -0.05793952941894531, -0.055457115173339844, -0.052974700927734375, -0.050492286682128906, -0.04800987243652344, -0.04552745819091797, -0.0430450439453125, -0.04056262969970703, -0.03808021545410156, -0.035597801208496094, -0.033115386962890625, -0.030632972717285156, -0.028150558471679688, -0.02566814422607422, -0.02318572998046875, -0.02070331573486328, -0.018220901489257812, -0.015738487243652344, -0.013256072998046875, -0.010773658752441406, -0.008291244506835938, -0.005808830261230469, -0.003326416015625, -0.0008440017700195312, 0.0016384124755859375, 0.004120826721191406, 0.006603240966796875, 0.009085655212402344, 0.011568069458007812, 0.014050483703613281, 0.01653289794921875, 0.01901531219482422, 0.021497726440429688, 0.023980140686035156, 0.026462554931640625, 0.028944969177246094, 0.03142738342285156, 0.03390979766845703, 0.0363922119140625, 0.03887462615966797, 0.04135704040527344, 0.043839454650878906, 0.046321868896484375, 0.048804283142089844, 0.05128669738769531, 0.05376911163330078, 0.05625152587890625, 0.05873394012451172, 0.06121635437011719, 0.06369876861572266, 0.06618118286132812, 0.0686635971069336, 0.07114601135253906, 0.07362842559814453, 0.07611083984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 8.0, 8.0, 21.0, 7.0, 18.0, 27.0, 19.0, 30.0, 30.0, 31.0, 44.0, 36.0, 44.0, 47.0, 44.0, 54.0, 45.0, 47.0, 67.0, 51.0, 28.0, 45.0, 42.0, 27.0, 28.0, 19.0, 29.0, 15.0, 11.0, 20.0, 11.0, 8.0, 8.0, 6.0, 3.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.070556640625, -0.06837654113769531, -0.06619644165039062, -0.06401634216308594, -0.06183624267578125, -0.05965614318847656, -0.057476043701171875, -0.05529594421386719, -0.0531158447265625, -0.05093574523925781, -0.048755645751953125, -0.04657554626464844, -0.04439544677734375, -0.04221534729003906, -0.040035247802734375, -0.03785514831542969, -0.035675048828125, -0.03349494934082031, -0.031314849853515625, -0.029134750366210938, -0.02695465087890625, -0.024774551391601562, -0.022594451904296875, -0.020414352416992188, -0.0182342529296875, -0.016054153442382812, -0.013874053955078125, -0.011693954467773438, -0.00951385498046875, -0.0073337554931640625, -0.005153656005859375, -0.0029735565185546875, -0.00079345703125, 0.0013866424560546875, 0.003566741943359375, 0.0057468414306640625, 0.00792694091796875, 0.010107040405273438, 0.012287139892578125, 0.014467239379882812, 0.0166473388671875, 0.018827438354492188, 0.021007537841796875, 0.023187637329101562, 0.02536773681640625, 0.027547836303710938, 0.029727935791015625, 0.03190803527832031, 0.034088134765625, 0.03626823425292969, 0.038448333740234375, 0.04062843322753906, 0.04280853271484375, 0.04498863220214844, 0.047168731689453125, 0.04934883117675781, 0.0515289306640625, 0.05370903015136719, 0.055889129638671875, 0.05806922912597656, 0.06024932861328125, 0.06242942810058594, 0.06460952758789062, 0.06678962707519531, 0.0689697265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 17.0, 17.0, 22.0, 57.0, 44.0, 94.0, 154.0, 254.0, 441.0, 818.0, 1505.0, 2819.0, 5339.0, 10447.0, 21331.0, 46019.0, 105107.0, 255252.0, 327173.0, 150277.0, 63179.0, 28993.0, 14115.0, 6990.0, 3682.0, 1944.0, 1012.0, 531.0, 340.0, 179.0, 130.0, 58.0, 56.0, 40.0, 24.0, 20.0, 15.0, 14.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.039398193359375, -0.038135528564453125, -0.03687286376953125, -0.035610198974609375, -0.0343475341796875, -0.033084869384765625, -0.03182220458984375, -0.030559539794921875, -0.029296875, -0.028034210205078125, -0.02677154541015625, -0.025508880615234375, -0.0242462158203125, -0.022983551025390625, -0.02172088623046875, -0.020458221435546875, -0.019195556640625, -0.017932891845703125, -0.01667022705078125, -0.015407562255859375, -0.0141448974609375, -0.012882232666015625, -0.01161956787109375, -0.010356903076171875, -0.00909423828125, -0.007831573486328125, -0.00656890869140625, -0.005306243896484375, -0.0040435791015625, -0.002780914306640625, -0.00151824951171875, -0.000255584716796875, 0.001007080078125, 0.002269744873046875, 0.00353240966796875, 0.004795074462890625, 0.0060577392578125, 0.007320404052734375, 0.00858306884765625, 0.009845733642578125, 0.0111083984375, 0.012371063232421875, 0.01363372802734375, 0.014896392822265625, 0.0161590576171875, 0.017421722412109375, 0.01868438720703125, 0.019947052001953125, 0.021209716796875, 0.022472381591796875, 0.02373504638671875, 0.024997711181640625, 0.0262603759765625, 0.027523040771484375, 0.02878570556640625, 0.030048370361328125, 0.03131103515625, 0.032573699951171875, 0.03383636474609375, 0.035099029541015625, 0.0363616943359375, 0.037624359130859375, 0.03888702392578125, 0.040149688720703125, 0.041412353515625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 7.0, 11.0, 7.0, 9.0, 12.0, 10.0, 17.0, 23.0, 25.0, 35.0, 33.0, 37.0, 51.0, 58.0, 44.0, 64.0, 51.0, 47.0, 51.0, 61.0, 59.0, 42.0, 30.0, 34.0, 26.0, 28.0, 19.0, 16.0, 13.0, 25.0, 13.0, 7.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-2.568960189819336e-05, -2.493336796760559e-05, -2.4177134037017822e-05, -2.3420900106430054e-05, -2.2664666175842285e-05, -2.1908432245254517e-05, -2.1152198314666748e-05, -2.039596438407898e-05, -1.963973045349121e-05, -1.8883496522903442e-05, -1.8127262592315674e-05, -1.7371028661727905e-05, -1.6614794731140137e-05, -1.5858560800552368e-05, -1.51023268699646e-05, -1.4346092939376831e-05, -1.3589859008789062e-05, -1.2833625078201294e-05, -1.2077391147613525e-05, -1.1321157217025757e-05, -1.0564923286437988e-05, -9.80868935585022e-06, -9.052455425262451e-06, -8.296221494674683e-06, -7.539987564086914e-06, -6.7837536334991455e-06, -6.027519702911377e-06, -5.271285772323608e-06, -4.51505184173584e-06, -3.7588179111480713e-06, -3.0025839805603027e-06, -2.246350049972534e-06, -1.4901161193847656e-06, -7.338821887969971e-07, 2.2351741790771484e-08, 7.7858567237854e-07, 1.5348196029663086e-06, 2.291053533554077e-06, 3.0472874641418457e-06, 3.8035213947296143e-06, 4.559755325317383e-06, 5.315989255905151e-06, 6.07222318649292e-06, 6.8284571170806885e-06, 7.584691047668457e-06, 8.340924978256226e-06, 9.097158908843994e-06, 9.853392839431763e-06, 1.0609626770019531e-05, 1.13658607006073e-05, 1.2122094631195068e-05, 1.2878328561782837e-05, 1.3634562492370605e-05, 1.4390796422958374e-05, 1.5147030353546143e-05, 1.590326428413391e-05, 1.665949821472168e-05, 1.7415732145309448e-05, 1.8171966075897217e-05, 1.8928200006484985e-05, 1.9684433937072754e-05, 2.0440667867660522e-05, 2.119690179824829e-05, 2.195313572883606e-05, 2.2709369659423828e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 10.0, 8.0, 15.0, 14.0, 25.0, 43.0, 55.0, 111.0, 141.0, 272.0, 535.0, 1072.0, 2372.0, 5446.0, 12625.0, 31365.0, 83313.0, 239801.0, 392683.0, 175608.0, 61268.0, 23683.0, 10038.0, 4191.0, 1923.0, 870.0, 438.0, 246.0, 133.0, 78.0, 59.0, 50.0, 19.0, 22.0, 13.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044281005859375, -0.042868614196777344, -0.04145622253417969, -0.04004383087158203, -0.038631439208984375, -0.03721904754638672, -0.03580665588378906, -0.034394264221191406, -0.03298187255859375, -0.031569480895996094, -0.030157089233398438, -0.02874469757080078, -0.027332305908203125, -0.02591991424560547, -0.024507522583007812, -0.023095130920410156, -0.0216827392578125, -0.020270347595214844, -0.018857955932617188, -0.01744556427001953, -0.016033172607421875, -0.014620780944824219, -0.013208389282226562, -0.011795997619628906, -0.01038360595703125, -0.008971214294433594, -0.0075588226318359375, -0.006146430969238281, -0.004734039306640625, -0.0033216476440429688, -0.0019092559814453125, -0.0004968643188476562, 0.00091552734375, 0.0023279190063476562, 0.0037403106689453125, 0.005152702331542969, 0.006565093994140625, 0.007977485656738281, 0.009389877319335938, 0.010802268981933594, 0.01221466064453125, 0.013627052307128906, 0.015039443969726562, 0.01645183563232422, 0.017864227294921875, 0.01927661895751953, 0.020689010620117188, 0.022101402282714844, 0.0235137939453125, 0.024926185607910156, 0.026338577270507812, 0.02775096893310547, 0.029163360595703125, 0.03057575225830078, 0.03198814392089844, 0.033400535583496094, 0.03481292724609375, 0.036225318908691406, 0.03763771057128906, 0.03905010223388672, 0.040462493896484375, 0.04187488555908203, 0.04328727722167969, 0.044699668884277344, 0.046112060546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 2.0, 11.0, 2.0, 12.0, 8.0, 7.0, 15.0, 16.0, 18.0, 18.0, 33.0, 35.0, 39.0, 44.0, 75.0, 67.0, 71.0, 75.0, 89.0, 51.0, 68.0, 53.0, 37.0, 27.0, 14.0, 11.0, 14.0, 15.0, 14.0, 5.0, 8.0, 11.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04376220703125, -0.0423583984375, -0.04095458984375, -0.03955078125, -0.03814697265625, -0.0367431640625, -0.03533935546875, -0.033935546875, -0.03253173828125, -0.0311279296875, -0.02972412109375, -0.0283203125, -0.02691650390625, -0.0255126953125, -0.02410888671875, -0.022705078125, -0.02130126953125, -0.0198974609375, -0.01849365234375, -0.01708984375, -0.01568603515625, -0.0142822265625, -0.01287841796875, -0.011474609375, -0.01007080078125, -0.0086669921875, -0.00726318359375, -0.005859375, -0.00445556640625, -0.0030517578125, -0.00164794921875, -0.000244140625, 0.00115966796875, 0.0025634765625, 0.00396728515625, 0.00537109375, 0.00677490234375, 0.0081787109375, 0.00958251953125, 0.010986328125, 0.01239013671875, 0.0137939453125, 0.01519775390625, 0.0166015625, 0.01800537109375, 0.0194091796875, 0.02081298828125, 0.022216796875, 0.02362060546875, 0.0250244140625, 0.02642822265625, 0.02783203125, 0.02923583984375, 0.0306396484375, 0.03204345703125, 0.033447265625, 0.03485107421875, 0.0362548828125, 0.03765869140625, 0.0390625, 0.04046630859375, 0.0418701171875, 0.04327392578125, 0.044677734375, 0.04608154296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 9.0, 23.0, 44.0, 110.0, 176.0, 227.0, 203.0, 94.0, 44.0, 31.0, 11.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8330325484275818, -0.8026156425476074, -0.7721987366676331, -0.7417818307876587, -0.7113649249076843, -0.68094801902771, -0.6505311131477356, -0.6201142072677612, -0.5896973013877869, -0.5592803955078125, -0.5288634896278381, -0.49844658374786377, -0.4680296778678894, -0.43761277198791504, -0.4071958661079407, -0.3767789602279663, -0.34636205434799194, -0.3159451484680176, -0.2855282425880432, -0.25511133670806885, -0.22469443082809448, -0.19427752494812012, -0.16386061906814575, -0.1334437131881714, -0.10302680730819702, -0.07260990142822266, -0.04219299554824829, -0.011776089668273926, 0.01864081621170044, 0.049057722091674805, 0.07947462797164917, 0.10989153385162354, 0.14030838012695312, 0.1707252860069275, 0.20114219188690186, 0.23155909776687622, 0.2619760036468506, 0.29239290952682495, 0.3228098154067993, 0.3532267212867737, 0.38364362716674805, 0.4140605330467224, 0.4444774389266968, 0.47489434480667114, 0.5053112506866455, 0.5357281565666199, 0.5661450624465942, 0.5965619683265686, 0.626978874206543, 0.6573957800865173, 0.6878126859664917, 0.7182295918464661, 0.7486464977264404, 0.7790634036064148, 0.8094803094863892, 0.8398972153663635, 0.8703141212463379, 0.9007310271263123, 0.9311479330062866, 0.961564838886261, 0.9919817447662354, 1.0223987102508545, 1.052815556526184, 1.0832324028015137, 1.1136493682861328]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 8.0, 7.0, 10.0, 14.0, 17.0, 16.0, 28.0, 13.0, 25.0, 27.0, 33.0, 28.0, 39.0, 43.0, 31.0, 46.0, 35.0, 53.0, 52.0, 36.0, 51.0, 37.0, 42.0, 32.0, 35.0, 31.0, 32.0, 18.0, 21.0, 26.0, 22.0, 15.0, 13.0, 13.0, 8.0, 12.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2080647349357605, -0.20061497390270233, -0.19316521286964417, -0.1857154369354248, -0.17826567590236664, -0.17081591486930847, -0.1633661389350891, -0.15591637790203094, -0.14846661686897278, -0.1410168558359146, -0.13356709480285645, -0.12611731886863708, -0.11866755783557892, -0.11121779680252075, -0.10376802831888199, -0.09631825983524323, -0.08886849880218506, -0.08141873776912689, -0.07396896928548813, -0.06651920080184937, -0.0590694397687912, -0.051619675010442734, -0.04416991025209427, -0.036720145493745804, -0.02927038073539734, -0.021820615977048874, -0.014370851218700409, -0.006921086460351944, 0.000528678297996521, 0.007978443056344986, 0.015428207814693451, 0.022877972573041916, 0.03032773733139038, 0.037777502089738846, 0.04522726684808731, 0.052677031606435776, 0.06012679636478424, 0.06757655739784241, 0.07502632588148117, 0.08247609436511993, 0.0899258553981781, 0.09737561643123627, 0.10482538491487503, 0.1122751533985138, 0.11972491443157196, 0.12717467546463013, 0.1346244513988495, 0.14207421243190765, 0.14952397346496582, 0.156973734498024, 0.16442349553108215, 0.1718732714653015, 0.17932303249835968, 0.18677279353141785, 0.1942225694656372, 0.20167233049869537, 0.20912209153175354, 0.2165718525648117, 0.22402161359786987, 0.23147138953208923, 0.2389211505651474, 0.24637091159820557, 0.2538206875324249, 0.2612704336643219, 0.26872020959854126]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 5.0, 15.0, 25.0, 37.0, 38.0, 48.0, 75.0, 101.0, 186.0, 275.0, 449.0, 769.0, 1321.0, 2468.0, 4575.0, 9270.0, 20011.0, 47754.0, 138485.0, 568534.0, 2013092.0, 1037997.0, 224397.0, 70385.0, 28048.0, 12696.0, 6025.0, 3070.0, 1647.0, 960.0, 588.0, 365.0, 203.0, 125.0, 72.0, 41.0, 26.0, 33.0, 10.0, 10.0, 6.0, 9.0, 5.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.0399169921875, -0.03876638412475586, -0.03761577606201172, -0.03646516799926758, -0.03531455993652344, -0.0341639518737793, -0.033013343811035156, -0.031862735748291016, -0.030712127685546875, -0.029561519622802734, -0.028410911560058594, -0.027260303497314453, -0.026109695434570312, -0.024959087371826172, -0.02380847930908203, -0.02265787124633789, -0.02150726318359375, -0.02035665512084961, -0.01920604705810547, -0.018055438995361328, -0.016904830932617188, -0.015754222869873047, -0.014603614807128906, -0.013453006744384766, -0.012302398681640625, -0.011151790618896484, -0.010001182556152344, -0.008850574493408203, -0.0076999664306640625, -0.006549358367919922, -0.005398750305175781, -0.004248142242431641, -0.0030975341796875, -0.0019469261169433594, -0.0007963180541992188, 0.0003542900085449219, 0.0015048980712890625, 0.002655506134033203, 0.0038061141967773438, 0.004956722259521484, 0.006107330322265625, 0.007257938385009766, 0.008408546447753906, 0.009559154510498047, 0.010709762573242188, 0.011860370635986328, 0.013010978698730469, 0.01416158676147461, 0.01531219482421875, 0.01646280288696289, 0.01761341094970703, 0.018764019012451172, 0.019914627075195312, 0.021065235137939453, 0.022215843200683594, 0.023366451263427734, 0.024517059326171875, 0.025667667388916016, 0.026818275451660156, 0.027968883514404297, 0.029119491577148438, 0.030270099639892578, 0.03142070770263672, 0.03257131576538086, 0.033721923828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 5.0, 11.0, 7.0, 6.0, 14.0, 16.0, 27.0, 39.0, 39.0, 40.0, 44.0, 41.0, 67.0, 73.0, 63.0, 63.0, 73.0, 63.0, 50.0, 48.0, 37.0, 37.0, 33.0, 28.0, 20.0, 13.0, 12.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035064697265625, -0.03414416313171387, -0.033223628997802734, -0.0323030948638916, -0.03138256072998047, -0.030462026596069336, -0.029541492462158203, -0.02862095832824707, -0.027700424194335938, -0.026779890060424805, -0.025859355926513672, -0.02493882179260254, -0.024018287658691406, -0.023097753524780273, -0.02217721939086914, -0.021256685256958008, -0.020336151123046875, -0.019415616989135742, -0.01849508285522461, -0.017574548721313477, -0.016654014587402344, -0.01573348045349121, -0.014812946319580078, -0.013892412185668945, -0.012971878051757812, -0.01205134391784668, -0.011130809783935547, -0.010210275650024414, -0.009289741516113281, -0.008369207382202148, -0.007448673248291016, -0.006528139114379883, -0.00560760498046875, -0.004687070846557617, -0.0037665367126464844, -0.0028460025787353516, -0.0019254684448242188, -0.001004934310913086, -8.440017700195312e-05, 0.0008361339569091797, 0.0017566680908203125, 0.0026772022247314453, 0.003597736358642578, 0.004518270492553711, 0.005438804626464844, 0.0063593387603759766, 0.007279872894287109, 0.008200407028198242, 0.009120941162109375, 0.010041475296020508, 0.01096200942993164, 0.011882543563842773, 0.012803077697753906, 0.013723611831665039, 0.014644145965576172, 0.015564680099487305, 0.016485214233398438, 0.01740574836730957, 0.018326282501220703, 0.019246816635131836, 0.02016735076904297, 0.0210878849029541, 0.022008419036865234, 0.022928953170776367, 0.0238494873046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 11.0, 10.0, 24.0, 24.0, 39.0, 55.0, 74.0, 131.0, 224.0, 395.0, 742.0, 1508.0, 3392.0, 9380.0, 30259.0, 134636.0, 1076186.0, 2602458.0, 260674.0, 50832.0, 14076.0, 5005.0, 2004.0, 928.0, 491.0, 234.0, 149.0, 88.0, 73.0, 51.0, 25.0, 27.0, 15.0, 10.0, 11.0, 3.0, 9.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05841064453125, -0.05633831024169922, -0.05426597595214844, -0.052193641662597656, -0.050121307373046875, -0.048048973083496094, -0.04597663879394531, -0.04390430450439453, -0.04183197021484375, -0.03975963592529297, -0.03768730163574219, -0.035614967346191406, -0.033542633056640625, -0.031470298767089844, -0.029397964477539062, -0.02732563018798828, -0.0252532958984375, -0.02318096160888672, -0.021108627319335938, -0.019036293029785156, -0.016963958740234375, -0.014891624450683594, -0.012819290161132812, -0.010746955871582031, -0.00867462158203125, -0.006602287292480469, -0.0045299530029296875, -0.0024576187133789062, -0.000385284423828125, 0.0016870498657226562, 0.0037593841552734375, 0.005831718444824219, 0.007904052734375, 0.009976387023925781, 0.012048721313476562, 0.014121055603027344, 0.016193389892578125, 0.018265724182128906, 0.020338058471679688, 0.02241039276123047, 0.02448272705078125, 0.02655506134033203, 0.028627395629882812, 0.030699729919433594, 0.032772064208984375, 0.034844398498535156, 0.03691673278808594, 0.03898906707763672, 0.0410614013671875, 0.04313373565673828, 0.04520606994628906, 0.047278404235839844, 0.049350738525390625, 0.051423072814941406, 0.05349540710449219, 0.05556774139404297, 0.05764007568359375, 0.05971240997314453, 0.06178474426269531, 0.0638570785522461, 0.06592941284179688, 0.06800174713134766, 0.07007408142089844, 0.07214641571044922, 0.07421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 9.0, 11.0, 13.0, 20.0, 29.0, 37.0, 37.0, 46.0, 84.0, 98.0, 148.0, 217.0, 303.0, 562.0, 815.0, 601.0, 320.0, 221.0, 150.0, 110.0, 68.0, 38.0, 34.0, 28.0, 14.0, 10.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04632568359375, -0.044579505920410156, -0.04283332824707031, -0.04108715057373047, -0.039340972900390625, -0.03759479522705078, -0.03584861755371094, -0.034102439880371094, -0.03235626220703125, -0.030610084533691406, -0.028863906860351562, -0.02711772918701172, -0.025371551513671875, -0.02362537384033203, -0.021879196166992188, -0.020133018493652344, -0.0183868408203125, -0.016640663146972656, -0.014894485473632812, -0.013148307800292969, -0.011402130126953125, -0.009655952453613281, -0.007909774780273438, -0.006163597106933594, -0.00441741943359375, -0.0026712417602539062, -0.0009250640869140625, 0.0008211135864257812, 0.002567291259765625, 0.004313468933105469, 0.0060596466064453125, 0.007805824279785156, 0.009552001953125, 0.011298179626464844, 0.013044357299804688, 0.014790534973144531, 0.016536712646484375, 0.01828289031982422, 0.020029067993164062, 0.021775245666503906, 0.02352142333984375, 0.025267601013183594, 0.027013778686523438, 0.02875995635986328, 0.030506134033203125, 0.03225231170654297, 0.03399848937988281, 0.035744667053222656, 0.0374908447265625, 0.039237022399902344, 0.04098320007324219, 0.04272937774658203, 0.044475555419921875, 0.04622173309326172, 0.04796791076660156, 0.049714088439941406, 0.05146026611328125, 0.053206443786621094, 0.05495262145996094, 0.05669879913330078, 0.058444976806640625, 0.06019115447998047, 0.06193733215332031, 0.06368350982666016, 0.0654296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 8.0, 18.0, 37.0, 65.0, 84.0, 125.0, 176.0, 161.0, 113.0, 93.0, 45.0, 18.0, 15.0, 9.0, 4.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.546423077583313, -0.5311840772628784, -0.5159451365470886, -0.500706136226654, -0.4854671359062195, -0.4702281653881073, -0.4549891948699951, -0.43975019454956055, -0.42451122403144836, -0.4092722535133362, -0.3940332531929016, -0.37879428267478943, -0.36355531215667725, -0.3483163118362427, -0.3330773413181305, -0.3178383708000183, -0.30259937047958374, -0.28736039996147156, -0.272121399641037, -0.2568824291229248, -0.24164344370365143, -0.22640445828437805, -0.21116548776626587, -0.1959265023469925, -0.18068751692771912, -0.16544853150844574, -0.15020954608917236, -0.13497057557106018, -0.1197315901517868, -0.10449260473251343, -0.08925362676382065, -0.07401464879512787, -0.05877566337585449, -0.043536681681871414, -0.028297699987888336, -0.013058718293905258, 0.00218026340007782, 0.017419248819351196, 0.032658226788043976, 0.047897204756736755, 0.06313619017601013, 0.07837517559528351, 0.09361415356397629, 0.10885313153266907, 0.12409211695194244, 0.13933110237121582, 0.154570072889328, 0.16980905830860138, 0.18504804372787476, 0.20028702914714813, 0.2155260145664215, 0.2307649850845337, 0.24600397050380707, 0.26124295592308044, 0.2764819264411926, 0.2917209267616272, 0.3069598972797394, 0.32219886779785156, 0.33743786811828613, 0.3526768386363983, 0.3679158091545105, 0.38315480947494507, 0.39839377999305725, 0.41363275051116943, 0.428871750831604]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 10.0, 6.0, 11.0, 10.0, 18.0, 27.0, 19.0, 29.0, 29.0, 16.0, 27.0, 41.0, 42.0, 35.0, 37.0, 45.0, 45.0, 55.0, 43.0, 45.0, 36.0, 43.0, 43.0, 37.0, 27.0, 30.0, 20.0, 24.0, 23.0, 16.0, 15.0, 20.0, 16.0, 14.0, 6.0, 6.0, 4.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1954876184463501, -0.18972140550613403, -0.18395519256591797, -0.1781889647245407, -0.17242275178432465, -0.16665653884410858, -0.16089031100273132, -0.15512409806251526, -0.1493578851222992, -0.14359167218208313, -0.13782545924186707, -0.1320592314004898, -0.12629301846027374, -0.12052680552005768, -0.11476058512926102, -0.10899436473846436, -0.10322815179824829, -0.09746193885803223, -0.09169571846723557, -0.0859294980764389, -0.08016328513622284, -0.07439707219600677, -0.06863085180521011, -0.06286463141441345, -0.05709841847419739, -0.051332201808691025, -0.04556598514318466, -0.0397997684776783, -0.034033551812171936, -0.028267335146665573, -0.02250111848115921, -0.016734901815652847, -0.010968685150146484, -0.0052024684846401215, 0.0005637481808662415, 0.006329964846372604, 0.012096181511878967, 0.01786239817738533, 0.023628614842891693, 0.029394831508398056, 0.03516104817390442, 0.04092726483941078, 0.046693481504917145, 0.05245969817042351, 0.05822591483592987, 0.06399212777614594, 0.0697583481669426, 0.07552456855773926, 0.08129078149795532, 0.08705699443817139, 0.09282321482896805, 0.09858943521976471, 0.10435564815998077, 0.11012186110019684, 0.1158880814909935, 0.12165430188179016, 0.12742051482200623, 0.1331867277622223, 0.13895294070243835, 0.1447191685438156, 0.15048538148403168, 0.15625159442424774, 0.162017822265625, 0.16778403520584106, 0.17355024814605713]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 11.0, 28.0, 46.0, 66.0, 105.0, 170.0, 311.0, 520.0, 966.0, 1696.0, 3314.0, 6527.0, 14035.0, 31552.0, 75055.0, 173287.0, 290667.0, 242772.0, 117298.0, 49127.0, 21255.0, 9601.0, 4677.0, 2405.0, 1253.0, 735.0, 405.0, 235.0, 146.0, 98.0, 61.0, 32.0, 28.0, 13.0, 10.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.063232421875, -0.06130218505859375, -0.0593719482421875, -0.05744171142578125, -0.055511474609375, -0.05358123779296875, -0.0516510009765625, -0.04972076416015625, -0.04779052734375, -0.04586029052734375, -0.0439300537109375, -0.04199981689453125, -0.040069580078125, -0.03813934326171875, -0.0362091064453125, -0.03427886962890625, -0.0323486328125, -0.03041839599609375, -0.0284881591796875, -0.02655792236328125, -0.024627685546875, -0.02269744873046875, -0.0207672119140625, -0.01883697509765625, -0.01690673828125, -0.01497650146484375, -0.0130462646484375, -0.01111602783203125, -0.009185791015625, -0.00725555419921875, -0.0053253173828125, -0.00339508056640625, -0.00146484375, 0.00046539306640625, 0.0023956298828125, 0.00432586669921875, 0.006256103515625, 0.00818634033203125, 0.0101165771484375, 0.01204681396484375, 0.01397705078125, 0.01590728759765625, 0.0178375244140625, 0.01976776123046875, 0.021697998046875, 0.02362823486328125, 0.0255584716796875, 0.02748870849609375, 0.0294189453125, 0.03134918212890625, 0.0332794189453125, 0.03520965576171875, 0.037139892578125, 0.03907012939453125, 0.0410003662109375, 0.04293060302734375, 0.04486083984375, 0.04679107666015625, 0.0487213134765625, 0.05065155029296875, 0.052581787109375, 0.05451202392578125, 0.0564422607421875, 0.05837249755859375, 0.060302734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 11.0, 12.0, 20.0, 20.0, 18.0, 36.0, 42.0, 29.0, 49.0, 45.0, 45.0, 54.0, 53.0, 45.0, 65.0, 58.0, 49.0, 54.0, 58.0, 43.0, 35.0, 38.0, 25.0, 23.0, 22.0, 8.0, 8.0, 8.0, 6.0, 3.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.037200927734375, -0.0362701416015625, -0.03533935546875, -0.0344085693359375, -0.033477783203125, -0.0325469970703125, -0.0316162109375, -0.0306854248046875, -0.029754638671875, -0.0288238525390625, -0.02789306640625, -0.0269622802734375, -0.026031494140625, -0.0251007080078125, -0.024169921875, -0.0232391357421875, -0.022308349609375, -0.0213775634765625, -0.02044677734375, -0.0195159912109375, -0.018585205078125, -0.0176544189453125, -0.0167236328125, -0.0157928466796875, -0.014862060546875, -0.0139312744140625, -0.01300048828125, -0.0120697021484375, -0.011138916015625, -0.0102081298828125, -0.00927734375, -0.0083465576171875, -0.007415771484375, -0.0064849853515625, -0.00555419921875, -0.0046234130859375, -0.003692626953125, -0.0027618408203125, -0.0018310546875, -0.0009002685546875, 3.0517578125e-05, 0.0009613037109375, 0.00189208984375, 0.0028228759765625, 0.003753662109375, 0.0046844482421875, 0.005615234375, 0.0065460205078125, 0.007476806640625, 0.0084075927734375, 0.00933837890625, 0.0102691650390625, 0.011199951171875, 0.0121307373046875, 0.0130615234375, 0.0139923095703125, 0.014923095703125, 0.0158538818359375, 0.01678466796875, 0.0177154541015625, 0.018646240234375, 0.0195770263671875, 0.0205078125, 0.0214385986328125, 0.022369384765625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 11.0, 11.0, 10.0, 16.0, 21.0, 35.0, 56.0, 73.0, 124.0, 202.0, 309.0, 525.0, 939.0, 1705.0, 3084.0, 6255.0, 12780.0, 27557.0, 63295.0, 150119.0, 299639.0, 264901.0, 120827.0, 51142.0, 22751.0, 10623.0, 5284.0, 2629.0, 1506.0, 798.0, 526.0, 295.0, 164.0, 105.0, 76.0, 55.0, 27.0, 23.0, 20.0, 15.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05780029296875, -0.055986881256103516, -0.05417346954345703, -0.05236005783081055, -0.05054664611816406, -0.04873323440551758, -0.046919822692871094, -0.04510641098022461, -0.043292999267578125, -0.04147958755493164, -0.039666175842285156, -0.03785276412963867, -0.03603935241699219, -0.0342259407043457, -0.03241252899169922, -0.030599117279052734, -0.02878570556640625, -0.026972293853759766, -0.02515888214111328, -0.023345470428466797, -0.021532058715820312, -0.019718647003173828, -0.017905235290527344, -0.01609182357788086, -0.014278411865234375, -0.01246500015258789, -0.010651588439941406, -0.008838176727294922, -0.0070247650146484375, -0.005211353302001953, -0.0033979415893554688, -0.0015845298767089844, 0.0002288818359375, 0.0020422935485839844, 0.0038557052612304688, 0.005669116973876953, 0.0074825286865234375, 0.009295940399169922, 0.011109352111816406, 0.01292276382446289, 0.014736175537109375, 0.01654958724975586, 0.018362998962402344, 0.020176410675048828, 0.021989822387695312, 0.023803234100341797, 0.02561664581298828, 0.027430057525634766, 0.02924346923828125, 0.031056880950927734, 0.03287029266357422, 0.0346837043762207, 0.03649711608886719, 0.03831052780151367, 0.040123939514160156, 0.04193735122680664, 0.043750762939453125, 0.04556417465209961, 0.047377586364746094, 0.04919099807739258, 0.05100440979003906, 0.05281782150268555, 0.05463123321533203, 0.056444644927978516, 0.058258056640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 4.0, 7.0, 7.0, 14.0, 8.0, 14.0, 16.0, 21.0, 23.0, 29.0, 36.0, 32.0, 35.0, 39.0, 52.0, 46.0, 53.0, 48.0, 52.0, 41.0, 47.0, 42.0, 45.0, 33.0, 29.0, 33.0, 31.0, 23.0, 23.0, 23.0, 16.0, 10.0, 15.0, 7.0, 8.0, 7.0, 5.0, 2.0, 1.0, 7.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.07452392578125, -0.07228755950927734, -0.07005119323730469, -0.06781482696533203, -0.06557846069335938, -0.06334209442138672, -0.06110572814941406, -0.058869361877441406, -0.05663299560546875, -0.054396629333496094, -0.05216026306152344, -0.04992389678955078, -0.047687530517578125, -0.04545116424560547, -0.04321479797363281, -0.040978431701660156, -0.0387420654296875, -0.036505699157714844, -0.03426933288574219, -0.03203296661376953, -0.029796600341796875, -0.02756023406982422, -0.025323867797851562, -0.023087501525878906, -0.02085113525390625, -0.018614768981933594, -0.016378402709960938, -0.014142036437988281, -0.011905670166015625, -0.009669303894042969, -0.0074329376220703125, -0.005196571350097656, -0.002960205078125, -0.0007238388061523438, 0.0015125274658203125, 0.0037488937377929688, 0.005985260009765625, 0.008221626281738281, 0.010457992553710938, 0.012694358825683594, 0.01493072509765625, 0.017167091369628906, 0.019403457641601562, 0.02163982391357422, 0.023876190185546875, 0.02611255645751953, 0.028348922729492188, 0.030585289001464844, 0.0328216552734375, 0.035058021545410156, 0.03729438781738281, 0.03953075408935547, 0.041767120361328125, 0.04400348663330078, 0.04623985290527344, 0.048476219177246094, 0.05071258544921875, 0.052948951721191406, 0.05518531799316406, 0.05742168426513672, 0.059658050537109375, 0.06189441680908203, 0.06413078308105469, 0.06636714935302734, 0.068603515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 9.0, 12.0, 25.0, 16.0, 39.0, 42.0, 85.0, 132.0, 191.0, 279.0, 388.0, 770.0, 1255.0, 2053.0, 3396.0, 6124.0, 10979.0, 21096.0, 43646.0, 101193.0, 241083.0, 318665.0, 163923.0, 67359.0, 30822.0, 15367.0, 8300.0, 4536.0, 2730.0, 1564.0, 901.0, 561.0, 360.0, 227.0, 129.0, 86.0, 62.0, 35.0, 23.0, 20.0, 20.0, 19.0, 6.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.021343708038330078, -0.020638465881347656, -0.019933223724365234, -0.019227981567382812, -0.01852273941040039, -0.01781749725341797, -0.017112255096435547, -0.016407012939453125, -0.015701770782470703, -0.014996528625488281, -0.01429128646850586, -0.013586044311523438, -0.012880802154541016, -0.012175559997558594, -0.011470317840576172, -0.01076507568359375, -0.010059833526611328, -0.009354591369628906, -0.008649349212646484, -0.007944107055664062, -0.007238864898681641, -0.006533622741699219, -0.005828380584716797, -0.005123138427734375, -0.004417896270751953, -0.0037126541137695312, -0.0030074119567871094, -0.0023021697998046875, -0.0015969276428222656, -0.0008916854858398438, -0.00018644332885742188, 0.000518798828125, 0.0012240409851074219, 0.0019292831420898438, 0.0026345252990722656, 0.0033397674560546875, 0.004045009613037109, 0.004750251770019531, 0.005455493927001953, 0.006160736083984375, 0.006865978240966797, 0.007571220397949219, 0.00827646255493164, 0.008981704711914062, 0.009686946868896484, 0.010392189025878906, 0.011097431182861328, 0.01180267333984375, 0.012507915496826172, 0.013213157653808594, 0.013918399810791016, 0.014623641967773438, 0.01532888412475586, 0.01603412628173828, 0.016739368438720703, 0.017444610595703125, 0.018149852752685547, 0.01885509490966797, 0.01956033706665039, 0.020265579223632812, 0.020970821380615234, 0.021676063537597656, 0.022381305694580078, 0.0230865478515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 9.0, 10.0, 6.0, 21.0, 30.0, 38.0, 55.0, 53.0, 94.0, 106.0, 103.0, 116.0, 92.0, 63.0, 52.0, 35.0, 25.0, 20.0, 17.0, 10.0, 11.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.057718276977539e-05, -2.958253026008606e-05, -2.858787775039673e-05, -2.7593225240707397e-05, -2.6598572731018066e-05, -2.5603920221328735e-05, -2.4609267711639404e-05, -2.3614615201950073e-05, -2.2619962692260742e-05, -2.162531018257141e-05, -2.063065767288208e-05, -1.963600516319275e-05, -1.8641352653503418e-05, -1.7646700143814087e-05, -1.6652047634124756e-05, -1.5657395124435425e-05, -1.4662742614746094e-05, -1.3668090105056763e-05, -1.2673437595367432e-05, -1.16787850856781e-05, -1.068413257598877e-05, -9.689480066299438e-06, -8.694827556610107e-06, -7.700175046920776e-06, -6.705522537231445e-06, -5.710870027542114e-06, -4.716217517852783e-06, -3.721565008163452e-06, -2.726912498474121e-06, -1.73225998878479e-06, -7.37607479095459e-07, 2.5704503059387207e-07, 1.2516975402832031e-06, 2.246350049972534e-06, 3.2410025596618652e-06, 4.235655069351196e-06, 5.230307579040527e-06, 6.224960088729858e-06, 7.2196125984191895e-06, 8.21426510810852e-06, 9.208917617797852e-06, 1.0203570127487183e-05, 1.1198222637176514e-05, 1.2192875146865845e-05, 1.3187527656555176e-05, 1.4182180166244507e-05, 1.5176832675933838e-05, 1.617148518562317e-05, 1.71661376953125e-05, 1.816079020500183e-05, 1.9155442714691162e-05, 2.0150095224380493e-05, 2.1144747734069824e-05, 2.2139400243759155e-05, 2.3134052753448486e-05, 2.4128705263137817e-05, 2.512335777282715e-05, 2.611801028251648e-05, 2.711266279220581e-05, 2.810731530189514e-05, 2.9101967811584473e-05, 3.0096620321273804e-05, 3.1091272830963135e-05, 3.2085925340652466e-05, 3.30805778503418e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 12.0, 5.0, 16.0, 28.0, 39.0, 52.0, 95.0, 180.0, 283.0, 533.0, 913.0, 1732.0, 3122.0, 6227.0, 13136.0, 30759.0, 86512.0, 251027.0, 373671.0, 178190.0, 58693.0, 22446.0, 10072.0, 4932.0, 2620.0, 1432.0, 779.0, 422.0, 241.0, 139.0, 83.0, 42.0, 33.0, 28.0, 20.0, 7.0, 9.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251922607421875, -0.02438807487487793, -0.02358388900756836, -0.02277970314025879, -0.02197551727294922, -0.02117133140563965, -0.020367145538330078, -0.019562959671020508, -0.018758773803710938, -0.017954587936401367, -0.017150402069091797, -0.016346216201782227, -0.015542030334472656, -0.014737844467163086, -0.013933658599853516, -0.013129472732543945, -0.012325286865234375, -0.011521100997924805, -0.010716915130615234, -0.009912729263305664, -0.009108543395996094, -0.008304357528686523, -0.007500171661376953, -0.006695985794067383, -0.0058917999267578125, -0.005087614059448242, -0.004283428192138672, -0.0034792423248291016, -0.0026750564575195312, -0.001870870590209961, -0.0010666847229003906, -0.0002624988555908203, 0.00054168701171875, 0.0013458728790283203, 0.0021500587463378906, 0.002954244613647461, 0.0037584304809570312, 0.0045626163482666016, 0.005366802215576172, 0.006170988082885742, 0.0069751739501953125, 0.007779359817504883, 0.008583545684814453, 0.009387731552124023, 0.010191917419433594, 0.010996103286743164, 0.011800289154052734, 0.012604475021362305, 0.013408660888671875, 0.014212846755981445, 0.015017032623291016, 0.015821218490600586, 0.016625404357910156, 0.017429590225219727, 0.018233776092529297, 0.019037961959838867, 0.019842147827148438, 0.020646333694458008, 0.021450519561767578, 0.02225470542907715, 0.02305889129638672, 0.02386307716369629, 0.02466726303100586, 0.02547144889831543, 0.026275634765625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 7.0, 5.0, 10.0, 15.0, 21.0, 32.0, 29.0, 48.0, 47.0, 54.0, 71.0, 79.0, 87.0, 74.0, 69.0, 67.0, 59.0, 35.0, 34.0, 29.0, 29.0, 18.0, 15.0, 8.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026885986328125, -0.026009321212768555, -0.02513265609741211, -0.024255990982055664, -0.02337932586669922, -0.022502660751342773, -0.021625995635986328, -0.020749330520629883, -0.019872665405273438, -0.018996000289916992, -0.018119335174560547, -0.0172426700592041, -0.016366004943847656, -0.015489339828491211, -0.014612674713134766, -0.01373600959777832, -0.012859344482421875, -0.01198267936706543, -0.011106014251708984, -0.010229349136352539, -0.009352684020996094, -0.008476018905639648, -0.007599353790283203, -0.006722688674926758, -0.0058460235595703125, -0.004969358444213867, -0.004092693328857422, -0.0032160282135009766, -0.0023393630981445312, -0.001462697982788086, -0.0005860328674316406, 0.0002906322479248047, 0.00116729736328125, 0.0020439624786376953, 0.0029206275939941406, 0.003797292709350586, 0.004673957824707031, 0.0055506229400634766, 0.006427288055419922, 0.007303953170776367, 0.008180618286132812, 0.009057283401489258, 0.009933948516845703, 0.010810613632202148, 0.011687278747558594, 0.012563943862915039, 0.013440608978271484, 0.01431727409362793, 0.015193939208984375, 0.01607060432434082, 0.016947269439697266, 0.01782393455505371, 0.018700599670410156, 0.0195772647857666, 0.020453929901123047, 0.021330595016479492, 0.022207260131835938, 0.023083925247192383, 0.023960590362548828, 0.024837255477905273, 0.02571392059326172, 0.026590585708618164, 0.02746725082397461, 0.028343915939331055, 0.0292205810546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 12.0, 23.0, 45.0, 73.0, 129.0, 150.0, 128.0, 135.0, 97.0, 64.0, 50.0, 22.0, 15.0, 16.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6170962452888489, -0.6004340648651123, -0.583771824836731, -0.5671096444129944, -0.5504474639892578, -0.5337852835655212, -0.5171231031417847, -0.5004608631134033, -0.48379868268966675, -0.4671365022659302, -0.4504742920398712, -0.43381208181381226, -0.4171499013900757, -0.4004877209663391, -0.38382551074028015, -0.3671633005142212, -0.3505011200904846, -0.33383893966674805, -0.3171767294406891, -0.3005145192146301, -0.28385233879089355, -0.267190158367157, -0.250527948141098, -0.23386575281620026, -0.2172035574913025, -0.20054136216640472, -0.18387916684150696, -0.1672169715166092, -0.15055477619171143, -0.13389258086681366, -0.1172303855419159, -0.10056819021701813, -0.08390593528747559, -0.06724373996257782, -0.050581544637680054, -0.03391934931278229, -0.01725715398788452, -0.0005949586629867554, 0.01606723666191101, 0.03272943198680878, 0.04939162731170654, 0.06605382263660431, 0.08271601796150208, 0.09937821328639984, 0.11604040861129761, 0.13270260393619537, 0.14936479926109314, 0.1660269945859909, 0.18268918991088867, 0.19935138523578644, 0.2160135805606842, 0.23267577588558197, 0.24933797121047974, 0.2660001516342163, 0.28266236186027527, 0.29932457208633423, 0.3159867525100708, 0.3326489329338074, 0.34931114315986633, 0.3659733533859253, 0.38263553380966187, 0.39929771423339844, 0.4159599244594574, 0.43262213468551636, 0.44928431510925293]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 6.0, 7.0, 12.0, 7.0, 9.0, 7.0, 17.0, 21.0, 18.0, 15.0, 30.0, 41.0, 35.0, 42.0, 33.0, 41.0, 49.0, 45.0, 51.0, 40.0, 55.0, 41.0, 44.0, 33.0, 40.0, 27.0, 37.0, 31.0, 38.0, 21.0, 8.0, 21.0, 18.0, 13.0, 7.0, 3.0, 11.0, 6.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2074335217475891, -0.20127350091934204, -0.19511348009109497, -0.1889534592628479, -0.18279342353343964, -0.17663340270519257, -0.1704733818769455, -0.16431336104869843, -0.15815332531929016, -0.1519933044910431, -0.14583328366279602, -0.13967326283454895, -0.13351322710514069, -0.12735320627689362, -0.12119318544864655, -0.11503316462039948, -0.1088731437921524, -0.10271312296390533, -0.09655309468507767, -0.0903930738568306, -0.08423304557800293, -0.07807302474975586, -0.07191300392150879, -0.06575298309326172, -0.05959295481443405, -0.05343293026089668, -0.047272905707359314, -0.041112884879112244, -0.034952860325574875, -0.028792835772037506, -0.022632814943790436, -0.016472790390253067, -0.010312765836715698, -0.004152742214500904, 0.00200728140771389, 0.00816730409860611, 0.014327328652143478, 0.020487353205680847, 0.026647374033927917, 0.032807398587465286, 0.038967423141002655, 0.045127447694540024, 0.05128747224807739, 0.05744749307632446, 0.06360751390457153, 0.0697675421833992, 0.07592756301164627, 0.08208759129047394, 0.08824761211872101, 0.09440763294696808, 0.10056766122579575, 0.10672768205404282, 0.11288771033287048, 0.11904773116111755, 0.12520775198936462, 0.1313677728176117, 0.13752779364585876, 0.14368781447410583, 0.1498478353023529, 0.15600785613059998, 0.16216789186000824, 0.1683279126882553, 0.17448793351650238, 0.18064795434474945, 0.18680799007415771]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 0.0, 6.0, 6.0, 9.0, 16.0, 19.0, 29.0, 39.0, 59.0, 75.0, 99.0, 168.0, 295.0, 474.0, 813.0, 1580.0, 2904.0, 6412.0, 15136.0, 42112.0, 149648.0, 965925.0, 2403310.0, 463799.0, 91314.0, 29214.0, 11131.0, 4773.0, 2210.0, 1173.0, 622.0, 353.0, 194.0, 143.0, 78.0, 46.0, 30.0, 25.0, 16.0, 9.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0574951171875, -0.055912017822265625, -0.05432891845703125, -0.052745819091796875, -0.0511627197265625, -0.049579620361328125, -0.04799652099609375, -0.046413421630859375, -0.044830322265625, -0.043247222900390625, -0.04166412353515625, -0.040081024169921875, -0.0384979248046875, -0.036914825439453125, -0.03533172607421875, -0.033748626708984375, -0.03216552734375, -0.030582427978515625, -0.02899932861328125, -0.027416229248046875, -0.0258331298828125, -0.024250030517578125, -0.02266693115234375, -0.021083831787109375, -0.019500732421875, -0.017917633056640625, -0.01633453369140625, -0.014751434326171875, -0.0131683349609375, -0.011585235595703125, -0.01000213623046875, -0.008419036865234375, -0.0068359375, -0.005252838134765625, -0.00366973876953125, -0.002086639404296875, -0.0005035400390625, 0.001079559326171875, 0.00266265869140625, 0.004245758056640625, 0.005828857421875, 0.007411956787109375, 0.00899505615234375, 0.010578155517578125, 0.0121612548828125, 0.013744354248046875, 0.01532745361328125, 0.016910552978515625, 0.01849365234375, 0.020076751708984375, 0.02165985107421875, 0.023242950439453125, 0.0248260498046875, 0.026409149169921875, 0.02799224853515625, 0.029575347900390625, 0.031158447265625, 0.032741546630859375, 0.03432464599609375, 0.035907745361328125, 0.0374908447265625, 0.039073944091796875, 0.04065704345703125, 0.042240142822265625, 0.0438232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 10.0, 11.0, 21.0, 13.0, 26.0, 31.0, 27.0, 25.0, 46.0, 40.0, 45.0, 56.0, 55.0, 58.0, 63.0, 45.0, 64.0, 60.0, 56.0, 46.0, 37.0, 33.0, 37.0, 18.0, 24.0, 21.0, 9.0, 5.0, 8.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.03386068344116211, -0.03293132781982422, -0.03200197219848633, -0.031072616577148438, -0.030143260955810547, -0.029213905334472656, -0.028284549713134766, -0.027355194091796875, -0.026425838470458984, -0.025496482849121094, -0.024567127227783203, -0.023637771606445312, -0.022708415985107422, -0.02177906036376953, -0.02084970474243164, -0.01992034912109375, -0.01899099349975586, -0.01806163787841797, -0.017132282257080078, -0.016202926635742188, -0.015273571014404297, -0.014344215393066406, -0.013414859771728516, -0.012485504150390625, -0.011556148529052734, -0.010626792907714844, -0.009697437286376953, -0.008768081665039062, -0.007838726043701172, -0.006909370422363281, -0.005980014801025391, -0.0050506591796875, -0.004121303558349609, -0.0031919479370117188, -0.002262592315673828, -0.0013332366943359375, -0.0004038810729980469, 0.0005254745483398438, 0.0014548301696777344, 0.002384185791015625, 0.0033135414123535156, 0.004242897033691406, 0.005172252655029297, 0.0061016082763671875, 0.007030963897705078, 0.007960319519042969, 0.00888967514038086, 0.00981903076171875, 0.01074838638305664, 0.011677742004394531, 0.012607097625732422, 0.013536453247070312, 0.014465808868408203, 0.015395164489746094, 0.016324520111083984, 0.017253875732421875, 0.018183231353759766, 0.019112586975097656, 0.020041942596435547, 0.020971298217773438, 0.021900653839111328, 0.02283000946044922, 0.02375936508178711, 0.024688720703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 12.0, 18.0, 22.0, 23.0, 22.0, 40.0, 68.0, 93.0, 136.0, 208.0, 347.0, 634.0, 1069.0, 1879.0, 3873.0, 8462.0, 20567.0, 57930.0, 207477.0, 1529241.0, 2005394.0, 248766.0, 66407.0, 23314.0, 9377.0, 4279.0, 2014.0, 1033.0, 573.0, 355.0, 236.0, 119.0, 91.0, 73.0, 47.0, 21.0, 14.0, 13.0, 9.0, 6.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.059478759765625, -0.05778217315673828, -0.05608558654785156, -0.054388999938964844, -0.052692413330078125, -0.050995826721191406, -0.04929924011230469, -0.04760265350341797, -0.04590606689453125, -0.04420948028564453, -0.04251289367675781, -0.040816307067871094, -0.039119720458984375, -0.037423133850097656, -0.03572654724121094, -0.03402996063232422, -0.0323333740234375, -0.03063678741455078, -0.028940200805664062, -0.027243614196777344, -0.025547027587890625, -0.023850440979003906, -0.022153854370117188, -0.02045726776123047, -0.01876068115234375, -0.01706409454345703, -0.015367507934570312, -0.013670921325683594, -0.011974334716796875, -0.010277748107910156, -0.008581161499023438, -0.006884574890136719, -0.00518798828125, -0.0034914016723632812, -0.0017948150634765625, -9.822845458984375e-05, 0.001598358154296875, 0.0032949447631835938, 0.0049915313720703125, 0.006688117980957031, 0.00838470458984375, 0.010081291198730469, 0.011777877807617188, 0.013474464416503906, 0.015171051025390625, 0.016867637634277344, 0.018564224243164062, 0.02026081085205078, 0.0219573974609375, 0.02365398406982422, 0.025350570678710938, 0.027047157287597656, 0.028743743896484375, 0.030440330505371094, 0.03213691711425781, 0.03383350372314453, 0.03553009033203125, 0.03722667694091797, 0.03892326354980469, 0.040619850158691406, 0.042316436767578125, 0.044013023376464844, 0.04570960998535156, 0.04740619659423828, 0.049102783203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 8.0, 9.0, 12.0, 12.0, 19.0, 36.0, 38.0, 59.0, 66.0, 75.0, 106.0, 163.0, 230.0, 393.0, 665.0, 781.0, 476.0, 268.0, 194.0, 104.0, 78.0, 71.0, 51.0, 34.0, 30.0, 23.0, 23.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059417724609375, -0.057679176330566406, -0.05594062805175781, -0.05420207977294922, -0.052463531494140625, -0.05072498321533203, -0.04898643493652344, -0.047247886657714844, -0.04550933837890625, -0.043770790100097656, -0.04203224182128906, -0.04029369354248047, -0.038555145263671875, -0.03681659698486328, -0.03507804870605469, -0.033339500427246094, -0.0316009521484375, -0.029862403869628906, -0.028123855590820312, -0.02638530731201172, -0.024646759033203125, -0.02290821075439453, -0.021169662475585938, -0.019431114196777344, -0.01769256591796875, -0.015954017639160156, -0.014215469360351562, -0.012476921081542969, -0.010738372802734375, -0.008999824523925781, -0.0072612762451171875, -0.005522727966308594, -0.0037841796875, -0.0020456314086914062, -0.0003070831298828125, 0.0014314651489257812, 0.003170013427734375, 0.004908561706542969, 0.0066471099853515625, 0.008385658264160156, 0.01012420654296875, 0.011862754821777344, 0.013601303100585938, 0.015339851379394531, 0.017078399658203125, 0.01881694793701172, 0.020555496215820312, 0.022294044494628906, 0.0240325927734375, 0.025771141052246094, 0.027509689331054688, 0.02924823760986328, 0.030986785888671875, 0.03272533416748047, 0.03446388244628906, 0.036202430725097656, 0.03794097900390625, 0.039679527282714844, 0.04141807556152344, 0.04315662384033203, 0.044895172119140625, 0.04663372039794922, 0.04837226867675781, 0.050110816955566406, 0.051849365234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 8.0, 13.0, 24.0, 44.0, 123.0, 214.0, 249.0, 173.0, 92.0, 28.0, 16.0, 6.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3506079316139221, -0.32650020718574524, -0.30239245295524597, -0.2782847285270691, -0.2541769742965698, -0.23006924986839294, -0.20596152544021606, -0.181853786110878, -0.15774604678153992, -0.13363830745220184, -0.10953057557344437, -0.08542284369468689, -0.061315104365348816, -0.03720736503601074, -0.013099640607833862, 0.011008098721504211, 0.035115838050842285, 0.05922357365489006, 0.08333130925893784, 0.10743904113769531, 0.1315467804670334, 0.15565451979637146, 0.17976224422454834, 0.2038699835538864, 0.2279777228832245, 0.25208544731140137, 0.27619320154190063, 0.3003009259700775, 0.3244086503982544, 0.34851640462875366, 0.37262412905693054, 0.3967318534851074, 0.42083966732025146, 0.44494739174842834, 0.4690551459789276, 0.4931628704071045, 0.5172706246376038, 0.541378378868103, 0.5654860734939575, 0.5895938277244568, 0.613701581954956, 0.6378093361854553, 0.6619170308113098, 0.6860247850418091, 0.7101325392723083, 0.7342402935028076, 0.7583479881286621, 0.7824557423591614, 0.8065634369850159, 0.8306711912155151, 0.8547788858413696, 0.8788866400718689, 0.9029943943023682, 0.9271020889282227, 0.9512098431587219, 0.9753175973892212, 0.9994252920150757, 1.0235329866409302, 1.0476408004760742, 1.0717484951019287, 1.0958561897277832, 1.1199640035629272, 1.1440716981887817, 1.1681793928146362, 1.1922872066497803]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 1.0, 3.0, 7.0, 14.0, 8.0, 13.0, 20.0, 19.0, 27.0, 30.0, 32.0, 40.0, 31.0, 36.0, 38.0, 50.0, 52.0, 41.0, 65.0, 55.0, 44.0, 50.0, 49.0, 46.0, 51.0, 48.0, 22.0, 24.0, 24.0, 11.0, 11.0, 6.0, 12.0, 8.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2203013300895691, -0.21291813254356384, -0.2055349498987198, -0.19815175235271454, -0.19076856970787048, -0.18338537216186523, -0.17600217461585999, -0.16861897706985474, -0.16123579442501068, -0.15385259687900543, -0.14646941423416138, -0.13908621668815613, -0.13170301914215088, -0.12431983649730682, -0.11693663895130157, -0.10955344885587692, -0.10217025876045227, -0.09478706866502762, -0.08740387856960297, -0.08002068102359772, -0.07263749092817307, -0.06525430083274841, -0.05787110701203346, -0.05048791319131851, -0.04310472309589386, -0.03572153300046921, -0.028338339179754257, -0.020955147221684456, -0.013571955263614655, -0.0061887651681900024, 0.0011944286525249481, 0.008577622473239899, 0.01596081256866455, 0.023344004526734352, 0.030727196484804153, 0.038110390305519104, 0.045493580400943756, 0.05287677049636841, 0.06025996431708336, 0.06764315813779831, 0.07502634823322296, 0.08240953832864761, 0.08979272842407227, 0.09717592597007751, 0.10455911606550217, 0.11194230616092682, 0.11932550370693207, 0.12670868635177612, 0.13409188389778137, 0.14147508144378662, 0.14885826408863068, 0.15624146163463593, 0.16362464427947998, 0.17100784182548523, 0.17839103937149048, 0.18577423691749573, 0.19315741956233978, 0.20054061710834503, 0.2079237997531891, 0.21530699729919434, 0.22269019484519958, 0.23007337749004364, 0.2374565750360489, 0.24483975768089294, 0.2522229552268982]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 8.0, 28.0, 39.0, 39.0, 63.0, 118.0, 179.0, 329.0, 544.0, 1059.0, 2010.0, 3863.0, 8043.0, 16389.0, 35411.0, 78747.0, 169011.0, 271757.0, 234532.0, 122209.0, 55336.0, 24944.0, 11849.0, 5669.0, 2910.0, 1464.0, 820.0, 459.0, 285.0, 156.0, 73.0, 74.0, 41.0, 19.0, 17.0, 5.0, 8.0, 13.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.0621337890625, -0.06039714813232422, -0.05866050720214844, -0.056923866271972656, -0.055187225341796875, -0.053450584411621094, -0.05171394348144531, -0.04997730255126953, -0.04824066162109375, -0.04650402069091797, -0.04476737976074219, -0.043030738830566406, -0.041294097900390625, -0.039557456970214844, -0.03782081604003906, -0.03608417510986328, -0.0343475341796875, -0.03261089324951172, -0.030874252319335938, -0.029137611389160156, -0.027400970458984375, -0.025664329528808594, -0.023927688598632812, -0.02219104766845703, -0.02045440673828125, -0.01871776580810547, -0.016981124877929688, -0.015244483947753906, -0.013507843017578125, -0.011771202087402344, -0.010034561157226562, -0.008297920227050781, -0.006561279296875, -0.004824638366699219, -0.0030879974365234375, -0.0013513565063476562, 0.000385284423828125, 0.0021219253540039062, 0.0038585662841796875, 0.005595207214355469, 0.00733184814453125, 0.009068489074707031, 0.010805130004882812, 0.012541770935058594, 0.014278411865234375, 0.016015052795410156, 0.017751693725585938, 0.01948833465576172, 0.0212249755859375, 0.02296161651611328, 0.024698257446289062, 0.026434898376464844, 0.028171539306640625, 0.029908180236816406, 0.03164482116699219, 0.03338146209716797, 0.03511810302734375, 0.03685474395751953, 0.03859138488769531, 0.040328025817871094, 0.042064666748046875, 0.043801307678222656, 0.04553794860839844, 0.04727458953857422, 0.04901123046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 12.0, 11.0, 18.0, 17.0, 35.0, 33.0, 24.0, 38.0, 34.0, 33.0, 33.0, 53.0, 58.0, 45.0, 56.0, 53.0, 45.0, 58.0, 43.0, 42.0, 36.0, 42.0, 36.0, 27.0, 15.0, 20.0, 13.0, 8.0, 12.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.036956787109375, -0.03601646423339844, -0.035076141357421875, -0.03413581848144531, -0.03319549560546875, -0.03225517272949219, -0.031314849853515625, -0.030374526977539062, -0.0294342041015625, -0.028493881225585938, -0.027553558349609375, -0.026613235473632812, -0.02567291259765625, -0.024732589721679688, -0.023792266845703125, -0.022851943969726562, -0.02191162109375, -0.020971298217773438, -0.020030975341796875, -0.019090652465820312, -0.01815032958984375, -0.017210006713867188, -0.016269683837890625, -0.015329360961914062, -0.0143890380859375, -0.013448715209960938, -0.012508392333984375, -0.011568069458007812, -0.01062774658203125, -0.009687423706054688, -0.008747100830078125, -0.0078067779541015625, -0.006866455078125, -0.0059261322021484375, -0.004985809326171875, -0.0040454864501953125, -0.00310516357421875, -0.0021648406982421875, -0.001224517822265625, -0.0002841949462890625, 0.0006561279296875, 0.0015964508056640625, 0.002536773681640625, 0.0034770965576171875, 0.00441741943359375, 0.0053577423095703125, 0.006298065185546875, 0.0072383880615234375, 0.0081787109375, 0.009119033813476562, 0.010059356689453125, 0.010999679565429688, 0.01194000244140625, 0.012880325317382812, 0.013820648193359375, 0.014760971069335938, 0.0157012939453125, 0.016641616821289062, 0.017581939697265625, 0.018522262573242188, 0.01946258544921875, 0.020402908325195312, 0.021343231201171875, 0.022283554077148438, 0.023223876953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 5.0, 9.0, 15.0, 13.0, 19.0, 20.0, 40.0, 61.0, 79.0, 157.0, 265.0, 338.0, 529.0, 909.0, 1542.0, 2687.0, 4813.0, 9025.0, 17331.0, 35510.0, 79776.0, 185088.0, 340143.0, 202606.0, 88312.0, 38715.0, 18636.0, 9535.0, 5154.0, 2944.0, 1657.0, 942.0, 572.0, 379.0, 226.0, 149.0, 104.0, 65.0, 61.0, 30.0, 24.0, 22.0, 18.0, 7.0, 6.0, 8.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.061859130859375, -0.06006908416748047, -0.05827903747558594, -0.056488990783691406, -0.054698944091796875, -0.052908897399902344, -0.05111885070800781, -0.04932880401611328, -0.04753875732421875, -0.04574871063232422, -0.04395866394042969, -0.042168617248535156, -0.040378570556640625, -0.038588523864746094, -0.03679847717285156, -0.03500843048095703, -0.0332183837890625, -0.03142833709716797, -0.029638290405273438, -0.027848243713378906, -0.026058197021484375, -0.024268150329589844, -0.022478103637695312, -0.02068805694580078, -0.01889801025390625, -0.01710796356201172, -0.015317916870117188, -0.013527870178222656, -0.011737823486328125, -0.009947776794433594, -0.008157730102539062, -0.006367683410644531, -0.00457763671875, -0.0027875900268554688, -0.0009975433349609375, 0.0007925033569335938, 0.002582550048828125, 0.004372596740722656, 0.0061626434326171875, 0.007952690124511719, 0.00974273681640625, 0.011532783508300781, 0.013322830200195312, 0.015112876892089844, 0.016902923583984375, 0.018692970275878906, 0.020483016967773438, 0.02227306365966797, 0.0240631103515625, 0.02585315704345703, 0.027643203735351562, 0.029433250427246094, 0.031223297119140625, 0.033013343811035156, 0.03480339050292969, 0.03659343719482422, 0.03838348388671875, 0.04017353057861328, 0.04196357727050781, 0.043753623962402344, 0.045543670654296875, 0.047333717346191406, 0.04912376403808594, 0.05091381072998047, 0.052703857421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 4.0, 11.0, 10.0, 10.0, 15.0, 20.0, 20.0, 21.0, 36.0, 23.0, 33.0, 45.0, 45.0, 46.0, 51.0, 57.0, 54.0, 53.0, 52.0, 38.0, 46.0, 41.0, 31.0, 36.0, 24.0, 23.0, 33.0, 19.0, 19.0, 17.0, 12.0, 12.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.10028076171875, -0.09762096405029297, -0.09496116638183594, -0.0923013687133789, -0.08964157104492188, -0.08698177337646484, -0.08432197570800781, -0.08166217803955078, -0.07900238037109375, -0.07634258270263672, -0.07368278503417969, -0.07102298736572266, -0.06836318969726562, -0.0657033920288086, -0.06304359436035156, -0.06038379669189453, -0.0577239990234375, -0.05506420135498047, -0.05240440368652344, -0.049744606018066406, -0.047084808349609375, -0.044425010681152344, -0.04176521301269531, -0.03910541534423828, -0.03644561767578125, -0.03378582000732422, -0.031126022338867188, -0.028466224670410156, -0.025806427001953125, -0.023146629333496094, -0.020486831665039062, -0.01782703399658203, -0.015167236328125, -0.012507438659667969, -0.009847640991210938, -0.007187843322753906, -0.004528045654296875, -0.0018682479858398438, 0.0007915496826171875, 0.0034513473510742188, 0.00611114501953125, 0.008770942687988281, 0.011430740356445312, 0.014090538024902344, 0.016750335693359375, 0.019410133361816406, 0.022069931030273438, 0.02472972869873047, 0.0273895263671875, 0.03004932403564453, 0.03270912170410156, 0.035368919372558594, 0.038028717041015625, 0.040688514709472656, 0.04334831237792969, 0.04600811004638672, 0.04866790771484375, 0.05132770538330078, 0.05398750305175781, 0.056647300720214844, 0.059307098388671875, 0.061966896057128906, 0.06462669372558594, 0.06728649139404297, 0.0699462890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 8.0, 4.0, 5.0, 10.0, 15.0, 19.0, 35.0, 48.0, 79.0, 110.0, 163.0, 277.0, 417.0, 622.0, 1010.0, 1716.0, 2737.0, 4534.0, 7577.0, 13482.0, 26290.0, 60327.0, 173494.0, 420092.0, 202657.0, 68724.0, 29118.0, 14427.0, 8137.0, 4740.0, 2916.0, 1780.0, 1058.0, 685.0, 465.0, 293.0, 155.0, 108.0, 71.0, 53.0, 31.0, 22.0, 13.0, 17.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.022064208984375, -0.021406888961791992, -0.020749568939208984, -0.020092248916625977, -0.01943492889404297, -0.01877760887145996, -0.018120288848876953, -0.017462968826293945, -0.016805648803710938, -0.01614832878112793, -0.015491008758544922, -0.014833688735961914, -0.014176368713378906, -0.013519048690795898, -0.01286172866821289, -0.012204408645629883, -0.011547088623046875, -0.010889768600463867, -0.01023244857788086, -0.009575128555297852, -0.008917808532714844, -0.008260488510131836, -0.007603168487548828, -0.00694584846496582, -0.0062885284423828125, -0.005631208419799805, -0.004973888397216797, -0.004316568374633789, -0.0036592483520507812, -0.0030019283294677734, -0.0023446083068847656, -0.0016872882843017578, -0.00102996826171875, -0.0003726482391357422, 0.0002846717834472656, 0.0009419918060302734, 0.0015993118286132812, 0.002256631851196289, 0.002913951873779297, 0.0035712718963623047, 0.0042285919189453125, 0.00488591194152832, 0.005543231964111328, 0.006200551986694336, 0.006857872009277344, 0.0075151920318603516, 0.00817251205444336, 0.008829832077026367, 0.009487152099609375, 0.010144472122192383, 0.01080179214477539, 0.011459112167358398, 0.012116432189941406, 0.012773752212524414, 0.013431072235107422, 0.01408839225769043, 0.014745712280273438, 0.015403032302856445, 0.016060352325439453, 0.01671767234802246, 0.01737499237060547, 0.018032312393188477, 0.018689632415771484, 0.019346952438354492, 0.0200042724609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 4.0, 8.0, 9.0, 8.0, 10.0, 16.0, 27.0, 20.0, 30.0, 34.0, 34.0, 47.0, 50.0, 60.0, 65.0, 55.0, 58.0, 58.0, 45.0, 48.0, 51.0, 34.0, 32.0, 28.0, 25.0, 26.0, 21.0, 11.0, 17.0, 14.0, 14.0, 9.0, 4.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1832995116710663e-05, -2.119503915309906e-05, -2.0557083189487457e-05, -1.9919127225875854e-05, -1.9281171262264252e-05, -1.864321529865265e-05, -1.8005259335041046e-05, -1.7367303371429443e-05, -1.672934740781784e-05, -1.6091391444206238e-05, -1.5453435480594635e-05, -1.4815479516983032e-05, -1.417752355337143e-05, -1.3539567589759827e-05, -1.2901611626148224e-05, -1.2263655662536621e-05, -1.1625699698925018e-05, -1.0987743735313416e-05, -1.0349787771701813e-05, -9.71183180809021e-06, -9.073875844478607e-06, -8.435919880867004e-06, -7.797963917255402e-06, -7.160007953643799e-06, -6.522051990032196e-06, -5.884096026420593e-06, -5.2461400628089905e-06, -4.608184099197388e-06, -3.970228135585785e-06, -3.332272171974182e-06, -2.6943162083625793e-06, -2.0563602447509766e-06, -1.4184042811393738e-06, -7.80448317527771e-07, -1.424923539161682e-07, 4.954636096954346e-07, 1.1334195733070374e-06, 1.7713755369186401e-06, 2.409331500530243e-06, 3.0472874641418457e-06, 3.6852434277534485e-06, 4.323199391365051e-06, 4.961155354976654e-06, 5.599111318588257e-06, 6.23706728219986e-06, 6.875023245811462e-06, 7.512979209423065e-06, 8.150935173034668e-06, 8.78889113664627e-06, 9.426847100257874e-06, 1.0064803063869476e-05, 1.0702759027481079e-05, 1.1340714991092682e-05, 1.1978670954704285e-05, 1.2616626918315887e-05, 1.325458288192749e-05, 1.3892538845539093e-05, 1.4530494809150696e-05, 1.5168450772762299e-05, 1.58064067363739e-05, 1.6444362699985504e-05, 1.7082318663597107e-05, 1.772027462720871e-05, 1.8358230590820312e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 8.0, 23.0, 36.0, 28.0, 47.0, 68.0, 81.0, 162.0, 287.0, 427.0, 700.0, 1250.0, 2203.0, 4201.0, 8515.0, 19211.0, 48308.0, 145990.0, 425246.0, 257131.0, 80029.0, 29246.0, 12353.0, 5920.0, 2959.0, 1673.0, 915.0, 588.0, 344.0, 210.0, 124.0, 85.0, 50.0, 30.0, 23.0, 24.0, 15.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0203857421875, -0.01967644691467285, -0.018967151641845703, -0.018257856369018555, -0.017548561096191406, -0.016839265823364258, -0.01612997055053711, -0.015420675277709961, -0.014711380004882812, -0.014002084732055664, -0.013292789459228516, -0.012583494186401367, -0.011874198913574219, -0.01116490364074707, -0.010455608367919922, -0.009746313095092773, -0.009037017822265625, -0.008327722549438477, -0.007618427276611328, -0.00690913200378418, -0.006199836730957031, -0.005490541458129883, -0.004781246185302734, -0.004071950912475586, -0.0033626556396484375, -0.002653360366821289, -0.0019440650939941406, -0.0012347698211669922, -0.0005254745483398438, 0.0001838207244873047, 0.0008931159973144531, 0.0016024112701416016, 0.00231170654296875, 0.0030210018157958984, 0.003730297088623047, 0.004439592361450195, 0.005148887634277344, 0.005858182907104492, 0.006567478179931641, 0.007276773452758789, 0.007986068725585938, 0.008695363998413086, 0.009404659271240234, 0.010113954544067383, 0.010823249816894531, 0.01153254508972168, 0.012241840362548828, 0.012951135635375977, 0.013660430908203125, 0.014369726181030273, 0.015079021453857422, 0.01578831672668457, 0.01649761199951172, 0.017206907272338867, 0.017916202545166016, 0.018625497817993164, 0.019334793090820312, 0.02004408836364746, 0.02075338363647461, 0.021462678909301758, 0.022171974182128906, 0.022881269454956055, 0.023590564727783203, 0.02429986000061035, 0.0250091552734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 4.0, 9.0, 6.0, 4.0, 17.0, 19.0, 21.0, 43.0, 48.0, 63.0, 99.0, 120.0, 95.0, 92.0, 102.0, 53.0, 35.0, 34.0, 30.0, 17.0, 10.0, 13.0, 12.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02825927734375, -0.027256488800048828, -0.026253700256347656, -0.025250911712646484, -0.024248123168945312, -0.02324533462524414, -0.02224254608154297, -0.021239757537841797, -0.020236968994140625, -0.019234180450439453, -0.01823139190673828, -0.01722860336303711, -0.016225814819335938, -0.015223026275634766, -0.014220237731933594, -0.013217449188232422, -0.01221466064453125, -0.011211872100830078, -0.010209083557128906, -0.009206295013427734, -0.008203506469726562, -0.007200717926025391, -0.006197929382324219, -0.005195140838623047, -0.004192352294921875, -0.003189563751220703, -0.0021867752075195312, -0.0011839866638183594, -0.0001811981201171875, 0.0008215904235839844, 0.0018243789672851562, 0.002827167510986328, 0.0038299560546875, 0.004832744598388672, 0.005835533142089844, 0.006838321685791016, 0.007841110229492188, 0.00884389877319336, 0.009846687316894531, 0.010849475860595703, 0.011852264404296875, 0.012855052947998047, 0.013857841491699219, 0.01486063003540039, 0.015863418579101562, 0.016866207122802734, 0.017868995666503906, 0.018871784210205078, 0.01987457275390625, 0.020877361297607422, 0.021880149841308594, 0.022882938385009766, 0.023885726928710938, 0.02488851547241211, 0.02589130401611328, 0.026894092559814453, 0.027896881103515625, 0.028899669647216797, 0.02990245819091797, 0.03090524673461914, 0.03190803527832031, 0.032910823822021484, 0.033913612365722656, 0.03491640090942383, 0.035919189453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 8.0, 17.0, 21.0, 70.0, 138.0, 203.0, 226.0, 145.0, 92.0, 42.0, 21.0, 8.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310897350311279, -0.8031781911849976, -0.7752665877342224, -0.747355043888092, -0.7194434404373169, -0.6915318965911865, -0.6636203527450562, -0.6357088088989258, -0.6077972054481506, -0.5798856616020203, -0.5519740581512451, -0.5240625143051147, -0.496150940656662, -0.46823936700820923, -0.44032782316207886, -0.4124162495136261, -0.38450467586517334, -0.3565931022167206, -0.3286815285682678, -0.30076998472213745, -0.2728584110736847, -0.24494683742523193, -0.21703527867794037, -0.1891237199306488, -0.16121214628219604, -0.1333005726337433, -0.10538901388645172, -0.07747744768857956, -0.0495658814907074, -0.02165430784225464, 0.006257250905036926, 0.03416880965232849, 0.062080323696136475, 0.08999188989400864, 0.1179034560918808, 0.14581501483917236, 0.17372658848762512, 0.20163816213607788, 0.22954972088336945, 0.257461279630661, 0.28537285327911377, 0.31328442692756653, 0.3411960005760193, 0.36910754442214966, 0.3970191180706024, 0.4249306917190552, 0.45284223556518555, 0.4807538092136383, 0.5086653828620911, 0.5365769267082214, 0.5644885301589966, 0.592400074005127, 0.6203116178512573, 0.6482232213020325, 0.6761347651481628, 0.704046368598938, 0.7319579124450684, 0.7598694562911987, 0.7877810597419739, 0.8156926035881042, 0.8436042070388794, 0.8715157508850098, 0.8994272947311401, 0.9273388385772705, 0.9552504420280457]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 5.0, 12.0, 8.0, 13.0, 12.0, 10.0, 16.0, 16.0, 14.0, 19.0, 30.0, 26.0, 34.0, 31.0, 43.0, 27.0, 35.0, 41.0, 41.0, 37.0, 52.0, 54.0, 41.0, 45.0, 25.0, 38.0, 39.0, 29.0, 35.0, 25.0, 23.0, 19.0, 13.0, 10.0, 17.0, 12.0, 8.0, 5.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.23471873998641968, -0.22769717872142792, -0.22067561745643616, -0.2136540561914444, -0.20663249492645264, -0.19961093366146088, -0.19258937239646912, -0.18556781113147736, -0.1785462498664856, -0.17152468860149384, -0.16450312733650208, -0.15748156607151031, -0.15046000480651855, -0.1434384435415268, -0.13641688227653503, -0.12939532101154327, -0.12237375974655151, -0.11535219848155975, -0.108330637216568, -0.10130907595157623, -0.09428751468658447, -0.08726595342159271, -0.08024439215660095, -0.07322283089160919, -0.06620126962661743, -0.05917970836162567, -0.05215814709663391, -0.04513658583164215, -0.03811502456665039, -0.03109346330165863, -0.02407190203666687, -0.01705034077167511, -0.01002877950668335, -0.0030072182416915894, 0.004014343023300171, 0.011035904288291931, 0.01805746555328369, 0.02507902681827545, 0.03210058808326721, 0.03912214934825897, 0.04614371061325073, 0.05316527187824249, 0.06018683314323425, 0.06720839440822601, 0.07422995567321777, 0.08125151693820953, 0.0882730782032013, 0.09529463946819305, 0.10231620073318481, 0.10933776199817657, 0.11635932326316833, 0.1233808845281601, 0.13040244579315186, 0.13742400705814362, 0.14444556832313538, 0.15146712958812714, 0.1584886908531189, 0.16551025211811066, 0.17253181338310242, 0.17955337464809418, 0.18657493591308594, 0.1935964971780777, 0.20061805844306946, 0.20763961970806122, 0.21466118097305298]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 16.0, 18.0, 30.0, 59.0, 65.0, 126.0, 215.0, 332.0, 641.0, 1160.0, 2533.0, 5634.0, 14247.0, 39687.0, 128976.0, 532801.0, 1858206.0, 1216661.0, 274458.0, 75622.0, 25198.0, 9741.0, 4043.0, 1825.0, 929.0, 455.0, 255.0, 127.0, 76.0, 50.0, 24.0, 20.0, 10.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08184814453125, -0.07962274551391602, -0.07739734649658203, -0.07517194747924805, -0.07294654846191406, -0.07072114944458008, -0.0684957504272461, -0.06627035140991211, -0.06404495239257812, -0.06181955337524414, -0.059594154357910156, -0.05736875534057617, -0.05514335632324219, -0.0529179573059082, -0.05069255828857422, -0.048467159271240234, -0.04624176025390625, -0.044016361236572266, -0.04179096221923828, -0.0395655632019043, -0.03734016418457031, -0.03511476516723633, -0.032889366149902344, -0.03066396713256836, -0.028438568115234375, -0.02621316909790039, -0.023987770080566406, -0.021762371063232422, -0.019536972045898438, -0.017311573028564453, -0.015086174011230469, -0.012860774993896484, -0.0106353759765625, -0.008409976959228516, -0.006184577941894531, -0.003959178924560547, -0.0017337799072265625, 0.0004916191101074219, 0.0027170181274414062, 0.004942417144775391, 0.007167816162109375, 0.00939321517944336, 0.011618614196777344, 0.013844013214111328, 0.016069412231445312, 0.018294811248779297, 0.02052021026611328, 0.022745609283447266, 0.02497100830078125, 0.027196407318115234, 0.02942180633544922, 0.0316472053527832, 0.03387260437011719, 0.03609800338745117, 0.038323402404785156, 0.04054880142211914, 0.042774200439453125, 0.04499959945678711, 0.047224998474121094, 0.04945039749145508, 0.05167579650878906, 0.05390119552612305, 0.05612659454345703, 0.058351993560791016, 0.060577392578125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 6.0, 4.0, 8.0, 12.0, 22.0, 19.0, 25.0, 28.0, 38.0, 40.0, 39.0, 33.0, 47.0, 41.0, 53.0, 54.0, 59.0, 53.0, 55.0, 42.0, 44.0, 45.0, 48.0, 28.0, 34.0, 23.0, 22.0, 20.0, 19.0, 8.0, 11.0, 3.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.037109375, -0.0361628532409668, -0.035216331481933594, -0.03426980972290039, -0.03332328796386719, -0.032376766204833984, -0.03143024444580078, -0.030483722686767578, -0.029537200927734375, -0.028590679168701172, -0.02764415740966797, -0.026697635650634766, -0.025751113891601562, -0.02480459213256836, -0.023858070373535156, -0.022911548614501953, -0.02196502685546875, -0.021018505096435547, -0.020071983337402344, -0.01912546157836914, -0.018178939819335938, -0.017232418060302734, -0.01628589630126953, -0.015339374542236328, -0.014392852783203125, -0.013446331024169922, -0.012499809265136719, -0.011553287506103516, -0.010606765747070312, -0.00966024398803711, -0.008713722229003906, -0.007767200469970703, -0.0068206787109375, -0.005874156951904297, -0.004927635192871094, -0.003981113433837891, -0.0030345916748046875, -0.0020880699157714844, -0.0011415481567382812, -0.00019502639770507812, 0.000751495361328125, 0.0016980171203613281, 0.0026445388793945312, 0.0035910606384277344, 0.0045375823974609375, 0.005484104156494141, 0.006430625915527344, 0.007377147674560547, 0.00832366943359375, 0.009270191192626953, 0.010216712951660156, 0.01116323471069336, 0.012109756469726562, 0.013056278228759766, 0.014002799987792969, 0.014949321746826172, 0.015895843505859375, 0.016842365264892578, 0.01778888702392578, 0.018735408782958984, 0.019681930541992188, 0.02062845230102539, 0.021574974060058594, 0.022521495819091797, 0.023468017578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 9.0, 10.0, 13.0, 12.0, 23.0, 22.0, 32.0, 45.0, 77.0, 126.0, 191.0, 268.0, 520.0, 796.0, 1618.0, 3421.0, 8211.0, 24592.0, 107758.0, 877577.0, 2746536.0, 340033.0, 55830.0, 15301.0, 5672.0, 2525.0, 1270.0, 687.0, 398.0, 240.0, 142.0, 99.0, 73.0, 48.0, 14.0, 23.0, 18.0, 16.0, 10.0, 7.0, 5.0, 1.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0816650390625, -0.07855987548828125, -0.0754547119140625, -0.07234954833984375, -0.069244384765625, -0.06613922119140625, -0.0630340576171875, -0.05992889404296875, -0.05682373046875, -0.05371856689453125, -0.0506134033203125, -0.04750823974609375, -0.044403076171875, -0.04129791259765625, -0.0381927490234375, -0.03508758544921875, -0.031982421875, -0.02887725830078125, -0.0257720947265625, -0.02266693115234375, -0.019561767578125, -0.01645660400390625, -0.0133514404296875, -0.01024627685546875, -0.00714111328125, -0.00403594970703125, -0.0009307861328125, 0.00217437744140625, 0.005279541015625, 0.00838470458984375, 0.0114898681640625, 0.01459503173828125, 0.0177001953125, 0.02080535888671875, 0.0239105224609375, 0.02701568603515625, 0.030120849609375, 0.03322601318359375, 0.0363311767578125, 0.03943634033203125, 0.04254150390625, 0.04564666748046875, 0.0487518310546875, 0.05185699462890625, 0.054962158203125, 0.05806732177734375, 0.0611724853515625, 0.06427764892578125, 0.0673828125, 0.07048797607421875, 0.0735931396484375, 0.07669830322265625, 0.079803466796875, 0.08290863037109375, 0.0860137939453125, 0.08911895751953125, 0.09222412109375, 0.09532928466796875, 0.0984344482421875, 0.10153961181640625, 0.104644775390625, 0.10774993896484375, 0.1108551025390625, 0.11396026611328125, 0.1170654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 6.0, 13.0, 16.0, 30.0, 25.0, 42.0, 56.0, 108.0, 145.0, 196.0, 277.0, 388.0, 464.0, 529.0, 471.0, 398.0, 263.0, 209.0, 131.0, 82.0, 57.0, 41.0, 38.0, 19.0, 17.0, 10.0, 9.0, 7.0, 7.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117431640625, -0.11394023895263672, -0.11044883728027344, -0.10695743560791016, -0.10346603393554688, -0.0999746322631836, -0.09648323059082031, -0.09299182891845703, -0.08950042724609375, -0.08600902557373047, -0.08251762390136719, -0.0790262222290039, -0.07553482055664062, -0.07204341888427734, -0.06855201721191406, -0.06506061553955078, -0.0615692138671875, -0.05807781219482422, -0.05458641052246094, -0.051095008850097656, -0.047603607177734375, -0.044112205505371094, -0.04062080383300781, -0.03712940216064453, -0.03363800048828125, -0.03014659881591797, -0.026655197143554688, -0.023163795471191406, -0.019672393798828125, -0.016180992126464844, -0.012689590454101562, -0.009198188781738281, -0.005706787109375, -0.0022153854370117188, 0.0012760162353515625, 0.004767417907714844, 0.008258819580078125, 0.011750221252441406, 0.015241622924804688, 0.01873302459716797, 0.02222442626953125, 0.02571582794189453, 0.029207229614257812, 0.032698631286621094, 0.036190032958984375, 0.039681434631347656, 0.04317283630371094, 0.04666423797607422, 0.0501556396484375, 0.05364704132080078, 0.05713844299316406, 0.060629844665527344, 0.06412124633789062, 0.0676126480102539, 0.07110404968261719, 0.07459545135498047, 0.07808685302734375, 0.08157825469970703, 0.08506965637207031, 0.0885610580444336, 0.09205245971679688, 0.09554386138916016, 0.09903526306152344, 0.10252666473388672, 0.10601806640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 3.0, 6.0, 10.0, 18.0, 18.0, 51.0, 61.0, 130.0, 163.0, 179.0, 141.0, 70.0, 54.0, 26.0, 17.0, 15.0, 9.0, 6.0, 1.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08148193359375, -2.024336099624634, -1.9671903848648071, -1.9100446701049805, -1.8528988361358643, -1.7957531213760376, -1.738607406616211, -1.6814615726470947, -1.6243157386779785, -1.5671700239181519, -1.5100241899490356, -1.452878475189209, -1.3957326412200928, -1.3385869264602661, -1.2814412117004395, -1.2242953777313232, -1.1671496629714966, -1.11000394821167, -1.0528581142425537, -0.995712399482727, -0.9385665655136108, -0.8814208507537842, -0.8242750763893127, -0.7671293020248413, -0.7099835276603699, -0.6528377532958984, -0.595691978931427, -0.5385462045669556, -0.4814004600048065, -0.4242546856403351, -0.36710894107818604, -0.3099631667137146, -0.25281739234924316, -0.19567161798477173, -0.1385258585214615, -0.08138009905815125, -0.02423432469367981, 0.032911449670791626, 0.09005719423294067, 0.1472029685974121, 0.20434874296188354, 0.261494517326355, 0.3186402916908264, 0.37578603625297546, 0.4329318106174469, 0.49007758498191833, 0.5472233295440674, 0.6043691039085388, 0.6615148782730103, 0.7186606526374817, 0.7758064270019531, 0.8329521417617798, 0.890097975730896, 0.9472436904907227, 1.0043895244598389, 1.0615352392196655, 1.1186809539794922, 1.1758266687393188, 1.232972502708435, 1.2901182174682617, 1.347264051437378, 1.4044097661972046, 1.4615554809570312, 1.5187013149261475, 1.5758471488952637]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 5.0, 8.0, 8.0, 10.0, 9.0, 10.0, 17.0, 25.0, 29.0, 32.0, 36.0, 32.0, 45.0, 45.0, 41.0, 61.0, 50.0, 59.0, 54.0, 49.0, 47.0, 35.0, 40.0, 43.0, 41.0, 36.0, 19.0, 12.0, 25.0, 18.0, 21.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8582518696784973, -0.8347288370132446, -0.8112058639526367, -0.787682831287384, -0.7641597986221313, -0.7406368255615234, -0.7171137928962708, -0.6935907602310181, -0.6700677871704102, -0.6465447545051575, -0.6230217814445496, -0.5994987487792969, -0.5759757161140442, -0.5524527430534363, -0.5289297103881836, -0.5054067373275757, -0.4818836748600006, -0.4583606719970703, -0.4348376393318176, -0.41131463646888733, -0.38779163360595703, -0.36426860094070435, -0.34074559807777405, -0.31722259521484375, -0.29369956254959106, -0.27017655968666077, -0.24665354192256927, -0.22313052415847778, -0.19960752129554749, -0.176084503531456, -0.1525614857673645, -0.1290384829044342, -0.1055154800415039, -0.08199246972799301, -0.05846945568919182, -0.034946441650390625, -0.01142343133687973, 0.012099578976631165, 0.035622596740722656, 0.059145599603652954, 0.08266861736774445, 0.10619162768125534, 0.12971463799476624, 0.15323765575885773, 0.17676067352294922, 0.20028367638587952, 0.223806694149971, 0.2473296970129013, 0.2708527147769928, 0.2943757176399231, 0.3178987503051758, 0.3414217531681061, 0.3649447560310364, 0.38846778869628906, 0.41199079155921936, 0.43551379442214966, 0.45903682708740234, 0.48255982995033264, 0.5060828328132629, 0.5296058654785156, 0.5531288981437683, 0.5766518712043762, 0.6001749038696289, 0.6236978769302368, 0.6472209095954895]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 5.0, 14.0, 17.0, 26.0, 30.0, 47.0, 64.0, 104.0, 152.0, 262.0, 435.0, 761.0, 1459.0, 2797.0, 5698.0, 13020.0, 34119.0, 102430.0, 310461.0, 368241.0, 134815.0, 43512.0, 16100.0, 6875.0, 3230.0, 1636.0, 874.0, 546.0, 304.0, 195.0, 98.0, 64.0, 47.0, 29.0, 28.0, 10.0, 9.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0751953125, -0.07277870178222656, -0.07036209106445312, -0.06794548034667969, -0.06552886962890625, -0.06311225891113281, -0.060695648193359375, -0.05827903747558594, -0.0558624267578125, -0.05344581604003906, -0.051029205322265625, -0.04861259460449219, -0.04619598388671875, -0.04377937316894531, -0.041362762451171875, -0.03894615173339844, -0.036529541015625, -0.03411293029785156, -0.031696319580078125, -0.029279708862304688, -0.02686309814453125, -0.024446487426757812, -0.022029876708984375, -0.019613265991210938, -0.0171966552734375, -0.014780044555664062, -0.012363433837890625, -0.009946823120117188, -0.00753021240234375, -0.0051136016845703125, -0.002696990966796875, -0.0002803802490234375, 0.00213623046875, 0.0045528411865234375, 0.006969451904296875, 0.009386062622070312, 0.01180267333984375, 0.014219284057617188, 0.016635894775390625, 0.019052505493164062, 0.0214691162109375, 0.023885726928710938, 0.026302337646484375, 0.028718948364257812, 0.03113555908203125, 0.03355216979980469, 0.035968780517578125, 0.03838539123535156, 0.040802001953125, 0.04321861267089844, 0.045635223388671875, 0.04805183410644531, 0.05046844482421875, 0.05288505554199219, 0.055301666259765625, 0.05771827697753906, 0.0601348876953125, 0.06255149841308594, 0.06496810913085938, 0.06738471984863281, 0.06980133056640625, 0.07221794128417969, 0.07463455200195312, 0.07705116271972656, 0.0794677734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 4.0, 9.0, 24.0, 17.0, 21.0, 25.0, 37.0, 44.0, 39.0, 61.0, 70.0, 64.0, 67.0, 52.0, 58.0, 65.0, 66.0, 62.0, 39.0, 34.0, 29.0, 26.0, 16.0, 16.0, 9.0, 10.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.064208984375, -0.06207752227783203, -0.05994606018066406, -0.057814598083496094, -0.055683135986328125, -0.053551673889160156, -0.05142021179199219, -0.04928874969482422, -0.04715728759765625, -0.04502582550048828, -0.04289436340332031, -0.040762901306152344, -0.038631439208984375, -0.036499977111816406, -0.03436851501464844, -0.03223705291748047, -0.0301055908203125, -0.02797412872314453, -0.025842666625976562, -0.023711204528808594, -0.021579742431640625, -0.019448280334472656, -0.017316818237304688, -0.015185356140136719, -0.01305389404296875, -0.010922431945800781, -0.008790969848632812, -0.006659507751464844, -0.004528045654296875, -0.0023965835571289062, -0.0002651214599609375, 0.0018663406372070312, 0.003997802734375, 0.006129264831542969, 0.008260726928710938, 0.010392189025878906, 0.012523651123046875, 0.014655113220214844, 0.016786575317382812, 0.01891803741455078, 0.02104949951171875, 0.02318096160888672, 0.025312423706054688, 0.027443885803222656, 0.029575347900390625, 0.031706809997558594, 0.03383827209472656, 0.03596973419189453, 0.0381011962890625, 0.04023265838623047, 0.04236412048339844, 0.044495582580566406, 0.046627044677734375, 0.048758506774902344, 0.05088996887207031, 0.05302143096923828, 0.05515289306640625, 0.05728435516357422, 0.05941581726074219, 0.061547279357910156, 0.06367874145507812, 0.0658102035522461, 0.06794166564941406, 0.07007312774658203, 0.07220458984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 8.0, 3.0, 7.0, 5.0, 6.0, 10.0, 14.0, 28.0, 63.0, 51.0, 129.0, 224.0, 410.0, 867.0, 1977.0, 5833.0, 22074.0, 138722.0, 730675.0, 118519.0, 19848.0, 5414.0, 1935.0, 844.0, 379.0, 193.0, 124.0, 52.0, 52.0, 22.0, 25.0, 15.0, 4.0, 4.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17545127868652344, -0.17036056518554688, -0.1652698516845703, -0.16017913818359375, -0.1550884246826172, -0.14999771118164062, -0.14490699768066406, -0.1398162841796875, -0.13472557067871094, -0.12963485717773438, -0.12454414367675781, -0.11945343017578125, -0.11436271667480469, -0.10927200317382812, -0.10418128967285156, -0.099090576171875, -0.09399986267089844, -0.08890914916992188, -0.08381843566894531, -0.07872772216796875, -0.07363700866699219, -0.06854629516601562, -0.06345558166503906, -0.0583648681640625, -0.05327415466308594, -0.048183441162109375, -0.04309272766113281, -0.03800201416015625, -0.03291130065917969, -0.027820587158203125, -0.022729873657226562, -0.01763916015625, -0.012548446655273438, -0.007457733154296875, -0.0023670196533203125, 0.00272369384765625, 0.007814407348632812, 0.012905120849609375, 0.017995834350585938, 0.0230865478515625, 0.028177261352539062, 0.033267974853515625, 0.03835868835449219, 0.04344940185546875, 0.04854011535644531, 0.053630828857421875, 0.05872154235839844, 0.063812255859375, 0.06890296936035156, 0.07399368286132812, 0.07908439636230469, 0.08417510986328125, 0.08926582336425781, 0.09435653686523438, 0.09944725036621094, 0.1045379638671875, 0.10962867736816406, 0.11471939086914062, 0.11981010437011719, 0.12490081787109375, 0.1299915313720703, 0.13508224487304688, 0.14017295837402344, 0.145263671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 15.0, 17.0, 23.0, 31.0, 31.0, 31.0, 47.0, 58.0, 61.0, 79.0, 78.0, 67.0, 64.0, 64.0, 54.0, 42.0, 38.0, 43.0, 33.0, 18.0, 25.0, 11.0, 6.0, 9.0, 5.0, 12.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3149070739746094, -0.30583953857421875, -0.2967720031738281, -0.2877044677734375, -0.2786369323730469, -0.26956939697265625, -0.2605018615722656, -0.251434326171875, -0.24236679077148438, -0.23329925537109375, -0.22423171997070312, -0.2151641845703125, -0.20609664916992188, -0.19702911376953125, -0.18796157836914062, -0.17889404296875, -0.16982650756835938, -0.16075897216796875, -0.15169143676757812, -0.1426239013671875, -0.13355636596679688, -0.12448883056640625, -0.11542129516601562, -0.106353759765625, -0.09728622436523438, -0.08821868896484375, -0.07915115356445312, -0.0700836181640625, -0.061016082763671875, -0.05194854736328125, -0.042881011962890625, -0.0338134765625, -0.024745941162109375, -0.01567840576171875, -0.006610870361328125, 0.0024566650390625, 0.011524200439453125, 0.02059173583984375, 0.029659271240234375, 0.038726806640625, 0.047794342041015625, 0.05686187744140625, 0.06592941284179688, 0.0749969482421875, 0.08406448364257812, 0.09313201904296875, 0.10219955444335938, 0.11126708984375, 0.12033462524414062, 0.12940216064453125, 0.13846969604492188, 0.1475372314453125, 0.15660476684570312, 0.16567230224609375, 0.17473983764648438, 0.183807373046875, 0.19287490844726562, 0.20194244384765625, 0.21100997924804688, 0.2200775146484375, 0.22914505004882812, 0.23821258544921875, 0.24728012084960938, 0.25634765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 14.0, 25.0, 61.0, 184.0, 877.0, 9990.0, 1002515.0, 32801.0, 1602.0, 258.0, 91.0, 34.0, 17.0, 17.0, 8.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2783241271972656, -0.27051544189453125, -0.2627067565917969, -0.2548980712890625, -0.24708938598632812, -0.23928070068359375, -0.23147201538085938, -0.223663330078125, -0.21585464477539062, -0.20804595947265625, -0.20023727416992188, -0.1924285888671875, -0.18461990356445312, -0.17681121826171875, -0.16900253295898438, -0.16119384765625, -0.15338516235351562, -0.14557647705078125, -0.13776779174804688, -0.1299591064453125, -0.12215042114257812, -0.11434173583984375, -0.10653305053710938, -0.098724365234375, -0.09091567993164062, -0.08310699462890625, -0.07529830932617188, -0.0674896240234375, -0.059680938720703125, -0.05187225341796875, -0.044063568115234375, -0.0362548828125, -0.028446197509765625, -0.02063751220703125, -0.012828826904296875, -0.0050201416015625, 0.002788543701171875, 0.01059722900390625, 0.018405914306640625, 0.026214599609375, 0.034023284912109375, 0.04183197021484375, 0.049640655517578125, 0.0574493408203125, 0.06525802612304688, 0.07306671142578125, 0.08087539672851562, 0.08868408203125, 0.09649276733398438, 0.10430145263671875, 0.11211013793945312, 0.1199188232421875, 0.12772750854492188, 0.13553619384765625, 0.14334487915039062, 0.151153564453125, 0.15896224975585938, 0.16677093505859375, 0.17457962036132812, 0.1823883056640625, 0.19019699096679688, 0.19800567626953125, 0.20581436157226562, 0.213623046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 0.0, 7.0, 10.0, 9.0, 13.0, 6.0, 9.0, 8.0, 21.0, 21.0, 32.0, 34.0, 42.0, 62.0, 79.0, 72.0, 84.0, 79.0, 57.0, 63.0, 57.0, 46.0, 37.0, 21.0, 20.0, 24.0, 13.0, 21.0, 11.0, 9.0, 12.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.811981201171875e-05, -1.7550773918628693e-05, -1.6981735825538635e-05, -1.6412697732448578e-05, -1.584365963935852e-05, -1.5274621546268463e-05, -1.4705583453178406e-05, -1.4136545360088348e-05, -1.3567507266998291e-05, -1.2998469173908234e-05, -1.2429431080818176e-05, -1.1860392987728119e-05, -1.1291354894638062e-05, -1.0722316801548004e-05, -1.0153278708457947e-05, -9.58424061536789e-06, -9.015202522277832e-06, -8.446164429187775e-06, -7.877126336097717e-06, -7.30808824300766e-06, -6.7390501499176025e-06, -6.170012056827545e-06, -5.600973963737488e-06, -5.03193587064743e-06, -4.462897777557373e-06, -3.893859684467316e-06, -3.3248215913772583e-06, -2.755783498287201e-06, -2.1867454051971436e-06, -1.6177073121070862e-06, -1.0486692190170288e-06, -4.796311259269714e-07, 8.940696716308594e-08, 6.584450602531433e-07, 1.2274831533432007e-06, 1.796521246433258e-06, 2.3655593395233154e-06, 2.934597432613373e-06, 3.50363552570343e-06, 4.0726736187934875e-06, 4.641711711883545e-06, 5.210749804973602e-06, 5.77978789806366e-06, 6.348825991153717e-06, 6.917864084243774e-06, 7.486902177333832e-06, 8.05594027042389e-06, 8.624978363513947e-06, 9.194016456604004e-06, 9.763054549694061e-06, 1.0332092642784119e-05, 1.0901130735874176e-05, 1.1470168828964233e-05, 1.203920692205429e-05, 1.2608245015144348e-05, 1.3177283108234406e-05, 1.3746321201324463e-05, 1.431535929441452e-05, 1.4884397387504578e-05, 1.5453435480594635e-05, 1.6022473573684692e-05, 1.659151166677475e-05, 1.7160549759864807e-05, 1.7729587852954865e-05, 1.8298625946044922e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 7.0, 2.0, 9.0, 9.0, 11.0, 9.0, 27.0, 44.0, 57.0, 112.0, 232.0, 517.0, 1249.0, 3855.0, 22204.0, 931513.0, 79275.0, 6293.0, 1766.0, 674.0, 304.0, 158.0, 92.0, 37.0, 19.0, 19.0, 15.0, 9.0, 10.0, 2.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.1353588104248047, -0.13094711303710938, -0.12653541564941406, -0.12212371826171875, -0.11771202087402344, -0.11330032348632812, -0.10888862609863281, -0.1044769287109375, -0.10006523132324219, -0.09565353393554688, -0.09124183654785156, -0.08683013916015625, -0.08241844177246094, -0.07800674438476562, -0.07359504699707031, -0.069183349609375, -0.06477165222167969, -0.060359954833984375, -0.05594825744628906, -0.05153656005859375, -0.04712486267089844, -0.042713165283203125, -0.03830146789550781, -0.0338897705078125, -0.029478073120117188, -0.025066375732421875, -0.020654678344726562, -0.01624298095703125, -0.011831283569335938, -0.007419586181640625, -0.0030078887939453125, 0.00140380859375, 0.0058155059814453125, 0.010227203369140625, 0.014638900756835938, 0.01905059814453125, 0.023462295532226562, 0.027873992919921875, 0.03228569030761719, 0.0366973876953125, 0.04110908508300781, 0.045520782470703125, 0.04993247985839844, 0.05434417724609375, 0.05875587463378906, 0.06316757202148438, 0.06757926940917969, 0.071990966796875, 0.07640266418457031, 0.08081436157226562, 0.08522605895996094, 0.08963775634765625, 0.09404945373535156, 0.09846115112304688, 0.10287284851074219, 0.1072845458984375, 0.11169624328613281, 0.11610794067382812, 0.12051963806152344, 0.12493133544921875, 0.12934303283691406, 0.13375473022460938, 0.1381664276123047, 0.142578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 10.0, 12.0, 13.0, 23.0, 36.0, 53.0, 88.0, 124.0, 167.0, 161.0, 100.0, 57.0, 42.0, 23.0, 15.0, 15.0, 13.0, 7.0, 3.0, 6.0, 1.0, 5.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11578369140625, -0.11200237274169922, -0.10822105407714844, -0.10443973541259766, -0.10065841674804688, -0.0968770980834961, -0.09309577941894531, -0.08931446075439453, -0.08553314208984375, -0.08175182342529297, -0.07797050476074219, -0.0741891860961914, -0.07040786743164062, -0.06662654876708984, -0.06284523010253906, -0.05906391143798828, -0.0552825927734375, -0.05150127410888672, -0.04771995544433594, -0.043938636779785156, -0.040157318115234375, -0.036375999450683594, -0.03259468078613281, -0.02881336212158203, -0.02503204345703125, -0.02125072479248047, -0.017469406127929688, -0.013688087463378906, -0.009906768798828125, -0.006125450134277344, -0.0023441314697265625, 0.0014371871948242188, 0.005218505859375, 0.008999824523925781, 0.012781143188476562, 0.016562461853027344, 0.020343780517578125, 0.024125099182128906, 0.027906417846679688, 0.03168773651123047, 0.03546905517578125, 0.03925037384033203, 0.04303169250488281, 0.046813011169433594, 0.050594329833984375, 0.054375648498535156, 0.05815696716308594, 0.06193828582763672, 0.0657196044921875, 0.06950092315673828, 0.07328224182128906, 0.07706356048583984, 0.08084487915039062, 0.0846261978149414, 0.08840751647949219, 0.09218883514404297, 0.09597015380859375, 0.09975147247314453, 0.10353279113769531, 0.1073141098022461, 0.11109542846679688, 0.11487674713134766, 0.11865806579589844, 0.12243938446044922, 0.126220703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 18.0, 36.0, 66.0, 142.0, 249.0, 209.0, 135.0, 57.0, 32.0, 16.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5250473022460938, -2.4546053409576416, -2.3841633796691895, -2.313721179962158, -2.243279218673706, -2.172837257385254, -2.1023950576782227, -2.0319530963897705, -1.9615111351013184, -1.8910691738128662, -1.8206270933151245, -1.7501850128173828, -1.6797430515289307, -1.6093010902404785, -1.5388590097427368, -1.4684169292449951, -1.397974967956543, -1.3275330066680908, -1.2570909261703491, -1.1866488456726074, -1.1162068843841553, -1.0457649230957031, -0.9753228425979614, -0.9048808217048645, -0.8344388008117676, -0.7639967799186707, -0.6935547590255737, -0.6231127381324768, -0.5526707172393799, -0.48222869634628296, -0.41178667545318604, -0.3413446545600891, -0.2709026336669922, -0.20046061277389526, -0.13001859188079834, -0.059576570987701416, 0.010865449905395508, 0.08130747079849243, 0.15174949169158936, 0.22219151258468628, 0.2926335334777832, 0.3630755543708801, 0.43351757526397705, 0.503959596157074, 0.5744016170501709, 0.6448436379432678, 0.7152856588363647, 0.7857276797294617, 0.8561697006225586, 0.9266117215156555, 0.9970537424087524, 1.0674958229064941, 1.1379377841949463, 1.2083797454833984, 1.2788218259811401, 1.3492639064788818, 1.419705867767334, 1.4901478290557861, 1.5605899095535278, 1.6310319900512695, 1.7014739513397217, 1.7719159126281738, 1.8423579931259155, 1.9128000736236572, 1.9832420349121094]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 8.0, 12.0, 18.0, 19.0, 38.0, 55.0, 69.0, 101.0, 138.0, 131.0, 121.0, 96.0, 71.0, 46.0, 33.0, 15.0, 17.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7596776485443115, -2.692523717880249, -2.6253700256347656, -2.558216094970703, -2.4910624027252197, -2.4239084720611572, -2.356754779815674, -2.2896008491516113, -2.222446918487549, -2.1552929878234863, -2.088139295578003, -2.0209853649139404, -1.953831672668457, -1.8866777420043945, -1.8195239305496216, -1.7523701190948486, -1.6852164268493652, -1.6180626153945923, -1.5509088039398193, -1.4837549924850464, -1.4166011810302734, -1.349447250366211, -1.282293438911438, -1.215139627456665, -1.147985816001892, -1.0808320045471191, -1.0136781930923462, -0.9465243220329285, -0.8793705105781555, -0.8122166991233826, -0.7450628280639648, -0.6779090166091919, -0.6107549667358398, -0.5436011552810669, -0.47644731402397156, -0.4092934727668762, -0.34213966131210327, -0.2749858498573303, -0.20783200860023499, -0.14067816734313965, -0.0735243558883667, -0.006370529532432556, 0.06078329682350159, 0.12793712317943573, 0.19509094953536987, 0.2622447609901428, 0.32939860224723816, 0.3965524435043335, 0.46370625495910645, 0.5308600664138794, 0.5980138778686523, 0.6651677489280701, 0.732321560382843, 0.799475371837616, 0.8666292428970337, 0.9337830543518066, 1.0009368658065796, 1.0680906772613525, 1.1352444887161255, 1.2023983001708984, 1.269552230834961, 1.3367059230804443, 1.4038598537445068, 1.4710136651992798, 1.5381674766540527]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 17.0, 26.0, 49.0, 88.0, 419.0, 235.0, 90.0, 34.0, 18.0, 9.0, 13.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.3536224365234375, -0.345184326171875, -0.3367462158203125, -0.32830810546875, -0.3198699951171875, -0.311431884765625, -0.3029937744140625, -0.2945556640625, -0.2861175537109375, -0.277679443359375, -0.2692413330078125, -0.26080322265625, -0.2523651123046875, -0.243927001953125, -0.2354888916015625, -0.22705078125, -0.2186126708984375, -0.210174560546875, -0.2017364501953125, -0.19329833984375, -0.1848602294921875, -0.176422119140625, -0.1679840087890625, -0.1595458984375, -0.1511077880859375, -0.142669677734375, -0.1342315673828125, -0.12579345703125, -0.1173553466796875, -0.108917236328125, -0.1004791259765625, -0.092041015625, -0.0836029052734375, -0.075164794921875, -0.0667266845703125, -0.05828857421875, -0.0498504638671875, -0.041412353515625, -0.0329742431640625, -0.0245361328125, -0.0160980224609375, -0.007659912109375, 0.0007781982421875, 0.00921630859375, 0.0176544189453125, 0.026092529296875, 0.0345306396484375, 0.04296875, 0.0514068603515625, 0.059844970703125, 0.0682830810546875, 0.07672119140625, 0.0851593017578125, 0.093597412109375, 0.1020355224609375, 0.1104736328125, 0.1189117431640625, 0.127349853515625, 0.1357879638671875, 0.14422607421875, 0.1526641845703125, 0.161102294921875, 0.1695404052734375, 0.177978515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 17.0, 13.0, 15.0, 22.0, 24.0, 45.0, 57.0, 113.0, 190.0, 293.0, 677.0, 1841.0, 6688.0, 64705.0, 8289246.0, 18330.0, 3739.0, 1206.0, 560.0, 299.0, 164.0, 85.0, 71.0, 38.0, 30.0, 28.0, 15.0, 15.0, 10.0, 7.0, 2.0, 8.0, 1.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.41914132237434387, -0.4061570167541504, -0.3931727409362793, -0.3801884353160858, -0.3672041594982147, -0.35421985387802124, -0.34123557806015015, -0.32825127243995667, -0.3152669668197632, -0.3022826611995697, -0.2892983853816986, -0.2763140797615051, -0.26332980394363403, -0.25034549832344055, -0.23736120760440826, -0.22437691688537598, -0.2113926261663437, -0.1984083354473114, -0.1854240447282791, -0.17243975400924683, -0.15945544838905334, -0.14647115767002106, -0.13348686695098877, -0.12050256878137589, -0.1075182780623436, -0.09453398734331131, -0.08154968917369843, -0.06856539845466614, -0.05558110401034355, -0.042596809566020966, -0.029612518846988678, -0.016628220677375793, -0.003643929958343506, 0.009340363554656506, 0.022324657067656517, 0.035308949649333954, 0.04829324409365654, 0.061277538537979126, 0.07426182925701141, 0.0872461274266243, 0.10023041814565659, 0.11321470886468887, 0.12619900703430176, 0.13918329775333405, 0.15216758847236633, 0.16515189409255981, 0.1781361699104309, 0.1911204755306244, 0.20410476624965668, 0.21708905696868896, 0.23007334768772125, 0.24305763840675354, 0.256041944026947, 0.2690262198448181, 0.2820105254650116, 0.2949948310852051, 0.30797910690307617, 0.32096341252326965, 0.33394768834114075, 0.34693199396133423, 0.3599162697792053, 0.3729005753993988, 0.3858848810195923, 0.3988691568374634, 0.41185346245765686]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 2.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6559098958969116, -0.6344291567802429, -0.6129484176635742, -0.5914676785469055, -0.5699869394302368, -0.5485062599182129, -0.5270255208015442, -0.5055447816848755, -0.4840640425682068, -0.4625833034515381, -0.4411025643348694, -0.41962185502052307, -0.39814111590385437, -0.37666037678718567, -0.35517966747283936, -0.33369892835617065, -0.31221818923950195, -0.29073745012283325, -0.26925671100616455, -0.24777600169181824, -0.22629526257514954, -0.20481452345848083, -0.18333379924297333, -0.16185307502746582, -0.14037233591079712, -0.11889160424470901, -0.09741087257862091, -0.0759301409125328, -0.0544494092464447, -0.0329686775803566, -0.011487945914268494, 0.009992778301239014, 0.031473517417907715, 0.05295424908399582, 0.07443498075008392, 0.09591571241617203, 0.11739644408226013, 0.13887718319892883, 0.16035790741443634, 0.18183863162994385, 0.20331937074661255, 0.22480010986328125, 0.24628083407878876, 0.26776155829429626, 0.28924229741096497, 0.31072303652763367, 0.33220374584198, 0.3536844849586487, 0.3751652240753174, 0.3966459631919861, 0.4181267023086548, 0.4396074116230011, 0.4610881507396698, 0.4825688898563385, 0.5040495991706848, 0.5255303382873535, 0.5470110774040222, 0.5684918165206909, 0.5899725556373596, 0.6114532947540283, 0.6329339742660522, 0.654414713382721, 0.6758954524993896, 0.6973761916160583, 0.718856930732727]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 14.0, 37.0, 64.0, 117.0, 150.0, 180.0, 164.0, 88.0, 74.0, 45.0, 29.0, 18.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11444091796875, -0.1120295524597168, -0.1096181869506836, -0.10720682144165039, -0.10479545593261719, -0.10238409042358398, -0.09997272491455078, -0.09756135940551758, -0.09514999389648438, -0.09273862838745117, -0.09032726287841797, -0.08791589736938477, -0.08550453186035156, -0.08309316635131836, -0.08068180084228516, -0.07827043533325195, -0.07585906982421875, -0.07344770431518555, -0.07103633880615234, -0.06862497329711914, -0.06621360778808594, -0.06380224227905273, -0.06139087677001953, -0.05897951126098633, -0.056568145751953125, -0.05415678024291992, -0.05174541473388672, -0.049334049224853516, -0.04692268371582031, -0.04451131820678711, -0.042099952697753906, -0.0396885871887207, -0.0372772216796875, -0.0348658561706543, -0.032454490661621094, -0.03004312515258789, -0.027631759643554688, -0.025220394134521484, -0.02280902862548828, -0.020397663116455078, -0.017986297607421875, -0.015574932098388672, -0.013163566589355469, -0.010752201080322266, -0.008340835571289062, -0.005929470062255859, -0.0035181045532226562, -0.0011067390441894531, 0.00130462646484375, 0.003715991973876953, 0.006127357482910156, 0.00853872299194336, 0.010950088500976562, 0.013361454010009766, 0.01577281951904297, 0.018184185028076172, 0.020595550537109375, 0.023006916046142578, 0.02541828155517578, 0.027829647064208984, 0.030241012573242188, 0.03265237808227539, 0.035063743591308594, 0.0374751091003418, 0.039886474609375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 11.0, 13.0, 20.0, 27.0, 32.0, 53.0, 89.0, 215.0, 415.0, 1086.0, 3083.0, 11695.0, 69985.0, 352769.0, 68331.0, 11397.0, 3076.0, 1037.0, 452.0, 205.0, 99.0, 60.0, 37.0, 25.0, 9.0, 18.0, 5.0, 3.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0], "bins": [-1.7060546875, -1.6668319702148438, -1.6276092529296875, -1.5883865356445312, -1.549163818359375, -1.5099411010742188, -1.4707183837890625, -1.4314956665039062, -1.39227294921875, -1.3530502319335938, -1.3138275146484375, -1.2746047973632812, -1.235382080078125, -1.1961593627929688, -1.1569366455078125, -1.1177139282226562, -1.0784912109375, -1.0392684936523438, -1.0000457763671875, -0.9608230590820312, -0.921600341796875, -0.8823776245117188, -0.8431549072265625, -0.8039321899414062, -0.76470947265625, -0.7254867553710938, -0.6862640380859375, -0.6470413208007812, -0.607818603515625, -0.5685958862304688, -0.5293731689453125, -0.49015045166015625, -0.450927734375, -0.41170501708984375, -0.3724822998046875, -0.33325958251953125, -0.294036865234375, -0.25481414794921875, -0.2155914306640625, -0.17636871337890625, -0.13714599609375, -0.09792327880859375, -0.0587005615234375, -0.01947784423828125, 0.019744873046875, 0.05896759033203125, 0.0981903076171875, 0.13741302490234375, 0.1766357421875, 0.21585845947265625, 0.2550811767578125, 0.29430389404296875, 0.333526611328125, 0.37274932861328125, 0.4119720458984375, 0.45119476318359375, 0.49041748046875, 0.5296401977539062, 0.5688629150390625, 0.6080856323242188, 0.647308349609375, 0.6865310668945312, 0.7257537841796875, 0.7649765014648438, 0.80419921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 11.0, 23.0, 36.0, 67.0, 114.0, 158.0, 198.0, 159.0, 93.0, 59.0, 36.0, 21.0, 14.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.400146484375, -0.3919086456298828, -0.3836708068847656, -0.37543296813964844, -0.36719512939453125, -0.35895729064941406, -0.3507194519042969, -0.3424816131591797, -0.3342437744140625, -0.3260059356689453, -0.3177680969238281, -0.30953025817871094, -0.30129241943359375, -0.29305458068847656, -0.2848167419433594, -0.2765789031982422, -0.268341064453125, -0.2601032257080078, -0.2518653869628906, -0.24362754821777344, -0.23538970947265625, -0.22715187072753906, -0.21891403198242188, -0.2106761932373047, -0.2024383544921875, -0.1942005157470703, -0.18596267700195312, -0.17772483825683594, -0.16948699951171875, -0.16124916076660156, -0.15301132202148438, -0.1447734832763672, -0.13653564453125, -0.1282978057861328, -0.12005996704101562, -0.11182212829589844, -0.10358428955078125, -0.09534645080566406, -0.08710861206054688, -0.07887077331542969, -0.0706329345703125, -0.06239509582519531, -0.054157257080078125, -0.04591941833496094, -0.03768157958984375, -0.029443740844726562, -0.021205902099609375, -0.012968063354492188, -0.004730224609375, 0.0035076141357421875, 0.011745452880859375, 0.019983291625976562, 0.02822113037109375, 0.03645896911621094, 0.044696807861328125, 0.05293464660644531, 0.0611724853515625, 0.06941032409667969, 0.07764816284179688, 0.08588600158691406, 0.09412384033203125, 0.10236167907714844, 0.11059951782226562, 0.11883735656738281, 0.1270751953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 15.0, 8.0, 7.0, 11.0, 12.0, 11.0, 20.0, 21.0, 14.0, 26.0, 33.0, 30.0, 20.0, 25.0, 30.0, 25.0, 17.0, 26.0, 18.0, 18.0, 18.0, 20.0, 8.0, 7.0, 8.0, 6.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.26477158069610596, -0.2574709951877594, -0.25017037987709045, -0.2428697943687439, -0.23556920886039734, -0.2282686084508896, -0.22096800804138184, -0.21366742253303528, -0.20636682212352753, -0.19906622171401978, -0.19176563620567322, -0.18446503579616547, -0.1771644502878189, -0.16986384987831116, -0.1625632643699646, -0.15526266396045685, -0.1479620635509491, -0.14066146314144135, -0.1333608776330948, -0.12606027722358704, -0.11875968426465988, -0.11145909130573273, -0.10415849834680557, -0.09685790538787842, -0.08955731987953186, -0.0822567269206047, -0.07495613396167755, -0.0676555335521698, -0.060354940593242645, -0.05305434763431549, -0.045753754675388336, -0.03845315799117088, -0.03115256130695343, -0.023851966485381126, -0.016551371663808823, -0.009250778704881668, -0.0019501838833093643, 0.0053504109382629395, 0.012651003897190094, 0.019951600581407547, 0.0272521935403347, 0.034552786499261856, 0.04185338318347931, 0.049153976142406464, 0.05645456910133362, 0.06375516951084137, 0.07105575501918793, 0.07835635542869568, 0.08565694838762283, 0.09295754134654999, 0.10025813430547714, 0.1075587272644043, 0.11485932767391205, 0.1221599206328392, 0.12946051359176636, 0.1367611140012741, 0.14406169950962067, 0.15136229991912842, 0.15866288542747498, 0.16596348583698273, 0.17326407134532928, 0.18056467175483704, 0.1878652572631836, 0.19516585767269135, 0.2024664580821991]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 4.0, 9.0, 9.0, 10.0, 11.0, 17.0, 15.0, 19.0, 24.0, 19.0, 31.0, 32.0, 44.0, 35.0, 26.0, 28.0, 26.0, 22.0, 15.0, 17.0, 8.0, 12.0, 7.0, 3.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47320419549942017, -0.45864179730415344, -0.4440793991088867, -0.42951700091362, -0.41495460271835327, -0.40039223432540894, -0.3858298063278198, -0.3712674379348755, -0.35670503973960876, -0.34214264154434204, -0.3275802433490753, -0.3130178451538086, -0.29845544695854187, -0.28389304876327515, -0.2693306803703308, -0.2547682821750641, -0.24020586907863617, -0.22564347088336945, -0.21108107268810272, -0.1965186893939972, -0.18195629119873047, -0.16739389300346375, -0.15283149480819702, -0.1382690966129303, -0.12370670586824417, -0.10914430767297745, -0.09458191692829132, -0.0800195187330246, -0.06545712053775787, -0.05089472979307175, -0.03633233159780502, -0.021769940853118896, -0.007207542657852173, 0.007354852743446827, 0.021917248144745827, 0.0364796444773674, 0.051042038947343826, 0.06560443341732025, 0.08016683161258698, 0.0947292223572731, 0.10929162055253983, 0.12385401874780655, 0.13841640949249268, 0.1529788076877594, 0.16754120588302612, 0.18210360407829285, 0.19666600227355957, 0.2112283855676651, 0.22579078376293182, 0.24035318195819855, 0.2549155652523041, 0.2694779634475708, 0.2840403616428375, 0.29860275983810425, 0.31316515803337097, 0.3277275562286377, 0.3422899544239044, 0.35685235261917114, 0.37141475081443787, 0.3859771490097046, 0.4005395472049713, 0.41510194540023804, 0.4296643137931824, 0.4442267119884491, 0.4587891101837158]}, "eval/loss": 4.157788276672363, "eval/bleu": 4.030183230582677e-18, "eval/runtime": 2571.6238, "eval/samples_per_second": 5.74, "eval/steps_per_second": 0.717} \ No newline at end of file